libretro: microphone support

2026-02-17 08:03:04 -07:00 · 2026-02-05 14:22:34 -05:00 · 2026-02-05 14:22:34 -05:00 · 2bc6a3e6d7
commit 2bc6a3e6d7
parent 2831ddf805
10 changed files with 388 additions and 11 deletions
--- a/src/audio_core/CMakeLists.txt
+++ b/src/audio_core/CMakeLists.txt
@ -38,7 +38,7 @@ add_library(audio_core STATIC

    $<$<BOOL:${ENABLE_SDL2}>:sdl2_sink.cpp sdl2_sink.h>
    $<$<BOOL:${ENABLE_CUBEB}>:cubeb_sink.cpp cubeb_sink.h cubeb_input.cpp cubeb_input.h>
-    $<$<BOOL:${ENABLE_LIBRETRO}>:libretro_sink.cpp libretro_sink.h>
+    $<$<BOOL:${ENABLE_LIBRETRO}>:libretro_sink.cpp libretro_sink.h libretro_input.cpp libretro_input.h>
    $<$<BOOL:${ENABLE_OPENAL}>:openal_input.cpp openal_input.h openal_sink.cpp openal_sink.h>
 )

--- a/src/audio_core/input_details.cpp
+++ b/src/audio_core/input_details.cpp
@ -16,7 +16,7 @@
 #include "audio_core/openal_input.h"
 #endif
 #ifdef HAVE_LIBRETRO
-// todo
+#include "audio_core/libretro_input.h"
 #endif
 #include "common/logging/log.h"
 #include "core/core.h"
@ -33,11 +33,9 @@ constexpr std::array input_details = {
                                     "Microphone permission denied, falling back to null input.");
                         return std::make_unique<NullInput>();
                     }
-                     // todo
-                     return std::make_unique<NullInput>();
+                     return std::make_unique<LibRetroInput>();
                 },
-                 // todo
-                 [] { return std::vector<std::string>{"None"}; }},
+                 [] { return std::vector<std::string>{"LibRetro Microphone"}; }},
 #endif
 #ifdef HAVE_CUBEB
    InputDetails{InputType::Cubeb, "Real Device (Cubeb)", true,
--- a/src/audio_core/libretro_input.cpp
+++ b/src/audio_core/libretro_input.cpp
@ -0,0 +1,327 @@
+// Copyright Citra Emulator Project / Azahar Emulator Project
+// Licensed under GPLv2 or any later version
+// Refer to the license.txt file included.
+
+#include <algorithm>
+#include <atomic>
+#include <cstring>
+#include <mutex>
+#include <optional>
+#include <vector>
+#include "audio_core/libretro_input.h"
+#include "citra_libretro/environment.h"
+#include "common/logging/log.h"
+#include "common/ring_buffer.h"
+#include "libretro.h"
+
+namespace AudioCore {
+
+namespace {
+// Global instance pointer for access from retro_run
+LibRetroInput* g_libretro_input = nullptr;
+} // namespace
+
+struct LibRetroInput::Impl {
+    std::optional<retro_microphone_interface> mic_interface;
+    retro_microphone_t* mic_handle = nullptr;
+    bool is_sampling = false;
+    u8 sample_size_in_bytes = 2;
+    int warmup_frames = 0;
+
+    // The rate at which the frontend actually provides samples (may differ from
+    // what the 3DS mic service requested). We open the mic at this rate to avoid
+    // RetroArch's internal resampler path, which has a convergence bug when
+    // downsampling (ratio < 1). We resample ourselves in Read() instead.
+    u32 native_sample_rate = 0;
+
+    // Ring buffer for thread-safe sample storage
+    // Capacity: 4096 samples should be plenty for buffering between frames
+    // The 3DS mic service reads 16 samples at a time at ~32728 Hz
+    Common::RingBuffer<s16, 4096> sample_buffer;
+
+    // Temporary buffer for reading from frontend
+    std::vector<s16> read_buffer;
+
+    Impl() {
+        // Try to get the microphone interface from the frontend
+        retro_microphone_interface interface{};
+        interface.interface_version = RETRO_MICROPHONE_INTERFACE_VERSION;
+
+        if (LibRetro::GetMicrophoneInterface(&interface)) {
+            if (interface.interface_version == RETRO_MICROPHONE_INTERFACE_VERSION) {
+                mic_interface = interface;
+                LOG_INFO(Audio, "LibRetro microphone interface available (version {})",
+                         interface.interface_version);
+            } else {
+                LOG_WARNING(Audio,
+                            "LibRetro microphone interface version mismatch: expected {}, got {}",
+                            RETRO_MICROPHONE_INTERFACE_VERSION, interface.interface_version);
+            }
+        } else {
+            LOG_WARNING(Audio, "LibRetro microphone interface not available");
+        }
+
+        // Keep this small enough that RetroArch's microphone_driver_read can
+        // fill its outgoing FIFO in a single flush iteration. The CoreAudio
+        // driver's internal FIFO is ~480 samples (10ms at 48kHz). If we
+        // request more than that, the blocking while-loop in
+        // microphone_driver_read must wait for the next hardware callback,
+        // and on ARM64 without memory barriers in the FIFO, it may never
+        // see the new data. 128 samples is conservative enough to succeed
+        // in one pass.
+        read_buffer.resize(128);
+    }
+
+    ~Impl() {
+        CloseMicrophone();
+    }
+
+    bool EnsureMicrophoneOpen() {
+        if (mic_handle) {
+            return true;
+        }
+
+        if (!mic_interface) {
+            return false;
+        }
+
+        // Always open at 48000 Hz regardless of what the game requests.
+        // RetroArch's microphone_driver_read has a resampler whose while-loop
+        // deadlocks when the ratio is < 1 (core rate < device rate). The
+        // libretro get_params API only returns the effective (requested) rate,
+        // not the device's native rate, so we can't detect the mismatch.
+        // Opening at 48000 Hz (the most common hardware rate) keeps the
+        // frontend's internal resampling ratio at or near 1.0, avoiding the
+        // bug. We resample to the game's requested rate ourselves in Read().
+        static constexpr u32 kMicOpenRate = 48000;
+        native_sample_rate = kMicOpenRate;
+
+        retro_microphone_params_t params{};
+        params.rate = kMicOpenRate;
+
+        mic_handle = mic_interface->open_mic(&params);
+        if (!mic_handle) {
+            LOG_ERROR(Audio, "Failed to open LibRetro microphone");
+            return false;
+        }
+
+        // The frontend may start recording immediately in open_mic (e.g.
+        // CoreAudio calls AudioOutputUnitStart). Pause it right away so the
+        // mic is available but idle until StartSampling enables it.
+        mic_interface->set_mic_state(mic_handle, false);
+
+        LOG_INFO(Audio, "LibRetro microphone opened at {} Hz (idle)", native_sample_rate);
+        return true;
+    }
+
+    void CloseMicrophone() {
+        if (mic_interface && mic_handle) {
+            mic_interface->close_mic(mic_handle);
+            mic_handle = nullptr;
+        }
+    }
+
+    bool SetMicrophoneActive(bool active) {
+        if (!mic_interface || !mic_handle) {
+            return false;
+        }
+        return mic_interface->set_mic_state(mic_handle, active);
+    }
+
+    bool IsMicrophoneActive() const {
+        if (!mic_interface || !mic_handle) {
+            return false;
+        }
+        return mic_interface->get_mic_state(mic_handle);
+    }
+};
+
+LibRetroInput::LibRetroInput() : impl(std::make_unique<Impl>()) {
+    g_libretro_input = this;
+}
+
+LibRetroInput::~LibRetroInput() {
+    StopSampling();
+    if (g_libretro_input == this) {
+        g_libretro_input = nullptr;
+    }
+}
+
+void LibRetroInput::StartSampling(const InputParameters& params) {
+    if (IsSampling()) {
+        return;
+    }
+
+    // LibRetro only provides signed 16-bit PCM samples
+    // We'll convert to the requested format in Read()
+    if (params.sign == Signedness::Unsigned) {
+        LOG_DEBUG(Audio, "Application requested unsigned PCM format; will convert from signed.");
+    }
+
+    parameters = params;
+    impl->sample_size_in_bytes = params.sample_size / 8;
+
+    if (!impl->EnsureMicrophoneOpen()) {
+        LOG_WARNING(Audio, "Cannot start sampling: microphone not available");
+        return;
+    }
+
+    // Enable the microphone (transitions from idle to recording)
+    if (!impl->SetMicrophoneActive(true)) {
+        LOG_ERROR(Audio, "Failed to activate microphone");
+        return;
+    }
+
+    impl->is_sampling = true;
+    // Give the audio hardware a few frames to start delivering data before
+    // we attempt a (blocking) read_mic call. Without this, the very first
+    // read can hang because the CoreAudio callback hasn't fired yet.
+    impl->warmup_frames = 10;
+    LOG_INFO(Audio, "LibRetro microphone sampling started at {} Hz, {} bit", params.sample_rate,
+             params.sample_size);
+}
+
+void LibRetroInput::StopSampling() {
+    if (!impl->is_sampling) {
+        return;
+    }
+
+    impl->SetMicrophoneActive(false);
+    impl->is_sampling = false;
+
+    LOG_INFO(Audio, "LibRetro microphone sampling stopped (mic remains idle)");
+}
+
+bool LibRetroInput::IsSampling() {
+    return impl->is_sampling;
+}
+
+void LibRetroInput::AdjustSampleRate(u32 sample_rate) {
+    if (!IsSampling()) {
+        return;
+    }
+
+    // Restart with new sample rate
+    auto new_parameters = parameters;
+    new_parameters.sample_rate = sample_rate;
+    StopSampling();
+    StartSampling(new_parameters);
+}
+
+void LibRetroInput::PollMicrophone() {
+    // This is called from the main thread (retro_run)
+    // Read samples from the frontend and push to the ring buffer
+
+    if (!impl->is_sampling || !impl->mic_interface || !impl->mic_handle) {
+        return;
+    }
+
+    // Wait for the audio hardware to start delivering data before making
+    // any blocking read_mic calls.
+    if (impl->warmup_frames > 0) {
+        impl->warmup_frames--;
+        return;
+    }
+
+    // Issue a memory fence before reading. RetroArch's CoreAudio mic driver
+    // fills its FIFO from a callback thread without memory barriers. On ARM64
+    // (weak memory model), the main thread may not see the callback's writes
+    // without an explicit barrier.
+    std::atomic_thread_fence(std::memory_order_acquire);
+
+    int samples_read = impl->mic_interface->read_mic(impl->mic_handle, impl->read_buffer.data(),
+                                                     static_cast<size_t>(impl->read_buffer.size()));
+
+    if (samples_read > 0) {
+        impl->sample_buffer.Push(
+            std::span<const s16>(impl->read_buffer.data(), static_cast<size_t>(samples_read)));
+    }
+}
+
+Samples LibRetroInput::Read() {
+    // This is called from the CoreTiming scheduler thread
+    // Pop samples from the ring buffer (thread-safe)
+
+    if (!impl->is_sampling) {
+        return {};
+    }
+
+    // Pop available samples from the buffer (at native device rate)
+    std::vector<s16> raw_samples = impl->sample_buffer.Pop();
+
+    if (raw_samples.empty()) {
+        return {};
+    }
+
+    // Resample from native device rate to the rate the 3DS mic service expects
+    if (impl->native_sample_rate != 0 && impl->native_sample_rate != parameters.sample_rate) {
+        double ratio = static_cast<double>(parameters.sample_rate) / impl->native_sample_rate;
+        auto output_count = static_cast<std::size_t>(raw_samples.size() * ratio);
+        if (output_count == 0) {
+            return {};
+        }
+        std::vector<s16> resampled(output_count);
+        for (std::size_t i = 0; i < output_count; i++) {
+            double src_pos = i / ratio;
+            auto idx = static_cast<std::size_t>(src_pos);
+            double frac = src_pos - idx;
+            if (idx + 1 < raw_samples.size()) {
+                resampled[i] =
+                    static_cast<s16>(raw_samples[idx] * (1.0 - frac) + raw_samples[idx + 1] * frac);
+            } else {
+                resampled[i] = raw_samples[std::min(idx, raw_samples.size() - 1)];
+            }
+        }
+        raw_samples = std::move(resampled);
+    }
+
+    // Convert sample format if needed
+    constexpr auto convert_s16_to_u16 = [](s16 sample) -> u16 {
+        return static_cast<u16>(sample) ^ 0x8000;
+    };
+
+    constexpr auto convert_s16_to_s8 = [](s16 sample) -> s8 {
+        return static_cast<s8>(sample >> 8);
+    };
+
+    constexpr auto convert_s16_to_u8 = [](s16 sample) -> u8 {
+        return static_cast<u8>((static_cast<u16>(sample) ^ 0x8000) >> 8);
+    };
+
+    Samples output;
+    output.reserve(raw_samples.size() * impl->sample_size_in_bytes);
+
+    if (impl->sample_size_in_bytes == 1) {
+        // 8-bit output
+        if (parameters.sign == Signedness::Unsigned) {
+            for (s16 sample : raw_samples) {
+                output.push_back(convert_s16_to_u8(sample));
+            }
+        } else {
+            for (s16 sample : raw_samples) {
+                output.push_back(static_cast<u8>(convert_s16_to_s8(sample)));
+            }
+        }
+    } else {
+        // 16-bit output
+        if (parameters.sign == Signedness::Unsigned) {
+            for (s16 sample : raw_samples) {
+                u16 converted = convert_s16_to_u16(sample);
+                output.push_back(static_cast<u8>(converted & 0xFF));
+                output.push_back(static_cast<u8>(converted >> 8));
+            }
+        } else {
+            // Signed 16-bit - just copy the raw bytes
+            const u8* data = reinterpret_cast<const u8*>(raw_samples.data());
+            output.insert(output.end(), data, data + raw_samples.size() * 2);
+        }
+    }
+
+    return output;
+}
+
+LibRetroInput* GetLibRetroInput() {
+    return g_libretro_input;
+}
+
+} // namespace AudioCore
--- a/src/audio_core/libretro_input.h
+++ b/src/audio_core/libretro_input.h
@ -0,0 +1,36 @@
+// Copyright Citra Emulator Project / Azahar Emulator Project
+// Licensed under GPLv2 or any later version
+// Refer to the license.txt file included.
+
+#pragma once
+
+#include <memory>
+#include "audio_core/input.h"
+
+namespace AudioCore {
+
+class LibRetroInput final : public Input {
+public:
+    LibRetroInput();
+    ~LibRetroInput() override;
+
+    void StartSampling(const InputParameters& params) override;
+    void StopSampling() override;
+    bool IsSampling() override;
+    void AdjustSampleRate(u32 sample_rate) override;
+    Samples Read() override;
+
+    /// Called from main thread (retro_run) to read samples from the frontend
+    /// and store them in the thread-safe buffer for Read() to consume.
+    void PollMicrophone();
+
+private:
+    struct Impl;
+    std::unique_ptr<Impl> impl;
+};
+
+/// Returns the global LibRetroInput instance, or nullptr if not initialized.
+/// This is used by citra_libretro.cpp to poll the microphone from the main thread.
+LibRetroInput* GetLibRetroInput();
+
+} // namespace AudioCore
--- a/src/audio_core/libretro_sink.h
+++ b/src/audio_core/libretro_sink.h
@ -21,7 +21,9 @@ public:
    // Not used for immediate submission sinks
    void SetCallback(std::function<void(s16*, std::size_t)> cb) override {};

-    bool ImmediateSubmission() override { return true; }
+    bool ImmediateSubmission() override {
+        return true;
+    }

    void PushSamples(const void* data, std::size_t num_samples) override;
 };
--- a/src/citra_libretro/citra_libretro.cpp
+++ b/src/citra_libretro/citra_libretro.cpp
@ -16,6 +16,7 @@
 #endif
 #include "libretro.h"

+#include "audio_core/libretro_input.h"
 #include "audio_core/libretro_sink.h"
 #include "video_core/gpu.h"
 #ifdef ENABLE_OPENGL
@ -245,6 +246,12 @@ void retro_run() {
        emu_instance->emu_window->UpdateLayout();
    }

+    // Poll microphone input from the frontend and buffer it for the emulator
+    // This must be done from the main thread as LibRetro's mic interface is not thread-safe
+    if (auto* mic_input = AudioCore::GetLibRetroInput()) {
+        mic_input->PollMicrophone();
+    }
+
    // Check if the screen swap button is pressed
    static bool screen_swap_btn_state = false;
    static bool screen_swap_toggled = false;
--- a/src/citra_libretro/core_settings.cpp
+++ b/src/citra_libretro/core_settings.cpp
@ -806,7 +806,7 @@ static void ParseAudioOptions(void) {
    } else if (input_type == "static_noise") {
        Settings::values.input_type = AudioCore::InputType::Static;
    } else if (input_type == "frontend") {
-        Settings::values.input_type = AudioCore::InputType::Cubeb; // Use Cubeb as frontend input
+        Settings::values.input_type = AudioCore::InputType::LibRetro;
    } else {
        Settings::values.input_type = AudioCore::InputType::Auto;
    }
--- a/src/citra_libretro/environment.cpp
+++ b/src/citra_libretro/environment.cpp
@ -54,6 +54,10 @@ bool GetSensorInterface(struct retro_sensor_interface* sensor_interface) {
    return environ_cb(RETRO_ENVIRONMENT_GET_SENSOR_INTERFACE, sensor_interface);
 }

+bool GetMicrophoneInterface(struct retro_microphone_interface* mic_interface) {
+    return environ_cb(RETRO_ENVIRONMENT_GET_MICROPHONE_INTERFACE, mic_interface);
+}
+
 Settings::GraphicsAPI GetPreferredRenderer() {
    // try and maintain the current driver
    retro_hw_context_type context_type = RETRO_HW_CONTEXT_OPENGL;
--- a/src/citra_libretro/environment.h
+++ b/src/citra_libretro/environment.h
@ -31,6 +31,9 @@ void PollInput();
 /// Gets the sensor interface for motion input
 bool GetSensorInterface(struct retro_sensor_interface* sensor_interface);

+/// Gets the microphone interface for audio input
+bool GetMicrophoneInterface(struct retro_microphone_interface* mic_interface);
+
 /// Sets the environmental variables used for settings.
 bool SetVariables(const retro_variable vars[]);

--- a/src/core/hle/service/mic/mic_u.cpp
+++ b/src/core/hle/service/mic/mic_u.cpp
@ -214,7 +214,6 @@ struct MIC_U::Impl {
            LOG_CRITICAL(Service_MIC,
                         "Application started sampling again before stopping sampling");
            mic->StopSampling();
-            mic.reset();
        }

        u8 sample_size = encoding == Encoding::PCM8Signed || encoding == Encoding::PCM8 ? 8 : 16;
@ -225,7 +224,9 @@ struct MIC_U::Impl {
        state.looped_buffer = audio_buffer_loop;
        state.size = audio_buffer_size;

-        CreateMic();
+        if (!mic) {
+            CreateMic();
+        }
        StartSampling();

        timing.ScheduleEvent(GetBufferUpdatePeriod(state.sample_rate), buffer_write_event);
@ -259,7 +260,6 @@ struct MIC_U::Impl {
        timing.RemoveEvent(buffer_write_event);
        if (mic) {
            mic->StopSampling();
-            mic.reset();
        }
        LOG_TRACE(Service_MIC, "called");
    }