// ascii-chat: src/client/audio.c (text extracted from the Doxygen page src_2client_2audio_8c_source.html)

#include "audio.h"

#include <ascii-chat/audio/analysis.h>

#include "main.h"

#include "../main.h" // Global exit API

#include "server.h"

#include <ascii-chat/util/fps.h>

#include <ascii-chat/util/thread.h>

#include <ascii-chat/util/time.h> // For timing instrumentation


#include <ascii-chat/audio/audio.h>                 // lib/audio/audio.h for PortAudio wrapper

#include <ascii-chat/audio/client_audio_pipeline.h> // Unified audio processing pipeline

#include <ascii-chat/audio/wav_writer.h>            // WAV file dumping for debugging

#include <ascii-chat/common.h>

#include <ascii-chat/options/options.h>

#include <ascii-chat/options/rcu.h>     // For RCU-based options access

#include <ascii-chat/platform/system.h> // For platform_memcpy


#include <stdatomic.h>

#include <string.h>

#include <math.h>


#include <ascii-chat/platform/abstraction.h>

#include <ascii-chat/platform/init.h>

#include <ascii-chat/thread_pool.h>


/* ============================================================================

 * Audio System State

 * ============================================================================ */


// Audio device context shared by this file: initialized by audio_init() in
// audio_client_init(), written to by audio_write_samples() on the receive path
// and read from by audio_read_samples() in the capture thread.
static audio_context_t g_audio_context = {0};


// Processing/encoding pipeline created by client_audio_pipeline_create() in
// audio_client_init(). NULL until created; the capture thread polls for it to
// become non-NULL before it processes any samples.
static client_audio_pipeline_t *g_audio_pipeline = NULL;


/* ============================================================================

 * Audio Debugging - WAV File Dumpers

 * ============================================================================ */


// Debug dump of captured samples as read from the capture ring buffer.
// Opened by the capture thread only when wav_dump_enabled() is true; NULL otherwise.
static wav_writer_t *g_wav_capture_raw = NULL;


// Debug dump handle opened alongside g_wav_capture_raw by the capture thread.
// NOTE(review): nothing in the visible part of this file writes to it.
static wav_writer_t *g_wav_capture_processed = NULL;


// Debug dump of samples received from the server, written by
// audio_process_received_samples(). Opened in audio_client_init() when
// wav_dump_enabled() is true; NULL otherwise.
static wav_writer_t *g_wav_playback_received = NULL;


/* ============================================================================

 * Audio Capture Thread Management

 * ============================================================================ */


// Handle passed to asciichat_thread_join_timeout() when audio_start_thread()
// recreates a capture thread that has already exited.
static asciichat_thread_t g_audio_capture_thread;


// True once a capture thread has been started; checked by audio_start_thread()
// to detect an already-running or previously-exited thread.
static bool g_audio_capture_thread_created = false;


// Set to true by the capture thread just before it returns, and reset to false
// by audio_start_thread() right before a new thread is spawned.
static atomic_bool g_audio_capture_thread_exited = false;


/* ============================================================================

 * Async Audio Packet Queue (decouples capture from network I/O)

 * ============================================================================ */


/**
 * One queued batch of Opus frames awaiting transmission by the sender thread.
 *
 * Slots of this type live in g_audio_send_queue; audio_queue_packet() fills a
 * slot and audio_sender_thread_func() copies it out before sending.
 */
typedef struct {

  uint8_t data[8 * 4000]; // Concatenated Opus payload; capacity is 32000 bytes (8 frames * 4000 bytes of headroom each)

  size_t size; // Number of valid bytes in data

  uint16_t frame_sizes[8]; // Encoded size in bytes of each frame stored in data, in order

  int frame_count; // Number of frames described by frame_sizes

} audio_send_packet_t;


// Number of slots in the send ring. One slot is always left unused so that
// head == tail means "empty" and (head + 1) % size == tail means "full".
#define AUDIO_SEND_QUEUE_SIZE 32

// Ring buffer of pending packets; head/tail are read and written while holding
// g_audio_send_queue_mutex.
static audio_send_packet_t g_audio_send_queue[AUDIO_SEND_QUEUE_SIZE];

static int g_audio_send_queue_head = 0; // Write position

static int g_audio_send_queue_tail = 0; // Read position

// Protects the ring indices and slots above.
static mutex_t g_audio_send_queue_mutex;

// Signaled when a packet is queued or when shutdown is requested.
static cond_t g_audio_send_queue_cond;

// True between audio_sender_init() and audio_sender_cleanup().
// Note: audio_queue_packet() and audio_sender_cleanup() read it without a lock.
static bool g_audio_send_queue_initialized = false;

// Serializes audio_sender_init() so the queue primitives are set up only once.
static static_mutex_t g_audio_send_queue_init_mutex = STATIC_MUTEX_INIT;


// True once the sender thread was successfully spawned in the worker pool.
static bool g_audio_sender_thread_created = false;

// Shutdown request flag polled by the sender thread.
static atomic_bool g_audio_sender_should_exit = false;


/**
 * Enqueue one batch of encoded Opus frames for the sender thread.
 *
 * The payload and per-frame sizes are copied into the next free slot of
 * g_audio_send_queue, so the caller may reuse its buffers immediately.
 * The call never blocks on network I/O; it only takes the queue mutex briefly.
 *
 * @param opus_data    Concatenated Opus frames (must be non-NULL).
 * @param opus_size    Total number of bytes in opus_data (must be non-zero and
 *                     fit in audio_send_packet_t::data).
 * @param frame_sizes  Size in bytes of each frame; must be non-NULL when
 *                     frame_count is positive.
 * @param frame_count  Number of entries in frame_sizes; must not exceed the
 *                     capacity of audio_send_packet_t::frame_sizes.
 * @return 0 when the packet was queued, -1 when it was rejected (queue not
 *         initialized, invalid arguments, payload too large, or queue full).
 */
static int audio_queue_packet(const uint8_t *opus_data, size_t opus_size, const uint16_t *frame_sizes,
                              int frame_count) {
  if (!g_audio_send_queue_initialized || !opus_data || opus_size == 0) {
    return -1;
  }

  // Slot capacities are derived from the struct so they cannot drift from it.
  const size_t max_payload = sizeof(g_audio_send_queue[0].data);
  const int max_frames =
      (int)(sizeof(g_audio_send_queue[0].frame_sizes) / sizeof(g_audio_send_queue[0].frame_sizes[0]));

  // Reject frame counts the slot cannot describe. Storing a larger count would make
  // the sender thread read past frame_sizes[] when it transmits the packet.
  if (frame_count < 0 || frame_count > max_frames || (frame_count > 0 && !frame_sizes)) {
    log_warn_every(LOG_RATE_FAST, "Audio send queue: invalid frame list, dropping packet");
    return -1;
  }

  // Report oversize payloads as a failure instead of silently dropping them
  // while still returning success.
  if (opus_size > max_payload) {
    log_warn_every(LOG_RATE_FAST, "Audio send queue: packet too large, dropping packet");
    return -1;
  }

  mutex_lock(&g_audio_send_queue_mutex);

  // Check if queue is full (one slot is always kept empty)
  int next_head = (g_audio_send_queue_head + 1) % AUDIO_SEND_QUEUE_SIZE;
  if (next_head == g_audio_send_queue_tail) {
    mutex_unlock(&g_audio_send_queue_mutex);
    log_warn_every(LOG_RATE_FAST, "Audio send queue full, dropping packet");
    return -1;
  }

  // Copy packet to queue
  audio_send_packet_t *packet = &g_audio_send_queue[g_audio_send_queue_head];
  memcpy(packet->data, opus_data, opus_size);
  packet->size = opus_size;
  packet->frame_count = frame_count;
  for (int i = 0; i < frame_count; i++) {
    packet->frame_sizes[i] = frame_sizes[i];
  }
  g_audio_send_queue_head = next_head;

  // Signal sender thread
  cond_signal(&g_audio_send_queue_cond);
  mutex_unlock(&g_audio_send_queue_mutex);

  return 0;
}


/**
 * Worker loop of the asynchronous audio sender.
 *
 * Waits on g_audio_send_queue_cond until a packet is available or shutdown is
 * requested, copies the packet out of the ring while holding the queue mutex,
 * then transmits it with threaded_send_audio_opus_batch() outside the lock.
 * Packets still queued when shutdown is requested are not sent.
 *
 * @param arg Unused.
 * @return Always NULL.
 */
static void *audio_sender_thread_func(void *arg) {
  (void)arg;
  log_debug("Audio sender thread started");

  // The profiling timers used below need the timer system to be up
  if (!timer_is_initialized()) {
    timer_system_init();
  }

  static int send_count = 0;

  for (;;) {
    if (atomic_load(&g_audio_sender_should_exit)) {
      break;
    }

    mutex_lock(&g_audio_send_queue_mutex);

    // Block until there is something to send or we are told to stop
    for (;;) {
      bool queue_empty = (g_audio_send_queue_head == g_audio_send_queue_tail);
      if (!queue_empty || atomic_load(&g_audio_sender_should_exit)) {
        break;
      }
      cond_wait(&g_audio_send_queue_cond, &g_audio_send_queue_mutex);
    }

    // Shutdown wins over pending packets
    if (atomic_load(&g_audio_sender_should_exit)) {
      mutex_unlock(&g_audio_send_queue_mutex);
      break;
    }

    // Take a private copy of the oldest packet so the slot can be reused at once
    audio_send_packet_t outgoing = g_audio_send_queue[g_audio_send_queue_tail];
    g_audio_send_queue_tail = (g_audio_send_queue_tail + 1) % AUDIO_SEND_QUEUE_SIZE;

    mutex_unlock(&g_audio_send_queue_mutex);

    // Network I/O may block here; that is fine because this is not the capture thread
    START_TIMER("network_send_audio");
    asciichat_error_t status =
        threaded_send_audio_opus_batch(outgoing.data, outgoing.size, outgoing.frame_sizes, outgoing.frame_count);
    double elapsed_ns = STOP_TIMER("network_send_audio");

    send_count++;

    if (status < 0) {
      log_debug_every(LOG_RATE_VERY_FAST, "Failed to send audio packet");
      continue;
    }

    // Only report every 50th send to keep the log readable
    if (send_count % 50 != 0) {
      continue;
    }

    char elapsed_text[32];
    format_duration_ns(elapsed_ns, elapsed_text, sizeof(elapsed_text));
    log_debug("Audio network send #%d: %zu bytes (%d frames) in %s", send_count, outgoing.size, outgoing.frame_count,
              elapsed_text);
  }

  log_debug("Audio sender thread exiting");

  // Release this thread's error context before it terminates
  asciichat_errno_destroy();

  return NULL;
}


/**
 * Set up the audio send queue and spawn the sender thread.
 *
 * Initialization of the queue mutex, condition variable and ring indices is
 * performed once, guarded by g_audio_send_queue_init_mutex; a call made while
 * the queue is already initialized returns without doing anything. The sender
 * thread is spawned in g_client_worker_pool after the init lock is released.
 * A spawn failure is logged but leaves the queue marked as initialized.
 */
static void audio_sender_init(void) {
  static_mutex_lock(&g_audio_send_queue_init_mutex);

  // Decide under the lock so two concurrent callers cannot both initialize
  const bool already_initialized = g_audio_send_queue_initialized;
  if (!already_initialized) {
    mutex_init(&g_audio_send_queue_mutex);
    cond_init(&g_audio_send_queue_cond);
    g_audio_send_queue_head = 0;
    g_audio_send_queue_tail = 0;
    g_audio_send_queue_initialized = true;
    atomic_store(&g_audio_sender_should_exit, false);
  }

  static_mutex_unlock(&g_audio_send_queue_init_mutex);

  if (already_initialized) {
    return;
  }

  // Spawn outside the init lock so other threads are not held up by thread creation
  if (thread_pool_spawn(g_client_worker_pool, audio_sender_thread_func, NULL, 5, "audio_sender") != ASCIICHAT_OK) {
    log_error("Failed to spawn audio sender thread in worker pool");
    LOG_ERRNO_IF_SET("Audio sender thread creation failed");
    return;
  }

  g_audio_sender_thread_created = true;
  log_debug("Audio sender thread created");
}


/**
 * Request sender-thread shutdown and tear down the send queue primitives.
 *
 * Does nothing when the queue was never initialized. Otherwise it sets the
 * exit flag, wakes the sender thread, clears the "thread created" flag,
 * destroys the queue mutex and condition variable, and marks the queue as
 * uninitialized. Packets still in the ring are discarded.
 *
 * NOTE(review): this function does not join the sender thread itself (see the
 * comment below), yet it destroys the mutex and condition variable right after
 * signaling. If the sender thread has not yet left cond_wait()/mutex_unlock()
 * at that point it would be using destroyed primitives - confirm that callers
 * guarantee the thread has stopped, or move the destroy calls after the join.
 */
static void audio_sender_cleanup(void) {

  if (!g_audio_send_queue_initialized) {

    return;

  }


  // Signal thread to exit
  // The flag is set before taking the lock; the signal is sent while holding
  // the queue mutex so a sender thread blocked in cond_wait() is woken.

  atomic_store(&g_audio_sender_should_exit, true);

  mutex_lock(&g_audio_send_queue_mutex);

  cond_signal(&g_audio_send_queue_cond);

  mutex_unlock(&g_audio_send_queue_mutex);


  // Thread will be joined by thread_pool_stop_all() in protocol_stop_connection()

  if (THREAD_IS_CREATED(g_audio_sender_thread_created)) {

    g_audio_sender_thread_created = false;

    log_debug("Audio sender thread will be joined by thread pool");

  }


  // Tear down queue primitives and allow audio_sender_init() to run again

  mutex_destroy(&g_audio_send_queue_mutex);

  cond_destroy(&g_audio_send_queue_cond);

  g_audio_send_queue_initialized = false;

}


/* ============================================================================

 * Audio Processing Constants

 * ============================================================================ */


// Linear gain factor for audio samples; 1.0f is unity gain.
// NOTE(review): not referenced in the visible part of this file - confirm it is still used.
#define AUDIO_VOLUME_BOOST 1.0f // No boost/attenuation


/* ============================================================================

 * Audio Processing Functions

 * ============================================================================ */


void audio_process_received_samples(const float *samples, int num_samples) {

  // Validate parameters

  if (!samples || num_samples <= 0) {

    SET_ERRNO(ERROR_INVALID_PARAM, "Invalid audio samples: samples=%p, num_samples=%d", (void *)samples, num_samples);

    return;

  }


  if (!GET_OPTION(audio_enabled)) {

    log_warn_every(NS_PER_MS_INT, "Received audio samples but audio is disabled");

    return;

  }


  // Allow both single packets and batched packets

  if (num_samples > AUDIO_BATCH_SAMPLES) {

    log_warn("Audio packet too large: %d samples (max %d)", num_samples, AUDIO_BATCH_SAMPLES);

    return;

  }


  // Calculate RMS energy of received samples

  float sum_squares = 0.0f;

  for (int i = 0; i < num_samples; i++) {

    sum_squares += samples[i] * samples[i];

  }

  float received_rms = sqrtf(sum_squares / num_samples);


  // DUMP: Received audio from server (before playback processing)

  if (g_wav_playback_received) {

    wav_writer_write(g_wav_playback_received, samples, num_samples);

  }


  // Track samples for analysis

  if (GET_OPTION(audio_analysis_enabled)) {

    for (int i = 0; i < num_samples; i++) {

      audio_analysis_track_received_sample(samples[i]);

    }

  }


  // Copy samples to playback buffer (no processing needed - mixer already handled clipping)

  float audio_buffer[AUDIO_BATCH_SAMPLES];

  memcpy(audio_buffer, samples, (size_t)num_samples * sizeof(float));


  // DEBUG: Log what we're writing to playback buffer (with first 4 samples to verify audio integrity)

  static int recv_count = 0;

  recv_count++;

  if (recv_count <= 10 || recv_count % 50 == 0) {

    float peak = 0.0f;

    for (int i = 0; i < num_samples; i++) {

      float abs_val = fabsf(samples[i]);

      if (abs_val > peak)

        peak = abs_val;

    }

    log_debug("CLIENT AUDIO RECV #%d: %d samples, RMS=%.6f, Peak=%.6f, first4=[%.4f,%.4f,%.4f,%.4f]", recv_count,

              num_samples, received_rms, peak, num_samples > 0 ? samples[0] : 0.0f, num_samples > 1 ? samples[1] : 0.0f,

              num_samples > 2 ? samples[2] : 0.0f, num_samples > 3 ? samples[3] : 0.0f);

  }


  // Submit to playback system (goes to jitter buffer and speakers)

  // NOTE: AEC3's AnalyzeRender is called in output_callback() when audio actually plays,

  // NOT here. The jitter buffer adds 50-100ms delay, so calling AnalyzeRender here

  // would give AEC3 the wrong timing and break echo cancellation.

  audio_write_samples(&g_audio_context, audio_buffer, num_samples);


  // Log latency after writing to playback buffer

  if (g_audio_context.playback_buffer) {

    size_t buffer_samples = audio_ring_buffer_available_read(g_audio_context.playback_buffer);

    float buffer_latency_ms = (float)buffer_samples / 48.0f;

    log_dev_every(500 * US_PER_MS_INT, "LATENCY: Client playback buffer after recv: %.1fms (%zu samples)",

                  buffer_latency_ms, buffer_samples);

  }


#ifdef DEBUG_AUDIO

  log_debug("Processed %d received audio samples", num_samples);

#endif

}


/* ============================================================================

 * Audio Capture Thread Implementation

 * ============================================================================ */


/**
 * Capture thread: drains the capture ring buffer, encodes Opus frames and
 * queues them for the sender thread.
 *
 * Each loop iteration:
 *  1. waits (sleeping) until the server connection is active, the pipeline
 *     exists and samples are available;
 *  2. reads up to CAPTURE_READ_SIZE samples and scales them down when their
 *     peak exceeds 1.0;
 *  3. accumulates them into OPUS_FRAME_SAMPLES-sized frames and runs each
 *     complete frame through client_audio_pipeline_capture();
 *  4. hands the encoded frames of this iteration to audio_queue_packet() as
 *     one batch, so network I/O never happens on this thread.
 *
 * The loop ends when should_exit() or server_connection_is_lost() becomes
 * true; g_audio_capture_thread_exited is then set so the thread can be
 * recreated.
 *
 * @param arg Unused.
 * @return Always NULL.
 */
static void *audio_capture_thread_func(void *arg) {
  (void)arg;

  log_debug("Audio capture thread started");

  // Initialize timing system for performance profiling
  if (!timer_is_initialized()) {
    timer_system_init();
  }

  // FPS tracking for audio capture thread (tracking Opus frames, ~50 FPS at 20ms per frame)
  static fps_t fps_tracker = {0};
  static bool fps_tracker_initialized = false;
  if (!fps_tracker_initialized) {
    fps_init(&fps_tracker, 50, "AUDIO_TX");
    fps_tracker_initialized = true;
  }

  // Detailed timing stats (static: they accumulate across thread restarts)
  static double total_loop_ns = 0;
  static double total_read_ns = 0;
  static double total_encode_ns = 0;
  static double total_queue_ns = 0;
  static double max_loop_ns = 0;
  static double max_read_ns = 0;
  static double max_encode_ns = 0;
  static double max_queue_ns = 0;
  static uint64_t timing_loop_count = 0;

// Opus frame size: 960 samples = 20ms @ 48kHz (must match pipeline config)
#define OPUS_FRAME_SAMPLES 960
#define OPUS_MAX_PACKET_SIZE 500 // Max Opus packet size

  // Read enough samples per iteration to drain faster than we fill
  // Buffer holds multiple Opus frames worth to prevent overflow
  // 4 frames = 3840 samples = 80ms, but we'll read what's available up to this
#define CAPTURE_READ_SIZE (OPUS_FRAME_SAMPLES * 4)

  float audio_buffer[CAPTURE_READ_SIZE];
  static bool wav_dumpers_initialized = false;

  // Initialize WAV dumpers only once (file handles persist)
  if (!wav_dumpers_initialized && wav_dump_enabled()) {
    g_wav_capture_raw = wav_writer_open("/tmp/audio_capture_raw.wav", AUDIO_SAMPLE_RATE, 1);
    g_wav_capture_processed = wav_writer_open("/tmp/audio_capture_processed.wav", AUDIO_SAMPLE_RATE, 1);
    log_debug("Audio debugging enabled: dumping to /tmp/audio_capture_*.wav");
    wav_dumpers_initialized = true;
  }

  // Accumulator for building complete Opus frames
  float opus_frame_buffer[OPUS_FRAME_SAMPLES];
  int opus_frame_samples_collected = 0;

  // Batch buffer for multiple Opus frames - send all at once to reduce blocking
#define MAX_BATCH_FRAMES 8
#define BATCH_TIMEOUT_NS (40LL * NS_PER_MS_INT) // Flush batch after 40ms even if not full (2 Opus frames @ 20ms each)
  static uint8_t batch_buffer[MAX_BATCH_FRAMES * OPUS_MAX_PACKET_SIZE];
  static uint16_t batch_frame_sizes[MAX_BATCH_FRAMES];
  static int batch_frame_count = 0;
  static size_t batch_total_size = 0;
  static uint64_t batch_start_time_ns = 0;
  static bool batch_has_data = false;

  while (!should_exit() && !server_connection_is_lost()) {
    START_TIMER("audio_capture_loop_iteration");
    timing_loop_count++;

    if (!server_connection_is_active()) {
      STOP_TIMER("audio_capture_loop_iteration"); // Don't count sleep time
      platform_sleep_us(100 * US_PER_MS_INT);     // Wait for connection
      continue;
    }

    // Check if pipeline is ready
    if (!g_audio_pipeline) {
      STOP_TIMER("audio_capture_loop_iteration"); // Don't count sleep time
      platform_sleep_us(100 * US_PER_MS_INT);
      continue;
    }

    // Check how many samples are available in the ring buffer
    int available = audio_ring_buffer_available_read(g_audio_context.capture_buffer);
    if (available <= 0) {
      // Flush partial batch before sleeping (prevent starvation during idle periods)
      if (batch_has_data && batch_frame_count > 0) {
        uint64_t now_ns = time_get_ns();
        uint64_t elapsed_ns = time_elapsed_ns(batch_start_time_ns, now_ns);

        if (elapsed_ns >= BATCH_TIMEOUT_NS) {
          long elapsed_ms = (long)time_ns_to_ms(elapsed_ns);
          log_debug_every(LOG_RATE_FAST, "Idle timeout flush: %d frames (%zu bytes) after %ld ms", batch_frame_count,
                          batch_total_size, elapsed_ms);
          (void)audio_queue_packet(batch_buffer, batch_total_size, batch_frame_sizes, batch_frame_count);
          batch_frame_count = 0;
          batch_total_size = 0;
          batch_has_data = false;
        }
      }

      // Sleep briefly to reduce CPU usage when idle
      // 5ms polling = 200 times/sec, fast enough to catch audio promptly
      // Note: 50ms was causing 872ms gaps in audio transmission!
      STOP_TIMER("audio_capture_loop_iteration"); // Must stop before loop repeats
      platform_sleep_us(5 * US_PER_MS_INT);       // 5ms (was 50ms - caused huge gaps!)
      continue;
    }

    // Read as many samples as possible (up to CAPTURE_READ_SIZE) to drain faster
    // This prevents buffer overflow when processing is slower than capture
    int to_read = (available < CAPTURE_READ_SIZE) ? available : CAPTURE_READ_SIZE;

    START_TIMER("audio_read_samples");
    asciichat_error_t read_result = audio_read_samples(&g_audio_context, audio_buffer, to_read);
    double read_time_ns = STOP_TIMER("audio_read_samples");

    total_read_ns += read_time_ns;
    if (read_time_ns > max_read_ns) {
      max_read_ns = read_time_ns;
    }

    if (read_result != ASCIICHAT_OK) {
      log_error("Failed to read audio samples from ring buffer");
      STOP_TIMER("audio_capture_loop_iteration"); // Don't count sleep time
      platform_sleep_us(5 * US_PER_MS_INT);       // 5ms (error path - was 50ms, caused gaps!)
      continue;
    }

    int samples_read = to_read;

    // Log every 10 reads to see if we're getting samples
    static int total_reads = 0;
    total_reads++;
    if (total_reads % 10 == 0) {
      log_debug("Audio capture loop iteration #%d: available=%d, samples_read=%d", total_reads, available,
                samples_read);
    }

    if (samples_read > 0) {
      // Normalize input to prevent clipping: bring peak to ±0.99
      // Calculate peak level first
      float peak = 0.0f;
      for (int i = 0; i < samples_read; i++) {
        float abs_val = fabsf(audio_buffer[i]);
        if (abs_val > peak) {
          peak = abs_val;
        }
      }

      // Apply normalization if peak exceeds 1.0
      // Use 0.99 to leave headroom for processing
      if (peak > 1.0f) {
        float gain = 0.99f / peak;
        for (int i = 0; i < samples_read; i++) {
          audio_buffer[i] *= gain;
        }
        static int norm_count = 0;
        norm_count++;
        if (norm_count <= 5 || norm_count % 100 == 0) {
          log_debug("Input normalization #%d: peak=%.4f, gain=%.4f", norm_count, peak, gain);
        }
      }

      // DUMP: Captured audio as read from the ring buffer (after the normalization above)
      if (g_wav_capture_raw) {
        wav_writer_write(g_wav_capture_raw, audio_buffer, samples_read);
      }

      // DEBUG: Periodically log what we're getting from the ring buffer.
      // The RMS here only covers the first (up to) 10 samples of the read.
      static int read_count = 0;
      read_count++;
      float sum_squares = 0.0f;
      for (int i = 0; i < samples_read && i < 10; i++) {
        sum_squares += audio_buffer[i] * audio_buffer[i];
      }
      float rms = sqrtf(sum_squares / (samples_read > 10 ? 10 : samples_read));
      if (read_count <= 5 || read_count % 20 == 0) {
        log_debug("Audio capture read #%d: available=%d, samples_read=%d, first=[%.6f,%.6f,%.6f], RMS=%.6f", read_count,
                  available, samples_read, samples_read > 0 ? audio_buffer[0] : 0.0f,
                  samples_read > 1 ? audio_buffer[1] : 0.0f, samples_read > 2 ? audio_buffer[2] : 0.0f, rms);
      }

      // Track sent samples for analysis
      if (GET_OPTION(audio_analysis_enabled)) {
        for (int i = 0; i < samples_read; i++) {
          audio_analysis_track_sent_sample(audio_buffer[i]);
        }
      }

      // Accumulate samples into Opus frame buffer
      int samples_to_process = samples_read;
      int sample_offset = 0;

      while (samples_to_process > 0) {
        // How many samples can we add to current frame?
        int space_in_frame = OPUS_FRAME_SAMPLES - opus_frame_samples_collected;
        int samples_to_copy = (samples_to_process < space_in_frame) ? samples_to_process : space_in_frame;

        // Copy samples to frame buffer
        memcpy(&opus_frame_buffer[opus_frame_samples_collected], &audio_buffer[sample_offset],
               (size_t)samples_to_copy * sizeof(float));

        opus_frame_samples_collected += samples_to_copy;
        sample_offset += samples_to_copy;
        samples_to_process -= samples_to_copy;

        // Do we have a complete frame?
        if (opus_frame_samples_collected >= OPUS_FRAME_SAMPLES) {
          // Process through pipeline: AEC, filters, AGC, noise gate, Opus encode
          uint8_t opus_packet[OPUS_MAX_PACKET_SIZE];

          START_TIMER("opus_encode");
          int opus_len = client_audio_pipeline_capture(g_audio_pipeline, opus_frame_buffer, OPUS_FRAME_SAMPLES,
                                                       opus_packet, OPUS_MAX_PACKET_SIZE);

          static int encode_count = 0;
          encode_count++;
          double opus_elapsed_ns = STOP_TIMER("opus_encode");
          if (encode_count % 50 == 0) {
            if (opus_elapsed_ns >= 0.0) {
              char _duration_str[32];
              format_duration_ns(opus_elapsed_ns, _duration_str, sizeof(_duration_str));
              log_dev("Opus encode #%d: %d samples -> %d bytes in %s", encode_count, OPUS_FRAME_SAMPLES, opus_len,
                      _duration_str);
            }
          }

          // Feed the measured encode time into the statistics. This used to be hard-wired to 0,
          // which made the "encode avg/max" figures in the timing report always read zero.
          // Negative timer results are treated as "no measurement".
          double encode_time_ns = (opus_elapsed_ns >= 0.0) ? opus_elapsed_ns : 0.0;

          total_encode_ns += encode_time_ns;
          if (encode_time_ns > max_encode_ns) {
            max_encode_ns = encode_time_ns;
          }

          if (opus_len > 0) {
            log_debug_every(LOG_RATE_VERY_FAST, "Pipeline encoded: %d samples -> %d bytes (compression: %.1fx)",
                            OPUS_FRAME_SAMPLES, opus_len,
                            (float)(OPUS_FRAME_SAMPLES * sizeof(float)) / (float)opus_len);

            // Add to batch buffer
            if (batch_frame_count < MAX_BATCH_FRAMES && batch_total_size + (size_t)opus_len <= sizeof(batch_buffer)) {
              // Mark batch start time on first frame
              if (batch_frame_count == 0) {
                batch_start_time_ns = time_get_ns();
                batch_has_data = true;
              }

              memcpy(batch_buffer + batch_total_size, opus_packet, (size_t)opus_len);
              batch_frame_sizes[batch_frame_count] = (uint16_t)opus_len;
              batch_total_size += (size_t)opus_len;
              batch_frame_count++;

              if (GET_OPTION(audio_analysis_enabled)) {
                audio_analysis_track_sent_packet((size_t)opus_len);
              }
            } else {
              // The frame does not fit into the current batch; make the loss visible instead of
              // dropping it silently.
              log_warn_every(LOG_RATE_FAST, "Audio batch full, dropping encoded Opus frame (%d bytes)", opus_len);
            }
          } else if (opus_len == 0) {
            // DTX frame (silence) - no data to send
            log_debug_every(LOG_RATE_VERY_FAST, "Pipeline DTX frame (silence detected)");
          }

          // Reset frame buffer
          opus_frame_samples_collected = 0;
        }
      }

      // Queue batch for async sending (non-blocking - sender thread handles network I/O)
      if (batch_frame_count > 0) {
        static int batch_send_count = 0;
        batch_send_count++;

        START_TIMER("audio_queue_packet");
        int queue_result = audio_queue_packet(batch_buffer, batch_total_size, batch_frame_sizes, batch_frame_count);
        double queue_time_ns = STOP_TIMER("audio_queue_packet");

        total_queue_ns += queue_time_ns;
        if (queue_time_ns > max_queue_ns) {
          max_queue_ns = queue_time_ns;
        }

        if (queue_result < 0) {
          log_debug_every(LOG_RATE_VERY_FAST, "Failed to queue audio batch (queue full)");
        } else {
          if (batch_send_count <= 10 || batch_send_count % 50 == 0) {
            char queue_duration_str[32];
            format_duration_ns(queue_time_ns, queue_duration_str, sizeof(queue_duration_str));
            log_debug("CLIENT: Queued Opus batch #%d (%d frames, %zu bytes) in %s", batch_send_count, batch_frame_count,
                      batch_total_size, queue_duration_str);
          }
          // Track audio frame for FPS reporting
          fps_frame_ns(&fps_tracker, time_get_ns(), "audio batch queued");
        }

        // Reset batch (a batch that could not be queued is discarded)
        batch_frame_count = 0;
        batch_total_size = 0;
        batch_has_data = false;
      }

      // Log overall loop iteration time periodically
      double loop_time_ns = STOP_TIMER("audio_capture_loop_iteration");
      total_loop_ns += loop_time_ns;
      if (loop_time_ns > max_loop_ns) {
        max_loop_ns = loop_time_ns;
      }

      // Comprehensive timing report every 100 iterations.
      // Averages are per loop iteration (including iterations that only slept).
      if (timing_loop_count % 100 == 0) {
        char avg_loop_str[32], max_loop_str[32];
        char avg_read_str[32], max_read_str[32];
        char avg_encode_str[32], max_encode_str[32];
        char avg_queue_str[32], max_queue_str[32];

        format_duration_ns(total_loop_ns / timing_loop_count, avg_loop_str, sizeof(avg_loop_str));
        format_duration_ns(max_loop_ns, max_loop_str, sizeof(max_loop_str));
        format_duration_ns(total_read_ns / timing_loop_count, avg_read_str, sizeof(avg_read_str));
        format_duration_ns(max_read_ns, max_read_str, sizeof(max_read_str));
        format_duration_ns(total_encode_ns / timing_loop_count, avg_encode_str, sizeof(avg_encode_str));
        format_duration_ns(max_encode_ns, max_encode_str, sizeof(max_encode_str));
        format_duration_ns(total_queue_ns / timing_loop_count, avg_queue_str, sizeof(avg_queue_str));
        format_duration_ns(max_queue_ns, max_queue_str, sizeof(max_queue_str));

        // uint64_t is not `unsigned long` on every platform, so cast explicitly to match the
        // conversion specifier.
        log_debug("CAPTURE TIMING #%llu: loop avg=%s max=%s, read avg=%s max=%s",
                  (unsigned long long)timing_loop_count, avg_loop_str, max_loop_str, avg_read_str, max_read_str);
        // Continuation of the line above: keep it at the same log level so the two never get separated.
        log_debug("  encode avg=%s max=%s, queue avg=%s max=%s", avg_encode_str, max_encode_str, avg_queue_str,
                  max_queue_str);
      }

      // Check if we have a partial batch that's been waiting too long (time-based flush)
      // This prevents batches from sitting indefinitely when audio capture is irregular
      if (batch_has_data && batch_frame_count > 0) {
        uint64_t now_ns = time_get_ns();
        uint64_t elapsed_ns = time_elapsed_ns(batch_start_time_ns, now_ns);

        if (elapsed_ns >= BATCH_TIMEOUT_NS) {
          static int timeout_flush_count = 0;
          timeout_flush_count++;

          long elapsed_ms = (long)time_ns_to_ms(elapsed_ns);
          log_debug_every(LOG_RATE_FAST, "Timeout flush #%d: %d frames (%zu bytes) after %ld ms", timeout_flush_count,
                          batch_frame_count, batch_total_size, elapsed_ms);

          // Queue partial batch
          int queue_result = audio_queue_packet(batch_buffer, batch_total_size, batch_frame_sizes, batch_frame_count);
          if (queue_result == 0) {
            // Track audio frame for FPS reporting
            fps_frame_ns(&fps_tracker, time_get_ns(), "audio batch timeout flush");
          }

          // Reset batch
          batch_frame_count = 0;
          batch_total_size = 0;
          batch_has_data = false;
        }
      }

      // Yield to reduce CPU usage - audio arrives at ~20ms per Opus frame (960 samples @ 48kHz)
      // Without sleep, thread spins at 90-100% CPU constantly checking for new samples
      // Even 1ms sleep reduces CPU usage from 90% to <10% with minimal latency impact
      platform_sleep_us(1 * US_PER_MS_INT); // 1ms
    } else {
      // Track loop time even when no samples processed
      double loop_time_ns = STOP_TIMER("audio_capture_loop_iteration");
      total_loop_ns += loop_time_ns;
      if (loop_time_ns > max_loop_ns) {
        max_loop_ns = loop_time_ns;
      }

      // Flush partial batch before sleeping on error path (prevent starvation)
      if (batch_has_data && batch_frame_count > 0) {
        uint64_t now_ns = time_get_ns();
        uint64_t elapsed_ns = time_elapsed_ns(batch_start_time_ns, now_ns);

        if (elapsed_ns >= BATCH_TIMEOUT_NS) {
          long elapsed_ms = (long)time_ns_to_ms(elapsed_ns);
          log_debug_every(LOG_RATE_FAST, "Error path timeout flush: %d frames (%zu bytes) after %ld ms",
                          batch_frame_count, batch_total_size, elapsed_ms);
          (void)audio_queue_packet(batch_buffer, batch_total_size, batch_frame_sizes, batch_frame_count);
          batch_frame_count = 0;
          batch_total_size = 0;
          batch_has_data = false;
        }
      }

      platform_sleep_us(5 * US_PER_MS_INT); // 5ms (error path - was 50ms, caused gaps!)
    }
  }

  log_debug("Audio capture thread stopped");
  atomic_store(&g_audio_capture_thread_exited, true);

  // Clean up thread-local error context before exit
  asciichat_errno_destroy();

  return NULL;
}


/* ============================================================================

 * Public Interface Functions

 * ============================================================================ */


int audio_client_init() {

  if (!GET_OPTION(audio_enabled)) {

    return 0; // Audio disabled - not an error

  }


  // Initialize WAV dumper for received audio if debugging enabled

  if (wav_dump_enabled()) {

    g_wav_playback_received = wav_writer_open("/tmp/audio_playback_received.wav", AUDIO_SAMPLE_RATE, 1);

    if (g_wav_playback_received) {

      log_debug("Audio debugging enabled: dumping received audio to /tmp/audio_playback_received.wav");

    }

  }


  // Initialize PortAudio context using library function

  log_debug("DEBUG: About to call audio_init()...");

  if (audio_init(&g_audio_context) != ASCIICHAT_OK) {

    log_error("Failed to initialize audio system");

    // Clean up WAV writer if it was opened

    if (g_wav_playback_received) {

      wav_writer_close(g_wav_playback_received);

      g_wav_playback_received = NULL;

    }

    return -1;

  }

  log_debug("DEBUG: audio_init() completed successfully");


  // Create unified audio pipeline (handles AEC, AGC, noise suppression, Opus)

  client_audio_pipeline_config_t pipeline_config = client_audio_pipeline_default_config();

  pipeline_config.opus_bitrate = 128000; // 128 kbps AUDIO mode for music quality


  // Enable echo cancellation, AGC, and essential processing for clear audio

  // Noise suppression and VAD can destroy music quality, so keep them disabled

  pipeline_config.flags.echo_cancel = true;     // ENABLE: removes echo

  pipeline_config.flags.jitter_buffer = true;   // ENABLE: needed for AEC sync

  pipeline_config.flags.noise_suppress = false; // DISABLED: destroys music quality

  pipeline_config.flags.agc = true;             // ENABLE: boost quiet microphones (35 dB gain)

  pipeline_config.flags.vad = false;            // DISABLED: destroys music quality

  pipeline_config.flags.compressor = true;      // ENABLE: prevent clipping from AGC boost

  pipeline_config.flags.noise_gate = false;     // DISABLED: would cut quiet music passages

  pipeline_config.flags.highpass = true;        // ENABLE: remove rumble and low-frequency feedback

  pipeline_config.flags.lowpass = false;        // DISABLED: preserve high-frequency content


  // Set jitter buffer margin for smooth playback without excessive delay

  // 100ms is conservative - AEC3 will adapt to actual network delay automatically

  // We don't tune this; let the system adapt to its actual conditions

  pipeline_config.jitter_margin_ns = 100;


  log_debug("DEBUG: About to create audio pipeline...");

  g_audio_pipeline = client_audio_pipeline_create(&pipeline_config);

  log_debug("DEBUG: client_audio_pipeline_create() returned");

  if (!g_audio_pipeline) {

    log_error("Failed to create audio pipeline");

    audio_destroy(&g_audio_context);

    // Clean up WAV writer if it was opened

    if (g_wav_playback_received) {

      wav_writer_close(g_wav_playback_received);

      g_wav_playback_received = NULL;

    }

    return -1;

  }


  log_debug("Audio pipeline created: %d Hz sample rate, %d bps bitrate", pipeline_config.sample_rate,

            pipeline_config.opus_bitrate);


  // Associate pipeline with audio context for echo cancellation

  // The audio output callback will feed playback samples directly to AEC3 from the speaker output,

  // ensuring proper timing synchronization (not from the decode path 50-100ms earlier)

  audio_set_pipeline(&g_audio_context, (void *)g_audio_pipeline);


  // Start full-duplex audio (simultaneous capture + playback for perfect AEC3 timing)

  if (audio_start_duplex(&g_audio_context) != ASCIICHAT_OK) {

    log_error("Failed to start full-duplex audio");

    client_audio_pipeline_destroy(g_audio_pipeline);

    g_audio_pipeline = NULL;

    audio_destroy(&g_audio_context);

    // Clean up WAV writer if it was opened

    if (g_wav_playback_received) {

      wav_writer_close(g_wav_playback_received);

      g_wav_playback_received = NULL;

    }

    return -1;

  }


  // Initialize async audio sender (decouples capture from network I/O)

  audio_sender_init();


  return 0;

}


/**
 * Start the audio capture thread in the client worker pool.
 *
 * Returns immediately with success when audio is disabled or when a capture
 * thread is already tracked as running. When a previously started capture
 * thread has flagged itself as exited, its handle is joined (5 s timeout) and
 * the tracking flag is reset before a new thread is spawned. The audio
 * STREAM_START packet is sent to the server before the thread is spawned so
 * that no audio packet can precede it.
 *
 * @return 0 on success or when there is nothing to do; -1 when the stream
 *         start packet could not be sent or the thread could not be spawned.
 */
int audio_start_thread() {
  log_debug("audio_start_thread called: audio_enabled=%d", GET_OPTION(audio_enabled));

  if (!GET_OPTION(audio_enabled)) {
    log_debug("Audio is disabled, skipping audio capture thread creation");
    return 0; // Audio disabled - not an error
  }

  if (g_audio_capture_thread_created) {
    // Read the exit flag once so both decisions below see the same value.
    if (!atomic_load(&g_audio_capture_thread_exited)) {
      log_warn("Audio capture thread already running");
      return 0;
    }

    // The previous thread has exited: reap it so a new one can be created.
    log_debug("Previous audio capture thread exited, recreating");

    // Use a timeout to prevent indefinite blocking.
    // NOTE(review): the thread is spawned through thread_pool_spawn(), which is
    // not given g_audio_capture_thread - confirm this handle is ever populated.
    // NOTE(review): if NS_PER_MS_INT has type int, 5000 * NS_PER_MS_INT exceeds
    // INT_MAX - confirm the macro's type / the timeout parameter's width.
    int join_result = asciichat_thread_join_timeout(&g_audio_capture_thread, NULL, 5000 * NS_PER_MS_INT);
    if (join_result != 0) {
      // The stuck thread's resources are leaked; continuing is preferred to hanging.
      log_warn("Audio capture thread join timed out after 5s - thread may be deadlocked, "
               "forcing thread handle reset (stuck thread resources will not be cleaned up)");
    }
    g_audio_capture_thread_created = false;
  }

  // Notify the server BEFORE spawning the thread: STREAM_START must precede any
  // audio packet to avoid a protocol violation.
  // The call returns asciichat_error_t, so compare against ASCIICHAT_OK like
  // the other asciichat_error_t calls in this file; a "< 0" test would miss
  // any non-negative error code.
  if (threaded_send_stream_start_packet(STREAM_TYPE_AUDIO) != ASCIICHAT_OK) {
    log_error("Failed to send audio stream start packet");
    return -1; // Don't start thread if we can't notify server
  }

  // Clear the exit flag before the thread can run, then spawn it.
  atomic_store(&g_audio_capture_thread_exited, false);
  if (thread_pool_spawn(g_client_worker_pool, audio_capture_thread_func, NULL, 4, "audio_capture") != ASCIICHAT_OK) {
    log_error("Failed to spawn audio capture thread in worker pool");
    LOG_ERRNO_IF_SET("Audio capture thread creation failed");
    return -1;
  }

  g_audio_capture_thread_created = true;
  return 0;
}


/**
 * Ask the audio sender to exit and wait briefly for the capture thread.
 *
 * The sender is signalled first (exit flag + condition variable) so that it is
 * not left blocked in cond_wait() when the thread pool is stopped later. The
 * capture thread is then polled for up to 20 x 100ms; it is not joined here -
 * thread_pool_stop_all() in protocol_stop_connection() does that.
 */
void audio_stop_thread() {
  // Wake the sender thread: it waits on a condition variable for packets, so
  // the exit flag alone would not get it out of cond_wait().
  if (g_audio_send_queue_initialized) {
    log_debug("Signaling audio sender thread to exit");
    atomic_store(&g_audio_sender_should_exit, true);

    mutex_lock(&g_audio_send_queue_mutex);
    cond_signal(&g_audio_send_queue_cond);
    mutex_unlock(&g_audio_send_queue_mutex);
  }

  // No capture thread was started - nothing left to wait for.
  if (!THREAD_IS_CREATED(g_audio_capture_thread_created)) {
    return;
  }

  // signal_exit() is deliberately not called: it is reserved for global
  // shutdown. The capture thread notices connection loss on its own via
  // server_connection_is_active().

  // Give the thread a bounded grace period to report that it has exited.
  for (int polls_left = 20; polls_left > 0; polls_left--) {
    if (atomic_load(&g_audio_capture_thread_exited)) {
      break;
    }
    platform_sleep_us(100 * US_PER_MS_INT); // 100ms
  }

  if (!atomic_load(&g_audio_capture_thread_exited)) {
    log_warn("Audio capture thread not responding - will be joined by thread pool");
  }

  // The join itself is left to thread_pool_stop_all(); only tracking is reset.
  g_audio_capture_thread_created = false;

  log_debug("Audio capture thread stopped");
}


/**
 * Report whether the audio capture thread has flagged itself as exited.
 *
 * @return the current value of the atomic exit flag.
 */
bool audio_thread_exited() {
  const bool has_exited = atomic_load(&g_audio_capture_thread_exited);
  return has_exited;
}


/**
 * Tear down the client audio subsystem.
 *
 * No-op when audio is disabled. Otherwise the steps run in this fixed order:
 * stop the capture thread, clean up the async sender, terminate PortAudio,
 * stop the duplex stream, detach the pipeline from the audio context, wait
 * 500ms, destroy the pipeline, close any open WAV dump writers, and finally
 * destroy the audio context.
 */
void audio_cleanup() {

  // Nothing was set up when audio is disabled.
  if (!GET_OPTION(audio_enabled)) {

    return;

  }


  // Stop capture thread first (stops producing packets)

  audio_stop_thread();


  // Stop async sender thread (drains queue and exits)

  audio_sender_cleanup();


  // Terminate PortAudio before audio_stop_duplex() and audio_destroy() so that

  // device resources are freed ahead of the rest of the teardown.
  // NOTE(review): audio_stop_duplex() below runs after PortAudio has been terminated - confirm it tolerates that.

  audio_terminate_portaudio_final();


  // Stop the audio stream before the pipeline is destroyed.

  // PortAudio may invoke the callback one more time after we request stop,

  // so the pipeline is only detached and destroyed after this point.

  if (g_audio_context.initialized) {

    audio_stop_duplex(&g_audio_context);

  }


  // Clear the pipeline pointer from audio context BEFORE destroying pipeline

  // This prevents any lingering PortAudio callbacks from trying to access freed memory

  audio_set_pipeline(&g_audio_context, NULL);


  // Sleep to allow CoreAudio threads to finish executing callbacks.

  // On macOS, CoreAudio's internal threads may continue running after Pa_StopStream() returns.

  // The duplex_callback may still be in-flight on other threads. Even after we set the pipeline

  // pointer to NULL, a CoreAudio thread may have already cached the pointer before the assignment.

  // The sleep is a grace period for such in-flight callbacks to finish before the pipeline is destroyed.

  // NOTE(review): this is a timing heuristic, not synchronization - 500ms is assumed to be enough.

  platform_sleep_us(500 * US_PER_MS_INT); // 500ms - macOS CoreAudio needs time to shut down all threads


  // Destroy audio pipeline (handles Opus, AEC, etc.)

  if (g_audio_pipeline) {

    client_audio_pipeline_destroy(g_audio_pipeline);

    g_audio_pipeline = NULL;

    log_debug("Audio pipeline destroyed");

  }


  // Close WAV dumpers (each writer is non-NULL only if it was opened)

  if (g_wav_capture_raw) {

    wav_writer_close(g_wav_capture_raw);

    g_wav_capture_raw = NULL;

    log_debug("Closed audio capture raw dump");

  }

  if (g_wav_capture_processed) {

    wav_writer_close(g_wav_capture_processed);

    g_wav_capture_processed = NULL;

    log_debug("Closed audio capture processed dump");

  }

  if (g_wav_playback_received) {

    wav_writer_close(g_wav_playback_received);

    g_wav_playback_received = NULL;

    log_debug("Closed audio playback received dump");

  }


  // Finally destroy the audio context

  if (g_audio_context.initialized) {

    audio_destroy(&g_audio_context);

  }

}


/**
 * Get the client audio pipeline (for advanced usage).
 *
 * @return the current pipeline pointer; NULL while no pipeline exists (the
 *         pointer starts out NULL and is reset to NULL when the pipeline is
 *         destroyed).
 */
client_audio_pipeline_t *audio_get_pipeline(void) {
  client_audio_pipeline_t *current_pipeline = g_audio_pipeline;
  return current_pipeline;
}


/**
 * Decode one Opus packet through the client audio pipeline.
 *
 * @param opus_data   Encoded packet bytes. Forwarded to the pipeline unchecked.
 *                    NOTE(review): presumably NULL is allowed to request
 *                    packet-loss concealment - confirm against the pipeline.
 * @param opus_len    Length of @p opus_data in bytes; must fit in an int.
 * @param output      Destination buffer for decoded samples (must not be NULL).
 * @param max_samples Capacity of @p output in samples (must be > 0).
 * @return -1 when no pipeline exists, an argument is invalid, or @p opus_len
 *         cannot be represented as int; otherwise the value returned by
 *         client_audio_pipeline_playback().
 */
int audio_decode_opus(const uint8_t *opus_data, size_t opus_len, float *output, int max_samples) {
  if (!g_audio_pipeline || !output || max_samples <= 0) {
    return -1;
  }

  // The pipeline takes the packet length as int. Reject lengths that do not
  // survive the narrowing instead of forwarding a truncated or negative value.
  const int packet_len = (int)opus_len;
  if (packet_len < 0 || (size_t)packet_len != opus_len) {
    return -1;
  }

  return client_audio_pipeline_playback(g_audio_pipeline, opus_data, packet_len, output, max_samples);
}


/**
 * Get the global audio context for use by other subsystems.
 *
 * @return address of the file-scope audio context; never NULL.
 */
audio_context_t *audio_get_context(void) {
  audio_context_t *const context = &g_audio_context;
  return context;
}


audio_analysis_track_received_sample
void audio_analysis_track_received_sample(float sample)
Definition analysis.c:272

audio_analysis_track_sent_sample
void audio_analysis_track_sent_sample(float sample)
Definition analysis.c:173

audio_analysis_track_sent_packet
void audio_analysis_track_sent_packet(size_t size)
Definition analysis.c:245

asciichat_errno_destroy
void asciichat_errno_destroy(void)
Definition asciichat_errno.c:502

g_client_worker_pool
thread_pool_t * g_client_worker_pool
Global client worker thread pool.
Definition client/main.c:139

client_audio_pipeline_playback
int client_audio_pipeline_playback(client_audio_pipeline_t *pipeline, const uint8_t *opus_in, int opus_len, float *output, int num_samples)
Definition client_audio_pipeline.cpp:453

client_audio_pipeline_create
client_audio_pipeline_t * client_audio_pipeline_create(const client_audio_pipeline_config_t *config)
Create and initialize a client audio pipeline.
Definition client_audio_pipeline.cpp:154

client_audio_pipeline_default_config
client_audio_pipeline_config_t client_audio_pipeline_default_config(void)
Definition client_audio_pipeline.cpp:101

client_audio_pipeline_capture
int client_audio_pipeline_capture(client_audio_pipeline_t *pipeline, const float *input, int num_samples, uint8_t *opus_out, int max_opus_len)
Definition client_audio_pipeline.cpp:432

client_audio_pipeline_destroy
void client_audio_pipeline_destroy(client_audio_pipeline_t *pipeline)
Definition client_audio_pipeline.cpp:361

should_exit
bool should_exit(void)
Definition main.c:90

server.h

fps_frame_ns
void fps_frame_ns(fps_t *tracker, uint64_t current_time_ns, const char *context)
Definition fps.c:52

fps_init
void fps_init(fps_t *tracker, int expected_fps, const char *name)
Definition fps.c:32

audio_process_received_samples
void audio_process_received_samples(const float *samples, int num_samples)
Process received audio samples from server.
Definition src/client/audio.c:399

audio_stop_thread
void audio_stop_thread()
Stop audio capture thread.
Definition src/client/audio.c:1059

audio_client_init
int audio_client_init()
Initialize audio subsystem.
Definition src/client/audio.c:904

audio_get_pipeline
client_audio_pipeline_t * audio_get_pipeline(void)
Get the audio pipeline (for advanced usage)
Definition src/client/audio.c:1185

audio_cleanup
void audio_cleanup()
Cleanup audio subsystem.
Definition src/client/audio.c:1115

audio_decode_opus
int audio_decode_opus(const uint8_t *opus_data, size_t opus_len, float *output, int max_samples)
Decode Opus packet using the audio pipeline.
Definition src/client/audio.c:1199

audio_thread_exited
bool audio_thread_exited()
Check if audio capture thread has exited.
Definition src/client/audio.c:1103

audio_get_context
audio_context_t * audio_get_context(void)
Get the global audio context for use by other subsystems.
Definition src/client/audio.c:1213

audio_start_thread
int audio_start_thread()
Start audio capture thread.
Definition src/client/audio.c:1003

server_connection_is_active
bool server_connection_is_active()
Check if server connection is currently active.
Definition src/client/server.c:732

server_connection_is_lost
bool server_connection_is_lost()
Check if connection loss has been detected.
Definition src/client/server.c:937

threaded_send_audio_opus_batch
asciichat_error_t threaded_send_audio_opus_batch(const uint8_t *opus_data, size_t opus_size, const uint16_t *frame_sizes, int frame_count)
Thread-safe Opus audio batch packet transmission.
Definition src/client/server.c:1122

threaded_send_stream_start_packet
asciichat_error_t threaded_send_stream_start_packet(uint32_t stream_type)
Thread-safe stream start packet transmission.
Definition src/client/server.c:1183

audio_init
asciichat_error_t audio_init(audio_context_t *ctx)
Definition lib/audio/audio.c:1132

audio_ring_buffer_available_read
size_t audio_ring_buffer_available_read(audio_ring_buffer_t *rb)
Definition lib/audio/audio.c:1106

audio_start_duplex
asciichat_error_t audio_start_duplex(audio_context_t *ctx)
Definition lib/audio/audio.c:1353

audio_destroy
void audio_destroy(audio_context_t *ctx)
Definition lib/audio/audio.c:1270

audio_stop_duplex
asciichat_error_t audio_stop_duplex(audio_context_t *ctx)
Definition lib/audio/audio.c:1703

audio_write_samples
asciichat_error_t audio_write_samples(audio_context_t *ctx, const float *buffer, int num_samples)
Definition lib/audio/audio.c:1802

audio_terminate_portaudio_final
void audio_terminate_portaudio_final(void)
Terminate PortAudio and free all device resources.
Definition lib/audio/audio.c:114

audio_set_pipeline
void audio_set_pipeline(audio_context_t *ctx, void *pipeline)
Definition lib/audio/audio.c:1328

audio_read_samples
asciichat_error_t audio_read_samples(audio_context_t *ctx, float *buffer, int num_samples)
Definition lib/audio/audio.c:1791

platform_sleep_us
void platform_sleep_us(unsigned int us)
Definition platform/wasm/time.c:31

main.h
ascii-chat Server Mode Entry Point Header

OPUS_FRAME_SAMPLES
#define OPUS_FRAME_SAMPLES

MAX_BATCH_FRAMES
#define MAX_BATCH_FRAMES

AUDIO_SEND_QUEUE_SIZE
#define AUDIO_SEND_QUEUE_SIZE
Definition src/client/audio.c:194

CAPTURE_READ_SIZE
#define CAPTURE_READ_SIZE

BATCH_TIMEOUT_NS
#define BATCH_TIMEOUT_NS

OPUS_MAX_PACKET_SIZE
#define OPUS_MAX_PACKET_SIZE

audio.h
ascii-chat Client Audio Processing Management Interface

audio_send_packet_t
Audio packet for async sending.
Definition src/client/audio.c:186

audio_send_packet_t::frame_count
int frame_count
Definition src/client/audio.c:190

audio_send_packet_t::data
uint8_t data[8 *4000]
Definition src/client/audio.c:187

audio_send_packet_t::frame_sizes
uint16_t frame_sizes[8]
Definition src/client/audio.c:189

audio_send_packet_t::size
size_t size
Definition src/client/audio.c:188

thread_pool_spawn
asciichat_error_t thread_pool_spawn(thread_pool_t *pool, void *(*thread_func)(void *), void *thread_arg, int stop_id, const char *thread_name)
Definition thread_pool.c:70

mutex_init
int mutex_init(mutex_t *mutex)
Definition threading.c:16

mutex_destroy
int mutex_destroy(mutex_t *mutex)
Definition threading.c:21

time_get_ns
uint64_t time_get_ns(void)
Definition util/time.c:48

format_duration_ns
int format_duration_ns(double nanoseconds, char *buffer, size_t buffer_size)
Definition util/time.c:275

time_elapsed_ns
uint64_t time_elapsed_ns(uint64_t start_ns, uint64_t end_ns)
Definition util/time.c:90

timer_is_initialized
bool timer_is_initialized(void)
Definition util/time.c:267

timer_system_init
bool timer_system_init(void)
Definition util/time.c:125

wav_dump_enabled
bool wav_dump_enabled(void)
Definition wav_writer.c:139

wav_writer_open
wav_writer_t * wav_writer_open(const char *filepath, int sample_rate, int channels)
Definition wav_writer.c:49

wav_writer_write
int wav_writer_write(wav_writer_t *writer, const float *samples, int num_samples)
Definition wav_writer.c:95

wav_writer_close
void wav_writer_close(wav_writer_t *writer)
Definition wav_writer.c:113