From 3e42e220863f5d443d2d546b2a0d82a638d26e4b Mon Sep 17 00:00:00 2001
From: Eason WaveKat <eason@wavekat.com>
Date: Thu, 14 May 2026 17:10:14 +1200
Subject: [PATCH 1/2] fix: resample short inputs when upsampling

AudioFrame::resample failed for any input shorter than rubato's chunk
size when upsampling (e.g. a 160-sample G.711 frame to 44.1 kHz) because
the output buffer was sized by input-times-ratio while rubato sizes its
output by chunk-times-ratio. Switch to rubato's
process_all_needed_output_len helper and match the chunk size to short
inputs.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
---
 crates/wavekat-core/src/audio.rs    |  68 ++++++++++++-
 docs/04-resample-short-input-bug.md | 153 ++++++++++++++++++++++++++++
 2 files changed, 216 insertions(+), 5 deletions(-)
 create mode 100644 docs/04-resample-short-input-bug.md
diff --git a/crates/wavekat-core/src/audio.rs b/crates/wavekat-core/src/audio.rs
index fbf9b43..36862f4 100644
--- a/crates/wavekat-core/src/audio.rs
+++ b/crates/wavekat-core/src/audio.rs
@@ -149,11 +149,18 @@ impl AudioFrame<'_> {
             window: WindowFunction::BlackmanHarris2,
         };
 
-        let mut resampler = Async::<f32>::new_sinc(ratio, 1.0, &params, 1024, 1, FixedAsync::Input)
-            .map_err(|e| crate::CoreError::Audio(e.to_string()))?;
-
-        // Allocate output buffer with headroom
-        let out_len = (nbr_input_frames as f64 * ratio) as usize + 1024;
+        // Match chunk size to input when shorter than the default — avoids
+        // wasting work padding a 160-sample G.711 frame up to 1024 samples.
+        let chunk_size = nbr_input_frames.min(1024);
+
+        let mut resampler =
+            Async::<f32>::new_sinc(ratio, 1.0, &params, chunk_size, 1, FixedAsync::Input)
+                .map_err(|e| crate::CoreError::Audio(e.to_string()))?;
+
+        // Ask rubato exactly how much output space `process_all_into_buffer`
+        // needs — it accounts for the per-chunk pad-up, the resampler's
+        // internal delay, and the input-length-times-ratio expected output.
+        let out_len = resampler.process_all_needed_output_len(nbr_input_frames);
         let mut outdata = vec![0.0f32; out_len];
 
         let input_adapter = InterleavedSlice::new(self.samples.as_ref(), 1, nbr_input_frames)
@@ -474,6 +481,57 @@ mod tests {
         );
     }
 
+    #[cfg(feature = "resample")]
+    #[test]
+    fn resample_short_input_upsample_large_ratio() {
+        // The exact case from the wavekat-voice RTP path: a 20 ms G.711 frame
+        // (160 samples @ 8 kHz) upsampled to 44.1 kHz. Before the fix this
+        // returned `InsufficientOutputBufferSize`.
+        let frame = AudioFrame::from_vec(vec![0.0f32; 160], 8000);
+        let resampled = frame.resample(44_100).unwrap();
+        assert_eq!(resampled.sample_rate(), 44_100);
+        let expected = (160.0 * 44_100.0 / 8_000.0) as i64; // 882
+        let tolerance = 50;
+        assert!(
+            (resampled.len() as i64 - expected).unsigned_abs() < tolerance,
+            "expected ~{expected} samples, got {}",
+            resampled.len()
+        );
+    }
+
+    #[cfg(feature = "resample")]
+    #[test]
+    fn resample_short_input_upsample_small_ratio() {
+        // 160 samples @ 8 kHz → 16 kHz. Also failed before the fix even
+        // though the ratio is modest, because nbr_input_frames < chunk_size.
+        let frame = AudioFrame::from_vec(vec![0.0f32; 160], 8000);
+        let resampled = frame.resample(16_000).unwrap();
+        assert_eq!(resampled.sample_rate(), 16_000);
+        let expected = 320;
+        let tolerance = 50;
+        assert!(
+            (resampled.len() as i64 - expected as i64).unsigned_abs() < tolerance,
+            "expected ~{expected} samples, got {}",
+            resampled.len()
+        );
+    }
+
+    #[cfg(feature = "resample")]
+    #[test]
+    fn resample_single_g711_frame_to_48k() {
+        // The other common device rate: 160 @ 8 kHz → 48 kHz.
+        let frame = AudioFrame::from_vec(vec![0.0f32; 160], 8000);
+        let resampled = frame.resample(48_000).unwrap();
+        assert_eq!(resampled.sample_rate(), 48_000);
+        let expected = 960;
+        let tolerance = 50;
+        assert!(
+            (resampled.len() as i64 - expected as i64).unsigned_abs() < tolerance,
+            "expected ~{expected} samples, got {}",
+            resampled.len()
+        );
+    }
+
     #[cfg(feature = "resample")]
     #[test]
     fn resample_preserves_sine_frequency() {
diff --git a/docs/04-resample-short-input-bug.md b/docs/04-resample-short-input-bug.md
new file mode 100644
index 0000000..a32e1cb
--- /dev/null
+++ b/docs/04-resample-short-input-bug.md
@@ -0,0 +1,153 @@
+# 04 — Resample drops short inputs when upsampling
+
+> Status: bug · Date: 2026-05-14
+
+## Summary
+
+`AudioFrame::resample` returns `CoreError::Audio("Insufficient output
+buffer size N, expected M frames")` for any input whose length is
+**less than rubato's internal chunk size (1024 frames)** when the
+target rate is much higher than the source rate. Every call from
+`wavekat-voice`'s RTP receive path (160-sample G.711 frames →
+44.1 kHz speaker) hits this and the frame is dropped — the user hears
+silence from the remote even though signaling and RTP are working.
+
+The bug is in the output-buffer sizing, not in the resampler itself.
+
+## Reproduction
+
+```rust
+use wavekat_core::AudioFrame;
+
+let g711_frame: Vec<f32> = vec![0.0; 160];           // 20 ms at 8 kHz
+let frame = AudioFrame::from_vec(g711_frame, 8000);
+let resampled = frame.resample(44_100);              // Err
+```
+
+Observed log line from `wavekat-voice` during a live call:
+
+```
+WARN wavekat_voice::audio_io: resample failed — dropping frame
+  err=Audio("Insufficient output buffer size 1906, expected 5633 frames")
+```
+
+## Root cause
+
+`crates/wavekat-core/src/audio.rs:152` builds the resampler with a
+fixed input chunk size and an explicit `FixedAsync::Input` mode:
+
+```rust
+let mut resampler = Async::<f32>::new_sinc(
+    ratio, 1.0, &params, /* chunk_size: */ 1024, 1, FixedAsync::Input,
+)?;
+```
+
+Rubato in `FixedAsync::Input` mode processes input in fixed
+`chunk_size`-sized chunks, **regardless of how much input the caller
+actually supplied.** Each chunk produces `chunk_size * ratio` output
+frames.
+
+Line 156 sizes the output buffer for the *actual* input length:
+
+```rust
+let out_len = (nbr_input_frames as f64 * ratio) as usize + 1024;
+```
+
+For a 160-sample input upsampled 8 kHz → 44.1 kHz:
+
+| Quantity                                | Value |
+|-----------------------------------------|-------|
+| `nbr_input_frames`                      | 160   |
+| `ratio = 44_100 / 8_000`                | 5.5125 |
+| `out_len` (sized by caller)             | 160 × 5.5125 + 1024 = **1906** |
+| Output rubato actually requires         | 1024 × 5.5125 ≈ **5633** |
+
+Rubato sees the output buffer is too small and returns
+`InsufficientOutputBufferSize`. The wavekat-voice receive loop logs
+the error and drops the frame.
+
+Why this hasn't bitten before:
+
+- **Downsample paths** (e.g. 48 kHz mic → 8 kHz for G.711 encode): the
+  *output* per chunk is smaller than 1024, the heuristic `out_len`
+  almost always exceeds it. No failures.
+- **Upsample with large inputs** (e.g. a 1 s WAV at 8 kHz → 16 kHz for
+  VAD): `nbr_input_frames` ≥ chunk_size, so `nbr_input_frames * ratio`
+  already covers `chunk_size * ratio`.
+- **Upsample with short inputs and a small ratio** (e.g. 8 kHz →
+  16 kHz, 160 input frames → 320 output): `out_len = 1184`, rubato
+  needs `1024 × 2 = 2048`. Still fails, but the symptom is the same;
+  has just not been exercised.
+
+The bug is specifically when `nbr_input_frames < chunk_size` and
+`target_rate > source_rate`.
+
+## Recommended fix
+
+Two changes in `resample()`:
+
+1. **Size the output buffer with rubato's own API.** `Resampler` exposes
+   `output_frames_max()` (and `output_frames_next()` for streaming
+   callers), which returns the largest output any single chunk could
+   produce. Use it instead of the input-times-ratio heuristic:
+
+   ```rust
+   let out_len = resampler.output_frames_max() + 1024; // small headroom
+   let mut outdata = vec![0.0f32; out_len];
+   ```
+
+   This is what rubato's own examples recommend; it removes the
+   "guess and pad" pattern.
+
+2. **(Optional) Match the chunk size to short inputs.** For one-shot
+   `AudioFrame::resample` callers, processing one 160-sample input
+   in 1024-sample chunks is wasteful — rubato pads the chunk
+   internally and the extra output is truncated by `out_produced`.
+   Pick a chunk size matched to the input when the input is shorter
+   than the default:
+
+   ```rust
+   let chunk_size = nbr_input_frames.min(1024);
+   ```
+
+   This saves both CPU and memory on the hot path the RTP receive
+   loop drives.
+
+Either fix alone resolves the bug; doing both is the right shape.
+
+## Test additions (must land with the fix)
+
+Per the project's "tests ship with features" rule, add unit tests in
+`audio::tests` that fail before the fix and pass after:
+
+1. **`resample_short_input_upsample_large_ratio`** — the exact case
+   that bit us: 160 samples at 8 kHz → 44.1 kHz. Must return `Ok`
+   with an output length close to `160 * 5.5125 = 882` (allow a small
+   tolerance, rubato's edge behavior).
+2. **`resample_short_input_upsample_small_ratio`** — 160 samples at
+   8 kHz → 16 kHz. Today this also fails (output buffer 1344, rubato
+   needs 2048); the fix must cover it.
+3. **`resample_single_g711_frame_to_48k`** — 160 → 48 kHz (the
+   other common device rate); same shape.
+4. **`resample_does_not_regress_on_long_inputs`** — keep the existing
+   `resample_upsample` / `resample_downsample` tests passing
+   (regression guard).
+
+## Downstream impact
+
+After the fix lands:
+
+- **`wavekat-core` 0.0.10** (or whatever the next release-please bump
+  is).
+- **`wavekat-voice`** picks up the new version via workspace dep bump;
+  the existing per-frame `AudioFrame::resample` call in
+  `LocalDeviceSink` starts working. No other changes needed on the
+  consumer side.
+
+A streaming-resampler refactor in `LocalDeviceSink` (build one
+resampler at stream-open, feed it sample-by-sample, keep state across
+frames) is a separate, larger improvement and not required for this
+fix. The motivations for that refactor are CPU efficiency (no per-frame
+allocator churn) and quality (avoid edge artifacts at chunk
+boundaries), not correctness — once the buffer-sizing bug is fixed,
+per-frame stateless resampling is *correct*, just not optimal.

From 7ed62cb4111d60f5e9c5e7da74e4fe4ec0c96a54 Mon Sep 17 00:00:00 2001
From: Eason WaveKat <eason@wavekat.com>
Date: Thu, 14 May 2026 17:15:11 +1200
Subject: [PATCH 2/2] test: capture resample length unconditionally for
 coverage

Move resampled.len() into a local before the assert! so the value is
evaluated on the happy path, not only inside the panic-message format
args. Lets codecov see the new test lines as covered.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
---
 crates/wavekat-core/src/audio.rs | 25 +++++++++++--------------
 1 file changed, 11 insertions(+), 14 deletions(-)

diff --git a/crates/wavekat-core/src/audio.rs b/crates/wavekat-core/src/audio.rs
index 36862f4..92b4242 100644
--- a/crates/wavekat-core/src/audio.rs
+++ b/crates/wavekat-core/src/audio.rs
@@ -491,11 +491,10 @@ mod tests {
         let resampled = frame.resample(44_100).unwrap();
         assert_eq!(resampled.sample_rate(), 44_100);
         let expected = (160.0 * 44_100.0 / 8_000.0) as i64; // 882
-        let tolerance = 50;
+        let actual = resampled.len() as i64;
         assert!(
-            (resampled.len() as i64 - expected).unsigned_abs() < tolerance,
-            "expected ~{expected} samples, got {}",
-            resampled.len()
+            (actual - expected).unsigned_abs() < 50,
+            "expected ~{expected} samples, got {actual}"
         );
     }
 
@@ -507,12 +506,11 @@ mod tests {
         let frame = AudioFrame::from_vec(vec![0.0f32; 160], 8000);
         let resampled = frame.resample(16_000).unwrap();
         assert_eq!(resampled.sample_rate(), 16_000);
-        let expected = 320;
-        let tolerance = 50;
+        let expected: i64 = 320;
+        let actual = resampled.len() as i64;
         assert!(
-            (resampled.len() as i64 - expected as i64).unsigned_abs() < tolerance,
-            "expected ~{expected} samples, got {}",
-            resampled.len()
+            (actual - expected).unsigned_abs() < 50,
+            "expected ~{expected} samples, got {actual}"
         );
     }
 
@@ -523,12 +521,11 @@ mod tests {
         let frame = AudioFrame::from_vec(vec![0.0f32; 160], 8000);
         let resampled = frame.resample(48_000).unwrap();
         assert_eq!(resampled.sample_rate(), 48_000);
-        let expected = 960;
-        let tolerance = 50;
+        let expected: i64 = 960;
+        let actual = resampled.len() as i64;
         assert!(
-            (resampled.len() as i64 - expected as i64).unsigned_abs() < tolerance,
-            "expected ~{expected} samples, got {}",
-            resampled.len()
+            (actual - expected).unsigned_abs() < 50,
+            "expected ~{expected} samples, got {actual}"
         );
     }