From b11c8b95b985863e5ad1a99705d1c91b88910240 Mon Sep 17 00:00:00 2001
From: Roderick van Domburg <roderick@vandomburg.net>
Date: Mon, 22 Dec 2025 23:10:02 +0100
Subject: [PATCH] fix: ensure frame-aligned spans in queue to prevent channel
 misalignment

Fixes two related issues with frame alignment in the queue:

1. Frame alignment for non-power-of-2 channel counts: The queue used a
   fixed threshold of 512 samples which could cause channel misalignment
   when the channel count doesn't evenly divide 512 (e.g., 6 channels:
   512 % 6 = 2 sample offset). Replaced with dynamic threshold function
   that rounds to nearest frame boundary.

2. Mid-span ending detection: Sources that end before their promised
   current_span_len() would cause the queue to immediately transition
   to the next source, potentially mid-frame. Added sample tracking and
   silence padding to complete frames before transitioning.

Changes:
- Replace THRESHOLD constant with threshold(channels) helper function
  that ensures frame-aligned span lengths
- Add sample tracking to detect mid-span source endings
- Inject silence padding to complete incomplete frames
- Add span_ending_mid_frame test to verify padding behavior

Supersedes #684
---
 CHANGELOG.md            |   2 +
 src/queue.rs            | 163 +++++++++++++++++++++++++++++++++++++---
 src/source/mod.rs       |   6 ++
 tests/channel_volume.rs |  63 ++++++++++++++++
 4 files changed, 225 insertions(+), 9 deletions(-)
 create mode 100644 tests/channel_volume.rs
diff --git a/CHANGELOG.md b/CHANGELOG.md
index b7bfc2d6..11eefdb8 100644
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@@ -36,6 +36,8 @@ and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0
 - Fixed audio distortion when queueing sources with different sample rates/channel counts or transitioning from empty queue.
 - Fixed `SamplesBuffer` to correctly report exhaustion and remaining samples.
 - Improved precision in `SkipDuration` to avoid off-by-a-few-samples errors.
+- Fixed channel misalignment in queue with non-power-of-2 channel counts (e.g., 6 channels) by ensuring frame-aligned span lengths.
+- Fixed channel misalignment when sources end before their promised span length by padding with silence to complete frames.
 
 ### Changed
 - `output_to_wav` renamed to `wav_to_file` and now takes ownership of the `Source`.
diff --git a/src/queue.rs b/src/queue.rs
index 82dcdd63..7f869586 100644
--- a/src/queue.rs
+++ b/src/queue.rs
@@ -35,6 +35,8 @@ pub fn queue(keep_alive_if_empty: bool) -> (Arc<SourcesQueueInput>, SourcesQueue
         current: Box::new(Empty::new()) as Box<_>,
         signal_after_end: None,
         input: input.clone(),
+        samples_consumed_in_span: 0,
+        padding_samples_remaining: 0,
     };
 
     (input, output)
@@ -110,12 +112,29 @@ pub struct SourcesQueueOutput {
 
     // The next sounds.
     input: Arc<SourcesQueueInput>,
+
+    // Track samples consumed in the current span to detect mid-span endings.
+    samples_consumed_in_span: usize,
+
+    // When a source ends mid-frame, this counts how many silence samples to inject
+    // to complete the frame before transitioning to the next source.
+    padding_samples_remaining: usize,
 }
 
-const THRESHOLD: usize = 512;
 const SILENCE_SAMPLE_RATE: SampleRate = nz!(44100);
 const SILENCE_CHANNELS: ChannelCount = nz!(1);
 
+/// Returns a threshold span length that ensures frame alignment.
+///
+/// Spans must end on frame boundaries (multiples of channel count) to prevent
+/// channel misalignment. Returns ~512 samples rounded to the nearest frame.
+#[inline]
+fn threshold(channels: ChannelCount) -> usize {
+    const BASE_SAMPLES: usize = 512;
+    let ch = channels.get() as usize;
+    BASE_SAMPLES.div_ceil(ch) * ch
+}
+
 impl Source for SourcesQueueOutput {
     #[inline]
     fn current_span_len(&self) -> Option<usize> {
@@ -136,8 +155,8 @@ impl Source for SourcesQueueOutput {
         } else if self.input.keep_alive_if_empty.load(Ordering::Acquire)
             && self.input.next_sounds.lock().unwrap().is_empty()
         {
-            // The next source will be a filler silence which will have the length of `THRESHOLD`
-            return Some(THRESHOLD);
+            // The next source will be a filler silence which will have a frame-aligned length
+            return Some(threshold(self.current.channels()));
         }
 
         // Try the size hint.
@@ -148,8 +167,8 @@ impl Source for SourcesQueueOutput {
             return Some(lower_bound);
         }
 
-        // Otherwise we use the constant value.
-        Some(THRESHOLD)
+        // Otherwise we use a frame-aligned threshold value.
+        Some(threshold(self.current.channels()))
     }
 
     #[inline]
@@ -204,13 +223,33 @@ impl Iterator for SourcesQueueOutput {
     #[inline]
     fn next(&mut self) -> Option<Self::Item> {
         loop {
+            // If we're padding to complete a frame, return silence.
+            if self.padding_samples_remaining > 0 {
+                self.padding_samples_remaining -= 1;
+                return Some(0.0);
+            }
+
             // Basic situation that will happen most of the time.
             if let Some(sample) = self.current.next() {
+                self.samples_consumed_in_span += 1;
                 return Some(sample);
             }
 
-            // Since `self.current` has finished, we need to pick the next sound.
+            // Source ended - check if we ended mid-frame and need padding.
+            let channels = self.current.channels().get() as usize;
+            let incomplete_frame_samples = self.samples_consumed_in_span % channels;
+            if incomplete_frame_samples > 0 {
+                // We're mid-frame - need to pad with silence to complete it.
+                self.padding_samples_remaining = channels - incomplete_frame_samples;
+                // Reset counter now since we're transitioning to a new span.
+                self.samples_consumed_in_span = 0;
+                // Continue loop - next iteration will inject silence.
+                continue;
+            }
+
+            // Reset counter and move to next sound.
             // In order to avoid inlining this expensive operation, the code is in another function.
+            self.samples_consumed_in_span = 0;
             if self.go_next().is_err() {
                 return None;
             }
@@ -240,7 +279,7 @@ impl SourcesQueueOutput {
                 let silence = Box::new(Zero::new_samples(
                     SILENCE_CHANNELS,
                     SILENCE_SAMPLE_RATE,
-                    THRESHOLD,
+                    threshold(SILENCE_CHANNELS),
                 )) as Box<_>;
                 if self.input.keep_alive_if_empty.load(Ordering::Acquire) {
                     // Play a short silence in order to avoid spinlocking.
@@ -263,8 +302,9 @@ impl SourcesQueueOutput {
 mod tests {
     use crate::buffer::SamplesBuffer;
     use crate::math::nz;
-    use crate::queue;
-    use crate::source::Source;
+    use crate::source::{SeekError, Source};
+    use crate::{queue, ChannelCount, Sample, SampleRate};
+    use std::time::Duration;
 
     #[test]
     fn basic() {
@@ -340,4 +380,109 @@ mod tests {
         assert_eq!(rx.next(), Some(10.0));
         assert_eq!(rx.next(), Some(-10.0));
     }
+
+    #[test]
+    fn span_ending_mid_frame() {
+        let mut test_source1 = TestSource::new(&[0.1, 0.2, 0.1, 0.2, 0.1])
+            .with_channels(nz!(2))
+            .with_false_span_len(Some(6));
+        let mut test_source2 = TestSource::new(&[0.3, 0.4, 0.3, 0.4]).with_channels(nz!(2));
+
+        let (controls, mut source) = queue::queue(true);
+        controls.append(test_source1.clone());
+        controls.append(test_source2.clone());
+
+        assert_eq!(source.next(), test_source1.next());
+        assert_eq!(source.next(), test_source1.next());
+        assert_eq!(source.next(), test_source1.next());
+        assert_eq!(source.next(), test_source1.next());
+        assert_eq!(source.next(), test_source1.next());
+        assert_eq!(None, test_source1.next());
+
+        // Source promised span of 6 but only delivered 5 samples.
+        // With 2 channels, that's 2.5 frames. Queue should pad with silence.
+        assert_eq!(
+            source.next(),
+            Some(0.0),
+            "Expected silence to complete frame"
+        );
+
+        assert_eq!(source.next(), test_source2.next());
+        assert_eq!(source.next(), test_source2.next());
+        assert_eq!(source.next(), test_source2.next());
+        assert_eq!(source.next(), test_source2.next());
+    }
+
+    /// Test helper source that allows setting false span length to simulate
+    /// sources that end before their promised span length.
+    #[derive(Debug, Clone)]
+    struct TestSource {
+        samples: Vec<Sample>,
+        pos: usize,
+        channels: ChannelCount,
+        sample_rate: SampleRate,
+        total_span_len: Option<usize>,
+    }
+
+    impl TestSource {
+        fn new(samples: &[Sample]) -> Self {
+            let samples = samples.to_vec();
+            Self {
+                total_span_len: Some(samples.len()),
+                pos: 0,
+                channels: nz!(1),
+                sample_rate: nz!(44100),
+                samples,
+            }
+        }
+
+        fn with_channels(mut self, count: ChannelCount) -> Self {
+            self.channels = count;
+            self
+        }
+
+        fn with_false_span_len(mut self, total_len: Option<usize>) -> Self {
+            self.total_span_len = total_len;
+            self
+        }
+    }
+
+    impl Iterator for TestSource {
+        type Item = Sample;
+
+        fn next(&mut self) -> Option<Self::Item> {
+            let res = self.samples.get(self.pos).copied();
+            self.pos += 1;
+            res
+        }
+
+        fn size_hint(&self) -> (usize, Option<usize>) {
+            let remaining = self.samples.len().saturating_sub(self.pos);
+            (remaining, Some(remaining))
+        }
+    }
+
+    impl Source for TestSource {
+        fn current_span_len(&self) -> Option<usize> {
+            self.total_span_len
+        }
+
+        fn channels(&self) -> ChannelCount {
+            self.channels
+        }
+
+        fn sample_rate(&self) -> SampleRate {
+            self.sample_rate
+        }
+
+        fn total_duration(&self) -> Option<Duration> {
+            None
+        }
+
+        fn try_seek(&mut self, _: Duration) -> Result<(), SeekError> {
+            Err(SeekError::NotSupported {
+                underlying_source: std::any::type_name::<Self>(),
+            })
+        }
+    }
 }
diff --git a/src/source/mod.rs b/src/source/mod.rs
index bf222b92..5dc79813 100644
--- a/src/source/mod.rs
+++ b/src/source/mod.rs
@@ -176,6 +176,12 @@ pub trait Source: Iterator<Item = Sample> {
     /// After the engine has finished reading the specified number of samples, it will check
     /// whether the value of `channels()` and/or `sample_rate()` have changed.
     ///
+    /// # Frame Alignment
+    ///
+    /// Span lengths must be multiples of the channel count to ensure spans end on frame
+    /// boundaries. A "frame" is one sample for each channel. Returning a span length
+    /// that is not a multiple of `channels()` will cause channel misalignment issues.
+    ///
     /// Note: This returns the total span size, not the remaining samples. Use `Iterator::size_hint`
     /// to determine how many samples remain in the iterator.
     fn current_span_len(&self) -> Option<usize>;
diff --git a/tests/channel_volume.rs b/tests/channel_volume.rs
new file mode 100644
index 00000000..e04ebeff
--- /dev/null
+++ b/tests/channel_volume.rs
@@ -0,0 +1,63 @@
+use std::fs;
+use std::io::BufReader;
+
+use rodio::source::ChannelVolume;
+use rodio::{queue, Decoder, Sample, Source};
+
+fn create_6_channel_source() -> ChannelVolume<Decoder<BufReader<fs::File>>> {
+    let file = fs::File::open("assets/music.mp3").unwrap();
+    let decoder = Decoder::try_from(file).unwrap();
+    assert_eq!(decoder.channels().get(), 2);
+    let channel_volume = ChannelVolume::new(decoder, vec![1.0, 1.0, 0.0, 0.0, 0.0, 0.0]);
+    assert_eq!(channel_volume.channels().get(), 6);
+    channel_volume
+}
+
+#[test]
+fn channel_volume_without_queue() {
+    let channel_volume = create_6_channel_source();
+    assert_output_only_on_first_two_channels(channel_volume, 6);
+}
+
+#[test]
+fn channel_volume_with_queue() {
+    let channel_volume = create_6_channel_source();
+    let (controls, queue) = queue::queue(false);
+    controls.append(channel_volume);
+    assert_output_only_on_first_two_channels(queue, 6);
+}
+
+fn assert_output_only_on_first_two_channels(
+    mut source: impl Source<Item = Sample>,
+    channels: usize,
+) {
+    let mut frame_number = 0;
+    let mut samples_in_frame = Vec::new();
+
+    while let Some(sample) = source.next() {
+        samples_in_frame.push(sample);
+
+        if samples_in_frame.len() == channels {
+            // We have a complete frame - verify channels 2+ are zero
+            for (ch, &sample) in samples_in_frame[2..].iter().enumerate() {
+                assert_eq!(
+                    sample,
+                    0.0,
+                    "frame {} channel {} had nonzero value (should be zero)",
+                    frame_number,
+                    ch + 2
+                );
+            }
+
+            samples_in_frame.clear();
+            frame_number += 1;
+        }
+    }
+
+    assert_eq!(
+        samples_in_frame.len(),
+        0,
+        "Source ended with partial frame {} (should end on frame boundary)",
+        samples_in_frame.len()
+    );
+}