fastrepl · yujonglee · Aug 17, 2025 · coderabbitai · Aug 18, 2025
diff --git a/crates/transcribe-whisper-local/src/service/streaming.rs b/crates/transcribe-whisper-local/src/service/streaming.rs
@@ -297,6 +297,8 @@ where
                 Ok(chunk) => Some(hypr_whisper_local::SimpleAudioChunk {
                     samples: chunk.samples,
                     meta: Some(serde_json::json!({ "source": source_name })),
+                    start_timestamp_ms: Some(chunk.start_timestamp_ms),
+                    end_timestamp_ms: Some(chunk.end_timestamp_ms),
                 }),
             })
         })

diff --git a/crates/whisper-local/src/stream.rs b/crates/whisper-local/src/stream.rs
@@ -20,12 +20,16 @@ pub struct TranscriptionTask<S, T> {
 pub trait AudioChunk: Send + 'static {
     fn samples(&self) -> &[f32];
     fn meta(&self) -> Option<serde_json::Value>;
+    fn start_timestamp_ms(&self) -> Option<usize>;
+    fn end_timestamp_ms(&self) -> Option<usize>;
 }
 
 #[derive(Default)]
 pub struct SimpleAudioChunk {
     pub samples: Vec<f32>,
     pub meta: Option<serde_json::Value>,
+    pub start_timestamp_ms: Option<usize>,
+    pub end_timestamp_ms: Option<usize>,
 }
 
 impl AudioChunk for SimpleAudioChunk {
@@ -36,6 +40,14 @@ impl AudioChunk for SimpleAudioChunk {
     fn meta(&self) -> Option<serde_json::Value> {
         self.meta.clone()
     }
+
+    fn start_timestamp_ms(&self) -> Option<usize> {
+        self.start_timestamp_ms
+    }
+
+    fn end_timestamp_ms(&self) -> Option<usize> {
+        self.end_timestamp_ms
+    }
 }
 
 pub struct AudioChunkStream<S>(pub S);
@@ -116,6 +128,7 @@ where
                         &samples,
                         &mut this.current_segment_task,
                         None,
+                        (None, None),
                     ) {
                         Poll::Ready(result) => return Poll::Ready(result),
                         Poll::Pending => continue,
@@ -156,11 +169,14 @@ where
                     let meta = chunk.meta();
                     let samples = chunk.samples();
 
+                    let timestamps = (chunk.start_timestamp_ms(), chunk.end_timestamp_ms());
+
                     match process_transcription(
                         &mut this.whisper,
                         samples,
                         &mut this.current_segment_task,
                         meta,
+                        timestamps,
                     ) {
                         Poll::Ready(result) => return Poll::Ready(result),
                         Poll::Pending => continue,
@@ -178,6 +194,7 @@ fn process_transcription<'a>(
     samples: &'a [f32],
     current_segment_task: &'a mut Option<Pin<Box<dyn Stream<Item = Segment> + Send>>>,
     meta: Option<serde_json::Value>,
+    timestamps: (Option<usize>, Option<usize>),
 ) -> Poll<Option<Segment>> {
     if !samples.is_empty() {
         match whisper.transcribe(samples) {
@@ -190,6 +207,11 @@ fn process_transcription<'a>(
             Ok(mut segments) => {
                 for segment in &mut segments {
                     segment.meta = meta.clone();
+
+                    if let (Some(start_ms), Some(end_ms)) = timestamps {
+                        segment.start = start_ms as f64 / 1000.0;
+                        segment.end = end_ms as f64 / 1000.0;
+                    }
-                    if let (Some(start_ms), Some(end_ms)) = timestamps {
-                        segment.start = start_ms as f64 / 1000.0;
-                        segment.end = end_ms as f64 / 1000.0;
-                    }
+                    // Add chunk start offset; keep model-provided intra-chunk timing.
+                    if let (Some(start_ms), _) = timestamps {
+                        let offset_s = start_ms as f64 / 1000.0;
+                        segment.start += offset_s;
+                        segment.end += offset_s;
+                    }
+                    // Clamp segment end to the chunk end if provided.
+                    if let (_, Some(end_ms)) = timestamps {
+                        let end_limit_s = end_ms as f64 / 1000.0;
+                        if segment.end > end_limit_s {
+                            segment.end = end_limit_s;
+                        }
+                    }
                 }
 
                 *current_segment_task = Some(Box::pin(futures_util::stream::iter(segments)));