From a9dea32c81ba436334eb68231f2cc9f8deafb0ee Mon Sep 17 00:00:00 2001
From: Niko <niko@niko.lgbt>
Date: Sat, 2 Aug 2025 19:42:32 -0700
Subject: [PATCH] Fix up `audio_transcription` example

---
 examples/audio_transcription.rs | 47 +++++++++++++--------------------
 1 file changed, 18 insertions(+), 29 deletions(-)

diff --git a/examples/audio_transcription.rs b/examples/audio_transcription.rs
index 60e5ea9..f584592 100644
--- a/examples/audio_transcription.rs
+++ b/examples/audio_transcription.rs
@@ -8,7 +8,13 @@ use whisper_rs::{FullParams, SamplingStrategy, WhisperContext, WhisperContextPar
 
 /// Loads a context and model, processes an audio file, and prints the resulting transcript to stdout.
 fn main() -> Result<(), &'static str> {
-    // Load a context and model.
+    let model_path = std::env::args()
+        .nth(1)
+        .expect("Please specify path to model as argument 1");
+    let wav_path = std::env::args()
+        .nth(2)
+        .expect("Please specify path to wav file as argument 2");
+
     let mut context_param = WhisperContextParameters::default();
 
     // Enable DTW token level timestamp for known model by using model preset
@@ -37,13 +43,11 @@ fn main() -> Result<(), &'static str> {
         aheads: &custom_aheads,
     };
 
-    let ctx = WhisperContext::new_with_params(
-        "example/path/to/model/whisper.cpp/models/ggml-base.en.bin",
-        context_param,
-    )
-    .expect("failed to load model");
+    // Load a context and model
+    let ctx =
+        WhisperContext::new_with_params(&model_path, context_param).expect("failed to load model");
     // Create a state
-    let mut state = ctx.create_state().expect("failed to create key");
+    let mut state = ctx.create_state().expect("failed to create state");
 
     // Create a params object for running the model.
     // The number of past samples to consider defaults to 0.
@@ -65,7 +69,7 @@ fn main() -> Result<(), &'static str> {
     params.set_token_timestamps(true);
 
     // Open the audio file.
-    let reader = hound::WavReader::open("audio.wav").expect("failed to open file");
+    let reader = hound::WavReader::open(wav_path).expect("failed to open file");
     #[allow(unused_variables)]
     let hound::WavSpec {
         channels,
@@ -84,7 +88,6 @@ fn main() -> Result<(), &'static str> {
 
     // Convert audio to 16KHz mono f32 samples, as required by the model.
     // These utilities are provided for convenience, but can be replaced with custom conversion logic.
-    // SIMD variants of these functions are also available on nightly Rust (see the docs).
     if channels == 2 {
         audio = whisper_rs::convert_stereo_to_mono_audio(&audio).expect("Conversion error");
     } else if channels != 1 {
@@ -102,28 +105,14 @@ fn main() -> Result<(), &'static str> {
     let mut file = File::create("transcript.txt").expect("failed to create file");
 
     // Iterate through the segments of the transcript.
-    let num_segments = state
-        .full_n_segments()
-        .expect("failed to get number of segments");
-    for i in 0..num_segments {
+    for segment in state.as_iter() {
         // Get the transcribed text and timestamps for the current segment.
-        let segment = state
-            .full_get_segment_text(i)
-            .expect("failed to get segment");
-        let start_timestamp = state
-            .full_get_segment_t0(i)
-            .expect("failed to get start timestamp");
-        let end_timestamp = state
-            .full_get_segment_t1(i)
-            .expect("failed to get end timestamp");
+        let start_timestamp = segment.start_timestamp();
+        let end_timestamp = segment.end_timestamp();
 
-        let first_token_dtw_ts = if let Ok(token_count) = state.full_n_tokens(i) {
-            if token_count > 0 {
-                if let Ok(token_data) = state.full_get_token_data(i, 0) {
-                    token_data.t_dtw
-                } else {
-                    -1i64
-                }
+        let first_token_dtw_ts = if segment.n_tokens() > 0 {
+            if let Some(token) = segment.get_token(0) {
+                token.token_data().map_or(0, |token| token.t_dtw)
             } else {
                 -1i64
             }