todo
parent
ec47d8142a
commit
8b5c18e65e
|
|
@ -25,7 +25,6 @@ pub fn wav_channel<F>(
|
||||||
) where F: FnMut(Result<rust_whisper_lib::Transcribed, String>) + Send + 'static {
|
) where F: FnMut(Result<rust_whisper_lib::Transcribed, String>) + Send + 'static {
|
||||||
flags.model_path = None;
|
flags.model_path = None;
|
||||||
flags.model_buffer = Some(include_bytes!("../../models/ggml-distil-medium.en.bin").to_vec());
|
flags.model_buffer = Some(include_bytes!("../../models/ggml-distil-medium.en.bin").to_vec());
|
||||||
flags.model_buffer = Some(include_bytes!("../../models/ggml-base.en.bin").to_vec());
|
|
||||||
rust_whisper_lib::wav_channel(flags, handler_fn);
|
rust_whisper_lib::wav_channel(flags, handler_fn);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
|
||||||
|
|
@ -99,6 +99,7 @@ impl Destutterer {
|
||||||
|
|
||||||
let next_words = Words::from_string(next.clone());
|
let next_words = Words::from_string(next.clone());
|
||||||
let mut n = self.prev.to_comparable_words().len().clamp(0, next_words.to_comparable_words().len());
|
let mut n = self.prev.to_comparable_words().len().clamp(0, next_words.to_comparable_words().len());
|
||||||
|
//println!("n={} prev='{:?}' next='{:?}'", n, self.prev.to_comparable_words(), next_words.to_comparable_words());
|
||||||
while n > 0 {
|
while n > 0 {
|
||||||
let (prev_s, _) = self.prev.last_n_comparable_to_string(n);
|
let (prev_s, _) = self.prev.last_n_comparable_to_string(n);
|
||||||
let (next_s, next_idx) = next_words.first_n_comparable_to_string(n);
|
let (next_s, next_idx) = next_words.first_n_comparable_to_string(n);
|
||||||
|
|
|
||||||
|
|
@ -1,7 +1,9 @@
|
||||||
todo:
|
todo:
|
||||||
- overlap without stop words
|
- split on silence-ish instead of duration
|
||||||
- rust-whisper warn when transcription time ~ input time
|
- rust-whisper warn when transcription time ~ input time
|
||||||
scheduled: []
|
scheduled: []
|
||||||
done:
|
done:
|
||||||
- todo: need to overlap without ANY punctuation, which i can do by breaking into words
|
- todo: need to overlap without ANY punctuation, which i can do by breaking into words
|
||||||
ts: Tue Jan 2 18:23:00 MST 2024
|
ts: Tue Jan 2 18:23:00 MST 2024
|
||||||
|
- todo: overlap without stop words
|
||||||
|
ts: Wed Jan 3 08:22:14 MST 2024
|
||||||
|
|
|
||||||
Loading…
Reference in New Issue