From 2d28497197b30d7f47999b15fdf6aa64b0f5e9b0 Mon Sep 17 00:00:00 2001 From: Laurent Mazare Date: Wed, 8 Nov 2023 06:42:52 +0100 Subject: Preliminary support for whisper v3. (#1294) * Preliminary support for whisper v3. * Add the missing files. --- candle-transformers/src/models/whisper/mod.rs | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) (limited to 'candle-transformers/src/models/whisper/mod.rs') diff --git a/candle-transformers/src/models/whisper/mod.rs b/candle-transformers/src/models/whisper/mod.rs index 35d35e77..bf24045a 100644 --- a/candle-transformers/src/models/whisper/mod.rs +++ b/candle-transformers/src/models/whisper/mod.rs @@ -18,6 +18,7 @@ pub struct Config { // pub n_text_state: usize, pub decoder_attention_heads: usize, // n_text_head pub decoder_layers: usize, // n_text_layer + #[serde(default)] pub suppress_tokens: Vec<u32>, } @@ -26,7 +27,6 @@ pub const DTYPE: candle::DType = candle::DType::F32; // Audio parameters. pub const SAMPLE_RATE: usize = 16000; pub const N_FFT: usize = 400; -pub const N_MELS: usize = 80; pub const HOP_LENGTH: usize = 160; pub const CHUNK_LENGTH: usize = 30; pub const N_SAMPLES: usize = CHUNK_LENGTH * SAMPLE_RATE; // 480000 samples in a 30-second chunk -- cgit v1.2.3