Whisper quantized wasm (#1028)

* [Whisper] Update to use quantized model * [whisper] add language detection * [whisper] change assets location * [whisper] adapt js example with quantized models * [whisper] better task parsing * [whisper] minor fixes
2025-06-21 20:22:49 +00:00 · 2023-10-04 12:22:57 -07:00
parent c18a856e76
commit 27e70a5093
13 changed files with 540 additions and 596 deletions
--- a/candle-wasm-examples/whisper/src/audio.rs
+++ b/candle-wasm-examples/whisper/src/audio.rs
@ -168,7 +168,7 @@ fn log_mel_spectrogram_<T: Float + std::fmt::Display>(
    let n_len = samples.len() / fft_step;

    // pad audio with at least one extra chunk of zeros
-    let pad = 100 * worker::CHUNK_LENGTH / 2;
+    let pad = 100 * worker::m::CHUNK_LENGTH / 2;
    let n_len = if n_len % pad != 0 {
        (n_len / pad + 1) * pad
    } else {
@ -206,9 +206,9 @@ pub fn pcm_to_mel<T: Float + std::fmt::Display>(
    let mel = log_mel_spectrogram_(
        samples,
        filters,
-        worker::N_FFT,
-        worker::HOP_LENGTH,
-        worker::N_MELS,
+        worker::m::N_FFT,
+        worker::m::HOP_LENGTH,
+        worker::m::N_MELS,
        false,
    );
    Ok(mel)