Quant t5: Add coedit model to wasm demo and readme (#1031)

2025-06-17 11:08:52 +00:00 · 2023-10-04 15:57:33 -04:00
parent 27e70a5093
commit b86ac0c507
3 changed files with 70 additions and 5 deletions
--- a/candle-examples/examples/quantized-t5/README.md
+++ b/candle-examples/examples/quantized-t5/README.md
@ -13,5 +13,30 @@ generate quantized weight files from the original safetensors file by using the
 `tensor-tools` command line utility via:
 ```bash
-cargo run --example tensor-tools --release -- quantize --quantization q6k PATH/TO/T5/model.safetensors /tmp/model.gguf
+$ cargo run --example tensor-tools --release -- quantize --quantization q6k PATH/TO/T5/model.safetensors /tmp/model.gguf
 ```
 To use a different model, specify the `model-id`. For example, you can use
 quantized [CoEdit models](https://huggingface.co/jbochi/candle-coedit-quantized).
 ```bash
 $ cargo run --example quantized-t5 --release  -- \
  --model-id "jbochi/candle-coedit-quantized" \
  --prompt "Make this text coherent: Their flight is weak. They run quickly through the tree canopy." \
  --temperature 0
 ...
 Although their flight is weak, they run quickly through the tree canopy.
 ```
 By default, it will look for `model.gguf` and `config.json`, but you can specify
 a custom local or remote `weight-file` and `config-file`:
 ```bash
 $ cargo run --example quantized-t5 --release  -- \
  --model-id "jbochi/candle-coedit-quantized" \
  --weight-file "model-xl.gguf" \
  --config-file "config-xl.json" \
  --prompt "Rewrite to make this easier to understand: Note that a storm surge is what forecasters consider a hurricane's most treacherous aspect." \
  --temperature 0
 ...
 Note that a storm surge is what forecasters consider a hurricane's most dangerous part.
 ```
--- a/candle-wasm-examples/t5/index.html
+++ b/candle-wasm-examples/t5/index.html
@ -166,13 +166,19 @@
            target="_blank"
            class="link"
            >flan-t5-small</a
-          >
+          >,
-          and several t5
+          several
          <a
            href="https://huggingface.co/lmz/candle-quantized-t5/tree/main"
            target="_blank"
            class="link">
-            t5 quantized gguf</a
+            t5 quantized gguf models</a
          >, and also a quantized
          <a
            href="https://huggingface.co/jbochi/candle-coedit-quantized/tree/main"
            target="_blank"
            class="link">
            CoEdIT model for text rewrite</a
          >.
        </p>
      </div>
--- a/candle-wasm-examples/t5/utils.js
+++ b/candle-wasm-examples/t5/utils.js
@ -65,6 +65,7 @@ export async function generateText(
    worker.addEventListener("message", messageHandler);
  });
 }
 export const MODELS = {
  t5_small_quantized: {
    size: "64.4 MB",
@ -133,7 +134,6 @@ export const MODELS = {
      summarization: { prefix: "summarize: ", max_length: 200 },
    },
  },
  flan_t5_base_quantized: {
    size: "263 MB",
    base_url: "https://huggingface.co/lmz/candle-quantized-t5/resolve/main/",
@ -156,7 +156,41 @@ export const MODELS = {
      summarization: { prefix: "summarize: ", max_length: 200 },
    },
  },
  coedit_large_quantized: {
    size: "643 MB",
    base_url: "https://huggingface.co/jbochi/candle-coedit-quantized/resolve/main/",
    model: "model.gguf",
    tokenizer: "tokenizer.json",
    config: "config.json",
    tasks: {
      fluency: {
        prefix: "Fix the grammar: ",
        max_length: 300,
      },
      coherence: {
        prefix: "Rewrite to make this easier to understand: ",
        max_length: 300,
      },
      simplification: {
        prefix: "translate English to Romanian: ",
        max_length: 300,
      },
      simplification: {
        prefix: "Paraphrase this: ",
        max_length: 300,
      },
      formalization: {
        prefix: "Write this more formally: ",
        max_length: 300,
      },
      neutralize: {
        prefix: "Write in a more neutral way: ",
        max_length: 300,
      },
    },
  },
 };
 export function getModelInfo(id, taskID) {
  const model = MODELS[id];
  return {