smaller t5 models quantized (#934)

2025-06-15 10:26:33 +00:00 · 2023-09-22 14:31:23 -07:00
parent 912a3d63b0
commit cda1786eed
1 changed file with 2 additions and 2 deletions
--- a/candle-wasm-examples/t5/utils.js
+++ b/candle-wasm-examples/t5/utils.js
@@ -67,7 +67,7 @@ export async function generateText(
 }
 export const MODELS = {
  t5_small_quantized: {
-    size: "102 MB",
+    size: "64.4 MB",
    base_url: "https://huggingface.co/lmz/candle-quantized-t5/resolve/main/",
    model: "model.gguf",
    tokenizer: "tokenizer.json",
@@ -135,7 +135,7 @@ export const MODELS = {
  },

  flan_t5_base_quantized: {
-    size: "360 MB",
+    size: "263 MB",
    base_url: "https://huggingface.co/lmz/candle-quantized-t5/resolve/main/",
    model: "model-flan-t5-base.gguf",
    tokenizer: "tokenizer.json",