smaller t5 models quantized (#934)

This commit is contained in:
Radamés Ajna
2023-09-22 14:31:23 -07:00
committed by GitHub
parent 912a3d63b0
commit cda1786eed

View File

@@ -67,7 +67,7 @@ export async function generateText(
}
export const MODELS = {
t5_small_quantized: {
-size: "102 MB",
+size: "64.4 MB",
base_url: "https://huggingface.co/lmz/candle-quantized-t5/resolve/main/",
model: "model.gguf",
tokenizer: "tokenizer.json",
@@ -135,7 +135,7 @@ export const MODELS = {
},
flan_t5_base_quantized: {
-size: "360 MB",
+size: "263 MB",
base_url: "https://huggingface.co/lmz/candle-quantized-t5/resolve/main/",
model: "model-flan-t5-base.gguf",
tokenizer: "tokenizer.json",