Implement top_p / nucleus sampling (#819)

* Implement top_p / nucleus sampling * Update changelog * rustfmt * Add tests * Fix clippy warning * Fix another clippy error
2025-06-19 11:56:45 +00:00 · 2023-09-12 09:10:16 -07:00
parent 42da17694a
commit 805bf9ffa7
12 changed files with 199 additions and 43 deletions
--- a/candle-wasm-examples/llama2-c/lib-example.html
+++ b/candle-wasm-examples/llama2-c/lib-example.html
@ -56,6 +56,7 @@
        const weightsURL = `${MODELS_BASE_URL}/${model.url}`;
        const prompt = getValue("prompt");
        const temperature = getValue("temperature");
+        const topP = getValue("top-p");
        const repeatPenalty = getValue("repeat_penalty");
        const seed = getValue("seed");
        const maxSeqLen = getValue("max-seq");
@ -99,6 +100,7 @@
            tokenizerURL: "tokenizer.json",
            prompt,
            temp: temperature,
+            top_p: topP,
            repeatPenalty,
            seed: BigInt(seed),
            maxSeqLen,
@ -251,7 +253,7 @@
        <input
          type="range"
          id="max-seq"
-          name="temperature"
+          name="max-seq"
          min="1"
          max="256"
          step="1"
@ -279,6 +281,22 @@
        >
          0.50</output
        >
+        <label class="text-sm font-medium" for="top-p">Top-p</label>
+        <input
+          type="range"
+          id="top-p"
+          name="top-p"
+          min="0"
+          max="1"
+          step="0.01"
+          value="1.00"
+          oninput="this.nextElementSibling.value = Number(this.value).toFixed(2)"
+        />
+        <output
+          class="text-xs w-[50px] text-center font-light px-1 py-1 border border-gray-700 rounded-md"
+        >
+          1.00</output
+        >

        <label class="text-sm font-medium" for="repeat_penalty"
          >Repeat Penalty</label