commit 2fa36d838798bc3c5741e436c9f161a37fa7468f
parent 80bda5622944c958757ff1295afe659deb532699
Author: Aristide Tossou <atossou@mozilla.com>
Date: Wed, 8 Oct 2025 14:27:12 +0000
Bug 1992747 - Unit test llama.cpp additional sampling configuration. r=tarek
Differential Revision: https://phabricator.services.mozilla.com/D267618
Diffstat:
1 file changed, 94 insertions(+), 0 deletions(-)
diff --git a/toolkit/components/ml/tests/browser/browser_ml_native.js b/toolkit/components/ml/tests/browser/browser_ml_native.js
@@ -130,9 +130,30 @@ async function llama_works() {
},
];
+ const samplers = [
+ {
+ type: "top-k",
+ topK: 3,
+ },
+ {
+ type: "top-p",
+ topP: 0.95,
+ },
+
+ {
+ type: "logit-bias",
+ logitBias: [{ token: 5, bias: -1000 }],
+ },
+
+ {
+ type: "dist",
+ },
+ ];
+
info("Calling runWithGenerator for normal run");
for await (const val of engine.runWithGenerator({
prompt,
+ samplers,
})) {
info(val.text);
}
@@ -147,6 +168,79 @@ async function llama_works() {
}
}
+async function llama_fails_with_wrong_samplers() {
+  await EngineProcess.destroyMLEngine();
+  await IndexedDBCache.init({ reset: true });
+
+  const { cleanup } = await setup();
+  try {
+    info("Create the engine for a normal run");
+    const engine = await createEngine({
+      taskName: "text-classification",
+      modelId: "Mozilla/test-llama",
+      modelFile: "TinyStories-656K.Q8_0.gguf",
+      kvCacheDtype: "q8_0",
+      modelRevision: "main",
+      backend: "llama.cpp",
+      logLevel: "Debug",
+    });
+
+    const prompt = [
+      { role: "system", content: "blah" },
+      {
+        role: "user",
+        content: "This is a test that works",
+      },
+    ];
+
+    const samplers = [
+      {
+        type: "top-k",
+        topK: 3,
+      },
+      {
+        type: "top-p",
+        topP: 0.95,
+      },
+      // Per-token logit adjustment: pairs of { token, bias }.
+      {
+        type: "logit-bias",
+        logitBias: [{ token: 5, bias: -1000 }],
+      },
+      // Unknown sampler type: the backend is expected to reject the run.
+      {
+        type: "dist-invalid",
+      },
+    ];
+
+    info("Calling engine.run, expecting rejection due to the invalid sampler");
+    const runEngine = async () => {
+      await engine.run({ prompt, samplers });
+    };
+
+    await Assert.rejects(
+      runEngine(),
+      err =>
+        String(err?.message ?? err).includes(
+          "LlamaRunner.createGenerationStream: 'dist-invalid'"
+        ),
+      "The call should be rejected because it used an invalid sampler"
+    );
+  } finally {
+    info("Destroy the engine");
+    await EngineProcess.destroyMLEngine();
+    await IndexedDBCache.init({ reset: true });
+    await cleanup();
+  }
+}
+
+/**
+ * End-to-end llama.cpp test: a run configured with an invalid sampler type must be rejected.
+ */
+add_task(async function test_ml_smoke_test_llama_fails() {
+  await llama_fails_with_wrong_samplers();
+});
+
/**
* Runs a full end-to-end test on the llama.cpp backend with a model that loads in llama but crashes during inference.
*/