Spaces:
Running
Running
Update src/worker.js
Browse files
- src/worker.js +2 -2
src/worker.js
CHANGED
@@ -80,9 +80,9 @@ await transcriber(new Float32Array(INPUT_SAMPLE_RATE)); // Compile shaders
|
|
80 |
const llm_model_id = "onnx-community/Qwen3-1.7B-ONNX";
|
81 |
const tokenizer = await AutoTokenizer.from_pretrained("Qwen/Qwen3-1.7B"); // Load tokenizer from original repo
|
82 |
const llm = await AutoModelForCausalLM.from_pretrained(llm_model_id, {
|
83 |
-
dtype: "q4f16",
|
84 |
device: "webgpu",
|
85 |
-
|
86 |
});
|
87 |
|
88 |
const SYSTEM_MESSAGE = {
|
|
|
80 |
const llm_model_id = "onnx-community/Qwen3-1.7B-ONNX";
|
81 |
const tokenizer = await AutoTokenizer.from_pretrained("Qwen/Qwen3-1.7B"); // Load tokenizer from original repo
|
82 |
const llm = await AutoModelForCausalLM.from_pretrained(llm_model_id, {
|
83 |
+
dtype: "q4f16", // This alone should make it pick model_q4f16.onnx
|
84 |
device: "webgpu",
|
85 |
+
// Don't specify model_file_name - let Transformers.js construct the path
|
86 |
});
|
87 |
|
88 |
const SYSTEM_MESSAGE = {
|