nisten committed on
Commit
23f231e
·
verified ·
1 Parent(s): 277ac94

Update src/worker.js

Browse files
Files changed (1) hide show
  1. src/worker.js +2 -2
src/worker.js CHANGED
@@ -80,9 +80,9 @@ await transcriber(new Float32Array(INPUT_SAMPLE_RATE)); // Compile shaders
80
  const llm_model_id = "onnx-community/Qwen3-1.7B-ONNX";
81
  const tokenizer = await AutoTokenizer.from_pretrained("Qwen/Qwen3-1.7B"); // Load tokenizer from original repo
82
  const llm = await AutoModelForCausalLM.from_pretrained(llm_model_id, {
83
- dtype: "q4f16",
84
  device: "webgpu",
85
- model_file_name: "model_q4f16.onnx" // Specify exact file to avoid external data format
86
  });
87
 
88
  const SYSTEM_MESSAGE = {
 
80
  const llm_model_id = "onnx-community/Qwen3-1.7B-ONNX";
81
  const tokenizer = await AutoTokenizer.from_pretrained("Qwen/Qwen3-1.7B"); // Load tokenizer from original repo
82
  const llm = await AutoModelForCausalLM.from_pretrained(llm_model_id, {
83
+ dtype: "q4f16", // This alone should make it pick model_q4f16.onnx
84
  device: "webgpu",
85
+ // Don't specify model_file_name - let Transformers.js construct the path
86
  });
87
 
88
  const SYSTEM_MESSAGE = {