Update app.py
Browse files
Set the model back to Qwen/Qwen3-32B; max_new_tokens=2048; temperature=0.1.
app.py
CHANGED
@@ -20,8 +20,8 @@ subprocess.run(["playwright", "install"], check=True)
|
|
20 |
# (Keep Constants as is)
|
21 |
# --- Constants ---
|
22 |
DEFAULT_API_URL = "https://agents-course-unit4-scoring.hf.space"
|
23 |
-
|
24 |
-
MODEL_ID = "Qwen/Qwen2.5-Coder-32B-Instruct"
|
25 |
|
26 |
class CachedWebSearchTool(WebSearchTool):
|
27 |
@lru_cache(maxsize=128)
|
@@ -104,8 +104,9 @@ class BasicModel:
|
|
104 |
model=mod,
|
105 |
tokenizer=tok,
|
106 |
max_new_tokens=2048,
|
|
|
107 |
return_full_text=False, # <— only get the completion, not the prompt + completion
|
108 |
-
|
109 |
)
|
110 |
|
111 |
def _serialize_messages(self, messages):
|
|
|
20 |
# (Keep Constants as is)
|
21 |
# --- Constants ---
|
22 |
DEFAULT_API_URL = "https://agents-course-unit4-scoring.hf.space"
|
23 |
+
MODEL_ID = "Qwen/Qwen3-32B"
|
24 |
+
# MODEL_ID = "Qwen/Qwen2.5-Coder-32B-Instruct"
|
25 |
|
26 |
class CachedWebSearchTool(WebSearchTool):
|
27 |
@lru_cache(maxsize=128)
|
|
|
104 |
model=mod,
|
105 |
tokenizer=tok,
|
106 |
max_new_tokens=2048,
|
107 |
+
do_sample=True,
|
108 |
return_full_text=False, # <— only get the completion, not the prompt + completion
|
109 |
+
temperature=0.1,
|
110 |
)
|
111 |
|
112 |
def _serialize_messages(self, messages):
|