starsnatched committed on
Commit
f741707
·
1 Parent(s): 4582e1f

Update model names and configuration parameters for improved performance

Browse files
Files changed (3) hide show
  1. src/chat.py +2 -0
  2. src/config.py +3 -2
  3. src/vm.py +0 -1
src/chat.py CHANGED
@@ -8,6 +8,7 @@ from ollama import AsyncClient, ChatResponse, Message
8
  from .config import (
9
  MAX_TOOL_CALL_DEPTH,
10
  MODEL_NAME,
 
11
  NUM_CTX,
12
  OLLAMA_HOST,
13
  SYSTEM_PROMPT,
@@ -28,6 +29,7 @@ class ChatSession:
28
  session: str = "default",
29
  host: str = OLLAMA_HOST,
30
  model: str = MODEL_NAME,
 
31
  ) -> None:
32
  init_db()
33
  self._client = AsyncClient(host=host)
 
8
  from .config import (
9
  MAX_TOOL_CALL_DEPTH,
10
  MODEL_NAME,
11
+ EMBEDDING_MODEL_NAME,
12
  NUM_CTX,
13
  OLLAMA_HOST,
14
  SYSTEM_PROMPT,
 
29
  session: str = "default",
30
  host: str = OLLAMA_HOST,
31
  model: str = MODEL_NAME,
32
+ embedding_model: str = EMBEDDING_MODEL_NAME,
33
  ) -> None:
34
  init_db()
35
  self._client = AsyncClient(host=host)
src/config.py CHANGED
@@ -3,10 +3,11 @@ from __future__ import annotations
3
  import os
4
  from typing import Final
5
 
6
- MODEL_NAME: Final[str] = os.getenv("OLLAMA_MODEL", "qwen3")
 
7
  OLLAMA_HOST: Final[str] = os.getenv("OLLAMA_HOST", "http://localhost:11434")
8
  MAX_TOOL_CALL_DEPTH: Final[int] = 5
9
- NUM_CTX: Final[int] = int(os.getenv("OLLAMA_NUM_CTX", "32000"))
10
 
11
  SYSTEM_PROMPT: Final[str] = (
12
  "You are a versatile AI assistant named Starlette able to orchestrate several tools to "
 
3
  import os
4
  from typing import Final
5
 
6
+ MODEL_NAME: Final[str] = os.getenv("OLLAMA_MODEL", "qwen3:1.7b")
7
+ EMBEDDING_MODEL_NAME: Final[str] = os.getenv("OLLAMA_EMBEDDING_MODEL", "snowflake-arctic-embed:137m")
8
  OLLAMA_HOST: Final[str] = os.getenv("OLLAMA_HOST", "http://localhost:11434")
9
  MAX_TOOL_CALL_DEPTH: Final[int] = 5
10
+ NUM_CTX: Final[int] = int(os.getenv("OLLAMA_NUM_CTX", "16000"))
11
 
12
  SYSTEM_PROMPT: Final[str] = (
13
  "You are a versatile AI assistant named Starlette able to orchestrate several tools to "
src/vm.py CHANGED
@@ -1,6 +1,5 @@
1
  from __future__ import annotations
2
 
3
- from typing import Optional
4
  import subprocess
5
  import uuid
6
 
 
1
  from __future__ import annotations
2
 
 
3
  import subprocess
4
  import uuid
5