mobinln committed on
Commit
d637b43
·
verified ·
1 Parent(s): b83b316

Change to smaller llama3

Browse files
Files changed (1) hide show
  1. app.py +1 -1
app.py CHANGED
@@ -4,7 +4,7 @@ from llama_cpp import Llama
4
  model = "SanctumAI/Meta-Llama-3-8B-Instruct-GGUF"
5
  llm = Llama.from_pretrained(
6
  repo_id=model,
7
- filename="meta-llama-3-8b-instruct.Q8_0.gguf",
8
  verbose=True,
9
  use_mmap=False,
10
  use_mlock=True,
 
4
  model = "SanctumAI/Meta-Llama-3-8B-Instruct-GGUF"
5
  llm = Llama.from_pretrained(
6
  repo_id=model,
7
+ filename="meta-llama-3-8b-instruct.Q4_K_S.gguf",
8
  verbose=True,
9
  use_mmap=False,
10
  use_mlock=True,