Spaces:

mobinln
/

chatbot

Running

mobinln committed on Jul 8, 2024

Commit

d637b43

verified ·

1 Parent(s): b83b316

Change to smaller llama3 quantization (Q8_0 -> Q4_K_S)

Files changed (1) hide show

app.py CHANGED Viewed

@@ -4,7 +4,7 @@ from llama_cpp import Llama
 model = "SanctumAI/Meta-Llama-3-8B-Instruct-GGUF"
 llm = Llama.from_pretrained(
     repo_id=model,
-    filename="meta-llama-3-8b-instruct.Q8_0.gguf",
     verbose=True,
     use_mmap=False,
     use_mlock=True,

 model = "SanctumAI/Meta-Llama-3-8B-Instruct-GGUF"
 llm = Llama.from_pretrained(
     repo_id=model,
+    filename="meta-llama-3-8b-instruct.Q4_K_S.gguf",
     verbose=True,
     use_mmap=False,
     use_mlock=True,