File size: 198 Bytes
293ab16
 
 
 
 
 
1
2
3
4
5
6
from llama_cpp import Llama

# Inputs for this one-shot demo, named so they are easy to spot and change.
# NOTE(review): the file name suggests a Q4_K_M-quantized Llama 3 8B Instruct
# GGUF file — confirm that this relative path exists where the script is run.
MODEL_PATH = "models/llama-3-8b-instruct.Q4_K_M.gguf"
PROMPT = "Q: What is the capital of Kenya? A:"

# Construct the model wrapper from the model file path.
llm = Llama(model_path=MODEL_PATH)

# Call the model once with the prompt, passing max_tokens=32.
output = llm(PROMPT, max_tokens=32)

# The result is indexed as output["choices"][0]["text"]; print that text.
first_choice = output["choices"][0]
print(first_choice["text"])