qwerty45-uiop committed on
Commit
a7ce83d
·
verified ·
1 Parent(s): 98ae49c

Update src/streamlit_app.py

Browse files
Files changed (1) hide show
  1. src/streamlit_app.py +5 -0
src/streamlit_app.py CHANGED
@@ -73,6 +73,11 @@ def extract_numeric_ram(ram) -> Optional[int]:
73
 
74
  # Streamlined LLM database with popular models and download sizes
75
  LLM_DATABASE = {
 
 
 
 
 
76
  "ultra_low": { # ≤2GB
77
  "general": [
78
  {"name": "TinyLlama-1.1B-Chat", "size": "637MB", "description": "Compact chat model"},
 
73
 
74
  # Streamlined LLM database with popular models and download sizes
75
  LLM_DATABASE = {
76
+ QUANTIZATION_INFO = {
77
+ "fp16": {"multiplier": 1.0, "label": "FP16 (Full)", "description": "Best quality, largest size"},
78
+ "8bit": {"multiplier": 0.5, "label": "8-bit", "description": "Good quality, 50% smaller"},
79
+ "4bit": {"multiplier": 0.25, "label": "4-bit", "description": "Decent quality, 75% smaller"}
80
+ }
81
  "ultra_low": { # ≤2GB
82
  "general": [
83
  {"name": "TinyLlama-1.1B-Chat", "size": "637MB", "description": "Compact chat model"},