qwerty45-uiop committed on
Commit
1b7ef96
·
verified ·
1 Parent(s): 061b18f

Update src/streamlit_app.py

Browse files
Files changed (1) hide show
  1. src/streamlit_app.py +7 -5
src/streamlit_app.py CHANGED
@@ -72,6 +72,12 @@ def extract_numeric_ram(ram) -> Optional[int]:
72
  return None
73
 
74
  # Streamlined LLM database with popular models and download sizes
 
 
 
 
 
 
75
  LLM_DATABASE = {
76
 
77
  "ultra_low": { # ≤2GB
@@ -183,11 +189,7 @@ LLM_DATABASE = {
183
  ]
184
  }
185
  }
186
- QUANTIZATION_INFO = {
187
- "fp16": {"multiplier": 1.0, "label": "FP16 (Full)", "description": "Best quality, largest size"},
188
- "8bit": {"multiplier": 0.5, "label": "8-bit", "description": "Good quality, 50% smaller"},
189
- "4bit": {"multiplier": 0.25, "label": "4-bit", "description": "Decent quality, 75% smaller"}
190
- }
191
 
192
  # Enhanced LLM recommendation with performance tiers
193
  def recommend_llm(ram_str) -> Tuple[str, str, str, Dict[str, List[Dict]]]:
 
72
  return None
73
 
74
  # Streamlined LLM database with popular models and download sizes
75
+
76
+ QUANTIZATION_INFO = {
77
+ "fp16": {"multiplier": 1.0, "label": "FP16 (Full)", "description": "Best quality, largest size"},
78
+ "8bit": {"multiplier": 0.5, "label": "8-bit", "description": "Good quality, 50% smaller"},
79
+ "4bit": {"multiplier": 0.25, "label": "4-bit", "description": "Decent quality, 75% smaller"}
80
+ }
81
  LLM_DATABASE = {
82
 
83
  "ultra_low": { # ≤2GB
 
189
  ]
190
  }
191
  }
192
+
 
 
 
 
193
 
194
  # Enhanced LLM recommendation with performance tiers
195
  def recommend_llm(ram_str) -> Tuple[str, str, str, Dict[str, List[Dict]]]: