Spaces:

qwerty45-uiop
/

LLM-Compatibilty-Advisor

Sleeping

qwerty45-uiop committed on Jun 29

Commit

a7ce83d

verified ·

1 Parent(s): 98ae49c

Update src/streamlit_app.py

Files changed (1) hide show

src/streamlit_app.py CHANGED Viewed

@@ -73,6 +73,11 @@ def extract_numeric_ram(ram) -> Optional[int]:
 # Streamlined LLM database with popular models and download sizes
 LLM_DATABASE = {
     "ultra_low": {  # ≤2GB
         "general": [
             {"name": "TinyLlama-1.1B-Chat", "size": "637MB", "description": "Compact chat model"},

 # Streamlined LLM database with popular models and download sizes
 LLM_DATABASE = {
+    QUANTIZATION_INFO = {
+    "fp16": {"multiplier": 1.0, "label": "FP16 (Full)", "description": "Best quality, largest size"},
+    "8bit": {"multiplier": 0.5, "label": "8-bit", "description": "Good quality, 50% smaller"},
+    "4bit": {"multiplier": 0.25, "label": "4-bit", "description": "Decent quality, 75% smaller"}
+}
     "ultra_low": {  # ≤2GB
         "general": [
             {"name": "TinyLlama-1.1B-Chat", "size": "637MB", "description": "Compact chat model"},