Spaces:

kirakayy
/

er

Sleeping

App Files Files Community

kirakayy committed on Sep 13

Commit

69f0258

verified ·

1 Parent(s): a24df2b

Update app.py

Browse files

Files changed (1) hide show

app.py +98 -26

app.py CHANGED Viewed

@@ -1,5 +1,9 @@
-import os, json, joblib, numpy as np, gradio as gr
-from typing import Any, Dict, List
 from huggingface_hub import hf_hub_download
 import re
@@ -9,21 +13,28 @@ TOKEN = os.getenv("HF_TOKEN", None)  # add in Space Settings → Secrets if repo
 # ---------- Safe numeric helpers ----------
 NUM_RE = re.compile(r"[-+]?\d*\.?\d+")
 def _try_num(x: Any) -> float | None:
-    if x is None: return None
     s = str(x).strip().lower()
     mult = 1.0
-    if "k" in s and re.search(r"\d", s): s = s.replace("k",""); mult = 1000.0
-    if "m" in s and re.search(r"\d", s): s = s.replace("m",""); mult = 1_000_000.0
     s = re.sub(r"[^0-9.\-]", "", s)
-    if s in {"","-","."}: return None
-    try: return float(s) * mult
     except Exception:
         m = NUM_RE.search(str(x))
         return float(m.group(0)) if m else None
 def to_float(x: Any, default: float = 0.0) -> float:
-    if isinstance(x, (int,float)): return float(x)
     v = _try_num(x)
     return float(v) if v is not None else float(default)
@@ -41,42 +52,101 @@ feat_path   = hf_hub_download(repo_id=MODEL_REPO_ID, filename="feature_order.jso
 thresh_path = hf_hub_download(repo_id=MODEL_REPO_ID, filename="score_thresholds.json", token=TOKEN)
 reg = joblib.load(model_path)
-with open(feat_path) as f: FEATURE_ORDER: List[str] = json.load(f)
-with open(thresh_path) as f: THRESH: Dict[str, float] = json.load(f)
 def to_label(score: float) -> str:
-    low_lt = THRESH.get("low_lt", 40)
-    med_lt = THRESH.get("medium_lt", 70)
     return "low" if score < low_lt else ("medium" if score < med_lt else "high")
 # ---------- Prediction ----------
 def predict_readiness(savings_amount, monthly_income, entertainment_spending,
                       sales_skills_1_5, independence_1_5, risk_tolerance_1_10, age):
     values = {
         "savings_amount":         max(0.0, to_float(savings_amount)),
         "monthly_income":         max(0.0, to_float(monthly_income)),
         "entertainment_spending": max(0.0, to_float(entertainment_spending)),
         "sales_skills_1_5":       clip_range(sales_skills_1_5, 1, 5),
-        "independence_1_5":       clip_range(independence_1_5, 1, 5),  # <-- keep 'independence'
         "risk_tolerance_1_10":    clip_range(risk_tolerance_1_10, 1, 10),
         "age":                    int(round(clip_range(age, 13, 100))),
     }
-    # Build feature vector in EXACT order your model expects
     x = [values.get(name, 0.0) for name in FEATURE_ORDER]
-    x_arr = np.asarray([x], dtype=float)  # ensure numeric dtype
-    # Predict → coerce → clamp to 0–100
-    y_pred = reg.predict(x_arr)
-    raw = float(np.asarray(y_pred).ravel()[0]) if y_pred is not None else 0.0
-    score = clip01_100(raw)
-    low_lt = THRESH.get("low_lt", 40)
-    med_lt = THRESH.get("medium_lt", 70)
     return {
-        "readiness_score_0_100": round(score, 2),
-        "readiness_label": to_label(score),
         "thresholds": f"low<{low_lt}, medium {low_lt}–{med_lt-0.01:.2f}, high≥{med_lt}",
     }
@@ -92,7 +162,9 @@ inputs = [
 ]
 demo = gr.Interface(
-    fn=predict_readiness, inputs=inputs, outputs="json",
     title="Entrepreneurial Readiness — Simple Regressor",
     description="Enter details to estimate a 0–100 readiness score and label (low/medium/high)."
 )

+import os
+import json
+import joblib
+import numpy as np
+import gradio as gr
+from typing import Any, Dict, List, Tuple
 from huggingface_hub import hf_hub_download
 import re
 # ---------- Safe numeric helpers ----------
 NUM_RE = re.compile(r"[-+]?\d*\.?\d+")
 def _try_num(x: Any) -> float | None:
+    if x is None:
+        return None
     s = str(x).strip().lower()
     mult = 1.0
+    if "k" in s and re.search(r"\d", s):
+        s = s.replace("k", ""); mult = 1000.0
+    if "m" in s and re.search(r"\d", s):
+        s = s.replace("m", ""); mult = 1_000_000.0
     s = re.sub(r"[^0-9.\-]", "", s)
+    if s in {"", "-", "."}:
+        return None
+    try:
+        return float(s) * mult
     except Exception:
         m = NUM_RE.search(str(x))
         return float(m.group(0)) if m else None
 def to_float(x: Any, default: float = 0.0) -> float:
     """Coerce ``x`` to a finite float, falling back to ``default``.
     Args:
         x: A Python/NumPy number, or any other value, which is handed to
             ``_try_num`` for text parsing.
         default: Returned (as a float) when ``x`` cannot be parsed, is NaN or
             infinite, or is an integer too large for a float.
     Returns:
         A finite float taken from ``x``, otherwise ``float(default)``.
     """
     fallback = float(default)
     if isinstance(x, (int, float, np.integer, np.floating)):
         try:
             value = float(x)
         except OverflowError:
             # e.g. 10**400: too large to represent, so treat it as unusable input.
             return fallback
     else:
         parsed = _try_num(x)
         if parsed is None:
             return fallback
         value = float(parsed)
     # NaN/inf must not reach the feature vector; substitute the default instead.
     return value if np.isfinite(value) else fallback
 thresh_path = hf_hub_download(repo_id=MODEL_REPO_ID, filename="score_thresholds.json", token=TOKEN)
 # NOTE(security): joblib.load unpickles the artifact, which can execute arbitrary
 # code. Only point MODEL_REPO_ID at a repository you trust.
 reg = joblib.load(model_path)
 # Decode the JSON side-files as UTF-8 explicitly so the result does not depend
 # on the host's locale default encoding.
 with open(feat_path, encoding="utf-8") as f:
     FEATURE_ORDER: List[str] = json.load(f)
 with open(thresh_path, encoding="utf-8") as f:
     THRESH: Dict[str, float] = json.load(f)
+# ---------- Label helpers ----------
+def thresholds() -> Tuple[float, float]:
+    return THRESH.get("low_lt", 40.0), THRESH.get("medium_lt", 70.0)
 def to_label(score: float) -> str:
     """Map a numeric score to "low", "medium" or "high" using ``thresholds()``.
     Scores below the low cut-off are "low", scores below the medium cut-off are
     "medium", and everything else is "high".
     """
     low_cutoff, medium_cutoff = thresholds()
     if score < low_cutoff:
         return "low"
     if score < medium_cutoff:
         return "medium"
     return "high"
+def anchors_from_thresholds() -> Dict[str, float]:
+    low_lt, med_lt = thresholds()
+    # Midpoints of the buckets: [0, low), [low, med), [med, 100]
+    return {
+        "low": low_lt / 2.0,                         # e.g., 20 if low_lt=40
+        "medium": (low_lt + med_lt) / 2.0,          # e.g., 55 if 40/70
+        "high": (med_lt + 100.0) / 2.0              # e.g., 85 if 70/100
+    }
+def score_from_label_only(label: str) -> float:
+    a = anchors_from_thresholds()
+    return float(a.get(str(label).lower(), a["medium"]))
+def score_from_proba(model, X: np.ndarray, fallback_label: str | None = None) -> Tuple[float, str]:
+    anchors = anchors_from_thresholds()
+    if hasattr(model, "predict_proba"):
+        try:
+            proba = model.predict_proba(X)[0]
+            classes = getattr(model, "classes_", None)
+            if classes is None:
+                # assume order low, medium, high
+                classes = np.array(["low", "medium", "high"], dtype=object)
+            # Normalize labels to lowercase strings
+            classes_l = [str(c).lower() for c in classes]
+            # Expected score = sum(p_c * anchor_c)
+            expected = 0.0
+            for c, p in zip(classes_l, proba):
+                expected += float(p) * float(anchors.get(c, anchors["medium"]))
+            # Choose label: max-proba if not provided
+            pred_label = fallback_label
+            if pred_label is None:
+                pred_label = classes_l[int(np.argmax(proba))]
+            return clip01_100(expected), pred_label
+        except Exception:
+            pass
+    # No predict_proba → map the label to its anchor
+    if fallback_label is None:
+        fallback_label = "medium"
+    return clip01_100(score_from_label_only(fallback_label)), str(fallback_label).lower()
 # ---------- Prediction ----------
 def predict_readiness(savings_amount, monthly_income, entertainment_spending,
                       sales_skills_1_5, independence_1_5, risk_tolerance_1_10, age):
     """Score one set of form inputs and return a JSON-friendly result dict.
     Money fields are coerced with ``to_float`` and floored at 0; rating fields and
     age go through ``clip_range`` with the bounds shown below. The features are
     ordered by ``FEATURE_ORDER`` (names missing from the inputs become 0.0) and fed
     to ``reg.predict``. A numeric prediction is clamped with ``clip01_100`` and
     labelled via ``to_label``; any other prediction is treated as a class label
     and scored by ``score_from_proba``.
     Returns:
         Dict with "readiness_score_0_100" (rounded to 2 places),
         "readiness_label", and a human-readable "thresholds" summary.
     """
     # Sanitise the raw UI values, one feature at a time.
     features = {}
     features["savings_amount"] = max(0.0, to_float(savings_amount))
     features["monthly_income"] = max(0.0, to_float(monthly_income))
     features["entertainment_spending"] = max(0.0, to_float(entertainment_spending))
     features["sales_skills_1_5"] = clip_range(sales_skills_1_5, 1, 5)
     features["independence_1_5"] = clip_range(independence_1_5, 1, 5)
     features["risk_tolerance_1_10"] = clip_range(risk_tolerance_1_10, 1, 10)
     features["age"] = int(round(clip_range(age, 13, 100)))
     # Single-row matrix in the column order stored in FEATURE_ORDER.
     row = [features.get(name, 0.0) for name in FEATURE_ORDER]
     X = np.asarray([row], dtype=float)
     first = np.asarray(reg.predict(X)).ravel()[0]
     numeric_types = (int, float, np.integer, np.floating)
     if not isinstance(first, numeric_types):
         # Label output (e.g. 'low'/'medium'/'high'): derive the score from it.
         score, label = score_from_proba(reg, X, fallback_label=str(first).lower())
     else:
         # Numeric output: clamp, then bucket by the thresholds.
         score = clip01_100(float(first))
         label = to_label(score)
     low_lt, med_lt = thresholds()
     summary = f"low<{low_lt}, medium {low_lt}–{med_lt-0.01:.2f}, high≥{med_lt}"
     result = {
         "readiness_score_0_100": round(float(score), 2),
         "readiness_label": label,
         "thresholds": summary,
     }
     return result
 ]
 # Gradio form: the `inputs` components feed predict_readiness; its dict is shown as JSON.
 demo = gr.Interface(
     title="Entrepreneurial Readiness — Simple Regressor",
     description="Enter details to estimate a 0–100 readiness score and label (low/medium/high).",
     fn=predict_readiness,
     inputs=inputs,
     outputs="json",
 )