Commit · 425af9c
1 Parent(s): 20a6be7
Update primary endpoint to the 32B model, with 7B fallback
app.py
CHANGED
@@ -60,23 +60,21 @@ def gemini_flash_completion(prompt, model="gemini-2.5-flash-preview-04-17", temp
         return "Error generating response from Gemini."

 # —— Qwen 2.5 VL Client Setup —————
-qwen_client = Client("prithivMLmods/Qwen2.5-VL-7B-Instruct")
 logger.info("[Qwen] Using remote API via Gradio Client")
-
+# Read the uploaded image and reason over its contents
 def qwen_image_summary(image_file: UploadFile, subject: str, level: str) -> str:
     from gradio_client import Client, handle_file
-    import tempfile
-
+    import tempfile, os
+    from fastapi import HTTPException
+    # Reject unsupported formats
     if image_file.content_type not in {"image/png", "image/jpeg", "image/jpg"}:
         raise HTTPException(415, "Only PNG or JPEG images are supported")
-    # Write
-
-
-
-
-
-    # Prompt
-    instruction = f"""
+    # Write the uploaded image to a temporary cache file
+    with tempfile.NamedTemporaryFile(delete=False, suffix=".jpg") as tmp:
+        tmp.write(image_file.file.read())
+        tmp_path = tmp.name
+    # Engineered prompt
+    instruction = f"""
 You are an academic tutor.

 The student has submitted an image that may contain multiple exam-style questions or study material. Your task is to:
@@ -97,12 +95,42 @@ def qwen_image_summary(image_file: UploadFile, subject: str, level: str) -> str:

 Only include what appears in the image. Be accurate and neat.
 """
-
-
-
-
+
+    # ——— 1️⃣ Primary: 32B Model (Qwen/Qwen2.5-VL-32B-Instruct) ———
+    try:
+        logger.info("[Qwen32B] Using /predict ...")
+        client32 = Client("Qwen/Qwen2.5-VL-32B-Instruct")
+        # Build the chatbot-style payload
+        _chatbot_payload = [
+            (None, instruction.strip()),
+            (None, {"file": tmp_path})
+        ]
+        # Call the remote client
+        result = client32.predict(_chatbot=_chatbot_payload, api_name="/predict")
+        # Clean the result
+        if isinstance(result, (list, tuple)) and result:
+            assistant_reply = (result[0] or "").strip()
+        else:
+            assistant_reply = str(result).strip()
+        # Primary success
+        if assistant_reply:
+            logger.info("[Qwen32B] ✅ Successfully transcribed.")
+            os.remove(tmp_path)
+            return assistant_reply
+        # Empty reply
+        raise ValueError("Empty result from 32B")
+    # Primary failed
+    except Exception as e_32b:
+        logger.warning(f"[Qwen32B] ❌ Failed: {e_32b} — falling back to Qwen 7B")
+
+    # ——— 2️⃣ Fallback: 7B Model (prithivMLmods/Qwen2.5-VL) ———
+    try:
+        logger.info("[Qwen7B] Using /generate_image fallback ...")
+        client7 = Client("prithivMLmods/Qwen2.5-VL")
+        # Fallback client call
+        result = client7.predict(
             model_name="Qwen2.5-VL-7B-Instruct",
-        text=instruction,
+            text=instruction.strip(),
             image=handle_file(tmp_path),
             max_new_tokens=1024,
             temperature=0.6,
@@ -111,13 +139,19 @@ def qwen_image_summary(image_file: UploadFile, subject: str, level: str) -> str:
             repetition_penalty=1.2,
             api_name="/generate_image"
         )
-
+        # Clean the result
+        result = (result or "").strip()
         os.remove(tmp_path)
-
-
-
-
-
+        # Return the fallback result
+        if result:
+            logger.info("[Qwen7B] ✅ Fallback succeeded.")
+            return result
+        # Empty reply
+        raise ValueError("Empty result from 7B fallback")
+    # Both models failed
+    except Exception as e_7b:
+        logger.error(f"[Qwen7B] ❌ Fallback also failed: {e_7b}")
+        raise HTTPException(500, "❌ Both Qwen image models failed to process the image.")


 # ————— Unified Chat Endpoint —————
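For a quick sanity check of the new call chain outside the FastAPI app, the same primary/fallback flow can be driven directly with gradio_client. The sketch below is illustrative only: the Space names, api_name values, and generation parameters are copied from the diff above, while transcribe_with_fallback and sample.jpg are hypothetical names introduced for this example.

# Standalone sketch of the 32B-primary / 7B-fallback chain used in the commit above.
# Assumptions: Space names, api_name values, and parameters come from the diff;
# "sample.jpg" is a hypothetical local test image.
from gradio_client import Client, handle_file

def transcribe_with_fallback(image_path: str, prompt: str) -> str:
    try:
        # Primary: Qwen/Qwen2.5-VL-32B-Instruct via /predict with a chatbot-style payload
        client32 = Client("Qwen/Qwen2.5-VL-32B-Instruct")
        result = client32.predict(
            _chatbot=[(None, prompt), (None, {"file": image_path})],
            api_name="/predict",
        )
        reply = result[0] if isinstance(result, (list, tuple)) and result else str(result)
        if reply and reply.strip():
            return reply.strip()
        raise ValueError("Empty result from 32B")
    except Exception:
        # Fallback: prithivMLmods/Qwen2.5-VL via /generate_image
        client7 = Client("prithivMLmods/Qwen2.5-VL")
        result = client7.predict(
            model_name="Qwen2.5-VL-7B-Instruct",
            text=prompt,
            image=handle_file(image_path),
            max_new_tokens=1024,
            temperature=0.6,
            repetition_penalty=1.2,
            api_name="/generate_image",
        )
        return (result or "").strip()

if __name__ == "__main__":
    print(transcribe_with_fallback("sample.jpg", "Transcribe every question in this image."))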