Spaces:

Bton
/

llama3_product-reviewer

Sleeping

App Files Community

Bton committed on Jun 7

Commit

ca3cfbc

verified ·

1 Parent(s): 17d8965

Update app.py

Browse files

Files changed (1) hide show

app.py +39 -51

app.py CHANGED Viewed

@@ -1,84 +1,72 @@
 import gradio as gr
-from huggingface_hub import hf_hub_download
 from llama_cpp import Llama
-import json
-# --- Config ---
-MODEL_REPO = "Bton/llama3-product-reviewer"
-GGUF_FILENAME = "unsloth.Q4_K_M.gguf"
-# --- Download GGUF model from Hugging Face ---
-print("📦 Downloading model from Hugging Face Hub...")
-model_path = hf_hub_download(repo_id=MODEL_REPO, filename=GGUF_FILENAME)
-print("✅ Download complete:", model_path)
-# --- Load LLaMA model ---
 llm = Llama(
     model_path=model_path,
-    n_ctx=2048,
-    n_threads=8,     # adjust for Space CPU
-    n_batch=16,
-    verbose=True
 )
-# --- Gradio function ---
-def generate_review(product_title, rating, price, about_this_item):
-    input_data = {
-        "product_title": product_title,
-        "rating": rating,
         "price": price,
-        "about_this_item": about_this_item,
     }
     prompt = (
         "Write a helpful and natural-sounding customer review in JSON format with two fields: "
-        "\"title\" and \"review\" for the following product.\n\n"
-        "Product:\n"
-        f"{json.dumps(input_data, indent=2)}"
     )
-    response = llm(
-        prompt,
-        stop=["</s>"],
-        max_tokens=512,
-        temperature=0.7,
-        top_p=0.9,
-    )
     try:
-        # Extract JSON from model response
-        json_start = response["choices"][0]["text"].find("{")
-        json_str = response["choices"][0]["text"][json_start:]
-        review_data = json.loads(json_str)
-        return review_data.get("title", ""), review_data.get("review", "")
     except Exception as e:
-        return "Review Title Generation Failed", response["choices"][0]["text"]
-# --- Gradio UI ---
 with gr.Blocks() as demo:
-    gr.Markdown("🛍️ **LLaMA3 Product Review Generator**")
     with gr.Row():
-        product_title = gr.Textbox(label="Product Title", placeholder="Ergonomic Mesh Office Chair")
-        rating = gr.Textbox(label="Rating", placeholder="4.6 out of 5 stars")
         price = gr.Textbox(label="Price", placeholder="$129.99")
-    about_this_item = gr.Textbox(
         label="About This Item",
-        placeholder="• Breathable mesh back • Adjustable lumbar support • Smooth-rolling casters • Height-adjustable armrests",
         lines=4
     )
-    submit_btn = gr.Button("✍️ Generate Review")
-    review_title = gr.Textbox(label="Generated Review Title")
-    review_body = gr.Textbox(label="Generated Review Body", lines=5)
-    submit_btn.click(
-        fn=generate_review,
-        inputs=[product_title, rating, price, about_this_item],
-        outputs=[review_title, review_body]
-    )
-# --- Launch app ---
 demo.launch()

+import os
+import json
 import gradio as gr
 from llama_cpp import Llama
+from huggingface_hub import hf_hub_download
+# Hugging Face model repo + filename
+REPO_ID = "Bton/llama3-product-reviewer"
+FILENAME = "llama3-pr-Q4_K_M.gguf"
+# Download model from Hugging Face Hub (if not cached)
+model_path = hf_hub_download(repo_id=REPO_ID, filename=FILENAME, local_dir=".")
+# Load model with llama-cpp-python
 llm = Llama(
     model_path=model_path,
+    n_ctx=1024,
+    n_batch=8,
+    n_threads=os.cpu_count(),
+    use_mlock=False,
+    verbose=False
 )
+# Prompt wrapper (finetuned prompt must remain unchanged!)
+def generate_review(title, price, rating, about):
+    product_data = {
+        "product_title": title,
         "price": price,
+        "rating": rating,
+        "about_this_item": about
     }
     prompt = (
         "Write a helpful and natural-sounding customer review in JSON format with two fields: "
+        "\"title\" and \"review\" for the product below.\n\n"
+        f"{json.dumps(product_data, ensure_ascii=False)}"
     )
+    response = llm(prompt, max_tokens=512)
+    raw = response["choices"][0]["text"]
     try:
+        # Find and parse JSON
+        json_start = raw.find("{")
+        review_data = json.loads(raw[json_start:])
+        return review_data.get("title", "Untitled"), review_data.get("review", raw.strip())
     except Exception as e:
+        return "Error", raw.strip()
+# Gradio interface
 with gr.Blocks() as demo:
+    gr.Markdown("## 📝 LLaMA3 Product Review Generator (CPU Only - ZeroGPU Space)")
     with gr.Row():
+        title = gr.Textbox(label="Product Title", placeholder="Ergonomic Office Chair")
         price = gr.Textbox(label="Price", placeholder="$129.99")
+        rating = gr.Textbox(label="Rating", placeholder="4.6 out of 5 stars")
+    about = gr.Textbox(
         label="About This Item",
+        placeholder="• Breathable mesh back\n• Adjustable lumbar support\n• Height-adjustable armrests",
         lines=4
     )
+    btn = gr.Button("Generate Review")
+    out_title = gr.Textbox(label="Generated Title")
+    out_review = gr.Textbox(label="Generated Review", lines=5)
+    btn.click(generate_review, inputs=[title, price, rating, about], outputs=[out_title, out_review])
 demo.launch()