Spaces:

quang227
/

moonshotai-Kimi-Dev-72B

Running

quang227 committed 6 days ago

Commit

8d2f7ae

verified ·

1 Parent(s): e32e9f2

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -1,10 +1,33 @@
 import gradio as gr
-with gr.Blocks(fill_height=True) as demo:
-    with gr.Sidebar():
-        gr.Markdown("# Inference Provider")
-        gr.Markdown("This Space showcases the moonshotai/Kimi-Dev-72B model, served by the featherless-ai API. Sign in with your Hugging Face account to use this API.")
-        button = gr.LoginButton("Sign in")
-    gr.load("models/moonshotai/Kimi-Dev-72B", accept_token=button, provider="featherless-ai")
-demo.launch()

 import gradio as gr
+from huggingface_hub import InferenceClient
+# Module-level inference client created for the "moonshotai/Kimi-Dev-72B" model id;
+# chat() sends every generation request through this single instance.
+# NOTE(review): no token or provider is passed here — confirm that credentials and
+# provider selection are expected to come from the environment.
+client = InferenceClient("moonshotai/Kimi-Dev-72B")
+def chat(message, system_prompt="", max_tokens=1024, temperature=0.9, top_p=0.95, top_k=40, repetition_penalty=1.0):
+    """Generate a text completion for ``message`` via the module-level ``client``.
+
+    Args:
+        message: The user's prompt text.
+        system_prompt: Optional text placed on its own line before ``message``;
+            when empty, ``message`` is sent unchanged.
+        max_tokens: Forwarded as ``max_new_tokens`` (coerced to ``int``).
+        temperature: Forwarded as ``temperature``.
+        top_p: Forwarded as ``top_p``.
+        top_k: Forwarded as ``top_k`` (coerced to ``int``).
+        repetition_penalty: Forwarded as ``repetition_penalty``.
+
+    Returns:
+        The value returned by ``client.text_generation`` for the assembled
+        prompt (requested with ``return_full_text=False``).
+    """
+    prompt = f"{system_prompt}\n{message}" if system_prompt else message
+    return client.text_generation(
+        prompt=prompt,
+        # UI sliders may deliver non-integer numbers; this knob is a token count.
+        max_new_tokens=int(max_tokens),
+        temperature=temperature,
+        top_p=top_p,
+        # top_k used to be accepted but never forwarded, so the Top-k control
+        # silently had no effect on generation.
+        top_k=int(top_k),
+        repetition_penalty=repetition_penalty,
+        do_sample=True,
+        return_full_text=False,
+    )
+# Build the UI. The input components are listed in the same order as chat()'s
+# parameters (message, system_prompt, max_tokens, temperature, top_p, top_k,
+# repetition_penalty) so each control feeds the matching argument.
+demo = gr.Interface(
+    fn=chat,
+    inputs=[
+        gr.Textbox(label="Prompt"),
+        gr.Textbox(label="System Prompt", value=""),
+        # step=1 keeps the integer-valued controls on whole numbers; without an
+        # explicit step the slider picks its own increment from the range.
+        gr.Slider(1, 2048, value=1024, step=1, label="Max Tokens"),
+        gr.Slider(0.1, 1.0, value=0.9, label="Temperature"),
+        gr.Slider(0.1, 1.0, value=0.95, label="Top-p"),
+        gr.Slider(1, 100, value=40, step=1, label="Top-k"),
+        gr.Slider(1.0, 2.0, value=1.0, label="Repetition Penalty"),
+    ],
+    outputs=gr.Textbox(label="Response"),
+)
+# Start the web server for the interface.
+demo.launch()