fCola committed
Commit bdc2b04 · verified · 1 Parent(s): 8ade2ed

Update app.py

Files changed (1)
  1. app.py +4 -7
app.py CHANGED
@@ -47,7 +47,7 @@ class HfModelWrapper:
         input_text = self.build_prompt(user_input, history)
         input_ids = self.tokenizer.encode(input_text, return_tensors="pt").to("cuda")
 
-        streamer = TextIteratorStreamer(self.tokenizer, skip_prompt=True)
+        streamer = TextIteratorStreamer(self.tokenizer, skip_prompt=True, skip_special_tokens=True)
 
         gen_kwargs = {
             "inputs": input_ids,
@@ -509,15 +509,12 @@ def send_message(message, history):
     partial = ""
     idx = 0
     for t in response_generator:
-        if idx <= 5:
+        if idx <= 3:
             idx += 1
             continue
         else:
-            if t != "<|eot_id|>":
-                partial += t
-                yield history + [{"role": "assistant", "content": partial}]
-            else:
-                continue
+            partial += t
+            yield history + [{"role": "assistant", "content": partial}]
 
 
 # Create the dashboard
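
Read together, the two hunks move special-token filtering out of the consumer: with skip_special_tokens=True the streamer never emits markers such as <|eot_id|>, so send_message no longer needs its explicit check, and only the short leading-chunk skip remains (idx <= 3 instead of idx <= 5). The sketch below shows the general streaming pattern this diff relies on; it is a minimal illustration, and the model id, max_new_tokens value, and the stream_reply helper are assumptions rather than code taken from app.py.

# Minimal sketch of streaming generation with TextIteratorStreamer, assuming a
# transformers causal LM already loaded on CUDA; identifiers such as model_id
# and stream_reply are illustrative, not taken from this repository.
from threading import Thread

from transformers import AutoModelForCausalLM, AutoTokenizer, TextIteratorStreamer

model_id = "meta-llama/Meta-Llama-3-8B-Instruct"  # assumed; the model used by app.py is not shown in this diff
tokenizer = AutoTokenizer.from_pretrained(model_id)
model = AutoModelForCausalLM.from_pretrained(model_id).to("cuda")

def stream_reply(prompt):
    input_ids = tokenizer.encode(prompt, return_tensors="pt").to("cuda")
    # skip_special_tokens=True strips markers like <|eot_id|> inside the streamer,
    # so the consuming loop only ever sees plain text chunks.
    streamer = TextIteratorStreamer(tokenizer, skip_prompt=True, skip_special_tokens=True)
    gen_kwargs = {"inputs": input_ids, "streamer": streamer, "max_new_tokens": 256}
    # generate() blocks, so it runs in a background thread while we iterate the streamer.
    Thread(target=model.generate, kwargs=gen_kwargs).start()

    partial = ""
    for chunk in streamer:
        partial += chunk
        yield partial  # a chat callback can wrap this as {"role": "assistant", "content": partial}

With special tokens stripped at the streamer level, the only post-processing left in send_message is skipping the first few chunks, presumably the chat-template header text that skip_prompt does not cover.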