DeepSeek-R1-Qwen-7B

Running on Zero

nikravan committed 3 days ago

Commit

5a07c64

verified ·

1 Parent(s): a259ca0

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -55,7 +55,8 @@ latex_delimiters_set = [{
 def predict(message, history, system_prompt, temperature, max_new_tokens, top_k, repetition_penalty, top_p):
     # Format history with a given chat template
-    #stop_tokens = [tokenizer.eos_token_id]
     instruction = system_prompt + "\n\n"
     for user, assistant in history:
         instruction += f"<｜User｜>{user}<｜Assistant｜>{assistant}\n"
@@ -87,8 +88,8 @@ def predict(message, history, system_prompt, temperature, max_new_tokens, top_k,
     outputs = []
     for new_token in streamer:
         outputs.append(new_token)
-        #if new_token in stop_tokens:
-            #break
         yield "".join(outputs)

 def predict(message, history, system_prompt, temperature, max_new_tokens, top_k, repetition_penalty, top_p):
     # Format history with a given chat template
+    stop_tokens = [tokenizer.eos_token_id]
+    pad_token_id=[tokenizer.eos_token_id] #151643
     instruction = system_prompt + "\n\n"
     for user, assistant in history:
         instruction += f"<｜User｜>{user}<｜Assistant｜>{assistant}\n"
     outputs = []
     for new_token in streamer:
         outputs.append(new_token)
+        if new_token in stop_tokens:
+            break
         yield "".join(outputs)