vilarin committed on
Commit
e452aa8
·
verified ·
1 Parent(s): f55597f

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +10 -1
app.py CHANGED
@@ -128,10 +128,19 @@ async def gen_show(script):
128
  def generator(messages):
129
  input_ids = tokenizer.apply_chat_template(
130
  conversation=messages,
 
131
  tokenize=True,
132
  return_tensors='pt'
133
  )
134
- output_ids = model.generate(input_ids.to('cuda'), eos_token_id=tokenizer.eos_token_id)
 
 
 
 
 
 
 
 
135
  results = tokenizer.decode(output_ids[0][input_ids.shape[1]:], skip_special_tokens=True)
136
  return results
137
 
 
128
  def generator(messages):
129
  input_ids = tokenizer.apply_chat_template(
130
  conversation=messages,
131
+ add_generation_prompt=True,
132
  tokenize=True,
133
  return_tensors='pt'
134
  )
135
+
136
+ output_ids = model.generate(
137
+ input_ids.to('cuda'),
138
+ eos_token_id=tokenizer.eos_token_id,
139
+ max_new_tokens=4096,
140
+ temperature=0.5,
141
+ repetition_penalty=1.2,
142
+ )
143
+
144
  results = tokenizer.decode(output_ids[0][input_ids.shape[1]:], skip_special_tokens=True)
145
  return results
146