Spaces: Running on Zero
Update app.py
Browse files
app.py
CHANGED
|
@@ -35,7 +35,7 @@ def respond(
|
|
| 35 |
messages.append({"role": "user", "content": message})
|
| 36 |
print(messages)
|
| 37 |
inputs = tokenizer.apply_chat_template(messages, return_tensors="pt", add_generation_prompt=True, enable_reasoning=enable_reasoning, return_dict=True).to(device)
|
| 38 |
- generation_kwargs = dict(inputs, streamer=streamer, max_new_tokens=max_tokens, temperature=temperature, repetition_penalty=repetition_penalty
|
| 39 |
thread = Thread(target=model.generate, kwargs=generation_kwargs)
|
| 40 |
|
| 41 |
thread.start()
|
|
|
|
| 35 |
messages.append({"role": "user", "content": message})
|
| 36 |
print(messages)
|
| 37 |
inputs = tokenizer.apply_chat_template(messages, return_tensors="pt", add_generation_prompt=True, enable_reasoning=enable_reasoning, return_dict=True).to(device)
|
| 38 |
+ generation_kwargs = dict(inputs, streamer=streamer, max_new_tokens=max_tokens, temperature=temperature, repetition_penalty=repetition_penalty)
|
| 39 |
thread = Thread(target=model.generate, kwargs=generation_kwargs)
|
| 40 |
|
| 41 |
thread.start()
|