Update app.py
Browse files
app.py
CHANGED
@@ -24,9 +24,6 @@ model = torch.compile(model)
|
|
24 |
model = model.eval()
|
25 |
|
26 |
|
27 |
-
|
28 |
-
|
29 |
-
|
30 |
DESCRIPTION = '''
|
31 |
<div>
|
32 |
<h1 style="text-align: center;">网文智能辅助写作 - 珠玑系列模型</h1>
|
@@ -118,11 +115,16 @@ def chat_zhuji(
|
|
118 |
t = Thread(target=model.generate, kwargs=generate_kwargs)
|
119 |
t.start()
|
120 |
|
121 |
-
outputs = []
|
122 |
-
for text in streamer:
|
123 |
-
|
124 |
-
|
125 |
-
|
|
|
|
|
|
|
|
|
|
|
126 |
|
127 |
# Gradio block
|
128 |
chatbot=gr.Chatbot(height=450, placeholder=PLACEHOLDER, label='Gradio ChatInterface')
|
@@ -142,10 +144,10 @@ with gr.Blocks(fill_height=True, css=css) as demo:
|
|
142 |
value=0.95,
|
143 |
label="Temperature",
|
144 |
render=False),
|
145 |
-
gr.Slider(minimum=
|
146 |
maximum=8192*2,
|
147 |
step=1,
|
148 |
-
value=8192
|
149 |
label="Max new tokens",
|
150 |
render=False ),
|
151 |
],
|
|
|
24 |
model = model.eval()
|
25 |
|
26 |
|
|
|
|
|
|
|
27 |
DESCRIPTION = '''
|
28 |
<div>
|
29 |
<h1 style="text-align: center;">网文智能辅助写作 - 珠玑系列模型</h1>
|
|
|
115 |
t = Thread(target=model.generate, kwargs=generate_kwargs)
|
116 |
t.start()
|
117 |
|
118 |
+
#outputs = []
|
119 |
+
#for text in streamer:
|
120 |
+
# outputs.append(text)
|
121 |
+
# yield "".join(outputs)
|
122 |
+
|
123 |
+
partial_message = ""
|
124 |
+
for new_token in streamer:
|
125 |
+
if new_token != '<|observation|>':
|
126 |
+
partial_message += new_token
|
127 |
+
yield partial_message
|
128 |
|
129 |
# Gradio block
|
130 |
chatbot=gr.Chatbot(height=450, placeholder=PLACEHOLDER, label='Gradio ChatInterface')
|
|
|
144 |
value=0.95,
|
145 |
label="Temperature",
|
146 |
render=False),
|
147 |
+
gr.Slider(minimum=128,
|
148 |
maximum=8192*2,
|
149 |
step=1,
|
150 |
+
value=8192,
|
151 |
label="Max new tokens",
|
152 |
render=False ),
|
153 |
],
|