mikeee committed on
Commit
97f4d75
1 Parent(s): 6ae67ec

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +5 -2
app.py CHANGED
@@ -181,8 +181,11 @@ with gr.Blocks(title="ChatGLM2-6B-int4", theme=gr.themes.Soft(text_size="sm")) a
181
 
182
  with gr.Accordion("Info", open=False):
183
  _ = """
184
- A query takes from 30 seconds to a few tens of seconds, dependent on the number of words/characters
185
- the question and answer contain.
 
 
 
186
 
187
  * Low temperature: responses will be more deterministic and focused; High temperature: responses more creative.
188
 
 
181
 
182
  with gr.Accordion("Info", open=False):
183
  _ = """
184
+ ## ChatGLM2-6B-int4
185
+
186
+ With a GPU, a query takes from a few seconds to a few tens of seconds, dependent on the number of words/characters
187
+ the question and responses contain. The quality of the responses varies quite a bit it seems. Even the same
188
+ question with the same parameters, asked at different times, can result in quite different responses.
189
 
190
  * Low temperature: responses will be more deterministic and focused; High temperature: responses more creative.
191