Spaces:
Runtime error
Runtime error
ffreemt
committed on
Commit
•
e92ff33
1
Parent(s):
c885b09
Adjust queue setup
Browse files
app.py
CHANGED
@@ -378,4 +378,9 @@ with gr.Blocks(title="ChatGLM2-6B-int4", theme=gr.themes.Soft(text_size="sm")) a
|
|
378 |
# demo.queue().launch(share=False, inbrowser=True)
|
379 |
# demo.queue().launch(share=True, inbrowser=True, debug=True)
|
380 |
|
381 |
-
|
|
|
|
|
|
|
|
|
|
|
|
378 |
# demo.queue().launch(share=False, inbrowser=True)
|
379 |
# demo.queue().launch(share=True, inbrowser=True, debug=True)
|
380 |
|
381 |
+
# concurrency_count > 1 requires more memory, max_size: queue size
|
382 |
+
# T4 medium: 30GB, model size: ~6G concurrency_count = 3
|
383 |
+
# leave one for api access
|
384 |
+
# reduce to 3 if OOM
|
385 |
+
|
386 |
+
block.queue(concurrency_count=4, max_size=20).launch(debug=True)
|