Spaces:
Runtime error
Runtime error
ffreemt
committed on
Commit
·
f073be5
1
Parent(s):
b01b8ee
Adjust queue size
Browse files
app.py
CHANGED
@@ -377,8 +377,8 @@ with gr.Blocks(title="ChatGLM2-6B-int4", theme=gr.themes.Soft(text_size="sm")) a
|
|
377 |
# demo.queue().launch(share=True, inbrowser=True, debug=True)
|
378 |
|
379 |
# concurrency_count > 1 requires more memory, max_size: queue size
|
380 |
-
# T4 medium: 30GB, model size: ~
|
381 |
# leave one for api access
|
382 |
-
# reduce to
|
383 |
|
384 |
-
demo.queue(concurrency_count=
|
|
|
377 |
# demo.queue().launch(share=True, inbrowser=True, debug=True)
|
378 |
|
379 |
# concurrency_count > 1 requires more memory, max_size: queue size
|
380 |
+
# T4 medium: 30GB, model size: ~4G concurrency_count = 6
|
381 |
# leave one for api access
|
382 |
+
# reduce to 5 if OOM occurs too often
|
383 |
|
384 |
+
demo.queue(concurrency_count=6, max_size=30).launch(debug=True)
|