diff --git a/llava/serve/gradio_web_server.py b/llava/serve/gradio_web_server.py index e22451bed..8763fddab 100644 --- a/llava/serve/gradio_web_server.py +++ b/llava/serve/gradio_web_server.py @@ -353,7 +353,7 @@ def build_demo(embed_mode): flag_btn = gr.Button(value="⚠ī¸ Flag", interactive=False) #stop_btn = gr.Button(value="⏚ī¸ Stop Generation", interactive=False) regenerate_btn = gr.Button(value="🔄 Regenerate", interactive=False) - clear_btn = gr.Button(value="🗑ī¸ Clear history", interactive=False) + clear_btn = gr.Button(value="🗑ī¸ Clear", interactive=False) if not embed_mode: gr.Markdown(tos_markdown) @@ -397,7 +397,7 @@ def build_demo(embed_mode): parser.add_argument("--host", type=str, default="0.0.0.0") parser.add_argument("--port", type=int) parser.add_argument("--controller-url", type=str, default="http://localhost:21001") - parser.add_argument("--concurrency-count", type=int, default=8) + parser.add_argument("--concurrency-count", type=int, default=10) parser.add_argument("--model-list-mode", type=str, default="once", choices=["once", "reload"]) parser.add_argument("--share", action="store_true") @@ -410,6 +410,11 @@ def build_demo(embed_mode): logger.info(args) demo = build_demo(args.embed) - demo.queue(concurrency_count=args.concurrency_count, status_update_rate=10, - api_open=False).launch( - server_name=args.host, server_port=args.port, share=args.share) + demo.queue( + concurrency_count=args.concurrency_count, + api_open=False + ).launch( + server_name=args.host, + server_port=args.port, + share=args.share + )