# melt/fastchat/serve/gradio_web_server_multi.py
# martinakaduc's picture
# Upload folder using huggingface_hub
# f3305db verified
"""
The gradio demo server with multiple tabs.
It supports chatting with a single model or chatting with two models side-by-side.
"""
import argparse
import pickle
import time
import gradio as gr
from fastchat.serve.gradio_block_arena_anony import (
build_side_by_side_ui_anony,
load_demo_side_by_side_anony,
set_global_vars_anony,
)
from fastchat.serve.gradio_block_arena_named import (
build_side_by_side_ui_named,
load_demo_side_by_side_named,
set_global_vars_named,
)
from fastchat.serve.gradio_block_arena_vision import (
build_single_vision_language_model_ui,
)
from fastchat.serve.gradio_block_arena_vision_anony import (
build_side_by_side_vision_ui_anony,
load_demo_side_by_side_vision_anony,
)
from fastchat.serve.gradio_block_arena_vision_named import (
build_side_by_side_vision_ui_named,
)
from fastchat.serve.gradio_web_server import (
set_global_vars,
block_css,
build_single_model_ui,
build_about,
get_model_list,
load_demo_single,
get_ip,
)
from fastchat.serve.monitor.monitor import build_leaderboard_tab
from fastchat.utils import (
build_logger,
get_window_url_params_js,
get_window_url_params_with_tos_js,
alert_js,
parse_gradio_auth_creds,
)
# Module-level logger shared by the functions below and the __main__ script.
# The second argument is presumably the log file name — confirm against
# fastchat.utils.build_logger.
logger = build_logger("gradio_web_server_multi", "gradio_web_server_multi.log")
def load_demo(url_params, request: gr.Request):
    """Compute the component updates applied when the page is loaded.

    Args:
        url_params: Query-string parameters gathered by the page-load
            JavaScript. Only key membership is tested here (presumably a
            dict — confirm against the JS helper in fastchat.utils).
        request: The Gradio request; used to resolve the client IP for the
            log line.

    Returns:
        A tuple starting with a ``gr.Tabs`` update selecting the initial tab,
        followed by the update tuples of the single-model, anonymous
        side-by-side, named side-by-side and vision side-by-side loaders, in
        that order.
    """
    global models, all_models, vl_models, all_vl_models

    ip = get_ip(request)
    logger.info(f"load_demo. ip: {ip}. params: {url_params}")

    # URL key -> tab id, checked in order (first match wins). The ids must
    # match the ``id=`` values given to gr.Tab in build_demo: 0 battle,
    # 2 side-by-side, 3 direct chat, 4 leaderboard, 5 about. There is no tab
    # with id 1, so "compare" targets the side-by-side tab (2) and "vision"
    # targets the battle tab (0), which hosts the vision UI when
    # --vision-arena is enabled.
    tab_routes = (
        ("arena", 0),
        ("vision", 0),
        ("compare", 2),
        ("direct", 3),
        ("model", 3),
        ("leaderboard", 4),
        ("about", 5),
    )
    inner_selected = 0
    for key, tab_id in tab_routes:
        if key in url_params:
            inner_selected = tab_id
            break

    if args.model_list_mode == "reload":
        # Refresh both the text and the vision model lists on every load.
        models, all_models = get_model_list(
            args.controller_url,
            args.register_api_endpoint_file,
            vision_arena=False,
        )
        vl_models, all_vl_models = get_model_list(
            args.controller_url,
            args.register_api_endpoint_file,
            vision_arena=True,
        )

    single_updates = load_demo_single(models, url_params)
    side_by_side_anony_updates = load_demo_side_by_side_anony(all_models, url_params)
    side_by_side_named_updates = load_demo_side_by_side_named(models, url_params)
    side_by_side_vision_anony_updates = load_demo_side_by_side_vision_anony(
        all_models, all_vl_models, url_params
    )

    # NOTE(review): build_demo wires only [tabs] + single + anony + named
    # components as outputs of this handler, while a fourth (vision) group is
    # appended here — confirm the number of returned values matches the
    # number of output components.
    return (
        (gr.Tabs(selected=inner_selected),)
        + single_updates
        + side_by_side_anony_updates
        + side_by_side_named_updates
        + side_by_side_vision_anony_updates
    )
def build_demo(models, vl_models, elo_results_file, leaderboard_table_file):
    """Assemble the multi-tab Gradio Blocks application.

    Args:
        models: Model list handed to the text battle, side-by-side and
            direct-chat tab builders.
        vl_models: Not read inside this function; the vision battle tab uses
            the module-level ``all_models`` / ``all_vl_models`` instead.
        elo_results_file: When truthy, a leaderboard tab is added and built
            from this file.
        leaderboard_table_file: Forwarded to the leaderboard tab builder.

    Returns:
        The constructed ``gr.Blocks`` object.

    Raises:
        ValueError: If ``args.model_list_mode`` is not "once" or "reload".
    """
    # JavaScript run on page load / battle-tab selection; the terms-of-use
    # variant is chosen by the --show-terms-of-use flag.
    load_js = (
        get_window_url_params_with_tos_js
        if args.show_terms_of_use
        else get_window_url_params_js
    )

    head_js = """
<script src="https://cdnjs.cloudflare.com/ajax/libs/html2canvas/1.4.1/html2canvas.min.js"></script>
"""
    if args.ga_id is not None:
        # Append the Google Analytics snippet when an ID was supplied.
        head_js += f"""
<script async src="https://www.googletagmanager.com/gtag/js?id={args.ga_id}"></script>
<script>
window.dataLayer = window.dataLayer || [];
function gtag(){{dataLayer.push(arguments);}}
gtag('js', new Date());
gtag('config', '{args.ga_id}');
window.__gradio_mode__ = "app";
</script>
"""

    with gr.Blocks(
        title="Chat with Open Large Language Models",
        theme=gr.themes.Default(text_size=gr.themes.sizes.text_lg),
        css=block_css,
        head=head_js,
    ) as demo:
        with gr.Tabs() as inner_tabs:
            # Tab 0: battle arena (vision-enabled or text-only).
            with gr.Tab("⚔️ Arena (battle)", id=0) as arena_tab:
                arena_tab.select(None, None, None, js=load_js)
                if args.vision_arena:
                    side_by_side_anony_list = build_side_by_side_vision_ui_anony(
                        all_models,
                        all_vl_models,
                        random_questions=args.random_questions,
                    )
                else:
                    side_by_side_anony_list = build_side_by_side_ui_anony(models)

            # Tab 2: named side-by-side comparison.
            with gr.Tab("⚔️ Arena (side-by-side)", id=2) as side_by_side_tab:
                side_by_side_tab.select(None, None, None, js=alert_js)
                side_by_side_named_list = build_side_by_side_ui_named(models)

            # Tab 3: chat with a single model.
            with gr.Tab("💬 Direct Chat", id=3) as direct_tab:
                direct_tab.select(None, None, None, js=alert_js)
                single_model_list = build_single_model_ui(
                    models, add_promotion_links=True
                )

            # Output components of the page-load handler, in the order the
            # handler returns its updates.
            demo_tabs = [inner_tabs] + single_model_list
            demo_tabs = demo_tabs + side_by_side_anony_list
            demo_tabs = demo_tabs + side_by_side_named_list

            # Tab 4: leaderboard, only when results were provided.
            if elo_results_file:
                with gr.Tab("🏆 Leaderboard", id=4):
                    build_leaderboard_tab(
                        elo_results_file, leaderboard_table_file, show_plot=True
                    )

            # Tab 5: about page.
            with gr.Tab("ℹ️ About Us", id=5):
                build_about()

        # Hidden component that receives the URL parameters from load_js.
        url_params = gr.JSON(visible=False)

        if args.model_list_mode not in ("once", "reload"):
            raise ValueError(f"Unknown model list mode: {args.model_list_mode}")

        demo.load(load_demo, [url_params], demo_tabs, js=load_js)

    return demo
if __name__ == "__main__":
    # ---- Command-line interface -------------------------------------------
    parser = argparse.ArgumentParser()
    parser.add_argument("--host", type=str, default="0.0.0.0")
    parser.add_argument("--port", type=int)
    parser.add_argument(
        "--share",
        action="store_true",
        help="Whether to generate a public, shareable link",
    )
    parser.add_argument(
        "--controller-url",
        default="http://localhost:21001",
        type=str,
        help="The address of the controller",
    )
    parser.add_argument(
        "--concurrency-count",
        default=10,
        type=int,
        help="The concurrency count of the gradio queue",
    )
    parser.add_argument(
        "--model-list-mode",
        default="once",
        choices=["once", "reload"],
        type=str,
        help="Whether to load the model list once or reload the model list every time.",
    )
    parser.add_argument(
        "--moderate",
        action="store_true",
        help="Enable content moderation to block unsafe inputs",
    )
    parser.add_argument(
        "--show-terms-of-use",
        action="store_true",
        help="Shows term of use before loading the demo",
    )
    parser.add_argument(
        "--vision-arena",
        action="store_true",
        help="Show tabs for vision arena.",
    )
    parser.add_argument(
        "--random-questions",
        type=str,
        help="Load random questions from a JSON file",
    )
    parser.add_argument(
        "--register-api-endpoint-file",
        type=str,
        help="Register API-based model endpoints from a JSON file",
    )
    parser.add_argument(
        "--gradio-auth-path",
        default=None,
        type=str,
        help='Set the gradio authentication file path. The file should contain one or more user:password pairs in this format: "u1:p1,u2:p2,u3:p3"',
    )
    parser.add_argument(
        "--elo-results-file",
        type=str,
        help="Load leaderboard results and plots",
    )
    parser.add_argument(
        "--leaderboard-table-file",
        type=str,
        help="Load leaderboard results and plots",
    )
    parser.add_argument(
        "--gradio-root-path",
        type=str,
        help="Sets the gradio root path, eg /abc/def. Useful when running behind a reverse-proxy or at a custom URL path prefix",
    )
    parser.add_argument(
        "--ga-id",
        default=None,
        type=str,
        help="the Google Analytics ID",
    )
    parser.add_argument(
        "--use-remote-storage",
        action="store_true",
        default=False,
        help="Uploads image files to google cloud storage if set to true",
    )
    # NOTE(review): --password is parsed but not read anywhere in the code
    # visible here — confirm whether it is consumed elsewhere.
    parser.add_argument(
        "--password",
        type=str,
        help="Set the password for the gradio web server",
    )
    args = parser.parse_args()
    logger.info(f"args: {args}")

    # ---- Propagate settings to the UI modules -----------------------------
    set_global_vars(args.controller_url, args.moderate, args.use_remote_storage)
    set_global_vars_named(args.moderate)
    set_global_vars_anony(args.moderate)

    # ---- Initial model lists (text first, then vision) --------------------
    models, all_models = get_model_list(
        args.controller_url, args.register_api_endpoint_file, vision_arena=False
    )
    vl_models, all_vl_models = get_model_list(
        args.controller_url, args.register_api_endpoint_file, vision_arena=True
    )

    # ---- Optional authentication credentials ------------------------------
    auth = (
        parse_gradio_auth_creds(args.gradio_auth_path)
        if args.gradio_auth_path is not None
        else None
    )

    # ---- Build the UI and start serving -----------------------------------
    demo = build_demo(
        models, all_vl_models, args.elo_results_file, args.leaderboard_table_file
    )
    demo.queue(
        default_concurrency_limit=args.concurrency_count,
        status_update_rate=10,
        api_open=False,
    ).launch(
        server_name=args.host,
        server_port=args.port,
        share=args.share,
        max_threads=200,
        auth=auth,
        root_path=args.gradio_root_path,
        show_api=False,
    )