File size: 5,321 Bytes
50fb808
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
dfac81b
 
50fb808
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
import gradio as gr
import pandas as pd

from themes import Seafoam
from load_data import load_main_table
from constants import BANNER, CITATION_TEXT, css, js_code, all_task_types, js_light

TYPES = ["number", "markdown", "number"]
MAIN_TABLE_COLS = ['Model', 'Language', 'Average Toxicity', 'Expected Maximum Toxicity', 'Empirical Probability']



df_main = load_main_table()
available_models = df_main['Model'].unique()
MODEL_SIZE = list(df_main['Model Size'].unique())
MODEL_TYPE = list(df_main['Model Type'].unique())
LANGAUGES = list(df_main['Language'].unique())
MODEL_FAMILY = list(df_main['Model Family'].unique())


with open("_intro.md", "r") as f:
    INTRO_MD = f.read()

with open("_about_us.md", "r") as f:
    ABOUT_MD = f.read()

with open("_header.md", "r") as f:
    HEADER_MD = f.read()

with open("_metrics.md", "r") as f:
    METRIC_MD = f.read()

    
with gr.Blocks(theme=gr.themes.Soft(), css=css, js=js_light) as demo:
    gr.HTML(BANNER, elem_id="banner")
    # gr.HTML("<img src='file/image.png' alt='image One'>")
    gr.Markdown(HEADER_MD, elem_classes="markdown-text")
    # gr.Image("./data/ptp.png")
    gr.HTML("<img src='file/data/ptp.png' alt='image One'>")
    gr.Markdown(f"**Version**: PTP-Small | **# Examples**: 85K | **# Models**: {len(available_models)}", elem_classes="markdown-text")
    gr.Markdown(METRIC_MD, elem_classes="markdown-text")


    with gr.Tabs(elem_classes="tab-buttons") as tabs:

        with gr.TabItem("๐Ÿ… Multilingual Leaderboard", elem_id="od-benchmark-tab-table", id=0, elem_classes="subtab"):
            print(df_main.head())
            mling_df = df_main.loc[df_main['Multilingual']==True, MAIN_TABLE_COLS].copy()
            del mling_df['Language']
            
            mling_df = mling_df.groupby("Model").agg('mean').reset_index().round(3)
            mling_df = mling_df.sort_values(by="Average Toxicity")

            print(mling_df.head())

            ablation_table = gr.components.Dataframe(
                        value=mling_df,
                        datatype=TYPES,
                        height=1000,
                        elem_id="mling-table",
                        interactive=False,
                        visible=True,
                        min_width=60,
            )


        with gr.TabItem("๐Ÿ“Š Ablation Results", elem_id="od-benchmark-tab-table", id=1, elem_classes="subtab"):
            with gr.Row():
                language = gr.CheckboxGroup(
                    choices=LANGAUGES,
                    value=LANGAUGES,
                    label='Language',
                    interactive=True
                )
            with gr.Row():
                model_family = gr.CheckboxGroup(
                    choices=MODEL_FAMILY,
                    value=MODEL_FAMILY,
                    label='Model Family',
                    interactive=True
                )
                
            with gr.Row():
                model_size = gr.CheckboxGroup(
                    choices=MODEL_SIZE,
                    value=MODEL_SIZE,
                    label='Model Size',
                    interactive=True,
                )
                model_type = gr.CheckboxGroup(
                    choices=MODEL_TYPE,
                    value=MODEL_TYPE,
                    label='Model Type',
                    interactive=True
                )

            ablation_table = gr.components.Dataframe(
                        value=df_main[MAIN_TABLE_COLS],
                        datatype=TYPES,
                        height=500,
                        elem_id="full-table",
                        interactive=False,
                        visible=True,
                        min_width=60,
            )    


            def filter_df(model_size, model_type, language, model_family):
                df = df_main.copy()
                
                print(df.isnull().sum())

                df = df[df['Model Type'].isin(model_type)]
                df = df[df['Model Size'].isin(model_size)]
                df = df[df['Language'].isin(language)]
                df = df[df['Model Family'].isin(model_family)]

                df = df.sort_values(by="Average Toxicity")

                assert (df.isnull().sum().sum())==0


                comp = gr.components.DataFrame(
                    value=df[MAIN_TABLE_COLS],
                    datatype=TYPES,
                    interactive=False,
                    visible=True)
                return comp
            
            for cbox in [model_size, model_type, language, model_family]:
                cbox.change(fn=filter_df, inputs=[model_size, model_type, language, model_family], outputs=ablation_table)


        with gr.TabItem("๐Ÿ“ฎ About Us", elem_id="od-benchmark-tab-table", id=2):
                gr.Markdown(ABOUT_MD, elem_classes="markdown-text")
        
        with gr.Row():
            with gr.Accordion("๐Ÿ“™ Citation", open=False, elem_classes="accordion-label"):
                gr.Textbox(
                    value=CITATION_TEXT, 
                    lines=7,
                    label="Copy the BibTeX snippet to cite this source",
                    elem_id="citation-button",
                    show_copy_button=True)

if __name__ == '__main__':
    demo.launch(share=True, allowed_paths=["."])