Spaces:

JetBrains-Research
/

commit-labeling

Sleeping

App Files Community

Petr Tsvetkov committed on Feb 21, 2024

Commit

815e7fc

1 Parent(s): 14bb44e

Display multiple versions of a commit message

Browse files

Files changed (1) hide show

app.py +117 -96

app.py CHANGED Viewed

@@ -4,17 +4,16 @@ import random
 import uuid
 import gradio as gr
-from datasets import load_dataset
 HF_TOKEN = os.environ.get('HF_TOKEN')
 HF_DATASET = os.environ.get('HF_DATASET')
-configuration = "commitchronicle-py-long"  # select a configuration
-dataset = load_dataset("JetBrains-Research/lca-cmg",
-                       configuration,
-                       split="test",
-                       cache_dir="data")
-n_samples = len(dataset)
 saver = gr.HuggingFaceDatasetSaver(HF_TOKEN, HF_DATASET, private=True)
@@ -34,7 +33,7 @@ def convert_diff_to_unified(diff):
 def get_diff2html_view(raw_diff):
     html = f"""
-    <div style='width:100%; height:720px; overflow:auto; position: relative'>
         <div id='diff-raw' hidden>{raw_diff}</div>
         <div class="d2h-view-wrapper">
             <div id='diff-view'></div>
@@ -49,14 +48,19 @@ def update_commit_view(sample_ind):
     if sample_ind >= n_samples:
         return None
-    record = dataset[sample_ind]
     diff_view = get_diff2html_view(convert_diff_to_unified(record['mods']))
-    commit_msg = record['message']
     repo_val = record['repo']
     hash_val = record['hash']
     diff_loaded_timestamp = datetime.now().isoformat()
-    return diff_view, commit_msg, repo_val, hash_val, diff_loaded_timestamp
 def next_sample(current_sample_ind, shuffled_idx):
@@ -91,81 +95,96 @@ with gr.Blocks(theme=gr.themes.Soft(), head=head_html, css="style_overrides.css"
         with gr.Column(scale=2):
             diff_view = gr.HTML()
         with gr.Column(scale=1):
-            commit_msg = gr.Textbox(label="Commit message",
-                                    interactive=False,
-                                    )
-            gr.Markdown("## Please, rate your level of agreement with each statement\n"
-                        "\n"
-                        "*1 - strongly disagree, 2 - disagree, 3 - agree, 4 - strongly agree*")
-            is_correct = gr.Slider(
-                info='The information provided in the commit message is consistent with the code changes.',
-                label='is_correct',
-                show_label=False,
-                minimum=1,
-                step=1,
-                interactive=True,
-                maximum=4)
-            has_what = gr.Slider(
-                info='The commit message answers the question of WHAT changes have been made.',
-                label='has_what',
-                show_label=False,
-                minimum=1,
-                step=1,
-                interactive=True,
-                maximum=4)
-            has_why = gr.Slider(
-                info='The commit message answers the question of WHY these changes have been made.',
-                label='has_why',
-                show_label=False,
-                minimum=1,
-                step=1,
-                interactive=True,
-                maximum=4)
-            is_not_verbose = gr.Slider(
-                info='The commit message can be substantially shortened without loss of important information.',
-                label='is_not_verbose',
-                show_label=False,
-                minimum=1,
-                step=1,
-                interactive=True,
-                maximum=4)
-            has_headline = gr.Slider(
-                info='The commit message includes a short headline that provides a good overview of the changes.',
-                label='has_headline',
-                show_label=False,
-                minimum=1,
-                step=1,
-                interactive=True,
-                maximum=4)
-            easy_to_read = gr.Slider(
-                info='The commit message is easy to read and to understand.',
-                label='easy_to_read',
-                show_label=False,
-                minimum=1,
-                step=1,
-                interactive=True,
-                maximum=4)
-            overall_rating = gr.Slider(
-                info='Please, describe your overall impression of the commit message (1 - very bad, 5 - very good)',
-                label='overall_rating',
-                show_label=False,
-                minimum=1,
-                step=1,
-                interactive=True,
-                maximum=5)
-            comments = gr.Textbox(
-                info='Additional comments on the commit message',
-                label='comments',
-                show_label=False,
-                interactive=True)
             submit_btn = gr.Button("Submit and continue")
             session_val = gr.Textbox(info='Session', interactive=False, container=True, show_label=False,
@@ -181,10 +200,11 @@ with gr.Blocks(theme=gr.themes.Soft(), head=head_html, css="style_overrides.css"
     commit_view = [
         diff_view,
-        commit_msg,
         repo_val,
         hash_val,
-        sample_loaded_timestamp
     ]
     feedback_form = [
@@ -193,14 +213,15 @@ with gr.Blocks(theme=gr.themes.Soft(), head=head_html, css="style_overrides.css"
         hash_val,
         sample_loaded_timestamp,
         sample_submitted_timestamp,
-        is_correct,
-        has_what,
-        has_why,
-        is_not_verbose,
-        has_headline,
-        easy_to_read,
-        overall_rating,
-        comments
     ]
     saver.setup([current_sample_sld] + feedback_form, "feedback")

 import uuid
 import gradio as gr
+from data_loader import load_data
 HF_TOKEN = os.environ.get('HF_TOKEN')
 HF_DATASET = os.environ.get('HF_DATASET')
+data, models = load_data()
+n_samples = len(data)
+n_models = len(models)
 saver = gr.HuggingFaceDatasetSaver(HF_TOKEN, HF_DATASET, private=True)
 def get_diff2html_view(raw_diff):
     html = f"""
+    <div style='width:100%; height:1400px; overflow:auto; position: relative'>
         <div id='diff-raw' hidden>{raw_diff}</div>
         <div class="d2h-view-wrapper">
             <div id='diff-view'></div>
     if sample_ind >= n_samples:
         return None
+    record = data[sample_ind]
     diff_view = get_diff2html_view(convert_diff_to_unified(record['mods']))
     repo_val = record['repo']
     hash_val = record['hash']
     diff_loaded_timestamp = datetime.now().isoformat()
+    models_shuffled = models[:]
+    random.shuffle(models_shuffled)
+    commit_messages = tuple(record[model] for model in models_shuffled)
+    return (diff_view, repo_val, hash_val, diff_loaded_timestamp) + commit_messages + tuple(models_shuffled)
 def next_sample(current_sample_ind, shuffled_idx):
         with gr.Column(scale=2):
             diff_view = gr.HTML()
         with gr.Column(scale=1):
+            commit_msg = []
+            is_correct = []
+            has_what = []
+            has_why = []
+            is_not_verbose = []
+            has_headline = []
+            easy_to_read = []
+            overall_rating = []
+            comments = []
+            model_name = []
+            for model_ind in range(n_models):
+                with gr.Tab(f"Message #{model_ind + 1}"):
+                    commit_msg.append(gr.TextArea(label="Commit message (can be scrollable)",
+                                                  interactive=False,
+                                                  ))
+                    gr.Markdown("## Please, rate your level of agreement with each statement\n"
+                                "\n"
+                                "*1 - strongly disagree, 2 - disagree, 3 - agree, 4 - strongly agree*")
+                    is_correct.append(gr.Slider(
+                        info='The information provided in the commit message is consistent with the code changes.',
+                        label=f'is_correct_{model_ind}',
+                        show_label=False,
+                        minimum=1,
+                        step=1,
+                        interactive=True,
+                        maximum=4))
+                    has_what.append(gr.Slider(
+                        info='The commit message answers the question of WHAT changes have been made.',
+                        label=f'has_what_{model_ind}',
+                        show_label=False,
+                        minimum=1,
+                        step=1,
+                        interactive=True,
+                        maximum=4))
+                    has_why.append(gr.Slider(
+                        info='The commit message answers the question of WHY these changes have been made.',
+                        label=f'has_why_{model_ind}',
+                        show_label=False,
+                        minimum=1,
+                        step=1,
+                        interactive=True,
+                        maximum=4))
+                    is_not_verbose.append(gr.Slider(
+                        info='The commit message can be substantially shortened without loss of important information.',
+                        label=f'is_not_verbose_{model_ind}',
+                        show_label=False,
+                        minimum=1,
+                        step=1,
+                        interactive=True,
+                        maximum=4))
+                    has_headline.append(gr.Slider(
+                        info='The commit message includes a short headline that provides a good overview of the changes.',
+                        label=f'has_headline_{model_ind}',
+                        show_label=False,
+                        minimum=1,
+                        step=1,
+                        interactive=True,
+                        maximum=4))
+                    easy_to_read.append(gr.Slider(
+                        info='The commit message is easy to read and to understand.',
+                        label=f'easy_to_read_{model_ind}',
+                        show_label=False,
+                        minimum=1,
+                        step=1,
+                        interactive=True,
+                        maximum=4))
+                    overall_rating.append(gr.Slider(
+                        info='Please, describe your overall impression of the commit message (1 - very bad, 5 - very good)',
+                        label=f'overall_rating_{model_ind}',
+                        show_label=False,
+                        minimum=1,
+                        step=1,
+                        interactive=True,
+                        maximum=5))
+                    comments.append(gr.Textbox(
+                        info='Additional comments on the commit message',
+                        label=f'comments_{model_ind}',
+                        show_label=False,
+                        interactive=True))
+                    model_name.append(gr.Textbox(interactive=False, label=f'model_{model_ind}', visible=False))
             submit_btn = gr.Button("Submit and continue")
             session_val = gr.Textbox(info='Session', interactive=False, container=True, show_label=False,
     commit_view = [
         diff_view,
         repo_val,
         hash_val,
+        sample_loaded_timestamp,
+        *commit_msg,
+        *model_name
     ]
     feedback_form = [
         hash_val,
         sample_loaded_timestamp,
         sample_submitted_timestamp,
+        *is_correct,
+        *has_what,
+        *has_why,
+        *is_not_verbose,
+        *has_headline,
+        *easy_to_read,
+        *overall_rating,
+        *comments,
+        *model_name
     ]
     saver.setup([current_sample_sld] + feedback_form, "feedback")