Spaces:

kevineen
/

tanuki_annotation_phase2

Sleeping

App Files Community

kevineen committed 19 days ago

Commit

19ee3e1

•

1 Parent(s): 509018d

typo 修正

Browse files

Files changed (2) hide show

app.py +84 -99
run.py +84 -84

app.py CHANGED Viewed

@@ -1,6 +1,3 @@
-import os
-from dotenv import load_dotenv
 import json
 import datetime
 from pathlib import Path
@@ -12,24 +9,12 @@ import pandas as pd
 import gradio as gr
 from datasets import load_dataset
 from huggingface_hub import CommitScheduler
-from huggingface_hub import HfFolder
-# .envファイルから環境変数をロードする(ローカル開発環境)
-load_dotenv()
-# HF_Spaceでプライベート関連にアクセスするための環境変数
-# SecretKey をSpaceのSettingsに設定
-HF_TOKEN = os.getenv("HF_TOKEN")
-if HF_TOKEN:
-    HfFolder.save_token(HF_TOKEN)
-else:
-    print("Warning: HF_TOKEN not found. Please set it in your Space secrets.")
 # HFデータセット アップロード先
 # (切り替えてテストする用に配列)
 OUTPUT_DATASET = [
     "team-hatakeyama-phase2/annotation_tanuki_phase2",
-    "kevineen/Tanuki-Phase2-annotation-dataset",  # 出力テスト
 ]
 # アノテーション対象データセット
@@ -45,10 +30,10 @@ ANNOTATION_DATASET = [
     # "kanhatakeyama/AutoWikiQA",
     # "susumuota/SyntheticTextWikiTranslate-askllm-v1", # Ask-LLM 翻訳
-    # Nomotron データ (将来用
 ]
-MULTITURN_ANNOTATION_DATASET = [
     # マルチターン 未対応
     "kanhatakeyama/AutoMultiTurnByMixtral8x22b",
 ]
@@ -85,8 +70,8 @@ annotated_dataset = gr.State(
         # 5段階評価
         'score': [], # 総合 (5段階評価)
-        'helphulness': [], # 有用性　(5段階評価)
-        'correcthness': [], # 正確さ　(5段階評価)
         'coherence': [], # 一貫性　(5段階評価)
         'complexity': [], # 複雑さ　(5段階評価)
         'verbosity': [], # 冗長性　(5段階評価)
@@ -106,7 +91,7 @@ annotated_dataset = gr.State(
         'threat': [], # 犯罪
         'gun': [], # 重火器
         'controlled_substance': [], # 規制対象物質
-        'climinal_planing': [], # 犯罪計画
         'privacy': [], # 個人情報
         'harassment': [], # ハラスメント
         'profanity': [], # 冒涜
@@ -138,9 +123,9 @@ answer_text_2 = gr.State("")  # answer_2 回答
 # (5段階評価)
 # 0は判断していない、又は判断が難しいという特徴量にする
 score = gr.State(3)  # 総合スコア 初期値は3 (最低限必須)
-helphulness = gr.State(0) # 有用性
-correcthness = gr.State(0) # 正確さ
-coherenece = gr.State(0) # 一貫性
 complexity = gr.State(0) # 複雑さ
 verbosity = gr.State(0) # 冗長性
 humor = gr.State(0) # ユーモア (SteerLM)
@@ -159,7 +144,7 @@ suicide = gr.State(0) # 自殺
 threat = gr.State(0) # 犯罪
 gun = gr.State(0) # 銃・重火器
 controlled_substance = gr.State(0) # 規制対象物質
-climinal_planing = gr.State(0) # 犯罪計画
 privacy = gr.State(0) # 個人情報・プライバシー情報
 harassment = gr.State(0) # ハラスメント
 profanity = gr.State(0) # 冒涜
@@ -330,8 +315,8 @@ def save_annotation(
         is_proofreading_2: bool,
         answer_text_2: str,
         score: int,
-        helphulness: int,
-        correcthness: int,
         coherence: int,
         complexity: int,
         verbosity: int,
@@ -348,7 +333,7 @@ def save_annotation(
         threat: int,
         gun: int,
         controlled_substance: int,
-        climinal_planing: int,
         privacy: int,
         harassment: int,
         profanity: int,
@@ -371,24 +356,24 @@ def save_annotation(
             'is_proofreading_2': [is_proofreading_2],
             'answer_text_2': [answer_text_2],
             'score': [score],
-            'helphullness': [helphulness],
-            'correcthness': [correcthness],
             'complexity': [complexity],
             'verbosity': [verbosity],
             'humor': [humor],
             'creativity': [creativity],
             'appropriate': [appropriate],
-            'following_finstructions': [following_instructions],
             'politeness': [politeness],
             'harmfulness': [harmfulness],
             'hate': [hate],
-            'sextual': [sexual],
             'violence': [violence],
             'suicide': [suicide],
             'threat': [threat],
             'gun': [gun],
             'controlled_substance': [controlled_substance],
-            'climinal_planing': [climinal_planing],
             'privacy': [privacy],
             'harassment': [harassment],
             'profanity': [profanity],
@@ -414,8 +399,8 @@ def save_annotation(
                 "is_proofreading_2": is_proofreading_2,
                 "answer_text_2": answer_text_2,
                 "score": int(score),
-                "helphulness": int(helphulness),
-                "correcthness": int(correcthness),
                 "coherence": int(coherence),
                 "complexity": int(complexity),
                 "verbosity": int(verbosity),
@@ -432,11 +417,11 @@ def save_annotation(
                 "threat": int(threat),
                 "gun": int(gun),
                 "controlled_substance": int(controlled_substance),
-                "climinal_planing": int(climinal_planing),
                 "privacy": int(privacy),
                 "harassment": int(harassment),
                 "profanity": int(profanity),
-                "policital_content": int(political_content),
                 "moral_judgement": int(moral_judgement),
                 "typos": int(typos)
             }
@@ -570,11 +555,11 @@ with gr.Blocks(theme=theme_, css=load_css()) as demo:
                             gr_score_reset = gr.Button("スコアリセット", interactive=False)
                         gr_score_detail = gr.Slider(label="総合スコア　【必須】",value=3, minimum=1, maximum=5, step=1,  interactive=False)
-                        gr_evalannotation_explain = gr.Markdown("詳細アノテーション (5点満点)")
                         with gr.Row() :
-                            gr_helphulness = gr.Slider(label="有用性", minimum=0, value=0, maximum=5, step=1, interactive=False)
-                            gr_correcthness = gr.Slider(label="正確さ", minimum=0, value=0, maximum=5, step=1, interactive=False)
                             gr_coherence = gr.Slider(label="一貫性", minimum=0, value=0, maximum=5, step=1, interactive=False)
                             gr_complexity = gr.Slider(label="複雑さ", minimum=0, value=0, maximum=5, step=1, interactive=False)
@@ -610,7 +595,7 @@ with gr.Blocks(theme=theme_, css=load_css()) as demo:
                         with gr.Row():
                             gr_controlled_substance = gr.Radio(label="規制対象物質", choices=["不明", "有", "無"], value="不明", interactive=False)
-                            gr_climinal_planing = gr.Radio(label="犯罪計画", choices=["不明", "有", "無"], value="不明", interactive=False)
                         with gr.Row():
                             gr_privacy = gr.Radio(label="個人情報", choices=["不明", "有", "無"], value="不明", interactive=False)
@@ -628,9 +613,9 @@ with gr.Blocks(theme=theme_, css=load_css()) as demo:
                 # slicer
                 g_score: int,
-                g_helphulness: int,
-                g_correcthness: int,
-                g_coherenece: int,
                 g_complexity: int,
                 g_verbosity: int,
                 g_humor: int,
@@ -648,7 +633,7 @@ with gr.Blocks(theme=theme_, css=load_css()) as demo:
                 g_threat: str,
                 g_gun: str,
                 g_controlled_substance: str,
-                g_climinal_planing: str,
                 g_privacy: str,
                 g_harassment: str,
                 g_profanity: str,
@@ -671,9 +656,9 @@ with gr.Blocks(theme=theme_, css=load_css()) as demo:
                 # 送信用データ更新
                 score.value = g_score
-                helphulness.value = g_helphulness
-                correcthness.value = g_correcthness
-                coherenece.value = g_coherenece
                 complexity.value = g_complexity
                 verbosity.value = g_verbosity
                 humor.value = g_humor
@@ -690,7 +675,7 @@ with gr.Blocks(theme=theme_, css=load_css()) as demo:
                 threat.value = checkbox_to_int(g_threat)
                 gun.value = checkbox_to_int(g_gun)
                 controlled_substance.value = checkbox_to_int(g_controlled_substance)
-                climinal_planing.value = checkbox_to_int(g_climinal_planing)
                 privacy.value = checkbox_to_int(g_privacy)
                 harassment.value = checkbox_to_int(g_harassment)
                 profanity.value = checkbox_to_int(g_profanity)
@@ -724,9 +709,9 @@ with gr.Blocks(theme=theme_, css=load_css()) as demo:
                     is_proofreading_2.value,
                     answer_text_2.value,
                     score.value,
-                    helphulness.value,
-                    correcthness.value,
-                    coherenece.value,
                     complexity.value,
                     verbosity.value,
                     humor.value,
@@ -742,7 +727,7 @@ with gr.Blocks(theme=theme_, css=load_css()) as demo:
                     threat.value,
                     gun.value,
                     controlled_substance.value,
-                    climinal_planing.value,
                     privacy.value,
                     harassment.value,
                     profanity.value,
@@ -771,8 +756,8 @@ with gr.Blocks(theme=theme_, css=load_css()) as demo:
                 inputs=[
                     gr_answer_text_3_1,
                     gr_score_detail,
-                    gr_helphulness,
-                    gr_correcthness,
                     gr_coherence,
                     gr_complexity,
                     gr_verbosity,
@@ -789,7 +774,7 @@ with gr.Blocks(theme=theme_, css=load_css()) as demo:
                     gr_threat,
                     gr_gun,
                     gr_controlled_substance,
-                    gr_climinal_planing,
                     gr_privacy,
                     gr_harassment,
                     gr_profanity,
@@ -806,8 +791,8 @@ with gr.Blocks(theme=theme_, css=load_css()) as demo:
                     gr_question_text_3_1,
                     gr_answer_text_3_1,
                     gr_score_detail,
-                    gr_helphulness,
-                    gr_correcthness,
                     gr_coherence,
                     gr_complexity,
                     gr_verbosity,
@@ -824,7 +809,7 @@ with gr.Blocks(theme=theme_, css=load_css()) as demo:
                     gr_threat,
                     gr_gun,
                     gr_controlled_substance,
-                    gr_climinal_planing,
                     gr_privacy,
                     gr_harassment,
                     gr_profanity,
@@ -939,9 +924,9 @@ with gr.Blocks(theme=theme_, css=load_css()) as demo:
                     is_proofreading_2.value,
                     answer_text_2.value,
                     score.value,
-                    helphulness.value,
-                    correcthness.value,
-                    coherenece.value,
                     complexity.value,
                     verbosity.value,
                     humor.value,
@@ -957,7 +942,7 @@ with gr.Blocks(theme=theme_, css=load_css()) as demo:
                     threat.value,
                     gun.value,
                     controlled_substance.value,
-                    climinal_planing.value,
                     privacy.value,
                     harassment.value,
                     profanity.value,
@@ -1001,8 +986,8 @@ with gr.Blocks(theme=theme_, css=load_css()) as demo:
                         gr_question_text_3_1,
                         gr_answer_text_3_1,
                         gr_score_detail,
-                        gr_helphulness,
-                        gr_correcthness,
                         gr_coherence,
                         gr_complexity,
                         gr_verbosity,
@@ -1019,7 +1004,7 @@ with gr.Blocks(theme=theme_, css=load_css()) as demo:
                         gr_threat,
                         gr_gun,
                         gr_controlled_substance,
-                        gr_climinal_planing,
                         gr_privacy,
                         gr_harassment,
                         gr_profanity,
@@ -1055,8 +1040,8 @@ with gr.Blocks(theme=theme_, css=load_css()) as demo:
                         gr_question_text_3_1,
                         gr_answer_text_3_1,
                         gr_score_detail,
-                        gr_helphulness,
-                        gr_correcthness,
                         gr_coherence,
                         gr_complexity,
                         gr_verbosity,
@@ -1073,7 +1058,7 @@ with gr.Blocks(theme=theme_, css=load_css()) as demo:
                         gr_threat,
                         gr_gun,
                         gr_controlled_substance,
-                        gr_climinal_planing,
                         gr_privacy,
                         gr_harassment,
                         gr_profanity,
@@ -1109,8 +1094,8 @@ with gr.Blocks(theme=theme_, css=load_css()) as demo:
                         gr_question_text_3_1,
                         gr_answer_text_3_1,
                         gr_score_detail,
-                        gr_helphulness,
-                        gr_correcthness,
                         gr_coherence,
                         gr_complexity,
                         gr_verbosity,
@@ -1127,7 +1112,7 @@ with gr.Blocks(theme=theme_, css=load_css()) as demo:
                         gr_threat,
                         gr_gun,
                         gr_controlled_substance,
-                        gr_climinal_planing,
                         gr_privacy,
                         gr_harassment,
                         gr_profanity,
@@ -1148,8 +1133,8 @@ with gr.Blocks(theme=theme_, css=load_css()) as demo:
                                 gr_question_text_3_1,
                                 gr_answer_text_3_1,
                                 gr_score_detail,
-                                gr_helphulness,
-                                gr_correcthness,
                                 gr_coherence,
                                 gr_complexity,
                                 gr_verbosity,
@@ -1166,7 +1151,7 @@ with gr.Blocks(theme=theme_, css=load_css()) as demo:
                                 gr_threat,
                                 gr_gun,
                                 gr_controlled_substance,
-                                gr_climinal_planing,
                                 gr_privacy,
                                 gr_harassment,
                                 gr_profanity,
@@ -1184,8 +1169,8 @@ with gr.Blocks(theme=theme_, css=load_css()) as demo:
                                 gr_question_text_3_1,
                                 gr_answer_text_3_1,
                                 gr_score_detail,
-                                gr_helphulness,
-                                gr_correcthness,
                                 gr_coherence,
                                 gr_complexity,
                                 gr_verbosity,
@@ -1202,7 +1187,7 @@ with gr.Blocks(theme=theme_, css=load_css()) as demo:
                                 gr_threat,
                                 gr_gun,
                                 gr_controlled_substance,
-                                gr_climinal_planing,
                                 gr_privacy,
                                 gr_harassment,
                                 gr_profanity,
@@ -1220,8 +1205,8 @@ with gr.Blocks(theme=theme_, css=load_css()) as demo:
                                 gr_question_text_3_1,
                                 gr_answer_text_3_1,
                                 gr_score_detail,
-                                gr_helphulness,
-                                gr_correcthness,
                                 gr_coherence,
                                 gr_complexity,
                                 gr_verbosity,
@@ -1238,7 +1223,7 @@ with gr.Blocks(theme=theme_, css=load_css()) as demo:
                                 gr_threat,
                                 gr_gun,
                                 gr_controlled_substance,
-                                gr_climinal_planing,
                                 gr_privacy,
                                 gr_harassment,
                                 gr_profanity,
@@ -1256,8 +1241,8 @@ with gr.Blocks(theme=theme_, css=load_css()) as demo:
                                 gr_question_text_3_1,
                                 gr_answer_text_3_1,
                                 gr_score_detail,
-                                gr_helphulness,
-                                gr_correcthness,
                                 gr_coherence,
                                 gr_complexity,
                                 gr_verbosity,
@@ -1274,7 +1259,7 @@ with gr.Blocks(theme=theme_, css=load_css()) as demo:
                                 gr_threat,
                                 gr_gun,
                                 gr_controlled_substance,
-                                gr_climinal_planing,
                                 gr_privacy,
                                 gr_harassment,
                                 gr_profanity,
@@ -1292,8 +1277,8 @@ with gr.Blocks(theme=theme_, css=load_css()) as demo:
                                 gr_question_text_3_1,
                                 gr_answer_text_3_1,
                                 gr_score_detail,
-                                gr_helphulness,
-                                gr_correcthness,
                                 gr_coherence,
                                 gr_complexity,
                                 gr_verbosity,
@@ -1310,7 +1295,7 @@ with gr.Blocks(theme=theme_, css=load_css()) as demo:
                                 gr_threat,
                                 gr_gun,
                                 gr_controlled_substance,
-                                gr_climinal_planing,
                                 gr_privacy,
                                 gr_harassment,
                                 gr_profanity,
@@ -1323,9 +1308,9 @@ with gr.Blocks(theme=theme_, css=load_css()) as demo:
             def score_reset_display():
                 # gr.State
                 score.value = 3
-                helphulness.value = 0
-                correcthness.value = 0
-                coherenece.value = 0
                 complexity.value = 0
                 verbosity.value = 0
                 humor.value = 0
@@ -1340,8 +1325,8 @@ with gr.Blocks(theme=theme_, css=load_css()) as demo:
                 suicide.value = 0
                 threat.value = 0
                 gun.value = 0
-                controlled_substance.vlaue = 0
-                climinal_planing.value = 0
                 privacy.value = 0
                 harassment.value = 0
                 profanity.value = 0
@@ -1360,8 +1345,8 @@ with gr.Blocks(theme=theme_, css=load_css()) as demo:
                 inputs=[],
                 outputs=[
                     gr_score_detail,
-                    gr_helphulness,
-                    gr_correcthness,
                     gr_coherence,
                     gr_complexity,
                     gr_verbosity,
@@ -1378,7 +1363,7 @@ with gr.Blocks(theme=theme_, css=load_css()) as demo:
                     gr_threat,
                     gr_gun,
                     gr_controlled_substance,
-                    gr_climinal_planing,
                     gr_privacy,
                     gr_harassment,
                     gr_profanity,
@@ -1392,7 +1377,7 @@ with gr.Blocks(theme=theme_, css=load_css()) as demo:
             gr_data_load_btn.click(
                 dataset_load_fn,
                 inputs=None,
-                # textをセットし、intractiveをTrueにする (UI更新)
                 outputs=[
                         gr_question_text_1_1,
                         gr_answer_text_1_1,
@@ -1414,8 +1399,8 @@ with gr.Blocks(theme=theme_, css=load_css()) as demo:
                         gr_submit_score,
                         gr_score_detail,
                         gr_score_reset,
-                        gr_helphulness,
-                        gr_correcthness,
                         gr_coherence,
                         gr_complexity,
                         gr_verbosity,
@@ -1432,7 +1417,7 @@ with gr.Blocks(theme=theme_, css=load_css()) as demo:
                         gr_threat,
                         gr_gun,
                         gr_controlled_substance,
-                        gr_climinal_planing,
                         gr_privacy,
                         gr_harassment,
                         gr_profanity,

 import json
 import datetime
 from pathlib import Path
 import gradio as gr
 from datasets import load_dataset
 from huggingface_hub import CommitScheduler
 # HFデータセット アップロード先
 # (切り替えてテストする用に配列)
 OUTPUT_DATASET = [
     "team-hatakeyama-phase2/annotation_tanuki_phase2",
+    "kevineen/Tanuki-Phase2-annotation-dataset", # 出力テスト
 ]
 # アノテーション対象データセット
     # "kanhatakeyama/AutoWikiQA",
     # "susumuota/SyntheticTextWikiTranslate-askllm-v1", # Ask-LLM 翻訳
+    # Nemotron データ (将来用
 ]
+MULTI_TURN_ANNOTATION_DATASET = [
     # マルチターン 未対応
     "kanhatakeyama/AutoMultiTurnByMixtral8x22b",
 ]
         # 5段階評価
         'score': [], # 総合 (5段階評価)
+        'helpfulness': [], # 有用性　(5段階評価)
+        'correctness': [], # 正確さ　(5段階評価)
         'coherence': [], # 一貫性　(5段階評価)
         'complexity': [], # 複雑さ　(5段階評価)
         'verbosity': [], # 冗長性　(5段階評価)
         'threat': [], # 犯罪
         'gun': [], # 重火器
         'controlled_substance': [], # 規制対象物質
+        'criminal_planing': [], # 犯罪計画
         'privacy': [], # 個人情報
         'harassment': [], # ハラスメント
         'profanity': [], # 冒涜
 # (5段階評価)
 # 0は判断していない、又は判断が難しいという特徴量にする
 score = gr.State(3)  # 総合スコア 初期値は3 (最低限必須)
+helpfulness = gr.State(0) # 有用性
+correctness = gr.State(0) # 正確さ
+coherence = gr.State(0) # 一貫性
 complexity = gr.State(0) # 複雑さ
 verbosity = gr.State(0) # 冗長性
 humor = gr.State(0) # ユーモア (SteerLM)
 threat = gr.State(0) # 犯罪
 gun = gr.State(0) # 銃・重火器
 controlled_substance = gr.State(0) # 規制対象物質
+criminal_planing = gr.State(0) # 犯罪計画
 privacy = gr.State(0) # 個人情報・プライバシー情報
 harassment = gr.State(0) # ハラスメント
 profanity = gr.State(0) # 冒涜
         is_proofreading_2: bool,
         answer_text_2: str,
         score: int,
+        helpfulness: int,
+        correctness: int,
         coherence: int,
         complexity: int,
         verbosity: int,
         threat: int,
         gun: int,
         controlled_substance: int,
+        criminal_planing: int,
         privacy: int,
         harassment: int,
         profanity: int,
             'is_proofreading_2': [is_proofreading_2],
             'answer_text_2': [answer_text_2],
             'score': [score],
+            'helpfulness': [helpfulness],
+            'correctness': [correctness],
             'complexity': [complexity],
             'verbosity': [verbosity],
             'humor': [humor],
             'creativity': [creativity],
             'appropriate': [appropriate],
+            'following_instructions': [following_instructions],
             'politeness': [politeness],
             'harmfulness': [harmfulness],
             'hate': [hate],
+            'sexual': [sexual],
             'violence': [violence],
             'suicide': [suicide],
             'threat': [threat],
             'gun': [gun],
             'controlled_substance': [controlled_substance],
+            'criminal_planing': [criminal_planing],
             'privacy': [privacy],
             'harassment': [harassment],
             'profanity': [profanity],
                 "is_proofreading_2": is_proofreading_2,
                 "answer_text_2": answer_text_2,
                 "score": int(score),
+                "helpfulness": int(helpfulness),
+                "correctness": int(correctness),
                 "coherence": int(coherence),
                 "complexity": int(complexity),
                 "verbosity": int(verbosity),
                 "threat": int(threat),
                 "gun": int(gun),
                 "controlled_substance": int(controlled_substance),
+                "criminal_planing": int(criminal_planing),
                 "privacy": int(privacy),
                 "harassment": int(harassment),
                 "profanity": int(profanity),
+                "political_content": int(political_content),
                 "moral_judgement": int(moral_judgement),
                 "typos": int(typos)
             }
                             gr_score_reset = gr.Button("スコアリセット", interactive=False)
                         gr_score_detail = gr.Slider(label="総合スコア　【必須】",value=3, minimum=1, maximum=5, step=1,  interactive=False)
+                        gr_eval_annotation_explain = gr.Markdown("詳細アノテーション (5点満点)")
                         with gr.Row() :
+                            gr_helpfulness = gr.Slider(label="有用性", minimum=0, value=0, maximum=5, step=1, interactive=False)
+                            gr_correctness = gr.Slider(label="正確さ", minimum=0, value=0, maximum=5, step=1, interactive=False)
                             gr_coherence = gr.Slider(label="一貫性", minimum=0, value=0, maximum=5, step=1, interactive=False)
                             gr_complexity = gr.Slider(label="複雑さ", minimum=0, value=0, maximum=5, step=1, interactive=False)
                         with gr.Row():
                             gr_controlled_substance = gr.Radio(label="規制対象物質", choices=["不明", "有", "無"], value="不明", interactive=False)
+                            gr_criminal_planing = gr.Radio(label="犯罪計画", choices=["不明", "有", "無"], value="不明", interactive=False)
                         with gr.Row():
                             gr_privacy = gr.Radio(label="個人情報", choices=["不明", "有", "無"], value="不明", interactive=False)
                 # slicer
                 g_score: int,
+                g_helpfulness: int,
+                g_correctness: int,
+                g_coherence: int,
                 g_complexity: int,
                 g_verbosity: int,
                 g_humor: int,
                 g_threat: str,
                 g_gun: str,
                 g_controlled_substance: str,
+                g_criminal_planing: str,
                 g_privacy: str,
                 g_harassment: str,
                 g_profanity: str,
                 # 送信用データ更新
                 score.value = g_score
+                helpfulness.value = g_helpfulness
+                correctness.value = g_correctness
+                coherence.value = g_coherence
                 complexity.value = g_complexity
                 verbosity.value = g_verbosity
                 humor.value = g_humor
                 threat.value = checkbox_to_int(g_threat)
                 gun.value = checkbox_to_int(g_gun)
                 controlled_substance.value = checkbox_to_int(g_controlled_substance)
+                criminal_planing.value = checkbox_to_int(g_criminal_planing)
                 privacy.value = checkbox_to_int(g_privacy)
                 harassment.value = checkbox_to_int(g_harassment)
                 profanity.value = checkbox_to_int(g_profanity)
                     is_proofreading_2.value,
                     answer_text_2.value,
                     score.value,
+                    helpfulness.value,
+                    correctness.value,
+                    coherence.value,
                     complexity.value,
                     verbosity.value,
                     humor.value,
                     threat.value,
                     gun.value,
                     controlled_substance.value,
+                    criminal_planing.value,
                     privacy.value,
                     harassment.value,
                     profanity.value,
                 inputs=[
                     gr_answer_text_3_1,
                     gr_score_detail,
+                    gr_helpfulness,
+                    gr_correctness,
                     gr_coherence,
                     gr_complexity,
                     gr_verbosity,
                     gr_threat,
                     gr_gun,
                     gr_controlled_substance,
+                    gr_criminal_planing,
                     gr_privacy,
                     gr_harassment,
                     gr_profanity,
                     gr_question_text_3_1,
                     gr_answer_text_3_1,
                     gr_score_detail,
+                    gr_helpfulness,
+                    gr_correctness,
                     gr_coherence,
                     gr_complexity,
                     gr_verbosity,
                     gr_threat,
                     gr_gun,
                     gr_controlled_substance,
+                    gr_criminal_planing,
                     gr_privacy,
                     gr_harassment,
                     gr_profanity,
                     is_proofreading_2.value,
                     answer_text_2.value,
                     score.value,
+                    helpfulness.value,
+                    correctness.value,
+                    coherence.value,
                     complexity.value,
                     verbosity.value,
                     humor.value,
                     threat.value,
                     gun.value,
                     controlled_substance.value,
+                    criminal_planing.value,
                     privacy.value,
                     harassment.value,
                     profanity.value,
                         gr_question_text_3_1,
                         gr_answer_text_3_1,
                         gr_score_detail,
+                        gr_helpfulness,
+                        gr_correctness,
                         gr_coherence,
                         gr_complexity,
                         gr_verbosity,
                         gr_threat,
                         gr_gun,
                         gr_controlled_substance,
+                        gr_criminal_planing,
                         gr_privacy,
                         gr_harassment,
                         gr_profanity,
                         gr_question_text_3_1,
                         gr_answer_text_3_1,
                         gr_score_detail,
+                        gr_helpfulness,
+                        gr_correctness,
                         gr_coherence,
                         gr_complexity,
                         gr_verbosity,
                         gr_threat,
                         gr_gun,
                         gr_controlled_substance,
+                        gr_criminal_planing,
                         gr_privacy,
                         gr_harassment,
                         gr_profanity,
                         gr_question_text_3_1,
                         gr_answer_text_3_1,
                         gr_score_detail,
+                        gr_helpfulness,
+                        gr_correctness,
                         gr_coherence,
                         gr_complexity,
                         gr_verbosity,
                         gr_threat,
                         gr_gun,
                         gr_controlled_substance,
+                        gr_criminal_planing,
                         gr_privacy,
                         gr_harassment,
                         gr_profanity,
                                 gr_question_text_3_1,
                                 gr_answer_text_3_1,
                                 gr_score_detail,
+                                gr_helpfulness,
+                                gr_correctness,
                                 gr_coherence,
                                 gr_complexity,
                                 gr_verbosity,
                                 gr_threat,
                                 gr_gun,
                                 gr_controlled_substance,
+                                gr_criminal_planing,
                                 gr_privacy,
                                 gr_harassment,
                                 gr_profanity,
                                 gr_question_text_3_1,
                                 gr_answer_text_3_1,
                                 gr_score_detail,
+                                gr_helpfulness,
+                                gr_correctness,
                                 gr_coherence,
                                 gr_complexity,
                                 gr_verbosity,
                                 gr_threat,
                                 gr_gun,
                                 gr_controlled_substance,
+                                gr_criminal_planing,
                                 gr_privacy,
                                 gr_harassment,
                                 gr_profanity,
                                 gr_question_text_3_1,
                                 gr_answer_text_3_1,
                                 gr_score_detail,
+                                gr_helpfulness,
+                                gr_correctness,
                                 gr_coherence,
                                 gr_complexity,
                                 gr_verbosity,
                                 gr_threat,
                                 gr_gun,
                                 gr_controlled_substance,
+                                gr_criminal_planing,
                                 gr_privacy,
                                 gr_harassment,
                                 gr_profanity,
                                 gr_question_text_3_1,
                                 gr_answer_text_3_1,
                                 gr_score_detail,
+                                gr_helpfulness,
+                                gr_correctness,
                                 gr_coherence,
                                 gr_complexity,
                                 gr_verbosity,
                                 gr_threat,
                                 gr_gun,
                                 gr_controlled_substance,
+                                gr_criminal_planing,
                                 gr_privacy,
                                 gr_harassment,
                                 gr_profanity,
                                 gr_question_text_3_1,
                                 gr_answer_text_3_1,
                                 gr_score_detail,
+                                gr_helpfulness,
+                                gr_correctness,
                                 gr_coherence,
                                 gr_complexity,
                                 gr_verbosity,
                                 gr_threat,
                                 gr_gun,
                                 gr_controlled_substance,
+                                gr_criminal_planing,
                                 gr_privacy,
                                 gr_harassment,
                                 gr_profanity,
             def score_reset_display():
                 # gr.State
                 score.value = 3
+                helpfulness.value = 0
+                correctness.value = 0
+                coherence.value = 0
                 complexity.value = 0
                 verbosity.value = 0
                 humor.value = 0
                 suicide.value = 0
                 threat.value = 0
                 gun.value = 0
+                controlled_substance.value = 0
+                criminal_planing.value = 0
                 privacy.value = 0
                 harassment.value = 0
                 profanity.value = 0
                 inputs=[],
                 outputs=[
                     gr_score_detail,
+                    gr_helpfulness,
+                    gr_correctness,
                     gr_coherence,
                     gr_complexity,
                     gr_verbosity,
                     gr_threat,
                     gr_gun,
                     gr_controlled_substance,
+                    gr_criminal_planing,
                     gr_privacy,
                     gr_harassment,
                     gr_profanity,
             gr_data_load_btn.click(
                 dataset_load_fn,
                 inputs=None,
+                # textをセットし、interactiveをTrueにする (UI更新)
                 outputs=[
                         gr_question_text_1_1,
                         gr_answer_text_1_1,
                         gr_submit_score,
                         gr_score_detail,
                         gr_score_reset,
+                        gr_helpfulness,
+                        gr_correctness,
                         gr_coherence,
                         gr_complexity,
                         gr_verbosity,
                         gr_threat,
                         gr_gun,
                         gr_controlled_substance,
+                        gr_criminal_planing,
                         gr_privacy,
                         gr_harassment,
                         gr_profanity,

run.py CHANGED Viewed

@@ -31,7 +31,7 @@ else:
 # (切り替えてテストする用に配列)
 OUTPUT_DATASET = [
     "team-hatakeyama-phase2/annotation_tanuki_phase2",
-    "kevineen/Tanuki-Phase2-annotation-dataset",  # 出力テスト
 ]
 # アノテーション対象データセット
@@ -47,10 +47,10 @@ ANNOTATION_DATASET = [
     # "kanhatakeyama/AutoWikiQA",
     # "susumuota/SyntheticTextWikiTranslate-askllm-v1", # Ask-LLM 翻訳
-    # Nomotron データ (将来用
 ]
-MULTITURN_ANNOTATION_DATASET = [
     # マルチターン 未対応
     "kanhatakeyama/AutoMultiTurnByMixtral8x22b",
 ]
@@ -87,8 +87,8 @@ annotated_dataset = gr.State(
         # 5段階評価
         'score': [], # 総合 (5段階評価)
-        'helphulness': [], # 有用性　(5段階評価)
-        'correcthness': [], # 正確さ　(5段階評価)
         'coherence': [], # 一貫性　(5段階評価)
         'complexity': [], # 複雑さ　(5段階評価)
         'verbosity': [], # 冗長性　(5段階評価)
@@ -108,7 +108,7 @@ annotated_dataset = gr.State(
         'threat': [], # 犯罪
         'gun': [], # 重火器
         'controlled_substance': [], # 規制対象物質
-        'climinal_planing': [], # 犯罪計画
         'privacy': [], # 個人情報
         'harassment': [], # ハラスメント
         'profanity': [], # 冒涜
@@ -140,9 +140,9 @@ answer_text_2 = gr.State("")  # answer_2 回答
 # (5段階評価)
 # 0は判断していない、又は判断が難しいという特徴量にする
 score = gr.State(3)  # 総合スコア 初期値は3 (最低限必須)
-helphulness = gr.State(0) # 有用性
-correcthness = gr.State(0) # 正確さ
-coherenece = gr.State(0) # 一貫性
 complexity = gr.State(0) # 複雑さ
 verbosity = gr.State(0) # 冗長性
 humor = gr.State(0) # ユーモア (SteerLM)
@@ -161,7 +161,7 @@ suicide = gr.State(0) # 自殺
 threat = gr.State(0) # 犯罪
 gun = gr.State(0) # 銃・重火器
 controlled_substance = gr.State(0) # 規制対象物質
-climinal_planing = gr.State(0) # 犯罪計画
 privacy = gr.State(0) # 個人情報・プライバシー情報
 harassment = gr.State(0) # ハラスメント
 profanity = gr.State(0) # 冒涜
@@ -332,8 +332,8 @@ def save_annotation(
         is_proofreading_2: bool,
         answer_text_2: str,
         score: int,
-        helphulness: int,
-        correcthness: int,
         coherence: int,
         complexity: int,
         verbosity: int,
@@ -350,7 +350,7 @@ def save_annotation(
         threat: int,
         gun: int,
         controlled_substance: int,
-        climinal_planing: int,
         privacy: int,
         harassment: int,
         profanity: int,
@@ -373,24 +373,24 @@ def save_annotation(
             'is_proofreading_2': [is_proofreading_2],
             'answer_text_2': [answer_text_2],
             'score': [score],
-            'helphullness': [helphulness],
-            'correcthness': [correcthness],
             'complexity': [complexity],
             'verbosity': [verbosity],
             'humor': [humor],
             'creativity': [creativity],
             'appropriate': [appropriate],
-            'following_finstructions': [following_instructions],
             'politeness': [politeness],
             'harmfulness': [harmfulness],
             'hate': [hate],
-            'sextual': [sexual],
             'violence': [violence],
             'suicide': [suicide],
             'threat': [threat],
             'gun': [gun],
             'controlled_substance': [controlled_substance],
-            'climinal_planing': [climinal_planing],
             'privacy': [privacy],
             'harassment': [harassment],
             'profanity': [profanity],
@@ -416,8 +416,8 @@ def save_annotation(
                 "is_proofreading_2": is_proofreading_2,
                 "answer_text_2": answer_text_2,
                 "score": int(score),
-                "helphulness": int(helphulness),
-                "correcthness": int(correcthness),
                 "coherence": int(coherence),
                 "complexity": int(complexity),
                 "verbosity": int(verbosity),
@@ -434,11 +434,11 @@ def save_annotation(
                 "threat": int(threat),
                 "gun": int(gun),
                 "controlled_substance": int(controlled_substance),
-                "climinal_planing": int(climinal_planing),
                 "privacy": int(privacy),
                 "harassment": int(harassment),
                 "profanity": int(profanity),
-                "policital_content": int(political_content),
                 "moral_judgement": int(moral_judgement),
                 "typos": int(typos)
             }
@@ -572,11 +572,11 @@ with gr.Blocks(theme=theme_, css=load_css()) as demo:
                             gr_score_reset = gr.Button("スコアリセット", interactive=False)
                         gr_score_detail = gr.Slider(label="総合スコア　【必須】",value=3, minimum=1, maximum=5, step=1,  interactive=False)
-                        gr_evalannotation_explain = gr.Markdown("詳細アノテーション (5点満点)")
                         with gr.Row() :
-                            gr_helphulness = gr.Slider(label="有用性", minimum=0, value=0, maximum=5, step=1, interactive=False)
-                            gr_correcthness = gr.Slider(label="正確さ", minimum=0, value=0, maximum=5, step=1, interactive=False)
                             gr_coherence = gr.Slider(label="一貫性", minimum=0, value=0, maximum=5, step=1, interactive=False)
                             gr_complexity = gr.Slider(label="複雑さ", minimum=0, value=0, maximum=5, step=1, interactive=False)
@@ -612,7 +612,7 @@ with gr.Blocks(theme=theme_, css=load_css()) as demo:
                         with gr.Row():
                             gr_controlled_substance = gr.Radio(label="規制対象物質", choices=["不明", "有", "無"], value="不明", interactive=False)
-                            gr_climinal_planing = gr.Radio(label="犯罪計画", choices=["不明", "有", "無"], value="不明", interactive=False)
                         with gr.Row():
                             gr_privacy = gr.Radio(label="個人情報", choices=["不明", "有", "無"], value="不明", interactive=False)
@@ -630,9 +630,9 @@ with gr.Blocks(theme=theme_, css=load_css()) as demo:
                 # slider
                 g_score: int,
-                g_helphulness: int,
-                g_correcthness: int,
-                g_coherenece: int,
                 g_complexity: int,
                 g_verbosity: int,
                 g_humor: int,
@@ -650,7 +650,7 @@ with gr.Blocks(theme=theme_, css=load_css()) as demo:
                 g_threat: str,
                 g_gun: str,
                 g_controlled_substance: str,
-                g_climinal_planing: str,
                 g_privacy: str,
                 g_harassment: str,
                 g_profanity: str,
@@ -673,9 +673,9 @@ with gr.Blocks(theme=theme_, css=load_css()) as demo:
                 # 送信用データ更新
                 score.value = g_score
-                helphulness.value = g_helphulness
-                correcthness.value = g_correcthness
-                coherenece.value = g_coherenece
                 complexity.value = g_complexity
                 verbosity.value = g_verbosity
                 humor.value = g_humor
@@ -692,7 +692,7 @@ with gr.Blocks(theme=theme_, css=load_css()) as demo:
                 threat.value = checkbox_to_int(g_threat)
                 gun.value = checkbox_to_int(g_gun)
                 controlled_substance.value = checkbox_to_int(g_controlled_substance)
-                climinal_planing.value = checkbox_to_int(g_climinal_planing)
                 privacy.value = checkbox_to_int(g_privacy)
                 harassment.value = checkbox_to_int(g_harassment)
                 profanity.value = checkbox_to_int(g_profanity)
@@ -726,9 +726,9 @@ with gr.Blocks(theme=theme_, css=load_css()) as demo:
                     is_proofreading_2.value,
                     answer_text_2.value,
                     score.value,
-                    helphulness.value,
-                    correcthness.value,
-                    coherenece.value,
                     complexity.value,
                     verbosity.value,
                     humor.value,
@@ -744,7 +744,7 @@ with gr.Blocks(theme=theme_, css=load_css()) as demo:
                     threat.value,
                     gun.value,
                     controlled_substance.value,
-                    climinal_planing.value,
                     privacy.value,
                     harassment.value,
                     profanity.value,
@@ -773,8 +773,8 @@ with gr.Blocks(theme=theme_, css=load_css()) as demo:
                 inputs=[
                     gr_answer_text_3_1,
                     gr_score_detail,
-                    gr_helphulness,
-                    gr_correcthness,
                     gr_coherence,
                     gr_complexity,
                     gr_verbosity,
@@ -791,7 +791,7 @@ with gr.Blocks(theme=theme_, css=load_css()) as demo:
                     gr_threat,
                     gr_gun,
                     gr_controlled_substance,
-                    gr_climinal_planing,
                     gr_privacy,
                     gr_harassment,
                     gr_profanity,
@@ -808,8 +808,8 @@ with gr.Blocks(theme=theme_, css=load_css()) as demo:
                     gr_question_text_3_1,
                     gr_answer_text_3_1,
                     gr_score_detail,
-                    gr_helphulness,
-                    gr_correcthness,
                     gr_coherence,
                     gr_complexity,
                     gr_verbosity,
@@ -826,7 +826,7 @@ with gr.Blocks(theme=theme_, css=load_css()) as demo:
                     gr_threat,
                     gr_gun,
                     gr_controlled_substance,
-                    gr_climinal_planing,
                     gr_privacy,
                     gr_harassment,
                     gr_profanity,
@@ -941,9 +941,9 @@ with gr.Blocks(theme=theme_, css=load_css()) as demo:
                     is_proofreading_2.value,
                     answer_text_2.value,
                     score.value,
-                    helphulness.value,
-                    correcthness.value,
-                    coherenece.value,
                     complexity.value,
                     verbosity.value,
                     humor.value,
@@ -959,7 +959,7 @@ with gr.Blocks(theme=theme_, css=load_css()) as demo:
                     threat.value,
                     gun.value,
                     controlled_substance.value,
-                    climinal_planing.value,
                     privacy.value,
                     harassment.value,
                     profanity.value,
@@ -1003,8 +1003,8 @@ with gr.Blocks(theme=theme_, css=load_css()) as demo:
                         gr_question_text_3_1,
                         gr_answer_text_3_1,
                         gr_score_detail,
-                        gr_helphulness,
-                        gr_correcthness,
                         gr_coherence,
                         gr_complexity,
                         gr_verbosity,
@@ -1021,7 +1021,7 @@ with gr.Blocks(theme=theme_, css=load_css()) as demo:
                         gr_threat,
                         gr_gun,
                         gr_controlled_substance,
-                        gr_climinal_planing,
                         gr_privacy,
                         gr_harassment,
                         gr_profanity,
@@ -1057,8 +1057,8 @@ with gr.Blocks(theme=theme_, css=load_css()) as demo:
                         gr_question_text_3_1,
                         gr_answer_text_3_1,
                         gr_score_detail,
-                        gr_helphulness,
-                        gr_correcthness,
                         gr_coherence,
                         gr_complexity,
                         gr_verbosity,
@@ -1075,7 +1075,7 @@ with gr.Blocks(theme=theme_, css=load_css()) as demo:
                         gr_threat,
                         gr_gun,
                         gr_controlled_substance,
-                        gr_climinal_planing,
                         gr_privacy,
                         gr_harassment,
                         gr_profanity,
@@ -1111,8 +1111,8 @@ with gr.Blocks(theme=theme_, css=load_css()) as demo:
                         gr_question_text_3_1,
                         gr_answer_text_3_1,
                         gr_score_detail,
-                        gr_helphulness,
-                        gr_correcthness,
                         gr_coherence,
                         gr_complexity,
                         gr_verbosity,
@@ -1129,7 +1129,7 @@ with gr.Blocks(theme=theme_, css=load_css()) as demo:
                         gr_threat,
                         gr_gun,
                         gr_controlled_substance,
-                        gr_climinal_planing,
                         gr_privacy,
                         gr_harassment,
                         gr_profanity,
@@ -1150,8 +1150,8 @@ with gr.Blocks(theme=theme_, css=load_css()) as demo:
                                 gr_question_text_3_1,
                                 gr_answer_text_3_1,
                                 gr_score_detail,
-                                gr_helphulness,
-                                gr_correcthness,
                                 gr_coherence,
                                 gr_complexity,
                                 gr_verbosity,
@@ -1168,7 +1168,7 @@ with gr.Blocks(theme=theme_, css=load_css()) as demo:
                                 gr_threat,
                                 gr_gun,
                                 gr_controlled_substance,
-                                gr_climinal_planing,
                                 gr_privacy,
                                 gr_harassment,
                                 gr_profanity,
@@ -1186,8 +1186,8 @@ with gr.Blocks(theme=theme_, css=load_css()) as demo:
                                 gr_question_text_3_1,
                                 gr_answer_text_3_1,
                                 gr_score_detail,
-                                gr_helphulness,
-                                gr_correcthness,
                                 gr_coherence,
                                 gr_complexity,
                                 gr_verbosity,
@@ -1204,7 +1204,7 @@ with gr.Blocks(theme=theme_, css=load_css()) as demo:
                                 gr_threat,
                                 gr_gun,
                                 gr_controlled_substance,
-                                gr_climinal_planing,
                                 gr_privacy,
                                 gr_harassment,
                                 gr_profanity,
@@ -1222,8 +1222,8 @@ with gr.Blocks(theme=theme_, css=load_css()) as demo:
                                 gr_question_text_3_1,
                                 gr_answer_text_3_1,
                                 gr_score_detail,
-                                gr_helphulness,
-                                gr_correcthness,
                                 gr_coherence,
                                 gr_complexity,
                                 gr_verbosity,
@@ -1240,7 +1240,7 @@ with gr.Blocks(theme=theme_, css=load_css()) as demo:
                                 gr_threat,
                                 gr_gun,
                                 gr_controlled_substance,
-                                gr_climinal_planing,
                                 gr_privacy,
                                 gr_harassment,
                                 gr_profanity,
@@ -1258,8 +1258,8 @@ with gr.Blocks(theme=theme_, css=load_css()) as demo:
                                 gr_question_text_3_1,
                                 gr_answer_text_3_1,
                                 gr_score_detail,
-                                gr_helphulness,
-                                gr_correcthness,
                                 gr_coherence,
                                 gr_complexity,
                                 gr_verbosity,
@@ -1276,7 +1276,7 @@ with gr.Blocks(theme=theme_, css=load_css()) as demo:
                                 gr_threat,
                                 gr_gun,
                                 gr_controlled_substance,
-                                gr_climinal_planing,
                                 gr_privacy,
                                 gr_harassment,
                                 gr_profanity,
@@ -1294,8 +1294,8 @@ with gr.Blocks(theme=theme_, css=load_css()) as demo:
                                 gr_question_text_3_1,
                                 gr_answer_text_3_1,
                                 gr_score_detail,
-                                gr_helphulness,
-                                gr_correcthness,
                                 gr_coherence,
                                 gr_complexity,
                                 gr_verbosity,
@@ -1312,7 +1312,7 @@ with gr.Blocks(theme=theme_, css=load_css()) as demo:
                                 gr_threat,
                                 gr_gun,
                                 gr_controlled_substance,
-                                gr_climinal_planing,
                                 gr_privacy,
                                 gr_harassment,
                                 gr_profanity,
@@ -1325,9 +1325,9 @@ with gr.Blocks(theme=theme_, css=load_css()) as demo:
             def score_reset_display():
                 # gr.State
                 score.value = 3
-                helphulness.value = 0
-                correcthness.value = 0
-                coherenece.value = 0
                 complexity.value = 0
                 verbosity.value = 0
                 humor.value = 0
@@ -1342,8 +1342,8 @@ with gr.Blocks(theme=theme_, css=load_css()) as demo:
                 suicide.value = 0
                 threat.value = 0
                 gun.value = 0
-                controlled_substance.vlaue = 0
-                climinal_planing.value = 0
                 privacy.value = 0
                 harassment.value = 0
                 profanity.value = 0
@@ -1362,8 +1362,8 @@ with gr.Blocks(theme=theme_, css=load_css()) as demo:
                 inputs=[],
                 outputs=[
                     gr_score_detail,
-                    gr_helphulness,
-                    gr_correcthness,
                     gr_coherence,
                     gr_complexity,
                     gr_verbosity,
@@ -1380,7 +1380,7 @@ with gr.Blocks(theme=theme_, css=load_css()) as demo:
                     gr_threat,
                     gr_gun,
                     gr_controlled_substance,
-                    gr_climinal_planing,
                     gr_privacy,
                     gr_harassment,
                     gr_profanity,
@@ -1394,7 +1394,7 @@ with gr.Blocks(theme=theme_, css=load_css()) as demo:
             gr_data_load_btn.click(
                 dataset_load_fn,
                 inputs=None,
-                # textをセットし、intractiveをTrueにする (UI更新)
                 outputs=[
                         gr_question_text_1_1,
                         gr_answer_text_1_1,
@@ -1416,8 +1416,8 @@ with gr.Blocks(theme=theme_, css=load_css()) as demo:
                         gr_submit_score,
                         gr_score_detail,
                         gr_score_reset,
-                        gr_helphulness,
-                        gr_correcthness,
                         gr_coherence,
                         gr_complexity,
                         gr_verbosity,
@@ -1434,7 +1434,7 @@ with gr.Blocks(theme=theme_, css=load_css()) as demo:
                         gr_threat,
                         gr_gun,
                         gr_controlled_substance,
-                        gr_climinal_planing,
                         gr_privacy,
                         gr_harassment,
                         gr_profanity,

 # (切り替えてテストする用に配列)
 OUTPUT_DATASET = [
     "team-hatakeyama-phase2/annotation_tanuki_phase2",
+    "kevineen/Tanuki-Phase2-annotation-dataset", # 出力テスト
 ]
 # アノテーション対象データセット
     # "kanhatakeyama/AutoWikiQA",
     # "susumuota/SyntheticTextWikiTranslate-askllm-v1", # Ask-LLM 翻訳
+    # Nemotron データ (将来用)
 ]
+MULTI_TURN_ANNOTATION_DATASET = [
     # マルチターン 未対応
     "kanhatakeyama/AutoMultiTurnByMixtral8x22b",
 ]
         # 5段階評価
         'score': [], # 総合 (5段階評価)
+        'helpfulness': [], # 有用性　(5段階評価)
+        'correctness': [], # 正確さ　(5段階評価)
         'coherence': [], # 一貫性　(5段階評価)
         'complexity': [], # 複雑さ　(5段階評価)
         'verbosity': [], # 冗長性　(5段階評価)
         'threat': [], # 犯罪
         'gun': [], # 重火器
         'controlled_substance': [], # 規制対象物質
+        'criminal_planing': [], # 犯罪計画
         'privacy': [], # 個人情報
         'harassment': [], # ハラスメント
         'profanity': [], # 冒涜
 # (5段階評価)
 # 0は判断していない、又は判断が難しいという特徴量にする
 score = gr.State(3)  # 総合スコア 初期値は3 (最低限必須)
+helpfulness = gr.State(0) # 有用性
+correctness = gr.State(0) # 正確さ
+coherence = gr.State(0) # 一貫性
 complexity = gr.State(0) # 複雑さ
 verbosity = gr.State(0) # 冗長性
 humor = gr.State(0) # ユーモア (SteerLM)
 threat = gr.State(0) # 犯罪
 gun = gr.State(0) # 銃・重火器
 controlled_substance = gr.State(0) # 規制対象物質
+criminal_planing = gr.State(0) # 犯罪計画
 privacy = gr.State(0) # 個人情報・プライバシー情報
 harassment = gr.State(0) # ハラスメント
 profanity = gr.State(0) # 冒涜
         is_proofreading_2: bool,
         answer_text_2: str,
         score: int,
+        helpfulness: int,
+        correctness: int,
         coherence: int,
         complexity: int,
         verbosity: int,
         threat: int,
         gun: int,
         controlled_substance: int,
+        criminal_planing: int,
         privacy: int,
         harassment: int,
         profanity: int,
             'is_proofreading_2': [is_proofreading_2],
             'answer_text_2': [answer_text_2],
             'score': [score],
+            'helpfulness': [helpfulness],
+            'correctness': [correctness],
             'complexity': [complexity],
             'verbosity': [verbosity],
             'humor': [humor],
             'creativity': [creativity],
             'appropriate': [appropriate],
+            'following_instructions': [following_instructions],
             'politeness': [politeness],
             'harmfulness': [harmfulness],
             'hate': [hate],
+            'sexual': [sexual],
             'violence': [violence],
             'suicide': [suicide],
             'threat': [threat],
             'gun': [gun],
             'controlled_substance': [controlled_substance],
+            'criminal_planing': [criminal_planing],
             'privacy': [privacy],
             'harassment': [harassment],
             'profanity': [profanity],
                 "is_proofreading_2": is_proofreading_2,
                 "answer_text_2": answer_text_2,
                 "score": int(score),
+                "helpfulness": int(helpfulness),
+                "correctness": int(correctness),
                 "coherence": int(coherence),
                 "complexity": int(complexity),
                 "verbosity": int(verbosity),
                 "threat": int(threat),
                 "gun": int(gun),
                 "controlled_substance": int(controlled_substance),
+                "criminal_planing": int(criminal_planing),
                 "privacy": int(privacy),
                 "harassment": int(harassment),
                 "profanity": int(profanity),
+                "political_content": int(political_content),
                 "moral_judgement": int(moral_judgement),
                 "typos": int(typos)
             }
                             gr_score_reset = gr.Button("スコアリセット", interactive=False)
                         gr_score_detail = gr.Slider(label="総合スコア　【必須】",value=3, minimum=1, maximum=5, step=1,  interactive=False)
+                        gr_eval_annotation_explain = gr.Markdown("詳細アノテーション (5点満点)")
                         with gr.Row() :
+                            gr_helpfulness = gr.Slider(label="有用性", minimum=0, value=0, maximum=5, step=1, interactive=False)
+                            gr_correctness = gr.Slider(label="正確さ", minimum=0, value=0, maximum=5, step=1, interactive=False)
                             gr_coherence = gr.Slider(label="一貫性", minimum=0, value=0, maximum=5, step=1, interactive=False)
                             gr_complexity = gr.Slider(label="複雑さ", minimum=0, value=0, maximum=5, step=1, interactive=False)
                         with gr.Row():
                             gr_controlled_substance = gr.Radio(label="規制対象物質", choices=["不明", "有", "無"], value="不明", interactive=False)
+                            gr_criminal_planing = gr.Radio(label="犯罪計画", choices=["不明", "有", "無"], value="不明", interactive=False)
                         with gr.Row():
                             gr_privacy = gr.Radio(label="個人情報", choices=["不明", "有", "無"], value="不明", interactive=False)
                 # slider
                 g_score: int,
+                g_helpfulness: int,
+                g_correctness: int,
+                g_coherence: int,
                 g_complexity: int,
                 g_verbosity: int,
                 g_humor: int,
                 g_threat: str,
                 g_gun: str,
                 g_controlled_substance: str,
+                g_criminal_planing: str,
                 g_privacy: str,
                 g_harassment: str,
                 g_profanity: str,
                 # 送信用データ更新
                 score.value = g_score
+                helpfulness.value = g_helpfulness
+                correctness.value = g_correctness
+                coherence.value = g_coherence
                 complexity.value = g_complexity
                 verbosity.value = g_verbosity
                 humor.value = g_humor
                 threat.value = checkbox_to_int(g_threat)
                 gun.value = checkbox_to_int(g_gun)
                 controlled_substance.value = checkbox_to_int(g_controlled_substance)
+                criminal_planing.value = checkbox_to_int(g_criminal_planing)
                 privacy.value = checkbox_to_int(g_privacy)
                 harassment.value = checkbox_to_int(g_harassment)
                 profanity.value = checkbox_to_int(g_profanity)
                     is_proofreading_2.value,
                     answer_text_2.value,
                     score.value,
+                    helpfulness.value,
+                    correctness.value,
+                    coherence.value,
                     complexity.value,
                     verbosity.value,
                     humor.value,
                     threat.value,
                     gun.value,
                     controlled_substance.value,
+                    criminal_planing.value,
                     privacy.value,
                     harassment.value,
                     profanity.value,
                 inputs=[
                     gr_answer_text_3_1,
                     gr_score_detail,
+                    gr_helpfulness,
+                    gr_correctness,
                     gr_coherence,
                     gr_complexity,
                     gr_verbosity,
                     gr_threat,
                     gr_gun,
                     gr_controlled_substance,
+                    gr_criminal_planing,
                     gr_privacy,
                     gr_harassment,
                     gr_profanity,
                     gr_question_text_3_1,
                     gr_answer_text_3_1,
                     gr_score_detail,
+                    gr_helpfulness,
+                    gr_correctness,
                     gr_coherence,
                     gr_complexity,
                     gr_verbosity,
                     gr_threat,
                     gr_gun,
                     gr_controlled_substance,
+                    gr_criminal_planing,
                     gr_privacy,
                     gr_harassment,
                     gr_profanity,
                     is_proofreading_2.value,
                     answer_text_2.value,
                     score.value,
+                    helpfulness.value,
+                    correctness.value,
+                    coherence.value,
                     complexity.value,
                     verbosity.value,
                     humor.value,
                     threat.value,
                     gun.value,
                     controlled_substance.value,
+                    criminal_planing.value,
                     privacy.value,
                     harassment.value,
                     profanity.value,
                         gr_question_text_3_1,
                         gr_answer_text_3_1,
                         gr_score_detail,
+                        gr_helpfulness,
+                        gr_correctness,
                         gr_coherence,
                         gr_complexity,
                         gr_verbosity,
                         gr_threat,
                         gr_gun,
                         gr_controlled_substance,
+                        gr_criminal_planing,
                         gr_privacy,
                         gr_harassment,
                         gr_profanity,
                         gr_question_text_3_1,
                         gr_answer_text_3_1,
                         gr_score_detail,
+                        gr_helpfulness,
+                        gr_correctness,
                         gr_coherence,
                         gr_complexity,
                         gr_verbosity,
                         gr_threat,
                         gr_gun,
                         gr_controlled_substance,
+                        gr_criminal_planing,
                         gr_privacy,
                         gr_harassment,
                         gr_profanity,
                         gr_question_text_3_1,
                         gr_answer_text_3_1,
                         gr_score_detail,
+                        gr_helpfulness,
+                        gr_correctness,
                         gr_coherence,
                         gr_complexity,
                         gr_verbosity,
                         gr_threat,
                         gr_gun,
                         gr_controlled_substance,
+                        gr_criminal_planing,
                         gr_privacy,
                         gr_harassment,
                         gr_profanity,
                                 gr_question_text_3_1,
                                 gr_answer_text_3_1,
                                 gr_score_detail,
+                                gr_helpfulness,
+                                gr_correctness,
                                 gr_coherence,
                                 gr_complexity,
                                 gr_verbosity,
                                 gr_threat,
                                 gr_gun,
                                 gr_controlled_substance,
+                                gr_criminal_planing,
                                 gr_privacy,
                                 gr_harassment,
                                 gr_profanity,
                                 gr_question_text_3_1,
                                 gr_answer_text_3_1,
                                 gr_score_detail,
+                                gr_helpfulness,
+                                gr_correctness,
                                 gr_coherence,
                                 gr_complexity,
                                 gr_verbosity,
                                 gr_threat,
                                 gr_gun,
                                 gr_controlled_substance,
+                                gr_criminal_planing,
                                 gr_privacy,
                                 gr_harassment,
                                 gr_profanity,
                                 gr_question_text_3_1,
                                 gr_answer_text_3_1,
                                 gr_score_detail,
+                                gr_helpfulness,
+                                gr_correctness,
                                 gr_coherence,
                                 gr_complexity,
                                 gr_verbosity,
                                 gr_threat,
                                 gr_gun,
                                 gr_controlled_substance,
+                                gr_criminal_planing,
                                 gr_privacy,
                                 gr_harassment,
                                 gr_profanity,
                                 gr_question_text_3_1,
                                 gr_answer_text_3_1,
                                 gr_score_detail,
+                                gr_helpfulness,
+                                gr_correctness,
                                 gr_coherence,
                                 gr_complexity,
                                 gr_verbosity,
                                 gr_threat,
                                 gr_gun,
                                 gr_controlled_substance,
+                                gr_criminal_planing,
                                 gr_privacy,
                                 gr_harassment,
                                 gr_profanity,
                                 gr_question_text_3_1,
                                 gr_answer_text_3_1,
                                 gr_score_detail,
+                                gr_helpfulness,
+                                gr_correctness,
                                 gr_coherence,
                                 gr_complexity,
                                 gr_verbosity,
                                 gr_threat,
                                 gr_gun,
                                 gr_controlled_substance,
+                                gr_criminal_planing,
                                 gr_privacy,
                                 gr_harassment,
                                 gr_profanity,
             def score_reset_display():
                 # gr.State
                 score.value = 3
+                helpfulness.value = 0
+                correctness.value = 0
+                coherence.value = 0
                 complexity.value = 0
                 verbosity.value = 0
                 humor.value = 0
                 suicide.value = 0
                 threat.value = 0
                 gun.value = 0
+                controlled_substance.value = 0
+                criminal_planing.value = 0
                 privacy.value = 0
                 harassment.value = 0
                 profanity.value = 0
                 inputs=[],
                 outputs=[
                     gr_score_detail,
+                    gr_helpfulness,
+                    gr_correctness,
                     gr_coherence,
                     gr_complexity,
                     gr_verbosity,
                     gr_threat,
                     gr_gun,
                     gr_controlled_substance,
+                    gr_criminal_planing,
                     gr_privacy,
                     gr_harassment,
                     gr_profanity,
             gr_data_load_btn.click(
                 dataset_load_fn,
                 inputs=None,
+                # textをセットし、interactiveをTrueにする (UI更新)
                 outputs=[
                         gr_question_text_1_1,
                         gr_answer_text_1_1,
                         gr_submit_score,
                         gr_score_detail,
                         gr_score_reset,
+                        gr_helpfulness,
+                        gr_correctness,
                         gr_coherence,
                         gr_complexity,
                         gr_verbosity,
                         gr_threat,
                         gr_gun,
                         gr_controlled_substance,
+                        gr_criminal_planing,
                         gr_privacy,
                         gr_harassment,
                         gr_profanity,