Spaces:

FreedomIntelligence
/

S2S_Evaluation

Sleeping

File size: 27,134 Bytes

dff2993

<!DOCTYPE html>
<html lang="en">

<head>
    <meta charset="UTF-8">
    <meta name="viewport" content="width=device-width, initial-scale=1.0">
    <title>Speech-to-Speech Model Comparison</title>
    <link href="https://cdn.jsdelivr.net/npm/bootstrap@5.3.0-alpha1/dist/css/bootstrap.min.css" rel="stylesheet">
    <script src="https://code.jquery.com/jquery-3.6.0.min.js"></script>
    <style>

        body {

            background-color: #f4f6f9;

            font-family: 'Arial', sans-serif;

        }



        .container {

            background-color: white;

            border-radius: 10px;

            box-shadow: 0 4px 12px rgba(0, 0, 0, 0.1);

            padding: 30px;

        }



        h3 {

            font-size: 1.2rem;

            /* 调整标题字体大小 */

            font-weight: bold;

            color: #333;

        }



        .form-control {

            border-radius: 25px;

            padding: 15px;

        }



        .btn {

            border-radius: 25px;

            font-size: 0.9rem;

            padding: 8px 16px;

            transition: background-color 0.3s ease;

        }



        .btn-primary {

            background-color: #007bff;

            border: none;

        }



        .btn-primary:hover {

            background-color: #0056b3;

        }



        .btn-success {

            background-color: #28a745;

            border: none;

        }



        .btn-success:hover {

            background-color: #218838;

        }



        .btn-selected {

            background-color: #155724 !important;

            color: white !important;

        }



        .btn-option {

            font-size: 0.9rem;

            padding: 8px 20px;

            margin: 0 10px;

        }



        #test-content {

            display: none;

        }



        #category-select,

        #task-select-dropdown {

            width: 120% !important;

            /* 设置宽度为60% */

            margin: 0 auto;

            /* 居中对齐 */

        }



        #confirm-choice,

        #next-test {

            display: none;

            transition: opacity 0.3s ease;

        }



        #model-comparison {

            display: none;

            opacity: 0;

            transition: opacity 0.3s ease;

        }



        #model-comparison.show {

            opacity: 1;

        }



        #switch-task {

            font-size: 0.8rem;

            padding: 5px 10px;

            position: absolute;

            top: 10px;

            right: 20px;

            display: none;

        }

        #task-description {

        display: none;

        }

    </style>
</head>

<body>
    <div class="container py-5">
        <h3 class="text-center mb-4">Speech-to-Speech Model Comparison</h3>

        <div id="evaluation-info" class="mb-5">
            <p class="text-start">
                <strong>Welcome to the Speech-to-Speech (S2S) Model Evaluation!</strong>
                <br><br>
                In this evaluation, you will assess the performance of 4 S2S models:
                <strong>ChatGPT-4o</strong>, <strong>FunAudioLLM</strong>, <strong>SpeechGPT</strong>, and
                <strong>Mini-Omni</strong>.
                The goal is to evaluate how well these models handle various speech tasks across different domains.
                <br><br>
                Once you select a specific domain and task (e.g., <em>Educational Tutoring</em> and <em>Rhythm Control</em>),
                you will proceed to the evaluation stage. In each round, you will be presented with an audio input.
                For example:
                <br><br>
                
                <!-- Left-aligned Audio Sample and Audio Control -->
                <span style="vertical-align: middle; line-height: 1.2; display: inline-block;"><strong>Audio Sample:</strong></span>
                <audio controls style="vertical-align: middle;">
                    <source src="/static/audio/sample/input_audio.wav" type="audio/wav">
                </audio>
                
                <br><br>
                The corresponding text is:
                <em>"Say the following sentence at my speed first, then say it again very slowly:
                    'Artificial intelligence is changing the world in many ways.'" </em>
                <small>(Note: the audio plays at 1.5x the normal speed.)</small>
                <br><br>
                The responses of different S2S models will be provided, and your task is to choose which response best follows
                the instructions. For example<small>(Note: During the evaluation process, you will be provided with responses from only the two models that have the most comparative significance.)</small>:
                <br><br>
        
                <!-- ChatGPT-4o Output -->
                <span><strong>ChatGPT-4o:</strong></span>
                <audio controls style="vertical-align: middle;">
                    <source src="/static/audio/sample/4o_audio.wav" type="audio/wav">
                </audio>
                <p class="text-start" style="margin-left: 20px;">
                    <strong>Performance:</strong> Speech: Partially followed the instruction on speed. Semantics: Accurately followed the instruction, with no semantic deviation or missing information.
                </p>
        
                <!-- FunAudioLLM Output -->
                <span><strong>FunAudioLLM:</strong></span>
                <audio controls style="vertical-align: middle;">
                    <source src="/static/audio/sample/FunAudio_audio.wav" type="audio/wav">
                </audio>
                <p class="text-start" style="margin-left: 20px;">
                    <strong>Performance:</strong> Speech: Partially followed the instruction on speed. Semantics: Accurately followed the instruction, with no semantic deviation or missing information.
                </p>
        
                <!-- SpeechGPT Output -->
                <span><strong>SpeechGPT:</strong></span>
                <audio controls style="vertical-align: middle;">
                    <source src="/static/audio/sample/SpeechGPT.wav" type="audio/wav">
                </audio>
                <p class="text-start" style="margin-left: 20px;">
                    <strong>Performance:</strong> Speech: Did not follow the instruction on speed. Semantics: Partially followed the instruction, with minor semantic deviation and missing information.
                </p>
        
                <!-- Mini-Omni Output -->
                <span><strong>Mini-Omni:</strong></span>
                <audio controls style="vertical-align: middle;">
                    <source src="/static/audio/sample/mini-omni.wav" type="audio/wav">
                </audio>
                <p class="text-start" style="margin-left: 20px;">
                    <strong>Performance:</strong> Speech: Did not follow the instruction on speed. Semantics: Did not follow the instruction, with significant semantic deviation and missing information.
                </p>

                <p class="text-start">
                    After making your choice, you'll proceed to the next round.
                </p>
                <strong>Please enter your username and start the evaluation!</strong>
            </p>
        </div>

        <div id="user-input" class="text-center">
            <div class="mb-3">
                <input type="text" id="username" class="form-control w-50 mx-auto" placeholder="Your username" />
            </div>
            <button class="btn btn-primary" onclick="startTest()">Start Test</button>
        </div>


        <div id="task-select" class="text-center" style="display: none;">
            <h3 class="my-4">Select Test Category:</h3>
            <div class="d-grid gap-2 col-6 mx-auto">
                <!-- Category dropdown -->
                <select id="category-select" class="form-select mx-auto" onchange="populateTasks()">
                    <option value="" disabled selected>Select Category</option>
                    <option value="educational">Educational Tutoring</option>
                    <option value="social">Social Companionship</option>
                    <option value="entertainment">Entertainment Dubbing</option>
                    <option value="medical">Medical Consultation</option>
                </select>
            </div>

            <h3 class="my-4" id="specific-task-title" style="display: none;">Select Specific Task:</h3>
            <div class="d-grid gap-2 col-6 mx-auto">
                <!-- Task dropdown -->
                <select id="task-select-dropdown" class="form-select mx-auto" style="display: none;">
                    <option value="" disabled selected>Select Specific Task</option>
                    <!-- Options will be populated dynamically -->
                </select>
            </div>

            <button class="btn btn-primary mt-4" id="start-task-btn" onclick="selectTaskFromDropdown()"

                style="display: none;">Start Task</button>
        </div>

        <button id="switch-task" class="btn btn-warning" onclick="switchTask()">Switch Category and Tasks</button>

        <div id="test-content">
            <div class="text-center">

                <div class="row justify-content-center">
                    <div class="col-md-6 text-start double-text" style="margin-bottom: 10px;">
                        <strong>Task description:</strong> <span id="task-description"></span>
                    </div>
                </div>

                <!-- 在音频控件前添加粗体的 Audio: -->
                <div class="row justify-content-center">
                    <div class="col-md-6 d-flex justify-content-center align-items-center mb-4">
                        <strong class="me-2">Audio:</strong> <!-- 加粗的 Audio 标签 -->
                        <audio id="input-audio" controls></audio>
                    </div>
                </div>

                <div class="row justify-content-center">
                    <div class="col-md-6 text-start double-text" style="margin-bottom: 10px;">
                        <strong>Audio text:</strong> <span id="test-text"></span>
                    </div>
                </div>

                <!-- 调整后的左对齐样式 -->
                <div class="row justify-content-center">
                    <div class="col-md-6 text-start">
                        <p><strong>Question:</strong> Which of the following two models answers the result better?</p>
                    </div>
                </div>

                <!-- 使用flex布局放置音频 -->
                <div class="mb-4 text-center">
                    <div class="model-section d-flex align-items-center justify-content-center mb-3">
                        <h6 class="me-2" style="margin-bottom: 0; margin-top: 5px; font-weight: bold;">Model A:</h6>
                        <audio id="audio-a" controls></audio>
                    </div>
                    <div class="model-section d-flex align-items-center justify-content-center">
                        <h6 class="me-2" style="margin-bottom: 0; margin-top: 5px; font-weight: bold;">Model B:</h6>
                        <audio id="audio-b" controls></audio>
                    </div>
                </div>


                <div class="d-flex justify-content-center mt-4">
                    <button class="btn btn-success btn-option mx-2" onclick="selectModel('A')">Model A</button>
                    <button class="btn btn-success btn-option mx-2" onclick="selectModel('B')">Model B</button>
                </div>

                <div id="model-comparison" class="text-center mt-4">
                    <p>Model A: <span id="model-a"></span></p>
                    <p>Model B: <span id="model-b"></span></p>
                    <p>Your choice: <span id="chosen-model"></span></p>
                </div>

                <button id="confirm-choice" class="btn btn-primary mt-4" onclick="confirmChoice()">Confirm
                    Selection</button>
                <button id="next-test" class="btn btn-primary mt-4" onclick="loadNextTest()">Next Test</button>
            </div>
        </div>

        <div id="test-completed" class="text-center" style="display: none;">
            <h3>Thank you for completing the <span id="completed-task"></span> test!</h3>
            <p>Would you like to test another category or task?</p>
            <button class="btn btn-primary" onclick="switchTask()">Yes</button>
            <button class="btn btn-secondary" onclick="endTest()">No</button>
        </div>

        <!-- 引入 Bootstrap 脚本 -->
        <script src="https://cdn.jsdelivr.net/npm/bootstrap@5.3.0-alpha1/dist/js/bootstrap.bundle.min.js"></script>
        <script>

            let username;

            let task;

            let chosenModel;

            let modelA, modelB; // 存储映射后的模型名称



            // 根据模型路径显示友好的模型名称

            const modelNames = {

                "output_path_speechgpt": "SpeechGPT",

                "output_path_miniomni": "Mini-Omni",

                "output_path_4o": "ChatGPT-4o",

                "output_path_funaudio": "FunAudioLLM",

                "output_path_4o_cascade": "Cascade",

                "output_path_4o_llama_omni": "LLaMA-Omni"

            };



            function startTest() {

                username = $("#username").val();

                if (!username) {

                    alert("Please enter a username");

                    return;

                }

                $("#evaluation-info").hide();

                $("#user-input").hide();

                $("#task-select").show();

            }



            function switchTask() {

                // 清理页面所有之前的测试内容

                $("#task-description").text('');

                $("#test-content").hide();       // 隐藏测试内容

                $("#test-text").text('');        // 清空音频文本

                $("#input-audio").attr("src", '');  // 清空音频路径

                $("#audio-a").attr("src", '');      // 清空模型 A 音频

                $("#audio-b").attr("src", '');      // 清空模型 B 音频

                $("#chosen-model").text('');        // 清空用户选择的模型显示

                $("#model-a").text('');             // 清空模型 A 名称显示

                $("#model-b").text('');             // 清空模型 B 名称显示

                $("#confirm-choice").hide();        // 隐藏确认选择按钮

                $("#next-test").hide();             // 隐藏下一个测试按钮

                $("#model-comparison").removeClass('show').hide();  // 隐藏模型对比部分



                // 显示选择任务的页面

                $("#test-completed").hide();  // 隐藏感谢页面

                $("#task-select").show();     // 显示选择方向页面

                $("#switch-task").hide();     // 隐藏切换按钮直到新测试开始

            }



            function selectTask(selectedTask) {

                task = selectedTask;



                // 切换任务时清理页面内容，防止旧数据残留

                $("#task-description").text('');

                $("#test-text").text('');        // 清空音频文本

                $("#input-audio").attr("src", '');  // 清空音频路径

                $("#audio-a").attr("src", '');      // 清空模型 A 音频

                $("#audio-b").attr("src", '');      // 清空模型 B 音频

                $("#chosen-model").text('');        // 清空用户选择的模型显示

                $("#model-a").text('');             // 清空模型 A 名称显示

                $("#model-b").text('');             // 清空模型 B 名称显示

                $("#confirm-choice").hide();        // 隐藏确认选择按钮

                $("#next-test").hide();             // 隐藏下一个测试按钮

                $("#model-comparison").removeClass('show').hide();  // 隐藏模型对比部分



                // 隐藏选择任务界面，显示切换方向按钮

                $("#task-select").hide();

                $("#switch-task").show();



                // 发起请求获取新的测试数据

                $.ajax({

                    url: '/start_test',

                    type: 'POST',

                    contentType: 'application/json',

                    data: JSON.stringify({ username: username, task: task }),

                    success: function (data) {

                        $("#test-content").show();

                        loadNextTest();

                    },

                    error: function (xhr, status, error) {

                        console.error("Error occurred: ", status, error);

                    }

                });

            }



            function populateTasks() {

                const category = $("#category-select").val();

                const taskDropdown = $("#task-select-dropdown");



                // 清空任务下拉菜单

                taskDropdown.empty();

                // 添加禁用的默认选项

                taskDropdown.append('<option value="" disabled selected>Select Specific Task</option>');



                // 根据所选分类填充相应的任务选项

                if (category === 'educational') {

                    taskDropdown.append('<option value="pronunciation">Correcting pronunciation ability</option>');

                    taskDropdown.append('<option value="rhythm">Rhythm control capabilities</option>');

                    taskDropdown.append('<option value="translation">Cross-language translation with emotion</option>');

                    taskDropdown.append('<option value="language">Language consistency</option>');

                    taskDropdown.append('<option value="pause">Pause and segmentation</option>');

                    taskDropdown.append('<option value="polyphone">Polyphonic word comprehension</option>');

                    taskDropdown.append('<option value="stress">Emphasis control</option>');

                } else if (category === 'social') {

                    taskDropdown.append('<option value="emotion">Emotion recognition and expression</option>');

                    taskDropdown.append('<option value="identity">Identity coping ability</option>');

                    taskDropdown.append('<option value="humor">Implications ability</option>');

                    taskDropdown.append('<option value="irony">Sarcasm detection</option>');

                } else if (category === 'entertainment') {

                    taskDropdown.append('<option value="natural">Ability to simulate natural sound</option>');

                    taskDropdown.append('<option value="singing">Singing ability</option>');

                    taskDropdown.append('<option value="tongue">Tongue twisters capabilities</option>');

                    taskDropdown.append('<option value="crosstalk">Crosstalk ability</option>');

                    taskDropdown.append('<option value="poetry">Poetry recitation</option>');

                    taskDropdown.append('<option value="role">Role-playing</option>');

                    taskDropdown.append('<option value="story">Storytelling</option>');

                } else if (category === 'medical') {

                    taskDropdown.append('<option value="healthcare">Health consultation</option>');

                    taskDropdown.append('<option value="illness">Querying symptoms</option>');

                    taskDropdown.append('<option value="psychological">Psychological comfort</option>');

                }



                // 显示任务下拉菜单和开始按钮

                if (category) {

                    $("#specific-task-title").show();

                    $("#task-select-dropdown").show();

                    $("#start-task-btn").show();

                } else {

                    $("#specific-task-title").hide();

                    $("#task-select-dropdown").hide();

                    $("#start-task-btn").hide();

                }

            }





            function selectTaskFromDropdown() {

                const selectedTask = $("#task-select-dropdown").val();

                if (selectedTask) {

                    task = selectedTask;

                    $.ajax({

                        url: '/start_test',

                        type: 'POST',

                        contentType: 'application/json',

                        data: JSON.stringify({ username: username, task: task }),

                        success: function (data) {

                            // 在页面显示任务描述

                            $("#task-description").text(data.task_description);

                            $("#task-description").show();

                            $("#task-select").hide();

                            $("#test-content").show();

                            $("#switch-task").show();  // 显示右上角的切换任务按钮

                            loadNextTest();

                        },

                        error: function (xhr, status, error) {

                            console.error("Error occurred: ", status, error);

                        }

                    });

                } else {

                    alert("Please select a specific task.");

                }

            }









            function loadNextTest() {

                $.get('/next_test', function (data) {

                    if (data.message === 'Test completed') {

                        $("#test-content").hide();  // 隐藏测试内容

                        $("#test-completed").show(); // 显示测试完成的页面



                        // 动态显示完成的任务名称

                        $("#completed-task").text(task);



                        // 清空 session 数据，防止继续原方向的测试

                        sessionStorage.removeItem('current_index');

                    } else {

                        // 正常加载测试题目

                        console.log(data);  // 添加调试信息，检查 data 的内容

                        $("#task-description").text(data.task_description);

                        $("#test-text").text(data.text);

                        $("#input-audio").attr("src", data.input_path);

                        $("#audio-a").attr("src", data.audio_a);

                        $("#audio-b").attr("src", data.audio_b);



                        // 更新模型信息

                        modelA = modelNames[data.model_a];

                        modelB = modelNames[data.model_b];

                        $("#model-a").text(modelA);

                        $("#model-b").text(modelB);



                        $("#next-test").hide();

                        $("#model-comparison").hide();

                        $("#confirm-choice").show();

                        chosenModel = null;

                        $(".btn-option").prop('disabled', false);

                        $(".btn-option").removeClass("btn-selected").addClass("btn-success");

                    }

                }, 'json').fail(function (xhr, status, error) {

                    console.error("Failed to load test data:", status, error);

                });

            }



            function endTest() {

                // 用户选择结束测试，可以跳转到结束页面或者返回主页

                alert("Thank you for participating in the test!");

                // 或者可以通过 window.location.href 跳转到其他页面

                window.location.href = "/thank_you";  // 你可以设置一个感谢页面或者其他动作

            }



            function selectModel(model) {

                // 将用户选择的模型存储在变量 chosenModel 中

                chosenModel = model;



                // 禁用所有模型选择按钮，防止重复点击

                $(".btn-option").prop('disabled', false); // 允许用户重新选择



                // 重置所有按钮的样式

                $(".btn-option").removeClass("btn-selected").addClass("btn-success");



                // 根据用户选择的模型按钮，添加 btn-selected 类改变其样式

                if (model === 'A') {

                    $("button:contains('Model A')").removeClass("btn-success").addClass("btn-selected");

                } else if (model === 'B') {

                    $("button:contains('Model B')").removeClass("btn-success").addClass("btn-selected");

                }

            }



            function confirmChoice() {

                // 检查是否选择了模型，如果没有选择，则提示用户

                if (!chosenModel) {

                    alert("Please select a model before confirming.");

                    return;

                }



                // 禁用模型选择按钮，防止用户在确认选择后更改选择

                $(".btn-option").prop('disabled', true);



                // 一旦用户确认选择，立刻显示选择的详细信息

                if (chosenModel === 'A') {

                    $("#chosen-model").text(modelA);  // 使用 modelA 映射后的名称

                } else {

                    $("#chosen-model").text(modelB);  // 使用 modelB 映射后的名称

                }



                // 将模型 A 和 B 的名称显示在同一行中，包括中文和英文翻译

                $("#model-a").text(modelA);  // 模型 A 名称

                $("#model-b").text(modelB);  // 模型 B 名称



                // 确认选择后才显示模型详细信息

                $("#model-comparison").addClass('show');

                $("#model-comparison").show();  // 展示选择信息



                // 隐藏确认按钮，显示“Next Test”按钮

                $("#confirm-choice").hide();

                $("#next-test").show();



                // 提交用户选择的模型

                $.ajax({

                    url: '/submit_result',

                    type: 'POST',

                    contentType: 'application/json',

                    data: JSON.stringify({ chosen_model: chosenModel }),

                    success: function (data) {

                        // 成功提交后处理逻辑

                    },

                    error: function (xhr, status, error) {

                        console.error("Error occurred: ", status, error);

                    }

                });

            }

        </script>
</body>

</html>