Spaces:

JunyiAcademy
/

vaitor2

Sleeping

App Files Files Community

youngtsai committed on Mar 6, 2024

Commit

0569047

1 Parent(s): 01aa382

update

Browse files

Files changed (1) hide show

app.py +194 -40

app.py CHANGED Viewed

@@ -307,7 +307,7 @@ def update_file_on_drive(service, file_id, file_content):
     print(f"文件已更新，文件ID: {updated_file['id']}")
-# ----  Main Functions ----
 def process_file(password, file):
     verify_password(password)
@@ -347,6 +347,8 @@ def docx_to_text(file):
     doc = Document(file)
     return "\n".join([para.text for para in doc.paragraphs])
 def format_seconds_to_time(seconds):
     """将秒数格式化为 时:分:秒 的形式"""
     hours = int(seconds // 3600)
@@ -617,12 +619,16 @@ def screenshot_youtube_video(youtube_id, snapshot_sec):
     return screenshot_path
 def process_web_link(link, timeout=30):
     """Download the page at ``link`` and return the text extracted from its HTML."""
     # Fetch and parse the web page content.
     # A timeout is passed because requests.get() otherwise waits indefinitely
     # on an unresponsive server, which would hang the calling handler.
     response = requests.get(link, timeout=timeout)
     soup = BeautifulSoup(response.content, 'html.parser')
     return soup.get_text()
 def get_mind_map(video_id, df_string, source):
     if source == "gcs":
         print("===get_mind_map on gcs===")
@@ -903,6 +909,145 @@ def change_questions(password, df_string):
     print("=====get_questions=====")
     return q1, q2, q3
 def respond(password, user_message, data, chat_history, socratic_mode=False):
     verify_password(password)
@@ -1281,7 +1426,6 @@ def chat_with_youtube_transcript(password, youtube_id, thread_id, trascript, use
     # 返回聊天历史和空字符串清空输入框
     return "", chat_history, thread.id
 def poll_run_status(run_id, thread_id, timeout=600, poll_interval=5):
     """
     Polls the status of a Run and handles different statuses appropriately.
@@ -1411,20 +1555,8 @@ with gr.Blocks() as demo:
                 groq_send_button = gr.Button("Send")
             with gr.Column(scale=3):
-                with gr.Tab("圖文"):
-                    transcript_html = gr.HTML(label="YouTube Transcript and Video")
-                with gr.Tab("投影片"):
-                    slide_image = gr.Image()
-                    slide_text = gr.Textbox()
-                    with gr.Row():
-                        prev_button = gr.Button("Previous")
-                        next_button = gr.Button("Next")
-                    prev_button.click(fn=prev_slide, inputs=[], outputs=[slide_image, slide_text])
-                    next_button.click(fn=next_slide, inputs=[], outputs=[slide_image, slide_text])
                 with gr.Tab("逐字稿"):
                     simple_html_content = gr.HTML(label="Simple Transcript")
-                with gr.Tab("本文"):
-                    df_string_output = gr.Textbox(lines=40, label="Data Text")
                 with gr.Tab("重點"):
                     df_summarise = gr.Textbox(container=True, show_copy_button=True, lines=40)
                 with gr.Tab("問題"):
@@ -1434,41 +1566,58 @@ with gr.Blocks() as demo:
                     btn_3 = gr.Button()
                     gr.Markdown("## 重新生成問題")
                     btn_create_question = gr.Button("Create Questions")
-                with gr.Tab("markdown"):
-                    gr.Markdown("## 請複製以下 markdown 並貼到你的心智圖工具中，建議使用：https://markmap.js.org/repl")
-                    mind_map = gr.Textbox(container=True, show_copy_button=True, lines=40, elem_id="mind_map_markdown")
                 with gr.Tab("心智圖",elem_id="mind_map_tab"):
                     mind_map_html = gr.HTML()
     with gr.Tab("教師版"):
         with gr.Row():
             gr.Markdown("## 教育評量饗宴")
         with gr.Row():
-            with gr.Column(scale=2):
-                with gr.Tab("認知階層評量題目"):
-                    cognitive_level_content = gr.Textbox(label="輸入學習目標與內容")
-                    cognitive_level_content_btn = gr.Button("生成評量題目")
                 with gr.Tab("素養導向閱讀題組"):
                     literacy_oriented_reading_content = gr.Textbox(label="輸入閱讀材料")
                     literacy_oriented_reading_content_btn = gr.Button("生成閱讀理解題")
-                with gr.Tab("學習單"):
-                    worksheet_content = gr.Textbox(label="輸入學習單內容")
-                    worksheet_content_btn = gr.Button("生成學習單")
-                with gr.Tab("自我評估"):
-                    self_assessment_content = gr.Textbox(label="輸入自評問卷或檢查表")
-                    self_assessment_content_btn = gr.Button("生成自評問卷")
-                with gr.Tab("自我反思評量"):
-                    self_reflection_content = gr.Textbox(label="輸入自我反思活動")
-                    self_reflection_content_btn = gr.Button("生成自我反思活動")
-                with gr.Tab("後設認知"):
-                    metacognition_content = gr.Textbox(label="輸入後設認知相關問題")
-                    metacognition_content_btn = gr.Button("生成後設認知問題")
-            with gr.Column(scale=3):
                 # 生成對應不同模式的結果
-                exam_result = gr.Textbox("生成結果")
     # 傳統模式
     # send_button.click(
     #     respond,
@@ -1559,8 +1708,13 @@ with gr.Blocks() as demo:
     # 教師版 學習單
     worksheet_content_btn.click(
         generate_worksheet,
-        inputs=[password, worksheet_content],
-        outputs=[exam_result]
     )
 demo.launch(allowed_paths=["videos"])

     print(f"文件已更新，文件ID: {updated_file['id']}")
+# ---- Text file ----
 def process_file(password, file):
     verify_password(password)
     doc = Document(file)
     return "\n".join([para.text for para in doc.paragraphs])
+# ---- YouTube link ----
 def format_seconds_to_time(seconds):
     """将秒数格式化为 时:分:秒 的形式"""
     hours = int(seconds // 3600)
     return screenshot_path
+# ---- Web ----
 def process_web_link(link, timeout=30):
     """Download the page at ``link`` and return the text extracted from its HTML."""
     # Fetch and parse the web page content.
     # A timeout is passed because requests.get() otherwise waits indefinitely
     # on an unresponsive server, which would hang the calling handler.
     response = requests.get(link, timeout=timeout)
     soup = BeautifulSoup(response.content, 'html.parser')
     return soup.get_text()
+# ---- LLM Generator ----
 def get_mind_map(video_id, df_string, source):
     if source == "gcs":
         print("===get_mind_map on gcs===")
     print("=====get_questions=====")
     return q1, q2, q3
+# --- 學習單 ---
+def generate_worksheet(password, df_string):
+    verify_password(password)
+    # df_string delete embed_url, screenshot_path
+    df_string_json = json.loads(df_string)
+    for entry in df_string_json:
+        entry.pop('embed_url', None)
+        entry.pop('screenshot_path', None)
+    df_string_text = json.dumps(df_string_json, ensure_ascii=False, indent=2)
+    worksheet_prompt = get_worksheet_prompt()
+    # 使用 OpenAI 生成基于上传数据的问题
+    sys_content = "你是一個擅長資料分析跟影片教學備課的老師，請精讀資料文本，自行判斷資料的種類，使用 zh-TW"
+    user_content = f"""
+        這是逐字稿：{df_string_text}
+        ---
+        請根據逐字稿進行以下工作：
+        不要提到 【逐字稿】 這個詞，直接給出工作內容即可
+        {worksheet_prompt}
+    """
+    messages = [
+        {"role": "system", "content": sys_content},
+        {"role": "user", "content": user_content}
+    ]
+    print("=====generate_worksheet messages=====")
+    print(messages)
+    print("=====generate_worksheet messages=====")
+    request_payload = {
+        "model": "gpt-4-1106-preview",
+        "messages": messages,
+        "max_tokens": 4000,
+    }
+    response = OPEN_AI_CLIENT.chat.completions.create(**request_payload)
+    worksheet = response.choices[0].message.content.strip()
+    print("=====worksheet=====")
+    print(worksheet)
+    print("=====worksheet=====")
+    return worksheet, worksheet_prompt
+def get_worksheet_prompt():
+    default_worksheet_prompt = """
+    你是個專業的教師，熟悉布魯姆(Benjamin Bloom, 1964) 的認知理論。布魯姆認為人類的能力，大致可分為三個領域(domains)，即認知領域(cognitive domain)、情意領域(affective domain)、技能領域 (psychomotor domain)。
+    【認知領域】涉及知能及其運作，著重心智、學習以及問題解決的工作。認知目標從簡單的認識或記憶能力到複雜的評鑑能力。大部分的教育目標都屬於這個領域。認知領域的目標分為六個層次，每個層次代表不同的心智功能。
+    - 📖 知識：在認知目標中知識是最低層次的能力，包括名詞、事實、規則和原理原則等的認識和記憶。用來表示此種能力的行為動詞有：指出、寫出、界定、說明、舉例、命名、認明等。例：能在地圖上指出長江流經的省分。
+    - 🤔 理解：理解是指能把握所學過知識或概念的意義，包含轉譯、解釋、推論等能力。代表此能力的行為動詞有：解釋、說明、區別、舉例、摘要、歸納等。例：能解釋光合作用。
+    - 🛠️ 應用：應用是指將所學到的規則、方法、步驟、原理、原則和概念，應用到新情境的能力。用來表示此能力的行為動詞有：預測、證明、解決、修改、表現、應用等。例：學生能預測抽出容器內之氣體對容器的影響。
+    - 🔍 分析：分析是指將所學到的概念或原則，分析為各個構成的部分，或找出各部分之間的相互關係，包括要素、關係及組織原理等的分析。用以表示此種能力的行為動詞有：選出、分析、判斷：區分、指出某些組成要素、指出某些的相互關係等。例：讀完某篇文章後，學生能區分事實和意見。
+    - 🌐 綜合：綜合是指將所學到的片斷概念或知識、原理原則或事實，統整成新的整體。用來表示此種能力的行為動詞有：設計、組織、綜合、創造、歸納、聯合等。例：讀完一篇有關防治汙染的文章後，學生能綜合防治汙染的各種方法。
+    - 🏅 評鑑：評鑑是認知目標中最高層次的能力，指依據某項標準做價值的判斷的能力。用來表示此能力的行為動詞有：評鑑、判斷、評論、比較、批��等。例：學生能評斷辯論中的謬論。
+    學習單包含以下的內容，將以布魯姆教育目標來建構提問的架構；請用 markdown 格式來呈現，題目和題目之間要換行，並加上 point 符號，像是 "-" 或是 "1." 等等。
+    - 📝 主題：請使用上傳檔案的檔名作為標題
+    - 🔑 重點： 和影片有關重要知識摘要
+    - 💭 概念：概念性問題 - 布魯姆的知識層級；數學知識的建構
+    - 📊 計算：程序性問題 - 布魯姆的理解層級；和影片相同的例題，類似的練習題 → 計算與步驟操作
+    - 🚀 延伸與應用 - 布魯姆的應用、分析、綜合、評鑑層級 → 延伸思考與應用
+    其中，「重點」的題目請用挖空的填空題；在「計算」的程序性問題請以單選題或填空題的形式來建立，需要 3 個題目；「延伸與應用」請使用問答題的形式來建立，一題即可。
+    這是範例格式：
+    ### 主題：【概念】認識公里
+    【情境描述】
+    狐狸貓和家人出遊，過程中認識測量較長距離的單位「公里」。
+    **【影片重點】**
+    公里是用來測量長距離的單位，通常用於測量很遠的距離。
+    1公里等於＿＿＿公尺，也稱為千米。
+    公里的英文簡寫是 ＿＿＿＿。
+    **【概念】**
+    請問公里通常用於測量什麼類型的距離？
+    如果一圈操場是200公尺，那跑5圈是多少公尺？多少公里？
+    為什麼我們需要使用公里這個單位來測量距離？
+    **【計算】**
+    一圈操場是200公尺，跑10圈是多少公里？(A) 1公里 (B) 2公里 (C) 3公里 (D) 4公里
+    如果你跑了5圈操場，運動手環上會顯示你跑了多少公里？
+    6000公尺等於多少公里？
+    **【延伸與應用】**
+    假設你參加一場慈善路跑活動，全程是5公里。如果你已經跑了3公里，還剩下多少公里？你覺得這樣的活動對你的體能有什麼影響？
+    """
+    return default_worksheet_prompt
+def generate_exam_fine_tune_result(password, worksheet_prompt, df_string_output, exam_result, exam_result_fine_tune_prompt):
+    verify_password(password)
+    # df_string delete embed_url, screenshot_path
+    df_string_json = json.loads(df_string_output)
+    for entry in df_string_json:
+        entry.pop('embed_url', None)
+        entry.pop('screenshot_path', None)
+    df_string_text = json.dumps(df_string_json, ensure_ascii=False, indent=2)
+    # 使用 OpenAI 生成基于上传数据的问题
+    sys_content = "你是一個擅長資料分析跟影片教學備課的老師，請精讀資料文本，自行判斷資料的種類，使用 zh-TW"
+    user_content = f"""
+        這是逐字稿：{df_string_text}
+        ---
+        這是預設的 prompt
+        {worksheet_prompt}
+        ---
+        產生了以下的結果：
+        {exam_result}
+        ---
+        但我不是很滿意，請根據以下的調整，產生新的結果
+        {exam_result_fine_tune_prompt}
+    """
+    messages = [
+        {"role": "system", "content": sys_content},
+        {"role": "user", "content": user_content}
+    ]
+    print("=====generate_exam_fine_tune_result messages=====")
+    print(messages)
+    print("=====generate_exam_fine_tune_result messages=====")
+    request_payload = {
+        "model": "gpt-4-1106-preview",
+        "messages": messages,
+        "max_tokens": 4000,
+    }
+    response = OPEN_AI_CLIENT.chat.completions.create(**request_payload)
+    exam_fine_tune_result = response.choices[0].message.content.strip()
+    print("=====exam_fine_tune_result=====")
+    print(exam_fine_tune_result)
+    print("=====exam_fine_tune_result=====")
+    return exam_fine_tune_result
+# ---- Chatbot ----
 def respond(password, user_message, data, chat_history, socratic_mode=False):
     verify_password(password)
     # 返回聊天历史和空字符串清空输入框
     return "", chat_history, thread.id
 def poll_run_status(run_id, thread_id, timeout=600, poll_interval=5):
     """
     Polls the status of a Run and handles different statuses appropriately.
                 groq_send_button = gr.Button("Send")
             with gr.Column(scale=3):
                 with gr.Tab("逐字稿"):
                     simple_html_content = gr.HTML(label="Simple Transcript")
                 with gr.Tab("重點"):
                     df_summarise = gr.Textbox(container=True, show_copy_button=True, lines=40)
                 with gr.Tab("問題"):
                     btn_3 = gr.Button()
                     gr.Markdown("## 重新生成問題")
                     btn_create_question = gr.Button("Create Questions")
                 with gr.Tab("心智圖",elem_id="mind_map_tab"):
                     mind_map_html = gr.HTML()
+                with gr.Accordion("See Details", open=False):
+                    with gr.Tab("本文"):
+                        df_string_output = gr.Textbox(lines=40, label="Data Text")
+                    with gr.Tab("圖文"):
+                        transcript_html = gr.HTML(label="YouTube Transcript and Video")
+                    with gr.Tab("投影片"):
+                        slide_image = gr.Image()
+                        slide_text = gr.Textbox()
+                        with gr.Row():
+                            prev_button = gr.Button("Previous")
+                            next_button = gr.Button("Next")
+                        prev_button.click(fn=prev_slide, inputs=[], outputs=[slide_image, slide_text])
+                        next_button.click(fn=next_slide, inputs=[], outputs=[slide_image, slide_text])
+                    with gr.Tab("markdown"):
+                        gr.Markdown("## 請複製以下 markdown 並貼到你的心智圖工具中，建議使用：https://markmap.js.org/repl")
+                        mind_map = gr.Textbox(container=True, show_copy_button=True, lines=40, elem_id="mind_map_markdown")
     with gr.Tab("教師版"):
         with gr.Row():
             gr.Markdown("## 教育評量饗宴")
         with gr.Row():
+            with gr.Column(scale=1):
+                # with gr.Tab("認知階層評量題目"):
+                #     cognitive_level_content = gr.Textbox(label="輸入學習目標與內容")
+                #     cognitive_level_content_btn = gr.Button("生成評量題目")
+                with gr.Tab("學習單"):
+                    worksheet_content_btn = gr.Button("生成學習單")
+                    with gr.Accordion("prompt", open=False):
+                        worksheet_prompt = gr.Textbox(label="worksheet_prompt", show_copy_button=True, lines=40)
                 with gr.Tab("素養導向閱讀題組"):
                     literacy_oriented_reading_content = gr.Textbox(label="輸入閱讀材料")
                     literacy_oriented_reading_content_btn = gr.Button("生成閱讀理解題")
+                # with gr.Tab("自我評估"):
+                #     self_assessment_content = gr.Textbox(label="輸入自評問卷或檢查表")
+                #     self_assessment_content_btn = gr.Button("生成自評問卷")
+                # with gr.Tab("自我反思評量"):
+                #     self_reflection_content = gr.Textbox(label="輸入自我反思活動")
+                #     self_reflection_content_btn = gr.Button("生成自我反思活動")
+                # with gr.Tab("後設認知"):
+                #     metacognition_content = gr.Textbox(label="輸入後設認知相關問題")
+                #     metacognition_content_btn = gr.Button("生成後設認知問題")
+            with gr.Column(scale=1):
                 # 生成對應不同模式的結果
+                exam_result = gr.Textbox(label="初次生成結果", show_copy_button=True)
+                exam_result_fine_tune_prompt = gr.Textbox(label="根據結果，輸入你想更改的想法")
+                exam_result_fine_tune_btn = gr.Button("微調結果")
+                exam_result_fine_result = gr.Textbox(label="微調結果",show_copy_button=True)
     # 傳統模式
     # send_button.click(
     #     respond,
     # 教師版 學習單
     worksheet_content_btn.click(
         generate_worksheet,
+        inputs=[password, df_string_output],
+        outputs=[exam_result, worksheet_prompt]
+    )
+    exam_result_fine_tune_btn.click(
+        generate_exam_fine_tune_result,
+        inputs=[password, worksheet_prompt, df_string_output, exam_result, exam_result_fine_tune_prompt],
+        outputs=[exam_result_fine_result]
     )
 demo.launch(allowed_paths=["videos"])