video_bot_999

Sleeping

App Files Files Community

youngtsai committed on Feb 14

Commit

3ffa0fc

•

1 Parent(s): 65300ff

mind_map

Browse files

Files changed (1) hide show

app.py +58 -3

app.py CHANGED Viewed

@@ -347,6 +347,8 @@ def process_youtube_link(link):
     html_content = format_transcript_to_html(formatted_transcript)
     first_image = formatted_transcript[0]['screenshot_path']
     first_text = formatted_transcript[0]['text']
     # 确保返回与 UI 组件预期匹配的输出
     return questions[0] if len(questions) > 0 else "", \
@@ -354,9 +356,10 @@ def process_youtube_link(link):
             questions[2] if len(questions) > 2 else "", \
             formatted_transcript_json, \
             summary, \
             html_content, \
             first_image, \
-            first_text
 def format_transcript_to_html(formatted_transcript):
@@ -404,6 +407,57 @@ def process_web_link(link):
     soup = BeautifulSoup(response.content, 'html.parser')
     return soup.get_text()
 def processed_video_summary_to_json(summary):
     """
         整體格式為：
@@ -446,7 +500,6 @@ def processed_video_summary_to_json(summary):
     return summary_json
 # get video_id_summary.json content
 def get_video_id_summary(video_id, df_string):
     print("===get_video_id_summary===")
@@ -777,6 +830,8 @@ with gr.Blocks() as demo:
                 btn_3 = gr.Button()
                 gr.Markdown("## 重新生成問題")
                 btn_create_question = gr.Button("Create Questions")
     send_button.click(
         respond,
@@ -794,7 +849,7 @@ with gr.Blocks() as demo:
     file_upload.change(process_file, inputs=file_upload, outputs=[btn_1, btn_2, btn_3, df_summarise, df_string_output])
     # 当输入 YouTube 链接时触发
-    youtube_link.change(process_youtube_link, inputs=youtube_link, outputs=[btn_1, btn_2, btn_3, df_string_output, df_summarise, transcript_html, slide_image, slide_text])
     # 当输入网页链接时触发
     web_link.change(process_web_link, inputs=web_link, outputs=[btn_1, btn_2, btn_3, df_summarise, df_string_output])

     html_content = format_transcript_to_html(formatted_transcript)
     first_image = formatted_transcript[0]['screenshot_path']
     first_text = formatted_transcript[0]['text']
+    mind_map_json = get_mind_map(video_id, formatted_simple_transcript)
+    mind_map = mind_map_json["mind_map"]
     # 确保返回与 UI 组件预期匹配的输出
     return questions[0] if len(questions) > 0 else "", \
             questions[2] if len(questions) > 2 else "", \
             formatted_transcript_json, \
             summary, \
+            mind_map, \
             html_content, \
             first_image, \
+            first_text,
 def format_transcript_to_html(formatted_transcript):
     soup = BeautifulSoup(response.content, 'html.parser')
     return soup.get_text()
+def get_mind_map(video_id, df_string):  # Return the {"mind_map": ...} dict for video_id: reuse the stored JSON file if present, otherwise generate and upload it.
+    # First check Google Drive for an existing {video_id}_mind_map.json
+    print("===get_mind_map===")
+    service = init_drive_service()
+    parent_folder_id = '1GgI4YVs0KckwStVQkLa1NZ8IpaEMurkL'  # hard-coded parent folder ID handed to create_folder_if_not_exists
+    folder_id = create_folder_if_not_exists(service, video_id, parent_folder_id)  # presumably the folder named after video_id under the parent; verify against the helper
+    file_name = f'{video_id}_mind_map.json'
+    # Check whether the file already exists
+    exists, file_id = check_file_exists(service, folder_id, file_name)
+    if not exists:
+        mind_map = generate_mind_map(df_string)  # not stored yet: build the mind map from df_string
+        mind_map_json = {"mind_map": str(mind_map)}
+        mind_map_text = json.dumps(mind_map_json, ensure_ascii=False, indent=2)  # ensure_ascii=False keeps non-ASCII text unescaped in the stored JSON
+        upload_content_directly(service, file_name, folder_id, mind_map_text)
+        print("mind_map已上傳到Google Drive")
+    else:
+        # The mind map already exists; download its content
+        print("mind_map已存在于Google Drive中")
+        mind_map_text = download_file_as_string(service, file_id)
+        mind_map_json = json.loads(mind_map_text)  # assumes the stored file is a JSON object with a "mind_map" key — TODO confirm
+    return mind_map_json
+def generate_mind_map(df_string):  # Ask the chat-completions client for a markdown mind map of df_string and return the stripped reply text.
+    # Use the OpenAI chat model to generate a markdown mind map from the given text (the system prompt requests zh-TW)
+    sys_content = "你是一個擅長資料分析跟影片教學的老師，user 為學生，請精讀資料文本，自行判斷資料的種類，使用 zh-TW"
+    user_content = f"""
+        請根據 {df_string} 文本建立 markdown 心智圖
+        注意：不需要前後文敘述，直接給出 markdown 文本即可
+        這對我很重要
+    """
+    messages = [
+        {"role": "system", "content": sys_content},
+        {"role": "user", "content": user_content}
+    ]
+    request_payload = {
+        "model": "gpt-4-1106-preview",
+        "messages": messages,
+        "max_tokens": 4000,  # upper bound on the length of the generated reply
+    }
+    response = client.chat.completions.create(**request_payload)  # `client` is defined outside this block
+    mind_map = response.choices[0].message.content.strip()  # text of the first choice, surrounding whitespace trimmed
+    print("=====mind_map=====")
+    print(mind_map)
+    print("=====mind_map=====")
+    return mind_map
 def processed_video_summary_to_json(summary):
     """
         整體格式為：
     return summary_json
 # get video_id_summary.json content
 def get_video_id_summary(video_id, df_string):
     print("===get_video_id_summary===")
                 btn_3 = gr.Button()
                 gr.Markdown("## 重新生成問題")
                 btn_create_question = gr.Button("Create Questions")
+            with gr.Tab("心智圖"):
+                mind_map = gr.Textbox()
     send_button.click(
         respond,
     file_upload.change(process_file, inputs=file_upload, outputs=[btn_1, btn_2, btn_3, df_summarise, df_string_output])
     # 当输入 YouTube 链接时触发
+    youtube_link.change(process_youtube_link, inputs=youtube_link, outputs=[btn_1, btn_2, btn_3, df_string_output, df_summarise, mind_map, transcript_html, slide_image, slide_text])
     # 当输入网页链接时触发
     web_link.change(process_web_link, inputs=web_link, outputs=[btn_1, btn_2, btn_3, df_summarise, df_string_output])