video_bot_999

Sleeping

youngtsai committed on Feb 13

Commit

dc5db85

•

1 Parent(s): e5a1f9f

def preprocess_text(text):

Files changed (1) hide show

app.py CHANGED Viewed

@@ -393,6 +393,18 @@ def process_web_link(link):
     return soup.get_text()
 # get video_id_summary.json content
 def get_video_id_summary(video_id, df_string):
@@ -406,7 +418,9 @@ def get_video_id_summary(video_id, df_string):
         exists, file_id = check_file_exists(service, folder_id, file_name)
         if not exists:
             summary = generate_summarise(df_string)
-            summary_json = {"summary": summary}
             summary_text = json.dumps(summary_json, ensure_ascii=False, indent=2)
             file_id = upload_content_directly(service, file_name, folder_id, summary_text)
             print("summary已上传到Google Drive")

     return soup.get_text()
# Characters that may not appear raw inside a JSON string, mapped to their
# escape sequences (RFC 8259, section 7). Every control character below
# U+0020 gets a generic \u00XX escape first; the characters that have a
# dedicated short escape then override that default.
_JSON_ESCAPE_TABLE = {code: "\\u{:04x}".format(code) for code in range(0x20)}
_JSON_ESCAPE_TABLE.update(
    {
        ord("\\"): "\\\\",
        ord('"'): '\\"',
        ord("\b"): "\\b",
        ord("\f"): "\\f",
        ord("\n"): "\\n",
        ord("\r"): "\\r",
        ord("\t"): "\\t",
    }
)


def preprocess_text(text):
    """Escape *text* so it can be placed between the quotes of a JSON string.

    The escaping is done in a single pass, so a backslash already present in
    the input is escaped exactly once and can never be confused with one
    introduced by another replacement. Only escapes that are legal in JSON
    are produced: a single quote is left untouched (``\\'`` is not a valid
    JSON escape) and a vertical tab is written as ``\\u000b`` (``\\v`` is
    not valid JSON either).

    Args:
        text: The string to escape.

    Returns:
        The escaped string, without surrounding quotes. Wrapping it in
        double quotes yields a JSON string literal that decodes back to
        *text*.

    Note:
        ``json.dumps`` performs its own escaping. Feeding the result of this
        function to ``json.dumps`` escapes it a second time, so use one or
        the other, not both.
    """
    return text.translate(_JSON_ESCAPE_TABLE)
 # get video_id_summary.json content
 def get_video_id_summary(video_id, df_string):
         exists, file_id = check_file_exists(service, folder_id, file_name)
         if not exists:
             summary = generate_summarise(df_string)
+            # preprocess_text to json value acceptable
+            processed_summary = preprocess_text(summary)
+            summary_json = {"summary": processed_summary}
             summary_text = json.dumps(summary_json, ensure_ascii=False, indent=2)
             file_id = upload_content_directly(service, file_name, folder_id, summary_text)
             print("summary已上传到Google Drive")