Spaces:
Sleeping
Sleeping
formatted_transcript
Browse files
app.py
CHANGED
@@ -54,18 +54,21 @@ def process_youtube_link(link):
|
|
54 |
# 假设您已经获取了 YouTube 视频的逐字稿并存储在变量 `transcript` 中
|
55 |
video_id = link.split("=")[-1]
|
56 |
transcript = YouTubeTranscriptApi.get_transcript(video_id, languages=['zh-TW'])
|
57 |
-
|
58 |
-
|
59 |
# 基于逐字稿生成其他所需的输出
|
60 |
questions = generate_questions(transcript)
|
61 |
df_summarise = generate_df_summarise(transcript)
|
|
|
|
|
|
|
|
|
|
|
62 |
|
63 |
# 确保返回与 UI 组件预期匹配的输出
|
64 |
return questions[0] if len(questions) > 0 else "", \
|
65 |
questions[1] if len(questions) > 1 else "", \
|
66 |
questions[2] if len(questions) > 2 else "", \
|
67 |
df_summarise, \
|
68 |
-
|
69 |
|
70 |
def process_web_link(link):
|
71 |
# 抓取和解析网页内容
|
|
|
54 |
# 假设您已经获取了 YouTube 视频的逐字稿并存储在变量 `transcript` 中
|
55 |
video_id = link.split("=")[-1]
|
56 |
transcript = YouTubeTranscriptApi.get_transcript(video_id, languages=['zh-TW'])
|
|
|
|
|
57 |
# 基于逐字稿生成其他所需的输出
|
58 |
questions = generate_questions(transcript)
|
59 |
df_summarise = generate_df_summarise(transcript)
|
60 |
+
|
61 |
+
formatted_transcript = ""
|
62 |
+
for entry in transcript:
|
63 |
+
line = f"时间: {entry['start']} 秒, 持续: {entry['duration']} 秒, 文本: {entry['text']}\n"
|
64 |
+
formatted_transcript += line
|
65 |
|
66 |
# 确保返回与 UI 组件预期匹配的输出
|
67 |
return questions[0] if len(questions) > 0 else "", \
|
68 |
questions[1] if len(questions) > 1 else "", \
|
69 |
questions[2] if len(questions) > 2 else "", \
|
70 |
df_summarise, \
|
71 |
+
formatted_transcript
|
72 |
|
73 |
def process_web_link(link):
|
74 |
# 抓取和解析网页内容
|