youngtsai committed on
Commit
938aee2
1 Parent(s): 3e13a5c

formatted_transcript

Browse files
Files changed (1) hide show
  1. app.py +6 -3
app.py CHANGED
@@ -54,18 +54,21 @@ def process_youtube_link(link):
54
  # 假设您已经获取了 YouTube 视频的逐字稿并存储在变量 `transcript` 中
55
  video_id = link.split("=")[-1]
56
  transcript = YouTubeTranscriptApi.get_transcript(video_id, languages=['zh-TW'])
57
-
58
-
59
  # 基于逐字稿生成其他所需的输出
60
  questions = generate_questions(transcript)
61
  df_summarise = generate_df_summarise(transcript)
 
 
 
 
 
62
 
63
  # 确保返回与 UI 组件预期匹配的输出
64
  return questions[0] if len(questions) > 0 else "", \
65
  questions[1] if len(questions) > 1 else "", \
66
  questions[2] if len(questions) > 2 else "", \
67
  df_summarise, \
68
- transcript
69
 
70
  def process_web_link(link):
71
  # 抓取和解析网页内容
 
54
  # 假设您已经获取了 YouTube 视频的逐字稿并存储在变量 `transcript` 中
55
  video_id = link.split("=")[-1]
56
  transcript = YouTubeTranscriptApi.get_transcript(video_id, languages=['zh-TW'])
 
 
57
  # 基于逐字稿生成其他所需的输出
58
  questions = generate_questions(transcript)
59
  df_summarise = generate_df_summarise(transcript)
60
+
61
+ formatted_transcript = ""
62
+ for entry in transcript:
63
+ line = f"时间: {entry['start']} 秒, 持续: {entry['duration']} 秒, 文本: {entry['text']}\n"
64
+ formatted_transcript += line
65
 
66
  # 确保返回与 UI 组件预期匹配的输出
67
  return questions[0] if len(questions) > 0 else "", \
68
  questions[1] if len(questions) > 1 else "", \
69
  questions[2] if len(questions) > 2 else "", \
70
  df_summarise, \
71
+ formatted_transcript
72
 
73
  def process_web_link(link):
74
  # 抓取和解析网页内容