Spaces:

Jessiesj
/

5240_assignment

Sleeping

App Files Files Community

Jessiesj committed on 8 days ago

Commit

ebe1fd7

verified ·

1 Parent(s): cb06615

Update app.py

Browse files

Files changed (1) hide show

app.py +20 -21

app.py CHANGED Viewed

@@ -3,24 +3,24 @@ from transformers import pipeline
 # function part
 # img2text
-# def img2text(url):
-#     image_to_text_model = pipeline("image-to-text", model="Salesforce/blip-image-captioning-base")
-#     text = image_to_text_model(url)[0]["generated_text"]
-#     return text
-# # text2story
-# def text2story(text):
-#     text_to_story = pipeline("text-generation", model="isarth/distill_gpt2_story_generator",
-#                             max_length=300,  # 增加最大生成长度
-#                             min_length=100,  # 设置最小生成长度
-#                             do_sample=True,  # 启用随机采样
-#                             temperature=0.9,  # 控制随机性（0-1，越大越随机）
-#                             top_k=50,  # 限制候选词数量
-#                             top_p=0.95,  # 核采样参数
-#                             repetition_penalty=1.2)
-#     # story_text = ""   # to be completed
-#     story_text = text_to_story(text)[0]["generated_text"]
-#     return story_text
 # text2audio
 def text2audio(story_text):
@@ -43,13 +43,12 @@ if uploaded_file is not None:
     #Stage 1: Image to Text
     st.text('Processing img2text...')
-    # scenario = img2text(uploaded_file.name)
-    # st.write(scenario)
     #Stage 2: Text to Story
     st.text('Generating a story...')
-    # story = text2story(scenario)
-    story = "children playing in the park illustration and making fun of other characters."
     st.write(story)
     #Stage 3: Story to Audio data

 # function part
 # img2text
+def img2text(url):  # Run an image-captioning pipeline on `url` and return the generated caption text.
+    image_to_text_model = pipeline("image-to-text", model="Salesforce/blip-image-captioning-base")  # pipeline is constructed on every call
+    text = image_to_text_model(url)[0]["generated_text"]  # keep only the first result's "generated_text" field
+    return text  # NOTE(review): the caller passes uploaded_file.name -- confirm that name resolves to a readable image path
+# text2story
+def text2story(text):  # Generate a story from the prompt `text` and return the generated string.
+    text_to_story = pipeline("text-generation", model="isarth/distill_gpt2_story_generator",  # constructed on every call; generation settings are supplied here
+                            max_length=300,  # raise the maximum generation length
+                            min_length=100,  # set the minimum generation length
+                            do_sample=True,  # enable random sampling
+                            temperature=0.9,  # controls randomness (0-1; higher is more random)
+                            top_k=50,  # limit the number of candidate tokens
+                            top_p=0.95,  # nucleus sampling parameter
+                            repetition_penalty=1.2)
+    # story_text = ""   # to be completed
+    story_text = text_to_story(text)[0]["generated_text"]  # keep only the first result's "generated_text" field
+    return story_text
 # text2audio
 def text2audio(story_text):
     #Stage 1: Image to Text
     st.text('Processing img2text...')
+    scenario = img2text(uploaded_file.name)
+    st.write(scenario)
     #Stage 2: Text to Story
     st.text('Generating a story...')
+    story = text2story(scenario)
     st.write(story)
     #Stage 3: Story to Audio data