LYL1015 committed
Commit dd404b8 · verified · 1 Parent(s): 8db59b8

Update app.py

Files changed (1)
  1. app.py +11 -4
app.py CHANGED
@@ -546,15 +546,22 @@ def process_image_analysis_stream(image_dict, user_prompt, max_new_tokens, top_k
 
     # Check the image input
     if image_dict is None or image_dict.get('image') is None:
-        yield [["请先上传图片!", "我需要图片才能进行分析。"]], None
+        yield [[{"role": "user", "content": "请先上传图片!"}, {"role": "assistant", "content": "我需要图片才能进行分析。"}]], None
         return
 
     # Process the image
     image = image_dict['image']
     if not isinstance(image, str):
         import tempfile
+        from PIL import Image as PILImage
         temp_path = os.path.join(tempfile.gettempdir(), f"temp_image_{hash(str(image))}.png")
-        image.save(temp_path)
+        # Convert a numpy array to a PIL Image before saving
+        if hasattr(image, 'shape'):  # numpy array
+            pil_img = PILImage.fromarray(image)
+            pil_img.save(temp_path)
+        else:
+            # Already a PIL Image
+            image.save(temp_path)
         image = temp_path
 
     # Process the prompt
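For reference, this first hunk fixes the case where the Gradio image component hands back a numpy array, which has no .save() method. Below is a minimal standalone sketch of that logic; the helper name save_image_to_temp is illustrative and does not exist in app.py:

    import os
    import tempfile

    import numpy as np
    from PIL import Image as PILImage

    def save_image_to_temp(image):
        # Accept a file path, a PIL Image, or a numpy array and return a path on disk.
        if isinstance(image, str):
            return image
        temp_path = os.path.join(tempfile.gettempdir(), f"temp_image_{hash(str(image))}.png")
        if hasattr(image, 'shape'):       # numpy arrays expose .shape, PIL Images do not
            PILImage.fromarray(image).save(temp_path)
        else:
            image.save(temp_path)         # assume it is already a PIL Image
        return temp_path

    # Gradio image components commonly return a uint8 HxWx3 array
    print(save_image_to_temp(np.zeros((64, 64, 3), dtype=np.uint8)))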
@@ -631,14 +638,14 @@ def process_image_analysis_stream(image_dict, user_prompt, max_new_tokens, top_k
     thread.start()
 
     # Initialize the chat history
-    chat_history = [[user_prompt, ""]]
+    chat_history = [[{"role": "user", "content": user_prompt}, {"role": "assistant", "content": ""}]]
     yield chat_history, None
 
     # Receive the streamed output; follows the bot function in mm_qwen2vl.py
     full_response = ""
     for new_token in streamer:
         full_response += new_token
-        chat_history[-1][1] = full_response
+        chat_history[-1][1]["content"] = full_response
         yield chat_history, None
 
     # File generation after processing completes
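The second hunk keeps the same streaming loop but changes each history entry from a plain [user, assistant] string pair to a pair of {"role", "content"} dicts, so the loop rewrites the assistant dict's "content" on every token. A self-contained sketch of that update pattern, with illustrative helper names not taken from app.py:

    def make_history(user_prompt):
        # One entry per turn: a [user, assistant] pair of role/content dicts.
        return [[{"role": "user", "content": user_prompt},
                 {"role": "assistant", "content": ""}]]

    def stream_into_history(chat_history, streamer):
        # Mirrors the loop in process_image_analysis_stream: accumulate tokens and
        # rewrite the assistant "content" of the last pair on every step.
        full_response = ""
        for new_token in streamer:
            full_response += new_token
            chat_history[-1][1]["content"] = full_response
            yield chat_history

    history = make_history("描述这张图片")
    for snapshot in stream_into_history(history, iter(["这是", "一张", "测试图片。"])):
        pass
    print(history[-1][1]["content"])  # -> 这是一张测试图片。

Whether gradio.Chatbot renders this nested pair-of-dicts structure directly depends on how the component is configured elsewhere in app.py, which this diff does not show.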
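The loop above consumes a streamer that is created before thread.start(), outside this diff. Below is a hedged sketch of the usual transformers thread-plus-TextIteratorStreamer pattern it implies; the model id and generation arguments are placeholders, not the ones used in app.py:

    from threading import Thread
    from transformers import AutoModelForCausalLM, AutoTokenizer, TextIteratorStreamer

    model_id = "Qwen/Qwen2.5-0.5B-Instruct"      # placeholder; app.py loads its own model
    tokenizer = AutoTokenizer.from_pretrained(model_id)
    model = AutoModelForCausalLM.from_pretrained(model_id)

    inputs = tokenizer("描述这张图片", return_tensors="pt")
    streamer = TextIteratorStreamer(tokenizer, skip_prompt=True, skip_special_tokens=True)

    # generate() runs in a background thread and pushes decoded text into the streamer
    thread = Thread(target=model.generate,
                    kwargs=dict(**inputs, streamer=streamer, max_new_tokens=64))
    thread.start()

    full_response = ""
    for new_token in streamer:                   # yields text chunks as they are generated
        full_response += new_token
    thread.join()
    print(full_response)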