Spaces:

bstraehle
/

grady

Running

bstraehle committed on May 2

Commit

ad1b760

verified ·

1 Parent(s): e604944

Update crew.py

Files changed (1) hide show

crew.py CHANGED Viewed

@@ -15,10 +15,11 @@ from util import get_final_answer, get_img_b64
 ## LLMs
 MANAGER_MODEL      = "gpt-4.1"
-AGENT_MODEL        = "gpt-4.1"
 FINAL_ANSWER_MODEL = "gpt-4.5-preview"
 AUDIO_MODEL        = "gpt-4o-transcribe"
 IMAGE_MODEL        = "gpt-4.1"
 # LLM evaluation
@@ -115,23 +116,35 @@ def run_crew(question, file_path):
                FileNotFoundError: If the video file does not exist
                RuntimeError: If processing fails"""
         if not os.path.exists(file_path):
-            raise FileNotFoundError(f"Image file not found: {file_path}")
-        try:
-            img_b64 = get_img_b64(file_path)
-            client = OpenAI()
-            completion = client.chat.completions.create(
-                messages=[{"role": "user",
-                           "content": [{"type": "text", "text": question},
-                                       {"type": "image_url", "image_url": {"url": f"data:image/jpeg;base64,{img_b64}"}}]}],
-                model=IMAGE_MODEL
             )
-            return completion.choices[0].message.content
         except Exception as e:
-            raise RuntimeError(f"Failed to process image: {str(e)}")
     # Built-in tools

 ## LLMs
 MANAGER_MODEL      = "gpt-4.1"
+AGENT_MODEL        = "gpt-4.1-mini"
 FINAL_ANSWER_MODEL = "gpt-4.5-preview"
 AUDIO_MODEL        = "gpt-4o-transcribe"
 IMAGE_MODEL        = "gpt-4.1"
+VIDEO_MODEL        = "gpt-4.1-mini"
 # LLM evaluation
                FileNotFoundError: If the video file does not exist
                RuntimeError: If processing fails"""
         if not os.path.exists(file_path):
+            raise FileNotFoundError(f"Video file not found: {file_path}")
+        try:
+            video = cv2.VideoCapture(file_path)
+            base64Frames = []
+            while video.isOpened():
+                success, frame = video.read()
+                if not success:
+                    break
+                _, buffer = cv2.imencode(".jpg", frame)
+                base64Frames.append(base64.b64encode(buffer).decode("utf-8"))
+            video.release()
+            response = client.responses.create(
+                input=[{"role": "user",
+                        "content": [{"type": "input_text", "text": (question)},
+                                    *[{"type": "input_image", "image_url": f"data:image/jpeg;base64,{frame}"} for frame in base64Frames]]}],
+                model=VIDEO_MODEL
             )
+            return response.output_text
         except Exception as e:
+            raise RuntimeError(f"Failed to process video: {str(e)}")
     # Built-in tools