Spaces:

rairo
/

NeoFix-API

Running

App Files Community

rairo committed on Jun 11, 2025

Commit

bd7ea2f

verified ·

1 Parent(s): b899d5b

Update main.py

Browse files

Files changed (1) hide show

main.py +20 -40

main.py CHANGED Viewed

@@ -564,10 +564,12 @@ def create_project():
         print(traceback.format_exc())
         return jsonify({'error': f"An error occurred: {e}"}), 500
 @app.route('/api/projects/<string:project_id>/approve', methods=['PUT'])
 def approve_project_plan(project_id):
     uid = verify_token(request.headers.get('Authorization'))
-    if not uid: return jsonify({'error': 'Unauthorized'}), 401
     project_ref = db_ref.child(f'projects/{project_id}')
     project_data = project_ref.get()
@@ -575,19 +577,14 @@ def approve_project_plan(project_id):
         return jsonify({'error': 'Project not found or access denied'}), 404
     selected_option = request.json.get('selectedOption')
-    # 1) Download & compress the user’s image before sending it off to Gemini
     response = requests.get(project_data['userImageURL'])
-    pil_image = Image.open(io.BytesIO(response.content)).convert("RGB")
-    pil_image.thumbnail((1024, 1024))  # max‐side 1024px
-    buf = io.BytesIO()
-    pil_image.save(buf, format='JPEG', quality=75, optimize=True)
-    buf.seek(0)
-    compressed_image = Image.open(buf)
-    context = (f"The user chose the upcycling project: '{selected_option}'."
-               if selected_option
-               else f"The user has approved the plan for '{project_data['projectTitle']}'.")
     detailed_prompt = f"""
     You are a DIY expert. The user wants to proceed with the project titled "{project_data['projectTitle']}".
@@ -609,26 +606,24 @@ def approve_project_plan(project_id):
             model=GENERATION_MODEL,
             config=types.GenerateContentConfig(response_modalities=["Text", "Image"])
         )
-        full_resp = chat.send_message([detailed_prompt, compressed_image])
         gen_parts = full_resp.candidates[0].content.parts
         combined_text = ""
         inline_images = []
         for part in gen_parts:
-            if part.text:
                 combined_text += part.text + "\n"
-            if part.inline_data:
-                img = Image.open(BytesIO(part.inline_data.data)).convert("RGB")
-                # 2) Immediately downscale each AI‐generated image
-                img.thumbnail((800, 800))
                 inline_images.append(img)
         combined_text = combined_text.strip()
-        # parse out tools + steps
         tools_section = re.search(r"TOOLS AND MATERIALS:\s*(.*?)\s*STEPS:", combined_text, re.DOTALL).group(1).strip()
         steps_section = re.search(r"STEPS:\s*(.*)", combined_text, re.DOTALL).group(1).strip()
-        tools_list = [line.strip('- ').strip() for line in tools_section.splitlines() if line.strip()]
         parsed_steps = parse_numbered_steps(steps_section)
         if len(parsed_steps) != len(inline_images):
@@ -636,28 +631,12 @@ def approve_project_plan(project_id):
         final_steps = []
         for i, step_info in enumerate(parsed_steps):
-            # 3) Save JPEG at 70% quality
             img_byte_arr = io.BytesIO()
-            inline_images[i].save(
-                img_byte_arr,
-                format='JPEG',
-                quality=70,
-                optimize=True
-            )
             img_path = f"users/{uid}/projects/{project_id}/steps/step_{i+1}_image.jpg"
             img_url = upload_to_storage(img_byte_arr.getvalue(), img_path, 'image/jpeg')
-            # 4) Generate and compress TTS audio to mp3 @ 64kbps
-            raw_audio = generate_tts_audio(step_info['text'])  # returns raw bytes
-            from pydub import AudioSegment
-            sound = AudioSegment.from_file(io.BytesIO(raw_audio), format="wav")
-            mp3_buf = io.BytesIO()
-            sound.export(mp3_buf, format="mp3", bitrate="64k")
-            mp3_buf.seek(0)
-            narration_url = upload_to_storage(mp3_buf.read(),
-                                              f"users/{uid}/projects/{project_id}/steps/step_{i+1}_tts.mp3",
-                                              'audio/mpeg')
             step_info.update({
                 "imageUrl": img_url,
                 "narrationUrl": narration_url,
@@ -673,6 +652,7 @@ def approve_project_plan(project_id):
             "selectedOption": selected_option or ""
         }
         project_ref.update(update_data)
         return jsonify({"success": True, **update_data})
     except Exception as e:

         print(traceback.format_exc())
         return jsonify({'error': f"An error occurred: {e}"}), 500
 @app.route('/api/projects/<string:project_id>/approve', methods=['PUT'])
 def approve_project_plan(project_id):
     uid = verify_token(request.headers.get('Authorization'))
+    if not uid:
+        return jsonify({'error': 'Unauthorized'}), 401
     project_ref = db_ref.child(f'projects/{project_id}')
     project_data = project_ref.get()
         return jsonify({'error': 'Project not found or access denied'}), 404
     selected_option = request.json.get('selectedOption')
     response = requests.get(project_data['userImageURL'])
+    pil_image = Image.open(io.BytesIO(response.content)).convert('RGB')
+    context = (
+        f"The user chose the upcycling project: '{selected_option}'."
+        if selected_option
+        else f"The user has approved the plan for '{project_data['projectTitle']}'."
+    )
     detailed_prompt = f"""
     You are a DIY expert. The user wants to proceed with the project titled "{project_data['projectTitle']}".
             model=GENERATION_MODEL,
             config=types.GenerateContentConfig(response_modalities=["Text", "Image"])
         )
+        full_resp = chat.send_message([detailed_prompt, pil_image])
         gen_parts = full_resp.candidates[0].content.parts
         combined_text = ""
         inline_images = []
         for part in gen_parts:
+            if part.text is not None:
                 combined_text += part.text + "\n"
+            if part.inline_data is not None:
+                img = Image.open(io.BytesIO(part.inline_data.data)).convert('RGB')
                 inline_images.append(img)
         combined_text = combined_text.strip()
         tools_section = re.search(r"TOOLS AND MATERIALS:\s*(.*?)\s*STEPS:", combined_text, re.DOTALL).group(1).strip()
         steps_section = re.search(r"STEPS:\s*(.*)", combined_text, re.DOTALL).group(1).strip()
+        tools_list = [line.strip("- ").strip() for line in tools_section.split('\n') if line.strip()]
         parsed_steps = parse_numbered_steps(steps_section)
         if len(parsed_steps) != len(inline_images):
         final_steps = []
         for i, step_info in enumerate(parsed_steps):
             img_byte_arr = io.BytesIO()
+            inline_images[i].save(img_byte_arr, format='JPEG', optimize=True, quality=70)
             img_path = f"users/{uid}/projects/{project_id}/steps/step_{i+1}_image.jpg"
             img_url = upload_to_storage(img_byte_arr.getvalue(), img_path, 'image/jpeg')
+            narration_url = generate_tts_audio_and_upload(step_info['text'], uid, project_id, i + 1)
             step_info.update({
                 "imageUrl": img_url,
                 "narrationUrl": narration_url,
             "selectedOption": selected_option or ""
         }
         project_ref.update(update_data)
         return jsonify({"success": True, **update_data})
     except Exception as e: