Spaces:

VladRet2026
/

ConvertAudioToJSON

Sleeping

App Files Files

VladGeekPro Copilot committed 15 days ago

Commit

392dfe4

1 Parent(s): f856ebd

addedDebugForTesting

Browse files

Co-authored-by: Copilot <copilot@github.com>

Files changed (1) hide show

app.py +19 -0

app.py CHANGED Viewed

@@ -374,6 +374,8 @@ class ExpenseTextExtractor:
         t0 = time.time()
         date_info = self.date_extractor.extract(text, reference_date=reference_date, debug=debug)
         timings["date_extractor"] = round(time.time() - t0, 3)
         t0 = time.time()
         supplier_info = self.supplier_extractor.extract(
@@ -382,6 +384,8 @@ class ExpenseTextExtractor:
             debug=debug,
         )
         timings["supplier_extractor"] = round(time.time() - t0, 3)
         t0 = time.time()
         user_info = self.user_extractor.extract(
@@ -391,6 +395,8 @@ class ExpenseTextExtractor:
             debug=debug,
         )
         timings["user_extractor"] = round(time.time() - t0, 3)
         t0 = time.time()
         amount_info = self.amount_extractor.extract(
@@ -400,6 +406,8 @@ class ExpenseTextExtractor:
             debug=debug,
         )
         timings["amount_extractor"] = round(time.time() - t0, 3)
         if debug:
             print(f"[TIMINGS] {timings}")
@@ -506,6 +514,13 @@ def process_voice_request(audio_path: str, mode: str, payload: dict[str, Any], d
     user_names = extract_names(context.get("users"))
     transcript, whisper_time = transcribe_audio_text(audio_path)
     if mode == "notes":
         notes = polish_notes_text(transcript)
@@ -531,6 +546,8 @@ def process_voice_request(audio_path: str, mode: str, payload: dict[str, Any], d
     print(f"[TIMINGS] pipeline_init: {pipeline_init_time}s")
     extracted = extractor.extract(transcript, reference_date=date.today().isoformat(), debug=debug)
     total_time = round(time.time() - total_start, 3)
     print(f"[TIMINGS] TOTAL: {total_time}s (whisper: {whisper_time}s)")
@@ -546,6 +563,8 @@ def process_voice_request(audio_path: str, mode: str, payload: dict[str, Any], d
     }
     if debug and extracted.get("debug"):
         payload["debug"] = extracted.get("debug")
     return payload

         t0 = time.time()
         date_info = self.date_extractor.extract(text, reference_date=reference_date, debug=debug)
         timings["date_extractor"] = round(time.time() - t0, 3)
+        if debug:
+            print(f"[DEBUG][DATE] {date_info}")
         t0 = time.time()
         supplier_info = self.supplier_extractor.extract(
             debug=debug,
         )
         timings["supplier_extractor"] = round(time.time() - t0, 3)
+        if debug:
+            print(f"[DEBUG][SUPPLIER] {supplier_info}")
         t0 = time.time()
         user_info = self.user_extractor.extract(
             debug=debug,
         )
         timings["user_extractor"] = round(time.time() - t0, 3)
+        if debug:
+            print(f"[DEBUG][USER] {user_info}")
         t0 = time.time()
         amount_info = self.amount_extractor.extract(
             debug=debug,
         )
         timings["amount_extractor"] = round(time.time() - t0, 3)
+        if debug:
+            print(f"[DEBUG][AMOUNT] {amount_info}")
         if debug:
             print(f"[TIMINGS] {timings}")
     user_names = extract_names(context.get("users"))
     transcript, whisper_time = transcribe_audio_text(audio_path)
+    if debug:
+        print(f"[DEBUG][TRANSCRIPT] {transcript}")
+        print(
+            f"[DEBUG][CONTEXT] suppliers_count={len(supplier_names)}, users_count={len(user_names)}"
+        )
+        print(f"[DEBUG][SUPPLIERS] {supplier_names}")
+        print(f"[DEBUG][USERS] {user_names}")
     if mode == "notes":
         notes = polish_notes_text(transcript)
     print(f"[TIMINGS] pipeline_init: {pipeline_init_time}s")
     extracted = extractor.extract(transcript, reference_date=date.today().isoformat(), debug=debug)
+    if debug:
+        print(f"[DEBUG][EXTRACTED_RAW] {extracted}")
     total_time = round(time.time() - total_start, 3)
     print(f"[TIMINGS] TOTAL: {total_time}s (whisper: {whisper_time}s)")
     }
     if debug and extracted.get("debug"):
         payload["debug"] = extracted.get("debug")
+    if debug:
+        print(f"[DEBUG][RESPONSE_PAYLOAD] {payload}")
     return payload