Spaces:

sasan
/

KITT

Build error

App Files Community

sasan committed on May 23, 2024

Commit

cdb2b77

1 Parent(s): e3db752

Small updates

Browse files

Files changed (2) hide show

kitt/core/__init__.py +2 -2
main.py +20 -14

kitt/core/__init__.py CHANGED Viewed

@@ -101,7 +101,7 @@ def speed_from_text(voice):
             return v.speed
-def tts(
     self,
     text: str = "",
     language_name: str = "",
@@ -198,7 +198,7 @@ def tts_gradio(text, voice, cache):
     (gpt_cond_latent, speaker_embedding) = compute_speaker_embedding(
         voice_path, tts_pipeline.synthesizer.tts_config, tts_pipeline, cache
     )
-    out = tts(
         tts_pipeline.synthesizer,
         text,
         language_name="en",

             return v.speed
+def tts_xtts(
     self,
     text: str = "",
     language_name: str = "",
     (gpt_cond_latent, speaker_embedding) = compute_speaker_embedding(
         voice_path, tts_pipeline.synthesizer.tts_config, tts_pipeline, cache
     )
+    out = tts_xtts(
         tts_pipeline.synthesizer,
         text,
         language_name="en",

main.py CHANGED Viewed

@@ -40,7 +40,7 @@ from kitt.skills.routing import calculate_route, find_address
 ORIGIN = "Mondorf-les-Bains, Luxembourg"
 DESTINATION = "Rue Alphonse Weicker, Luxembourg"
-DEFAULT_LLM_BACKEND = "ollama"
 ENABLE_HISTORY = True
 ENABLE_TTS = True
 TTS_BACKEND = "local"
@@ -133,11 +133,11 @@ def search_along_route(query=""):
 def set_time(time_picker):
     vehicle.time = time_picker
-    return vehicle.model_dump_json()
 def get_vehicle_status(state):
-    return state.value["vehicle"].model_dump_json()
 tools = [
@@ -232,11 +232,16 @@ def run_llama3_model(query, voice_character, state):
     )
     gr.Info(f"Output text: {output_text}\nGenerating voice output...")
     voice_out = None
-    if state["tts_enabled"]:
-        # voice_out = run_tts_replicate(output_text, voice_character)
         # voice_out = run_tts_fast(output_text)[0]
-        voice_out = run_melo_tts(output_text, voice_character)
-        # voice_out = tts_gradio(output_text, voice_character, speaker_embedding_cache)[0]
     return (
         output_text,
         voice_out,
@@ -264,7 +269,7 @@ def run_model(query, voice_character, state):
     return (
         text,
         voice,
-        vehicle.model_dump_json(),
         state,
         dict(update_proxy=global_context["update_proxy"]),
     )
@@ -299,7 +304,8 @@ def update_vehicle_status(trip_progress, origin, destination, state):
     plot = kitt_utils.plot_route(
         global_context["route_points"], vehicle=vehicle.location_coordinates
     )
-    return vehicle.model_dump_json(), plot, state
 device = "cuda" if torch.cuda.is_available() else "cpu"
@@ -335,8 +341,8 @@ def save_and_transcribe_audio(audio):
         gr.Info(f"Transcribed text is: {text}\nProcessing the input...")
     except Exception as e:
-        print(f"Error: {e}")
-        return "Error transcribing audio."
     return text
@@ -447,6 +453,9 @@ def create_demo(tts_server: bool = False, model="llama3"):
         with gr.Row():
             with gr.Column(scale=1, min_width=300):
                 time_picker = gr.Dropdown(
                     choices=hour_options,
                     label="What time is it? (HH:MM)",
@@ -516,9 +525,6 @@ def create_demo(tts_server: bool = False, model="llama3"):
                         value=dict(update_proxy=0),
                         label="Global context",
                     )
-                vehicle_status = gr.JSON(
-                    value=vehicle.model_dump_json(), label="Vehicle status"
-                )
                 with gr.Accordion("Config"):
                     tts_enabled = gr.Radio(
                         ["Yes", "No"],

 ORIGIN = "Mondorf-les-Bains, Luxembourg"
 DESTINATION = "Rue Alphonse Weicker, Luxembourg"
+DEFAULT_LLM_BACKEND = "replicate"
 ENABLE_HISTORY = True
 ENABLE_TTS = True
 TTS_BACKEND = "local"
 def set_time(time_picker):
     vehicle.time = time_picker
+    return vehicle.model_dump_json(indent=2)
 def get_vehicle_status(state):
+    return state.value["vehicle"].model_dump_json(indent=2)
 tools = [
     )
     gr.Info(f"Output text: {output_text}\nGenerating voice output...")
     voice_out = None
+    if global_context["tts_enabled"]:
+        if "Fast" in voice_character:
+            voice_out = run_melo_tts(output_text, voice_character)
+        elif global_context["tts_backend"] == "replicate":
+            voice_out = run_tts_replicate(output_text, voice_character)
+        else:
+            voice_out = tts_gradio(output_text, voice_character, speaker_embedding_cache)[0]
+        #
         # voice_out = run_tts_fast(output_text)[0]
+        #
     return (
         output_text,
         voice_out,
     return (
         text,
         voice,
+        vehicle,
         state,
         dict(update_proxy=global_context["update_proxy"]),
     )
     plot = kitt_utils.plot_route(
         global_context["route_points"], vehicle=vehicle.location_coordinates
     )
+    return vehicle, plot, state
+    return vehicle.model_dump_json(indent=2), plot, state
 device = "cuda" if torch.cuda.is_available() else "cpu"
         gr.Info(f"Transcribed text is: {text}\nProcessing the input...")
     except Exception as e:
+        logger.error(f"Error: {e}")
+        raise Exception("Error transcribing audio.")
     return text
         with gr.Row():
             with gr.Column(scale=1, min_width=300):
+                vehicle_status = gr.JSON(
+                    value=vehicle.model_dump_json(indent=2), label="Vehicle status"
+                )
                 time_picker = gr.Dropdown(
                     choices=hour_options,
                     label="What time is it? (HH:MM)",
                         value=dict(update_proxy=0),
                         label="Global context",
                     )
                 with gr.Accordion("Config"):
                     tts_enabled = gr.Radio(
                         ["Yes", "No"],