Spaces:

sob111
/

xtts-castellano

Runtime error

sob111 committed on Sep 4

Commit

9930087

verified ·

1 Parent(s): 9a2564d

Update finetune_xtts_hf.py

Files changed (1) hide show

finetune_xtts_hf.py CHANGED Viewed

@@ -19,15 +19,21 @@ print("=== Descargando dataset sob111/voxpopuli_es_500 ===")
 ds = load_dataset("sob111/voxpopuli_es_500", split="train", token=HF_TOKEN)
 # Guardar metadata.json en el formato esperado por Coqui TTS
-os.makedirs("/tmp/voxpopuli_es_500", exist_ok=True)
 meta_file = "/tmp/voxpopuli_es_500/metadata.json"
 with open(meta_file, "w", encoding="utf-8") as f:
-    for sample in ds:
         entry = {
-            "audio_file": sample["audio_file"],
-            "text": sample["text"],
-            "speaker_name": sample.get("speaker_name", "speaker")
         }
         f.write(json.dumps(entry, ensure_ascii=False) + "\n")

 ds = load_dataset("sob111/voxpopuli_es_500", split="train", token=HF_TOKEN)
 # Guardar metadata.json en el formato esperado por Coqui TTS
+os.makedirs("/tmp/voxpopuli_es_500/wav_data", exist_ok=True)
 meta_file = "/tmp/voxpopuli_es_500/metadata.json"
 with open(meta_file, "w", encoding="utf-8") as f:
+    for i, sample in enumerate(ds):
+        # Guardar cada audio en wav_data
+        audio_path = f"/tmp/voxpopuli_es_500/wav_data/sample_{i}.wav"
+        array = sample["audio"]["array"]
+        import soundfile as sf
+        sf.write(audio_path, array, sample["audio"]["sampling_rate"])
         entry = {
+            "audio_file": audio_path,
+            "text": sample.get("text") or sample.get("sentence", ""),
+            "speaker_name": str(sample.get("speaker_id", "speaker"))
         }
         f.write(json.dumps(entry, ensure_ascii=False) + "\n")