import os
from typing import IO, Union
from modules.speaker import Speaker, speaker_mgr
import subprocess


def get_datasets_dir():
    """
    List the ``data_*`` sub-directories of ``./datasets``.

    The lookup is relative to the current working directory.

    Returns:
        A sorted list of directory names (names only, not full paths) that
        start with ``data_``. Plain files are skipped. An empty list is
        returned when ``./datasets`` does not exist or is not a directory.
    """
    dataset_path = "./datasets"
    try:
        entries = os.listdir(dataset_path)
    except (FileNotFoundError, NotADirectoryError):
        # No datasets folder simply means there is nothing to list.
        return []
    # os.listdir yields entries in arbitrary order; sort so the result is
    # stable from one call to the next.
    return sorted(
        name
        for name in entries
        if name.startswith("data_")
        and os.path.isdir(os.path.join(dataset_path, name))
    )


def get_datasets_listfile():
    """
    Collect the ``.list`` files found directly inside each dataset folder.

    Dataset folders are the names returned by ``get_datasets_dir()``; each
    one is looked up under ``./datasets``. Sub-folders are not searched.

    Returns:
        A list of paths of the form ``./datasets/<dataset>/<file>.list``.
    """
    found = []
    for dataset_name in get_datasets_dir():
        dataset_dir = os.path.join("./datasets", dataset_name)
        # Keep only entries whose name ends with the ".list" suffix.
        found.extend(
            os.path.join(dataset_dir, entry)
            for entry in os.listdir(dataset_dir)
            if entry.endswith(".list")
        )
    return found


def run_speaker_ft(
    batch_size: int, epochs: int, train_text: bool, data_path: str, init_speaker: str
) -> subprocess.Popen:
    """
    Launch ``modules.finetune.train_speaker`` as a child process.

    Args:
        batch_size: Forwarded as ``--batch_size=<value>``.
        epochs: Forwarded as ``--epochs=<value>``.
        train_text: When truthy, the ``--train_text`` flag is added.
        data_path: Forwarded as ``--data_path=<value>``.
        init_speaker: Forwarded as ``--init_speaker=<value>``; the option is
            omitted when this is empty/falsy.

    Returns:
        The started ``subprocess.Popen`` object. stdout and stderr are
        separate text-mode, line-buffered pipes. This function neither reads
        them nor waits for the process; that is left to the caller.
    """
    import sys

    # Run the module with the same interpreter that is executing this code,
    # so the child sees the same environment/site-packages. A bare "python3"
    # is resolved through PATH and may be a different interpreter or missing.
    # Keep "python3" as a fallback for when sys.executable is unavailable.
    python_bin = sys.executable or "python3"

    command = [
        python_bin,
        "-m",
        "modules.finetune.train_speaker",
        f"--batch_size={batch_size}",
        f"--epochs={epochs}",
        f"--data_path={data_path}",
    ]
    if train_text:
        command.append("--train_text")
    if init_speaker:
        command.append(f"--init_speaker={init_speaker}")

    return subprocess.Popen(
        command,
        stdout=subprocess.PIPE,
        stderr=subprocess.PIPE,
        text=True,
        bufsize=1,
    )