Spaces:
Running
on
Zero
Running
on
Zero
mrfakename
committed on
Sync from GitHub repo
Browse files
This Space is synced from the GitHub repo: https://github.com/SWivid/F5-TTS. Please submit contributions to the Space there.
src/f5_tts/infer/examples/basic/basic.toml
CHANGED
@@ -7,4 +7,5 @@ gen_text = "I don't really care what you call me. I've been a silent spectator,
|
|
7 |
# File with text to generate. Ignores the text above.
|
8 |
gen_file = ""
|
9 |
remove_silence = false
|
10 |
-
output_dir = "tests"
|
|
|
|
7 |
# File with text to generate. Ignores the text above.
|
8 |
gen_file = ""
|
9 |
remove_silence = false
|
10 |
+
output_dir = "tests"
|
11 |
+
output_file = "infer_cli_out.wav"
|
src/f5_tts/infer/infer_cli.py
CHANGED
@@ -57,7 +57,7 @@ parser.add_argument(
|
|
57 |
"-f",
|
58 |
"--gen_file",
|
59 |
type=str,
|
60 |
-
help="File with text to generate. Ignores --
|
61 |
)
|
62 |
parser.add_argument(
|
63 |
"-o",
|
@@ -65,6 +65,12 @@ parser.add_argument(
|
|
65 |
type=str,
|
66 |
help="Path to output folder..",
|
67 |
)
|
|
|
|
|
|
|
|
|
|
|
|
|
68 |
parser.add_argument(
|
69 |
"--remove_silence",
|
70 |
help="Remove silence.",
|
@@ -104,13 +110,14 @@ if "voices" in config:
|
|
104 |
if gen_file:
|
105 |
gen_text = codecs.open(gen_file, "r", "utf-8").read()
|
106 |
output_dir = args.output_dir if args.output_dir else config["output_dir"]
|
|
|
107 |
model = args.model if args.model else config["model"]
|
108 |
ckpt_file = args.ckpt_file if args.ckpt_file else ""
|
109 |
vocab_file = args.vocab_file if args.vocab_file else ""
|
110 |
remove_silence = args.remove_silence if args.remove_silence else config["remove_silence"]
|
111 |
speed = args.speed
|
112 |
|
113 |
-
wave_path = Path(output_dir) / "infer_cli_out.wav"
|
114 |
# spectrogram_path = Path(output_dir) / "infer_cli_out.png"
|
115 |
|
116 |
vocoder_name = args.vocoder_name
|
|
|
57 |
"-f",
|
58 |
"--gen_file",
|
59 |
type=str,
|
60 |
+
help="File with text to generate. Ignores --gen_text",
|
61 |
)
|
62 |
parser.add_argument(
|
63 |
"-o",
|
|
|
65 |
type=str,
|
66 |
help="Path to output folder..",
|
67 |
)
|
68 |
+
parser.add_argument(
|
69 |
+
"-w",
|
70 |
+
"--output_file",
|
71 |
+
type=str,
|
72 |
+
help="Filename of output file..",
|
73 |
+
)
|
74 |
parser.add_argument(
|
75 |
"--remove_silence",
|
76 |
help="Remove silence.",
|
|
|
110 |
if gen_file:
|
111 |
gen_text = codecs.open(gen_file, "r", "utf-8").read()
|
112 |
output_dir = args.output_dir if args.output_dir else config["output_dir"]
|
113 |
+
output_file = args.output_file if args.output_file else config["output_file"]
|
114 |
model = args.model if args.model else config["model"]
|
115 |
ckpt_file = args.ckpt_file if args.ckpt_file else ""
|
116 |
vocab_file = args.vocab_file if args.vocab_file else ""
|
117 |
remove_silence = args.remove_silence if args.remove_silence else config["remove_silence"]
|
118 |
speed = args.speed
|
119 |
|
120 |
+
wave_path = Path(output_dir) / output_file
|
121 |
# spectrogram_path = Path(output_dir) / "infer_cli_out.png"
|
122 |
|
123 |
vocoder_name = args.vocoder_name
|