kokuren
commited on
Commit
•
257871f
1
Parent(s):
14f4aae
Add all files including large files with Git LFS
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- RinneElu_RVCfree/RinneElu1_100ep.pth +3 -0
- RinneElu_TTSeng/RinEluEng.safetensors +3 -0
- RinneElu_TTSeng/config.json +107 -0
- RinneElu_TTSeng/style_vectors.npy +3 -0
- RinneElu_TTSfree/RinneElu_s05000.safetensors +3 -0
- RinneElu_TTSfree/config.json +121 -0
- RinneElu_TTSfree/style_vectors.npy +3 -0
- beatrice_v2/output/__main__.py +0 -0
- beatrice_v2/output/checkpoint_latest.pt +3 -0
- beatrice_v2/output/checkpoint_train_00000001.pt +3 -0
- beatrice_v2/output/checkpoint_train_00002000.pt +3 -0
- beatrice_v2/output/checkpoint_train_00004000.pt +3 -0
- beatrice_v2/output/checkpoint_train_00006000.pt +3 -0
- beatrice_v2/output/checkpoint_train_00008000.pt +3 -0
- beatrice_v2/output/checkpoint_train_00010000.pt +3 -0
- beatrice_v2/output/config.json +37 -0
- beatrice_v2/output/events.out.tfevents.1731006050.DESKTOP-PN4E7G1.14176.0 +3 -0
- beatrice_v2/output/paraphernalia_train_00000001/beatrice_paraphernalia_train_00000001.toml +20 -0
- beatrice_v2/output/paraphernalia_train_00000001/formant_shift_embeddings.bin +3 -0
- beatrice_v2/output/paraphernalia_train_00000001/noimage.png +0 -0
- beatrice_v2/output/paraphernalia_train_00000001/phone_extractor.bin +3 -0
- beatrice_v2/output/paraphernalia_train_00000001/pitch_estimator.bin +3 -0
- beatrice_v2/output/paraphernalia_train_00000001/speaker_embeddings.bin +3 -0
- beatrice_v2/output/paraphernalia_train_00000001/waveform_generator.bin +3 -0
- beatrice_v2/output/paraphernalia_train_00002000/beatrice_paraphernalia_train_00002000.toml +20 -0
- beatrice_v2/output/paraphernalia_train_00002000/formant_shift_embeddings.bin +3 -0
- beatrice_v2/output/paraphernalia_train_00002000/noimage.png +0 -0
- beatrice_v2/output/paraphernalia_train_00002000/phone_extractor.bin +3 -0
- beatrice_v2/output/paraphernalia_train_00002000/pitch_estimator.bin +3 -0
- beatrice_v2/output/paraphernalia_train_00002000/speaker_embeddings.bin +3 -0
- beatrice_v2/output/paraphernalia_train_00002000/waveform_generator.bin +3 -0
- beatrice_v2/output/paraphernalia_train_00004000/beatrice_paraphernalia_train_00004000.toml +20 -0
- beatrice_v2/output/paraphernalia_train_00004000/formant_shift_embeddings.bin +3 -0
- beatrice_v2/output/paraphernalia_train_00004000/noimage.png +0 -0
- beatrice_v2/output/paraphernalia_train_00004000/phone_extractor.bin +3 -0
- beatrice_v2/output/paraphernalia_train_00004000/pitch_estimator.bin +3 -0
- beatrice_v2/output/paraphernalia_train_00004000/speaker_embeddings.bin +3 -0
- beatrice_v2/output/paraphernalia_train_00004000/waveform_generator.bin +3 -0
- beatrice_v2/output/paraphernalia_train_00006000/beatrice_paraphernalia_train_00006000.toml +20 -0
- beatrice_v2/output/paraphernalia_train_00006000/formant_shift_embeddings.bin +3 -0
- beatrice_v2/output/paraphernalia_train_00006000/noimage.png +0 -0
- beatrice_v2/output/paraphernalia_train_00006000/phone_extractor.bin +3 -0
- beatrice_v2/output/paraphernalia_train_00006000/pitch_estimator.bin +3 -0
- beatrice_v2/output/paraphernalia_train_00006000/speaker_embeddings.bin +3 -0
- beatrice_v2/output/paraphernalia_train_00006000/waveform_generator.bin +3 -0
- beatrice_v2/output/paraphernalia_train_00008000/beatrice_paraphernalia_train_00008000.toml +20 -0
- beatrice_v2/output/paraphernalia_train_00008000/formant_shift_embeddings.bin +3 -0
- beatrice_v2/output/paraphernalia_train_00008000/noimage.png +0 -0
- beatrice_v2/output/paraphernalia_train_00008000/phone_extractor.bin +3 -0
- beatrice_v2/output/paraphernalia_train_00008000/pitch_estimator.bin +3 -0
RinneElu_RVCfree/RinneElu1_100ep.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8356b42c98e0dbe6522e3cbbfa8ce2dedc69da9aaae6856ff8fdc43255f6cd92
|
3 |
+
size 57578929
|
RinneElu_TTSeng/RinEluEng.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:26d2dbc00e096847b641b3a3d435cb5a1a8d12773250816602b1c86f5e44e827
|
3 |
+
size 198768188
|
RinneElu_TTSeng/config.json
ADDED
@@ -0,0 +1,107 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"model_name": "RinEluEng",
|
3 |
+
"train": {
|
4 |
+
"log_interval": 200,
|
5 |
+
"eval_interval": 1000,
|
6 |
+
"seed": 42,
|
7 |
+
"epochs": 100,
|
8 |
+
"learning_rate": 0.0002,
|
9 |
+
"betas": [
|
10 |
+
0.8,
|
11 |
+
0.99
|
12 |
+
],
|
13 |
+
"eps": 1e-09,
|
14 |
+
"batch_size": 4,
|
15 |
+
"bf16_run": false,
|
16 |
+
"lr_decay": 0.99995,
|
17 |
+
"segment_size": 16384,
|
18 |
+
"init_lr_ratio": 1,
|
19 |
+
"warmup_epochs": 0,
|
20 |
+
"c_mel": 45,
|
21 |
+
"c_kl": 1.0,
|
22 |
+
"skip_optimizer": false,
|
23 |
+
"freeze_ZH_bert": false,
|
24 |
+
"freeze_JP_bert": false,
|
25 |
+
"freeze_EN_bert": false,
|
26 |
+
"freeze_style": false,
|
27 |
+
"freeze_encoder": false,
|
28 |
+
"freeze_decoder": false
|
29 |
+
},
|
30 |
+
"data": {
|
31 |
+
"training_files": "Data/RinEluGrobal/train.list",
|
32 |
+
"validation_files": "Data/RinEluGrobal/val.list",
|
33 |
+
"max_wav_value": 32768.0,
|
34 |
+
"sampling_rate": 44100,
|
35 |
+
"filter_length": 2048,
|
36 |
+
"hop_length": 512,
|
37 |
+
"win_length": 2048,
|
38 |
+
"n_mel_channels": 128,
|
39 |
+
"mel_fmin": 0.0,
|
40 |
+
"mel_fmax": null,
|
41 |
+
"add_blank": true,
|
42 |
+
"n_speakers": 1,
|
43 |
+
"cleaned_text": true,
|
44 |
+
"num_styles": 1,
|
45 |
+
"style2id": {
|
46 |
+
"Neutral": 0
|
47 |
+
},
|
48 |
+
"spk2id": {
|
49 |
+
"RinEluGrobal": 0
|
50 |
+
}
|
51 |
+
},
|
52 |
+
"model": {
|
53 |
+
"use_spk_conditioned_encoder": true,
|
54 |
+
"use_noise_scaled_mas": true,
|
55 |
+
"use_mel_posterior_encoder": false,
|
56 |
+
"use_duration_discriminator": true,
|
57 |
+
"inter_channels": 192,
|
58 |
+
"hidden_channels": 192,
|
59 |
+
"filter_channels": 768,
|
60 |
+
"n_heads": 2,
|
61 |
+
"n_layers": 6,
|
62 |
+
"kernel_size": 3,
|
63 |
+
"p_dropout": 0.1,
|
64 |
+
"resblock": "1",
|
65 |
+
"resblock_kernel_sizes": [
|
66 |
+
3,
|
67 |
+
7,
|
68 |
+
11
|
69 |
+
],
|
70 |
+
"resblock_dilation_sizes": [
|
71 |
+
[
|
72 |
+
1,
|
73 |
+
3,
|
74 |
+
5
|
75 |
+
],
|
76 |
+
[
|
77 |
+
1,
|
78 |
+
3,
|
79 |
+
5
|
80 |
+
],
|
81 |
+
[
|
82 |
+
1,
|
83 |
+
3,
|
84 |
+
5
|
85 |
+
]
|
86 |
+
],
|
87 |
+
"upsample_rates": [
|
88 |
+
8,
|
89 |
+
8,
|
90 |
+
2,
|
91 |
+
2,
|
92 |
+
2
|
93 |
+
],
|
94 |
+
"upsample_initial_channel": 512,
|
95 |
+
"upsample_kernel_sizes": [
|
96 |
+
16,
|
97 |
+
16,
|
98 |
+
8,
|
99 |
+
2,
|
100 |
+
2
|
101 |
+
],
|
102 |
+
"n_layers_q": 3,
|
103 |
+
"use_spectral_norm": false,
|
104 |
+
"gin_channels": 256
|
105 |
+
},
|
106 |
+
"version": "2.3.1"
|
107 |
+
}
|
RinneElu_TTSeng/style_vectors.npy
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1b44d17806f96fd790e7b18066339cf0d2db5b6f268566d9edce684081ab297d
|
3 |
+
size 1152
|
RinneElu_TTSfree/RinneElu_s05000.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b2a2bd121ba3e01006ddeaba66c9230fb28a63ef891f5209faf7be5fb35eebb7
|
3 |
+
size 251150980
|
RinneElu_TTSfree/config.json
ADDED
@@ -0,0 +1,121 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"train": {
|
3 |
+
"log_interval": 200,
|
4 |
+
"eval_interval": 1000,
|
5 |
+
"seed": 42,
|
6 |
+
"epochs": 300,
|
7 |
+
"learning_rate": 0.0001,
|
8 |
+
"betas": [
|
9 |
+
0.8,
|
10 |
+
0.99
|
11 |
+
],
|
12 |
+
"eps": 1e-09,
|
13 |
+
"batch_size": 4,
|
14 |
+
"bf16_run": true,
|
15 |
+
"fp16_run": false,
|
16 |
+
"lr_decay": 0.99996,
|
17 |
+
"segment_size": 16384,
|
18 |
+
"init_lr_ratio": 1,
|
19 |
+
"warmup_epochs": 0,
|
20 |
+
"c_mel": 45,
|
21 |
+
"c_kl": 1.0,
|
22 |
+
"c_commit": 100,
|
23 |
+
"skip_optimizer": true,
|
24 |
+
"freeze_ZH_bert": false,
|
25 |
+
"freeze_JP_bert": false,
|
26 |
+
"freeze_EN_bert": false,
|
27 |
+
"freeze_emo": false,
|
28 |
+
"freeze_style": false
|
29 |
+
},
|
30 |
+
"data": {
|
31 |
+
"use_jp_extra": true,
|
32 |
+
"training_files": "Data/RinneElu/train.list",
|
33 |
+
"validation_files": "Data/RinneElu/val.list",
|
34 |
+
"max_wav_value": 32768.0,
|
35 |
+
"sampling_rate": 44100,
|
36 |
+
"filter_length": 2048,
|
37 |
+
"hop_length": 512,
|
38 |
+
"win_length": 2048,
|
39 |
+
"n_mel_channels": 128,
|
40 |
+
"mel_fmin": 0.0,
|
41 |
+
"mel_fmax": null,
|
42 |
+
"add_blank": true,
|
43 |
+
"n_speakers": 1,
|
44 |
+
"cleaned_text": true,
|
45 |
+
"spk2id": {
|
46 |
+
"RinneElu": 0
|
47 |
+
},
|
48 |
+
"num_styles": 5,
|
49 |
+
"style2id": {
|
50 |
+
"Neutral": 0,
|
51 |
+
"Angry": 1,
|
52 |
+
"Fear": 2,
|
53 |
+
"Happy": 3,
|
54 |
+
"Sad": 4
|
55 |
+
}
|
56 |
+
},
|
57 |
+
"model": {
|
58 |
+
"use_spk_conditioned_encoder": true,
|
59 |
+
"use_noise_scaled_mas": true,
|
60 |
+
"use_mel_posterior_encoder": false,
|
61 |
+
"use_duration_discriminator": false,
|
62 |
+
"use_wavlm_discriminator": true,
|
63 |
+
"inter_channels": 192,
|
64 |
+
"hidden_channels": 192,
|
65 |
+
"filter_channels": 768,
|
66 |
+
"n_heads": 2,
|
67 |
+
"n_layers": 6,
|
68 |
+
"kernel_size": 3,
|
69 |
+
"p_dropout": 0.1,
|
70 |
+
"resblock": "1",
|
71 |
+
"resblock_kernel_sizes": [
|
72 |
+
3,
|
73 |
+
7,
|
74 |
+
11
|
75 |
+
],
|
76 |
+
"resblock_dilation_sizes": [
|
77 |
+
[
|
78 |
+
1,
|
79 |
+
3,
|
80 |
+
5
|
81 |
+
],
|
82 |
+
[
|
83 |
+
1,
|
84 |
+
3,
|
85 |
+
5
|
86 |
+
],
|
87 |
+
[
|
88 |
+
1,
|
89 |
+
3,
|
90 |
+
5
|
91 |
+
]
|
92 |
+
],
|
93 |
+
"upsample_rates": [
|
94 |
+
8,
|
95 |
+
8,
|
96 |
+
2,
|
97 |
+
2,
|
98 |
+
2
|
99 |
+
],
|
100 |
+
"upsample_initial_channel": 512,
|
101 |
+
"upsample_kernel_sizes": [
|
102 |
+
16,
|
103 |
+
16,
|
104 |
+
8,
|
105 |
+
2,
|
106 |
+
2
|
107 |
+
],
|
108 |
+
"n_layers_q": 3,
|
109 |
+
"use_spectral_norm": false,
|
110 |
+
"gin_channels": 512,
|
111 |
+
"slm": {
|
112 |
+
"model": "./slm/wavlm-base-plus",
|
113 |
+
"sr": 16000,
|
114 |
+
"hidden": 768,
|
115 |
+
"nlayers": 13,
|
116 |
+
"initial_channel": 64
|
117 |
+
}
|
118 |
+
},
|
119 |
+
"version": "2.0-JP-Extra",
|
120 |
+
"model_name": "RinneElu"
|
121 |
+
}
|
RinneElu_TTSfree/style_vectors.npy
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b5ee09560ae39c8594bd0391c61d24e13221fdcc529fca725f03805677997685
|
3 |
+
size 5248
|
beatrice_v2/output/__main__.py
ADDED
The diff for this file is too large to render.
See raw diff
|
|
beatrice_v2/output/checkpoint_latest.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:338dad341a9c9ae05b1248468d3cbe7e5a16eb446b538288823330eedf40eda3
|
3 |
+
size 588692604
|
beatrice_v2/output/checkpoint_train_00000001.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:53b39e36627c692cad24f0cb54efe2cff73e0f1cb53138e26f69206dbd4845bd
|
3 |
+
size 588692604
|
beatrice_v2/output/checkpoint_train_00002000.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f0c1da60f40aa429a989b52914184f90609784c03c9dfb7b5687ee825731f4c5
|
3 |
+
size 588692604
|
beatrice_v2/output/checkpoint_train_00004000.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:30c0af1d179879aaf97e82cb0e42767698ff35d6a7e4d03cd6a1cc8aad018891
|
3 |
+
size 588692604
|
beatrice_v2/output/checkpoint_train_00006000.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:01f8aa815a325445c5e789167f43201315dfdeeb4e525d70ce316d320287943c
|
3 |
+
size 588692604
|
beatrice_v2/output/checkpoint_train_00008000.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f229a42115121a3191771f4a69a96736a926f4d5503f0824732f705e07701970
|
3 |
+
size 588692604
|
beatrice_v2/output/checkpoint_train_00010000.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:338dad341a9c9ae05b1248468d3cbe7e5a16eb446b538288823330eedf40eda3
|
3 |
+
size 588692604
|
beatrice_v2/output/config.json
ADDED
@@ -0,0 +1,37 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"learning_rate_g": 0.0002,
|
3 |
+
"learning_rate_d": 0.0001,
|
4 |
+
"min_learning_rate_g": 1e-05,
|
5 |
+
"min_learning_rate_d": 5e-06,
|
6 |
+
"adam_betas": [
|
7 |
+
0.8,
|
8 |
+
0.99
|
9 |
+
],
|
10 |
+
"adam_eps": 1e-06,
|
11 |
+
"batch_size": 8,
|
12 |
+
"grad_weight_mel": 1.0,
|
13 |
+
"grad_weight_ap": 2.0,
|
14 |
+
"grad_weight_adv": 3.0,
|
15 |
+
"grad_weight_fm": 3.0,
|
16 |
+
"grad_balancer_ema_decay": 0.995,
|
17 |
+
"use_amp": true,
|
18 |
+
"num_workers": 16,
|
19 |
+
"n_steps": 10000,
|
20 |
+
"warmup_steps": 2000,
|
21 |
+
"in_sample_rate": 16000,
|
22 |
+
"out_sample_rate": 24000,
|
23 |
+
"wav_length": 96000,
|
24 |
+
"segment_length": 100,
|
25 |
+
"phone_extractor_file": "assets/pretrained/003b_checkpoint_03000000.pt",
|
26 |
+
"pitch_estimator_file": "assets/pretrained/008_1_checkpoint_00300000.pt",
|
27 |
+
"in_ir_wav_dir": "assets/ir",
|
28 |
+
"in_noise_wav_dir": "assets/noise",
|
29 |
+
"in_test_wav_dir": "assets/test",
|
30 |
+
"pretrained_file": "assets/pretrained/079_checkpoint_libritts_r_200_02400000.pt",
|
31 |
+
"hidden_channels": 256,
|
32 |
+
"san": false,
|
33 |
+
"compile_convnext": false,
|
34 |
+
"compile_d4c": false,
|
35 |
+
"compile_discriminator": false,
|
36 |
+
"profile": false
|
37 |
+
}
|
beatrice_v2/output/events.out.tfevents.1731006050.DESKTOP-PN4E7G1.14176.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cf74519f1929897a43ca0b668489a77e629386fe52196bc860e4cd59ee42fd3d
|
3 |
+
size 29858706
|
beatrice_v2/output/paraphernalia_train_00000001/beatrice_paraphernalia_train_00000001.toml
ADDED
@@ -0,0 +1,20 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[model]
|
2 |
+
version = "2.0.0-beta.1"
|
3 |
+
name = "train_00000001"
|
4 |
+
description = """
|
5 |
+
No description for this model.
|
6 |
+
このモデルの説明はありません。
|
7 |
+
"""
|
8 |
+
|
9 |
+
[voice.0]
|
10 |
+
name = "RinneElu"
|
11 |
+
description = """
|
12 |
+
No description for this voice.
|
13 |
+
この声の説明はありません。
|
14 |
+
"""
|
15 |
+
average_pitch = 61.375
|
16 |
+
|
17 |
+
[voice.0.portrait]
|
18 |
+
path = "noimage.png"
|
19 |
+
description = """
|
20 |
+
"""
|
beatrice_v2/output/paraphernalia_train_00000001/formant_shift_embeddings.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dca84db5755d2738e94e19f0ed2157f311421d5b9f3fc06a71381443f559b5df
|
3 |
+
size 4608
|
beatrice_v2/output/paraphernalia_train_00000001/noimage.png
ADDED
beatrice_v2/output/paraphernalia_train_00000001/phone_extractor.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:293c72831d78aac3e13f6093cfd3944cbeb497a00c461e437279e37d96a37660
|
3 |
+
size 10847360
|
beatrice_v2/output/paraphernalia_train_00000001/pitch_estimator.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a09911ca8c9cf9f19a3304043f7dfef743af2a238ec2308f15f8e7ed4b3cddab
|
3 |
+
size 3434112
|
beatrice_v2/output/paraphernalia_train_00000001/speaker_embeddings.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5e2fdf13ab30dcfed2ca129482e72495376200aa5a334626fc66a48a5aee1a3f
|
3 |
+
size 512
|
beatrice_v2/output/paraphernalia_train_00000001/waveform_generator.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a3c3a727f508d24296fbab36428250322df371bd5505b64c0cfe75aa7c773aea
|
3 |
+
size 9528320
|
beatrice_v2/output/paraphernalia_train_00002000/beatrice_paraphernalia_train_00002000.toml
ADDED
@@ -0,0 +1,20 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[model]
|
2 |
+
version = "2.0.0-beta.1"
|
3 |
+
name = "train_00002000"
|
4 |
+
description = """
|
5 |
+
No description for this model.
|
6 |
+
このモデルの説明はありません。
|
7 |
+
"""
|
8 |
+
|
9 |
+
[voice.0]
|
10 |
+
name = "RinneElu"
|
11 |
+
description = """
|
12 |
+
No description for this voice.
|
13 |
+
この声の説明はありません。
|
14 |
+
"""
|
15 |
+
average_pitch = 61.375
|
16 |
+
|
17 |
+
[voice.0.portrait]
|
18 |
+
path = "noimage.png"
|
19 |
+
description = """
|
20 |
+
"""
|
beatrice_v2/output/paraphernalia_train_00002000/formant_shift_embeddings.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:046f90ad10e6e8f09693844aa147ae3a72b390992173d8af0c48c05fe272605c
|
3 |
+
size 4608
|
beatrice_v2/output/paraphernalia_train_00002000/noimage.png
ADDED
beatrice_v2/output/paraphernalia_train_00002000/phone_extractor.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:293c72831d78aac3e13f6093cfd3944cbeb497a00c461e437279e37d96a37660
|
3 |
+
size 10847360
|
beatrice_v2/output/paraphernalia_train_00002000/pitch_estimator.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a09911ca8c9cf9f19a3304043f7dfef743af2a238ec2308f15f8e7ed4b3cddab
|
3 |
+
size 3434112
|
beatrice_v2/output/paraphernalia_train_00002000/speaker_embeddings.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0d1eed18f985a55fec2a9f2c0035ea99a5e995b6e5a9da80fce4203848370d51
|
3 |
+
size 512
|
beatrice_v2/output/paraphernalia_train_00002000/waveform_generator.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:31826c49cfeef3a84580a95bd9bd9f3e308d61106c0d07b71254c2aecac6eede
|
3 |
+
size 9528320
|
beatrice_v2/output/paraphernalia_train_00004000/beatrice_paraphernalia_train_00004000.toml
ADDED
@@ -0,0 +1,20 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[model]
|
2 |
+
version = "2.0.0-beta.1"
|
3 |
+
name = "train_00004000"
|
4 |
+
description = """
|
5 |
+
No description for this model.
|
6 |
+
このモデルの説明はありません。
|
7 |
+
"""
|
8 |
+
|
9 |
+
[voice.0]
|
10 |
+
name = "RinneElu"
|
11 |
+
description = """
|
12 |
+
No description for this voice.
|
13 |
+
この声の説明はありません。
|
14 |
+
"""
|
15 |
+
average_pitch = 61.375
|
16 |
+
|
17 |
+
[voice.0.portrait]
|
18 |
+
path = "noimage.png"
|
19 |
+
description = """
|
20 |
+
"""
|
beatrice_v2/output/paraphernalia_train_00004000/formant_shift_embeddings.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:11ff1b8d8380e9f7eb4cb5fb8f6c76ed9007f1ce0642d48921686ff5912c410d
|
3 |
+
size 4608
|
beatrice_v2/output/paraphernalia_train_00004000/noimage.png
ADDED
beatrice_v2/output/paraphernalia_train_00004000/phone_extractor.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:293c72831d78aac3e13f6093cfd3944cbeb497a00c461e437279e37d96a37660
|
3 |
+
size 10847360
|
beatrice_v2/output/paraphernalia_train_00004000/pitch_estimator.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a09911ca8c9cf9f19a3304043f7dfef743af2a238ec2308f15f8e7ed4b3cddab
|
3 |
+
size 3434112
|
beatrice_v2/output/paraphernalia_train_00004000/speaker_embeddings.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5d4cb6e50f59a62639578fdd5dcd1a96bb84e2ec349c53008a74a3001e64fefa
|
3 |
+
size 512
|
beatrice_v2/output/paraphernalia_train_00004000/waveform_generator.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:046cfa9767cac97332a4d07bdaba2f899863a12a35a81cd87622a59448f2aeb1
|
3 |
+
size 9528320
|
beatrice_v2/output/paraphernalia_train_00006000/beatrice_paraphernalia_train_00006000.toml
ADDED
@@ -0,0 +1,20 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[model]
|
2 |
+
version = "2.0.0-beta.1"
|
3 |
+
name = "train_00006000"
|
4 |
+
description = """
|
5 |
+
No description for this model.
|
6 |
+
このモデルの説明はありません。
|
7 |
+
"""
|
8 |
+
|
9 |
+
[voice.0]
|
10 |
+
name = "RinneElu"
|
11 |
+
description = """
|
12 |
+
No description for this voice.
|
13 |
+
この声の説明はありません。
|
14 |
+
"""
|
15 |
+
average_pitch = 61.375
|
16 |
+
|
17 |
+
[voice.0.portrait]
|
18 |
+
path = "noimage.png"
|
19 |
+
description = """
|
20 |
+
"""
|
beatrice_v2/output/paraphernalia_train_00006000/formant_shift_embeddings.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:752d67af00d2b233bc0de8283f6ad774cd14cbb02cffa3d0abf2f552dc8ba396
|
3 |
+
size 4608
|
beatrice_v2/output/paraphernalia_train_00006000/noimage.png
ADDED
beatrice_v2/output/paraphernalia_train_00006000/phone_extractor.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:293c72831d78aac3e13f6093cfd3944cbeb497a00c461e437279e37d96a37660
|
3 |
+
size 10847360
|
beatrice_v2/output/paraphernalia_train_00006000/pitch_estimator.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a09911ca8c9cf9f19a3304043f7dfef743af2a238ec2308f15f8e7ed4b3cddab
|
3 |
+
size 3434112
|
beatrice_v2/output/paraphernalia_train_00006000/speaker_embeddings.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b3770b311b82c948ae522f7fdad74597964aa6a98f1cb5760049c184451abc6e
|
3 |
+
size 512
|
beatrice_v2/output/paraphernalia_train_00006000/waveform_generator.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:23695a03c2514d70c08e62ff7297222a893aa67a90c7023cffd0ea0c97c88d6a
|
3 |
+
size 9528320
|
beatrice_v2/output/paraphernalia_train_00008000/beatrice_paraphernalia_train_00008000.toml
ADDED
@@ -0,0 +1,20 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[model]
|
2 |
+
version = "2.0.0-beta.1"
|
3 |
+
name = "train_00008000"
|
4 |
+
description = """
|
5 |
+
No description for this model.
|
6 |
+
このモデルの説明はありません。
|
7 |
+
"""
|
8 |
+
|
9 |
+
[voice.0]
|
10 |
+
name = "RinneElu"
|
11 |
+
description = """
|
12 |
+
No description for this voice.
|
13 |
+
この声の説明はありません。
|
14 |
+
"""
|
15 |
+
average_pitch = 61.375
|
16 |
+
|
17 |
+
[voice.0.portrait]
|
18 |
+
path = "noimage.png"
|
19 |
+
description = """
|
20 |
+
"""
|
beatrice_v2/output/paraphernalia_train_00008000/formant_shift_embeddings.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:78509174f4e23479d72195764334b64af0fa01e6682c2875f07cd3ffc916cd71
|
3 |
+
size 4608
|
beatrice_v2/output/paraphernalia_train_00008000/noimage.png
ADDED
beatrice_v2/output/paraphernalia_train_00008000/phone_extractor.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:293c72831d78aac3e13f6093cfd3944cbeb497a00c461e437279e37d96a37660
|
3 |
+
size 10847360
|
beatrice_v2/output/paraphernalia_train_00008000/pitch_estimator.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a09911ca8c9cf9f19a3304043f7dfef743af2a238ec2308f15f8e7ed4b3cddab
|
3 |
+
size 3434112
|