nielsr HF staff committed on
Commit
0eb70ea
1 Parent(s): e3b4b4a

Push model using huggingface_hub.

Browse files
Files changed (2) hide show
  1. config.json +70 -0
  2. model.safetensors +1 -1
config.json ADDED
@@ -0,0 +1,70 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "audio_embedding_dim": 1024,
3
+ "audio_embedding_dropout": 0.0,
4
+ "audio_max_length": 16.0,
5
+ "audio_min_length": 1.0,
6
+ "audio_pad_token": 2050,
7
+ "audio_positional_embedding_dropout": 0.0,
8
+ "audio_vocab_size": 2048,
9
+ "batch_size": 100,
10
+ "clipping_update_period": 1000,
11
+ "codebook_weight": "[2,1,1,1]",
12
+ "d_model": 1024,
13
+ "dataset": "gigaspeech",
14
+ "dataset_dir": "/data/scratch/pyp/datasets/gigaspeech_phn_enc_manifest/xl",
15
+ "drop_long": 1,
16
+ "dynamic_batching": 1,
17
+ "early_stop_step": 3200,
18
+ "early_stop_threshold": -1.0,
19
+ "empty_token": 2048,
20
+ "encodec_folder_name": "encodec_16khz_4codebooks",
21
+ "encodec_sr": 50,
22
+ "eog": 2049,
23
+ "eos": 2051,
24
+ "exp_dir": "/data/scratch/pyp/exp_pyp/VoiceCraft/gigaspeech/tts_enhanced_330M",
25
+ "gradient_accumulation_steps": 24,
26
+ "gradient_clip_val": 1.0,
27
+ "load_model_from": "./pretrained_models/giga330M.pth",
28
+ "lr": 1e-05,
29
+ "manifest_name": "manifest_large16khz_lessambi",
30
+ "mask_len_max": 600,
31
+ "mask_len_min": 1,
32
+ "mask_sample_dist": "poisson1",
33
+ "max_mask_portion": 0.9,
34
+ "max_n_spans": 3,
35
+ "max_num_tokens": 20000,
36
+ "min_gap": 5,
37
+ "n_codebooks": 4,
38
+ "n_special": 4,
39
+ "nhead": 16,
40
+ "num_buckets": 10,
41
+ "num_decoder_layers": 24,
42
+ "num_epochs": 10,
43
+ "num_steps": 500000,
44
+ "num_workers": 8,
45
+ "optimizer_name": "AdamW",
46
+ "pad_x": 0,
47
+ "phn_folder_name": "phonemes",
48
+ "precision": "float16",
49
+ "print_every_n_steps": 400,
50
+ "pseudo_epoch_size": 3000,
51
+ "reduce_lr_start_epoch": 4,
52
+ "reduce_lr_start_step": 3000,
53
+ "reduced_eog": 1,
54
+ "resume": false,
55
+ "seed": 1,
56
+ "shuffle_mask_embedding": 0,
57
+ "special_first": 0,
58
+ "tb_write_every_n_steps": 100,
59
+ "text_embedding_dropout": 0.0,
60
+ "text_max_length": 400,
61
+ "text_min_length": 10.0,
62
+ "text_pad_token": 120,
63
+ "text_positional_embedding_dropout": 0.0,
64
+ "text_vocab_size": 120,
65
+ "trm_dropout": 0.0,
66
+ "val_every_n_steps": 1600,
67
+ "val_max_num_tokens": 6000,
68
+ "warmup_fraction": 0.1,
69
+ "weight_decay": 0.0
70
+ }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d449a5124af0bf5880961bc79b77b7ace0d2cce53e53b83284cb02ef88296e7a
3
  size 1293853416
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:72b7de7d0f414ec9f7159d98cc075474a176b78f5e097925a120729c14361ef7
3
  size 1293853416