PolyAI-pheme

Build error

taras-sereda committed on Jan 8

Commit

3980644

•

1 Parent(s): 586e19e

speech tokenizer, requirements

Files changed (4) hide show

ckpt/speechtokenizer/SpeechTokenizer.pt ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:d04593b6c9a4b475f91ca481141a6ef5b23e6ac112f347dd2b2717f193c1c728
+size 481906997

ckpt/speechtokenizer/config.json ADDED Viewed

+{
+    "resblock": "1",
+    "num_gpus": 3,
+    "batch_size": 60,
+    "learning_rate": 0.0001,
+    "adam_b1": 0.5,
+    "adam_b2": 0.9,
+    "lr_decay": 0.98,
+    "seed": 1234,
+    "lambda_distill": 0.15,
+    "n_filters": 64,
+    "strides": [8,5,4,2],
+    "dimension": 1024,
+    "semantic_dimension": 768,
+    "bidirectional": true,
+    "dilation_base": 2,
+    "residual_kernel_size": 3,
+    "n_residual_layers": 1,
+    "lstm_layers": 2,
+    "activation": "ELU",
+    "segment_size": 48000,
+    "num_mels": 80,
+    "num_freq": 1025,
+    "n_fft": 1024,
+    "hop_size": 240,
+    "win_size": 1024,
+    "sampling_rate": 16000,
+    "sample_rate": 16000,
+    "codebook_size": 1024,
+    "n_q": 8,
+    "fmin": 0,
+    "fmax": 8000,
+    "fmax_for_loss": null,
+    "num_workers": 12,
+    "dist_config": {
+        "dist_backend": "nccl",
+        "dist_url": "tcp://localhost:54322",
+        "world_size": 1
+    }
+}

ckpt/unique_text_tokens.k2symbols ADDED Viewed

+<eps> 0
+! 1
+" 2
+( 3
+) 4
+, 5
+. 6
+: 7
+; 8
+? 9
+_ 10
+aɪ 11
+aɪə 12
+aɪɚ 13
+aɪʊ 14
+aɪʊɹ 15
+aʊ 16
+b 17
+d 18
+dʒ 19
+e 20
+enus 21
+es 22
+eɪ 23
+f 24
+fr 25
+h 26
+i 27
+iə 28
+iː 29
+j 30
+k 31
+l 32
+m 33
+n 34
+nʲ 35
+oʊ 36
+oː 37
+oːɹ 38
+p 39
+r 40
+s 41
+t 42
+tʃ 43
+uː 44
+v 45
+w 46
+x 47
+z 48
+æ 49
+ç 50
+ð 51
+ø 52
+ŋ 53
+ɐ 54
+ɑ 55
+ɑː 56
+ɑːɹ 57
+ɔ 58
+ɔɪ 59
+ɔː 60
+ɔːɹ 61
+ə 62
+əl 63
+ɚ 64
+ɛ 65
+ɛɹ 66
+ɛː 67
+ɜː 68
+ɡ 69
+ɡʲ 70
+ɣ 71
+ɪ 72
+ɪɹ 73
+ɫ 74
+ɬ 75
+ɲ 76
+ɹ 77
+ɾ 78
+ʃ 79
+ʊ 80
+ʊɹ 81
+ʌ 82
+ʒ 83
+ʔ 84
+̃ 85
+̩ 86
+θ 87
+ᵻ 88
+— 89

requirements.txt CHANGED Viewed

@@ -1,3 +1,9 @@
 torchvision
 torchaudio
 torch

 torchvision
 torchaudio
 torch
+transformers
+einops
+librosa
+pyannote.audio @ https://github.com/pyannote/pyannote-audio/archive/develop.zip
+wheel
+phonemizer