ArthurZ HF staff committed on
Commit
1cc9a18
·
1 Parent(s): 862cac7

add config

Browse files
Files changed (1) hide show
  1. config.json +268 -0
config.json ADDED
@@ -0,0 +1,268 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "activation_function": "gelu_new",
3
+ "alignment_head": [
4
+ 2,
5
+ null,
6
+ null
7
+ ],
8
+ "alignment_layer": [
9
+ 68,
10
+ null,
11
+ null
12
+ ],
13
+ "attn_dropout": 0.0,
14
+ "attn_init_scale": 1.0,
15
+ "attn_order": [
16
+ 10,
17
+ 2,
18
+ 2
19
+ ],
20
+ "blocks": 128,
21
+ "bos_token_id": 50256,
22
+ "c_res": 1,
23
+ "cond_c_res": [
24
+ 0,
25
+ 1,
26
+ 1
27
+ ],
28
+ "cond_depth": [
29
+ 3,
30
+ 16,
31
+ 16
32
+ ],
33
+ "cond_dilation_cycle": [
34
+ null,
35
+ 8,
36
+ 8
37
+ ],
38
+ "cond_dilation_growth_rate": [
39
+ 1,
40
+ 3,
41
+ 3
42
+ ],
43
+ "cond_m_conv": 1,
44
+ "cond_res_scale": false,
45
+ "cond_width": [
46
+ 128,
47
+ 1024,
48
+ 1024
49
+ ],
50
+ "cond_zero_out": false,
51
+ "copy_input": false,
52
+ "depth": [
53
+ 79,
54
+ 72,
55
+ 72
56
+ ],
57
+ "downs_t": [
58
+ 3,
59
+ 2,
60
+ 2
61
+ ],
62
+ "emb_dropout": 0.0,
63
+ "eos_token_id": 50256,
64
+ "fp16_params": true,
65
+ "hop_length": 256,
66
+ "init_scale": [
67
+ 0.7,
68
+ 1,
69
+ 1
70
+ ],
71
+ "initializer_range": 0.02,
72
+ "l_bins": 2048,
73
+ "labels": false,
74
+ "layer_norm_epsilon": 1e-05,
75
+ "m_attn": 0.25,
76
+ "max_bow_genre_size": 1,
77
+ "max_duration": 600.0,
78
+ "merged_decoder": [
79
+ true,
80
+ false,
81
+ false
82
+ ],
83
+ "min_duration": 23.8,
84
+ "mlp_init_scale": 0.02,
85
+ "model_type": "jukebox",
86
+ "multispec_loss_hop_length": [
87
+ 240,
88
+ 120,
89
+ 50
90
+ ],
91
+ "multispec_loss_n_fft": [
92
+ 2048,
93
+ 1024,
94
+ 512
95
+ ],
96
+ "multispec_loss_window_size": [
97
+ 1200,
98
+ 600,
99
+ 240
100
+ ],
101
+ "multispectral": 1.0,
102
+ "n_ctx": [
103
+ 8192,
104
+ 8192,
105
+ 8192
106
+ ],
107
+ "n_embd": 768,
108
+ "n_head": 12,
109
+ "n_heads": [
110
+ 8,
111
+ 1,
112
+ 1
113
+ ],
114
+ "n_inner": null,
115
+ "n_layer": 12,
116
+ "n_positions": 1024,
117
+ "n_tokens": [
118
+ 512,
119
+ 0,
120
+ 0
121
+ ],
122
+ "n_vocab": 80,
123
+ "name": "AudioSamples",
124
+ "nb_priors": 3,
125
+ "pos_init": false,
126
+ "prime_attn_dropout": 0.0,
127
+ "prime_attn_order": [
128
+ 2,
129
+ 0,
130
+ 0
131
+ ],
132
+ "prime_blocks": 32,
133
+ "prime_c_res": 1,
134
+ "prime_cond_c_res": [
135
+ 0,
136
+ 1,
137
+ 1
138
+ ],
139
+ "prime_depth": [
140
+ 18,
141
+ 3,
142
+ 3
143
+ ],
144
+ "prime_emb_dropout": 0.0,
145
+ "prime_heads": 4,
146
+ "prime_init_scale": [
147
+ 0.1,
148
+ 0.4,
149
+ 0.4
150
+ ],
151
+ "prime_loss_fraction": [
152
+ 0.4,
153
+ 0.0,
154
+ 0.0
155
+ ],
156
+ "prime_m_attn": 0.25,
157
+ "prime_m_mlp": 1.0,
158
+ "prime_pos_init": false,
159
+ "prime_res_scale": false,
160
+ "prime_resid_dropout": 0.0,
161
+ "prime_spread": null,
162
+ "prime_width": [
163
+ 1280,
164
+ 128,
165
+ 128
166
+ ],
167
+ "prime_zero_out": false,
168
+ "priors_width": [
169
+ 4096,
170
+ 2048,
171
+ 1024
172
+ ],
173
+ "reorder_and_upcast_attn": false,
174
+ "res_scale": false,
175
+ "resid_dropout": 0.0,
176
+ "sample_hop_length": 30000,
177
+ "sample_length": 44100,
178
+ "sample_length_in_seconds": 1,
179
+ "scale_attn_by_inverse_layer_idx": false,
180
+ "scale_attn_weights": true,
181
+ "single_enc_dec": [
182
+ false,
183
+ false,
184
+ false
185
+ ],
186
+ "spectral": 0.0,
187
+ "spread": null,
188
+ "sr": 16000,
189
+ "strides_t": [
190
+ 2,
191
+ 2,
192
+ 2
193
+ ],
194
+ "summary_activation": null,
195
+ "summary_first_dropout": 0.1,
196
+ "summary_proj_to_labels": true,
197
+ "summary_type": "cls_index",
198
+ "summary_use_proj": true,
199
+ "t_bins": 128,
200
+ "transformers_version": "4.21.0.dev0",
201
+ "use_cache": true,
202
+ "use_nonrelative_specloss": true,
203
+ "use_tokens": [
204
+ true,
205
+ false,
206
+ false
207
+ ],
208
+ "vocab_size": 50257,
209
+ "vq_vae_codebook_dimension": 2048,
210
+ "vq_vae_commit": 0.02,
211
+ "vq_vae_conv_block_depth": 4,
212
+ "vq_vae_conv_block_width": 64,
213
+ "vq_vae_depth": 4,
214
+ "vq_vae_dilation_cycle": null,
215
+ "vq_vae_dilation_growth_rate": 3,
216
+ "vq_vae_downs_t": [
217
+ 3,
218
+ 2,
219
+ 2
220
+ ],
221
+ "vq_vae_emmbedding_width": 2048,
222
+ "vq_vae_levels": 3,
223
+ "vq_vae_lmu": 0.99,
224
+ "vq_vae_m_conv": 1,
225
+ "vq_vae_multipliers": [
226
+ 2,
227
+ 1,
228
+ 1
229
+ ],
230
+ "vq_vae_reverse_decoder_dilation": 1,
231
+ "vq_vae_strides_t": [
232
+ 2,
233
+ 2,
234
+ 2
235
+ ],
236
+ "vq_vae_width": 64,
237
+ "vqvae_z_shapes": [
238
+ [
239
+ 125
240
+ ],
241
+ [
242
+ 500
243
+ ],
244
+ [
245
+ 2000
246
+ ]
247
+ ],
248
+ "width": [
249
+ 4800,
250
+ 1920,
251
+ 128
252
+ ],
253
+ "y_bins": [
254
+ [
255
+ 604,
256
+ 7898
257
+ ],
258
+ [
259
+ 120,
260
+ 4111
261
+ ],
262
+ [
263
+ 120,
264
+ 4111
265
+ ]
266
+ ],
267
+ "zero_out": false
268
+ }