ArthurZ HF staff commited on
Commit
af1bd4b
1 Parent(s): cd41aeb

Upload model

Browse files
Files changed (1) hide show
  1. config.json +30 -80
config.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
  "_commit_hash": null,
3
- "_name_or_path": "/home/arthur_huggingface_co/transformers/jukebox-1b-lyrics-converted",
4
  "architectures": [
5
  "JukeboxModel"
6
  ],
@@ -26,32 +26,14 @@
26
  "attn_res_scale": false,
27
  "blocks": 64,
28
  "conv_res_scale": false,
29
- "depth": 72,
30
  "emb_dropout": 0,
31
- "embed_dim": 2048,
32
- "encoder_attention_multiplier": 0.25,
33
- "encoder_attention_pattern": "RawColumnPreviousRowAttention",
34
- "encoder_attn_dropout": 0.0,
35
- "encoder_attn_res_scale": false,
36
- "encoder_blocks": 32,
37
- "encoder_depth": 18,
38
- "encoder_emb_dropout": 0.0,
39
- "encoder_heads": 4,
40
- "encoder_init_scale": 0.1,
41
- "encoder_loss_fraction": [
42
- 0.4,
43
- 0.0,
44
- 0.0
45
- ],
46
- "encoder_mlp_multiplier": 1.0,
47
- "encoder_n_vocab": 79,
48
- "encoder_resid_dropout": 0.0,
49
- "encoder_spread": null,
50
- "encoder_width": 1280,
51
- "encoder_zero_out": false,
52
  "init_scale": 0.2,
53
  "is_encoder_decoder": true,
54
- "lyric_conditioning": true,
 
55
  "mask": true,
56
  "max_duration": 600.0,
57
  "max_nb_genres": 1,
@@ -63,10 +45,12 @@
63
  ],
64
  "min_duration": 17.84,
65
  "mlp_multiplier": 1.0,
66
- "model_type": "jukebox",
 
67
  "n_ctx": 6144,
68
  "n_heads": 2,
69
  "nb_relevant_lyric_tokens": 384,
 
70
  "res_conv_depth": null,
71
  "res_conv_width": null,
72
  "res_convolution_multiplier": null,
@@ -86,8 +70,6 @@
86
  "sampling_rate": 44100,
87
  "spread": null,
88
  "timing_dims": 64,
89
- "transformers_version": "4.25.0.dev0",
90
- "width": 2048,
91
  "zero_out": false
92
  },
93
  "prior_1": {
@@ -100,32 +82,15 @@
100
  "attn_res_scale": false,
101
  "blocks": 64,
102
  "conv_res_scale": true,
103
- "depth": 72,
104
  "emb_dropout": 0,
105
  "embed_dim": 2048,
106
- "encoder_attention_multiplier": null,
107
- "encoder_attention_pattern": null,
108
- "encoder_attn_dropout": null,
109
- "encoder_attn_res_scale": false,
110
- "encoder_blocks": null,
111
- "encoder_depth": null,
112
- "encoder_emb_dropout": null,
113
- "encoder_heads": null,
114
- "encoder_init_scale": null,
115
- "encoder_loss_fraction": [
116
- 0.4,
117
- 0.0,
118
- 0.0
119
- ],
120
- "encoder_mlp_multiplier": null,
121
- "encoder_n_vocab": 0,
122
- "encoder_resid_dropout": null,
123
- "encoder_spread": null,
124
- "encoder_width": null,
125
- "encoder_zero_out": null,
126
  "init_scale": 1,
127
  "is_encoder_decoder": false,
128
- "lyric_conditioning": false,
 
129
  "mask": true,
130
  "max_duration": 600.0,
131
  "max_nb_genres": 1,
@@ -137,10 +102,12 @@
137
  ],
138
  "min_duration": 17.84,
139
  "mlp_multiplier": 1.0,
140
- "model_type": "jukebox",
 
141
  "n_ctx": 8192,
142
  "n_heads": 1,
143
  "nb_relevant_lyric_tokens": 0,
 
144
  "res_conv_depth": 16,
145
  "res_conv_width": 1024,
146
  "res_convolution_multiplier": 1,
@@ -160,8 +127,6 @@
160
  "sampling_rate": 44100,
161
  "spread": null,
162
  "timing_dims": 64,
163
- "transformers_version": "4.25.0.dev0",
164
- "width": 1920,
165
  "zero_out": false
166
  },
167
  "prior_2": {
@@ -174,32 +139,15 @@
174
  "attn_res_scale": false,
175
  "blocks": 64,
176
  "conv_res_scale": null,
177
- "depth": 72,
178
  "emb_dropout": 0,
179
  "embed_dim": 2048,
180
- "encoder_attention_multiplier": null,
181
- "encoder_attention_pattern": null,
182
- "encoder_attn_dropout": null,
183
- "encoder_attn_res_scale": false,
184
- "encoder_blocks": null,
185
- "encoder_depth": null,
186
- "encoder_emb_dropout": null,
187
- "encoder_heads": null,
188
- "encoder_init_scale": null,
189
- "encoder_loss_fraction": [
190
- 0.4,
191
- 0.0,
192
- 0.0
193
- ],
194
- "encoder_mlp_multiplier": null,
195
- "encoder_n_vocab": 0,
196
- "encoder_resid_dropout": null,
197
- "encoder_spread": null,
198
- "encoder_width": null,
199
- "encoder_zero_out": null,
200
  "init_scale": 1,
201
  "is_encoder_decoder": false,
202
- "lyric_conditioning": false,
 
203
  "mask": true,
204
  "max_duration": 600.0,
205
  "max_nb_genres": 1,
@@ -211,10 +159,12 @@
211
  ],
212
  "min_duration": 17.84,
213
  "mlp_multiplier": 1.0,
214
- "model_type": "jukebox",
 
215
  "n_ctx": 8192,
216
  "n_heads": 1,
217
  "nb_relevant_lyric_tokens": 0,
 
218
  "res_conv_depth": 16,
219
  "res_conv_width": 1024,
220
  "res_convolution_multiplier": 1,
@@ -234,8 +184,6 @@
234
  "sampling_rate": 44100,
235
  "spread": null,
236
  "timing_dims": 64,
237
- "transformers_version": "4.25.0.dev0",
238
- "width": 1920,
239
  "zero_out": false
240
  },
241
  "sampling_rate": 44100,
@@ -244,7 +192,6 @@
244
  "transformers_version": null,
245
  "vqvae_config": {
246
  "act_fn": "relu",
247
- "codebook_dimension": 2048,
248
  "commit": 0.02,
249
  "conv_input_shape": 1,
250
  "conv_res_scale": false,
@@ -254,14 +201,16 @@
254
  0.5,
255
  0.5
256
  ],
 
257
  "levels": 3,
258
  "lmu": 0.99,
259
- "model_type": "",
260
  "multipliers": [
261
  2,
262
  1,
263
  1
264
  ],
 
265
  "res_conv_depth": 4,
266
  "res_conv_width": 32,
267
  "res_convolution_multiplier": 1,
@@ -278,6 +227,7 @@
278
  2
279
  ],
280
  "sample_length": 1058304,
281
- "transformers_version": "4.25.0.dev0"
 
282
  }
283
  }
 
1
  {
2
  "_commit_hash": null,
3
+ "_name_or_path": "jukebox-1b-lyrics",
4
  "architectures": [
5
  "JukeboxModel"
6
  ],
 
26
  "attn_res_scale": false,
27
  "blocks": 64,
28
  "conv_res_scale": false,
 
29
  "emb_dropout": 0,
30
+ "encoder_config": null,
31
+ "encoder_loss_fraction": 0.4,
32
+ "hidden_size": 2048,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
33
  "init_scale": 0.2,
34
  "is_encoder_decoder": true,
35
+ "level": 0,
36
+ "lyric_vocab_size": 79,
37
  "mask": true,
38
  "max_duration": 600.0,
39
  "max_nb_genres": 1,
 
45
  ],
46
  "min_duration": 17.84,
47
  "mlp_multiplier": 1.0,
48
+ "model_type": "jukebox_prior",
49
+ "music_vocab_size": 2048,
50
  "n_ctx": 6144,
51
  "n_heads": 2,
52
  "nb_relevant_lyric_tokens": 384,
53
+ "num_layers": 72,
54
  "res_conv_depth": null,
55
  "res_conv_width": null,
56
  "res_convolution_multiplier": null,
 
70
  "sampling_rate": 44100,
71
  "spread": null,
72
  "timing_dims": 64,
 
 
73
  "zero_out": false
74
  },
75
  "prior_1": {
 
82
  "attn_res_scale": false,
83
  "blocks": 64,
84
  "conv_res_scale": true,
 
85
  "emb_dropout": 0,
86
  "embed_dim": 2048,
87
+ "encoder_config": null,
88
+ "encoder_loss_fraction": 0,
89
+ "hidden_size": 1920,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
90
  "init_scale": 1,
91
  "is_encoder_decoder": false,
92
+ "level": 1,
93
+ "lyric_vocab_size": 80,
94
  "mask": true,
95
  "max_duration": 600.0,
96
  "max_nb_genres": 1,
 
102
  ],
103
  "min_duration": 17.84,
104
  "mlp_multiplier": 1.0,
105
+ "model_type": "jukebox_prior",
106
+ "music_vocab_size": 2048,
107
  "n_ctx": 8192,
108
  "n_heads": 1,
109
  "nb_relevant_lyric_tokens": 0,
110
+ "num_layers": 72,
111
  "res_conv_depth": 16,
112
  "res_conv_width": 1024,
113
  "res_convolution_multiplier": 1,
 
127
  "sampling_rate": 44100,
128
  "spread": null,
129
  "timing_dims": 64,
 
 
130
  "zero_out": false
131
  },
132
  "prior_2": {
 
139
  "attn_res_scale": false,
140
  "blocks": 64,
141
  "conv_res_scale": null,
 
142
  "emb_dropout": 0,
143
  "embed_dim": 2048,
144
+ "encoder_config": null,
145
+ "encoder_loss_fraction": 0,
146
+ "hidden_size": 1920,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
147
  "init_scale": 1,
148
  "is_encoder_decoder": false,
149
+ "level": 2,
150
+ "lyric_vocab_size": 80,
151
  "mask": true,
152
  "max_duration": 600.0,
153
  "max_nb_genres": 1,
 
159
  ],
160
  "min_duration": 17.84,
161
  "mlp_multiplier": 1.0,
162
+ "model_type": "jukebox_prior",
163
+ "music_vocab_size": 2048,
164
  "n_ctx": 8192,
165
  "n_heads": 1,
166
  "nb_relevant_lyric_tokens": 0,
167
+ "num_layers": 72,
168
  "res_conv_depth": 16,
169
  "res_conv_width": 1024,
170
  "res_convolution_multiplier": 1,
 
184
  "sampling_rate": 44100,
185
  "spread": null,
186
  "timing_dims": 64,
 
 
187
  "zero_out": false
188
  },
189
  "sampling_rate": 44100,
 
192
  "transformers_version": null,
193
  "vqvae_config": {
194
  "act_fn": "relu",
 
195
  "commit": 0.02,
196
  "conv_input_shape": 1,
197
  "conv_res_scale": false,
 
201
  0.5,
202
  0.5
203
  ],
204
+ "init_scale": 0.2,
205
  "levels": 3,
206
  "lmu": 0.99,
207
+ "model_type": "jukebox_vqvae",
208
  "multipliers": [
209
  2,
210
  1,
211
  1
212
  ],
213
+ "nb_discrete_codes": 2048,
214
  "res_conv_depth": 4,
215
  "res_conv_width": 32,
216
  "res_convolution_multiplier": 1,
 
227
  2
228
  ],
229
  "sample_length": 1058304,
230
+ "transformers_version": "4.25.0.dev0",
231
+ "zero_out": false
232
  }
233
  }