aapot
commited on
Commit
•
e385993
1
Parent(s):
2ebfd3b
Add 350k train step and HF flax model
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- checkpoint_350000/checkpoint +3 -0
- checkpoint_350000/state.param_states.decoder.decoder_norm.scale.v/.zarray +3 -0
- checkpoint_350000/state.param_states.decoder.decoder_norm.scale.v/0 +3 -0
- checkpoint_350000/state.param_states.decoder.layers_0.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_350000/state.param_states.decoder.layers_0.pre_cross_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_350000/state.param_states.decoder.layers_0.pre_mlp_layer_norm.scale.v/.zarray +3 -0
- checkpoint_350000/state.param_states.decoder.layers_0.pre_mlp_layer_norm.scale.v/0 +3 -0
- checkpoint_350000/state.param_states.decoder.layers_0.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_350000/state.param_states.decoder.layers_0.pre_self_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_350000/state.param_states.decoder.layers_1.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_350000/state.param_states.decoder.layers_1.pre_cross_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_350000/state.param_states.decoder.layers_1.pre_mlp_layer_norm.scale.v/.zarray +3 -0
- checkpoint_350000/state.param_states.decoder.layers_1.pre_mlp_layer_norm.scale.v/0 +3 -0
- checkpoint_350000/state.param_states.decoder.layers_1.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_350000/state.param_states.decoder.layers_1.pre_self_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_350000/state.param_states.decoder.layers_2.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_350000/state.param_states.decoder.layers_2.pre_cross_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_350000/state.param_states.decoder.layers_2.pre_mlp_layer_norm.scale.v/.zarray +3 -0
- checkpoint_350000/state.param_states.decoder.layers_2.pre_mlp_layer_norm.scale.v/0 +3 -0
- checkpoint_350000/state.param_states.decoder.layers_2.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_350000/state.param_states.decoder.layers_2.pre_self_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_350000/state.param_states.decoder.layers_3.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_350000/state.param_states.decoder.layers_3.pre_cross_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_350000/state.param_states.decoder.layers_3.pre_mlp_layer_norm.scale.v/.zarray +3 -0
- checkpoint_350000/state.param_states.decoder.layers_3.pre_mlp_layer_norm.scale.v/0 +3 -0
- checkpoint_350000/state.param_states.decoder.layers_3.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_350000/state.param_states.decoder.layers_3.pre_self_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_350000/state.param_states.decoder.layers_4.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_350000/state.param_states.decoder.layers_4.pre_cross_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_350000/state.param_states.decoder.layers_4.pre_mlp_layer_norm.scale.v/.zarray +3 -0
- checkpoint_350000/state.param_states.decoder.layers_4.pre_mlp_layer_norm.scale.v/0 +3 -0
- checkpoint_350000/state.param_states.decoder.layers_4.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_350000/state.param_states.decoder.layers_4.pre_self_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_350000/state.param_states.decoder.layers_5.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_350000/state.param_states.decoder.layers_5.pre_cross_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_350000/state.param_states.decoder.layers_5.pre_mlp_layer_norm.scale.v/.zarray +3 -0
- checkpoint_350000/state.param_states.decoder.layers_5.pre_mlp_layer_norm.scale.v/0 +3 -0
- checkpoint_350000/state.param_states.decoder.layers_5.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_350000/state.param_states.decoder.layers_5.pre_self_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_350000/state.param_states.decoder.layers_6.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_350000/state.param_states.decoder.layers_6.pre_cross_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_350000/state.param_states.decoder.layers_6.pre_mlp_layer_norm.scale.v/.zarray +3 -0
- checkpoint_350000/state.param_states.decoder.layers_6.pre_mlp_layer_norm.scale.v/0 +3 -0
- checkpoint_350000/state.param_states.decoder.layers_6.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_350000/state.param_states.decoder.layers_6.pre_self_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_350000/state.param_states.decoder.layers_7.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_350000/state.param_states.decoder.layers_7.pre_cross_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_350000/state.param_states.decoder.layers_7.pre_mlp_layer_norm.scale.v/.zarray +3 -0
- checkpoint_350000/state.param_states.decoder.layers_7.pre_mlp_layer_norm.scale.v/0 +3 -0
- checkpoint_350000/state.param_states.decoder.layers_7.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
checkpoint_350000/checkpoint
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4e943a65491a88b7281237b2903e2d8c384b7e3823db49ca33da7fe512b105a3
|
3 |
+
size 1037969
|
checkpoint_350000/state.param_states.decoder.decoder_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
|
3 |
+
size 168
|
checkpoint_350000/state.param_states.decoder.decoder_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0dfb49f3e9a8f2415059eade8e4a60c87456520d7dcaa0cc68ffbad79247329f
|
3 |
+
size 1405
|
checkpoint_350000/state.param_states.decoder.layers_0.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
|
3 |
+
size 168
|
checkpoint_350000/state.param_states.decoder.layers_0.pre_cross_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c841edc3759c707432f4b36475ce85cba39ea425485d397634a7590590ae2313
|
3 |
+
size 1426
|
checkpoint_350000/state.param_states.decoder.layers_0.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
|
3 |
+
size 168
|
checkpoint_350000/state.param_states.decoder.layers_0.pre_mlp_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c26a26d296cd9f8c7c9a58e68202995edf78b6ec767e513b00c422b8c19e1693
|
3 |
+
size 1386
|
checkpoint_350000/state.param_states.decoder.layers_0.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
|
3 |
+
size 168
|
checkpoint_350000/state.param_states.decoder.layers_0.pre_self_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8872fa11b532f708da9b461f739a2103a213969cd39a15dafefcba97cb706fac
|
3 |
+
size 1445
|
checkpoint_350000/state.param_states.decoder.layers_1.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
|
3 |
+
size 168
|
checkpoint_350000/state.param_states.decoder.layers_1.pre_cross_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eb82bfe44c5a13f731d89cb469eb58f7b06fd2046c58cf5012dfecd45721e2df
|
3 |
+
size 1431
|
checkpoint_350000/state.param_states.decoder.layers_1.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
|
3 |
+
size 168
|
checkpoint_350000/state.param_states.decoder.layers_1.pre_mlp_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0246749408ec2f1597ac6a6faff4def65a231cdd16900441e6e4300aa92ab68f
|
3 |
+
size 1425
|
checkpoint_350000/state.param_states.decoder.layers_1.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
|
3 |
+
size 168
|
checkpoint_350000/state.param_states.decoder.layers_1.pre_self_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:205359debee4f606ad95760bfae6f0d91bb305dbb1d9ad5f8c218305c89f5de9
|
3 |
+
size 1448
|
checkpoint_350000/state.param_states.decoder.layers_2.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
|
3 |
+
size 168
|
checkpoint_350000/state.param_states.decoder.layers_2.pre_cross_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f87c43c44a1fbb8b6834519633d072deacd547f7c861f212a1230318ca1f4a34
|
3 |
+
size 1429
|
checkpoint_350000/state.param_states.decoder.layers_2.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
|
3 |
+
size 168
|
checkpoint_350000/state.param_states.decoder.layers_2.pre_mlp_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6430e64c4a3b0b65766fa2007249a9f234fc4842e248ba30f6ed4797091d2b9a
|
3 |
+
size 1434
|
checkpoint_350000/state.param_states.decoder.layers_2.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
|
3 |
+
size 168
|
checkpoint_350000/state.param_states.decoder.layers_2.pre_self_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:98a76264db8fe11099b973372b9fdad0d44db0fcac9bc33607d09c67788aaf76
|
3 |
+
size 1427
|
checkpoint_350000/state.param_states.decoder.layers_3.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
|
3 |
+
size 168
|
checkpoint_350000/state.param_states.decoder.layers_3.pre_cross_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:08108f23aabca29e60bc0c8cf2182572369b9229e4e5c63f6b50c3ee45bd0c91
|
3 |
+
size 1421
|
checkpoint_350000/state.param_states.decoder.layers_3.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
|
3 |
+
size 168
|
checkpoint_350000/state.param_states.decoder.layers_3.pre_mlp_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c7e392dab2b32932d8e014a0c7286d0fdc5cffd6b320fb613c989ab0450cf159
|
3 |
+
size 1390
|
checkpoint_350000/state.param_states.decoder.layers_3.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
|
3 |
+
size 168
|
checkpoint_350000/state.param_states.decoder.layers_3.pre_self_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f6b6d4ae135ad781ad33105c2d7a45ceb9de6d1278133b9398d098167487295f
|
3 |
+
size 1416
|
checkpoint_350000/state.param_states.decoder.layers_4.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
|
3 |
+
size 168
|
checkpoint_350000/state.param_states.decoder.layers_4.pre_cross_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:96aba15db7fd4999a8466736cadb387ee8174a4ac752a9f8b6af0a737c0614a0
|
3 |
+
size 1398
|
checkpoint_350000/state.param_states.decoder.layers_4.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
|
3 |
+
size 168
|
checkpoint_350000/state.param_states.decoder.layers_4.pre_mlp_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:85d1fd08168cd126cc92f733bc9a5f2b853db19c7466b27b236923f654d6625a
|
3 |
+
size 1393
|
checkpoint_350000/state.param_states.decoder.layers_4.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
|
3 |
+
size 168
|
checkpoint_350000/state.param_states.decoder.layers_4.pre_self_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:afabb8842641a1787561a1fb1283bb191a6035876af4ef914904b33d343d7318
|
3 |
+
size 1403
|
checkpoint_350000/state.param_states.decoder.layers_5.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
|
3 |
+
size 168
|
checkpoint_350000/state.param_states.decoder.layers_5.pre_cross_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:859575d928df9ca197ee075ecbc1eb59276cd27a5623b00673cc811934c127c7
|
3 |
+
size 1394
|
checkpoint_350000/state.param_states.decoder.layers_5.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
|
3 |
+
size 168
|
checkpoint_350000/state.param_states.decoder.layers_5.pre_mlp_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:253576ec7f534f976b174b29075ba7307c7310f51bc2e41d32cfdf5a01dddbb5
|
3 |
+
size 1378
|
checkpoint_350000/state.param_states.decoder.layers_5.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
|
3 |
+
size 168
|
checkpoint_350000/state.param_states.decoder.layers_5.pre_self_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cf9f29f81d641fafc25d008c94da480809c7865fd51abb53849e652e39cd45b2
|
3 |
+
size 1390
|
checkpoint_350000/state.param_states.decoder.layers_6.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
|
3 |
+
size 168
|
checkpoint_350000/state.param_states.decoder.layers_6.pre_cross_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bdc3423fbe1255223af0db9d87efd36ecb3e5b36e2789a8ccd0ae4d61421bf91
|
3 |
+
size 1404
|
checkpoint_350000/state.param_states.decoder.layers_6.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
|
3 |
+
size 168
|
checkpoint_350000/state.param_states.decoder.layers_6.pre_mlp_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2b9d49485a0bd5bb5bd89f2a14bbf2e9c0145e53654c32214121d629695401cf
|
3 |
+
size 1379
|
checkpoint_350000/state.param_states.decoder.layers_6.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
|
3 |
+
size 168
|
checkpoint_350000/state.param_states.decoder.layers_6.pre_self_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7532afb9e2fd184b44c560df07596ebf59a2568e93fb627ef463667dfaef4013
|
3 |
+
size 1390
|
checkpoint_350000/state.param_states.decoder.layers_7.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
|
3 |
+
size 168
|
checkpoint_350000/state.param_states.decoder.layers_7.pre_cross_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7d681a39e5d05c0368791cd15f27588687982e88c303b3520ed81628625d9d0c
|
3 |
+
size 1433
|
checkpoint_350000/state.param_states.decoder.layers_7.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
|
3 |
+
size 168
|
checkpoint_350000/state.param_states.decoder.layers_7.pre_mlp_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ad534326ab797f7d0eb2b05e29e4612375468094278561f8d1fcd295e6bd1ba9
|
3 |
+
size 1418
|
checkpoint_350000/state.param_states.decoder.layers_7.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0abc950cac11ef626f934932fe9764223fb94e32a0a61ee59b0e5bb8cb2426eb
|
3 |
+
size 168
|