aapot
commited on
Commit
·
1e65451
1
Parent(s):
2cbe506
Add 850k train step and HF flax model
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- checkpoint_850000/checkpoint +3 -0
- checkpoint_850000/state.param_states.decoder.decoder_norm.scale.v/.zarray +3 -0
- checkpoint_850000/state.param_states.decoder.decoder_norm.scale.v/0 +3 -0
- checkpoint_850000/state.param_states.decoder.layers_0.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_850000/state.param_states.decoder.layers_0.pre_cross_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_850000/state.param_states.decoder.layers_0.pre_mlp_layer_norm.scale.v/.zarray +3 -0
- checkpoint_850000/state.param_states.decoder.layers_0.pre_mlp_layer_norm.scale.v/0 +3 -0
- checkpoint_850000/state.param_states.decoder.layers_0.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_850000/state.param_states.decoder.layers_0.pre_self_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_850000/state.param_states.decoder.layers_1.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_850000/state.param_states.decoder.layers_1.pre_cross_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_850000/state.param_states.decoder.layers_1.pre_mlp_layer_norm.scale.v/.zarray +3 -0
- checkpoint_850000/state.param_states.decoder.layers_1.pre_mlp_layer_norm.scale.v/0 +3 -0
- checkpoint_850000/state.param_states.decoder.layers_1.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_850000/state.param_states.decoder.layers_1.pre_self_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_850000/state.param_states.decoder.layers_10.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_850000/state.param_states.decoder.layers_10.pre_cross_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_850000/state.param_states.decoder.layers_10.pre_mlp_layer_norm.scale.v/.zarray +3 -0
- checkpoint_850000/state.param_states.decoder.layers_10.pre_mlp_layer_norm.scale.v/0 +3 -0
- checkpoint_850000/state.param_states.decoder.layers_10.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_850000/state.param_states.decoder.layers_10.pre_self_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_850000/state.param_states.decoder.layers_11.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_850000/state.param_states.decoder.layers_11.pre_cross_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_850000/state.param_states.decoder.layers_11.pre_mlp_layer_norm.scale.v/.zarray +3 -0
- checkpoint_850000/state.param_states.decoder.layers_11.pre_mlp_layer_norm.scale.v/0 +3 -0
- checkpoint_850000/state.param_states.decoder.layers_11.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_850000/state.param_states.decoder.layers_11.pre_self_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_850000/state.param_states.decoder.layers_12.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_850000/state.param_states.decoder.layers_12.pre_cross_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_850000/state.param_states.decoder.layers_12.pre_mlp_layer_norm.scale.v/.zarray +3 -0
- checkpoint_850000/state.param_states.decoder.layers_12.pre_mlp_layer_norm.scale.v/0 +3 -0
- checkpoint_850000/state.param_states.decoder.layers_12.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_850000/state.param_states.decoder.layers_12.pre_self_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_850000/state.param_states.decoder.layers_13.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_850000/state.param_states.decoder.layers_13.pre_cross_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_850000/state.param_states.decoder.layers_13.pre_mlp_layer_norm.scale.v/.zarray +3 -0
- checkpoint_850000/state.param_states.decoder.layers_13.pre_mlp_layer_norm.scale.v/0 +3 -0
- checkpoint_850000/state.param_states.decoder.layers_13.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_850000/state.param_states.decoder.layers_13.pre_self_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_850000/state.param_states.decoder.layers_14.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_850000/state.param_states.decoder.layers_14.pre_cross_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_850000/state.param_states.decoder.layers_14.pre_mlp_layer_norm.scale.v/.zarray +3 -0
- checkpoint_850000/state.param_states.decoder.layers_14.pre_mlp_layer_norm.scale.v/0 +3 -0
- checkpoint_850000/state.param_states.decoder.layers_14.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_850000/state.param_states.decoder.layers_14.pre_self_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_850000/state.param_states.decoder.layers_15.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_850000/state.param_states.decoder.layers_15.pre_cross_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_850000/state.param_states.decoder.layers_15.pre_mlp_layer_norm.scale.v/.zarray +3 -0
- checkpoint_850000/state.param_states.decoder.layers_15.pre_mlp_layer_norm.scale.v/0 +3 -0
- checkpoint_850000/state.param_states.decoder.layers_15.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
checkpoint_850000/checkpoint
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:55230f320637e7cceb015fe037c01fc844802b19d306aed5d400a757bc78a874
|
3 |
+
size 8513341
|
checkpoint_850000/state.param_states.decoder.decoder_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
|
3 |
+
size 170
|
checkpoint_850000/state.param_states.decoder.decoder_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4ea47d9a3de274b30abdfe13ef9b1812a8ea0c4693b0a0cf5da00f3fd9f57252
|
3 |
+
size 3668
|
checkpoint_850000/state.param_states.decoder.layers_0.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
|
3 |
+
size 170
|
checkpoint_850000/state.param_states.decoder.layers_0.pre_cross_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ba1669e48da515debc8d9694247ebccd9c55d9d849d0263f377b227b37828adf
|
3 |
+
size 3657
|
checkpoint_850000/state.param_states.decoder.layers_0.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
|
3 |
+
size 170
|
checkpoint_850000/state.param_states.decoder.layers_0.pre_mlp_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:23ba8877b57f0ca58c684baa3ea76a9ef91562e6dacdcdd390d785292657fd5e
|
3 |
+
size 3447
|
checkpoint_850000/state.param_states.decoder.layers_0.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
|
3 |
+
size 170
|
checkpoint_850000/state.param_states.decoder.layers_0.pre_self_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fb2125d50209eec9a270a4f806541492d6eaaecaea8742a41f4bc90c250966a1
|
3 |
+
size 3555
|
checkpoint_850000/state.param_states.decoder.layers_1.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
|
3 |
+
size 170
|
checkpoint_850000/state.param_states.decoder.layers_1.pre_cross_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:543aec1d6c3f1ea14e73c23879a2b1559b32fe2dc2c4eb4b2402862e06f0cabf
|
3 |
+
size 3583
|
checkpoint_850000/state.param_states.decoder.layers_1.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
|
3 |
+
size 170
|
checkpoint_850000/state.param_states.decoder.layers_1.pre_mlp_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:26ff19a77dbdd533fc87c9c6fde3a0860b7a8e4c6308f08b0c6e2bd27f02cb78
|
3 |
+
size 3494
|
checkpoint_850000/state.param_states.decoder.layers_1.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
|
3 |
+
size 170
|
checkpoint_850000/state.param_states.decoder.layers_1.pre_self_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6ca40bdcbbc3f0e904c3932d3c6af2ac5cbbb4b5183e49fe174ef75fda609e26
|
3 |
+
size 3700
|
checkpoint_850000/state.param_states.decoder.layers_10.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
|
3 |
+
size 170
|
checkpoint_850000/state.param_states.decoder.layers_10.pre_cross_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:28d59817a19a6b5c7cc8bef6826bded4241a33262089bbf1b4558118b1f72494
|
3 |
+
size 3637
|
checkpoint_850000/state.param_states.decoder.layers_10.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
|
3 |
+
size 170
|
checkpoint_850000/state.param_states.decoder.layers_10.pre_mlp_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:375843aaaff5abf442599e2f574c00dd2c6c0aa540ca0d90436cfad2311cce33
|
3 |
+
size 3611
|
checkpoint_850000/state.param_states.decoder.layers_10.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
|
3 |
+
size 170
|
checkpoint_850000/state.param_states.decoder.layers_10.pre_self_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a456787e026e4c0f2e9d86517d569906cb47794b954845808f78c6628a164136
|
3 |
+
size 3688
|
checkpoint_850000/state.param_states.decoder.layers_11.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
|
3 |
+
size 170
|
checkpoint_850000/state.param_states.decoder.layers_11.pre_cross_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f9bd80b6fbc4fe774faff72dac7f4847b4cbc1800d1deecc243a6de5308950d7
|
3 |
+
size 3583
|
checkpoint_850000/state.param_states.decoder.layers_11.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
|
3 |
+
size 170
|
checkpoint_850000/state.param_states.decoder.layers_11.pre_mlp_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:98c11b320bbe10e659f4eae62256f196665bce4824b808a4fc80746bf9e99901
|
3 |
+
size 3621
|
checkpoint_850000/state.param_states.decoder.layers_11.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
|
3 |
+
size 170
|
checkpoint_850000/state.param_states.decoder.layers_11.pre_self_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ee5aa3a4045507b3c664190293244c7fd23706fc15095d13acd6d8c3018ba085
|
3 |
+
size 3576
|
checkpoint_850000/state.param_states.decoder.layers_12.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
|
3 |
+
size 170
|
checkpoint_850000/state.param_states.decoder.layers_12.pre_cross_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:19f649cccded7e0f43a9fd06773b5ef76fc6fb248b0e43d07916462c09c873e1
|
3 |
+
size 3655
|
checkpoint_850000/state.param_states.decoder.layers_12.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
|
3 |
+
size 170
|
checkpoint_850000/state.param_states.decoder.layers_12.pre_mlp_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b938cd4c3d63bdae8ffa5fbf816088ab306e0cb8501d515d37a2a7b31ef54288
|
3 |
+
size 3641
|
checkpoint_850000/state.param_states.decoder.layers_12.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
|
3 |
+
size 170
|
checkpoint_850000/state.param_states.decoder.layers_12.pre_self_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e714b0da7d546df4a743bd7cfb2f47bac822fcb6ecd0ded545c2957fa950ed3e
|
3 |
+
size 3597
|
checkpoint_850000/state.param_states.decoder.layers_13.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
|
3 |
+
size 170
|
checkpoint_850000/state.param_states.decoder.layers_13.pre_cross_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8ae7c6d8b00189ae1f66f760e3a6d51509e2252e60d234f2c5aacc62542d3472
|
3 |
+
size 3602
|
checkpoint_850000/state.param_states.decoder.layers_13.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
|
3 |
+
size 170
|
checkpoint_850000/state.param_states.decoder.layers_13.pre_mlp_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7f39f298d9be87c44fbe835eb8c3ae896c44477b3348ff24f4a2c5551a8b46fe
|
3 |
+
size 3647
|
checkpoint_850000/state.param_states.decoder.layers_13.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
|
3 |
+
size 170
|
checkpoint_850000/state.param_states.decoder.layers_13.pre_self_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:afcdcf731544652456285c924a94b9a3cebc98c83c5266a67d51fbc65085d17f
|
3 |
+
size 3644
|
checkpoint_850000/state.param_states.decoder.layers_14.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
|
3 |
+
size 170
|
checkpoint_850000/state.param_states.decoder.layers_14.pre_cross_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5857fc0a1dbe56c8ea7dd3b2814c4a3bc9acfa1d25f6fd5d18fcdc4910b09c81
|
3 |
+
size 3633
|
checkpoint_850000/state.param_states.decoder.layers_14.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
|
3 |
+
size 170
|
checkpoint_850000/state.param_states.decoder.layers_14.pre_mlp_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4b13de9ce0e0a90cfb5f0f5cdbf842c3745bb4be6fa0d903e707137cf3640029
|
3 |
+
size 3599
|
checkpoint_850000/state.param_states.decoder.layers_14.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
|
3 |
+
size 170
|
checkpoint_850000/state.param_states.decoder.layers_14.pre_self_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f7a898ed64425eccc3102a603b30488fca78ca9a4f5bfeca18da8deedb704126
|
3 |
+
size 3588
|
checkpoint_850000/state.param_states.decoder.layers_15.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
|
3 |
+
size 170
|
checkpoint_850000/state.param_states.decoder.layers_15.pre_cross_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7b762736127251279db69cb568f3351af09c9f5fcc860ac79a7eed22f04a8cfa
|
3 |
+
size 3669
|
checkpoint_850000/state.param_states.decoder.layers_15.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
|
3 |
+
size 170
|
checkpoint_850000/state.param_states.decoder.layers_15.pre_mlp_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b0a89cbf87f4b0ea6bb3a93164550a9bd670d6660326d7b4d131ec619881b887
|
3 |
+
size 3570
|
checkpoint_850000/state.param_states.decoder.layers_15.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
|
3 |
+
size 170
|