aapot
commited on
Commit
·
370a38a
1
Parent(s):
94a7267
Add 620k train step and HF flax model
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- checkpoint_620000/checkpoint +3 -0
- checkpoint_620000/state.param_states.decoder.decoder_norm.scale.v/.zarray +3 -0
- checkpoint_620000/state.param_states.decoder.decoder_norm.scale.v/0 +3 -0
- checkpoint_620000/state.param_states.decoder.layers_0.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_620000/state.param_states.decoder.layers_0.pre_cross_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_620000/state.param_states.decoder.layers_0.pre_mlp_layer_norm.scale.v/.zarray +3 -0
- checkpoint_620000/state.param_states.decoder.layers_0.pre_mlp_layer_norm.scale.v/0 +3 -0
- checkpoint_620000/state.param_states.decoder.layers_0.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_620000/state.param_states.decoder.layers_0.pre_self_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_620000/state.param_states.decoder.layers_1.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_620000/state.param_states.decoder.layers_1.pre_cross_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_620000/state.param_states.decoder.layers_1.pre_mlp_layer_norm.scale.v/.zarray +3 -0
- checkpoint_620000/state.param_states.decoder.layers_1.pre_mlp_layer_norm.scale.v/0 +3 -0
- checkpoint_620000/state.param_states.decoder.layers_1.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_620000/state.param_states.decoder.layers_1.pre_self_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_620000/state.param_states.decoder.layers_10.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_620000/state.param_states.decoder.layers_10.pre_cross_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_620000/state.param_states.decoder.layers_10.pre_mlp_layer_norm.scale.v/.zarray +3 -0
- checkpoint_620000/state.param_states.decoder.layers_10.pre_mlp_layer_norm.scale.v/0 +3 -0
- checkpoint_620000/state.param_states.decoder.layers_10.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_620000/state.param_states.decoder.layers_10.pre_self_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_620000/state.param_states.decoder.layers_11.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_620000/state.param_states.decoder.layers_11.pre_cross_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_620000/state.param_states.decoder.layers_11.pre_mlp_layer_norm.scale.v/.zarray +3 -0
- checkpoint_620000/state.param_states.decoder.layers_11.pre_mlp_layer_norm.scale.v/0 +3 -0
- checkpoint_620000/state.param_states.decoder.layers_11.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_620000/state.param_states.decoder.layers_11.pre_self_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_620000/state.param_states.decoder.layers_12.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_620000/state.param_states.decoder.layers_12.pre_cross_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_620000/state.param_states.decoder.layers_12.pre_mlp_layer_norm.scale.v/.zarray +3 -0
- checkpoint_620000/state.param_states.decoder.layers_12.pre_mlp_layer_norm.scale.v/0 +3 -0
- checkpoint_620000/state.param_states.decoder.layers_12.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_620000/state.param_states.decoder.layers_12.pre_self_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_620000/state.param_states.decoder.layers_13.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_620000/state.param_states.decoder.layers_13.pre_cross_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_620000/state.param_states.decoder.layers_13.pre_mlp_layer_norm.scale.v/.zarray +3 -0
- checkpoint_620000/state.param_states.decoder.layers_13.pre_mlp_layer_norm.scale.v/0 +3 -0
- checkpoint_620000/state.param_states.decoder.layers_13.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_620000/state.param_states.decoder.layers_13.pre_self_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_620000/state.param_states.decoder.layers_14.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_620000/state.param_states.decoder.layers_14.pre_cross_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_620000/state.param_states.decoder.layers_14.pre_mlp_layer_norm.scale.v/.zarray +3 -0
- checkpoint_620000/state.param_states.decoder.layers_14.pre_mlp_layer_norm.scale.v/0 +3 -0
- checkpoint_620000/state.param_states.decoder.layers_14.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_620000/state.param_states.decoder.layers_14.pre_self_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_620000/state.param_states.decoder.layers_15.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_620000/state.param_states.decoder.layers_15.pre_cross_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_620000/state.param_states.decoder.layers_15.pre_mlp_layer_norm.scale.v/.zarray +3 -0
- checkpoint_620000/state.param_states.decoder.layers_15.pre_mlp_layer_norm.scale.v/0 +3 -0
- checkpoint_620000/state.param_states.decoder.layers_15.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
checkpoint_620000/checkpoint
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f37e9f3cca180eefa1eeb9c975707b162bd591ceca9e442322a167198e4320b5
|
3 |
+
size 8513341
|
checkpoint_620000/state.param_states.decoder.decoder_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
|
3 |
+
size 170
|
checkpoint_620000/state.param_states.decoder.decoder_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a47d1e4ae7c5f4bbee5e7328caad2e4a563b65d81b54d295cbc2820167574f3e
|
3 |
+
size 3657
|
checkpoint_620000/state.param_states.decoder.layers_0.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
|
3 |
+
size 170
|
checkpoint_620000/state.param_states.decoder.layers_0.pre_cross_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f6aa665c9f40173b6bc85cae054b96565629ce925120de02388c46f1d7dcf7ce
|
3 |
+
size 3654
|
checkpoint_620000/state.param_states.decoder.layers_0.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
|
3 |
+
size 170
|
checkpoint_620000/state.param_states.decoder.layers_0.pre_mlp_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dbc8b9ac567cfcef85f676fa9a62304dd5778284b91591525daf50ed47df4271
|
3 |
+
size 3428
|
checkpoint_620000/state.param_states.decoder.layers_0.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
|
3 |
+
size 170
|
checkpoint_620000/state.param_states.decoder.layers_0.pre_self_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:850cc70b987875220dc77018fcf32acf455aa293ad88aa26a8ea748117e3d8b6
|
3 |
+
size 3549
|
checkpoint_620000/state.param_states.decoder.layers_1.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
|
3 |
+
size 170
|
checkpoint_620000/state.param_states.decoder.layers_1.pre_cross_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d9a2745069f8edfa0842ed3b569dfffd20a3e8cb6997a3fa5a182fbc074065a1
|
3 |
+
size 3591
|
checkpoint_620000/state.param_states.decoder.layers_1.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
|
3 |
+
size 170
|
checkpoint_620000/state.param_states.decoder.layers_1.pre_mlp_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e8665727c27e88bacc4dfbf65ec7db6066320a82fe801a0977e63d0c5e5653a5
|
3 |
+
size 3478
|
checkpoint_620000/state.param_states.decoder.layers_1.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
|
3 |
+
size 170
|
checkpoint_620000/state.param_states.decoder.layers_1.pre_self_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7ea2e8d6dde13abd324eee86ae8e647f8110ca42b4d6066bb26da98948c84629
|
3 |
+
size 3695
|
checkpoint_620000/state.param_states.decoder.layers_10.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
|
3 |
+
size 170
|
checkpoint_620000/state.param_states.decoder.layers_10.pre_cross_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dabf586f58a22a5d272f9b320824f1757cfe5345a2c371a832708a80fc60e138
|
3 |
+
size 3665
|
checkpoint_620000/state.param_states.decoder.layers_10.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
|
3 |
+
size 170
|
checkpoint_620000/state.param_states.decoder.layers_10.pre_mlp_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:44b24fc3169412fd94662f10877b68c533262e8fca45a8707f05040a0cf9bf00
|
3 |
+
size 3578
|
checkpoint_620000/state.param_states.decoder.layers_10.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
|
3 |
+
size 170
|
checkpoint_620000/state.param_states.decoder.layers_10.pre_self_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f51ae11aaa36b4127ad60b86b3d39f954dd1d130d54c791ed65671b830ca7820
|
3 |
+
size 3684
|
checkpoint_620000/state.param_states.decoder.layers_11.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
|
3 |
+
size 170
|
checkpoint_620000/state.param_states.decoder.layers_11.pre_cross_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:db501ad071c0eaed3c6f4bb4d57909d92f5580728e779cdd7e8593f5a4cd6d25
|
3 |
+
size 3563
|
checkpoint_620000/state.param_states.decoder.layers_11.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
|
3 |
+
size 170
|
checkpoint_620000/state.param_states.decoder.layers_11.pre_mlp_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cecbf035de98d3beb09386b19bc8cfe9cb2f5b9d5d4c4ddb5a2142bc8c8f40c1
|
3 |
+
size 3591
|
checkpoint_620000/state.param_states.decoder.layers_11.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
|
3 |
+
size 170
|
checkpoint_620000/state.param_states.decoder.layers_11.pre_self_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c7ccfb4238f1dbe6d67445b497055b2e21bcac016a9df279cb5e4f5c2d526fff
|
3 |
+
size 3567
|
checkpoint_620000/state.param_states.decoder.layers_12.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
|
3 |
+
size 170
|
checkpoint_620000/state.param_states.decoder.layers_12.pre_cross_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fd5aa96bd35a5d64670ec7915ee719ead9b6f36ebc103c976985fa1056732dfd
|
3 |
+
size 3630
|
checkpoint_620000/state.param_states.decoder.layers_12.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
|
3 |
+
size 170
|
checkpoint_620000/state.param_states.decoder.layers_12.pre_mlp_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:53c5a33ec3a12295ede4ccfc1742813f3254007dbd50dac88cfc49a2c79c43b8
|
3 |
+
size 3599
|
checkpoint_620000/state.param_states.decoder.layers_12.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
|
3 |
+
size 170
|
checkpoint_620000/state.param_states.decoder.layers_12.pre_self_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7a8ba724a463f15d55aa83aac10a0082988ab2e641f2b96fb285468a946f57a9
|
3 |
+
size 3593
|
checkpoint_620000/state.param_states.decoder.layers_13.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
|
3 |
+
size 170
|
checkpoint_620000/state.param_states.decoder.layers_13.pre_cross_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:99ca04b3e4f197c1c22f530aa91e5fcfea3f87520e4a448b36f986bf5a93cbc7
|
3 |
+
size 3562
|
checkpoint_620000/state.param_states.decoder.layers_13.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
|
3 |
+
size 170
|
checkpoint_620000/state.param_states.decoder.layers_13.pre_mlp_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ccb5c98250b4bd36e3f14a791e2b2c4f8edd0a95a3a2e8e7acdbf4824220d8d0
|
3 |
+
size 3601
|
checkpoint_620000/state.param_states.decoder.layers_13.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
|
3 |
+
size 170
|
checkpoint_620000/state.param_states.decoder.layers_13.pre_self_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:31419ef3d80c90a484f703df8fbc9e6c03c99204b96b424212b7cfd4eedf7113
|
3 |
+
size 3666
|
checkpoint_620000/state.param_states.decoder.layers_14.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
|
3 |
+
size 170
|
checkpoint_620000/state.param_states.decoder.layers_14.pre_cross_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a4f22f217b8db4a1e4c29dcf45c316e77048e173d16582b2e3ee5ec1bf002690
|
3 |
+
size 3663
|
checkpoint_620000/state.param_states.decoder.layers_14.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
|
3 |
+
size 170
|
checkpoint_620000/state.param_states.decoder.layers_14.pre_mlp_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2a04f9929ba6e6b64cafd48853fad1ec030879fa457cc308eb3d3339b9c843a4
|
3 |
+
size 3587
|
checkpoint_620000/state.param_states.decoder.layers_14.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
|
3 |
+
size 170
|
checkpoint_620000/state.param_states.decoder.layers_14.pre_self_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:50a70912b19cde1887aefaac7605ee39913dea5df67f4399f332684ed75fdc68
|
3 |
+
size 3586
|
checkpoint_620000/state.param_states.decoder.layers_15.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
|
3 |
+
size 170
|
checkpoint_620000/state.param_states.decoder.layers_15.pre_cross_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7371ca956266f518b0b896766605c9d0dae96e6388e78b610bcdcc1aa1bfe5e6
|
3 |
+
size 3645
|
checkpoint_620000/state.param_states.decoder.layers_15.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
|
3 |
+
size 170
|
checkpoint_620000/state.param_states.decoder.layers_15.pre_mlp_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3eead9060f0c24ca50a2d0f4afe8c8b9226520c135007e7991990aaababa45fe
|
3 |
+
size 3554
|
checkpoint_620000/state.param_states.decoder.layers_15.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
|
3 |
+
size 170
|