jburtoft committed on
Commit
f069ffa
1 Parent(s): 7548fe9

9267ee116e0be22e44ffd4e55d05f19b5b9cfbabd1760bf07b6f38d5aa307710

Browse files
.gitattributes CHANGED
@@ -33,3 +33,13 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
 
 
 
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ compiled/13f69de924bfe5a0f650.neff filter=lfs diff=lfs merge=lfs -text
37
+ compiled/24a88b503bb13eebc633.neff filter=lfs diff=lfs merge=lfs -text
38
+ compiled/4d315c567ee64f5c3c52.neff filter=lfs diff=lfs merge=lfs -text
39
+ compiled/91d9e9131e21917fb676.neff filter=lfs diff=lfs merge=lfs -text
40
+ compiled/a2673088cd059202b6c2.neff filter=lfs diff=lfs merge=lfs -text
41
+ compiled/b480b1deeb6e4c40c9d4.neff filter=lfs diff=lfs merge=lfs -text
42
+ compiled/b59dca76c353105042b2.neff filter=lfs diff=lfs merge=lfs -text
43
+ compiled/d9a9b3aab1095d21dc94.neff filter=lfs diff=lfs merge=lfs -text
44
+ compiled/e6af685a35c321de6779.neff filter=lfs diff=lfs merge=lfs -text
45
+ compiled/ee57f53ab745d1cbe07e.neff filter=lfs diff=lfs merge=lfs -text
checkpoint/pytorch_model.bin/p97.model.layers.10.mlp.down_proj.weight ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:49b4ee604e7d7e179f251f097927f0eafc5fc52df7a9ec65044c33abf2bcf7f5
3
+ size 180355961
checkpoint/pytorch_model.bin/p98.model.layers.10.input_layernorm.weight ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b5abd4edb11af6e901b4b4d0bc5c097d2932ff2029280a1085407840c7dc5af4
3
+ size 17279
checkpoint/pytorch_model.bin/p99.model.layers.10.post_attention_layernorm.weight ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:528205bd1dc0e4eba76915767798b7008a39dda5a51fd73b994a871d2d2b1c90
3
+ size 17306
compiled/13f69de924bfe5a0f650.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:65b2f7cff6c7bf24eab41ce1faae0057004a8463dfce36d87606e6727eda2987
3
+ size 14767104
compiled/24a88b503bb13eebc633.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f42285118e3b6f96375126454974d7ae5be886b1d51f2c2c61525e13f93f44f5
3
+ size 13487104
compiled/4d315c567ee64f5c3c52.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:01965060bdfa4c4f95d0f85b9d8e6e276c05c990d62e614a7cd1160aa23aa165
3
+ size 13036544
compiled/91d9e9131e21917fb676.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2438ff1af0ed8d1ab17994bb45c3877d2cf4ccd832916c7f25f60545f87a8a5e
3
+ size 17368064
compiled/a2673088cd059202b6c2.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:88343a361ff47156aa698912016ccca4ff6d379cd3d2b008b2cecce2b5a6becb
3
+ size 13364224
compiled/b480b1deeb6e4c40c9d4.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2990f48d8428ab3408af8391ea76778a42eb7c32e1531e1e429cfc7de1b2734e
3
+ size 26819584
compiled/b59dca76c353105042b2.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3a45a9c1cc7e68f2bab451e0fa2303004e0f4997ac30d6a83fe5d85638bdab1f
3
+ size 12555264
compiled/d9a9b3aab1095d21dc94.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7e5a75299c00e8e18567124d10abc32c2b23648937e88b7696f1021f0c8836d4
3
+ size 12493824
compiled/e6af685a35c321de6779.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bd59c62e2962131c1ce08765cf8eb9ba1d935d63421c86c4e5beb59602265678
3
+ size 12678144
compiled/ee57f53ab745d1cbe07e.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2f90883e287b09fd487239b1c121f27c9e1d8f7a6d79376e4609e592ba130c79
3
+ size 12944384
config.json ADDED
@@ -0,0 +1,36 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "CodeLlama-7b-hf/config.json",
3
+ "architectures": [
4
+ "LlamaForCausalLM"
5
+ ],
6
+ "attention_bias": false,
7
+ "bos_token_id": 1,
8
+ "eos_token_id": 2,
9
+ "hidden_act": "silu",
10
+ "hidden_size": 4096,
11
+ "initializer_range": 0.02,
12
+ "intermediate_size": 11008,
13
+ "max_position_embeddings": 16384,
14
+ "model_type": "llama",
15
+ "neuron": {
16
+ "auto_cast_type": "fp16",
17
+ "batch_size": 1,
18
+ "compiler_type": "neuronx-cc",
19
+ "compiler_version": "2.11.0.34+c5231f848",
20
+ "num_cores": 2,
21
+ "sequence_length": 2048,
22
+ "task": "text-generation"
23
+ },
24
+ "num_attention_heads": 32,
25
+ "num_hidden_layers": 32,
26
+ "num_key_value_heads": 32,
27
+ "pretraining_tp": 1,
28
+ "rms_norm_eps": 1e-05,
29
+ "rope_scaling": null,
30
+ "rope_theta": 1000000,
31
+ "tie_word_embeddings": false,
32
+ "torch_dtype": "bfloat16",
33
+ "transformers_version": "4.35.0",
34
+ "use_cache": true,
35
+ "vocab_size": 32016
36
+ }
generation_config.json ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ {
2
+ "_from_model_config": true,
3
+ "bos_token_id": 1,
4
+ "eos_token_id": 2,
5
+ "transformers_version": "4.35.0"
6
+ }