mayank-mishra committed on
Commit
0a81cba
1 Parent(s): 862809c

update to r1.1

Browse files
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "activation_function": "gelu_pytorch_tanh",
3
  "architectures": [
4
  "GPTBigCodeForCausalLM"
5
  ],
@@ -22,7 +22,7 @@
22
  "scale_attention_softmax_in_fp32": true,
23
  "scale_attn_weights": true,
24
  "torch_dtype": "bfloat16",
25
- "transformers_version": "4.38.1",
26
  "use_cache": true,
27
  "vocab_size": 49152
28
  }
 
1
  {
2
+ "activation_function": "gelu",
3
  "architectures": [
4
  "GPTBigCodeForCausalLM"
5
  ],
 
22
  "scale_attention_softmax_in_fp32": true,
23
  "scale_attn_weights": true,
24
  "torch_dtype": "bfloat16",
25
+ "transformers_version": "4.41.2",
26
  "use_cache": true,
27
  "vocab_size": 49152
28
  }
generation_config.json CHANGED
@@ -3,5 +3,5 @@
3
  "bos_token_id": 0,
4
  "eos_token_id": 0,
5
  "pad_token_id": 0,
6
- "transformers_version": "4.38.1"
7
  }
 
3
  "bos_token_id": 0,
4
  "eos_token_id": 0,
5
  "pad_token_id": 0,
6
+ "transformers_version": "4.41.2"
7
  }
model-00001-of-00009.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:29a2622ae4c65993fbdb24731570b8e144b92083c743cd464740c53feedb07d6
3
  size 4952185256
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:22b893e90be19cc42647f7d76caef1bd7101b6904df709b93472265fa6e41594
3
  size 4952185256
model-00002-of-00009.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4ceaa3f12eaa9c465094ca4a1a96a76af66d434f456b501572fdd47459f5ab36
3
  size 4930227792
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dc7f98d43d5aa8531381ffd2b7995008f1471a707a57becf638d089c549edec8
3
  size 4930227792
model-00003-of-00009.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:68b205db105c140d016f85e80c2c27153ca557ad0095da542d34613d6ab27028
3
  size 4927118464
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1f56c8969bbdc7995f1c61123f4b63da7ff202a93e40fde98121ec9ccdc49556
3
  size 4927118464
model-00004-of-00009.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c4ad77a69ec76054eaf783c0f55070ae545ae1a6bf10d4457ec776696502cb94
3
  size 4930227864
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dd7060b8fac28950098ce792fc518a0a8af296f47e22709ccaad1ce8216591ea
3
  size 4930227864
model-00005-of-00009.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e9e5f77714b34e326b73a26684c5f98bfc883da65085fad9e28e25a3708194ab
3
  size 4927118464
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bbd071ecf07518991d9d82749d9c864a7e923eb82450048565e9121604f4cbe2
3
  size 4927118464
model-00006-of-00009.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c59ff4a90e1c82cb2788c2180cf37e0616b0920ff3fec480ac11e550d4ca6cdf
3
  size 4930227864
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b3a0e75fbd4db5862a20e23ce6ffbf69a4a28d59505085b8d82c1d61620cbf98
3
  size 4930227864
model-00007-of-00009.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f8cb945b3b369eee9e1020c3f3a6a89bc875ace3de1c69d0ac3b65dfa7ce990b
3
  size 4927118464
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8fee8bebaf2202e65cd8253898b317fc4a03a5a5cfb5bd6a01ccbf76a65d7c8b
3
  size 4927118464
model-00008-of-00009.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:405e07efd511ce7c5b7250310026be2a998068d3441f33bf15968c4ce8c4d04a
3
  size 4930227864
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1fa8ce48dbb754a3e762d10d3590c65fb0eb30b6f28044f37ad184c335ff6916
3
  size 4930227864
model-00009-of-00009.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:98f8e3576530d40a41001a6f0991cdd107e8d14147dfbbf1c5fa21f02eabf120
3
  size 679601176
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:62f5a5189fb992fb52b72861f432dc19123bef17f78c42e1db8a89b208b4b5ab
3
  size 679601176
tokenizer.json CHANGED
@@ -206,6 +206,7 @@
206
  "end_of_word_suffix": null,
207
  "fuse_unk": false,
208
  "byte_fallback": false,
 
209
  "vocab": {
210
  "<|endoftext|>": 0,
211
  "<fim_prefix>": 1,
 
206
  "end_of_word_suffix": null,
207
  "fuse_unk": false,
208
  "byte_fallback": false,
209
+ "ignore_merges": false,
210
  "vocab": {
211
  "<|endoftext|>": 0,
212
  "<fim_prefix>": 1,
tokenizer_config.json CHANGED
@@ -178,7 +178,7 @@
178
  "bos_token": "<|endoftext|>",
179
  "clean_up_tokenization_spaces": true,
180
  "eos_token": "<|endoftext|>",
181
- "model_max_length": 9223372036854775807,
182
  "pad_token": "<|endoftext|>",
183
  "padding_side": "left",
184
  "tokenizer_class": "GPT2Tokenizer",
 
178
  "bos_token": "<|endoftext|>",
179
  "clean_up_tokenization_spaces": true,
180
  "eos_token": "<|endoftext|>",
181
+ "model_max_length": 8192,
182
  "pad_token": "<|endoftext|>",
183
  "padding_side": "left",
184
  "tokenizer_class": "GPT2Tokenizer",