TheRadDani committed on
Commit
ab80262
1 Parent(s): 400f05b

RLHF model of StarCoder

Browse files
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b2164791914a2399a54aed9ae2e0b3a6214198a8d03664276eaf378edfeccdca
3
  size 656601304
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7238b285b314e21148702302531cde42d2b900153ce19a27e7a7aeac87e5fe6b
3
  size 656601304
special_tokens_map.json CHANGED
@@ -34,7 +34,13 @@
34
  "rstrip": false,
35
  "single_word": false
36
  },
37
- "pad_token": "<|endoftext|>",
 
 
 
 
 
 
38
  "unk_token": {
39
  "content": "<|endoftext|>",
40
  "lstrip": false,
 
34
  "rstrip": false,
35
  "single_word": false
36
  },
37
+ "pad_token": {
38
+ "content": "<|endoftext|>",
39
+ "lstrip": false,
40
+ "normalized": false,
41
+ "rstrip": false,
42
+ "single_word": false
43
+ },
44
  "unk_token": {
45
  "content": "<|endoftext|>",
46
  "lstrip": false,
tokenizer.json CHANGED
@@ -1,9 +1,14 @@
1
  {
2
  "version": "1.0",
3
- "truncation": null,
 
 
 
 
 
4
  "padding": {
5
  "strategy": {
6
- "Fixed": 32
7
  },
8
  "direction": "Left",
9
  "pad_to_multiple_of": null,
 
1
  {
2
  "version": "1.0",
3
+ "truncation": {
4
+ "direction": "Right",
5
+ "max_length": 256,
6
+ "strategy": "LongestFirst",
7
+ "stride": 0
8
+ },
9
  "padding": {
10
  "strategy": {
11
+ "Fixed": 256
12
  },
13
  "direction": "Left",
14
  "pad_to_multiple_of": null,
tokenizer_config.json CHANGED
@@ -178,8 +178,11 @@
178
  "bos_token": "<|endoftext|>",
179
  "clean_up_tokenization_spaces": true,
180
  "eos_token": "<|endoftext|>",
 
181
  "model_max_length": 1000000000000000019884624838656,
 
182
  "pad_token": "<|endoftext|>",
 
183
  "padding_side": "left",
184
  "tokenizer_class": "GPT2Tokenizer",
185
  "unk_token": "<|endoftext|>",
 
178
  "bos_token": "<|endoftext|>",
179
  "clean_up_tokenization_spaces": true,
180
  "eos_token": "<|endoftext|>",
181
+ "max_length": 32,
182
  "model_max_length": 1000000000000000019884624838656,
183
+ "pad_to_multiple_of": null,
184
  "pad_token": "<|endoftext|>",
185
+ "pad_token_type_id": 0,
186
  "padding_side": "left",
187
  "tokenizer_class": "GPT2Tokenizer",
188
  "unk_token": "<|endoftext|>",
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1e802996ed957debf7d3bf3ff709646a6f063fe24e0a857449a3a18b03a0005b
3
  size 4856
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:46ab18728d598e8df336a50de9eae8756e806779df4977d5db38d49239627d96
3
  size 4856