TheRadDani committed on
Commit
400f05b
·
verified ·
1 Parent(s): 97d80d6

RLHF model of StarCoder

Browse files
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c9e8676d7c37b61e40b712f7e796f2b9273321bf9d2dc46cab4640b63b83af3c
3
  size 656601304
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b2164791914a2399a54aed9ae2e0b3a6214198a8d03664276eaf378edfeccdca
3
  size 656601304
special_tokens_map.json CHANGED
@@ -34,13 +34,7 @@
34
  "rstrip": false,
35
  "single_word": false
36
  },
37
- "pad_token": {
38
- "content": "[PAD]",
39
- "lstrip": false,
40
- "normalized": false,
41
- "rstrip": false,
42
- "single_word": false
43
- },
44
  "unk_token": {
45
  "content": "<|endoftext|>",
46
  "lstrip": false,
 
34
  "rstrip": false,
35
  "single_word": false
36
  },
37
+ "pad_token": "<|endoftext|>",
 
 
 
 
 
 
38
  "unk_token": {
39
  "content": "<|endoftext|>",
40
  "lstrip": false,
tokenizer.json CHANGED
@@ -1,20 +1,15 @@
1
  {
2
  "version": "1.0",
3
- "truncation": {
4
- "direction": "Right",
5
- "max_length": 256,
6
- "strategy": "LongestFirst",
7
- "stride": 0
8
- },
9
  "padding": {
10
  "strategy": {
11
- "Fixed": 256
12
  },
13
- "direction": "Right",
14
  "pad_to_multiple_of": null,
15
- "pad_id": 49152,
16
  "pad_type_id": 0,
17
- "pad_token": "[PAD]"
18
  },
19
  "added_tokens": [
20
  {
@@ -187,15 +182,6 @@
187
  "rstrip": false,
188
  "normalized": false,
189
  "special": true
190
- },
191
- {
192
- "id": 49152,
193
- "content": "[PAD]",
194
- "single_word": false,
195
- "lstrip": false,
196
- "rstrip": false,
197
- "normalized": false,
198
- "special": true
199
  }
200
  ],
201
  "normalizer": null,
 
1
  {
2
  "version": "1.0",
3
+ "truncation": null,
 
 
 
 
 
4
  "padding": {
5
  "strategy": {
6
+ "Fixed": 32
7
  },
8
+ "direction": "Left",
9
  "pad_to_multiple_of": null,
10
+ "pad_id": 0,
11
  "pad_type_id": 0,
12
+ "pad_token": "<|endoftext|>"
13
  },
14
  "added_tokens": [
15
  {
 
182
  "rstrip": false,
183
  "normalized": false,
184
  "special": true
 
 
 
 
 
 
 
 
 
185
  }
186
  ],
187
  "normalizer": null,
tokenizer_config.json CHANGED
@@ -152,14 +152,6 @@
152
  "rstrip": false,
153
  "single_word": false,
154
  "special": true
155
- },
156
- "49152": {
157
- "content": "[PAD]",
158
- "lstrip": false,
159
- "normalized": false,
160
- "rstrip": false,
161
- "single_word": false,
162
- "special": true
163
  }
164
  },
165
  "additional_special_tokens": [
@@ -187,7 +179,8 @@
187
  "clean_up_tokenization_spaces": true,
188
  "eos_token": "<|endoftext|>",
189
  "model_max_length": 1000000000000000019884624838656,
190
- "pad_token": "[PAD]",
 
191
  "tokenizer_class": "GPT2Tokenizer",
192
  "unk_token": "<|endoftext|>",
193
  "vocab_size": 49152
 
152
  "rstrip": false,
153
  "single_word": false,
154
  "special": true
 
 
 
 
 
 
 
 
155
  }
156
  },
157
  "additional_special_tokens": [
 
179
  "clean_up_tokenization_spaces": true,
180
  "eos_token": "<|endoftext|>",
181
  "model_max_length": 1000000000000000019884624838656,
182
+ "pad_token": "<|endoftext|>",
183
+ "padding_side": "left",
184
  "tokenizer_class": "GPT2Tokenizer",
185
  "unk_token": "<|endoftext|>",
186
  "vocab_size": 49152
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:46ab18728d598e8df336a50de9eae8756e806779df4977d5db38d49239627d96
3
  size 4856
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1e802996ed957debf7d3bf3ff709646a6f063fe24e0a857449a3a18b03a0005b
3
  size 4856