Text Generation
Transformers
Safetensors
English
llama
code
hpc
parallel
axonn
text-generation-inference
daniellnichols committed on
Commit
d539aad
·
verified ·
1 Parent(s): 81f05ea

add tokenizer to v2.1

Browse files
Files changed (3) hide show
  1. README.md +6 -6
  2. tokenizer.json +1 -0
  3. tokenizer_config.json +1 -0
README.md CHANGED
@@ -1,17 +1,17 @@
1
  ---
2
- library_name: transformers
3
- tags:
4
- - code
5
- - hpc
6
- - parallel
7
- - axonn
8
  datasets:
9
  - hpcgroup/hpc-instruct
10
  - ise-uiuc/Magicoder-OSS-Instruct-75K
11
  - nickrosh/Evol-Instruct-Code-80k-v1
12
  language:
13
  - en
 
14
  pipeline_tag: text-generation
 
 
 
 
 
15
  ---
16
 
17
  # HPC-Coder-v2
 
1
  ---
 
 
 
 
 
 
2
  datasets:
3
  - hpcgroup/hpc-instruct
4
  - ise-uiuc/Magicoder-OSS-Instruct-75K
5
  - nickrosh/Evol-Instruct-Code-80k-v1
6
  language:
7
  - en
8
+ library_name: transformers
9
  pipeline_tag: text-generation
10
+ tags:
11
+ - code
12
+ - hpc
13
+ - parallel
14
+ - axonn
15
  ---
16
 
17
  # HPC-Coder-v2
tokenizer.json CHANGED
@@ -321,6 +321,7 @@
321
  "end_of_word_suffix": null,
322
  "fuse_unk": false,
323
  "byte_fallback": false,
 
324
  "vocab": {
325
  "!": 0,
326
  "\"": 1,
 
321
  "end_of_word_suffix": null,
322
  "fuse_unk": false,
323
  "byte_fallback": false,
324
+ "ignore_merges": false,
325
  "vocab": {
326
  "!": 0,
327
  "\"": 1,
tokenizer_config.json CHANGED
@@ -1,6 +1,7 @@
1
  {
2
  "add_bos_token": true,
3
  "add_eos_token": false,
 
4
  "added_tokens_decoder": {
5
  "32000": {
6
  "content": "õ",
 
1
  {
2
  "add_bos_token": true,
3
  "add_eos_token": false,
4
+ "add_prefix_space": null,
5
  "added_tokens_decoder": {
6
  "32000": {
7
  "content": "õ",