chinnadhurai sankar
committed on
Commit
•
07fe3ef
1
Parent(s):
0121e6c
initial commit
Browse files
- elm-0.25_news_classification/added_tokens.json +3 -0
- elm-0.25_news_classification/ckpt.pt +3 -0
- elm-0.25_news_classification/config.yaml +1 -0
- elm-0.25_news_classification/example_prompts.json +13 -0
- elm-0.25_news_classification/merges.txt +0 -0
- elm-0.25_news_classification/slicex_elm_config.json +1 -0
- elm-0.25_news_classification/special_tokens_map.json +30 -0
- elm-0.25_news_classification/tokenizer.json +0 -0
- elm-0.25_news_classification/tokenizer_config.json +30 -0
- elm-0.25_news_classification/vocab.json +0 -0
- elm-0.75_news_classification/added_tokens.json +3 -0
- elm-0.75_news_classification/ckpt.pt +3 -0
- elm-0.75_news_classification/config.yaml +1 -0
- elm-0.75_news_classification/example_prompts.json +13 -0
- elm-0.75_news_classification/merges.txt +0 -0
- elm-0.75_news_classification/slicex_elm_config.json +1 -0
- elm-0.75_news_classification/special_tokens_map.json +30 -0
- elm-0.75_news_classification/tokenizer.json +0 -0
- elm-0.75_news_classification/tokenizer_config.json +30 -0
- elm-0.75_news_classification/vocab.json +0 -0
- elm-1.0_news_classification/added_tokens.json +3 -0
- elm-1.0_news_classification/ckpt.pt +3 -0
- elm-1.0_news_classification/config.yaml +1 -0
- elm-1.0_news_classification/example_prompts.json +13 -0
- elm-1.0_news_classification/merges.txt +0 -0
- elm-1.0_news_classification/slicex_elm_config.json +1 -0
- elm-1.0_news_classification/special_tokens_map.json +30 -0
- elm-1.0_news_classification/tokenizer.json +0 -0
- elm-1.0_news_classification/tokenizer_config.json +30 -0
- elm-1.0_news_classification/vocab.json +0 -0
elm-0.25_news_classification/added_tokens.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"[PAD]": 50257
|
3 |
+
}
|
elm-0.25_news_classification/ckpt.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7053be8926ca6b0e047974424e26def7a4731d1ac0c7a8ac2ece353f1ef1b95e
|
3 |
+
size 840171202
|
elm-0.25_news_classification/config.yaml
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
name_or_path: elm/rambutan
|
elm-0.25_news_classification/example_prompts.json
ADDED
@@ -0,0 +1,13 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"inputs": [
|
3 |
+
"GM May Close Plant in Europe DETROIT (Reuters) - General Motors Corp. <A HREF=\"http://www.investor.reuters.com/FullQuote.aspx?ticker=GM.N target=/stocks/quickinfo/fullquote\">GM.N</A> will likely cut some jobs in Europe and may close a plant there as part of a restructuring plan under development to try to return the region to profitability, the U.S. automaker said on Wednesday.",
|
4 |
+
"Netflix, TiVo sign VoD alliance Netflix, the online DVD rental company, and TiVo yesterday said they will work together to deliver movies digitally down the wires, presumably specifically to the latter #39;s PVR equipment.",
|
5 |
+
"NBA Star Pippen Announces Retirement National Basketball Association star Scottie Pippen has announced his retirement from the game, leaving the Chicago Bulls team he helped lead to six NBA titles.",
|
6 |
+
"Radcliffe to Run in New York Marathon LONDON (Reuters) - World marathon record holder Paula Radcliffe believes she has put her failure at the Athens Olympics behind her after announcing on Tuesday that she will run in the New York marathon on November 7.",
|
7 |
+
"GE Says It's on Track for 2004, 2005 BOSTON (Reuters) - Diversified manufacturer General Electric Co. <A HREF=\"http://www.investor.reuters.com/FullQuote.aspx?ticker=GE.N target=/stocks/quickinfo/fullquote\">GE.N</A> said on Tuesday that it is on track to meet its full-year earnings forecast and to achieve double-digit gains in earnings per share in 2005.",
|
8 |
+
"Hyundai signs deal for China truck plant Hyundai Motor Co. said yesterday that it has signed an agreement with a Chinese company, Jianghuai Automobile Corp., to build a commercial vehicle and engine plant in China #39;s Anhui province.",
|
9 |
+
"Sprint is chock full of potential heros It would be nice to see this week #39;s 100-meter sprint as simply the best footrace of all time. We could witness four sub-10-second sprints for the first time ever. It would be nice to watch with raised eyebrows instead of furrowed ones. It ...",
|
10 |
+
"Clash of the unpredictables: WI-Pak tie What would happen when two of the worlds most talented and unpredictable sides rub shoulders and that too in an ICC Champions Trophy semi-final?"
|
11 |
+
],
|
12 |
+
"template": "[INST]Below is a news article. Please classify it under one of the following classes (World, Business, Sports, Sci/Tech). Please format your response as a JSON payload.\n\n### Article: {input}\n\n### JSON Response:[/INST]"
|
13 |
+
}
|
elm-0.25_news_classification/merges.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
elm-0.25_news_classification/slicex_elm_config.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"_name_or_path": "elm_rambutan"}
|
elm-0.25_news_classification/special_tokens_map.json
ADDED
@@ -0,0 +1,30 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"bos_token": {
|
3 |
+
"content": "<|endoftext|>",
|
4 |
+
"lstrip": false,
|
5 |
+
"normalized": true,
|
6 |
+
"rstrip": false,
|
7 |
+
"single_word": false
|
8 |
+
},
|
9 |
+
"eos_token": {
|
10 |
+
"content": "<|endoftext|>",
|
11 |
+
"lstrip": false,
|
12 |
+
"normalized": true,
|
13 |
+
"rstrip": false,
|
14 |
+
"single_word": false
|
15 |
+
},
|
16 |
+
"pad_token": {
|
17 |
+
"content": "[PAD]",
|
18 |
+
"lstrip": false,
|
19 |
+
"normalized": true,
|
20 |
+
"rstrip": false,
|
21 |
+
"single_word": false
|
22 |
+
},
|
23 |
+
"unk_token": {
|
24 |
+
"content": "<|endoftext|>",
|
25 |
+
"lstrip": false,
|
26 |
+
"normalized": true,
|
27 |
+
"rstrip": false,
|
28 |
+
"single_word": false
|
29 |
+
}
|
30 |
+
}
|
elm-0.25_news_classification/tokenizer.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
elm-0.25_news_classification/tokenizer_config.json
ADDED
@@ -0,0 +1,30 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"add_bos_token": false,
|
3 |
+
"add_prefix_space": false,
|
4 |
+
"added_tokens_decoder": {
|
5 |
+
"50256": {
|
6 |
+
"content": "<|endoftext|>",
|
7 |
+
"lstrip": false,
|
8 |
+
"normalized": true,
|
9 |
+
"rstrip": false,
|
10 |
+
"single_word": false,
|
11 |
+
"special": true
|
12 |
+
},
|
13 |
+
"50257": {
|
14 |
+
"content": "[PAD]",
|
15 |
+
"lstrip": false,
|
16 |
+
"normalized": true,
|
17 |
+
"rstrip": false,
|
18 |
+
"single_word": false,
|
19 |
+
"special": true
|
20 |
+
}
|
21 |
+
},
|
22 |
+
"bos_token": "<|endoftext|>",
|
23 |
+
"clean_up_tokenization_spaces": true,
|
24 |
+
"eos_token": "<|endoftext|>",
|
25 |
+
"errors": "replace",
|
26 |
+
"model_max_length": 1024,
|
27 |
+
"pad_token": "[PAD]",
|
28 |
+
"tokenizer_class": "GPT2Tokenizer",
|
29 |
+
"unk_token": "<|endoftext|>"
|
30 |
+
}
|
elm-0.25_news_classification/vocab.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
elm-0.75_news_classification/added_tokens.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"[PAD]": 50257
|
3 |
+
}
|
elm-0.75_news_classification/ckpt.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2c118d47fc78c207bcfc1570035b14e92f3a1f0cff3b4a2e7f393a02a2e6afd2
|
3 |
+
size 1696314274
|
elm-0.75_news_classification/config.yaml
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
name_or_path: elm/rambutan
|
elm-0.75_news_classification/example_prompts.json
ADDED
@@ -0,0 +1,13 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"inputs": [
|
3 |
+
"GM May Close Plant in Europe DETROIT (Reuters) - General Motors Corp. <A HREF=\"http://www.investor.reuters.com/FullQuote.aspx?ticker=GM.N target=/stocks/quickinfo/fullquote\">GM.N</A> will likely cut some jobs in Europe and may close a plant there as part of a restructuring plan under development to try to return the region to profitability, the U.S. automaker said on Wednesday.",
|
4 |
+
"Netflix, TiVo sign VoD alliance Netflix, the online DVD rental company, and TiVo yesterday said they will work together to deliver movies digitally down the wires, presumably specifically to the latter #39;s PVR equipment.",
|
5 |
+
"NBA Star Pippen Announces Retirement National Basketball Association star Scottie Pippen has announced his retirement from the game, leaving the Chicago Bulls team he helped lead to six NBA titles.",
|
6 |
+
"Radcliffe to Run in New York Marathon LONDON (Reuters) - World marathon record holder Paula Radcliffe believes she has put her failure at the Athens Olympics behind her after announcing on Tuesday that she will run in the New York marathon on November 7.",
|
7 |
+
"GE Says It's on Track for 2004, 2005 BOSTON (Reuters) - Diversified manufacturer General Electric Co. <A HREF=\"http://www.investor.reuters.com/FullQuote.aspx?ticker=GE.N target=/stocks/quickinfo/fullquote\">GE.N</A> said on Tuesday that it is on track to meet its full-year earnings forecast and to achieve double-digit gains in earnings per share in 2005.",
|
8 |
+
"Hyundai signs deal for China truck plant Hyundai Motor Co. said yesterday that it has signed an agreement with a Chinese company, Jianghuai Automobile Corp., to build a commercial vehicle and engine plant in China #39;s Anhui province.",
|
9 |
+
"Sprint is chock full of potential heros It would be nice to see this week #39;s 100-meter sprint as simply the best footrace of all time. We could witness four sub-10-second sprints for the first time ever. It would be nice to watch with raised eyebrows instead of furrowed ones. It ...",
|
10 |
+
"Clash of the unpredictables: WI-Pak tie What would happen when two of the worlds most talented and unpredictable sides rub shoulders and that too in an ICC Champions Trophy semi-final?"
|
11 |
+
],
|
12 |
+
"template": "[INST]Below is a news article. Please classify it under one of the following classes (World, Business, Sports, Sci/Tech). Please format your response as a JSON payload.\n\n### Article: {input}\n\n### JSON Response:[/INST]"
|
13 |
+
}
|
elm-0.75_news_classification/merges.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
elm-0.75_news_classification/slicex_elm_config.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"_name_or_path": "elm_rambutan"}
|
elm-0.75_news_classification/special_tokens_map.json
ADDED
@@ -0,0 +1,30 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"bos_token": {
|
3 |
+
"content": "<|endoftext|>",
|
4 |
+
"lstrip": false,
|
5 |
+
"normalized": true,
|
6 |
+
"rstrip": false,
|
7 |
+
"single_word": false
|
8 |
+
},
|
9 |
+
"eos_token": {
|
10 |
+
"content": "<|endoftext|>",
|
11 |
+
"lstrip": false,
|
12 |
+
"normalized": true,
|
13 |
+
"rstrip": false,
|
14 |
+
"single_word": false
|
15 |
+
},
|
16 |
+
"pad_token": {
|
17 |
+
"content": "[PAD]",
|
18 |
+
"lstrip": false,
|
19 |
+
"normalized": true,
|
20 |
+
"rstrip": false,
|
21 |
+
"single_word": false
|
22 |
+
},
|
23 |
+
"unk_token": {
|
24 |
+
"content": "<|endoftext|>",
|
25 |
+
"lstrip": false,
|
26 |
+
"normalized": true,
|
27 |
+
"rstrip": false,
|
28 |
+
"single_word": false
|
29 |
+
}
|
30 |
+
}
|
elm-0.75_news_classification/tokenizer.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
elm-0.75_news_classification/tokenizer_config.json
ADDED
@@ -0,0 +1,30 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"add_bos_token": false,
|
3 |
+
"add_prefix_space": false,
|
4 |
+
"added_tokens_decoder": {
|
5 |
+
"50256": {
|
6 |
+
"content": "<|endoftext|>",
|
7 |
+
"lstrip": false,
|
8 |
+
"normalized": true,
|
9 |
+
"rstrip": false,
|
10 |
+
"single_word": false,
|
11 |
+
"special": true
|
12 |
+
},
|
13 |
+
"50257": {
|
14 |
+
"content": "[PAD]",
|
15 |
+
"lstrip": false,
|
16 |
+
"normalized": true,
|
17 |
+
"rstrip": false,
|
18 |
+
"single_word": false,
|
19 |
+
"special": true
|
20 |
+
}
|
21 |
+
},
|
22 |
+
"bos_token": "<|endoftext|>",
|
23 |
+
"clean_up_tokenization_spaces": true,
|
24 |
+
"eos_token": "<|endoftext|>",
|
25 |
+
"errors": "replace",
|
26 |
+
"model_max_length": 1024,
|
27 |
+
"pad_token": "[PAD]",
|
28 |
+
"tokenizer_class": "GPT2Tokenizer",
|
29 |
+
"unk_token": "<|endoftext|>"
|
30 |
+
}
|
elm-0.75_news_classification/vocab.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
elm-1.0_news_classification/added_tokens.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"[PAD]": 50257
|
3 |
+
}
|
elm-1.0_news_classification/ckpt.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e13e37f2410fff36cb11e2cd3cbcc814a380bdbecc06967a34c0d035d52294a3
|
3 |
+
size 2124385874
|
elm-1.0_news_classification/config.yaml
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
name_or_path: elm/rambutan
|
elm-1.0_news_classification/example_prompts.json
ADDED
@@ -0,0 +1,13 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"inputs": [
|
3 |
+
"GM May Close Plant in Europe DETROIT (Reuters) - General Motors Corp. <A HREF=\"http://www.investor.reuters.com/FullQuote.aspx?ticker=GM.N target=/stocks/quickinfo/fullquote\">GM.N</A> will likely cut some jobs in Europe and may close a plant there as part of a restructuring plan under development to try to return the region to profitability, the U.S. automaker said on Wednesday.",
|
4 |
+
"Netflix, TiVo sign VoD alliance Netflix, the online DVD rental company, and TiVo yesterday said they will work together to deliver movies digitally down the wires, presumably specifically to the latter #39;s PVR equipment.",
|
5 |
+
"NBA Star Pippen Announces Retirement National Basketball Association star Scottie Pippen has announced his retirement from the game, leaving the Chicago Bulls team he helped lead to six NBA titles.",
|
6 |
+
"Radcliffe to Run in New York Marathon LONDON (Reuters) - World marathon record holder Paula Radcliffe believes she has put her failure at the Athens Olympics behind her after announcing on Tuesday that she will run in the New York marathon on November 7.",
|
7 |
+
"GE Says It's on Track for 2004, 2005 BOSTON (Reuters) - Diversified manufacturer General Electric Co. <A HREF=\"http://www.investor.reuters.com/FullQuote.aspx?ticker=GE.N target=/stocks/quickinfo/fullquote\">GE.N</A> said on Tuesday that it is on track to meet its full-year earnings forecast and to achieve double-digit gains in earnings per share in 2005.",
|
8 |
+
"Hyundai signs deal for China truck plant Hyundai Motor Co. said yesterday that it has signed an agreement with a Chinese company, Jianghuai Automobile Corp., to build a commercial vehicle and engine plant in China #39;s Anhui province.",
|
9 |
+
"Sprint is chock full of potential heros It would be nice to see this week #39;s 100-meter sprint as simply the best footrace of all time. We could witness four sub-10-second sprints for the first time ever. It would be nice to watch with raised eyebrows instead of furrowed ones. It ...",
|
10 |
+
"Clash of the unpredictables: WI-Pak tie What would happen when two of the worlds most talented and unpredictable sides rub shoulders and that too in an ICC Champions Trophy semi-final?"
|
11 |
+
],
|
12 |
+
"template": "[INST]Below is a news article. Please classify it under one of the following classes (World, Business, Sports, Sci/Tech). Please format your response as a JSON payload.\n\n### Article: {input}\n\n### JSON Response:[/INST]"
|
13 |
+
}
|
elm-1.0_news_classification/merges.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
elm-1.0_news_classification/slicex_elm_config.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"_name_or_path": "elm_rambutan"}
|
elm-1.0_news_classification/special_tokens_map.json
ADDED
@@ -0,0 +1,30 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"bos_token": {
|
3 |
+
"content": "<|endoftext|>",
|
4 |
+
"lstrip": false,
|
5 |
+
"normalized": true,
|
6 |
+
"rstrip": false,
|
7 |
+
"single_word": false
|
8 |
+
},
|
9 |
+
"eos_token": {
|
10 |
+
"content": "<|endoftext|>",
|
11 |
+
"lstrip": false,
|
12 |
+
"normalized": true,
|
13 |
+
"rstrip": false,
|
14 |
+
"single_word": false
|
15 |
+
},
|
16 |
+
"pad_token": {
|
17 |
+
"content": "[PAD]",
|
18 |
+
"lstrip": false,
|
19 |
+
"normalized": true,
|
20 |
+
"rstrip": false,
|
21 |
+
"single_word": false
|
22 |
+
},
|
23 |
+
"unk_token": {
|
24 |
+
"content": "<|endoftext|>",
|
25 |
+
"lstrip": false,
|
26 |
+
"normalized": true,
|
27 |
+
"rstrip": false,
|
28 |
+
"single_word": false
|
29 |
+
}
|
30 |
+
}
|
elm-1.0_news_classification/tokenizer.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
elm-1.0_news_classification/tokenizer_config.json
ADDED
@@ -0,0 +1,30 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"add_bos_token": false,
|
3 |
+
"add_prefix_space": false,
|
4 |
+
"added_tokens_decoder": {
|
5 |
+
"50256": {
|
6 |
+
"content": "<|endoftext|>",
|
7 |
+
"lstrip": false,
|
8 |
+
"normalized": true,
|
9 |
+
"rstrip": false,
|
10 |
+
"single_word": false,
|
11 |
+
"special": true
|
12 |
+
},
|
13 |
+
"50257": {
|
14 |
+
"content": "[PAD]",
|
15 |
+
"lstrip": false,
|
16 |
+
"normalized": true,
|
17 |
+
"rstrip": false,
|
18 |
+
"single_word": false,
|
19 |
+
"special": true
|
20 |
+
}
|
21 |
+
},
|
22 |
+
"bos_token": "<|endoftext|>",
|
23 |
+
"clean_up_tokenization_spaces": true,
|
24 |
+
"eos_token": "<|endoftext|>",
|
25 |
+
"errors": "replace",
|
26 |
+
"model_max_length": 1024,
|
27 |
+
"pad_token": "[PAD]",
|
28 |
+
"tokenizer_class": "GPT2Tokenizer",
|
29 |
+
"unk_token": "<|endoftext|>"
|
30 |
+
}
|
elm-1.0_news_classification/vocab.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|