Sankalp-Bahad committed on
Commit
388c82b
1 Parent(s): afc8a95

Upload 7 files

Browse files
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "xlm-roberta-base",
3
  "architectures": [
4
  "XLMRobertaForTokenClassification"
5
  ],
@@ -9,49 +9,59 @@
9
  "eos_token_id": 2,
10
  "hidden_act": "gelu",
11
  "hidden_dropout_prob": 0.1,
12
- "hidden_size": 768,
13
  "id2label": {
14
- "0": "B-NEL",
15
- "1": "B-NEO",
16
- "2": "B-NEP",
17
- "3": "I-NEL",
18
- "4": "I-NEO",
19
- "5": "I-NEP",
20
- "6": "O",
21
- "7": "B-NETI",
22
- "8": "I-NETI",
23
- "9": "B-NEN",
24
- "10": "I-NEN",
25
- "11": "B-NEAR",
26
- "12": "I-NEAR"
 
 
 
 
 
 
 
 
 
 
27
  },
28
  "initializer_range": 0.02,
29
- "intermediate_size": 3072,
30
  "label2id": {
31
- "B-NEL": 0,
32
- "B-NEO": 1,
33
- "I-NEN": 10,
34
- "B-NEAR": 11,
35
- "I-NEAR": 12,
36
- "B-NEP": 2,
37
- "I-NEL": 3,
38
- "I-NEO": 4,
39
- "I-NEP": 5,
40
- "O": 6,
41
- "B-NETI": 7,
42
- "I-NETI": 8,
43
- "B-NEN": 9
44
  },
45
  "layer_norm_eps": 1e-05,
46
  "max_position_embeddings": 514,
47
  "model_type": "xlm-roberta",
48
- "num_attention_heads": 12,
49
- "num_hidden_layers": 12,
50
  "output_past": true,
51
  "pad_token_id": 1,
52
  "position_embedding_type": "absolute",
53
  "torch_dtype": "float32",
54
- "transformers_version": "4.37.2",
55
  "type_vocab_size": 1,
56
  "use_cache": true,
57
  "vocab_size": 250002
 
1
  {
2
+ "_name_or_path": "cfilt/HiNER-original-xlm-roberta-large",
3
  "architectures": [
4
  "XLMRobertaForTokenClassification"
5
  ],
 
9
  "eos_token_id": 2,
10
  "hidden_act": "gelu",
11
  "hidden_dropout_prob": 0.1,
12
+ "hidden_size": 1024,
13
  "id2label": {
14
+ "0": "O",
15
+ "1": "O",
16
+ "2": "O",
17
+ "3": "B-NEAR",
18
+ "4": "B-NEL",
19
+ "5": "O",
20
+ "6": "B-NEN",
21
+ "7": "B-NEO",
22
+ "8": "B-NEP",
23
+ "9": "O",
24
+ "10": "B-NETI",
25
+ "11": "O",
26
+ "12": "O",
27
+ "13": "O",
28
+ "14": "I-NEAR",
29
+ "15": "I-NEL",
30
+ "16": "O",
31
+ "17": "I-NEN",
32
+ "18": "I-NEO",
33
+ "19": "I-NEP",
34
+ "20": "O",
35
+ "21": "I-NETI",
36
+ "22": "O"
37
  },
38
  "initializer_range": 0.02,
39
+ "intermediate_size": 4096,
40
  "label2id": {
41
+ "O" : 22 ,
42
+ "B-NEAR" : 3 ,
43
+ "B-NEL" : 4 ,
44
+ "B-NEN" : 6 ,
45
+ "B-NEO" : 7 ,
46
+ "B-NEP" : 8 ,
47
+ "B-NETI" : 10 ,
48
+ "I-NEAR" : 14 ,
49
+ "I-NEL" : 15 ,
50
+ "I-NEN" : 17 ,
51
+ "I-NEO" : 18 ,
52
+ "I-NEP" : 19 ,
53
+ "I-NETI" : 21
54
  },
55
  "layer_norm_eps": 1e-05,
56
  "max_position_embeddings": 514,
57
  "model_type": "xlm-roberta",
58
+ "num_attention_heads": 16,
59
+ "num_hidden_layers": 24,
60
  "output_past": true,
61
  "pad_token_id": 1,
62
  "position_embedding_type": "absolute",
63
  "torch_dtype": "float32",
64
+ "transformers_version": "4.41.2",
65
  "type_vocab_size": 1,
66
  "use_cache": true,
67
  "vocab_size": 250002
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5d2afc04bc965bd583b98ae39b040750152f780beefb727328ca3bb77367d43c
3
- size 1109876260
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0a3074876f85609f238c2e2fb8ffa84933a040e687e0e897aa2a4cefdbc34d49
3
+ size 2235506156
special_tokens_map.json CHANGED
@@ -1,7 +1,25 @@
1
  {
2
- "bos_token": "<s>",
3
- "cls_token": "<s>",
4
- "eos_token": "</s>",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
5
  "mask_token": {
6
  "content": "<mask>",
7
  "lstrip": true,
@@ -9,7 +27,25 @@
9
  "rstrip": false,
10
  "single_word": false
11
  },
12
- "pad_token": "<pad>",
13
- "sep_token": "</s>",
14
- "unk_token": "<unk>"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
15
  }
 
1
  {
2
+ "bos_token": {
3
+ "content": "<s>",
4
+ "lstrip": false,
5
+ "normalized": false,
6
+ "rstrip": false,
7
+ "single_word": false
8
+ },
9
+ "cls_token": {
10
+ "content": "<s>",
11
+ "lstrip": false,
12
+ "normalized": false,
13
+ "rstrip": false,
14
+ "single_word": false
15
+ },
16
+ "eos_token": {
17
+ "content": "</s>",
18
+ "lstrip": false,
19
+ "normalized": false,
20
+ "rstrip": false,
21
+ "single_word": false
22
+ },
23
  "mask_token": {
24
  "content": "<mask>",
25
  "lstrip": true,
 
27
  "rstrip": false,
28
  "single_word": false
29
  },
30
+ "pad_token": {
31
+ "content": "<pad>",
32
+ "lstrip": false,
33
+ "normalized": false,
34
+ "rstrip": false,
35
+ "single_word": false
36
+ },
37
+ "sep_token": {
38
+ "content": "</s>",
39
+ "lstrip": false,
40
+ "normalized": false,
41
+ "rstrip": false,
42
+ "single_word": false
43
+ },
44
+ "unk_token": {
45
+ "content": "<unk>",
46
+ "lstrip": false,
47
+ "normalized": false,
48
+ "rstrip": false,
49
+ "single_word": false
50
+ }
51
  }
tokenizer.json CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f59925fcb90c92b894cb93e51bb9b4a6105c5c249fe54ce1c704420ac39b81af
3
- size 17082756
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3a56def25aa40facc030ea8b0b87f3688e4b3c39eb8b45d5702b3a1300fe2a20
3
+ size 17082734
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3181a426ea7660639201e31c0b9d3b891225f912e98c0bc899a460a9585b58ae
3
- size 4728
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c824368a04d54b86cd2697dbb4f0895c6bad560cb02a6c1f6fa5cabebf355741
3
+ size 5048