init

Browse files

Files changed (14) hide show

config.json +102 -0
parameter.json +1 -0
pytorch_model.bin +3 -0
sentencepiece.bpe.model +3 -0
special_tokens_map.json +1 -0
test_bc5cdr_span.json +1 -0
test_bionlp2004_span.json +1 -0
test_conll2003_span.json +1 -0
test_fin_span.json +1 -0
test_ontonotes5.json +1 -0
test_ontonotes5_span.json +1 -0
test_panx_dataset-en_span.json +1 -0
test_wnut2017_span.json +1 -0
tokenizer_config.json +1 -0

config.json ADDED Viewed

	@@ -0,0 +1,102 @@

+{
+  "_name_or_path": "xlm-roberta-large",
+  "architectures": [
+    "XLMRobertaForTokenClassification"
+  ],
+  "attention_probs_dropout_prob": 0.1,
+  "bos_token_id": 0,
+  "eos_token_id": 2,
+  "gradient_checkpointing": false,
+  "hidden_act": "gelu",
+  "hidden_dropout_prob": 0.1,
+  "hidden_size": 1024,
+  "id2label": {
+    "0": "O",
+    "1": "B-cardinal number",
+    "2": "B-date",
+    "3": "I-date",
+    "4": "B-person",
+    "5": "I-person",
+    "6": "B-group",
+    "7": "B-geopolitical area",
+    "8": "I-geopolitical area",
+    "9": "B-law",
+    "10": "I-law",
+    "11": "B-organization",
+    "12": "I-organization",
+    "13": "B-percent",
+    "14": "I-percent",
+    "15": "B-ordinal number",
+    "16": "B-money",
+    "17": "I-money",
+    "18": "B-work of art",
+    "19": "I-work of art",
+    "20": "B-facility",
+    "21": "B-time",
+    "22": "I-cardinal number",
+    "23": "B-location",
+    "24": "B-quantity",
+    "25": "I-quantity",
+    "26": "I-group",
+    "27": "I-location",
+    "28": "B-product",
+    "29": "I-time",
+    "30": "B-event",
+    "31": "I-event",
+    "32": "I-facility",
+    "33": "B-language",
+    "34": "I-product",
+    "35": "I-ordinal number",
+    "36": "I-language"
+  },
+  "initializer_range": 0.02,
+  "intermediate_size": 4096,
+  "label2id": {
+    "B-cardinal number": 1,
+    "B-date": 2,
+    "B-event": 30,
+    "B-facility": 20,
+    "B-geopolitical area": 7,
+    "B-group": 6,
+    "B-language": 33,
+    "B-law": 9,
+    "B-location": 23,
+    "B-money": 16,
+    "B-ordinal number": 15,
+    "B-organization": 11,
+    "B-percent": 13,
+    "B-person": 4,
+    "B-product": 28,
+    "B-quantity": 24,
+    "B-time": 21,
+    "B-work of art": 18,
+    "I-cardinal number": 22,
+    "I-date": 3,
+    "I-event": 31,
+    "I-facility": 32,
+    "I-geopolitical area": 8,
+    "I-group": 26,
+    "I-language": 36,
+    "I-law": 10,
+    "I-location": 27,
+    "I-money": 17,
+    "I-ordinal number": 35,
+    "I-organization": 12,
+    "I-percent": 14,
+    "I-person": 5,
+    "I-product": 34,
+    "I-quantity": 25,
+    "I-time": 29,
+    "I-work of art": 19,
+    "O": 0
+  },
+  "layer_norm_eps": 1e-05,
+  "max_position_embeddings": 514,
+  "model_type": "xlm-roberta",
+  "num_attention_heads": 16,
+  "num_hidden_layers": 24,
+  "output_past": true,
+  "pad_token_id": 1,
+  "type_vocab_size": 1,
+  "vocab_size": 250002
+}

parameter.json ADDED Viewed

	@@ -0,0 +1 @@


1	+ {"dataset": ["ontonotes5"], "transformers_model": "xlm-roberta-large", "random_seed": 1234, "lr": 1e-05, "total_step": 5000, "warmup_step": 700, "weight_decay": 1e-07, "batch_size": 32, "max_seq_length": 128, "fp16": false, "max_grad_norm": 1.0, "lower_case": false}

pytorch_model.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9c04dbe383c9c912ff8f88ef6bc06e82f3eb09cb47009ce390cb5dcc919e8aba
+size 2235680668

sentencepiece.bpe.model ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:cfc8146abe2a0488e9e2a0c56de7952f7c11ab059eca145a0a727afce0db2865
+size 5069051

special_tokens_map.json ADDED Viewed

	@@ -0,0 +1 @@


1	+ {"bos_token": "<s>", "eos_token": "</s>", "unk_token": "<unk>", "sep_token": "</s>", "pad_token": "<pad>", "cls_token": "<s>", "mask_token": "<mask>"}

test_bc5cdr_span.json ADDED Viewed

	@@ -0,0 +1 @@


1	+ {"valid": {"f1": 0.0, "recall": 0.0, "precision": 0.0, "summary": ""}, "test": {"f1": 0.0, "recall": 0.0, "precision": 0.0, "summary": ""}}

test_bionlp2004_span.json ADDED Viewed

	@@ -0,0 +1 @@


1	+ {"valid": {"f1": 0.0, "recall": 0.0, "precision": 0.0, "summary": ""}}

test_conll2003_span.json ADDED Viewed

	@@ -0,0 +1 @@

+ {"valid": {"f1": 65.06572295247726, "recall": 51.44913052168699, "precision": 88.48401512547267, "accuracy": 93.95145555295403, "summary": " precision recall f1-score support\n\n entity 0.88 0.51 0.65 5003\n\n micro avg 0.88 0.51 0.65 5003\n macro avg 0.88 0.51 0.65 5003\nweighted avg 0.88 0.51 0.65 5003\n"}, "test": {"f1": 65.45039908779933, "recall": 52.38288379639019, "precision": 87.20459149223497, "accuracy": 93.5293229514915, "summary": " precision recall f1-score support\n\n entity 0.87 0.52 0.65 4931\n\n micro avg 0.87 0.52 0.65 4931\n macro avg 0.87 0.52 0.65 4931\nweighted avg 0.87 0.52 0.65 4931\n"}}

test_fin_span.json ADDED Viewed

	@@ -0,0 +1 @@


1	+ {"valid": {"f1": 18.343195266272186, "recall": 12.3015873015873, "precision": 36.04651162790697, "accuracy": 96.72131147540983, "summary": " precision recall f1-score support\n\n entity 0.36 0.12 0.18 252\n\n micro avg 0.36 0.12 0.18 252\n macro avg 0.36 0.12 0.18 252\nweighted avg 0.36 0.12 0.18 252\n"}}

test_ontonotes5.json ADDED Viewed

	@@ -0,0 +1 @@

+ {"valid": {"f1": 88.21593738882959, "recall": 89.83787700389458, "precision": 86.65152441687779, "accuracy": 98.0702468131272, "summary": " precision recall f1-score support\n\n cardinal number 0.84 0.89 0.86 937\n date 0.81 0.87 0.84 1507\n event 0.69 0.61 0.65 143\n facility 0.55 0.71 0.62 115\ngeopolitical area 0.95 0.96 0.95 2262\n group 0.90 0.93 0.92 847\n language 0.74 0.76 0.75 33\n law 0.57 0.78 0.66 40\n location 0.76 0.76 0.76 204\n money 0.89 0.92 0.91 274\n ordinal number 0.83 0.87 0.85 232\n organization 0.88 0.88 0.88 1728\n percent 0.91 0.90 0.90 177\n person 0.92 0.96 0.94 2014\n product 0.62 0.76 0.69 72\n quantity 0.74 0.79 0.76 100\n time 0.70 0.78 0.74 214\n work of art 0.46 0.57 0.51 142\n\n micro avg 0.87 0.90 0.88 11041\n macro avg 0.77 0.82 0.79 11041\n weighted avg 0.87 0.90 0.88 11041\n"}, "test": {"f1": 89.13091020426016, "recall": 90.56083903653008, "precision": 87.74543575611436, "accuracy": 98.19865275739149, "summary": " precision recall f1-score support\n\n cardinal number 0.84 0.87 0.86 934\n date 0.83 0.88 0.86 1601\n event 0.53 0.60 0.56 63\n facility 0.77 0.78 0.77 135\ngeopolitical area 0.97 0.96 0.97 2240\n group 0.91 0.95 0.93 841\n language 0.78 0.64 0.70 22\n law 0.51 0.60 0.55 40\n location 0.78 0.82 0.80 179\n money 0.81 0.87 0.84 314\n ordinal number 0.81 0.94 0.87 195\n organization 0.89 0.91 0.90 1792\n percent 0.86 0.90 0.88 348\n person 0.95 0.95 0.95 1988\n product 0.67 0.79 0.73 76\n quantity 0.77 0.80 0.79 105\n time 0.61 0.67 0.64 212\n work of art 0.51 0.61 0.55 166\n\n micro avg 0.88 0.91 0.89 11251\n macro avg 0.77 0.81 0.79 11251\n weighted avg 0.88 0.91 0.89 11251\n"}}

test_ontonotes5_span.json ADDED Viewed

	@@ -0,0 +1 @@

+ {"valid": {"f1": 91.53465125619171, "recall": 92.89013676297438, "precision": 90.21815622800844, "accuracy": 98.57540005424464, "summary": " precision recall f1-score support\n\n entity 0.90 0.93 0.92 11041\n\n micro avg 0.90 0.93 0.92 11041\n macro avg 0.90 0.93 0.92 11041\nweighted avg 0.90 0.93 0.92 11041\n"}, "test": {"f1": 91.69336083198034, "recall": 92.86285663496578, "precision": 90.5529554515514, "accuracy": 98.576745648983, "summary": " precision recall f1-score support\n\n entity 0.91 0.93 0.92 11251\n\n micro avg 0.91 0.93 0.92 11251\n macro avg 0.91 0.93 0.92 11251\nweighted avg 0.91 0.93 0.92 11251\n"}}

test_panx_dataset-en_span.json ADDED Viewed

	@@ -0,0 +1 @@

+ {"valid": {"f1": 47.37385063915676, "recall": 37.41409847679773, "precision": 64.55990220048899, "accuracy": 70.63085680196863, "summary": " precision recall f1-score support\n\n entity 0.65 0.37 0.47 14115\n\n micro avg 0.65 0.37 0.47 14115\n macro avg 0.65 0.37 0.47 14115\nweighted avg 0.65 0.37 0.47 14115\n"}, "test": {"f1": 47.568306010928964, "recall": 37.59176623002735, "precision": 64.75328539548723, "accuracy": 70.42360721192838, "summary": " precision recall f1-score support\n\n entity 0.65 0.38 0.48 13894\n\n micro avg 0.65 0.38 0.48 13894\n macro avg 0.65 0.38 0.48 13894\nweighted avg 0.65 0.38 0.48 13894\n"}}

test_wnut2017_span.json ADDED Viewed

	@@ -0,0 +1 @@

+ {"valid": {"f1": 66.28975265017668, "recall": 58.47880299251871, "precision": 76.5089722675367, "accuracy": 96.18101966774871, "summary": " precision recall f1-score support\n\n entity 0.77 0.58 0.66 802\n\n micro avg 0.77 0.58 0.66 802\n macro avg 0.77 0.58 0.66 802\nweighted avg 0.77 0.58 0.66 802\n"}, "test": {"f1": 53.691275167785236, "recall": 47.47774480712167, "precision": 61.77606177606177, "accuracy": 94.98896533817994, "summary": " precision recall f1-score support\n\n entity 0.62 0.47 0.54 1011\n\n micro avg 0.62 0.47 0.54 1011\n macro avg 0.62 0.47 0.54 1011\nweighted avg 0.62 0.47 0.54 1011\n"}}

tokenizer_config.json ADDED Viewed

	@@ -0,0 +1 @@


1	+ {"bos_token": "<s>", "eos_token": "</s>", "sep_token": "</s>", "cls_token": "<s>", "unk_token": "<unk>", "pad_token": "<pad>", "mask_token": "<mask>", "model_max_length": 512, "name_or_path": "xlm-roberta-large"}