saattrupdan committed on
Commit
2c2e7f8
1 Parent(s): de7bce4

Training in progress, epoch 0

Browse files
config.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
- "_name_or_path": "xlm-roberta-base",
3
  "architectures": [
4
- "XLMRobertaForSequenceClassification"
5
  ],
6
  "attention_probs_dropout_prob": 0.1,
7
  "bos_token_id": 0,
@@ -24,10 +24,9 @@
24
  },
25
  "layer_norm_eps": 1e-05,
26
  "max_position_embeddings": 514,
27
- "model_type": "xlm-roberta",
28
  "num_attention_heads": 12,
29
- "num_hidden_layers": 12,
30
- "output_past": true,
31
  "pad_token_id": 1,
32
  "position_embedding_type": "absolute",
33
  "problem_type": "single_label_classification",
@@ -35,5 +34,5 @@
35
  "transformers_version": "4.11.3",
36
  "type_vocab_size": 1,
37
  "use_cache": true,
38
- "vocab_size": 250002
39
  }
1
  {
2
+ "_name_or_path": "distilroberta-base",
3
  "architectures": [
4
+ "RobertaForSequenceClassification"
5
  ],
6
  "attention_probs_dropout_prob": 0.1,
7
  "bos_token_id": 0,
24
  },
25
  "layer_norm_eps": 1e-05,
26
  "max_position_embeddings": 514,
27
+ "model_type": "roberta",
28
  "num_attention_heads": 12,
29
+ "num_hidden_layers": 6,
 
30
  "pad_token_id": 1,
31
  "position_embedding_type": "absolute",
32
  "problem_type": "single_label_classification",
34
  "transformers_version": "4.11.3",
35
  "type_vocab_size": 1,
36
  "use_cache": true,
37
+ "vocab_size": 50265
38
  }
merges.txt ADDED
The diff for this file is too large to render. See raw diff
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0d8bb68777b7f1164f22a854b15e63d74a86f4b5d4261f81d79786c41132db88
3
- size 1112269229
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:09dc584f4a4fe60147b24507bd4898aeefb45c05eef4f75fd696f182bf6520c6
3
+ size 328529005
runs/Oct13_15-24-16_milo/1634135062.6294315/events.out.tfevents.1634135062.milo.23058.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d79bb9d8a7823afe9f6a96bef40a84be099032b64ae91128062583e308cbdc86
3
+ size 4627
runs/Oct13_15-24-16_milo/events.out.tfevents.1634135062.milo.23058.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8eba35cafa771cbc94023bbc995a274909108d6ea9463e9216dee5e2fe56999f
3
+ size 3909
tokenizer.json CHANGED
The diff for this file is too large to render. See raw diff
tokenizer_config.json CHANGED
@@ -1 +1 @@
1
- {"bos_token": "<s>", "eos_token": "</s>", "sep_token": "</s>", "cls_token": "<s>", "unk_token": "<unk>", "pad_token": "<pad>", "mask_token": {"content": "<mask>", "single_word": false, "lstrip": true, "rstrip": false, "normalized": true, "__type": "AddedToken"}, "model_max_length": 512, "special_tokens_map_file": null, "name_or_path": "xlm-roberta-base", "tokenizer_class": "XLMRobertaTokenizer"}
1
+ {"unk_token": "<unk>", "bos_token": "<s>", "eos_token": "</s>", "add_prefix_space": false, "errors": "replace", "sep_token": "</s>", "cls_token": "<s>", "pad_token": "<pad>", "mask_token": "<mask>", "model_max_length": 512, "special_tokens_map_file": null, "name_or_path": "distilroberta-base", "tokenizer_class": "RobertaTokenizer"}
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8fbae7a2de61c3aa4d3211ad78273d3b80b70f0aebe364c3158663e08dc20370
3
  size 2927
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4c187cf3c366c8b0e441eb37e539a1f416f19c0fa0dce5c0d48dd120e3034e65
3
  size 2927
vocab.json ADDED
The diff for this file is too large to render. See raw diff