finiteautomata committed on
Commit
d72a191
1 Parent(s): 7a7848c

Update with arg newspapers

Browse files
added_tokens.json CHANGED
@@ -1 +1 @@
1
- {"emoji": 31005, "hashtag": 31004, "url": 31003, "@usuario": 31002}
1
+ {"emoji": 31005, "url": 31003, "hashtag": 31004, "@usuario": 31002}
config.json CHANGED
@@ -20,7 +20,7 @@
20
  "pad_token_id": 1,
21
  "position_embedding_type": "absolute",
22
  "torch_dtype": "float32",
23
- "transformers_version": "4.10.0.dev0",
24
  "type_vocab_size": 2,
25
  "use_cache": true,
26
  "vocab_size": 31006
20
  "pad_token_id": 1,
21
  "position_embedding_type": "absolute",
22
  "torch_dtype": "float32",
23
+ "transformers_version": "4.11.2",
24
  "type_vocab_size": 2,
25
  "use_cache": true,
26
  "vocab_size": 31006
eval_results.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
- "epoch": 2.24,
3
- "eval_loss": 0.8874114155769348,
4
- "eval_runtime": 382.8478,
5
- "eval_samples": 200000,
6
- "eval_samples_per_second": 522.401,
7
- "eval_steps_per_second": 4.083,
8
- "perplexity": 2.428834264192218
9
  }
1
  {
2
+ "epoch": 4.71,
3
+ "eval_loss": 1.2962344884872437,
4
+ "eval_runtime": 203.9458,
5
+ "eval_samples": 181300,
6
+ "eval_samples_per_second": 888.962,
7
+ "eval_steps_per_second": 3.476,
8
+ "perplexity": 3.6555058697726976
9
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a9936087dc2e9bde1731951c97cebfd3b483d018b1212c5a34ddc0774318f9dc
3
  size 534989479
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6cd66dc8733c59bc73dbea053347ab3223a0163ee1ad16ae7911fc15b195d12c
3
  size 534989479
tokenizer.json CHANGED
The diff for this file is too large to render. See raw diff
train_results.json CHANGED
@@ -1,9 +1,8 @@
1
  {
2
- "epoch": 2.24,
3
- "total_flos": 3.370512610512077e+17,
4
- "train_loss": 0.09681204452514648,
5
- "train_runtime": 5680.8564,
6
- "train_samples": 8369648,
7
- "train_samples_per_second": 3605.09,
8
- "train_steps_per_second": 1.76
9
  }
1
  {
2
+ "epoch": 4.71,
3
+ "train_loss": 0.26460304527282713,
4
+ "train_runtime": 30325.8771,
5
+ "train_samples": 4349088,
6
+ "train_samples_per_second": 675.331,
7
+ "train_steps_per_second": 0.33
 
8
  }