Upload 12 files
Browse files- banglaBERT-on-banlgasarc.ipynb +0 -0
- optimizer.pt +1 -1
- pytorch_model.bin +1 -1
- special_tokens_map.json +7 -0
- tokenizer.json +0 -0
- tokenizer_config.json +16 -0
- trainer_state.json +19 -19
- training_args.bin +1 -1
- vocab.txt +0 -0
banglaBERT-on-banlgasarc.ipynb
CHANGED
The diff for this file is too large to render.
See raw diff
|
|
optimizer.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 885067549
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3a9813440e2828b31992f56123741c8672db60b228d289df0a0e47655b643fa5
|
3 |
size 885067549
|
pytorch_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 442547117
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1566088e16c8f9a2aa90cbd5e90498f9b8ad0c34cf77f1ecfdb9197d7de07743
|
3 |
size 442547117
|
special_tokens_map.json
ADDED
@@ -0,0 +1,7 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"cls_token": "[CLS]",
|
3 |
+
"mask_token": "[MASK]",
|
4 |
+
"pad_token": "[PAD]",
|
5 |
+
"sep_token": "[SEP]",
|
6 |
+
"unk_token": "[UNK]"
|
7 |
+
}
|
tokenizer.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
tokenizer_config.json
ADDED
@@ -0,0 +1,16 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"cls_token": "[CLS]",
|
3 |
+
"do_basic_tokenize": true,
|
4 |
+
"do_lower_case": false,
|
5 |
+
"full_tokenizer_file": null,
|
6 |
+
"mask_token": "[MASK]",
|
7 |
+
"name_or_path": "csebuetnlp/banglabert",
|
8 |
+
"never_split": null,
|
9 |
+
"pad_token": "[PAD]",
|
10 |
+
"sep_token": "[SEP]",
|
11 |
+
"special_tokens_map_file": null,
|
12 |
+
"strip_accents": null,
|
13 |
+
"tokenize_chinese_chars": false,
|
14 |
+
"tokenizer_class": "ElectraTokenizer",
|
15 |
+
"unk_token": "[UNK]"
|
16 |
+
}
|
trainer_state.json
CHANGED
@@ -10,43 +10,43 @@
|
|
10 |
{
|
11 |
"epoch": 1.0,
|
12 |
"learning_rate": 3.3333333333333335e-05,
|
13 |
-
"loss": 0.
|
14 |
"step": 500
|
15 |
},
|
16 |
{
|
17 |
"epoch": 1.0,
|
18 |
-
"eval_accuracy": 0.
|
19 |
-
"eval_f1": 0.
|
20 |
-
"eval_loss": 0.
|
21 |
-
"eval_precision": 0.
|
22 |
-
"eval_recall": 0.
|
23 |
-
"eval_runtime":
|
24 |
-
"eval_samples_per_second":
|
25 |
-
"eval_steps_per_second":
|
26 |
"step": 500
|
27 |
},
|
28 |
{
|
29 |
"epoch": 2.0,
|
30 |
"learning_rate": 1.6666666666666667e-05,
|
31 |
-
"loss": 0.
|
32 |
"step": 1000
|
33 |
},
|
34 |
{
|
35 |
"epoch": 2.0,
|
36 |
-
"eval_accuracy": 0.
|
37 |
-
"eval_f1": 0.
|
38 |
-
"eval_loss": 0.
|
39 |
-
"eval_precision": 0.
|
40 |
-
"eval_recall": 0.
|
41 |
-
"eval_runtime":
|
42 |
-
"eval_samples_per_second":
|
43 |
-
"eval_steps_per_second":
|
44 |
"step": 1000
|
45 |
},
|
46 |
{
|
47 |
"epoch": 3.0,
|
48 |
"learning_rate": 0.0,
|
49 |
-
"loss": 0.
|
50 |
"step": 1500
|
51 |
}
|
52 |
],
|
|
|
10 |
{
|
11 |
"epoch": 1.0,
|
12 |
"learning_rate": 3.3333333333333335e-05,
|
13 |
+
"loss": 0.228,
|
14 |
"step": 500
|
15 |
},
|
16 |
{
|
17 |
"epoch": 1.0,
|
18 |
+
"eval_accuracy": 0.9846984698469847,
|
19 |
+
"eval_f1": 0.9792429792429792,
|
20 |
+
"eval_loss": 0.06820278614759445,
|
21 |
+
"eval_precision": 0.9901234567901235,
|
22 |
+
"eval_recall": 0.9685990338164251,
|
23 |
+
"eval_runtime": 21.3752,
|
24 |
+
"eval_samples_per_second": 51.976,
|
25 |
+
"eval_steps_per_second": 6.503,
|
26 |
"step": 500
|
27 |
},
|
28 |
{
|
29 |
"epoch": 2.0,
|
30 |
"learning_rate": 1.6666666666666667e-05,
|
31 |
+
"loss": 0.0644,
|
32 |
"step": 1000
|
33 |
},
|
34 |
{
|
35 |
"epoch": 2.0,
|
36 |
+
"eval_accuracy": 0.9963996399639964,
|
37 |
+
"eval_f1": 0.9951573849878934,
|
38 |
+
"eval_loss": 0.020056167617440224,
|
39 |
+
"eval_precision": 0.9975728155339806,
|
40 |
+
"eval_recall": 0.9927536231884058,
|
41 |
+
"eval_runtime": 13.8433,
|
42 |
+
"eval_samples_per_second": 80.256,
|
43 |
+
"eval_steps_per_second": 10.041,
|
44 |
"step": 1000
|
45 |
},
|
46 |
{
|
47 |
"epoch": 3.0,
|
48 |
"learning_rate": 0.0,
|
49 |
+
"loss": 0.0193,
|
50 |
"step": 1500
|
51 |
}
|
52 |
],
|
training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 3439
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:67e607d0b1966cdb2d5f309b4de11279902e0a8cd54a8d9e8e673b07342fe129
|
3 |
size 3439
|
vocab.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|