Md Mushfiqur Rahman committed on
Commit
e19f367
1 Parent(s): 4bd6cc2

Upload with huggingface_hub

Browse files
README.md ADDED
@@ -0,0 +1,15 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ license: apache-2.0
3
+ tags:
4
+ - canine
5
+ - pretrained-on-english-language
6
+ ---
7
+
8
+ ### How to use
9
+
10
+ Here is how to use this model:
11
+
12
+ ```python
13
+ from transformers import CanineForTokenClassification
14
+ model = CanineForTokenClassification.from_pretrained('mushfiqur11/<repo name>')
15
+ ```
all_results.json ADDED
@@ -0,0 +1,26 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 29.85,
3
+ "eval_accuracy_score": 0.9155309270630523,
4
+ "eval_f1": 0.5339233038348082,
5
+ "eval_loss": 0.3548363149166107,
6
+ "eval_precision": 0.489851150202977,
7
+ "eval_recall": 0.586709886547812,
8
+ "eval_runtime": 2.3816,
9
+ "eval_samples": 302,
10
+ "eval_samples_per_second": 126.805,
11
+ "eval_steps_per_second": 15.956,
12
+ "test_accuracy_score": 0.9315360056757716,
13
+ "test_f1": 0.5307237141556668,
14
+ "test_loss": 0.32899531722068787,
15
+ "test_precision": 0.4732142857142857,
16
+ "test_recall": 0.6041450777202072,
17
+ "test_runtime": 4.7209,
18
+ "test_samples": 605,
19
+ "test_samples_per_second": 128.153,
20
+ "test_steps_per_second": 16.099,
21
+ "train_loss": 0.10185246992111206,
22
+ "train_runtime": 987.1722,
23
+ "train_samples": 2116,
24
+ "train_samples_per_second": 486.237,
25
+ "train_steps_per_second": 15.195
26
+ }
config.json ADDED
@@ -0,0 +1,51 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "google/canine-c",
3
+ "architectures": [
4
+ "CanineForTokenClassification"
5
+ ],
6
+ "attention_probs_dropout_prob": 0.1,
7
+ "bos_token_id": 57344,
8
+ "downsampling_rate": 4,
9
+ "eos_token_id": 57345,
10
+ "hidden_act": "gelu",
11
+ "hidden_dropout_prob": 0.1,
12
+ "hidden_size": 768,
13
+ "id2label": {
14
+ "0": "O",
15
+ "1": "B-DATE",
16
+ "2": "I-DATE",
17
+ "3": "B-PER",
18
+ "4": "I-PER",
19
+ "5": "B-ORG",
20
+ "6": "I-ORG",
21
+ "7": "B-LOC",
22
+ "8": "I-LOC"
23
+ },
24
+ "initializer_range": 0.02,
25
+ "intermediate_size": 3072,
26
+ "label2id": {
27
+ "B-DATE": 1,
28
+ "B-LOC": 7,
29
+ "B-ORG": 5,
30
+ "B-PER": 3,
31
+ "I-DATE": 2,
32
+ "I-LOC": 8,
33
+ "I-ORG": 6,
34
+ "I-PER": 4,
35
+ "O": 0
36
+ },
37
+ "layer_norm_eps": 1e-12,
38
+ "local_transformer_stride": 128,
39
+ "max_position_embeddings": 16384,
40
+ "model_type": "canine",
41
+ "num_attention_heads": 12,
42
+ "num_hash_buckets": 16384,
43
+ "num_hash_functions": 8,
44
+ "num_hidden_layers": 12,
45
+ "pad_token_id": 0,
46
+ "torch_dtype": "float32",
47
+ "transformers_version": "4.17.0",
48
+ "type_vocab_size": 16,
49
+ "upsampling_kernel_size": 4,
50
+ "use_cache": true
51
+ }
pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cd72fedd36bd63193f9d192bb0f30ca5e6bb37351acddf89be128237799902df
3
+ size 528594737
special_tokens_map.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"bos_token": {"content": "", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, "eos_token": {"content": "", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, "sep_token": {"content": "", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, "pad_token": {"content": "\u0000", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, "cls_token": {"content": "", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, "mask_token": {"content": "", "single_word": false, "lstrip": true, "rstrip": false, "normalized": true}}
test_predictions.txt ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"bos_token": {"content": "", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true, "__type": "AddedToken"}, "eos_token": {"content": "", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true, "__type": "AddedToken"}, "sep_token": {"content": "", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true, "__type": "AddedToken"}, "cls_token": {"content": "", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true, "__type": "AddedToken"}, "pad_token": {"content": "\u0000", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true, "__type": "AddedToken"}, "mask_token": {"content": "", "single_word": false, "lstrip": true, "rstrip": false, "normalized": true, "__type": "AddedToken"}, "add_prefix_space": false, "model_max_length": 2048, "special_tokens_map_file": "/home/mrahma45/.cache/huggingface/transformers/f8be97736b4765e3e8d559b4e7d4f1f531b1621150e5344b600684a27bc84e38.ab71f530366fe02e2834427e7b90198bfd0d573bc4279bfafdb2b95fe2b46dde", "name_or_path": "google/canine-c", "tokenizer_class": "CanineTokenizer"}
trainer_state.json ADDED
@@ -0,0 +1,169 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": 0.5339233038348082,
3
+ "best_model_checkpoint": "/scratch/mrahma45/pixel/finetuned_models/canine/canine-base-finetuned-masakhaner-kin/checkpoint-1000",
4
+ "epoch": 29.850746268656717,
5
+ "global_step": 2000,
6
+ "is_hyper_param_search": false,
7
+ "is_local_process_zero": true,
8
+ "is_world_process_zero": true,
9
+ "log_history": [
10
+ {
11
+ "epoch": 2.99,
12
+ "eval_accuracy_score": 0.8626628725475513,
13
+ "eval_f1": 0.2977635782747604,
14
+ "eval_loss": 0.40653204917907715,
15
+ "eval_precision": 0.24578059071729957,
16
+ "eval_recall": 0.37763371150729336,
17
+ "eval_runtime": 2.3533,
18
+ "eval_samples_per_second": 128.333,
19
+ "eval_steps_per_second": 16.148,
20
+ "step": 200
21
+ },
22
+ {
23
+ "epoch": 5.97,
24
+ "eval_accuracy_score": 0.8854275872397783,
25
+ "eval_f1": 0.3580729166666667,
26
+ "eval_loss": 0.36062297224998474,
27
+ "eval_precision": 0.2992383025027203,
28
+ "eval_recall": 0.44570502431118314,
29
+ "eval_runtime": 2.3498,
30
+ "eval_samples_per_second": 128.522,
31
+ "eval_steps_per_second": 16.172,
32
+ "step": 400
33
+ },
34
+ {
35
+ "epoch": 7.46,
36
+ "learning_rate": 4.865771812080537e-05,
37
+ "loss": 0.3324,
38
+ "step": 500
39
+ },
40
+ {
41
+ "epoch": 8.96,
42
+ "eval_accuracy_score": 0.902201587539314,
43
+ "eval_f1": 0.4444444444444445,
44
+ "eval_loss": 0.3250875771045685,
45
+ "eval_precision": 0.40052015604681407,
46
+ "eval_recall": 0.4991896272285251,
47
+ "eval_runtime": 2.3578,
48
+ "eval_samples_per_second": 128.086,
49
+ "eval_steps_per_second": 16.117,
50
+ "step": 600
51
+ },
52
+ {
53
+ "epoch": 11.94,
54
+ "eval_accuracy_score": 0.9062453197543807,
55
+ "eval_f1": 0.44697508896797156,
56
+ "eval_loss": 0.35800644755363464,
57
+ "eval_precision": 0.39847715736040606,
58
+ "eval_recall": 0.5089141004862237,
59
+ "eval_runtime": 2.3569,
60
+ "eval_samples_per_second": 128.132,
61
+ "eval_steps_per_second": 16.123,
62
+ "step": 800
63
+ },
64
+ {
65
+ "epoch": 14.93,
66
+ "learning_rate": 4.697986577181208e-05,
67
+ "loss": 0.0559,
68
+ "step": 1000
69
+ },
70
+ {
71
+ "epoch": 14.93,
72
+ "eval_accuracy_score": 0.9155309270630523,
73
+ "eval_f1": 0.5339233038348082,
74
+ "eval_loss": 0.3548363149166107,
75
+ "eval_precision": 0.489851150202977,
76
+ "eval_recall": 0.586709886547812,
77
+ "eval_runtime": 2.3472,
78
+ "eval_samples_per_second": 128.664,
79
+ "eval_steps_per_second": 16.19,
80
+ "step": 1000
81
+ },
82
+ {
83
+ "epoch": 17.91,
84
+ "eval_accuracy_score": 0.9156806949228695,
85
+ "eval_f1": 0.5113221329437545,
86
+ "eval_loss": 0.39484161138534546,
87
+ "eval_precision": 0.4654255319148936,
88
+ "eval_recall": 0.5672609400324149,
89
+ "eval_runtime": 2.3511,
90
+ "eval_samples_per_second": 128.453,
91
+ "eval_steps_per_second": 16.163,
92
+ "step": 1200
93
+ },
94
+ {
95
+ "epoch": 20.9,
96
+ "eval_accuracy_score": 0.9123858020068893,
97
+ "eval_f1": 0.4756446991404012,
98
+ "eval_loss": 0.4212295711040497,
99
+ "eval_precision": 0.42618741976893454,
100
+ "eval_recall": 0.5380875202593193,
101
+ "eval_runtime": 2.351,
102
+ "eval_samples_per_second": 128.457,
103
+ "eval_steps_per_second": 16.163,
104
+ "step": 1400
105
+ },
106
+ {
107
+ "epoch": 22.39,
108
+ "learning_rate": 4.530201342281879e-05,
109
+ "loss": 0.0133,
110
+ "step": 1500
111
+ },
112
+ {
113
+ "epoch": 23.88,
114
+ "eval_accuracy_score": 0.9149318556237831,
115
+ "eval_f1": 0.5033308660251665,
116
+ "eval_loss": 0.42608439922332764,
117
+ "eval_precision": 0.46321525885558584,
118
+ "eval_recall": 0.5510534846029174,
119
+ "eval_runtime": 2.3525,
120
+ "eval_samples_per_second": 128.373,
121
+ "eval_steps_per_second": 16.153,
122
+ "step": 1600
123
+ },
124
+ {
125
+ "epoch": 26.87,
126
+ "eval_accuracy_score": 0.9161299985023214,
127
+ "eval_f1": 0.53003003003003,
128
+ "eval_loss": 0.4479231536388397,
129
+ "eval_precision": 0.4937062937062937,
130
+ "eval_recall": 0.5721231766612642,
131
+ "eval_runtime": 2.3519,
132
+ "eval_samples_per_second": 128.409,
133
+ "eval_steps_per_second": 16.157,
134
+ "step": 1800
135
+ },
136
+ {
137
+ "epoch": 29.85,
138
+ "learning_rate": 4.36241610738255e-05,
139
+ "loss": 0.0058,
140
+ "step": 2000
141
+ },
142
+ {
143
+ "epoch": 29.85,
144
+ "eval_accuracy_score": 0.918076980679946,
145
+ "eval_f1": 0.5291887793783169,
146
+ "eval_loss": 0.4661569595336914,
147
+ "eval_precision": 0.49715099715099714,
148
+ "eval_recall": 0.5656401944894651,
149
+ "eval_runtime": 2.349,
150
+ "eval_samples_per_second": 128.566,
151
+ "eval_steps_per_second": 16.177,
152
+ "step": 2000
153
+ },
154
+ {
155
+ "epoch": 29.85,
156
+ "step": 2000,
157
+ "total_flos": 1.0376509207394304e+16,
158
+ "train_loss": 0.10185246992111206,
159
+ "train_runtime": 987.1722,
160
+ "train_samples_per_second": 486.237,
161
+ "train_steps_per_second": 15.195
162
+ }
163
+ ],
164
+ "max_steps": 15000,
165
+ "num_train_epochs": 224,
166
+ "total_flos": 1.0376509207394304e+16,
167
+ "trial_name": null,
168
+ "trial_params": null
169
+ }
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:424515a6dcd4dfc2371f5d5944eeefa3fd52c968da5823ee6fb66496d8860f08
3
+ size 3259