Alani19 committed on
Commit
2a5048b
1 Parent(s): e15ed37

Upload folder using huggingface_hub

Browse files
checkpoint-60/config.json ADDED
@@ -0,0 +1,35 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "distilbert-base-uncased-finetuned-sst-2-english",
3
+ "activation": "gelu",
4
+ "architectures": [
5
+ "DistilBertForSequenceClassification"
6
+ ],
7
+ "attention_dropout": 0.1,
8
+ "dim": 768,
9
+ "dropout": 0.1,
10
+ "finetuning_task": "sst-2",
11
+ "hidden_dim": 3072,
12
+ "id2label": {
13
+ "0": "NEGATIVE",
14
+ "1": "POSITIVE"
15
+ },
16
+ "initializer_range": 0.02,
17
+ "label2id": {
18
+ "NEGATIVE": 0,
19
+ "POSITIVE": 1
20
+ },
21
+ "max_position_embeddings": 512,
22
+ "model_type": "distilbert",
23
+ "n_heads": 12,
24
+ "n_layers": 6,
25
+ "output_past": true,
26
+ "pad_token_id": 0,
27
+ "problem_type": "single_label_classification",
28
+ "qa_dropout": 0.1,
29
+ "seq_classif_dropout": 0.2,
30
+ "sinusoidal_pos_embds": false,
31
+ "tie_weights_": true,
32
+ "torch_dtype": "float32",
33
+ "transformers_version": "4.42.3",
34
+ "vocab_size": 30522
35
+ }
checkpoint-60/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a60d012f2ffc4e98b6a73a23cba6b48e950612ead91cb136a2448cb238ad9b3b
3
+ size 267832560
checkpoint-60/optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e4adaa201633b91242a4d05660189a3fce4c52c8bc83f5005733018fdae21ec2
3
+ size 535724410
checkpoint-60/rng_state.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:04a119a464492964f206274d8c2cfc18a0c7b06c76c10f05f3e33943615fdd62
3
+ size 13990
checkpoint-60/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:90979e82e94259c1d6f68c5ef23bb17c7019c0bbe3422cf6d46e9cdac106c874
3
+ size 1064
checkpoint-60/trainer_state.json ADDED
@@ -0,0 +1,65 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": null,
3
+ "best_model_checkpoint": null,
4
+ "epoch": 3.0,
5
+ "eval_steps": 500,
6
+ "global_step": 60,
7
+ "is_hyper_param_search": false,
8
+ "is_local_process_zero": true,
9
+ "is_world_process_zero": true,
10
+ "log_history": [
11
+ {
12
+ "epoch": 1.0,
13
+ "eval_accuracy": 0.85,
14
+ "eval_loss": 0.3328920304775238,
15
+ "eval_runtime": 19.3098,
16
+ "eval_samples_per_second": 2.071,
17
+ "eval_steps_per_second": 0.259,
18
+ "step": 20
19
+ },
20
+ {
21
+ "epoch": 1.5,
22
+ "grad_norm": 1.1108067035675049,
23
+ "learning_rate": 2.5e-05,
24
+ "loss": 0.5935,
25
+ "step": 30
26
+ },
27
+ {
28
+ "epoch": 2.0,
29
+ "eval_accuracy": 0.9,
30
+ "eval_loss": 0.36818569898605347,
31
+ "eval_runtime": 19.4153,
32
+ "eval_samples_per_second": 2.06,
33
+ "eval_steps_per_second": 0.258,
34
+ "step": 40
35
+ },
36
+ {
37
+ "epoch": 3.0,
38
+ "grad_norm": 0.13847129046916962,
39
+ "learning_rate": 0.0,
40
+ "loss": 0.1087,
41
+ "step": 60
42
+ }
43
+ ],
44
+ "logging_steps": 30,
45
+ "max_steps": 60,
46
+ "num_input_tokens_seen": 0,
47
+ "num_train_epochs": 3,
48
+ "save_steps": 500,
49
+ "stateful_callbacks": {
50
+ "TrainerControl": {
51
+ "args": {
52
+ "should_epoch_stop": false,
53
+ "should_evaluate": false,
54
+ "should_log": false,
55
+ "should_save": true,
56
+ "should_training_stop": true
57
+ },
58
+ "attributes": {}
59
+ }
60
+ },
61
+ "total_flos": 63584351354880.0,
62
+ "train_batch_size": 8,
63
+ "trial_name": null,
64
+ "trial_params": null
65
+ }
checkpoint-60/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e464a2625faac84ce28854b56aa22de40827a7f85f1a107d48ed87dd3b21ad4e
3
+ size 5176
checkpoint-87/config.json ADDED
@@ -0,0 +1,35 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "distilbert-base-uncased-finetuned-sst-2-english",
3
+ "activation": "gelu",
4
+ "architectures": [
5
+ "DistilBertForSequenceClassification"
6
+ ],
7
+ "attention_dropout": 0.1,
8
+ "dim": 768,
9
+ "dropout": 0.1,
10
+ "finetuning_task": "sst-2",
11
+ "hidden_dim": 3072,
12
+ "id2label": {
13
+ "0": "NEGATIVE",
14
+ "1": "POSITIVE"
15
+ },
16
+ "initializer_range": 0.02,
17
+ "label2id": {
18
+ "NEGATIVE": 0,
19
+ "POSITIVE": 1
20
+ },
21
+ "max_position_embeddings": 512,
22
+ "model_type": "distilbert",
23
+ "n_heads": 12,
24
+ "n_layers": 6,
25
+ "output_past": true,
26
+ "pad_token_id": 0,
27
+ "problem_type": "single_label_classification",
28
+ "qa_dropout": 0.1,
29
+ "seq_classif_dropout": 0.2,
30
+ "sinusoidal_pos_embds": false,
31
+ "tie_weights_": true,
32
+ "torch_dtype": "float32",
33
+ "transformers_version": "4.42.3",
34
+ "vocab_size": 30522
35
+ }
checkpoint-87/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5a349c1e5d4576d99c61c5ead350f35b91a4fbb43cf87cfca993c4dfe810e20e
3
+ size 267832560
checkpoint-87/optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:64e2aa63acc3789e5a7f3727f9899c9bb65506fef07d9145ce744d3409f9e587
3
+ size 535724410
checkpoint-87/rng_state.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:38389f072ec0d30f99df13707be5ca1cb3d208dba29a5dccc9e3baee97162213
3
+ size 13990
checkpoint-87/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b32b93c709a450374c8a5d9ec8dd207b166bccf542e023947107eae5bd3a09cb
3
+ size 1064
checkpoint-87/trainer_state.json ADDED
@@ -0,0 +1,65 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": null,
3
+ "best_model_checkpoint": null,
4
+ "epoch": 3.0,
5
+ "eval_steps": 500,
6
+ "global_step": 87,
7
+ "is_hyper_param_search": false,
8
+ "is_local_process_zero": true,
9
+ "is_world_process_zero": true,
10
+ "log_history": [
11
+ {
12
+ "epoch": 1.0,
13
+ "eval_accuracy": 0.9,
14
+ "eval_loss": 0.2707670331001282,
15
+ "eval_runtime": 19.5658,
16
+ "eval_samples_per_second": 2.044,
17
+ "eval_steps_per_second": 0.256,
18
+ "step": 29
19
+ },
20
+ {
21
+ "epoch": 1.0344827586206897,
22
+ "grad_norm": 4.015429496765137,
23
+ "learning_rate": 3.275862068965517e-05,
24
+ "loss": 0.7211,
25
+ "step": 30
26
+ },
27
+ {
28
+ "epoch": 2.0,
29
+ "eval_accuracy": 0.9,
30
+ "eval_loss": 0.34923750162124634,
31
+ "eval_runtime": 19.9116,
32
+ "eval_samples_per_second": 2.009,
33
+ "eval_steps_per_second": 0.251,
34
+ "step": 58
35
+ },
36
+ {
37
+ "epoch": 2.0689655172413794,
38
+ "grad_norm": 0.996155321598053,
39
+ "learning_rate": 1.5517241379310346e-05,
40
+ "loss": 0.1894,
41
+ "step": 60
42
+ }
43
+ ],
44
+ "logging_steps": 30,
45
+ "max_steps": 87,
46
+ "num_input_tokens_seen": 0,
47
+ "num_train_epochs": 3,
48
+ "save_steps": 500,
49
+ "stateful_callbacks": {
50
+ "TrainerControl": {
51
+ "args": {
52
+ "should_epoch_stop": false,
53
+ "should_evaluate": false,
54
+ "should_log": false,
55
+ "should_save": true,
56
+ "should_training_stop": true
57
+ },
58
+ "attributes": {}
59
+ }
60
+ },
61
+ "total_flos": 90210298484736.0,
62
+ "train_batch_size": 8,
63
+ "trial_name": null,
64
+ "trial_params": null
65
+ }
checkpoint-87/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e464a2625faac84ce28854b56aa22de40827a7f85f1a107d48ed87dd3b21ad4e
3
+ size 5176
model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5a349c1e5d4576d99c61c5ead350f35b91a4fbb43cf87cfca993c4dfe810e20e
3
+ size 267832560
runs/Jul09_19-53-12_DESKTOP-O6LJL2H/events.out.tfevents.1720576420.DESKTOP-O6LJL2H.5552.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b72dd11f93110a659fb32463346dc5c2ab88113b855925773493a79e2986d4e3
3
+ size 6718
runs/Jul09_19-53-12_DESKTOP-O6LJL2H/events.out.tfevents.1720581251.DESKTOP-O6LJL2H.5552.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d7bf80709b1aa11b47f65921e7c8e05fd3f4e529a44cd2670335dddb35eaa9ef
3
+ size 6718
runs/Jul09_19-53-12_DESKTOP-O6LJL2H/events.out.tfevents.1720582067.DESKTOP-O6LJL2H.5552.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:815fa1a110d9220935fb3d2a36f95f6559a90223f93ef3c1abbbe99fb0e087ed
3
+ size 405