holylovenia committed on
Commit
0785668
1 Parent(s): 60ae015

Training in progress, epoch 0

Browse files
all_results.json ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 4.9,
3
+ "eval_accuracy": 0.5555555555555556,
4
+ "eval_loss": 4.485937118530273,
5
+ "eval_runtime": 2.696,
6
+ "eval_samples_per_second": 36.721,
7
+ "eval_steps_per_second": 4.822,
8
+ "total_flos": 2.76987521728512e+16,
9
+ "train_loss": 5.3129854474748885,
10
+ "train_runtime": 102.3477,
11
+ "train_samples_per_second": 11.92,
12
+ "train_steps_per_second": 0.342
13
+ }
config.json CHANGED
@@ -1,4 +1,5 @@
1
  {
 
2
  "architectures": [
3
  "ResNetForImageClassification"
4
  ],
 
1
  {
2
+ "_name_or_path": "microsoft/resnet-50",
3
  "architectures": [
4
  "ResNetForImageClassification"
5
  ],
eval_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 4.9,
3
+ "eval_accuracy": 0.5901639344262295,
4
+ "eval_loss": 4.461605072021484,
5
+ "eval_runtime": 1.5358,
6
+ "eval_samples_per_second": 39.718,
7
+ "eval_steps_per_second": 5.209
8
+ }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c4e950fbcfbf14d2c1e5cf3f023a40f4d10a5f728328cfdc924717acad57d141
3
  size 102552257
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bbd66ca801e52eb37229e448e70f422f8cc2eb600a2509bc4f763349dc77e99f
3
  size 102552257
test_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 4.9,
3
+ "eval_accuracy": 0.5555555555555556,
4
+ "eval_loss": 4.485937118530273,
5
+ "eval_runtime": 2.696,
6
+ "eval_samples_per_second": 36.721,
7
+ "eval_steps_per_second": 4.822
8
+ }
train_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 4.9,
3
+ "total_flos": 2.76987521728512e+16,
4
+ "train_loss": 5.3129854474748885,
5
+ "train_runtime": 102.3477,
6
+ "train_samples_per_second": 11.92,
7
+ "train_steps_per_second": 0.342
8
+ }
trainer_state.json ADDED
@@ -0,0 +1,88 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": 0.5901639344262295,
3
+ "best_model_checkpoint": "problem2-test/checkpoint-21",
4
+ "epoch": 4.903225806451613,
5
+ "global_step": 35,
6
+ "is_hyper_param_search": false,
7
+ "is_local_process_zero": true,
8
+ "is_world_process_zero": true,
9
+ "log_history": [
10
+ {
11
+ "epoch": 0.9,
12
+ "eval_accuracy": 0.0,
13
+ "eval_loss": 6.274798393249512,
14
+ "eval_runtime": 1.2157,
15
+ "eval_samples_per_second": 50.175,
16
+ "eval_steps_per_second": 6.58,
17
+ "step": 7
18
+ },
19
+ {
20
+ "epoch": 1.39,
21
+ "learning_rate": 4.032258064516129e-05,
22
+ "loss": 7.4671,
23
+ "step": 10
24
+ },
25
+ {
26
+ "epoch": 1.9,
27
+ "eval_accuracy": 0.5737704918032787,
28
+ "eval_loss": 5.177652835845947,
29
+ "eval_runtime": 1.19,
30
+ "eval_samples_per_second": 51.26,
31
+ "eval_steps_per_second": 6.723,
32
+ "step": 14
33
+ },
34
+ {
35
+ "epoch": 2.77,
36
+ "learning_rate": 2.4193548387096777e-05,
37
+ "loss": 5.3033,
38
+ "step": 20
39
+ },
40
+ {
41
+ "epoch": 2.9,
42
+ "eval_accuracy": 0.5901639344262295,
43
+ "eval_loss": 4.461605072021484,
44
+ "eval_runtime": 1.0892,
45
+ "eval_samples_per_second": 56.006,
46
+ "eval_steps_per_second": 7.345,
47
+ "step": 21
48
+ },
49
+ {
50
+ "epoch": 3.9,
51
+ "eval_accuracy": 0.5245901639344263,
52
+ "eval_loss": 5.181081295013428,
53
+ "eval_runtime": 1.1367,
54
+ "eval_samples_per_second": 53.664,
55
+ "eval_steps_per_second": 7.038,
56
+ "step": 28
57
+ },
58
+ {
59
+ "epoch": 4.26,
60
+ "learning_rate": 8.064516129032258e-06,
61
+ "loss": 4.1105,
62
+ "step": 30
63
+ },
64
+ {
65
+ "epoch": 4.9,
66
+ "eval_accuracy": 0.5573770491803278,
67
+ "eval_loss": 4.228121757507324,
68
+ "eval_runtime": 1.1738,
69
+ "eval_samples_per_second": 51.966,
70
+ "eval_steps_per_second": 6.815,
71
+ "step": 35
72
+ },
73
+ {
74
+ "epoch": 4.9,
75
+ "step": 35,
76
+ "total_flos": 2.76987521728512e+16,
77
+ "train_loss": 5.3129854474748885,
78
+ "train_runtime": 102.3477,
79
+ "train_samples_per_second": 11.92,
80
+ "train_steps_per_second": 0.342
81
+ }
82
+ ],
83
+ "max_steps": 35,
84
+ "num_train_epochs": 5,
85
+ "total_flos": 2.76987521728512e+16,
86
+ "trial_name": null,
87
+ "trial_params": null
88
+ }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0fd18edac8f43b5874de7efd29fa4bed4ebcd9f4751592d4f4414bcf8457b809
3
- size 3375
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7889c739104d31b8ec179af3c7fc7b7a9ca53be12e0f39a2ad3ffa3a02a26b81
3
+ size 3311