kgoli committed on
Commit
9f4cc2e
1 Parent(s): a832976

Training in progress, epoch 1

Browse files
all_results.json CHANGED
@@ -1,13 +1,13 @@
1
  {
2
- "epoch": 3.0,
3
  "eval_accuracy": 0.6923076923076923,
4
  "eval_loss": 0.6873394846916199,
5
  "eval_runtime": 1.5094,
6
  "eval_samples_per_second": 17.226,
7
  "eval_steps_per_second": 0.663,
8
- "total_flos": 7086826637549568.0,
9
- "train_loss": 0.6862780253092448,
10
- "train_runtime": 87.2572,
11
- "train_samples_per_second": 8.045,
12
- "train_steps_per_second": 0.069
13
  }
 
1
  {
2
+ "epoch": 10.0,
3
  "eval_accuracy": 0.6923076923076923,
4
  "eval_loss": 0.6873394846916199,
5
  "eval_runtime": 1.5094,
6
  "eval_samples_per_second": 17.226,
7
  "eval_steps_per_second": 0.663,
8
+ "total_flos": 2.362275545849856e+16,
9
+ "train_loss": 0.6464766740798951,
10
+ "train_runtime": 277.8757,
11
+ "train_samples_per_second": 8.421,
12
+ "train_steps_per_second": 0.072
13
  }
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "./hfmodel",
3
  "architectures": [
4
  "ResNetForImageClassification"
5
  ],
 
1
  {
2
+ "_name_or_path": "microsoft/resnet-18",
3
  "architectures": [
4
  "ResNetForImageClassification"
5
  ],
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1eca31df85fd98510c6b498db935abb6402a6f046c8da18b849612d1642e9497
3
  size 44764336
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2ae71a5cee240902541c0d471dcce4708ef5ce660d3aff8a3b045f88a0a77a4f
3
  size 44764336
runs/May16_15-12-00_goku2/events.out.tfevents.1715872373.goku2.4604.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:45a81f55791fa6dc1bae91b76f5b8b8e1b072c86328cde87b470fb7e3ff49a9e
3
+ size 5128
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 3.0,
3
- "total_flos": 7086826637549568.0,
4
- "train_loss": 0.6862780253092448,
5
- "train_runtime": 87.2572,
6
- "train_samples_per_second": 8.045,
7
- "train_steps_per_second": 0.069
8
  }
 
1
  {
2
+ "epoch": 10.0,
3
+ "total_flos": 2.362275545849856e+16,
4
+ "train_loss": 0.6464766740798951,
5
+ "train_runtime": 277.8757,
6
+ "train_samples_per_second": 8.421,
7
+ "train_steps_per_second": 0.072
8
  }
trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": 0.6923076923076923,
3
  "best_model_checkpoint": "resnet-18-finetuned-fraud/checkpoint-2",
4
- "epoch": 3.0,
5
  "eval_steps": 500,
6
- "global_step": 6,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -11,46 +11,123 @@
11
  {
12
  "epoch": 1.0,
13
  "eval_accuracy": 0.6923076923076923,
14
- "eval_loss": 0.6873394846916199,
15
- "eval_runtime": 1.7943,
16
- "eval_samples_per_second": 14.49,
17
- "eval_steps_per_second": 0.557,
18
  "step": 2
19
  },
20
  {
21
  "epoch": 2.0,
22
  "eval_accuracy": 0.6923076923076923,
23
- "eval_loss": 0.6751973032951355,
24
- "eval_runtime": 1.6274,
25
- "eval_samples_per_second": 15.976,
26
- "eval_steps_per_second": 0.614,
27
  "step": 4
28
  },
29
  {
30
  "epoch": 3.0,
31
  "eval_accuracy": 0.6923076923076923,
32
- "eval_loss": 0.6680338382720947,
33
- "eval_runtime": 1.6065,
34
- "eval_samples_per_second": 16.184,
35
- "eval_steps_per_second": 0.622,
36
  "step": 6
37
  },
38
  {
39
- "epoch": 3.0,
40
- "step": 6,
41
- "total_flos": 7086826637549568.0,
42
- "train_loss": 0.6862780253092448,
43
- "train_runtime": 87.2572,
44
- "train_samples_per_second": 8.045,
45
- "train_steps_per_second": 0.069
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
46
  }
47
  ],
48
  "logging_steps": 10,
49
- "max_steps": 6,
50
  "num_input_tokens_seen": 0,
51
- "num_train_epochs": 3,
52
  "save_steps": 500,
53
- "total_flos": 7086826637549568.0,
54
  "train_batch_size": 32,
55
  "trial_name": null,
56
  "trial_params": null
 
1
  {
2
  "best_metric": 0.6923076923076923,
3
  "best_model_checkpoint": "resnet-18-finetuned-fraud/checkpoint-2",
4
+ "epoch": 10.0,
5
  "eval_steps": 500,
6
+ "global_step": 20,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
11
  {
12
  "epoch": 1.0,
13
  "eval_accuracy": 0.6923076923076923,
14
+ "eval_loss": 0.6821401119232178,
15
+ "eval_runtime": 1.7618,
16
+ "eval_samples_per_second": 14.757,
17
+ "eval_steps_per_second": 0.568,
18
  "step": 2
19
  },
20
  {
21
  "epoch": 2.0,
22
  "eval_accuracy": 0.6923076923076923,
23
+ "eval_loss": 0.6628227829933167,
24
+ "eval_runtime": 1.6027,
25
+ "eval_samples_per_second": 16.223,
26
+ "eval_steps_per_second": 0.624,
27
  "step": 4
28
  },
29
  {
30
  "epoch": 3.0,
31
  "eval_accuracy": 0.6923076923076923,
32
+ "eval_loss": 0.6421977281570435,
33
+ "eval_runtime": 1.6359,
34
+ "eval_samples_per_second": 15.894,
35
+ "eval_steps_per_second": 0.611,
36
  "step": 6
37
  },
38
  {
39
+ "epoch": 4.0,
40
+ "eval_accuracy": 0.6923076923076923,
41
+ "eval_loss": 0.6217892169952393,
42
+ "eval_runtime": 1.6129,
43
+ "eval_samples_per_second": 16.12,
44
+ "eval_steps_per_second": 0.62,
45
+ "step": 8
46
+ },
47
+ {
48
+ "epoch": 5.0,
49
+ "grad_norm": 3.009413242340088,
50
+ "learning_rate": 2.777777777777778e-05,
51
+ "loss": 0.6696,
52
+ "step": 10
53
+ },
54
+ {
55
+ "epoch": 5.0,
56
+ "eval_accuracy": 0.6923076923076923,
57
+ "eval_loss": 0.6059156656265259,
58
+ "eval_runtime": 1.6613,
59
+ "eval_samples_per_second": 15.65,
60
+ "eval_steps_per_second": 0.602,
61
+ "step": 10
62
+ },
63
+ {
64
+ "epoch": 6.0,
65
+ "eval_accuracy": 0.6923076923076923,
66
+ "eval_loss": 0.5922008752822876,
67
+ "eval_runtime": 1.4671,
68
+ "eval_samples_per_second": 17.723,
69
+ "eval_steps_per_second": 0.682,
70
+ "step": 12
71
+ },
72
+ {
73
+ "epoch": 7.0,
74
+ "eval_accuracy": 0.6923076923076923,
75
+ "eval_loss": 0.5782066583633423,
76
+ "eval_runtime": 1.5993,
77
+ "eval_samples_per_second": 16.257,
78
+ "eval_steps_per_second": 0.625,
79
+ "step": 14
80
+ },
81
+ {
82
+ "epoch": 8.0,
83
+ "eval_accuracy": 0.6923076923076923,
84
+ "eval_loss": 0.5681060552597046,
85
+ "eval_runtime": 1.508,
86
+ "eval_samples_per_second": 17.242,
87
+ "eval_steps_per_second": 0.663,
88
+ "step": 16
89
+ },
90
+ {
91
+ "epoch": 9.0,
92
+ "eval_accuracy": 0.6923076923076923,
93
+ "eval_loss": 0.5619844198226929,
94
+ "eval_runtime": 1.6504,
95
+ "eval_samples_per_second": 15.754,
96
+ "eval_steps_per_second": 0.606,
97
+ "step": 18
98
+ },
99
+ {
100
+ "epoch": 10.0,
101
+ "grad_norm": 3.1605825424194336,
102
+ "learning_rate": 0.0,
103
+ "loss": 0.6234,
104
+ "step": 20
105
+ },
106
+ {
107
+ "epoch": 10.0,
108
+ "eval_accuracy": 0.6923076923076923,
109
+ "eval_loss": 0.5624192357063293,
110
+ "eval_runtime": 1.4997,
111
+ "eval_samples_per_second": 17.337,
112
+ "eval_steps_per_second": 0.667,
113
+ "step": 20
114
+ },
115
+ {
116
+ "epoch": 10.0,
117
+ "step": 20,
118
+ "total_flos": 2.362275545849856e+16,
119
+ "train_loss": 0.6464766740798951,
120
+ "train_runtime": 277.8757,
121
+ "train_samples_per_second": 8.421,
122
+ "train_steps_per_second": 0.072
123
  }
124
  ],
125
  "logging_steps": 10,
126
+ "max_steps": 20,
127
  "num_input_tokens_seen": 0,
128
+ "num_train_epochs": 10,
129
  "save_steps": 500,
130
+ "total_flos": 2.362275545849856e+16,
131
  "train_batch_size": 32,
132
  "trial_name": null,
133
  "trial_params": null
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a1c9438ce0ead107b64ca22a0d18d49ec750844ddba5d3926b4c64f726172a98
3
  size 5048
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:43bf2011d4389d0100877b2d1dc641cbbf8cc9cedc1dc9a974b1d23500c819da
3
  size 5048