crangana committed on
Commit
5cdda77
1 Parent(s): 9d3e1c4

End of training

Browse files
README.md ADDED
@@ -0,0 +1,85 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ license: apache-2.0
3
+ base_model: microsoft/resnet-50
4
+ tags:
5
+ - generated_from_trainer
6
+ datasets:
7
+ - fair_face
8
+ metrics:
9
+ - accuracy
10
+ model-index:
11
+ - name: trained-gender
12
+ results:
13
+ - task:
14
+ name: Image Classification
15
+ type: image-classification
16
+ dataset:
17
+ name: fair_face
18
+ type: fair_face
19
+ config: '0.25'
20
+ split: validation
21
+ args: '0.25'
22
+ metrics:
23
+ - name: Accuracy
24
+ type: accuracy
25
+ value: 0.8985758626985576
26
+ ---
27
+
28
+ <!-- This model card has been generated automatically according to the information the Trainer had access to. You
29
+ should probably proofread and complete it, then remove this comment. -->
30
+
31
+ # trained-gender
32
+
33
+ This model is a fine-tuned version of [microsoft/resnet-50](https://huggingface.co/microsoft/resnet-50) on the fair_face dataset.
34
+ It achieves the following results on the evaluation set (final logged evaluation, step 11000, epoch 2.03):
35
+ - Loss: 0.2437
36
+ - Accuracy: 0.8986
37
+
38
+ ## Model description
39
+
40
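+ A ResNet-50 image classifier (`ResNetForImageClassification`) fine-tuned for single-label classification with two output labels: `Male` (id 0) and `Female` (id 1). More information needed.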
41
+
42
+ ## Intended uses & limitations
43
+
44
+ More information needed
45
+
46
+ ## Training and evaluation data
47
+
48
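+ The model was fine-tuned on the fair_face dataset (config `0.25`); the reported metrics were computed on its `validation` split. More information needed.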
49
+
50
+ ## Training procedure
51
+
52
+ ### Training hyperparameters
53
+
54
+ The following hyperparameters were used during training:
55
+ - learning_rate: 0.0002
56
+ - train_batch_size: 16
57
+ - eval_batch_size: 8
58
+ - seed: 42
59
+ - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
60
+ - lr_scheduler_type: linear
61
+ - num_epochs: 4 (configured value; the logged training results end at epoch 2.03)
62
+
63
+ ### Training results
64
+
65
+ | Training Loss | Epoch | Step | Validation Loss | Accuracy |
66
+ |:-------------:|:-----:|:-----:|:---------------:|:--------:|
67
+ | 0.4277 | 0.18 | 1000 | 0.4054 | 0.8089 |
68
+ | 0.315 | 0.37 | 2000 | 0.3487 | 0.8318 |
69
+ | 0.3082 | 0.55 | 3000 | 0.3052 | 0.8633 |
70
+ | 0.3235 | 0.74 | 4000 | 0.2899 | 0.8684 |
71
+ | 0.2505 | 0.92 | 5000 | 0.2693 | 0.8785 |
72
+ | 0.2484 | 1.11 | 6000 | 0.2547 | 0.8889 |
73
+ | 0.1933 | 1.29 | 7000 | 0.2521 | 0.8901 |
74
+ | 0.1497 | 1.48 | 8000 | 0.2443 | 0.8929 |
75
+ | 0.326 | 1.66 | 9000 | 0.2406 | 0.8958 |
76
+ | 0.215 | 1.84 | 10000 | 0.2381 | 0.9007 |
77
+ | 0.2035 | 2.03 | 11000 | 0.2437 | 0.8986 |
78
+
79
+
80
+ ### Framework versions
81
+
82
+ - Transformers 4.34.0
83
+ - Pytorch 2.0.1+cu118
84
+ - Datasets 2.14.5
85
+ - Tokenizers 0.14.0
all_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 2.03,
3
+ "total_flos": 3.7370912368449946e+18,
4
+ "train_loss": 0.29799577762321994,
5
+ "train_runtime": 2883.713,
6
+ "train_samples_per_second": 120.323,
7
+ "train_steps_per_second": 7.521
8
+ }
config.json ADDED
@@ -0,0 +1,48 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "microsoft/resnet-50",
3
+ "architectures": [
4
+ "ResNetForImageClassification"
5
+ ],
6
+ "depths": [
7
+ 3,
8
+ 4,
9
+ 6,
10
+ 3
11
+ ],
12
+ "downsample_in_first_stage": false,
13
+ "embedding_size": 64,
14
+ "hidden_act": "relu",
15
+ "hidden_sizes": [
16
+ 256,
17
+ 512,
18
+ 1024,
19
+ 2048
20
+ ],
21
+ "id2label": {
22
+ "0": "Male",
23
+ "1": "Female"
24
+ },
25
+ "label2id": {
26
+ "Female": "1",
27
+ "Male": "0"
28
+ },
29
+ "layer_type": "bottleneck",
30
+ "model_type": "resnet",
31
+ "num_channels": 3,
32
+ "out_features": [
33
+ "stage4"
34
+ ],
35
+ "out_indices": [
36
+ 4
37
+ ],
38
+ "problem_type": "single_label_classification",
39
+ "stage_names": [
40
+ "stem",
41
+ "stage1",
42
+ "stage2",
43
+ "stage3",
44
+ "stage4"
45
+ ],
46
+ "torch_dtype": "float32",
47
+ "transformers_version": "4.34.0"
48
+ }
preprocessor_config.json ADDED
@@ -0,0 +1,23 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "crop_pct": 0.875,
3
+ "do_normalize": true,
4
+ "do_rescale": true,
5
+ "do_resize": true,
6
+ "feature_extractor_type": "ConvNextFeatureExtractor",
7
+ "image_mean": [
8
+ 0.485,
9
+ 0.456,
10
+ 0.406
11
+ ],
12
+ "image_processor_type": "ConvNextFeatureExtractor",
13
+ "image_std": [
14
+ 0.229,
15
+ 0.224,
16
+ 0.225
17
+ ],
18
+ "resample": 3,
19
+ "rescale_factor": 0.00392156862745098,
20
+ "size": {
21
+ "shortest_edge": 224
22
+ }
23
+ }
pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f2f520d9bb1efdbeabea0393c82d7a8c638a5b86e6c3f18838b3d4d55f3cafcc
3
+ size 94374989
train_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 2.03,
3
+ "total_flos": 3.7370912368449946e+18,
4
+ "train_loss": 0.29799577762321994,
5
+ "train_runtime": 2883.713,
6
+ "train_samples_per_second": 120.323,
7
+ "train_steps_per_second": 7.521
8
+ }
trainer_state.json ADDED
The diff for this file is too large to render. See raw diff
 
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e622ea34b3a4b39362b93e7e14f202c46480012779b94791d9dfa10e1ec1fbf9
3
+ size 4027