vinluvie committed on
Commit
f19b1ee
1 Parent(s): 607a579

End of training

Browse files
README.md CHANGED
@@ -15,6 +15,8 @@ should probably proofread and complete it, then remove this comment. -->
15
  # clip-vit-large-patch14-finetuned-sofas
16
 
17
  This model is a fine-tuned version of [openai/clip-vit-large-patch14](https://huggingface.co/openai/clip-vit-large-patch14) on the imagefolder dataset.
 
 
18
 
19
  ## Model description
20
 
 
15
  # clip-vit-large-patch14-finetuned-sofas
16
 
17
  This model is a fine-tuned version of [openai/clip-vit-large-patch14](https://huggingface.co/openai/clip-vit-large-patch14) on the imagefolder dataset.
18
+ It achieves the following results on the evaluation set:
19
+ - Loss: 2.6927
20
 
21
  ## Model description
22
 
all_results.json CHANGED
@@ -1,15 +1,15 @@
1
  {
2
  "epoch": 10.0,
3
- "eval_loss": 2.9003005027770996,
4
- "eval_runtime": 11.5402,
5
- "eval_samples_per_second": 4.506,
6
- "eval_steps_per_second": 0.173,
7
- "test_loss": 3.050781726837158,
8
- "test_runtime": 25.3536,
9
- "test_samples_per_second": 4.102,
10
- "test_steps_per_second": 0.158,
11
- "train_loss": 2.9446426391601563,
12
- "train_runtime": 3632.8393,
13
- "train_samples_per_second": 1.153,
14
- "train_steps_per_second": 0.039
15
  }
 
1
  {
2
  "epoch": 10.0,
3
+ "eval_loss": 2.6927454471588135,
4
+ "eval_runtime": 9.9974,
5
+ "eval_samples_per_second": 4.701,
6
+ "eval_steps_per_second": 0.2,
7
+ "test_loss": 2.9896740913391113,
8
+ "test_runtime": 20.647,
9
+ "test_samples_per_second": 4.698,
10
+ "test_steps_per_second": 0.194,
11
+ "train_loss": 2.822861735026042,
12
+ "train_runtime": 3007.5818,
13
+ "train_samples_per_second": 1.26,
14
+ "train_steps_per_second": 0.04
15
  }
eval_results.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "epoch": 10.0,
3
- "eval_loss": 2.9003005027770996,
4
- "eval_runtime": 11.5402,
5
- "eval_samples_per_second": 4.506,
6
- "eval_steps_per_second": 0.173
7
  }
 
1
  {
2
  "epoch": 10.0,
3
+ "eval_loss": 2.6927454471588135,
4
+ "eval_runtime": 9.9974,
5
+ "eval_samples_per_second": 4.701,
6
+ "eval_steps_per_second": 0.2
7
  }
preprocessor_config.json CHANGED
@@ -1,4 +1,21 @@
1
  {
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2
  "crop_size": {
3
  "height": 224,
4
  "width": 224
 
1
  {
2
+ "_valid_processor_keys": [
3
+ "images",
4
+ "do_resize",
5
+ "size",
6
+ "resample",
7
+ "do_center_crop",
8
+ "crop_size",
9
+ "do_rescale",
10
+ "rescale_factor",
11
+ "do_normalize",
12
+ "image_mean",
13
+ "image_std",
14
+ "do_convert_rgb",
15
+ "return_tensors",
16
+ "data_format",
17
+ "input_data_format"
18
+ ],
19
  "crop_size": {
20
  "height": 224,
21
  "width": 224
test_results.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
- "test_loss": 3.050781726837158,
3
- "test_runtime": 25.3536,
4
- "test_samples_per_second": 4.102,
5
- "test_steps_per_second": 0.158
6
  }
 
1
  {
2
+ "test_loss": 2.9896740913391113,
3
+ "test_runtime": 20.647,
4
+ "test_samples_per_second": 4.698,
5
+ "test_steps_per_second": 0.194
6
  }
train_results.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "epoch": 10.0,
3
- "train_loss": 2.9446426391601563,
4
- "train_runtime": 3632.8393,
5
- "train_samples_per_second": 1.153,
6
- "train_steps_per_second": 0.039
7
  }
 
1
  {
2
  "epoch": 10.0,
3
+ "train_loss": 2.822861735026042,
4
+ "train_runtime": 3007.5818,
5
+ "train_samples_per_second": 1.26,
6
+ "train_steps_per_second": 0.04
7
  }
trainer_state.json CHANGED
@@ -3,27 +3,27 @@
3
  "best_model_checkpoint": null,
4
  "epoch": 10.0,
5
  "eval_steps": 500,
6
- "global_step": 140,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
  "epoch": 10.0,
13
- "step": 140,
14
- "total_flos": 753693745889700.0,
15
- "train_loss": 2.9446426391601563,
16
- "train_runtime": 3632.8393,
17
- "train_samples_per_second": 1.153,
18
- "train_steps_per_second": 0.039
19
  }
20
  ],
21
  "logging_steps": 500,
22
- "max_steps": 140,
23
  "num_input_tokens_seen": 0,
24
  "num_train_epochs": 10,
25
  "save_steps": 500,
26
- "total_flos": 753693745889700.0,
27
  "train_batch_size": 32,
28
  "trial_name": null,
29
  "trial_params": null
 
3
  "best_model_checkpoint": null,
4
  "epoch": 10.0,
5
  "eval_steps": 500,
6
+ "global_step": 120,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
  "epoch": 10.0,
13
+ "step": 120,
14
+ "total_flos": 681742075637700.0,
15
+ "train_loss": 2.822861735026042,
16
+ "train_runtime": 3007.5818,
17
+ "train_samples_per_second": 1.26,
18
+ "train_steps_per_second": 0.04
19
  }
20
  ],
21
  "logging_steps": 500,
22
+ "max_steps": 120,
23
  "num_input_tokens_seen": 0,
24
  "num_train_epochs": 10,
25
  "save_steps": 500,
26
+ "total_flos": 681742075637700.0,
27
  "train_batch_size": 32,
28
  "trial_name": null,
29
  "trial_params": null