End of training

Browse files

Files changed (9) hide show

README.md +79 -0
all_results.json +18 -0
config.json +79 -0
eval_results.json +13 -0
model.safetensors +3 -0
preprocessor_config.json +28 -0
train_results.json +8 -0
trainer_state.json +276 -0
training_args.bin +3 -0

README.md ADDED Viewed

	@@ -0,0 +1,79 @@

+---
+library_name: transformers
+license: apache-2.0
+base_model: microsoft/beit-base-patch16-224-pt22k-ft22k
+tags:
+- generated_from_trainer
+metrics:
+- precision
+- recall
+- f1
+- accuracy
+model-index:
+- name: beit-base-patch16-224-pt22k-ft22k-finetuned-barkley
+  results: []
+---
+<!-- This model card has been generated automatically according to the information the Trainer had access to. You
+should probably proofread and complete it, then remove this comment. -->
+# beit-base-patch16-224-pt22k-ft22k-finetuned-barkley
+This model is a fine-tuned version of [microsoft/beit-base-patch16-224-pt22k-ft22k](https://huggingface.co/microsoft/beit-base-patch16-224-pt22k-ft22k) on an unknown dataset.
+It achieves the following results on the evaluation set (best checkpoint by validation loss: epoch 7, step 266):
+- Loss: 0.0079
+- Precision: 1.0
+- Recall: 1.0
+- F1: 1.0
+- Accuracy: 1.0
+- Top1 Accuracy: 1.0
+- Error Rate: 0.0
+## Model description
+More information needed
+## Intended uses & limitations
+More information needed
+## Training and evaluation data
+More information needed
+## Training procedure
+### Training hyperparameters
+The following hyperparameters were used during training:
+- learning_rate: 0.0002
+- train_batch_size: 32
+- eval_batch_size: 32
+- seed: 42
+- optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
+- lr_scheduler_type: linear
+- lr_scheduler_warmup_ratio: 0.1
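+- num_epochs: 30 (configured maximum; early stopping with patience 2 ended training after epoch 9, step 342 of 1140)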
+- mixed_precision_training: Native AMP
+### Training results
+| Training Loss | Epoch | Step | Validation Loss | Precision | Recall | F1     | Accuracy | Top1 Accuracy | Error Rate |
+|:-------------:|:-----:|:----:|:---------------:|:---------:|:------:|:------:|:--------:|:-------------:|:----------:|
+| 1.5547        | 1.0   | 38   | 1.4018          | 0.5683    | 0.4539 | 0.4240 | 0.4728   | 0.4539        | 0.5272     |
+| 1.1732        | 2.0   | 76   | 0.9193          | 0.8095    | 0.7961 | 0.7985 | 0.8077   | 0.7961        | 0.1923     |
+| 0.6764        | 3.0   | 114  | 0.3644          | 0.9488    | 0.9474 | 0.9470 | 0.9483   | 0.9474        | 0.0517     |
+| 0.2566        | 4.0   | 152  | 0.0871          | 0.9937    | 0.9934 | 0.9934 | 0.9944   | 0.9934        | 0.0056     |
+| 0.1014        | 5.0   | 190  | 0.0533          | 0.9809    | 0.9803 | 0.9802 | 0.9811   | 0.9803        | 0.0189     |
+| 0.0538        | 6.0   | 228  | 0.0208          | 1.0       | 1.0    | 1.0    | 1.0      | 1.0           | 0.0        |
+| 0.0304        | 7.0   | 266  | 0.0079          | 1.0       | 1.0    | 1.0    | 1.0      | 1.0           | 0.0        |
+| 0.0571        | 8.0   | 304  | 0.0088          | 1.0       | 1.0    | 1.0    | 1.0      | 1.0           | 0.0        |
+| 0.0608        | 9.0   | 342  | 0.0226          | 0.9936    | 0.9934 | 0.9934 | 0.9933   | 0.9934        | 0.0067     |
+### Framework versions
+- Transformers 4.44.2
+- Pytorch 2.3.1+cu121
+- Datasets 3.0.1
+- Tokenizers 0.19.1

all_results.json ADDED Viewed

	@@ -0,0 +1,18 @@

+{
+    "epoch": 9.0,
+    "eval_accuracy": 1.0,
+    "eval_error_rate": 0.0,
+    "eval_f1": 1.0,
+    "eval_loss": 0.007897687144577503,
+    "eval_precision": 1.0,
+    "eval_recall": 1.0,
+    "eval_runtime": 44.0386,
+    "eval_samples_per_second": 3.452,
+    "eval_steps_per_second": 0.114,
+    "eval_top1_accuracy": 1.0,
+    "total_flos": 8.477326613832008e+17,
+    "train_loss": 0.4405021691880031,
+    "train_runtime": 8765.8937,
+    "train_samples_per_second": 4.162,
+    "train_steps_per_second": 0.13
+}

config.json ADDED Viewed

	@@ -0,0 +1,79 @@

+{
+  "_name_or_path": "microsoft/beit-base-patch16-224-pt22k-ft22k",
+  "add_fpn": false,
+  "architectures": [
+    "BeitForImageClassification"
+  ],
+  "attention_probs_dropout_prob": 0.0,
+  "auxiliary_channels": 256,
+  "auxiliary_concat_input": false,
+  "auxiliary_loss_weight": 0.4,
+  "auxiliary_num_convs": 1,
+  "drop_path_rate": 0.1,
+  "hidden_act": "gelu",
+  "hidden_dropout_prob": 0.0,
+  "hidden_size": 768,
+  "id2label": {
+    "0": "Intsia bijuga",
+    "1": "Mangifera indica",
+    "2": "Pterocarpus indicus",
+    "3": "Roystonea regia",
+    "4": "Tabebuia"
+  },
+  "image_size": 224,
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "label2id": {
+    "Intsia bijuga": 0,
+    "Mangifera indica": 1,
+    "Pterocarpus indicus": 2,
+    "Roystonea regia": 3,
+    "Tabebuia": 4
+  },
+  "layer_norm_eps": 1e-12,
+  "layer_scale_init_value": 0.1,
+  "model_type": "beit",
+  "num_attention_heads": 12,
+  "num_channels": 3,
+  "num_hidden_layers": 12,
+  "out_features": [
+    "stage12"
+  ],
+  "out_indices": [
+    12
+  ],
+  "patch_size": 16,
+  "pool_scales": [
+    1,
+    2,
+    3,
+    6
+  ],
+  "problem_type": "single_label_classification",
+  "reshape_hidden_states": true,
+  "semantic_loss_ignore_index": 255,
+  "stage_names": [
+    "stem",
+    "stage1",
+    "stage2",
+    "stage3",
+    "stage4",
+    "stage5",
+    "stage6",
+    "stage7",
+    "stage8",
+    "stage9",
+    "stage10",
+    "stage11",
+    "stage12"
+  ],
+  "torch_dtype": "float32",
+  "transformers_version": "4.44.2",
+  "use_absolute_position_embeddings": false,
+  "use_auxiliary_head": true,
+  "use_mask_token": false,
+  "use_mean_pooling": true,
+  "use_relative_position_bias": true,
+  "use_shared_relative_position_bias": false,
+  "vocab_size": 8192
+}

eval_results.json ADDED Viewed

	@@ -0,0 +1,13 @@

+{
+    "epoch": 9.0,
+    "eval_accuracy": 1.0,
+    "eval_error_rate": 0.0,
+    "eval_f1": 1.0,
+    "eval_loss": 0.007897687144577503,
+    "eval_precision": 1.0,
+    "eval_recall": 1.0,
+    "eval_runtime": 44.0386,
+    "eval_samples_per_second": 3.452,
+    "eval_steps_per_second": 0.114,
+    "eval_top1_accuracy": 1.0
+}

model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:cb29d38667592d9d6399400c6135abd3f2eb95163b499ac1964339b9adf30c00
+size 343089556

preprocessor_config.json ADDED Viewed

	@@ -0,0 +1,28 @@

+{
+  "crop_size": {
+    "height": 224,
+    "width": 224
+  },
+  "do_center_crop": false,
+  "do_normalize": true,
+  "do_reduce_labels": false,
+  "do_rescale": true,
+  "do_resize": true,
+  "image_mean": [
+    0.5,
+    0.5,
+    0.5
+  ],
+  "image_processor_type": "BeitImageProcessor",
+  "image_std": [
+    0.5,
+    0.5,
+    0.5
+  ],
+  "resample": 2,
+  "rescale_factor": 0.00392156862745098,
+  "size": {
+    "height": 224,
+    "width": 224
+  }
+}

train_results.json ADDED Viewed

	@@ -0,0 +1,8 @@

+{
+    "epoch": 9.0,
+    "total_flos": 8.477326613832008e+17,
+    "train_loss": 0.4405021691880031,
+    "train_runtime": 8765.8937,
+    "train_samples_per_second": 4.162,
+    "train_steps_per_second": 0.13
+}

trainer_state.json ADDED Viewed

	@@ -0,0 +1,276 @@

+{
+  "best_metric": 0.007897687144577503,
+  "best_model_checkpoint": "beit-base-patch16-224-pt22k-ft22k-finetuned-barkley\\checkpoint-266",
+  "epoch": 9.0,
+  "eval_steps": 500,
+  "global_step": 342,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 1.0,
+      "train_accuracy": 0.31167763157894735
+    },
+    {
+      "epoch": 1.0,
+      "grad_norm": 12.05273151397705,
+      "learning_rate": 1.3523651731772227e-06,
+      "loss": 1.5547,
+      "step": 38
+    },
+    {
+      "epoch": 1.0,
+      "eval_accuracy": 0.472770236299648,
+      "eval_error_rate": 0.527229763700352,
+      "eval_f1": 0.4239844424393964,
+      "eval_loss": 1.4018361568450928,
+      "eval_precision": 0.568315238272393,
+      "eval_recall": 0.45394736842105265,
+      "eval_runtime": 77.2729,
+      "eval_samples_per_second": 1.967,
+      "eval_steps_per_second": 0.065,
+      "eval_top1_accuracy": 0.45394736842105265,
+      "step": 38
+    },
+    {
+      "epoch": 2.0,
+      "train_accuracy": 0.6059941520467836
+    },
+    {
+      "epoch": 2.0,
+      "grad_norm": null,
+      "learning_rate": 2.945896675096576e-06,
+      "loss": 1.1732,
+      "step": 76
+    },
+    {
+      "epoch": 2.0,
+      "eval_accuracy": 0.8077275012569132,
+      "eval_error_rate": 0.19227249874308683,
+      "eval_f1": 0.798546834840623,
+      "eval_loss": 0.9193388223648071,
+      "eval_precision": 0.8095493933458997,
+      "eval_recall": 0.7960526315789473,
+      "eval_runtime": 74.7172,
+      "eval_samples_per_second": 2.034,
+      "eval_steps_per_second": 0.067,
+      "eval_top1_accuracy": 0.7960526315789473,
+      "step": 76
+    },
+    {
+      "epoch": 3.0,
+      "train_accuracy": 0.8654970760233918
+    },
+    {
+      "epoch": 3.0,
+      "grad_norm": 9.15374755859375,
+      "learning_rate": 5.472913419787674e-06,
+      "loss": 0.6764,
+      "step": 114
+    },
+    {
+      "epoch": 3.0,
+      "eval_accuracy": 0.9483207642031172,
+      "eval_error_rate": 0.05167923579688283,
+      "eval_f1": 0.9470289415786431,
+      "eval_loss": 0.36436742544174194,
+      "eval_precision": 0.9488354259225403,
+      "eval_recall": 0.9473684210526315,
+      "eval_runtime": 76.1752,
+      "eval_samples_per_second": 1.995,
+      "eval_steps_per_second": 0.066,
+      "eval_top1_accuracy": 0.9473684210526315,
+      "step": 114
+    },
+    {
+      "epoch": 4.0,
+      "train_accuracy": 0.9649122807017544
+    },
+    {
+      "epoch": 4.0,
+      "grad_norm": 8.670642852783203,
+      "learning_rate": 8.59766441885347e-06,
+      "loss": 0.2566,
+      "step": 152
+    },
+    {
+      "epoch": 4.0,
+      "eval_accuracy": 0.9944444444444445,
+      "eval_error_rate": 0.005555555555555536,
+      "eval_f1": 0.99343678755752,
+      "eval_loss": 0.08713744580745697,
+      "eval_precision": 0.9936647173489279,
+      "eval_recall": 0.993421052631579,
+      "eval_runtime": 72.4529,
+      "eval_samples_per_second": 2.098,
+      "eval_steps_per_second": 0.069,
+      "eval_top1_accuracy": 0.993421052631579,
+      "step": 152
+    },
+    {
+      "epoch": 5.0,
+      "train_accuracy": 0.9839181286549707
+    },
+    {
+      "epoch": 5.0,
+      "grad_norm": 8.482632637023926,
+      "learning_rate": 1.1941067495001943e-05,
+      "loss": 0.1014,
+      "step": 190
+    },
+    {
+      "epoch": 5.0,
+      "eval_accuracy": 0.981111111111111,
+      "eval_error_rate": 0.018888888888888955,
+      "eval_f1": 0.980233547031901,
+      "eval_loss": 0.05328463390469551,
+      "eval_precision": 0.9808624413887572,
+      "eval_recall": 0.9802631578947368,
+      "eval_runtime": 73.3921,
+      "eval_samples_per_second": 2.071,
+      "eval_steps_per_second": 0.068,
+      "eval_top1_accuracy": 0.9802631578947368,
+      "step": 190
+    },
+    {
+      "epoch": 6.0,
+      "train_accuracy": 0.9897660818713451
+    },
+    {
+      "epoch": 6.0,
+      "grad_norm": 0.8424493670463562,
+      "learning_rate": 1.50975144835985e-05,
+      "loss": 0.0538,
+      "step": 228
+    },
+    {
+      "epoch": 6.0,
+      "eval_accuracy": 1.0,
+      "eval_error_rate": 0.0,
+      "eval_f1": 1.0,
+      "eval_loss": 0.020772233605384827,
+      "eval_precision": 1.0,
+      "eval_recall": 1.0,
+      "eval_runtime": 74.2604,
+      "eval_samples_per_second": 2.047,
+      "eval_steps_per_second": 0.067,
+      "eval_top1_accuracy": 1.0,
+      "step": 228
+    },
+    {
+      "epoch": 7.0,
+      "train_accuracy": 0.9941520467836257
+    },
+    {
+      "epoch": 7.0,
+      "grad_norm": 0.9595191478729248,
+      "learning_rate": 1.7684077977850795e-05,
+      "loss": 0.0304,
+      "step": 266
+    },
+    {
+      "epoch": 7.0,
+      "eval_accuracy": 1.0,
+      "eval_error_rate": 0.0,
+      "eval_f1": 1.0,
+      "eval_loss": 0.007897687144577503,
+      "eval_precision": 1.0,
+      "eval_recall": 1.0,
+      "eval_runtime": 69.1824,
+      "eval_samples_per_second": 2.197,
+      "eval_steps_per_second": 0.072,
+      "eval_top1_accuracy": 1.0,
+      "step": 266
+    },
+    {
+      "epoch": 8.0,
+      "train_accuracy": 0.9861111111111112
+    },
+    {
+      "epoch": 8.0,
+      "grad_norm": 2.93084454536438,
+      "learning_rate": 1.9386966536009276e-05,
+      "loss": 0.0571,
+      "step": 304
+    },
+    {
+      "epoch": 8.0,
+      "eval_accuracy": 1.0,
+      "eval_error_rate": 0.0,
+      "eval_f1": 1.0,
+      "eval_loss": 0.008802073076367378,
+      "eval_precision": 1.0,
+      "eval_recall": 1.0,
+      "eval_runtime": 59.208,
+      "eval_samples_per_second": 2.567,
+      "eval_steps_per_second": 0.084,
+      "eval_top1_accuracy": 1.0,
+      "step": 304
+    },
+    {
+      "epoch": 9.0,
+      "train_accuracy": 0.9817251461988304
+    },
+    {
+      "epoch": 9.0,
+      "grad_norm": 0.27030402421951294,
+      "learning_rate": 1.9998370404079306e-05,
+      "loss": 0.0608,
+      "step": 342
+    },
+    {
+      "epoch": 9.0,
+      "eval_accuracy": 0.9933333333333334,
+      "eval_error_rate": 0.006666666666666599,
+      "eval_f1": 0.9934103601236665,
+      "eval_loss": 0.022643933072686195,
+      "eval_precision": 0.9935988620199147,
+      "eval_recall": 0.993421052631579,
+      "eval_runtime": 54.0581,
+      "eval_samples_per_second": 2.812,
+      "eval_steps_per_second": 0.092,
+      "eval_top1_accuracy": 0.993421052631579,
+      "step": 342
+    },
+    {
+      "epoch": 9.0,
+      "step": 342,
+      "total_flos": 8.477326613832008e+17,
+      "train_loss": 0.4405021691880031,
+      "train_runtime": 8765.8937,
+      "train_samples_per_second": 4.162,
+      "train_steps_per_second": 0.13
+    }
+  ],
+  "logging_steps": 10,
+  "max_steps": 1140,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 30,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "EarlyStoppingCallback": {
+      "args": {
+        "early_stopping_patience": 2,
+        "early_stopping_threshold": 0.0
+      },
+      "attributes": {
+        "early_stopping_patience_counter": 0
+      }
+    },
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": true,
+        "should_training_stop": true
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 8.477326613832008e+17,
+  "train_batch_size": 32,
+  "trial_name": null,
+  "trial_params": null
+}

training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3db2e50743efae30a7e86a2e2dcbcd6e1e65f7aa5345f29196518285ac5a8880
+size 5176