Fulwa committed
Commit d3cab50
1 Parent(s): a22d31b

End of training

Files changed (5)
  1. README.md +11 -11
  2. config.json +23 -21
  3. model.safetensors +2 -2
  4. preprocessor_config.json +16 -1
  5. training_args.bin +2 -2
README.md CHANGED
@@ -17,8 +17,8 @@ should probably proofread and complete it, then remove this comment. -->
  
  This model is a fine-tuned version of [MCG-NJU/videomae-base](https://huggingface.co/MCG-NJU/videomae-base) on an unknown dataset.
  It achieves the following results on the evaluation set:
- - Loss: 0.9664
- - Accuracy: 0.6
+ - Loss: 2.3963
+ - Accuracy: 0.1154
  
  ## Model description
  
@@ -44,20 +44,20 @@ The following hyperparameters were used during training:
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
  - lr_scheduler_type: linear
  - lr_scheduler_warmup_ratio: 0.1
- - training_steps: 100
+ - training_steps: 36
  
  ### Training results
  
- | Training Loss | Epoch | Step | Validation Loss | Accuracy |
- |:-------------:|:-----:|:----:|:---------------:|:--------:|
- | 2.0855        | 0.38  | 38   | 1.8140          | 0.3      |
- | 1.1008        | 1.38  | 76   | 1.1303          | 0.5571   |
- | 0.6874        | 2.24  | 100  | 0.9664          | 0.6      |
+ | Training Loss | Epoch  | Step | Validation Loss | Accuracy |
+ |:-------------:|:------:|:----:|:---------------:|:--------:|
+ | 2.4449        | 0.3889 | 14   | 2.4051          | 0.0769   |
+ | 2.4615        | 1.3889 | 28   | 2.3911          | 0.1154   |
+ | 2.4631        | 2.2222 | 36   | 2.3963          | 0.1154   |
  
  
  ### Framework versions
  
- - Transformers 4.36.2
- - Pytorch 2.3.0+rocm6.0
+ - Transformers 4.40.1
+ - Pytorch 2.1.2+rocm6.0
  - Datasets 2.19.1
- - Tokenizers 0.15.2
+ - Tokenizers 0.19.1
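For a quick sanity check of a checkpoint like this, a minimal inference sketch; the repo id `Fulwa/videomae-base-finetuned` is a placeholder for this model's actual Hub id, and the random clip stands in for a real 16-frame video:

```python
import numpy as np
import torch
from transformers import VideoMAEImageProcessor, VideoMAEForVideoClassification

# Placeholder repo id: substitute this model's actual Hub id.
repo_id = "Fulwa/videomae-base-finetuned"

processor = VideoMAEImageProcessor.from_pretrained(repo_id)
model = VideoMAEForVideoClassification.from_pretrained(repo_id)

# VideoMAE consumes 16-frame clips; a random clip stands in for real video.
video = [np.random.randint(0, 256, (224, 224, 3), dtype=np.uint8) for _ in range(16)]

inputs = processor(video, return_tensors="pt")
with torch.no_grad():
    logits = model(**inputs).logits

# Map the winning logit back through the id2label table from config.json.
print(model.config.id2label[logits.argmax(-1).item()])
```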
config.json CHANGED
@@ -12,31 +12,33 @@
  "hidden_dropout_prob": 0.0,
  "hidden_size": 768,
  "id2label": {
-   "0": "ApplyEyeMakeup",
-   "1": "BasketballDunk",
-   "2": "ApplyLipstick",
-   "3": "BaseballPitch",
-   "4": "BenchPress",
-   "5": "Basketball",
-   "6": "BalanceBeam",
-   "7": "BandMarching",
-   "8": "Archery",
-   "9": "BabyCrawling"
+   "0": " Book",
+   "1": " Ball",
+   "2": " Afternoon",
+   "3": "Animal",
+   "4": " Boat",
+   "5": " Bank",
+   "6": " Actor",
+   "7": " Blue",
+   "8": "child",
+   "9": "bathroom",
+   "10": " Chair"
  },
  "image_size": 224,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "label2id": {
-   "ApplyEyeMakeup": 0,
-   "ApplyLipstick": 2,
-   "Archery": 8,
-   "BabyCrawling": 9,
-   "BalanceBeam": 6,
-   "BandMarching": 7,
-   "BaseballPitch": 3,
-   "Basketball": 5,
-   "BasketballDunk": 1,
-   "BenchPress": 4
+   " Actor": 6,
+   " Afternoon": 2,
+   " Ball": 1,
+   " Bank": 5,
+   " Blue": 7,
+   " Boat": 4,
+   " Book": 0,
+   " Chair": 10,
+   "Animal": 3,
+   "bathroom": 9,
+   "child": 8
  },
  "layer_norm_eps": 1e-12,
  "model_type": "videomae",
@@ -49,7 +51,7 @@
  "problem_type": "single_label_classification",
  "qkv_bias": true,
  "torch_dtype": "float32",
- "transformers_version": "4.36.2",
+ "transformers_version": "4.40.1",
  "tubelet_size": 2,
  "use_mean_pooling": false
  }
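One quirk worth flagging in the new label maps: most entries are stored with a leading space (" Book", " Ball", " Chair") while "Animal", "child", and "bathroom" are not, so exact-string lookups into `label2id` will miss unless they reproduce the stored spelling. A tolerant lookup can normalize on both sides; the sketch below assumes a placeholder repo id, and the normalization is my addition, not part of the checkpoint:

```python
from transformers import AutoConfig

# Placeholder repo id: substitute this model's actual Hub id.
config = AutoConfig.from_pretrained("Fulwa/videomae-base-finetuned")

def label_to_id(label: str) -> int:
    """Look up a class id while tolerating the stray leading spaces and
    inconsistent casing in this config's label2id table."""
    normalized = {k.strip().lower(): v for k, v in config.label2id.items()}
    return normalized[label.strip().lower()]

print(label_to_id("Book"))  # 0, even though the stored key is " Book"
```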
model.safetensors CHANGED
@@ -1,3 +1,3 @@
  version https://git-lfs.github.com/spec/v1
- oid sha256:9fbf010135175af726b8aeff637245fa77d3843172bd52171c0984808e32c14f
- size 344961984
+ oid sha256:faa8c3932321cd311c0c568725d9395b07e6e76a15514770eed364a3eb655f50
+ size 344965060
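The 3,076-byte growth in the weights file (344,965,060 − 344,961,984) is consistent with the classifier head gaining one output for the eleventh label: one extra row of 768 float32 weights plus one bias is (768 + 1) × 4 bytes = 3,076 bytes, with `hidden_size` 768 and `torch_dtype` float32 taken from config.json.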
preprocessor_config.json CHANGED
@@ -1,4 +1,20 @@
  {
+ "_valid_processor_keys": [
+   "videos",
+   "do_resize",
+   "size",
+   "resample",
+   "do_center_crop",
+   "crop_size",
+   "do_rescale",
+   "rescale_factor",
+   "do_normalize",
+   "image_mean",
+   "image_std",
+   "return_tensors",
+   "data_format",
+   "input_data_format"
+ ],
  "crop_size": {
    "height": 224,
    "width": 224
@@ -7,7 +23,6 @@
  "do_normalize": true,
  "do_rescale": true,
  "do_resize": true,
- "feature_extractor_type": "VideoMAEFeatureExtractor",
  "image_mean": [
    0.485,
    0.456,
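The added `_valid_processor_keys` block looks like the per-call kwarg allowlist that recent transformers image processors use, and the dropped `feature_extractor_type` is a leftover from the deprecated feature-extractor API; I'm inferring both from the key names rather than from this repo. Assuming that reading, any listed key can be overridden at call time instead of edited into the config (placeholder repo id again):

```python
import numpy as np
from transformers import VideoMAEImageProcessor

# Placeholder repo id: substitute this model's actual Hub id.
processor = VideoMAEImageProcessor.from_pretrained("Fulwa/videomae-base-finetuned")

# do_center_crop appears in _valid_processor_keys, so it can be passed
# per call rather than baked into preprocessor_config.json.
frames = [np.random.randint(0, 256, (256, 320, 3), dtype=np.uint8) for _ in range(16)]
inputs = processor(frames, do_center_crop=False, return_tensors="pt")
print(inputs["pixel_values"].shape)  # resized per the config's size; no 224x224 crop
```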
training_args.bin CHANGED
@@ -1,3 +1,3 @@
  version https://git-lfs.github.com/spec/v1
- oid sha256:46a2e1e4777ae1c15e7d44624f1d1ea074a3e33fc19525a122ccf1b4669cb97e
- size 4728
+ oid sha256:395eb1ad1b9d276373380e3a1a22d522ce93275bb86ae6735c95352aea21b206
+ size 5048