ulisesbravo committed on Nov 26, 2024

Commit

41b26b3

verified ·

1 Parent(s): 020c1bb

Upload folder using huggingface_hub

Browse files

Files changed (18) hide show

README.md +36 -0
checkpoint-768/config.json +48 -0
checkpoint-768/model.safetensors +3 -0
checkpoint-768/optimizer.pt +3 -0
checkpoint-768/rng_state.pth +3 -0
checkpoint-768/scheduler.pt +3 -0
checkpoint-768/trainer_state.json +544 -0
checkpoint-768/training_args.bin +3 -0
config.json +48 -0
model.safetensors +3 -0
runs/Nov26_00-57-41_r-ulisesbravo-train-teste2-etn05s4x-fc8db-htf36/events.out.tfevents.1732582662.r-ulisesbravo-train-teste2-etn05s4x-fc8db-htf36.144.0 +2 -2
runs/Nov26_00-57-41_r-ulisesbravo-train-teste2-etn05s4x-fc8db-htf36/events.out.tfevents.1732603239.r-ulisesbravo-train-teste2-etn05s4x-fc8db-htf36.144.1 +3 -0
special_tokens_map.json +37 -0
tokenizer.json +0 -0
tokenizer_config.json +64 -0
training_args.bin +3 -0
training_params.json +30 -0
vocab.txt +0 -0

README.md ADDED Viewed

	@@ -0,0 +1,36 @@

+---
+tags:
+- autotrain
+- text-classification
+base_model: ulisesbravo/autotrain-BERTimbau-DGS-0001
+widget:
+- text: "I love AutoTrain"
+---
+# Model Trained Using AutoTrain
+- Problem type: Text Classification
+## Validation Metrics
+loss: 0.7617048025131226
+f1_macro: 0.7457262796719101
+f1_micro: 0.748046875
+f1_weighted: 0.7458152229876283
+precision_macro: 0.7510527252931124
+precision_micro: 0.748046875
+precision_weighted: 0.7510721957087751
+recall_macro: 0.7478964401294499
+recall_micro: 0.748046875
+recall_weighted: 0.748046875
+accuracy: 0.748046875

checkpoint-768/config.json ADDED Viewed

	@@ -0,0 +1,48 @@

+{
+  "_name_or_path": "ulisesbravo/autotrain-BERTimbau-DGS-0001",
+  "_num_labels": 5,
+  "architectures": [
+    "BertForSequenceClassification"
+  ],
+  "attention_probs_dropout_prob": 0.1,
+  "classifier_dropout": null,
+  "directionality": "bidi",
+  "hidden_act": "gelu",
+  "hidden_dropout_prob": 0.1,
+  "hidden_size": 768,
+  "id2label": {
+    "0": "1 - INTIMA\u00c7\u00c3O INICIAL",
+    "1": "2 - INTIMA\u00c7\u00c3O INSTRU\u00c7\u00c3O",
+    "2": "3 - INTIMA\u00c7\u00c3O RECURSAL",
+    "3": "4 - INTIMA\u00c7\u00c3O CUMPRIMENTO DE SENTEN\u00c7A",
+    "4": "5 - INTIMA\u00c7\u00c3O TR\u00c2NSITO"
+  },
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "label2id": {
+    "1 - INTIMA\u00c7\u00c3O INICIAL": 0,
+    "2 - INTIMA\u00c7\u00c3O INSTRU\u00c7\u00c3O": 1,
+    "3 - INTIMA\u00c7\u00c3O RECURSAL": 2,
+    "4 - INTIMA\u00c7\u00c3O CUMPRIMENTO DE SENTEN\u00c7A": 3,
+    "5 - INTIMA\u00c7\u00c3O TR\u00c2NSITO": 4
+  },
+  "layer_norm_eps": 1e-12,
+  "max_position_embeddings": 512,
+  "model_type": "bert",
+  "num_attention_heads": 12,
+  "num_hidden_layers": 12,
+  "output_past": true,
+  "pad_token_id": 0,
+  "pooler_fc_size": 768,
+  "pooler_num_attention_heads": 12,
+  "pooler_num_fc_layers": 3,
+  "pooler_size_per_head": 128,
+  "pooler_type": "first_token_transform",
+  "position_embedding_type": "absolute",
+  "problem_type": "single_label_classification",
+  "torch_dtype": "float32",
+  "transformers_version": "4.46.2",
+  "type_vocab_size": 2,
+  "use_cache": true,
+  "vocab_size": 29794
+}

checkpoint-768/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:51f8d08d02da34c510712efc366891b14d6bc355263f6ea4be2539dc7aef4b32
+size 435731452

checkpoint-768/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c1811deda59694839c504bf51aadd15afb803ab2035583eb5bfcbef589f0c1b6
+size 871578362

checkpoint-768/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:62e74b716758556f6ba31c1f5a2ccd12d8dd08fc7d5c9fa43acc5d86090e0175
+size 13990

checkpoint-768/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:350c3c48766c7873590e96de15f51186910dbfc3a3758c08a47def3fc7ba5b33
+size 1064

checkpoint-768/trainer_state.json ADDED Viewed

	@@ -0,0 +1,544 @@

+{
+  "best_metric": 0.7617048025131226,
+  "best_model_checkpoint": "autotrain-BERTimbau-DGS-0002/checkpoint-768",
+  "epoch": 3.0,
+  "eval_steps": 500,
+  "global_step": 768,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.046875,
+      "grad_norm": 16.356477737426758,
+      "learning_rate": 7.792207792207792e-06,
+      "loss": 0.9263,
+      "step": 12
+    },
+    {
+      "epoch": 0.09375,
+      "grad_norm": 16.417421340942383,
+      "learning_rate": 1.5584415584415583e-05,
+      "loss": 0.7481,
+      "step": 24
+    },
+    {
+      "epoch": 0.140625,
+      "grad_norm": 8.063264846801758,
+      "learning_rate": 2.3376623376623376e-05,
+      "loss": 0.6649,
+      "step": 36
+    },
+    {
+      "epoch": 0.1875,
+      "grad_norm": 20.237438201904297,
+      "learning_rate": 3.1168831168831166e-05,
+      "loss": 0.6951,
+      "step": 48
+    },
+    {
+      "epoch": 0.234375,
+      "grad_norm": 20.48522186279297,
+      "learning_rate": 3.8961038961038966e-05,
+      "loss": 0.7835,
+      "step": 60
+    },
+    {
+      "epoch": 0.28125,
+      "grad_norm": 18.863914489746094,
+      "learning_rate": 4.675324675324675e-05,
+      "loss": 0.8848,
+      "step": 72
+    },
+    {
+      "epoch": 0.328125,
+      "grad_norm": 44.188045501708984,
+      "learning_rate": 4.949348769898698e-05,
+      "loss": 0.7587,
+      "step": 84
+    },
+    {
+      "epoch": 0.375,
+      "grad_norm": 3.5654993057250977,
+      "learning_rate": 4.862518089725037e-05,
+      "loss": 0.8591,
+      "step": 96
+    },
+    {
+      "epoch": 0.421875,
+      "grad_norm": 14.715095520019531,
+      "learning_rate": 4.775687409551375e-05,
+      "loss": 1.0722,
+      "step": 108
+    },
+    {
+      "epoch": 0.46875,
+      "grad_norm": 24.525127410888672,
+      "learning_rate": 4.6888567293777135e-05,
+      "loss": 0.8705,
+      "step": 120
+    },
+    {
+      "epoch": 0.515625,
+      "grad_norm": 11.264841079711914,
+      "learning_rate": 4.6020260492040525e-05,
+      "loss": 0.725,
+      "step": 132
+    },
+    {
+      "epoch": 0.5625,
+      "grad_norm": 10.208191871643066,
+      "learning_rate": 4.515195369030391e-05,
+      "loss": 0.9423,
+      "step": 144
+    },
+    {
+      "epoch": 0.609375,
+      "grad_norm": 36.85372543334961,
+      "learning_rate": 4.42836468885673e-05,
+      "loss": 0.6916,
+      "step": 156
+    },
+    {
+      "epoch": 0.65625,
+      "grad_norm": 10.57655143737793,
+      "learning_rate": 4.341534008683068e-05,
+      "loss": 0.9208,
+      "step": 168
+    },
+    {
+      "epoch": 0.703125,
+      "grad_norm": 8.791451454162598,
+      "learning_rate": 4.2547033285094066e-05,
+      "loss": 0.7232,
+      "step": 180
+    },
+    {
+      "epoch": 0.75,
+      "grad_norm": 3.045738697052002,
+      "learning_rate": 4.1678726483357456e-05,
+      "loss": 0.8408,
+      "step": 192
+    },
+    {
+      "epoch": 0.796875,
+      "grad_norm": 10.673927307128906,
+      "learning_rate": 4.081041968162084e-05,
+      "loss": 0.8796,
+      "step": 204
+    },
+    {
+      "epoch": 0.84375,
+      "grad_norm": 25.335668563842773,
+      "learning_rate": 3.994211287988423e-05,
+      "loss": 0.6581,
+      "step": 216
+    },
+    {
+      "epoch": 0.890625,
+      "grad_norm": 14.630143165588379,
+      "learning_rate": 3.9073806078147614e-05,
+      "loss": 0.8087,
+      "step": 228
+    },
+    {
+      "epoch": 0.9375,
+      "grad_norm": 10.134491920471191,
+      "learning_rate": 3.8205499276411e-05,
+      "loss": 0.7872,
+      "step": 240
+    },
+    {
+      "epoch": 0.984375,
+      "grad_norm": 9.269867897033691,
+      "learning_rate": 3.733719247467439e-05,
+      "loss": 0.817,
+      "step": 252
+    },
+    {
+      "epoch": 1.0,
+      "eval_accuracy": 0.703125,
+      "eval_f1_macro": 0.695547181551088,
+      "eval_f1_micro": 0.703125,
+      "eval_f1_weighted": 0.6955464487515762,
+      "eval_loss": 0.8037577867507935,
+      "eval_precision_macro": 0.7208504141314569,
+      "eval_precision_micro": 0.703125,
+      "eval_precision_weighted": 0.721030433935127,
+      "eval_recall_macro": 0.7032362459546926,
+      "eval_recall_micro": 0.703125,
+      "eval_recall_weighted": 0.703125,
+      "eval_runtime": 433.339,
+      "eval_samples_per_second": 1.182,
+      "eval_steps_per_second": 0.074,
+      "step": 256
+    },
+    {
+      "epoch": 1.03125,
+      "grad_norm": 18.80913543701172,
+      "learning_rate": 3.646888567293778e-05,
+      "loss": 0.9221,
+      "step": 264
+    },
+    {
+      "epoch": 1.078125,
+      "grad_norm": 17.218036651611328,
+      "learning_rate": 3.5600578871201154e-05,
+      "loss": 0.6136,
+      "step": 276
+    },
+    {
+      "epoch": 1.125,
+      "grad_norm": 11.861041069030762,
+      "learning_rate": 3.4732272069464545e-05,
+      "loss": 0.691,
+      "step": 288
+    },
+    {
+      "epoch": 1.171875,
+      "grad_norm": 13.683526992797852,
+      "learning_rate": 3.3863965267727935e-05,
+      "loss": 0.633,
+      "step": 300
+    },
+    {
+      "epoch": 1.21875,
+      "grad_norm": 4.825338840484619,
+      "learning_rate": 3.299565846599132e-05,
+      "loss": 0.4653,
+      "step": 312
+    },
+    {
+      "epoch": 1.265625,
+      "grad_norm": 25.25005531311035,
+      "learning_rate": 3.212735166425471e-05,
+      "loss": 0.8424,
+      "step": 324
+    },
+    {
+      "epoch": 1.3125,
+      "grad_norm": 6.728404998779297,
+      "learning_rate": 3.1259044862518086e-05,
+      "loss": 0.5561,
+      "step": 336
+    },
+    {
+      "epoch": 1.359375,
+      "grad_norm": 25.705286026000977,
+      "learning_rate": 3.0390738060781476e-05,
+      "loss": 0.6089,
+      "step": 348
+    },
+    {
+      "epoch": 1.40625,
+      "grad_norm": 9.829946517944336,
+      "learning_rate": 2.9522431259044863e-05,
+      "loss": 0.7743,
+      "step": 360
+    },
+    {
+      "epoch": 1.453125,
+      "grad_norm": 18.433866500854492,
+      "learning_rate": 2.865412445730825e-05,
+      "loss": 0.6377,
+      "step": 372
+    },
+    {
+      "epoch": 1.5,
+      "grad_norm": 8.541472434997559,
+      "learning_rate": 2.778581765557164e-05,
+      "loss": 0.5226,
+      "step": 384
+    },
+    {
+      "epoch": 1.546875,
+      "grad_norm": 5.109964847564697,
+      "learning_rate": 2.691751085383502e-05,
+      "loss": 0.6857,
+      "step": 396
+    },
+    {
+      "epoch": 1.59375,
+      "grad_norm": 16.345888137817383,
+      "learning_rate": 2.6049204052098407e-05,
+      "loss": 0.7348,
+      "step": 408
+    },
+    {
+      "epoch": 1.640625,
+      "grad_norm": 2.8149545192718506,
+      "learning_rate": 2.5180897250361797e-05,
+      "loss": 0.5388,
+      "step": 420
+    },
+    {
+      "epoch": 1.6875,
+      "grad_norm": 25.609724044799805,
+      "learning_rate": 2.4312590448625184e-05,
+      "loss": 0.6311,
+      "step": 432
+    },
+    {
+      "epoch": 1.734375,
+      "grad_norm": 18.137908935546875,
+      "learning_rate": 2.3444283646888568e-05,
+      "loss": 0.5373,
+      "step": 444
+    },
+    {
+      "epoch": 1.78125,
+      "grad_norm": 20.912015914916992,
+      "learning_rate": 2.2575976845151954e-05,
+      "loss": 0.5749,
+      "step": 456
+    },
+    {
+      "epoch": 1.828125,
+      "grad_norm": 3.7946367263793945,
+      "learning_rate": 2.170767004341534e-05,
+      "loss": 0.4923,
+      "step": 468
+    },
+    {
+      "epoch": 1.875,
+      "grad_norm": 4.118808269500732,
+      "learning_rate": 2.0839363241678728e-05,
+      "loss": 0.5086,
+      "step": 480
+    },
+    {
+      "epoch": 1.921875,
+      "grad_norm": 24.049333572387695,
+      "learning_rate": 1.9971056439942115e-05,
+      "loss": 0.5282,
+      "step": 492
+    },
+    {
+      "epoch": 1.96875,
+      "grad_norm": 6.969969272613525,
+      "learning_rate": 1.91027496382055e-05,
+      "loss": 0.7777,
+      "step": 504
+    },
+    {
+      "epoch": 2.0,
+      "eval_accuracy": 0.73828125,
+      "eval_f1_macro": 0.7360418623759021,
+      "eval_f1_micro": 0.73828125,
+      "eval_f1_weighted": 0.7360378486320622,
+      "eval_loss": 0.7803243398666382,
+      "eval_precision_macro": 0.750415606846448,
+      "eval_precision_micro": 0.73828125,
+      "eval_precision_weighted": 0.7504776910198645,
+      "eval_recall_macro": 0.7383399961926519,
+      "eval_recall_micro": 0.73828125,
+      "eval_recall_weighted": 0.73828125,
+      "eval_runtime": 436.6228,
+      "eval_samples_per_second": 1.173,
+      "eval_steps_per_second": 0.073,
+      "step": 512
+    },
+    {
+      "epoch": 2.015625,
+      "grad_norm": 28.933380126953125,
+      "learning_rate": 1.823444283646889e-05,
+      "loss": 0.5839,
+      "step": 516
+    },
+    {
+      "epoch": 2.0625,
+      "grad_norm": 2.4092745780944824,
+      "learning_rate": 1.7366136034732272e-05,
+      "loss": 0.3359,
+      "step": 528
+    },
+    {
+      "epoch": 2.109375,
+      "grad_norm": 9.090546607971191,
+      "learning_rate": 1.649782923299566e-05,
+      "loss": 0.4643,
+      "step": 540
+    },
+    {
+      "epoch": 2.15625,
+      "grad_norm": 21.722578048706055,
+      "learning_rate": 1.5629522431259043e-05,
+      "loss": 0.4644,
+      "step": 552
+    },
+    {
+      "epoch": 2.203125,
+      "grad_norm": 5.349146842956543,
+      "learning_rate": 1.4761215629522431e-05,
+      "loss": 0.5075,
+      "step": 564
+    },
+    {
+      "epoch": 2.25,
+      "grad_norm": 6.464962482452393,
+      "learning_rate": 1.389290882778582e-05,
+      "loss": 0.2939,
+      "step": 576
+    },
+    {
+      "epoch": 2.296875,
+      "grad_norm": 32.128089904785156,
+      "learning_rate": 1.3024602026049203e-05,
+      "loss": 0.4584,
+      "step": 588
+    },
+    {
+      "epoch": 2.34375,
+      "grad_norm": 6.097667694091797,
+      "learning_rate": 1.2156295224312592e-05,
+      "loss": 0.6406,
+      "step": 600
+    },
+    {
+      "epoch": 2.390625,
+      "grad_norm": 19.716564178466797,
+      "learning_rate": 1.1287988422575977e-05,
+      "loss": 0.4642,
+      "step": 612
+    },
+    {
+      "epoch": 2.4375,
+      "grad_norm": 29.19405174255371,
+      "learning_rate": 1.0419681620839364e-05,
+      "loss": 0.3899,
+      "step": 624
+    },
+    {
+      "epoch": 2.484375,
+      "grad_norm": 16.421785354614258,
+      "learning_rate": 9.55137481910275e-06,
+      "loss": 0.4938,
+      "step": 636
+    },
+    {
+      "epoch": 2.53125,
+      "grad_norm": 21.284482955932617,
+      "learning_rate": 8.683068017366136e-06,
+      "loss": 0.419,
+      "step": 648
+    },
+    {
+      "epoch": 2.578125,
+      "grad_norm": 38.47277069091797,
+      "learning_rate": 7.814761215629521e-06,
+      "loss": 0.4105,
+      "step": 660
+    },
+    {
+      "epoch": 2.625,
+      "grad_norm": 43.99268341064453,
+      "learning_rate": 6.94645441389291e-06,
+      "loss": 0.4791,
+      "step": 672
+    },
+    {
+      "epoch": 2.671875,
+      "grad_norm": 24.28075408935547,
+      "learning_rate": 6.078147612156296e-06,
+      "loss": 0.4125,
+      "step": 684
+    },
+    {
+      "epoch": 2.71875,
+      "grad_norm": 39.111759185791016,
+      "learning_rate": 5.209840810419682e-06,
+      "loss": 0.7284,
+      "step": 696
+    },
+    {
+      "epoch": 2.765625,
+      "grad_norm": 12.080262184143066,
+      "learning_rate": 4.341534008683068e-06,
+      "loss": 0.3698,
+      "step": 708
+    },
+    {
+      "epoch": 2.8125,
+      "grad_norm": 10.01552677154541,
+      "learning_rate": 3.473227206946455e-06,
+      "loss": 0.5005,
+      "step": 720
+    },
+    {
+      "epoch": 2.859375,
+      "grad_norm": 7.803253173828125,
+      "learning_rate": 2.604920405209841e-06,
+      "loss": 0.5321,
+      "step": 732
+    },
+    {
+      "epoch": 2.90625,
+      "grad_norm": 8.892068862915039,
+      "learning_rate": 1.7366136034732275e-06,
+      "loss": 0.6087,
+      "step": 744
+    },
+    {
+      "epoch": 2.953125,
+      "grad_norm": 1.938845157623291,
+      "learning_rate": 8.683068017366137e-07,
+      "loss": 0.535,
+      "step": 756
+    },
+    {
+      "epoch": 3.0,
+      "grad_norm": 4.535564422607422,
+      "learning_rate": 0.0,
+      "loss": 0.2496,
+      "step": 768
+    },
+    {
+      "epoch": 3.0,
+      "eval_accuracy": 0.748046875,
+      "eval_f1_macro": 0.7457262796719101,
+      "eval_f1_micro": 0.748046875,
+      "eval_f1_weighted": 0.7458152229876283,
+      "eval_loss": 0.7617048025131226,
+      "eval_precision_macro": 0.7510527252931124,
+      "eval_precision_micro": 0.748046875,
+      "eval_precision_weighted": 0.7510721957087751,
+      "eval_recall_macro": 0.7478964401294499,
+      "eval_recall_micro": 0.748046875,
+      "eval_recall_weighted": 0.748046875,
+      "eval_runtime": 444.9594,
+      "eval_samples_per_second": 1.151,
+      "eval_steps_per_second": 0.072,
+      "step": 768
+    }
+  ],
+  "logging_steps": 12,
+  "max_steps": 768,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 3,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "EarlyStoppingCallback": {
+      "args": {
+        "early_stopping_patience": 5,
+        "early_stopping_threshold": 0.01
+      },
+      "attributes": {
+        "early_stopping_patience_counter": 0
+      }
+    },
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": true,
+        "should_training_stop": true
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 1616597867298816.0,
+  "train_batch_size": 8,
+  "trial_name": null,
+  "trial_params": null
+}

checkpoint-768/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d006918cf2f8dc18dbdd7564d8e622357e45f4b2fe2cfe7a8e7fe12fa3640c98
+size 5304

config.json ADDED Viewed

	@@ -0,0 +1,48 @@

+{
+  "_name_or_path": "ulisesbravo/autotrain-BERTimbau-DGS-0001",
+  "_num_labels": 5,
+  "architectures": [
+    "BertForSequenceClassification"
+  ],
+  "attention_probs_dropout_prob": 0.1,
+  "classifier_dropout": null,
+  "directionality": "bidi",
+  "hidden_act": "gelu",
+  "hidden_dropout_prob": 0.1,
+  "hidden_size": 768,
+  "id2label": {
+    "0": "1 - INTIMA\u00c7\u00c3O INICIAL",
+    "1": "2 - INTIMA\u00c7\u00c3O INSTRU\u00c7\u00c3O",
+    "2": "3 - INTIMA\u00c7\u00c3O RECURSAL",
+    "3": "4 - INTIMA\u00c7\u00c3O CUMPRIMENTO DE SENTEN\u00c7A",
+    "4": "5 - INTIMA\u00c7\u00c3O TR\u00c2NSITO"
+  },
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "label2id": {
+    "1 - INTIMA\u00c7\u00c3O INICIAL": 0,
+    "2 - INTIMA\u00c7\u00c3O INSTRU\u00c7\u00c3O": 1,
+    "3 - INTIMA\u00c7\u00c3O RECURSAL": 2,
+    "4 - INTIMA\u00c7\u00c3O CUMPRIMENTO DE SENTEN\u00c7A": 3,
+    "5 - INTIMA\u00c7\u00c3O TR\u00c2NSITO": 4
+  },
+  "layer_norm_eps": 1e-12,
+  "max_position_embeddings": 512,
+  "model_type": "bert",
+  "num_attention_heads": 12,
+  "num_hidden_layers": 12,
+  "output_past": true,
+  "pad_token_id": 0,
+  "pooler_fc_size": 768,
+  "pooler_num_attention_heads": 12,
+  "pooler_num_fc_layers": 3,
+  "pooler_size_per_head": 128,
+  "pooler_type": "first_token_transform",
+  "position_embedding_type": "absolute",
+  "problem_type": "single_label_classification",
+  "torch_dtype": "float32",
+  "transformers_version": "4.46.2",
+  "type_vocab_size": 2,
+  "use_cache": true,
+  "vocab_size": 29794
+}

model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:51f8d08d02da34c510712efc366891b14d6bc355263f6ea4be2539dc7aef4b32
+size 435731452

runs/Nov26_00-57-41_r-ulisesbravo-train-teste2-etn05s4x-fc8db-htf36/events.out.tfevents.1732582662.r-ulisesbravo-train-teste2-etn05s4x-fc8db-htf36.144.0 CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:6ec0d2c5bcbddd561b89d40b339d160da69cdeabaa9461d08c6ad4bb3c031458
-size 20884

 version https://git-lfs.github.com/spec/v1
+oid sha256:c481768b97781055eea340ddbf7023627ce64d8b4f824983422642784c99673d
+size 22282

runs/Nov26_00-57-41_r-ulisesbravo-train-teste2-etn05s4x-fc8db-htf36/events.out.tfevents.1732603239.r-ulisesbravo-train-teste2-etn05s4x-fc8db-htf36.144.1 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3e91207b7e4b9c077d1a46728b1dfbde39bc118df59ed3dc224702ab9b3ee937
+size 921

special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,37 @@

+{
+  "cls_token": {
+    "content": "[CLS]",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "mask_token": {
+    "content": "[MASK]",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "pad_token": {
+    "content": "[PAD]",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "sep_token": {
+    "content": "[SEP]",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "unk_token": {
+    "content": "[UNK]",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  }
+}

tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,64 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": false,
+  "cls_token": "[CLS]",
+  "do_basic_tokenize": true,
+  "do_lower_case": false,
+  "mask_token": "[MASK]",
+  "max_length": 512,
+  "model_max_length": 1000000000000000019884624838656,
+  "never_split": null,
+  "pad_to_multiple_of": null,
+  "pad_token": "[PAD]",
+  "pad_token_type_id": 0,
+  "padding_side": "right",
+  "sep_token": "[SEP]",
+  "stride": 0,
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "BertTokenizer",
+  "truncation_side": "right",
+  "truncation_strategy": "longest_first",
+  "unk_token": "[UNK]"
+}

training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d006918cf2f8dc18dbdd7564d8e622357e45f4b2fe2cfe7a8e7fe12fa3640c98
+size 5304

training_params.json ADDED Viewed

	@@ -0,0 +1,30 @@

+{
+    "data_path": "autotrain-BERTimbau-DGS-0002/autotrain-data",
+    "model": "ulisesbravo/autotrain-BERTimbau-DGS-0001",
+    "lr": 5e-05,
+    "epochs": 3,
+    "max_seq_length": 512,
+    "batch_size": 8,
+    "warmup_ratio": 0.1,
+    "gradient_accumulation": 1,
+    "optimizer": "adamw_torch",
+    "scheduler": "linear",
+    "weight_decay": 0.0,
+    "max_grad_norm": 1.0,
+    "seed": 42,
+    "train_split": "train",
+    "valid_split": "validation",
+    "text_column": "autotrain_text",
+    "target_column": "autotrain_label",
+    "logging_steps": -1,
+    "project_name": "autotrain-BERTimbau-DGS-0002",
+    "auto_find_batch_size": false,
+    "mixed_precision": "fp16",
+    "save_total_limit": 1,
+    "push_to_hub": true,
+    "eval_strategy": "epoch",
+    "username": "ulisesbravo",
+    "log": "tensorboard",
+    "early_stopping_patience": 5,
+    "early_stopping_threshold": 0.01
+}

vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff