labicquette committed on Mar 15, 2024

Commit

2eccdea

•

1 Parent(s): 0e97feb

upload model

Browse files

Files changed (24) hide show

almanach_camembert-base-ft-BUILD/almanach_camembert-base-ft-BUILD-best/added_tokens.json +3 -0
almanach_camembert-base-ft-BUILD/almanach_camembert-base-ft-BUILD-best/config.json +39 -0
almanach_camembert-base-ft-BUILD/almanach_camembert-base-ft-BUILD-best/model.safetensors +3 -0
almanach_camembert-base-ft-BUILD/almanach_camembert-base-ft-BUILD-best/sentencepiece.bpe.model +3 -0
almanach_camembert-base-ft-BUILD/almanach_camembert-base-ft-BUILD-best/special_tokens_map.json +20 -0
almanach_camembert-base-ft-BUILD/almanach_camembert-base-ft-BUILD-best/tokenizer.json +0 -0
almanach_camembert-base-ft-BUILD/almanach_camembert-base-ft-BUILD-best/tokenizer_config.json +85 -0
almanach_camembert-base-ft-BUILD/almanach_camembert-base-ft-BUILD-best/training_args.bin +3 -0
almanach_camembert-base-ft-BUILD/checkpoint-1248/config.json +39 -0
almanach_camembert-base-ft-BUILD/checkpoint-1248/model.safetensors +3 -0
almanach_camembert-base-ft-BUILD/checkpoint-1248/optimizer.pt +3 -0
almanach_camembert-base-ft-BUILD/checkpoint-1248/rng_state.pth +3 -0
almanach_camembert-base-ft-BUILD/checkpoint-1248/scheduler.pt +3 -0
almanach_camembert-base-ft-BUILD/checkpoint-1248/trainer_state.json +79 -0
almanach_camembert-base-ft-BUILD/checkpoint-1248/training_args.bin +3 -0
almanach_camembert-base-ft-BUILD/checkpoint-624/config.json +39 -0
almanach_camembert-base-ft-BUILD/checkpoint-624/model.safetensors +3 -0
almanach_camembert-base-ft-BUILD/checkpoint-624/optimizer.pt +3 -0
almanach_camembert-base-ft-BUILD/checkpoint-624/rng_state.pth +3 -0
almanach_camembert-base-ft-BUILD/checkpoint-624/scheduler.pt +3 -0
almanach_camembert-base-ft-BUILD/checkpoint-624/trainer_state.json +50 -0
almanach_camembert-base-ft-BUILD/checkpoint-624/training_args.bin +3 -0
almanach_camembert-base-ft-BUILD/logs/events.out.tfevents.1710352452.DESKTOP-VOM7ARG.16588.0 +3 -0
almanach_camembert-base-ft-BUILD/logs/events.out.tfevents.1710356063.DESKTOP-VOM7ARG.42033.0 +3 -0

almanach_camembert-base-ft-BUILD/almanach_camembert-base-ft-BUILD-best/added_tokens.json ADDED Viewed

	@@ -0,0 +1,3 @@

+{
+  "<unk>NOTUSED": 32005
+}

almanach_camembert-base-ft-BUILD/almanach_camembert-base-ft-BUILD-best/config.json ADDED Viewed

	@@ -0,0 +1,39 @@

+{
+  "_name_or_path": "almanach/camembert-base",
+  "architectures": [
+    "CamembertForSequenceClassification"
+  ],
+  "attention_probs_dropout_prob": 0.1,
+  "bos_token_id": 5,
+  "classifier_dropout": null,
+  "eos_token_id": 6,
+  "hidden_act": "gelu",
+  "hidden_dropout_prob": 0.1,
+  "hidden_size": 768,
+  "id2label": {
+    "0": "Entr\u00e9e",
+    "1": "Plat principal",
+    "2": "Dessert"
+  },
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "label2id": {
+    "Dessert": 2,
+    "Entr\u00e9e": 0,
+    "Plat principal": 1
+  },
+  "layer_norm_eps": 1e-05,
+  "max_position_embeddings": 514,
+  "model_type": "camembert",
+  "num_attention_heads": 12,
+  "num_hidden_layers": 12,
+  "output_past": true,
+  "pad_token_id": 1,
+  "position_embedding_type": "absolute",
+  "problem_type": "single_label_classification",
+  "torch_dtype": "float32",
+  "transformers_version": "4.36.1",
+  "type_vocab_size": 1,
+  "use_cache": true,
+  "vocab_size": 32005
+}

almanach_camembert-base-ft-BUILD/almanach_camembert-base-ft-BUILD-best/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:37cfb8976ca3087b13c65a9a7eb5c3f53f6caa177276fa581d8c05ad1404ad37
+size 442521180

almanach_camembert-base-ft-BUILD/almanach_camembert-base-ft-BUILD-best/sentencepiece.bpe.model ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:988bc5a00281c6d210a5d34bd143d0363741a432fefe741bf71e61b1869d4314
+size 810912

almanach_camembert-base-ft-BUILD/almanach_camembert-base-ft-BUILD-best/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,20 @@

+{
+  "additional_special_tokens": [
+    "<s>NOTUSED",
+    "</s>NOTUSED",
+    "<unk>NOTUSED"
+  ],
+  "bos_token": "<s>",
+  "cls_token": "<s>",
+  "eos_token": "</s>",
+  "mask_token": {
+    "content": "<mask>",
+    "lstrip": true,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "pad_token": "<pad>",
+  "sep_token": "</s>",
+  "unk_token": "<unk>"
+}

almanach_camembert-base-ft-BUILD/almanach_camembert-base-ft-BUILD-best/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

almanach_camembert-base-ft-BUILD/almanach_camembert-base-ft-BUILD-best/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,85 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "<s>NOTUSED",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "1": {
+      "content": "<pad>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "2": {
+      "content": "</s>NOTUSED",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "4": {
+      "content": "<unk>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "5": {
+      "content": "<s>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "6": {
+      "content": "</s>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "32004": {
+      "content": "<mask>",
+      "lstrip": true,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "32005": {
+      "content": "<unk>NOTUSED",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "additional_special_tokens": [
+    "<s>NOTUSED",
+    "</s>NOTUSED",
+    "<unk>NOTUSED"
+  ],
+  "bos_token": "<s>",
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "<s>",
+  "eos_token": "</s>",
+  "mask_token": "<mask>",
+  "model_max_length": 512,
+  "pad_token": "<pad>",
+  "padding": "max_length",
+  "sep_token": "</s>",
+  "tokenizer_class": "CamembertTokenizer",
+  "truncation": true,
+  "unk_token": "<unk>"
+}

almanach_camembert-base-ft-BUILD/almanach_camembert-base-ft-BUILD-best/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9ea323feb777171b1e19c143df6d74de920adacfecf00b62ff7d79acbe08d5cb
+size 4792

almanach_camembert-base-ft-BUILD/checkpoint-1248/config.json ADDED Viewed

	@@ -0,0 +1,39 @@

+{
+  "_name_or_path": "almanach/camembert-base",
+  "architectures": [
+    "CamembertForSequenceClassification"
+  ],
+  "attention_probs_dropout_prob": 0.1,
+  "bos_token_id": 5,
+  "classifier_dropout": null,
+  "eos_token_id": 6,
+  "hidden_act": "gelu",
+  "hidden_dropout_prob": 0.1,
+  "hidden_size": 768,
+  "id2label": {
+    "0": "Entr\u00e9e",
+    "1": "Plat principal",
+    "2": "Dessert"
+  },
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "label2id": {
+    "Dessert": 2,
+    "Entr\u00e9e": 0,
+    "Plat principal": 1
+  },
+  "layer_norm_eps": 1e-05,
+  "max_position_embeddings": 514,
+  "model_type": "camembert",
+  "num_attention_heads": 12,
+  "num_hidden_layers": 12,
+  "output_past": true,
+  "pad_token_id": 1,
+  "position_embedding_type": "absolute",
+  "problem_type": "single_label_classification",
+  "torch_dtype": "float32",
+  "transformers_version": "4.36.1",
+  "type_vocab_size": 1,
+  "use_cache": true,
+  "vocab_size": 32005
+}

almanach_camembert-base-ft-BUILD/checkpoint-1248/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:1b2463c7b907b5086243fa8f3d67f8ba80f4b42aadeeb3e41b7dc540e1009bd6
+size 442521180

almanach_camembert-base-ft-BUILD/checkpoint-1248/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a6c2641f538bb57edfbec4b176fdb2676fb0978e1d5184c64724d8e9e0ea804d
+size 885162234

almanach_camembert-base-ft-BUILD/checkpoint-1248/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a9051d5c762bfe1d4b2b94f0fcdff0b687d75db7bf89e2a18676bb4bedb74332
+size 14244

almanach_camembert-base-ft-BUILD/checkpoint-1248/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:1dc7306e6fc72ea98c143e28f6b732bcca62fd175d4eec363f5176463773dc58
+size 1064

almanach_camembert-base-ft-BUILD/checkpoint-1248/trainer_state.json ADDED Viewed

	@@ -0,0 +1,79 @@

+{
+  "best_metric": 0.8732301150631039,
+  "best_model_checkpoint": "./models/camembert-base/almanach_camembert-base-ft-BUILD/checkpoint-1248",
+  "epoch": 2.0,
+  "eval_steps": 500,
+  "global_step": 1248,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.32,
+      "learning_rate": 2e-05,
+      "loss": 0.8361,
+      "step": 200
+    },
+    {
+      "epoch": 0.64,
+      "learning_rate": 4e-05,
+      "loss": 0.3948,
+      "step": 400
+    },
+    {
+      "epoch": 0.96,
+      "learning_rate": 4.9128919860627184e-05,
+      "loss": 0.3576,
+      "step": 600
+    },
+    {
+      "epoch": 1.0,
+      "eval_f1": 0.8681621844300148,
+      "eval_loss": 0.3254093825817108,
+      "eval_p": 0.869921888637574,
+      "eval_r": 0.8713942307692307,
+      "eval_runtime": 343.7765,
+      "eval_samples_per_second": 7.261,
+      "eval_steps_per_second": 0.454,
+      "step": 624
+    },
+    {
+      "epoch": 1.28,
+      "learning_rate": 4.7386759581881534e-05,
+      "loss": 0.3094,
+      "step": 800
+    },
+    {
+      "epoch": 1.6,
+      "learning_rate": 4.564459930313589e-05,
+      "loss": 0.293,
+      "step": 1000
+    },
+    {
+      "epoch": 1.92,
+      "learning_rate": 4.390243902439025e-05,
+      "loss": 0.3123,
+      "step": 1200
+    },
+    {
+      "epoch": 2.0,
+      "eval_f1": 0.8732301150631039,
+      "eval_loss": 0.3346249461174011,
+      "eval_p": 0.8730534836267592,
+      "eval_r": 0.8754006410256411,
+      "eval_runtime": 196.1779,
+      "eval_samples_per_second": 12.723,
+      "eval_steps_per_second": 0.795,
+      "step": 1248
+    }
+  ],
+  "logging_steps": 200,
+  "max_steps": 6240,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 10,
+  "save_steps": 500,
+  "total_flos": 5250165137344512.0,
+  "train_batch_size": 16,
+  "trial_name": null,
+  "trial_params": null
+}

almanach_camembert-base-ft-BUILD/checkpoint-1248/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9ea323feb777171b1e19c143df6d74de920adacfecf00b62ff7d79acbe08d5cb
+size 4792

almanach_camembert-base-ft-BUILD/checkpoint-624/config.json ADDED Viewed

	@@ -0,0 +1,39 @@

+{
+  "_name_or_path": "almanach/camembert-base",
+  "architectures": [
+    "CamembertForSequenceClassification"
+  ],
+  "attention_probs_dropout_prob": 0.1,
+  "bos_token_id": 5,
+  "classifier_dropout": null,
+  "eos_token_id": 6,
+  "hidden_act": "gelu",
+  "hidden_dropout_prob": 0.1,
+  "hidden_size": 768,
+  "id2label": {
+    "0": "Entr\u00e9e",
+    "1": "Plat principal",
+    "2": "Dessert"
+  },
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "label2id": {
+    "Dessert": 2,
+    "Entr\u00e9e": 0,
+    "Plat principal": 1
+  },
+  "layer_norm_eps": 1e-05,
+  "max_position_embeddings": 514,
+  "model_type": "camembert",
+  "num_attention_heads": 12,
+  "num_hidden_layers": 12,
+  "output_past": true,
+  "pad_token_id": 1,
+  "position_embedding_type": "absolute",
+  "problem_type": "single_label_classification",
+  "torch_dtype": "float32",
+  "transformers_version": "4.36.1",
+  "type_vocab_size": 1,
+  "use_cache": true,
+  "vocab_size": 32005
+}

almanach_camembert-base-ft-BUILD/checkpoint-624/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7a0e8e0a5309ecdc790d0817fdd536f16baa5fbe1ff12995098091e0a5298ff2
+size 442521180

almanach_camembert-base-ft-BUILD/checkpoint-624/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:98e58ecb3c1caea3d1a4e1f3dfd22d588a62c87574136f210de165be2dfccf35
+size 885162234

almanach_camembert-base-ft-BUILD/checkpoint-624/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c5fe3c8b5b99829df69895c8004712171fbe98a2971c17b9adae1f54c9b19f9d
+size 14244

almanach_camembert-base-ft-BUILD/checkpoint-624/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c6f9ff747d8beb685f79f4af8347a7c784b50d8d31b2c1338a54956825c2a57b
+size 1064

almanach_camembert-base-ft-BUILD/checkpoint-624/trainer_state.json ADDED Viewed

	@@ -0,0 +1,50 @@

+{
+  "best_metric": 0.8681621844300148,
+  "best_model_checkpoint": "./models/camembert-base/almanach_camembert-base-ft-BUILD/checkpoint-624",
+  "epoch": 1.0,
+  "eval_steps": 500,
+  "global_step": 624,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.32,
+      "learning_rate": 2e-05,
+      "loss": 0.8361,
+      "step": 200
+    },
+    {
+      "epoch": 0.64,
+      "learning_rate": 4e-05,
+      "loss": 0.3948,
+      "step": 400
+    },
+    {
+      "epoch": 0.96,
+      "learning_rate": 4.9128919860627184e-05,
+      "loss": 0.3576,
+      "step": 600
+    },
+    {
+      "epoch": 1.0,
+      "eval_f1": 0.8681621844300148,
+      "eval_loss": 0.3254093825817108,
+      "eval_p": 0.869921888637574,
+      "eval_r": 0.8713942307692307,
+      "eval_runtime": 343.7765,
+      "eval_samples_per_second": 7.261,
+      "eval_steps_per_second": 0.454,
+      "step": 624
+    }
+  ],
+  "logging_steps": 200,
+  "max_steps": 6240,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 10,
+  "save_steps": 500,
+  "total_flos": 2625082568672256.0,
+  "train_batch_size": 16,
+  "trial_name": null,
+  "trial_params": null
+}

almanach_camembert-base-ft-BUILD/checkpoint-624/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9ea323feb777171b1e19c143df6d74de920adacfecf00b62ff7d79acbe08d5cb
+size 4792

almanach_camembert-base-ft-BUILD/logs/events.out.tfevents.1710352452.DESKTOP-VOM7ARG.16588.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:cca3b062181cffa99ccb5186d6edd8e318a717fa7b8e28b6faaec6590d59f9e5
+size 7341

almanach_camembert-base-ft-BUILD/logs/events.out.tfevents.1710356063.DESKTOP-VOM7ARG.42033.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:1ed714f64e8ba3193c6adf5748f5d025161580f7e2a431ccf20c35000b75f7b8
+size 11364