Training in progress epoch 0

Browse files

Files changed (6) hide show

README.md +6 -15
config.json +8 -1
tf_model.h5 +1 -1
tokenizer.json +0 -0
tokenizer_config.json +113 -105
vocab.txt +0 -0

README.md CHANGED Viewed

@@ -1,5 +1,5 @@
 ---
-base_model: aubmindlab/bert-base-arabertv2
 tags:
 - generated_from_keras_callback
 model-index:
@@ -12,11 +12,11 @@ probably proofread and complete it, then remove this comment. -->
 # NourMohamed91/v_model
-This model is a fine-tuned version of [aubmindlab/bert-base-arabertv2](https://huggingface.co/aubmindlab/bert-base-arabertv2) on an unknown dataset.
 It achieves the following results on the evaluation set:
-- Train Loss: 0.0860
-- Validation Loss: 0.0561
-- Epoch: 9
 ## Model description
@@ -42,16 +42,7 @@ The following hyperparameters were used during training:
 | Train Loss | Validation Loss | Epoch |
 |:----------:|:---------------:|:-----:|
-| 4.4674     | 2.8440          | 0     |
-| 1.7610     | 0.5503          | 1     |
-| 0.4084     | 0.1634          | 2     |
-| 0.2088     | 0.1181          | 3     |
-| 0.1409     | 0.0843          | 4     |
-| 0.1130     | 0.0592          | 5     |
-| 0.1097     | 0.0590          | 6     |
-| 0.0911     | 0.0517          | 7     |
-| 0.0896     | 0.0568          | 8     |
-| 0.0860     | 0.0561          | 9     |
 ### Framework versions

 ---
+base_model: gp-tar4/QA_FineTuned_Arabert
 tags:
 - generated_from_keras_callback
 model-index:
 # NourMohamed91/v_model
+This model is a fine-tuned version of [gp-tar4/QA_FineTuned_Arabert](https://huggingface.co/gp-tar4/QA_FineTuned_Arabert) on an unknown dataset.
 It achieves the following results on the evaluation set:
+- Train Loss: 1.9933
+- Validation Loss: 0.2847
+- Epoch: 0
 ## Model description
 | Train Loss | Validation Loss | Epoch |
 |:----------:|:---------------:|:-----:|
+| 1.9933     | 0.2847          | 0     |
 ### Framework versions

config.json CHANGED Viewed

@@ -1,10 +1,11 @@
 {
-  "_name_or_path": "aubmindlab/bert-base-arabertv2",
   "architectures": [
     "BertForQuestionAnswering"
   ],
   "attention_probs_dropout_prob": 0.1,
   "classifier_dropout": null,
   "hidden_act": "gelu",
   "hidden_dropout_prob": 0.1,
   "hidden_size": 768,
@@ -16,7 +17,13 @@
   "num_attention_heads": 12,
   "num_hidden_layers": 12,
   "pad_token_id": 0,
   "position_embedding_type": "absolute",
   "transformers_version": "4.41.0",
   "type_vocab_size": 2,
   "use_cache": true,

 {
+  "_name_or_path": "gp-tar4/QA_FineTuned_Arabert",
   "architectures": [
     "BertForQuestionAnswering"
   ],
   "attention_probs_dropout_prob": 0.1,
   "classifier_dropout": null,
+  "directionality": "bidi",
   "hidden_act": "gelu",
   "hidden_dropout_prob": 0.1,
   "hidden_size": 768,
   "num_attention_heads": 12,
   "num_hidden_layers": 12,
   "pad_token_id": 0,
+  "pooler_fc_size": 768,
+  "pooler_num_attention_heads": 12,
+  "pooler_num_fc_layers": 3,
+  "pooler_size_per_head": 128,
+  "pooler_type": "first_token_transform",
   "position_embedding_type": "absolute",
+  "torch_dtype": "float32",
   "transformers_version": "4.41.0",
   "type_vocab_size": 2,
   "use_cache": true,

tf_model.h5 CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:7307bfd4ed3e7a83e2a870154c95b62816d09bebca1c107bd88935dd6e5f45f3
 size 538686416

 version https://git-lfs.github.com/spec/v1
+oid sha256:37749a0d36fb7ec773accf8788945d92009a230583f94f083e53982fdb46abc0
 size 538686416

tokenizer.json CHANGED Viewed

The diff for this file is too large to render. See raw diff

tokenizer_config.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "added_tokens_decoder": {
-    "0": {
       "content": "+ا",
       "lstrip": false,
       "normalized": true,
@@ -8,284 +8,284 @@
       "single_word": true,
       "special": true
     },
-    "1": {
-      "content": "+ك",
       "lstrip": false,
       "normalized": true,
       "rstrip": false,
       "single_word": true,
       "special": true
     },
-    "2": {
-      "content": "ب+",
       "lstrip": false,
       "normalized": true,
       "rstrip": false,
       "single_word": true,
       "special": true
     },
-    "3": {
-      "content": "+هم",
       "lstrip": false,
       "normalized": true,
       "rstrip": false,
       "single_word": true,
       "special": true
     },
-    "4": {
-      "content": "+ات",
       "lstrip": false,
       "normalized": true,
       "rstrip": false,
       "single_word": true,
       "special": true
     },
-    "5": {
-      "content": "+ي",
       "lstrip": false,
       "normalized": true,
       "rstrip": false,
       "single_word": true,
       "special": true
     },
-    "6": {
-      "content": "ل+",
       "lstrip": false,
       "normalized": true,
       "rstrip": false,
       "single_word": true,
       "special": true
     },
-    "7": {
-      "content": "+هما",
       "lstrip": false,
       "normalized": true,
       "rstrip": false,
       "single_word": true,
       "special": true
     },
-    "8": {
-      "content": "+نا",
       "lstrip": false,
       "normalized": true,
       "rstrip": false,
       "single_word": true,
       "special": true
     },
-    "9": {
-      "content": "+ن",
       "lstrip": false,
       "normalized": true,
       "rstrip": false,
       "single_word": true,
       "special": true
     },
-    "10": {
-      "content": "+ها",
       "lstrip": false,
       "normalized": true,
       "rstrip": false,
       "single_word": true,
       "special": true
     },
-    "11": {
-      "content": "+كما",
       "lstrip": false,
       "normalized": true,
       "rstrip": false,
       "single_word": true,
       "special": true
     },
-    "12": {
-      "content": "+ة",
       "lstrip": false,
       "normalized": true,
       "rstrip": false,
       "single_word": true,
       "special": true
     },
-    "13": {
-      "content": "ف+",
       "lstrip": false,
       "normalized": true,
       "rstrip": false,
       "single_word": true,
       "special": true
     },
-    "14": {
-      "content": "+كم",
       "lstrip": false,
       "normalized": true,
       "rstrip": false,
       "single_word": true,
       "special": true
     },
-    "15": {
-      "content": "+كن",
       "lstrip": false,
       "normalized": true,
       "rstrip": false,
       "single_word": true,
       "special": true
     },
-    "16": {
-      "content": "+ت",
       "lstrip": false,
       "normalized": true,
       "rstrip": false,
       "single_word": true,
       "special": true
     },
-    "17": {
-      "content": "[بريد]",
       "lstrip": false,
       "normalized": true,
       "rstrip": false,
       "single_word": true,
       "special": true
     },
-    "18": {
-      "content": "[مستخدم]",
       "lstrip": false,
       "normalized": true,
       "rstrip": false,
       "single_word": true,
       "special": true
     },
-    "19": {
-      "content": "لل+",
       "lstrip": false,
       "normalized": true,
       "rstrip": false,
       "single_word": true,
       "special": true
     },
-    "20": {
-      "content": "ال+",
       "lstrip": false,
       "normalized": true,
       "rstrip": false,
       "single_word": true,
       "special": true
     },
-    "21": {
-      "content": "[رابط]",
       "lstrip": false,
       "normalized": true,
       "rstrip": false,
       "single_word": true,
       "special": true
     },
-    "22": {
-      "content": "س+",
       "lstrip": false,
       "normalized": true,
       "rstrip": false,
       "single_word": true,
       "special": true
     },
-    "23": {
-      "content": "+ان",
       "lstrip": false,
       "normalized": true,
       "rstrip": false,
       "single_word": true,
       "special": true
     },
-    "24": {
-      "content": "+وا",
       "lstrip": false,
       "normalized": true,
       "rstrip": false,
       "single_word": true,
       "special": true
     },
-    "25": {
-      "content": "+ه",
       "lstrip": false,
       "normalized": true,
       "rstrip": false,
       "single_word": true,
       "special": true
     },
-    "26": {
-      "content": "+ون",
       "lstrip": false,
       "normalized": true,
       "rstrip": false,
       "single_word": true,
       "special": true
     },
-    "27": {
-      "content": "+هن",
       "lstrip": false,
       "normalized": true,
       "rstrip": false,
       "single_word": true,
       "special": true
     },
-    "28": {
-      "content": "+ين",
       "lstrip": false,
-      "normalized": true,
       "rstrip": false,
-      "single_word": true,
       "special": true
     },
-    "29": {
-      "content": "و+",
       "lstrip": false,
-      "normalized": true,
       "rstrip": false,
-      "single_word": true,
       "special": true
     },
-    "30": {
-      "content": "ك+",
       "lstrip": false,
-      "normalized": true,
       "rstrip": false,
-      "single_word": true,
       "special": true
     },
-    "31": {
-      "content": "[PAD]",
       "lstrip": false,
       "normalized": false,
       "rstrip": false,
       "single_word": false,
       "special": true
     },
-    "32": {
-      "content": "[UNK]",
       "lstrip": false,
       "normalized": false,
       "rstrip": false,
       "single_word": false,
       "special": true
     },
-    "33": {
-      "content": "[CLS]",
       "lstrip": false,
-      "normalized": false,
       "rstrip": false,
-      "single_word": false,
       "special": true
     },
-    "34": {
-      "content": "[SEP]",
       "lstrip": false,
-      "normalized": false,
       "rstrip": false,
-      "single_word": false,
       "special": true
     },
-    "35": {
-      "content": "[MASK]",
       "lstrip": false,
-      "normalized": false,
       "rstrip": false,
-      "single_word": false,
       "special": true
     }
   },
@@ -293,46 +293,54 @@
   "cls_token": "[CLS]",
   "do_basic_tokenize": true,
   "do_lower_case": false,
   "mask_token": "[MASK]",
   "max_len": 512,
   "model_max_length": 512,
   "never_split": [
-    "+ك",
-    "+كما",
-    "ك+",
     "+وا",
-    "+ين",
-    "و+",
-    "+كن",
-    "+ان",
     "+هم",
     "+ة",
-    "[بريد]",
-    "لل+",
-    "+ي",
-    "+ت",
     "+ن",
-    "س+",
-    "ل+",
-    "[مستخدم]",
-    "+كم",
     "+ا",
     "ب+",
-    "ف+",
     "+نا",
-    "+ها",
-    "+ون",
     "+هما",
     "ال+",
-    "+ه",
-    "+هن",
-    "+ات",
-    "[رابط]"
   ],
   "pad_token": "[PAD]",
   "sep_token": "[SEP]",
   "strip_accents": null,
   "tokenize_chinese_chars": true,
   "tokenizer_class": "BertTokenizer",
   "unk_token": "[UNK]"
 }

 {
   "added_tokens_decoder": {
+    "124": {
       "content": "+ا",
       "lstrip": false,
       "normalized": true,
       "single_word": true,
       "special": true
     },
+    "125": {
+      "content": "+ة",
       "lstrip": false,
       "normalized": true,
       "rstrip": false,
       "single_word": true,
       "special": true
     },
+    "126": {
+      "content": "+ت",
       "lstrip": false,
       "normalized": true,
       "rstrip": false,
       "single_word": true,
       "special": true
     },
+    "127": {
+      "content": "+ك",
       "lstrip": false,
       "normalized": true,
       "rstrip": false,
       "single_word": true,
       "special": true
     },
+    "128": {
+      "content": "+ن",
       "lstrip": false,
       "normalized": true,
       "rstrip": false,
       "single_word": true,
       "special": true
     },
+    "129": {
+      "content": "+ه",
       "lstrip": false,
       "normalized": true,
       "rstrip": false,
       "single_word": true,
       "special": true
     },
+    "130": {
+      "content": "+ي",
       "lstrip": false,
       "normalized": true,
       "rstrip": false,
       "single_word": true,
       "special": true
     },
+    "448": {
+      "content": "ب+",
       "lstrip": false,
       "normalized": true,
       "rstrip": false,
       "single_word": true,
       "special": true
     },
+    "635": {
+      "content": "س+",
       "lstrip": false,
       "normalized": true,
       "rstrip": false,
       "single_word": true,
       "special": true
     },
+    "765": {
+      "content": "ف+",
       "lstrip": false,
       "normalized": true,
       "rstrip": false,
       "single_word": true,
       "special": true
     },
+    "802": {
+      "content": "ك+",
       "lstrip": false,
       "normalized": true,
       "rstrip": false,
       "single_word": true,
       "special": true
     },
+    "816": {
+      "content": "ل+",
       "lstrip": false,
       "normalized": true,
       "rstrip": false,
       "single_word": true,
       "special": true
     },
+    "897": {
+      "content": "و+",
       "lstrip": false,
       "normalized": true,
       "rstrip": false,
       "single_word": true,
       "special": true
     },
+    "1012": {
+      "content": "+ات",
       "lstrip": false,
       "normalized": true,
       "rstrip": false,
       "single_word": true,
       "special": true
     },
+    "1013": {
+      "content": "+ان",
       "lstrip": false,
       "normalized": true,
       "rstrip": false,
       "single_word": true,
       "special": true
     },
+    "1015": {
+      "content": "+كم",
       "lstrip": false,
       "normalized": true,
       "rstrip": false,
       "single_word": true,
       "special": true
     },
+    "1016": {
+      "content": "+كن",
       "lstrip": false,
       "normalized": true,
       "rstrip": false,
       "single_word": true,
       "special": true
     },
+    "1017": {
+      "content": "+نا",
       "lstrip": false,
       "normalized": true,
       "rstrip": false,
       "single_word": true,
       "special": true
     },
+    "1018": {
+      "content": "+ها",
       "lstrip": false,
       "normalized": true,
       "rstrip": false,
       "single_word": true,
       "special": true
     },
+    "1019": {
+      "content": "+هم",
       "lstrip": false,
       "normalized": true,
       "rstrip": false,
       "single_word": true,
       "special": true
     },
+    "1020": {
+      "content": "+هن",
       "lstrip": false,
       "normalized": true,
       "rstrip": false,
       "single_word": true,
       "special": true
     },
+    "1021": {
+      "content": "+وا",
       "lstrip": false,
       "normalized": true,
       "rstrip": false,
       "single_word": true,
       "special": true
     },
+    "1022": {
+      "content": "+ون",
       "lstrip": false,
       "normalized": true,
       "rstrip": false,
       "single_word": true,
       "special": true
     },
+    "1023": {
+      "content": "+ين",
       "lstrip": false,
       "normalized": true,
       "rstrip": false,
       "single_word": true,
       "special": true
     },
+    "3000": {
+      "content": "ال+",
       "lstrip": false,
       "normalized": true,
       "rstrip": false,
       "single_word": true,
       "special": true
     },
+    "6154": {
+      "content": "لل+",
       "lstrip": false,
       "normalized": true,
       "rstrip": false,
       "single_word": true,
       "special": true
     },
+    "8270": {
+      "content": "+كما",
       "lstrip": false,
       "normalized": true,
       "rstrip": false,
       "single_word": true,
       "special": true
     },
+    "8271": {
+      "content": "+هما",
       "lstrip": false,
       "normalized": true,
       "rstrip": false,
       "single_word": true,
       "special": true
     },
+    "29756": {
+      "content": "[CLS]",
       "lstrip": false,
+      "normalized": false,
       "rstrip": false,
+      "single_word": false,
       "special": true
     },
+    "29757": {
+      "content": "[PAD]",
       "lstrip": false,
+      "normalized": false,
       "rstrip": false,
+      "single_word": false,
       "special": true
     },
+    "29758": {
+      "content": "[SEP]",
       "lstrip": false,
+      "normalized": false,
       "rstrip": false,
+      "single_word": false,
       "special": true
     },
+    "29759": {
+      "content": "[UNK]",
       "lstrip": false,
       "normalized": false,
       "rstrip": false,
       "single_word": false,
       "special": true
     },
+    "46585": {
+      "content": "[MASK]",
       "lstrip": false,
       "normalized": false,
       "rstrip": false,
       "single_word": false,
       "special": true
     },
+    "46586": {
+      "content": "[بريد]",
       "lstrip": false,
+      "normalized": true,
       "rstrip": false,
+      "single_word": true,
       "special": true
     },
+    "46587": {
+      "content": "[رابط]",
       "lstrip": false,
+      "normalized": true,
       "rstrip": false,
+      "single_word": true,
       "special": true
     },
+    "57701": {
+      "content": "[مستخدم]",
       "lstrip": false,
+      "normalized": true,
       "rstrip": false,
+      "single_word": true,
       "special": true
     }
   },
   "cls_token": "[CLS]",
   "do_basic_tokenize": true,
   "do_lower_case": false,
+  "full_tokenizer_file": null,
   "mask_token": "[MASK]",
   "max_len": 512,
+  "max_length": 384,
   "model_max_length": 512,
   "never_split": [
     "+وا",
+    "س+",
+    "[مستخدم]",
+    "+ك",
     "+هم",
     "+ة",
     "+ن",
+    "لل+",
+    "[بريد]",
+    "[رابط]",
+    "+ه",
+    "+كن",
     "+ا",
+    "+ات",
+    "+ي",
     "ب+",
     "+نا",
+    "+هن",
+    "+كم",
+    "ك+",
+    "+ين",
     "+هما",
+    "و+",
+    "+كما",
+    "+ان",
+    "+ت",
+    "+ون",
+    "ل+",
+    "+ها",
     "ال+",
+    "ف+"
   ],
+  "pad_to_multiple_of": null,
   "pad_token": "[PAD]",
+  "pad_token_type_id": 0,
+  "padding_side": "right",
   "sep_token": "[SEP]",
+  "stride": 0,
   "strip_accents": null,
   "tokenize_chinese_chars": true,
   "tokenizer_class": "BertTokenizer",
+  "truncation_side": "right",
+  "truncation_strategy": "only_second",
   "unk_token": "[UNK]"
 }

vocab.txt CHANGED Viewed

The diff for this file is too large to render. See raw diff