Training in progress, epoch 2
Browse files- config.json +1 -1
- model.safetensors +1 -1
- runs/Dec03_15-19-22_334ed81528ca/events.out.tfevents.1701616970.334ed81528ca.6379.0 +2 -2
- runs/Dec03_15-36-41_334ed81528ca/events.out.tfevents.1701617995.334ed81528ca.11254.0 +3 -0
- special_tokens_map.json +35 -5
- tokenizer_config.json +4 -0
- training_args.bin +1 -1
config.json
CHANGED
@@ -1,5 +1,5 @@
|
|
1 |
{
|
2 |
-
"_name_or_path": "
|
3 |
"activation_dropout": 0.0,
|
4 |
"activation_function": "relu",
|
5 |
"architectures": [
|
|
|
1 |
{
|
2 |
+
"_name_or_path": "nadsoft/Faseeh-v0.1-beta",
|
3 |
"activation_dropout": 0.0,
|
4 |
"activation_function": "relu",
|
5 |
"architectures": [
|
model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 2460354912
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e552eccfeb9b585b84e7b223b98a74ca8c85c96f9c32a769b90fd53d7d17b97d
|
3 |
size 2460354912
|
runs/Dec03_15-19-22_334ed81528ca/events.out.tfevents.1701616970.334ed81528ca.6379.0
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:84040688cf3e8f4d35a68ab4bb6a7e744fcd449b8a2c3e1577032e37709e68dc
|
3 |
+
size 5338
|
runs/Dec03_15-36-41_334ed81528ca/events.out.tfevents.1701617995.334ed81528ca.11254.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fa5a0920a83e3ebda7300b401eb98267f410f9c91106e331eb6a81a06f419f09
|
3 |
+
size 5016
|
special_tokens_map.json
CHANGED
@@ -203,9 +203,27 @@
|
|
203 |
"zho_Hant",
|
204 |
"zul_Latn"
|
205 |
],
|
206 |
-
"bos_token":
|
207 |
-
|
208 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
209 |
"mask_token": {
|
210 |
"content": "<mask>",
|
211 |
"lstrip": true,
|
@@ -220,6 +238,18 @@
|
|
220 |
"rstrip": false,
|
221 |
"single_word": false
|
222 |
},
|
223 |
-
"sep_token":
|
224 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
225 |
}
|
|
|
203 |
"zho_Hant",
|
204 |
"zul_Latn"
|
205 |
],
|
206 |
+
"bos_token": {
|
207 |
+
"content": "<s>",
|
208 |
+
"lstrip": false,
|
209 |
+
"normalized": false,
|
210 |
+
"rstrip": false,
|
211 |
+
"single_word": false
|
212 |
+
},
|
213 |
+
"cls_token": {
|
214 |
+
"content": "<s>",
|
215 |
+
"lstrip": false,
|
216 |
+
"normalized": false,
|
217 |
+
"rstrip": false,
|
218 |
+
"single_word": false
|
219 |
+
},
|
220 |
+
"eos_token": {
|
221 |
+
"content": "</s>",
|
222 |
+
"lstrip": false,
|
223 |
+
"normalized": false,
|
224 |
+
"rstrip": false,
|
225 |
+
"single_word": false
|
226 |
+
},
|
227 |
"mask_token": {
|
228 |
"content": "<mask>",
|
229 |
"lstrip": true,
|
|
|
238 |
"rstrip": false,
|
239 |
"single_word": false
|
240 |
},
|
241 |
+
"sep_token": {
|
242 |
+
"content": "</s>",
|
243 |
+
"lstrip": false,
|
244 |
+
"normalized": false,
|
245 |
+
"rstrip": false,
|
246 |
+
"single_word": false
|
247 |
+
},
|
248 |
+
"unk_token": {
|
249 |
+
"content": "<unk>",
|
250 |
+
"lstrip": false,
|
251 |
+
"normalized": false,
|
252 |
+
"rstrip": false,
|
253 |
+
"single_word": false
|
254 |
+
}
|
255 |
}
|
tokenizer_config.json
CHANGED
@@ -1875,13 +1875,17 @@
|
|
1875 |
"eos_token": "</s>",
|
1876 |
"legacy_behaviour": false,
|
1877 |
"mask_token": "<mask>",
|
|
|
1878 |
"model_max_length": 1024,
|
1879 |
"pad_token": "[PAD]",
|
1880 |
"return_tensors": "pt",
|
1881 |
"sep_token": "</s>",
|
1882 |
"sp_model_kwargs": {},
|
1883 |
"src_lang": "ajp_Arab",
|
|
|
1884 |
"tgt_lang": "eng_Latn",
|
1885 |
"tokenizer_class": "NllbTokenizer",
|
|
|
|
|
1886 |
"unk_token": "<unk>"
|
1887 |
}
|
|
|
1875 |
"eos_token": "</s>",
|
1876 |
"legacy_behaviour": false,
|
1877 |
"mask_token": "<mask>",
|
1878 |
+
"max_length": 128,
|
1879 |
"model_max_length": 1024,
|
1880 |
"pad_token": "[PAD]",
|
1881 |
"return_tensors": "pt",
|
1882 |
"sep_token": "</s>",
|
1883 |
"sp_model_kwargs": {},
|
1884 |
"src_lang": "ajp_Arab",
|
1885 |
+
"stride": 0,
|
1886 |
"tgt_lang": "eng_Latn",
|
1887 |
"tokenizer_class": "NllbTokenizer",
|
1888 |
+
"truncation_side": "right",
|
1889 |
+
"truncation_strategy": "longest_first",
|
1890 |
"unk_token": "<unk>"
|
1891 |
}
|
training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4728
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6568c1c3f0d96445292c19d770928d11e8916064302ada262e45857b310ca3ac
|
3 |
size 4728
|