Chakita committed on
Commit
fbbaaf1
1 Parent(s): c6a235e

Training in progress, step 500

Browse files
.gitattributes CHANGED
@@ -25,3 +25,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
25
  *.zip filter=lfs diff=lfs merge=lfs -text
26
  *.zstandard filter=lfs diff=lfs merge=lfs -text
27
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
25
  *.zip filter=lfs diff=lfs merge=lfs -text
26
  *.zstandard filter=lfs diff=lfs merge=lfs -text
27
  *tfevents* filter=lfs diff=lfs merge=lfs -text
28
+ tokenizer.json filter=lfs diff=lfs merge=lfs -text
.gitignore ADDED
@@ -0,0 +1 @@
 
 
1
+ checkpoint-*/
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "Chakita/Kalbert",
3
  "architectures": [
4
  "AlbertForMaskedLM"
5
  ],
@@ -26,7 +26,8 @@
26
  "num_memory_blocks": 0,
27
  "pad_token_id": 0,
28
  "position_embedding_type": "absolute",
29
- "transformers_version": "4.5.0",
 
30
  "type_vocab_size": 2,
31
  "vocab_size": 200000
32
  }
 
1
  {
2
+ "_name_or_path": "ai4bharat/indic-bert",
3
  "architectures": [
4
  "AlbertForMaskedLM"
5
  ],
 
26
  "num_memory_blocks": 0,
27
  "pad_token_id": 0,
28
  "position_embedding_type": "absolute",
29
+ "torch_dtype": "float32",
30
+ "transformers_version": "4.25.1",
31
  "type_vocab_size": 2,
32
  "vocab_size": 200000
33
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:03f2aafa592d94ad45d397b267c0fdc0875587548d7cf565f0d54167d980ca3a
3
- size 132623604
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8dd1508a90b10cf978c9b4e259f499afb86cfebe760268fbc255ffb935067d83
3
+ size 132620936
runs/Jan04_12-47-05_19415c40739a/1672836493.027966/events.out.tfevents.1672836493.19415c40739a.216.5 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:324ef35d22377715ea780851ce0041ca8bb82c1695ab1915578007836ece7e59
3
+ size 5483
runs/Jan04_12-47-05_19415c40739a/events.out.tfevents.1672836493.19415c40739a.216.4 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5663886022245e3185502b9d41ce679e624fc5e9a165e0eab40ae6d30ba4b9b5
3
+ size 3809
runs/Jan04_12-52-56_19415c40739a/1672836786.3600266/events.out.tfevents.1672836786.19415c40739a.216.7 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:17f844c721d50d9ed345c3a6ce3c23418633f9815bce0a160f326451b66eaa01
3
+ size 5483
runs/Jan04_12-52-56_19415c40739a/events.out.tfevents.1672836786.19415c40739a.216.6 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:51d82d4bd71cac0d5451f5393915a167c042afef939ab125f122415190ecd519
3
+ size 3963
runs/Jan04_12-53-45_19415c40739a/1672836833.3656578/events.out.tfevents.1672836833.19415c40739a.216.9 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:97b52357f77eb9331ab865a5e0422ec4ea88266167bee4ba131a8e2355a37c36
3
+ size 5483
runs/Jan04_12-53-45_19415c40739a/events.out.tfevents.1672836833.19415c40739a.216.8 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1d5720b6f2461c45bed584030ee29f81d37591dffce9b4e80042f33911b70120
3
+ size 4591
special_tokens_map.json CHANGED
@@ -1 +1,15 @@
1
- {"bos_token": "[CLS]", "eos_token": "[SEP]", "unk_token": "<unk>", "sep_token": "[SEP]", "pad_token": "<pad>", "cls_token": "[CLS]", "mask_token": {"content": "[MASK]", "single_word": false, "lstrip": true, "rstrip": false, "normalized": true}}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token": "[CLS]",
3
+ "cls_token": "[CLS]",
4
+ "eos_token": "[SEP]",
5
+ "mask_token": {
6
+ "content": "[MASK]",
7
+ "lstrip": true,
8
+ "normalized": false,
9
+ "rstrip": false,
10
+ "single_word": false
11
+ },
12
+ "pad_token": "<pad>",
13
+ "sep_token": "[SEP]",
14
+ "unk_token": "<unk>"
15
+ }
tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:431ec72a485a382d7e3a6063af5f54249b36e4870e0c8d079918e79cd0a4f8f1
3
+ size 15285606
tokenizer_config.json CHANGED
@@ -1 +1,24 @@
1
- {"do_lower_case": true, "remove_space": true, "keep_accents": false, "bos_token": "[CLS]", "eos_token": "[SEP]", "unk_token": "<unk>", "sep_token": "[SEP]", "pad_token": "<pad>", "cls_token": "[CLS]", "mask_token": "[MASK]", "special_tokens_map_file": null, "name_or_path": "Chakita/Kalbert"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token": "[CLS]",
3
+ "cls_token": "[CLS]",
4
+ "do_lower_case": true,
5
+ "eos_token": "[SEP]",
6
+ "keep_accents": false,
7
+ "mask_token": {
8
+ "__type": "AddedToken",
9
+ "content": "[MASK]",
10
+ "lstrip": true,
11
+ "normalized": false,
12
+ "rstrip": false,
13
+ "single_word": false
14
+ },
15
+ "model_max_length": 1000000000000000019884624838656,
16
+ "name_or_path": "ai4bharat/indic-bert",
17
+ "pad_token": "<pad>",
18
+ "remove_space": true,
19
+ "sep_token": "[SEP]",
20
+ "sp_model_kwargs": {},
21
+ "special_tokens_map_file": null,
22
+ "tokenizer_class": "AlbertTokenizer",
23
+ "unk_token": "<unk>"
24
+ }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ed1cda506bb11d63f58a02ad16309108852a0f2e992a7eded56d2024811162df
3
- size 2351
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:403088aa8ad81300a1218209040beb8da93fbf5678bf7fdc71ef8b4a5340535c
3
+ size 3387