negfir committed on
Commit
dc35cd1
1 Parent(s): c23a086

Training in progress, epoch 1

Browse files
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "google/bert_uncased_L-12_H-512_A-8",
3
  "architectures": [
4
  "BertForSequenceClassification"
5
  ],
@@ -7,13 +7,13 @@
7
  "classifier_dropout": null,
8
  "hidden_act": "gelu",
9
  "hidden_dropout_prob": 0.1,
10
- "hidden_size": 512,
11
  "initializer_range": 0.02,
12
- "intermediate_size": 2048,
13
  "layer_norm_eps": 1e-12,
14
  "max_position_embeddings": 512,
15
  "model_type": "bert",
16
- "num_attention_heads": 8,
17
  "num_hidden_layers": 12,
18
  "pad_token_id": 0,
19
  "position_embedding_type": "absolute",
 
1
  {
2
+ "_name_or_path": "google/bert_uncased_L-12_H-768_A-12",
3
  "architectures": [
4
  "BertForSequenceClassification"
5
  ],
 
7
  "classifier_dropout": null,
8
  "hidden_act": "gelu",
9
  "hidden_dropout_prob": 0.1,
10
+ "hidden_size": 768,
11
  "initializer_range": 0.02,
12
+ "intermediate_size": 3072,
13
  "layer_norm_eps": 1e-12,
14
  "max_position_embeddings": 512,
15
  "model_type": "bert",
16
+ "num_attention_heads": 12,
17
  "num_hidden_layers": 12,
18
  "pad_token_id": 0,
19
  "position_embedding_type": "absolute",
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f6b9dc877795014f0beaaa1c5df81846e777e101573cbe8d6f6d304df5dc32fc
3
- size 216020013
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:372c4a0cb7b055f458028759e48493abea67022d2d8393f51eebf567a9b468f5
3
+ size 438020141
runs/Mar23_23-42-39_1f6fbf265ce1/events.out.tfevents.1648078963.1f6fbf265ce1.70.11 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4a1657f6eecf7c6b1c40b6c5ba7b1b192c32702883211c6baec6ff0fef15a378
3
- size 3799
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4fe2ecf151195447c4d7bd39854cecfdfd5511720d3d85b4e42de67460687645
3
+ size 6121
runs/Mar23_23-42-39_1f6fbf265ce1/events.out.tfevents.1648079188.1f6fbf265ce1.70.13 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:315a213c52e894112a1786bcfbfd78fa9558f4105e2623fdb57bf21c9d66796e
3
+ size 375
runs/Mar24_00-14-47_1f6fbf265ce1/1648080891.792791/events.out.tfevents.1648080891.1f6fbf265ce1.70.15 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:40c79a0a536c0b30e62636d948a3e383271dff59e8c94ab469f6093fbf14af58
3
+ size 4842
runs/Mar24_00-14-47_1f6fbf265ce1/events.out.tfevents.1648080891.1f6fbf265ce1.70.14 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:39fad841e72e0caa28cf97d5cd781785399cbb1dd2af47cef48fdb6abcb12812
3
+ size 3801
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e10869da30ac2c970c023b7e884def919519b12c9456fbd49103db439e4b884c
3
  size 3055
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1f07c7b20cfe3d6ddfbe5938efbbc988ec136941f0d1569fbf4968c0658bbaad
3
  size 3055