fpadovani committed on
Commit
8dfdd00
1 Parent(s): 517f68f

Training in progress epoch 0

Browse files
checkpoint-2000/config.json CHANGED
@@ -3,18 +3,20 @@
3
  "architectures": [
4
  "GPT2LMHeadModel"
5
  ],
 
6
  "attn_pdrop": 0.1,
7
  "bos_token_id": 5,
8
  "embd_pdrop": 0.1,
9
  "eos_token_id": 4,
 
10
  "initializer_range": 0.02,
11
  "layer_norm_epsilon": 1e-05,
12
  "model_type": "gpt2",
13
  "n_ctx": 128,
14
  "n_embd": 128,
15
- "n_head": 4,
16
  "n_inner": null,
17
- "n_layer": 4,
18
  "n_positions": 128,
19
  "reorder_and_upcast_attn": false,
20
  "resid_pdrop": 0.1,
 
3
  "architectures": [
4
  "GPT2LMHeadModel"
5
  ],
6
+ "attention_probs_dropout_prob": 0.1,
7
  "attn_pdrop": 0.1,
8
  "bos_token_id": 5,
9
  "embd_pdrop": 0.1,
10
  "eos_token_id": 4,
11
+ "hidden_dropout_prob": 0.1,
12
  "initializer_range": 0.02,
13
  "layer_norm_epsilon": 1e-05,
14
  "model_type": "gpt2",
15
  "n_ctx": 128,
16
  "n_embd": 128,
17
+ "n_head": 32,
18
  "n_inner": null,
19
+ "n_layer": 2,
20
  "n_positions": 128,
21
  "reorder_and_upcast_attn": false,
22
  "resid_pdrop": 0.1,
checkpoint-2000/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b63f198c7497bd2841852386f58c71aa608c42edaaa03864c1c89f28820d7c84
3
- size 7438256
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:72b8f1431861f4f99c8a6c4334d906aadde093d300f60ce124b1f48411c16dfd
3
+ size 5849744
checkpoint-2000/optimizer.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4ae28a2f41e9984bc2ecf544ce621bbae18c78d30dfa59ebad78c82c9a3eb2b7
3
- size 14910074
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4f55ebbba1d58789f4d9f559dcb15ace72f8f2929c49d3dedff87915c53b24c7
3
+ size 11717834
checkpoint-2000/random_states_0.pkl CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2f4bfbeca8fff7808687f31f7ea0c493baeef2f350c34e0d2c6843bdfbc49374
3
  size 14604
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8c20ac4079187b7525e81a42cdb5ad3bdc736c79836d9e044d1a0ba96023ba64
3
  size 14604
checkpoint-2000/scheduler.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:80ad8562be07622fc9e024c897347ceead7b11b7c6000cf58d9491ab7f219099
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:56cab430bf2883ab08ecdb0930091aaa86b7be034aaf50147f79e0060e5cbc6c
3
  size 1064
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:72b8f1431861f4f99c8a6c4334d906aadde093d300f60ce124b1f48411c16dfd
3
  size 5849744
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:918b0091f7a32f70809205d697ad6626712f47b3f2764df939a53f0160d03dc7
3
  size 5849744