yhavinga committed on
Commit
dd3b617
1 Parent(s): 21e9f42

Saving weights and log at 40000 steps

Browse files
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "/home/yeb/data/gpt2-medium-dutch",
3
  "activation_function": "gelu_new",
4
  "architectures": [
5
  "GPT2LMHeadModel"
@@ -11,7 +11,6 @@
11
  "initializer_range": 0.02,
12
  "layer_norm_epsilon": 1e-05,
13
  "model_type": "gpt2",
14
- "torch_dtype": "float32",
15
  "n_ctx": 1024,
16
  "n_embd": 1024,
17
  "n_head": 16,
@@ -35,6 +34,7 @@
35
  "max_length": 50
36
  }
37
  },
 
38
  "transformers_version": "4.13.0",
39
  "use_cache": true,
40
  "vocab_size": 50257
 
1
  {
2
+ "_name_or_path": ".",
3
  "activation_function": "gelu_new",
4
  "architectures": [
5
  "GPT2LMHeadModel"
 
11
  "initializer_range": 0.02,
12
  "layer_norm_epsilon": 1e-05,
13
  "model_type": "gpt2",
 
14
  "n_ctx": 1024,
15
  "n_embd": 1024,
16
  "n_head": 16,
 
34
  "max_length": 50
35
  }
36
  },
37
+ "torch_dtype": "float32",
38
  "transformers_version": "4.13.0",
39
  "use_cache": true,
40
  "vocab_size": 50257
flax_model.msgpack ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a90571e6747628a2de9ab2ae081c144e50175c8e5306a667d36006be0523069a
3
+ size 1419302302
pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5c85e4b9ed9a69055ebfdf420cd6ae3c941c24f10304e093e04da5c04f09873b
3
+ size 1444576537
runs/events.out.tfevents.1640982862.t1v-n-88d0ebfa-w-0.14259.0.v2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5586fc63276f816a2453d6d9c9c1c903ec2a2e1a837c9a8e4cca0251146cdf8b
3
+ size 6457155