jojo-ai-mst committed on
Commit
509c989
1 Parent(s): 07ef033

Training in progress, step 10000

Browse files
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "gpt2-medium",
3
  "activation_function": "gelu_new",
4
  "architectures": [
5
  "GPT2LMHeadModel"
@@ -12,13 +12,11 @@
12
  "layer_norm_epsilon": 1e-05,
13
  "model_type": "gpt2",
14
  "n_ctx": 1024,
15
- "n_embd": 1024,
16
- "n_head": 16,
17
  "n_inner": null,
18
- "n_layer": 24,
19
  "n_positions": 1024,
20
- "n_special": 0,
21
- "predict_special_tokens": true,
22
  "reorder_and_upcast_attn": false,
23
  "resid_pdrop": 0.1,
24
  "scale_attn_by_inverse_layer_idx": false,
 
1
  {
2
+ "_name_or_path": "/content/MyanmarGPT - previous",
3
  "activation_function": "gelu_new",
4
  "architectures": [
5
  "GPT2LMHeadModel"
 
12
  "layer_norm_epsilon": 1e-05,
13
  "model_type": "gpt2",
14
  "n_ctx": 1024,
15
+ "n_embd": 768,
16
+ "n_head": 12,
17
  "n_inner": null,
18
+ "n_layer": 12,
19
  "n_positions": 1024,
 
 
20
  "reorder_and_upcast_attn": false,
21
  "resid_pdrop": 0.1,
22
  "scale_attn_by_inverse_layer_idx": false,
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:47b019be2a89f1b83d91ac9ba19d3824bc8addbbf20c72ed2b0aa76aade63abe
3
- size 1419322880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4569809d19f454d109e221beed5db02bbfe9744c43bdeac597eb309882aec7c2
3
+ size 497774208
runs/Dec13_19-19-51_6862dcd86e9a/events.out.tfevents.1702495192.6862dcd86e9a.191.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:73091212c44137b5a6326ffc9b828a8aeb87cb2ca35430d5390f3f9a252cd854
3
+ size 7615
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:de6356f01f5d2dc37383b24cfbf060d65a8349d336bc137fec32ebca1473d475
3
  size 4536
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:887cde771b6d493f66e03443461a14fbff58c5fba53667686e2c83fc1a1b66c8
3
  size 4536