Nbeau committed on
Commit
884b5e7
1 Parent(s): 7a7168a

Training in progress, step 500

Browse files
Files changed (4) hide show
  1. README.md +1 -9
  2. config.json +1 -1
  3. model.safetensors +1 -1
  4. training_args.bin +1 -1
README.md CHANGED
@@ -6,14 +6,6 @@ tags:
6
  model-index:
7
  - name: GPT2-arithmetic-3digits
8
  results: []
9
- datasets:
10
- - Nbeau/additiondataset_3digits_10000examples
11
- widget:
12
- - text: "Input:\n561+372\nTarget:"
13
- inference:
14
- parameters:
15
- add_special_tokens: True
16
- do_sample: False
17
  ---
18
 
19
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
@@ -69,4 +61,4 @@ The following hyperparameters were used during training:
69
  - Transformers 4.40.2
70
  - Pytorch 2.3.0
71
  - Datasets 2.19.1
72
- - Tokenizers 0.19.1
 
6
  model-index:
7
  - name: GPT2-arithmetic-3digits
8
  results: []
 
 
 
 
 
 
 
 
9
  ---
10
 
11
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
 
61
  - Transformers 4.40.2
62
  - Pytorch 2.3.0
63
  - Datasets 2.19.1
64
+ - Tokenizers 0.19.1
config.json CHANGED
@@ -17,7 +17,7 @@
17
  "n_inner": null,
18
  "n_layer": 12,
19
  "n_positions": 1024,
20
- "pad_token_id": 2,
21
  "reorder_and_upcast_attn": false,
22
  "resid_pdrop": 0.1,
23
  "scale_attn_by_inverse_layer_idx": false,
 
17
  "n_inner": null,
18
  "n_layer": 12,
19
  "n_positions": 1024,
20
+ "pad_token_id": 32000,
21
  "reorder_and_upcast_attn": false,
22
  "resid_pdrop": 0.1,
23
  "scale_attn_by_inverse_layer_idx": false,
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2cb8cb936fe8224bcc38b887023cc71a454545c82c238652c1fac6e4088583b7
3
  size 441691776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:559704e9da8d819c84387e547a1e42ee323924e58074bb0600c77ae442cec227
3
  size 441691776
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:13f5cb4d558e9ea973b249dfda6c2f28100bdb0853103fe41bc350cf518db912
3
  size 5048
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1267483ff059ea879b3a0ea0f4a5afb8cff43a998d3030d4f8be0527a68d0f01
3
  size 5048