AAA01101312 committed on
Commit
1e128ba
1 Parent(s): 14b5c73

Training in progress, step 500

Browse files
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:80683dcd7bad6070adbf4a6cffeae9bd86f1e04d3dd349da72feb2cb66c2f5e7
3
  size 268290900
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f0cc4778c604548cc03ed426cc23687a92f886997199dd2cf98d6ba3dcdbfe3b
3
  size 268290900
run-4/checkpoint-500/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:34c58a50c849b52be08129cef2729104b91f5ebaf46457436ac0e5ddb0274590
3
  size 268290900
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f0cc4778c604548cc03ed426cc23687a92f886997199dd2cf98d6ba3dcdbfe3b
3
  size 268290900
run-4/checkpoint-500/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d28a1e8094eb6ab9663cd2fb830933ca60972e0ea885d2d509150b1efcbf6e84
3
  size 536643898
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2219825dffd50ded2ac97c5ef392d5520e0cd579c8dac0addd5b05f923a40510
3
  size 536643898
run-4/checkpoint-500/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e4f75fa3851d3548c8bbed0ee7c49e6a23f30f028b074a4398b38c7ecbd0f8e9
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:40a61c60e2a1f354f14fb973803108ea16a9c8c66946147c407c26a5211c4f3d
3
  size 1064
run-4/checkpoint-500/tokenizer.json CHANGED
@@ -1,11 +1,6 @@
1
  {
2
  "version": "1.0",
3
- "truncation": {
4
- "direction": "Right",
5
- "max_length": 512,
6
- "strategy": "LongestFirst",
7
- "stride": 0
8
- },
9
  "padding": null,
10
  "added_tokens": [
11
  {
 
1
  {
2
  "version": "1.0",
3
+ "truncation": null,
 
 
 
 
 
4
  "padding": null,
5
  "added_tokens": [
6
  {
run-4/checkpoint-500/trainer_state.json CHANGED
@@ -10,32 +10,32 @@
10
  "log_history": [
11
  {
12
  "epoch": 1.0,
13
- "eval_accuracy": 0.5770967741935484,
14
- "eval_loss": 0.21370309591293335,
15
- "eval_runtime": 13.9985,
16
- "eval_samples_per_second": 221.453,
17
- "eval_steps_per_second": 27.717,
18
  "step": 318
19
  },
20
  {
21
  "epoch": 1.5723270440251573,
22
- "grad_norm": 0.547938346862793,
23
- "learning_rate": 1.371069182389937e-05,
24
- "loss": 0.3338,
25
  "step": 500
26
  }
27
  ],
28
  "logging_steps": 500,
29
- "max_steps": 1590,
30
  "num_input_tokens_seen": 0,
31
- "num_train_epochs": 5,
32
  "save_steps": 500,
33
  "total_flos": 130072209152340.0,
34
  "train_batch_size": 48,
35
  "trial_name": null,
36
  "trial_params": {
37
- "alpha": 0.6150671860788094,
38
- "num_train_epochs": 5,
39
- "temperature": 9
40
  }
41
  }
 
10
  "log_history": [
11
  {
12
  "epoch": 1.0,
13
+ "eval_accuracy": 0.5816129032258065,
14
+ "eval_loss": 0.20736075937747955,
15
+ "eval_runtime": 17.0342,
16
+ "eval_samples_per_second": 181.987,
17
+ "eval_steps_per_second": 22.778,
18
  "step": 318
19
  },
20
  {
21
  "epoch": 1.5723270440251573,
22
+ "grad_norm": 0.5436314940452576,
23
+ "learning_rate": 1.4758909853249476e-05,
24
+ "loss": 0.3269,
25
  "step": 500
26
  }
27
  ],
28
  "logging_steps": 500,
29
+ "max_steps": 1908,
30
  "num_input_tokens_seen": 0,
31
+ "num_train_epochs": 6,
32
  "save_steps": 500,
33
  "total_flos": 130072209152340.0,
34
  "train_batch_size": 48,
35
  "trial_name": null,
36
  "trial_params": {
37
+ "alpha": 0.1269072763270631,
38
+ "num_train_epochs": 6,
39
+ "temperature": 10
40
  }
41
  }
run-4/checkpoint-500/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:278f8d33f8210fa6267daa5ada1e98b5fd52b1bb1fcfcfeeb3b0875f77b14e08
3
  size 5048
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:853140cfe9700b0f73b0cfadaae534b2ccf66ea184486e4df0f7ec3edaf66498
3
  size 5048
runs/May17_05-23-10_MainPC/events.out.tfevents.1715892747.MainPC.51768.5 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c14eef6632bfc8e9c26a557e1d5bab585b9c485c0494c22febfa56cbda88b114
3
+ size 13062
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:651d2dfaf598da9232615029aef591cddb19f62ee5e131248da1afc5915c5227
3
  size 5048
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:853140cfe9700b0f73b0cfadaae534b2ccf66ea184486e4df0f7ec3edaf66498
3
  size 5048