mllm-dev committed on
Commit
693551c
1 Parent(s): 1d2bc21

Upload folder using huggingface_hub

Browse files
Files changed (5) hide show
  1. model.safetensors +1 -1
  2. optimizer.pt +1 -1
  3. rng_state.pth +1 -1
  4. trainer_state.json +20 -20
  5. training_args.bin +1 -1
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9ebd4e2388cfc26d0f32b5ede296bb3b43fd0595626cc375c9b07ac05cd9c238
3
  size 497805008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b4160a07954e4412b0d257e7be809f5d543abd688371a7a1d9a5f5e8aaa095e3
3
  size 497805008
optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4285543d27ca4dfed07ba3feaa9d46f5b1d99783648e2ff51f9ad8aae15e8d2d
3
  size 995704133
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e9ba3736cbea56a07a3efd14e17484f317576ea02e56f59c8bd2a83e6e7b8bca
3
  size 995704133
rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:08f7c8f2f1f450ef4812e0468b7a029a19d12df470c12014d4db6d65476b4372
3
  size 14575
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dc2cde58ea73ab57892d0e819c1447881d94dc98179fd7503d033de1277c65e9
3
  size 14575
trainer_state.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "best_metric": 1.410697102546692,
3
  "best_model_checkpoint": "tam_test_out_drug_data/checkpoint-1011",
4
  "epoch": 3.0,
5
  "eval_steps": 500,
@@ -10,43 +10,43 @@
10
  "log_history": [
11
  {
12
  "epoch": 1.0,
13
- "eval_accuracy": 0.46396354505719334,
14
- "eval_loss": 1.46442449092865,
15
- "eval_runtime": 15.0839,
16
- "eval_samples_per_second": 712.879,
17
- "eval_steps_per_second": 7.491,
18
  "step": 337
19
  },
20
  {
21
  "epoch": 1.48,
22
- "grad_norm": 391296.28125,
23
  "learning_rate": 5.554896142433234e-05,
24
- "loss": 1.6493,
25
  "step": 500
26
  },
27
  {
28
  "epoch": 2.0,
29
- "eval_accuracy": 0.47372826188040545,
30
- "eval_loss": 1.4272058010101318,
31
- "eval_runtime": 15.1004,
32
- "eval_samples_per_second": 712.101,
33
  "eval_steps_per_second": 7.483,
34
  "step": 674
35
  },
36
  {
37
  "epoch": 2.97,
38
- "grad_norm": 266398.21875,
39
  "learning_rate": 5.109792284866469e-05,
40
- "loss": 1.3762,
41
  "step": 1000
42
  },
43
  {
44
  "epoch": 3.0,
45
- "eval_accuracy": 0.47456523760810937,
46
- "eval_loss": 1.410697102546692,
47
- "eval_runtime": 15.0489,
48
- "eval_samples_per_second": 714.539,
49
- "eval_steps_per_second": 7.509,
50
  "step": 1011
51
  }
52
  ],
@@ -55,7 +55,7 @@
55
  "num_input_tokens_seen": 0,
56
  "num_train_epochs": 20,
57
  "save_steps": 500,
58
- "total_flos": 1.276707860453376e+16,
59
  "train_batch_size": 96,
60
  "trial_name": null,
61
  "trial_params": null
 
1
  {
2
+ "best_metric": 1.4213874340057373,
3
  "best_model_checkpoint": "tam_test_out_drug_data/checkpoint-1011",
4
  "epoch": 3.0,
5
  "eval_steps": 500,
 
10
  "log_history": [
11
  {
12
  "epoch": 1.0,
13
+ "eval_accuracy": 0.46219659629870735,
14
+ "eval_loss": 1.4630001783370972,
15
+ "eval_runtime": 15.2997,
16
+ "eval_samples_per_second": 702.823,
17
+ "eval_steps_per_second": 7.386,
18
  "step": 337
19
  },
20
  {
21
  "epoch": 1.48,
22
+ "grad_norm": 283691.34375,
23
  "learning_rate": 5.554896142433234e-05,
24
+ "loss": 1.599,
25
  "step": 500
26
  },
27
  {
28
  "epoch": 2.0,
29
+ "eval_accuracy": 0.4721473077280759,
30
+ "eval_loss": 1.443649411201477,
31
+ "eval_runtime": 15.1007,
32
+ "eval_samples_per_second": 712.086,
33
  "eval_steps_per_second": 7.483,
34
  "step": 674
35
  },
36
  {
37
  "epoch": 2.97,
38
+ "grad_norm": 246200.171875,
39
  "learning_rate": 5.109792284866469e-05,
40
+ "loss": 1.3511,
41
  "step": 1000
42
  },
43
  {
44
  "epoch": 3.0,
45
+ "eval_accuracy": 0.471310332000372,
46
+ "eval_loss": 1.4213874340057373,
47
+ "eval_runtime": 14.9491,
48
+ "eval_samples_per_second": 719.309,
49
+ "eval_steps_per_second": 7.559,
50
  "step": 1011
51
  }
52
  ],
 
55
  "num_input_tokens_seen": 0,
56
  "num_train_epochs": 20,
57
  "save_steps": 500,
58
+ "total_flos": 1.32737670494208e+16,
59
  "train_batch_size": 96,
60
  "trial_name": null,
61
  "trial_params": null
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fcf86aa1afbdd702b3daff78f76586a0908e4459d837fc5a7ab105fe1af7cc23
3
  size 4603
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:031e77c7775f2760360cdc9ed1a2d9e618d47728f22b58e85ee32d4d55d0ce3d
3
  size 4603