nour4286 commited on
Commit
49788d2
1 Parent(s): 90de5b5

Training in progress, epoch 2, checkpoint

Browse files
checkpoint-3056/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ad463059a49b613eb03df4c048d797ae396203ad55df2966259cf6d0832bf908
3
  size 557116312
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b68e41325dbdb1437b0cba550afc81b90e36838c1043f61962d5eded12bdaac6
3
  size 557116312
checkpoint-3056/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:13c5b5a9472f5b369c41cc0223a54d821c73eef9313bfc84104b0a8c08145c9f
3
  size 1113991930
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:35a3bac36de4f7daf69d45a6a1559474ca3a6d2bbf09bff99f6344ec5339c5cc
3
  size 1113991930
checkpoint-3056/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3a10d959c75e03b0f3e40ddccae75cc1c3bb4a7dda726c8500cf7cde82fc0151
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fa9d1335bcf626664b9856d1d0008b505cd442c2fc0ed9f9e4da5747018686cf
3
  size 1064
checkpoint-3056/trainer_state.json CHANGED
@@ -42,41 +42,41 @@
42
  },
43
  {
44
  "epoch": 1.3089005235602094,
45
- "grad_norm": 3.447214365005493,
46
- "learning_rate": 3.691099476439791e-05,
47
- "loss": 0.0416,
48
  "step": 2000
49
  },
50
  {
51
  "epoch": 1.6361256544502618,
52
- "grad_norm": 1.726170301437378,
53
- "learning_rate": 3.3638743455497386e-05,
54
- "loss": 0.0536,
55
  "step": 2500
56
  },
57
  {
58
  "epoch": 1.9633507853403143,
59
- "grad_norm": 5.475728511810303,
60
- "learning_rate": 3.036649214659686e-05,
61
- "loss": 0.0841,
62
  "step": 3000
63
  },
64
  {
65
  "epoch": 2.0,
66
- "eval_loss": 5.553058624267578,
67
- "eval_rouge1": 25.1196,
68
- "eval_rouge2": 9.8402,
69
- "eval_rougeL": 21.832,
70
- "eval_runtime": 384.1983,
71
- "eval_samples_per_second": 5.713,
72
- "eval_steps_per_second": 0.573,
73
  "step": 3056
74
  }
75
  ],
76
  "logging_steps": 500,
77
- "max_steps": 7640,
78
  "num_input_tokens_seen": 0,
79
- "num_train_epochs": 5,
80
  "save_steps": 500,
81
  "stateful_callbacks": {
82
  "TrainerControl": {
 
42
  },
43
  {
44
  "epoch": 1.3089005235602094,
45
+ "grad_norm": 3.4732136726379395,
46
+ "learning_rate": 4.3455497382198955e-05,
47
+ "loss": 0.0456,
48
  "step": 2000
49
  },
50
  {
51
  "epoch": 1.6361256544502618,
52
+ "grad_norm": 2.2575156688690186,
53
+ "learning_rate": 4.181937172774869e-05,
54
+ "loss": 0.0619,
55
  "step": 2500
56
  },
57
  {
58
  "epoch": 1.9633507853403143,
59
+ "grad_norm": 6.030032157897949,
60
+ "learning_rate": 4.018324607329843e-05,
61
+ "loss": 0.0993,
62
  "step": 3000
63
  },
64
  {
65
  "epoch": 2.0,
66
+ "eval_loss": 5.542174339294434,
67
+ "eval_rouge1": 25.0744,
68
+ "eval_rouge2": 9.8534,
69
+ "eval_rougeL": 21.6992,
70
+ "eval_runtime": 411.9676,
71
+ "eval_samples_per_second": 5.328,
72
+ "eval_steps_per_second": 0.534,
73
  "step": 3056
74
  }
75
  ],
76
  "logging_steps": 500,
77
+ "max_steps": 15280,
78
  "num_input_tokens_seen": 0,
79
+ "num_train_epochs": 10,
80
  "save_steps": 500,
81
  "stateful_callbacks": {
82
  "TrainerControl": {
checkpoint-3056/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0db0c5c28c9a1e67e13675dc0782cb65baca4516e1c39cf487f5c45dc85be680
3
  size 6904
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a35dd57590090f24ebba9a087e2c3d94297cd357e1c5960144536e9514488b6a
3
  size 6904