thobauma committed on
Commit
4312562
1 Parent(s): d0e749b

Model save

Browse files
README.md CHANGED
@@ -2,6 +2,7 @@
2
  tags:
3
  - trl
4
  - reward-trainer
 
5
  - generated_from_trainer
6
  model-index:
7
  - name: opt-350m
 
2
  tags:
3
  - trl
4
  - reward-trainer
5
+ - reward
6
  - generated_from_trainer
7
  model-index:
8
  - name: opt-350m
all_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 1.0,
3
- "train_loss": 0.8802837530771891,
4
- "train_runtime": 25.1988,
5
  "train_samples": 42,
6
- "train_samples_per_second": 1.667,
7
- "train_steps_per_second": 0.119
8
  }
 
1
  {
2
  "epoch": 1.0,
3
+ "train_loss": 0.8802839120229086,
4
+ "train_runtime": 24.9556,
5
  "train_samples": 42,
6
+ "train_samples_per_second": 1.683,
7
+ "train_steps_per_second": 0.12
8
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7d870db732189102cd621a2e13cdc711302646ba6281271ff71ca5d38be3ac1b
3
  size 1324833016
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:05ae07bcc010e036af1aef0752af8f8476e5bd9a7d31c4f97d54f402b7737fd6
3
  size 1324833016
runs/Apr25_12-24-25_MacBook-Pro-3.local/events.out.tfevents.1714040669.MacBook-Pro-3.local.69341.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2957f15d41d3d3dbfde473cf13f93b62c70e6acc4e1760e603a0ce7a2c89006e
3
+ size 5139
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 1.0,
3
- "train_loss": 0.8802837530771891,
4
- "train_runtime": 25.1988,
5
  "train_samples": 42,
6
- "train_samples_per_second": 1.667,
7
- "train_steps_per_second": 0.119
8
  }
 
1
  {
2
  "epoch": 1.0,
3
+ "train_loss": 0.8802839120229086,
4
+ "train_runtime": 24.9556,
5
  "train_samples": 42,
6
+ "train_samples_per_second": 1.683,
7
+ "train_steps_per_second": 0.12
8
  }
trainer_state.json CHANGED
@@ -12,10 +12,10 @@
12
  "epoch": 1.0,
13
  "step": 3,
14
  "total_flos": 0.0,
15
- "train_loss": 0.8802837530771891,
16
- "train_runtime": 25.1988,
17
- "train_samples_per_second": 1.667,
18
- "train_steps_per_second": 0.119
19
  }
20
  ],
21
  "logging_steps": 10,
 
12
  "epoch": 1.0,
13
  "step": 3,
14
  "total_flos": 0.0,
15
+ "train_loss": 0.8802839120229086,
16
+ "train_runtime": 24.9556,
17
+ "train_samples_per_second": 1.683,
18
+ "train_steps_per_second": 0.12
19
  }
20
  ],
21
  "logging_steps": 10,
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a0699c140fde4067fef8409878ee9c6d68ba617273dcb7f7f704daa708f40281
3
  size 4920
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:430908b784a36d5f2e78c16a0a39c811d65b7d21eba03aa2387635559075eab2
3
  size 4920