Training in progress, step 15000
Browse files- pytorch_model.bin +1 -1
- run.sh +3 -3
- runs/Dec21_22-27-22_129-146-176-120/events.out.tfevents.1671661870.129-146-176-120.616427.0 +2 -2
- runs/Dec22_06-11-35_129-146-176-120/1671689582.9981418/events.out.tfevents.1671689582.129-146-176-120.775071.1 +3 -0
- runs/Dec22_06-11-35_129-146-176-120/events.out.tfevents.1671689582.129-146-176-120.775071.0 +3 -0
- runs/Dec22_06-58-44_129-146-176-120/1671692370.2030654/events.out.tfevents.1671692370.129-146-176-120.826490.1 +3 -0
- runs/Dec22_06-58-44_129-146-176-120/events.out.tfevents.1671692370.129-146-176-120.826490.0 +3 -0
- runs/Dec22_07-02-49_129-146-176-120/1671692614.2405128/events.out.tfevents.1671692614.129-146-176-120.826955.1 +3 -0
- runs/Dec22_07-02-49_129-146-176-120/events.out.tfevents.1671692614.129-146-176-120.826955.0 +3 -0
- runs/Dec22_07-05-04_129-146-176-120/1671692749.9612415/events.out.tfevents.1671692749.129-146-176-120.827414.1 +3 -0
- runs/Dec22_07-05-04_129-146-176-120/events.out.tfevents.1671692749.129-146-176-120.827414.0 +3 -0
- runs/Dec22_07-07-18_129-146-176-120/1671692884.170788/events.out.tfevents.1671692884.129-146-176-120.827873.1 +3 -0
- runs/Dec22_07-07-18_129-146-176-120/events.out.tfevents.1671692884.129-146-176-120.827873.0 +3 -0
- runs/Dec22_08-12-29_129-146-176-120/1671696794.6124642/events.out.tfevents.1671696794.129-146-176-120.828902.1 +3 -0
- runs/Dec22_08-12-29_129-146-176-120/events.out.tfevents.1671696794.129-146-176-120.828902.0 +3 -0
- runs/Dec22_09-17-56_129-146-176-120/1671700721.673172/events.out.tfevents.1671700721.129-146-176-120.829664.1 +3 -0
- runs/Dec22_09-17-56_129-146-176-120/events.out.tfevents.1671700721.129-146-176-120.829664.0 +3 -0
- runs/Dec22_09-26-01_129-146-176-120/1671701207.1388845/events.out.tfevents.1671701207.129-146-176-120.830076.1 +3 -0
- runs/Dec22_09-26-01_129-146-176-120/events.out.tfevents.1671701207.129-146-176-120.830076.0 +3 -0
- runs/Dec22_09-29-04_129-146-176-120/1671701389.1176353/events.out.tfevents.1671701389.129-146-176-120.830415.1 +3 -0
- runs/Dec22_09-29-04_129-146-176-120/events.out.tfevents.1671701389.129-146-176-120.830415.0 +3 -0
- runs/Dec22_09-38-38_129-146-176-120/1671701963.8771524/events.out.tfevents.1671701963.129-146-176-120.830862.1 +3 -0
- runs/Dec22_09-38-38_129-146-176-120/events.out.tfevents.1671701963.129-146-176-120.830862.0 +3 -0
- training_args.bin +1 -1
pytorch_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1527847357
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:11b46df1204e6ed7e2611f82da57e36dc37a49141c8dfb83cfe31274015e076d
|
3 |
size 1527847357
|
run.sh
CHANGED
@@ -10,13 +10,13 @@ deepspeed run-ba.py \
|
|
10 |
--text_column_name="sentence" \
|
11 |
--streaming="False" \
|
12 |
--ignore_data_skip \
|
13 |
-
--resume_from_checkpoint="checkpoint-
|
14 |
--torch_compile="True" \
|
15 |
--torch_compile_mode="reduce-overhead" \
|
16 |
--torch_compile_mode="max-autotune" \
|
17 |
--logging_steps="25" \
|
18 |
-
--learning_rate="4e-
|
19 |
-
--max_steps="
|
20 |
--output_dir="./" \
|
21 |
--per_device_train_batch_size="32" \
|
22 |
--gradient_accumulation_steps="1" \
|
|
|
10 |
--text_column_name="sentence" \
|
11 |
--streaming="False" \
|
12 |
--ignore_data_skip \
|
13 |
+
--resume_from_checkpoint="checkpoint-14000" \
|
14 |
--torch_compile="True" \
|
15 |
--torch_compile_mode="reduce-overhead" \
|
16 |
--torch_compile_mode="max-autotune" \
|
17 |
--logging_steps="25" \
|
18 |
+
--learning_rate="4e-4" \
|
19 |
+
--max_steps="20000" \
|
20 |
--output_dir="./" \
|
21 |
--per_device_train_batch_size="32" \
|
22 |
--gradient_accumulation_steps="1" \
|
runs/Dec21_22-27-22_129-146-176-120/events.out.tfevents.1671661870.129-146-176-120.616427.0
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8bf2c23ac80e4b740e1c73703bc74001295951a0ad404a8f08aee84114a48e27
|
3 |
+
size 51287
|
runs/Dec22_06-11-35_129-146-176-120/1671689582.9981418/events.out.tfevents.1671689582.129-146-176-120.775071.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b46fdeaa8667912d519a62c12d25bbaf662a42fe2d7b64d9bae69e8fa7f96902
|
3 |
+
size 5905
|
runs/Dec22_06-11-35_129-146-176-120/events.out.tfevents.1671689582.129-146-176-120.775071.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d9a854dbf6e4b110405c24ef8069605b8428407133f65d8da7cdd29b8c78dd35
|
3 |
+
size 4671
|
runs/Dec22_06-58-44_129-146-176-120/1671692370.2030654/events.out.tfevents.1671692370.129-146-176-120.826490.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6b75977e9772e7049d5bfe7d4bb5e5a3719c6273ea3daa0356b309ef416458d1
|
3 |
+
size 5905
|
runs/Dec22_06-58-44_129-146-176-120/events.out.tfevents.1671692370.129-146-176-120.826490.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:05605ce3aea8ac9c192f3b465ec242b16977ed414786f253d7c2d40d22f093f4
|
3 |
+
size 4671
|
runs/Dec22_07-02-49_129-146-176-120/1671692614.2405128/events.out.tfevents.1671692614.129-146-176-120.826955.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:70eeba88d6c85a10c4cb45ee98986eb608ab9a5883fbdaa3d52c0fc9a4dccbb4
|
3 |
+
size 5905
|
runs/Dec22_07-02-49_129-146-176-120/events.out.tfevents.1671692614.129-146-176-120.826955.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cbc60c9441471a2dee005083763b749e2e9bf1396a5d033f8e17761718225283
|
3 |
+
size 4671
|
runs/Dec22_07-05-04_129-146-176-120/1671692749.9612415/events.out.tfevents.1671692749.129-146-176-120.827414.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:97f3c41c43be9a6a3e443df7812f410a434ff0ef1713348c4fb6a2688717ffe9
|
3 |
+
size 5905
|
runs/Dec22_07-05-04_129-146-176-120/events.out.tfevents.1671692749.129-146-176-120.827414.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:738ab73862f7920333d141bf63bcfcb0a52409bfdbd729c65aced2f21c829b06
|
3 |
+
size 4671
|
runs/Dec22_07-07-18_129-146-176-120/1671692884.170788/events.out.tfevents.1671692884.129-146-176-120.827873.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:188827be8dec1819fcf02481df9daae889824c5d74da2d45274e9f343a62ec02
|
3 |
+
size 5905
|
runs/Dec22_07-07-18_129-146-176-120/events.out.tfevents.1671692884.129-146-176-120.827873.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:33159ffa7ec21a13af5c35a040f290248978fcaf300e15fb28be2273bea117a5
|
3 |
+
size 10915
|
runs/Dec22_08-12-29_129-146-176-120/1671696794.6124642/events.out.tfevents.1671696794.129-146-176-120.828902.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a612e4e0e76ccafd42265f9f53a9407805286ab74b74df7c88dba064aa9c05f2
|
3 |
+
size 5905
|
runs/Dec22_08-12-29_129-146-176-120/events.out.tfevents.1671696794.129-146-176-120.828902.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0bafdcafb9cae6b86c5f7b4b08c7907a32454d50adfc3d5762b7840f6454da26
|
3 |
+
size 10915
|
runs/Dec22_09-17-56_129-146-176-120/1671700721.673172/events.out.tfevents.1671700721.129-146-176-120.829664.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:371925d8c2877b34b7d200ec6799685d87e1f34f3e6042ceeda0393c45e5e544
|
3 |
+
size 5905
|
runs/Dec22_09-17-56_129-146-176-120/events.out.tfevents.1671700721.129-146-176-120.829664.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:591b71eac48f694a2fb9abb2c3ad07d05ce2648de7346935612428744a70dacc
|
3 |
+
size 4945
|
runs/Dec22_09-26-01_129-146-176-120/1671701207.1388845/events.out.tfevents.1671701207.129-146-176-120.830076.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e59324d351898a5e9f6e94e54f3a65717e507f467ac2029423bbec6457d97182
|
3 |
+
size 5905
|
runs/Dec22_09-26-01_129-146-176-120/events.out.tfevents.1671701207.129-146-176-120.830076.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:29950247afa1c3fdeec4bd4c0f2b2a36c0b7de97cbcd4eadad209fbc204de6fd
|
3 |
+
size 4474
|
runs/Dec22_09-29-04_129-146-176-120/1671701389.1176353/events.out.tfevents.1671701389.129-146-176-120.830415.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b1cf8be8e6be807ec11501c10f04c8d688b182288a74250c106bbab9ff07a0ef
|
3 |
+
size 5905
|
runs/Dec22_09-29-04_129-146-176-120/events.out.tfevents.1671701389.129-146-176-120.830415.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d79eba07a6ecf643eb3e1347942d3587f775561e20e756229f2cfbc94fa22f8a
|
3 |
+
size 5103
|
runs/Dec22_09-38-38_129-146-176-120/1671701963.8771524/events.out.tfevents.1671701963.129-146-176-120.830862.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b57149c522acd45cd06ed7fee002cbff84dc9a68ddcbc869141b5a84562b649b
|
3 |
+
size 5905
|
runs/Dec22_09-38-38_129-146-176-120/events.out.tfevents.1671701963.129-146-176-120.830862.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e6d49c46f27d592545ad76f9a1b6d70e165d659f5d29779ccb161185ff88b843
|
3 |
+
size 10916
|
training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4795
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e6e3ac4aeab20cf895e188b7a0ae60077219ad0067d587dfa1da35e123e14fa0
|
3 |
size 4795
|