Training in progress, step 15469
Browse files- logs/attn_loss_fn=raw_mse, attn_weight=10.0, hidden_weight=10.0, hs_loss_fn=mse, learning_rate=4e-06/events.out.tfevents.1723755504.93d6cbb3ad53 +3 -0
- logs/attn_loss_fn=raw_mse, attn_weight=10.0, hidden_weight=10.0, hs_loss_fn=raw_mse, learning_rate=4e-06/events.out.tfevents.1723755341.93d6cbb3ad53 +3 -0
- logs/attn_loss_fn=raw_mse, attn_weight=10.0, hs_loss_fn=mse, hs_weight=10.0, learning_rate=4e-06/events.out.tfevents.1723755813.93d6cbb3ad53 +3 -0
- logs/attn_loss_fn=raw_mse, attn_weight=10.0, hs_loss_fn=raw_mse, hs_weight=10.0, learning_rate=4e-06/events.out.tfevents.1723755700.93d6cbb3ad53 +3 -0
- logs/attn_loss_fn=raw_mse, attn_weight=10.0, hs_loss_fn=raw_mse, hs_weight=10.0, learning_rate=4e-06/events.out.tfevents.1723757387.93d6cbb3ad53 +3 -0
- logs/attn_loss_fn=raw_mse, attn_weight=10.0, hs_loss_fn=raw_mse, hs_weight=10.0, learning_rate=4e-06/events.out.tfevents.1723757829.93d6cbb3ad53 +3 -0
- model.safetensors +1 -1
- training_args.bin +1 -1
logs/attn_loss_fn=raw_mse, attn_weight=10.0, hidden_weight=10.0, hs_loss_fn=mse, learning_rate=4e-06/events.out.tfevents.1723755504.93d6cbb3ad53
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1db90503cfb8f702611ece28f8e089b604a453e545114df222ceb7e490669e88
|
3 |
+
size 6097
|
logs/attn_loss_fn=raw_mse, attn_weight=10.0, hidden_weight=10.0, hs_loss_fn=raw_mse, learning_rate=4e-06/events.out.tfevents.1723755341.93d6cbb3ad53
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6021be405ddf1dae998c5e8d6c7719d1d3d08c187cbdd135f475dc2fdafb550f
|
3 |
+
size 6101
|
logs/attn_loss_fn=raw_mse, attn_weight=10.0, hs_loss_fn=mse, hs_weight=10.0, learning_rate=4e-06/events.out.tfevents.1723755813.93d6cbb3ad53
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ae9ea251de631244744922bd37586bcccbceb8c012e2741cce83bd3219bb8825
|
3 |
+
size 6093
|
logs/attn_loss_fn=raw_mse, attn_weight=10.0, hs_loss_fn=raw_mse, hs_weight=10.0, learning_rate=4e-06/events.out.tfevents.1723755700.93d6cbb3ad53
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e312da171a98b3bfccfd712ad10817860d477d495a419c8f5544a35c96fe7872
|
3 |
+
size 6353
|
logs/attn_loss_fn=raw_mse, attn_weight=10.0, hs_loss_fn=raw_mse, hs_weight=10.0, learning_rate=4e-06/events.out.tfevents.1723757387.93d6cbb3ad53
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:efe83617afefffe87ecebeb9326fdebd6b7c68361a182f866eea13e4abc230d7
|
3 |
+
size 6408
|
logs/attn_loss_fn=raw_mse, attn_weight=10.0, hs_loss_fn=raw_mse, hs_weight=10.0, learning_rate=4e-06/events.out.tfevents.1723757829.93d6cbb3ad53
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cc7c3094a2995789dce4f1de23ad556582153b78b9f70ead7864a17b4da68f6f
|
3 |
+
size 4177665
|
model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 137033984
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6a64218e3d2c30d196c07cc994eaf051554a03e0f07ebd8cd8baad5a362b72d2
|
3 |
size 137033984
|
training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1017948104
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8d665b5b0ccf6b5a8d166fee5cb77c0bd9dc46300ff235f1d51f2fbe7828aef5
|
3 |
size 1017948104
|