Add files using upload-large-folder tool
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +17 -0
- checkpoints/Qwen2.5-14B/babylm_hop_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/7250708a789da850ff40a4a5be335971dfa0d2bd7cba2e9905916dab06744d75 +3 -0
- checkpoints/Qwen2.5-14B/babylm_hop_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/c2754167c1cbaf94b9af9c7eb646a2286a596f9ded5e2e3c4c5e6a4464352c9e +3 -0
- checkpoints/Qwen2.5-14B/babylm_hop_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00003-of-00008.safetensors +3 -0
- checkpoints/Qwen2.5-14B/babylm_hop_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00004-of-00008.safetensors +3 -0
- checkpoints/Qwen2.5-14B/babylm_hop_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00006-of-00008.safetensors +3 -0
- checkpoints/Qwen2.5-14B/babylm_hop_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00007-of-00008.safetensors +3 -0
- checkpoints/Qwen2.5-14B/babylm_hop_words4_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/4d870a72c656404ee7524163ba996bf55050fff252dfe639a90715a9e2c47dba +3 -0
- checkpoints/Qwen2.5-14B/babylm_hop_words4_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/68127c9bc4fab170f7aaf63d5c7ac9e182afd10b74a1c6bb8025afefc11447cb +3 -0
- checkpoints/Qwen2.5-14B/babylm_hop_words4_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/7250708a789da850ff40a4a5be335971dfa0d2bd7cba2e9905916dab06744d75 +3 -0
- checkpoints/Qwen2.5-14B/babylm_hop_words4_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/e7efa1adc8257218813dcb494bb2a3d5775fa268735ab39e5b8119e233c21462 +3 -0
- checkpoints/Qwen2.5-14B/babylm_hop_words4_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00002-of-00008.safetensors +3 -0
- checkpoints/Qwen2.5-14B/babylm_hop_words4_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00004-of-00008.safetensors +3 -0
- checkpoints/Qwen2.5-14B/babylm_hop_words4_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00006-of-00008.safetensors +3 -0
- checkpoints/Qwen2.5-14B/babylm_hop_words4_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00007-of-00008.safetensors +3 -0
- checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/4d870a72c656404ee7524163ba996bf55050fff252dfe639a90715a9e2c47dba +3 -0
- checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/68127c9bc4fab170f7aaf63d5c7ac9e182afd10b74a1c6bb8025afefc11447cb +3 -0
- checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/7045cf78c68178b626546982d12b6e9c8e289f1bf1e65c42225ed13e07847180 +3 -0
- checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/7250708a789da850ff40a4a5be335971dfa0d2bd7cba2e9905916dab06744d75 +3 -0
- checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/9b693615965d8548eab4d1dc6bb578aa063e8656e2b9d25125ad5b8c7f59565f +3 -0
- checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/c2754167c1cbaf94b9af9c7eb646a2286a596f9ded5e2e3c4c5e6a4464352c9e +3 -0
- checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/e015e2bc9a26b4e46d77913d8c667608ae7e48aa1eca04af5786c2408f4bc0fa +3 -0
- checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/e7efa1adc8257218813dcb494bb2a3d5775fa268735ab39e5b8119e233c21462 +3 -0
- checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00001-of-00008.safetensors +3 -0
- checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00002-of-00008.safetensors +3 -0
- checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00003-of-00008.safetensors +3 -0
- checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00004-of-00008.safetensors +3 -0
- checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00005-of-00008.safetensors +3 -0
- checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00006-of-00008.safetensors +3 -0
- checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00007-of-00008.safetensors +3 -0
- checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00008-of-00008.safetensors +3 -0
- checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/runs/checkpoint-2072/rng_state_0.pth +3 -0
- checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/runs/checkpoint-2072/rng_state_1.pth +3 -0
- checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/runs/checkpoint-2072/rng_state_2.pth +3 -0
- checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/runs/checkpoint-2072/rng_state_3.pth +3 -0
- checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/runs/checkpoint-2072/scheduler.pt +3 -0
- checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/runs/checkpoint-2072/tokenizer.json +3 -0
- checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/runs/checkpoint-2072/training_args.bin +3 -0
- checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/runs/checkpoint-500/rng_state_0.pth +3 -0
- checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/runs/checkpoint-500/rng_state_1.pth +3 -0
- checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/runs/checkpoint-500/rng_state_2.pth +3 -0
- checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/runs/checkpoint-500/rng_state_3.pth +3 -0
- checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/runs/checkpoint-500/scheduler.pt +3 -0
- checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/runs/checkpoint-500/tokenizer.json +3 -0
- checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/runs/checkpoint-500/training_args.bin +3 -0
- checkpoints/Qwen2.5-14B/babylm_reverse_partial_10M_seed0/runs/checkpoint-500/rng_state_0.pth +3 -0
- checkpoints/Qwen2.5-14B/babylm_reverse_partial_10M_seed0/runs/checkpoint-500/rng_state_1.pth +3 -0
- checkpoints/Qwen2.5-14B/babylm_reverse_partial_10M_seed0/runs/checkpoint-500/rng_state_2.pth +3 -0
- checkpoints/Qwen2.5-14B/babylm_reverse_partial_10M_seed0/runs/checkpoint-500/rng_state_3.pth +3 -0
- checkpoints/Qwen2.5-14B/babylm_reverse_partial_10M_seed0/runs/checkpoint-500/scheduler.pt +3 -0
.gitattributes
CHANGED
@@ -59,3 +59,20 @@ checkpoints/Qwen2.5-14B/babylm_reverse_partial_10M_seed0/artifacts/models--Qwen-
|
|
59 |
checkpoints/Qwen2.5-14B/babylm_hop_words4_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/7045cf78c68178b626546982d12b6e9c8e289f1bf1e65c42225ed13e07847180 filter=lfs diff=lfs merge=lfs -text
|
60 |
checkpoints/Qwen2.5-14B/babylm_reverse_partial_10M_seed0/runs/checkpoint-2072/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
61 |
checkpoints/Qwen2.5-14B/babylm_shuffle_nondeterministic_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/e015e2bc9a26b4e46d77913d8c667608ae7e48aa1eca04af5786c2408f4bc0fa filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
59 |
checkpoints/Qwen2.5-14B/babylm_hop_words4_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/7045cf78c68178b626546982d12b6e9c8e289f1bf1e65c42225ed13e07847180 filter=lfs diff=lfs merge=lfs -text
|
60 |
checkpoints/Qwen2.5-14B/babylm_reverse_partial_10M_seed0/runs/checkpoint-2072/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
61 |
checkpoints/Qwen2.5-14B/babylm_shuffle_nondeterministic_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/e015e2bc9a26b4e46d77913d8c667608ae7e48aa1eca04af5786c2408f4bc0fa filter=lfs diff=lfs merge=lfs -text
|
62 |
+
checkpoints/Qwen2.5-14B/babylm_hop_words4_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/e7efa1adc8257218813dcb494bb2a3d5775fa268735ab39e5b8119e233c21462 filter=lfs diff=lfs merge=lfs -text
|
63 |
+
checkpoints/Qwen2.5-14B/babylm_reverse_partial_10M_seed0/runs/checkpoint-500/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
64 |
+
checkpoints/Qwen2.5-14B/babylm_hop_words4_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/7250708a789da850ff40a4a5be335971dfa0d2bd7cba2e9905916dab06744d75 filter=lfs diff=lfs merge=lfs -text
|
65 |
+
checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/7250708a789da850ff40a4a5be335971dfa0d2bd7cba2e9905916dab06744d75 filter=lfs diff=lfs merge=lfs -text
|
66 |
+
checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/c2754167c1cbaf94b9af9c7eb646a2286a596f9ded5e2e3c4c5e6a4464352c9e filter=lfs diff=lfs merge=lfs -text
|
67 |
+
checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/9b693615965d8548eab4d1dc6bb578aa063e8656e2b9d25125ad5b8c7f59565f filter=lfs diff=lfs merge=lfs -text
|
68 |
+
checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/68127c9bc4fab170f7aaf63d5c7ac9e182afd10b74a1c6bb8025afefc11447cb filter=lfs diff=lfs merge=lfs -text
|
69 |
+
checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/4d870a72c656404ee7524163ba996bf55050fff252dfe639a90715a9e2c47dba filter=lfs diff=lfs merge=lfs -text
|
70 |
+
checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/e7efa1adc8257218813dcb494bb2a3d5775fa268735ab39e5b8119e233c21462 filter=lfs diff=lfs merge=lfs -text
|
71 |
+
checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/7045cf78c68178b626546982d12b6e9c8e289f1bf1e65c42225ed13e07847180 filter=lfs diff=lfs merge=lfs -text
|
72 |
+
checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/e015e2bc9a26b4e46d77913d8c667608ae7e48aa1eca04af5786c2408f4bc0fa filter=lfs diff=lfs merge=lfs -text
|
73 |
+
checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/runs/checkpoint-2072/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
74 |
+
checkpoints/Qwen2.5-14B/babylm_hop_words4_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/68127c9bc4fab170f7aaf63d5c7ac9e182afd10b74a1c6bb8025afefc11447cb filter=lfs diff=lfs merge=lfs -text
|
75 |
+
checkpoints/Qwen2.5-14B/babylm_hop_words4_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/4d870a72c656404ee7524163ba996bf55050fff252dfe639a90715a9e2c47dba filter=lfs diff=lfs merge=lfs -text
|
76 |
+
checkpoints/Qwen2.5-14B/babylm_hop_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/7250708a789da850ff40a4a5be335971dfa0d2bd7cba2e9905916dab06744d75 filter=lfs diff=lfs merge=lfs -text
|
77 |
+
checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/runs/checkpoint-500/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
78 |
+
checkpoints/Qwen2.5-14B/babylm_hop_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/c2754167c1cbaf94b9af9c7eb646a2286a596f9ded5e2e3c4c5e6a4464352c9e filter=lfs diff=lfs merge=lfs -text
|
checkpoints/Qwen2.5-14B/babylm_hop_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/7250708a789da850ff40a4a5be335971dfa0d2bd7cba2e9905916dab06744d75
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7250708a789da850ff40a4a5be335971dfa0d2bd7cba2e9905916dab06744d75
|
3 |
+
size 3995348776
|
checkpoints/Qwen2.5-14B/babylm_hop_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/c2754167c1cbaf94b9af9c7eb646a2286a596f9ded5e2e3c4c5e6a4464352c9e
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c2754167c1cbaf94b9af9c7eb646a2286a596f9ded5e2e3c4c5e6a4464352c9e
|
3 |
+
size 3979614448
|
checkpoints/Qwen2.5-14B/babylm_hop_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00003-of-00008.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:68127c9bc4fab170f7aaf63d5c7ac9e182afd10b74a1c6bb8025afefc11447cb
|
3 |
+
size 3995328064
|
checkpoints/Qwen2.5-14B/babylm_hop_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00004-of-00008.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7250708a789da850ff40a4a5be335971dfa0d2bd7cba2e9905916dab06744d75
|
3 |
+
size 3995348776
|
checkpoints/Qwen2.5-14B/babylm_hop_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00006-of-00008.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7045cf78c68178b626546982d12b6e9c8e289f1bf1e65c42225ed13e07847180
|
3 |
+
size 3995328064
|
checkpoints/Qwen2.5-14B/babylm_hop_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00007-of-00008.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4d870a72c656404ee7524163ba996bf55050fff252dfe639a90715a9e2c47dba
|
3 |
+
size 3995328064
|
checkpoints/Qwen2.5-14B/babylm_hop_words4_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/4d870a72c656404ee7524163ba996bf55050fff252dfe639a90715a9e2c47dba
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4d870a72c656404ee7524163ba996bf55050fff252dfe639a90715a9e2c47dba
|
3 |
+
size 3995328064
|
checkpoints/Qwen2.5-14B/babylm_hop_words4_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/68127c9bc4fab170f7aaf63d5c7ac9e182afd10b74a1c6bb8025afefc11447cb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:68127c9bc4fab170f7aaf63d5c7ac9e182afd10b74a1c6bb8025afefc11447cb
|
3 |
+
size 3995328064
|
checkpoints/Qwen2.5-14B/babylm_hop_words4_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/7250708a789da850ff40a4a5be335971dfa0d2bd7cba2e9905916dab06744d75
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7250708a789da850ff40a4a5be335971dfa0d2bd7cba2e9905916dab06744d75
|
3 |
+
size 3995348776
|
checkpoints/Qwen2.5-14B/babylm_hop_words4_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/e7efa1adc8257218813dcb494bb2a3d5775fa268735ab39e5b8119e233c21462
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e7efa1adc8257218813dcb494bb2a3d5775fa268735ab39e5b8119e233c21462
|
3 |
+
size 3995327992
|
checkpoints/Qwen2.5-14B/babylm_hop_words4_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00002-of-00008.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e7efa1adc8257218813dcb494bb2a3d5775fa268735ab39e5b8119e233c21462
|
3 |
+
size 3995327992
|
checkpoints/Qwen2.5-14B/babylm_hop_words4_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00004-of-00008.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7250708a789da850ff40a4a5be335971dfa0d2bd7cba2e9905916dab06744d75
|
3 |
+
size 3995348776
|
checkpoints/Qwen2.5-14B/babylm_hop_words4_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00006-of-00008.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7045cf78c68178b626546982d12b6e9c8e289f1bf1e65c42225ed13e07847180
|
3 |
+
size 3995328064
|
checkpoints/Qwen2.5-14B/babylm_hop_words4_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00007-of-00008.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4d870a72c656404ee7524163ba996bf55050fff252dfe639a90715a9e2c47dba
|
3 |
+
size 3995328064
|
checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/4d870a72c656404ee7524163ba996bf55050fff252dfe639a90715a9e2c47dba
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4d870a72c656404ee7524163ba996bf55050fff252dfe639a90715a9e2c47dba
|
3 |
+
size 3995328064
|
checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/68127c9bc4fab170f7aaf63d5c7ac9e182afd10b74a1c6bb8025afefc11447cb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:68127c9bc4fab170f7aaf63d5c7ac9e182afd10b74a1c6bb8025afefc11447cb
|
3 |
+
size 3995328064
|
checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/7045cf78c68178b626546982d12b6e9c8e289f1bf1e65c42225ed13e07847180
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7045cf78c68178b626546982d12b6e9c8e289f1bf1e65c42225ed13e07847180
|
3 |
+
size 3995328064
|
checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/7250708a789da850ff40a4a5be335971dfa0d2bd7cba2e9905916dab06744d75
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7250708a789da850ff40a4a5be335971dfa0d2bd7cba2e9905916dab06744d75
|
3 |
+
size 3995348776
|
checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/9b693615965d8548eab4d1dc6bb578aa063e8656e2b9d25125ad5b8c7f59565f
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9b693615965d8548eab4d1dc6bb578aa063e8656e2b9d25125ad5b8c7f59565f
|
3 |
+
size 1698724408
|
checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/c2754167c1cbaf94b9af9c7eb646a2286a596f9ded5e2e3c4c5e6a4464352c9e
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c2754167c1cbaf94b9af9c7eb646a2286a596f9ded5e2e3c4c5e6a4464352c9e
|
3 |
+
size 3979614448
|
checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/e015e2bc9a26b4e46d77913d8c667608ae7e48aa1eca04af5786c2408f4bc0fa
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e015e2bc9a26b4e46d77913d8c667608ae7e48aa1eca04af5786c2408f4bc0fa
|
3 |
+
size 3885134104
|
checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/blobs/e7efa1adc8257218813dcb494bb2a3d5775fa268735ab39e5b8119e233c21462
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e7efa1adc8257218813dcb494bb2a3d5775fa268735ab39e5b8119e233c21462
|
3 |
+
size 3995327992
|
checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00001-of-00008.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e015e2bc9a26b4e46d77913d8c667608ae7e48aa1eca04af5786c2408f4bc0fa
|
3 |
+
size 3885134104
|
checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00002-of-00008.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e7efa1adc8257218813dcb494bb2a3d5775fa268735ab39e5b8119e233c21462
|
3 |
+
size 3995327992
|
checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00003-of-00008.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:68127c9bc4fab170f7aaf63d5c7ac9e182afd10b74a1c6bb8025afefc11447cb
|
3 |
+
size 3995328064
|
checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00004-of-00008.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7250708a789da850ff40a4a5be335971dfa0d2bd7cba2e9905916dab06744d75
|
3 |
+
size 3995348776
|
checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00005-of-00008.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c2754167c1cbaf94b9af9c7eb646a2286a596f9ded5e2e3c4c5e6a4464352c9e
|
3 |
+
size 3979614448
|
checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00006-of-00008.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7045cf78c68178b626546982d12b6e9c8e289f1bf1e65c42225ed13e07847180
|
3 |
+
size 3995328064
|
checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00007-of-00008.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4d870a72c656404ee7524163ba996bf55050fff252dfe639a90715a9e2c47dba
|
3 |
+
size 3995328064
|
checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/artifacts/models--Qwen--Qwen2.5-14B/snapshots/97e1e76335b7017d8f67c08a19d103c0504298c9/model-00008-of-00008.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9b693615965d8548eab4d1dc6bb578aa063e8656e2b9d25125ad5b8c7f59565f
|
3 |
+
size 1698724408
|
checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/runs/checkpoint-2072/rng_state_0.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b6ae0f8c0973bd8f49e7d475791e1334e0204d90696971f9983ce5cb629db508
|
3 |
+
size 14960
|
checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/runs/checkpoint-2072/rng_state_1.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:582deaed4156b10690b3823f0fabd8dc67208eff035e24ae52cd85b9d874bb8a
|
3 |
+
size 14960
|
checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/runs/checkpoint-2072/rng_state_2.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5c0d37a6d8b99cbd89650c46b5f2f132c4da338c68ff6d192f08a6bcefbbceb5
|
3 |
+
size 14960
|
checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/runs/checkpoint-2072/rng_state_3.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fbdf9f0e9aac95e08af74c5bf009639eb93bbb564c71abd5e3aa81adf1c3991b
|
3 |
+
size 14960
|
checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/runs/checkpoint-2072/scheduler.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:99b1826aaba117362f4adfc02c2de0205a70775a4b414256a9c9ffbc64365305
|
3 |
+
size 1064
|
checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/runs/checkpoint-2072/tokenizer.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e2ca92fdd167a7f358c86fad57991c9ab6bb13b300002b33969176bd01e3e516
|
3 |
+
size 11422356
|
checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/runs/checkpoint-2072/training_args.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d7d6815084f9707f1d8d990ce7c2269742cc992d1a36e2e1dceb5b67e6def274
|
3 |
+
size 6520
|
checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/runs/checkpoint-500/rng_state_0.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:31effcc966f4272bd7330ebcde7da65f7dbd70afe27a289d2a31856fbc63f379
|
3 |
+
size 14960
|
checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/runs/checkpoint-500/rng_state_1.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:99672ac4c61aff9b2bca8a9e80f74417b8b0767809c3454f66042d5f904ced7a
|
3 |
+
size 14960
|
checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/runs/checkpoint-500/rng_state_2.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0365624c9f07469b8549f58376cdc199fd538b48405ad51abe3c46cc06f193ea
|
3 |
+
size 14960
|
checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/runs/checkpoint-500/rng_state_3.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d0db9bdc225f9583b93b0affe946bd62f8983aae91455323924cab39bef020b1
|
3 |
+
size 14960
|
checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/runs/checkpoint-500/scheduler.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:add49698959c0d68285301bf9cf3bc2d662d3dfb40309603eebc0e6a0d5f7268
|
3 |
+
size 1064
|
checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/runs/checkpoint-500/tokenizer.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e2ca92fdd167a7f358c86fad57991c9ab6bb13b300002b33969176bd01e3e516
|
3 |
+
size 11422356
|
checkpoints/Qwen2.5-14B/babylm_reverse_control_10M_seed0/runs/checkpoint-500/training_args.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d7d6815084f9707f1d8d990ce7c2269742cc992d1a36e2e1dceb5b67e6def274
|
3 |
+
size 6520
|
checkpoints/Qwen2.5-14B/babylm_reverse_partial_10M_seed0/runs/checkpoint-500/rng_state_0.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:31effcc966f4272bd7330ebcde7da65f7dbd70afe27a289d2a31856fbc63f379
|
3 |
+
size 14960
|
checkpoints/Qwen2.5-14B/babylm_reverse_partial_10M_seed0/runs/checkpoint-500/rng_state_1.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:99672ac4c61aff9b2bca8a9e80f74417b8b0767809c3454f66042d5f904ced7a
|
3 |
+
size 14960
|
checkpoints/Qwen2.5-14B/babylm_reverse_partial_10M_seed0/runs/checkpoint-500/rng_state_2.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0365624c9f07469b8549f58376cdc199fd538b48405ad51abe3c46cc06f193ea
|
3 |
+
size 14960
|
checkpoints/Qwen2.5-14B/babylm_reverse_partial_10M_seed0/runs/checkpoint-500/rng_state_3.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d0db9bdc225f9583b93b0affe946bd62f8983aae91455323924cab39bef020b1
|
3 |
+
size 14960
|
checkpoints/Qwen2.5-14B/babylm_reverse_partial_10M_seed0/runs/checkpoint-500/scheduler.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:add49698959c0d68285301bf9cf3bc2d662d3dfb40309603eebc0e6a0d5f7268
|
3 |
+
size 1064
|