BertilBraun
committed on
Commit
•
f4e0887
1
Parent(s):
88ebdf9
Add files using upload-large-folder tool
Browse files
This view is limited to 50 files because it contains too many changes.
See raw diff
- config.json +4 -2
- generation_config.json +1 -1
- model-00001-of-00048.safetensors +3 -0
- model-00002-of-00048.safetensors +3 -0
- model-00003-of-00048.safetensors +3 -0
- model-00004-of-00048.safetensors +3 -0
- model-00005-of-00048.safetensors +3 -0
- model-00006-of-00048.safetensors +3 -0
- model-00007-of-00048.safetensors +3 -0
- model-00008-of-00048.safetensors +3 -0
- model-00009-of-00048.safetensors +3 -0
- model-00010-of-00048.safetensors +3 -0
- model-00011-of-00048.safetensors +3 -0
- model-00012-of-00048.safetensors +3 -0
- model-00013-of-00048.safetensors +3 -0
- model-00014-of-00048.safetensors +3 -0
- model-00015-of-00048.safetensors +3 -0
- model-00016-of-00048.safetensors +3 -0
- model-00017-of-00048.safetensors +3 -0
- model-00018-of-00048.safetensors +3 -0
- model-00019-of-00048.safetensors +3 -0
- model-00020-of-00048.safetensors +3 -0
- model-00021-of-00048.safetensors +3 -0
- model-00022-of-00048.safetensors +3 -0
- model-00023-of-00048.safetensors +3 -0
- model-00024-of-00048.safetensors +3 -0
- model-00025-of-00048.safetensors +3 -0
- model-00026-of-00048.safetensors +3 -0
- model-00027-of-00048.safetensors +3 -0
- model-00028-of-00048.safetensors +3 -0
- model-00029-of-00048.safetensors +3 -0
- model-00030-of-00048.safetensors +3 -0
- model-00031-of-00048.safetensors +3 -0
- model-00032-of-00048.safetensors +3 -0
- model-00033-of-00048.safetensors +3 -0
- model-00034-of-00048.safetensors +3 -0
- model-00035-of-00048.safetensors +3 -0
- model-00036-of-00048.safetensors +3 -0
- model-00037-of-00048.safetensors +3 -0
- model-00038-of-00048.safetensors +3 -0
- model-00039-of-00048.safetensors +3 -0
- model-00040-of-00048.safetensors +3 -0
- model-00041-of-00048.safetensors +3 -0
- model-00042-of-00048.safetensors +3 -0
- model-00043-of-00048.safetensors +3 -0
- model-00044-of-00048.safetensors +3 -0
- model-00045-of-00048.safetensors +3 -0
- model-00046-of-00048.safetensors +3 -0
- model-00047-of-00048.safetensors +3 -0
- model-00048-of-00048.safetensors +3 -0
config.json
CHANGED
@@ -1,4 +1,5 @@
|
|
1 |
{
|
|
|
2 |
"architectures": [
|
3 |
"MixtralForCausalLM"
|
4 |
],
|
@@ -20,10 +21,11 @@
|
|
20 |
"rms_norm_eps": 1e-05,
|
21 |
"rope_theta": 1000000.0,
|
22 |
"router_aux_loss_coef": 0.02,
|
|
|
23 |
"sliding_window": null,
|
24 |
"tie_word_embeddings": false,
|
25 |
-
"torch_dtype": "
|
26 |
-
"transformers_version": "4.
|
27 |
"use_cache": true,
|
28 |
"vocab_size": 32000
|
29 |
}
|
|
|
1 |
{
|
2 |
+
"_name_or_path": "./dpo_output/current-finetuned-model_run_3",
|
3 |
"architectures": [
|
4 |
"MixtralForCausalLM"
|
5 |
],
|
|
|
21 |
"rms_norm_eps": 1e-05,
|
22 |
"rope_theta": 1000000.0,
|
23 |
"router_aux_loss_coef": 0.02,
|
24 |
+
"router_jitter_noise": 0.0,
|
25 |
"sliding_window": null,
|
26 |
"tie_word_embeddings": false,
|
27 |
+
"torch_dtype": "float16",
|
28 |
+
"transformers_version": "4.46.3",
|
29 |
"use_cache": true,
|
30 |
"vocab_size": 32000
|
31 |
}
|
generation_config.json
CHANGED
@@ -2,5 +2,5 @@
|
|
2 |
"_from_model_config": true,
|
3 |
"bos_token_id": 1,
|
4 |
"eos_token_id": 2,
|
5 |
-
"transformers_version": "4.
|
6 |
}
|
|
|
2 |
"_from_model_config": true,
|
3 |
"bos_token_id": 1,
|
4 |
"eos_token_id": 2,
|
5 |
+
"transformers_version": "4.46.3"
|
6 |
}
|
model-00001-of-00048.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:feb719023821e172fe77931fc3c2cf9b45095586f710543bef1d6040f8cd82a8
|
3 |
+
size 1990265312
|
model-00002-of-00048.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:adf296b59faf4d0c8e53889dac0f98fc3e3ed3bb44f3aca8da58a525c60fb189
|
3 |
+
size 1963019104
|
model-00003-of-00048.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bf1802a3f1400ec3d64488d527351e0444bd9c9615de15cb3bfeb58f78eeee92
|
3 |
+
size 1996490936
|
model-00004-of-00048.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1d3383358b4cf5552251b7f36ce97c21b4dc72e89a9d1b94398916760b7589f6
|
3 |
+
size 1963019096
|
model-00005-of-00048.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4b440f206c570fe9c434fcd1dbbc31975e639a98f69b5ce10b76855169cbc6bd
|
3 |
+
size 1963019104
|
model-00006-of-00048.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ef7cf8f6a0494b176293389f2041d0dc16660836695deb37a70512f05e12aed1
|
3 |
+
size 1996507544
|
model-00007-of-00048.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:08030cbdabadd9dd3db16b84d128156e1c6c2a7ed8157a6e80daca5a0ffdbdcb
|
3 |
+
size 1963002488
|
model-00008-of-00048.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:68eba6958bb48316665ae46e13c2b5337655fef2d1a82dd18a22c905535e0d79
|
3 |
+
size 1963019096
|
model-00009-of-00048.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ae6441dbba66cfaaae74a5a9e477bde8c640b9268bbf36ccaf0221514c2774b4
|
3 |
+
size 1963019104
|
model-00010-of-00048.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b1f833617ca3e05135417bc8af1d4e1e9a5a207019d5e158a9235c5a41fbe378
|
3 |
+
size 1996490936
|
model-00011-of-00048.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f380dd48f7a66fef422c6985dd7b0bd4d5e63234a02d01b6f3ca7ee12fc478f0
|
3 |
+
size 1963019096
|
model-00012-of-00048.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:78b77ee8f2ab77e2d47378cc4508c3a229e4f3ddb6598c2d525797ec20512511
|
3 |
+
size 1963019104
|
model-00013-of-00048.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:61d67a054422175d293380fa978f9db5a2f49c8e8461bceb74623f6de6f9b577
|
3 |
+
size 1996490936
|
model-00014-of-00048.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:149decbaca6bdac9b3abe75423e6380856d2035acc212117fd2bfb464acbfa28
|
3 |
+
size 1963019096
|
model-00015-of-00048.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:11c287782276e608952c91b71f1830da3d2cef08234a313fafc871b8535fb842
|
3 |
+
size 1963019104
|
model-00016-of-00048.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:840813c1f23cd529cfa8e39ebd1bbf5578964fb853f280f7c477d7f911b31ff7
|
3 |
+
size 1996490952
|
model-00017-of-00048.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fc6249a4fc240f53b7f3c2dfc3a863a6e002c8a73e9472895f2b79b9762cf113
|
3 |
+
size 1963019120
|
model-00018-of-00048.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d0afe4c3afc0e274c55bd50a9dd06e732e26251f6617fd399a998f975ca7ee53
|
3 |
+
size 1963019128
|
model-00019-of-00048.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:78065d429d815fa8dc871ee9c490a5634364be643b3624c514c857eb4c1a8142
|
3 |
+
size 1996490952
|
model-00020-of-00048.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:aaa34e072e18bbd2592740805a60c148f359fb26b02f7c88514bdeeac5827485
|
3 |
+
size 1963019120
|
model-00021-of-00048.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0dff03ddd8698feaac0786457efe5a1a398d25d8e468562a5235f07181ca33fc
|
3 |
+
size 1963019128
|
model-00022-of-00048.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bc5a604692d778e25302999640d1feebb2877d2518124203bb4c5ee88e0d5ca4
|
3 |
+
size 1996490952
|
model-00023-of-00048.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:378fd4aab0ef8bee4cc5819c6c330b03a485b01b77b80f3300f1cee447ce2371
|
3 |
+
size 1963019120
|
model-00024-of-00048.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:af576db4d79f04350b35b488d2ceddf82df9137c233ca9f78a0af42c93f03477
|
3 |
+
size 1963019128
|
model-00025-of-00048.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eb4da379a85458e81ae2802ab200b76c5b0a1449f49eba55aeb9c92dcec26b69
|
3 |
+
size 1996490952
|
model-00026-of-00048.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3979feb295e71e8d90b89954e6786630541d9c3ec307eb0fa34f00b2515e40fa
|
3 |
+
size 1963019120
|
model-00027-of-00048.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ed12b8f97e3966ea33b24aab33ad1a6112fcbe8679d727bcac7646a302a2bd85
|
3 |
+
size 1963019128
|
model-00028-of-00048.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2b2f104de711c7453ec15304c2dc33b13cd1835fca1106387a5c5c182b0e18cd
|
3 |
+
size 1996490952
|
model-00029-of-00048.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e758ddda5761052e3c23990d735f7fe62f7fd18d27a8c4d3aefdf7a7817e3ecf
|
3 |
+
size 1963019120
|
model-00030-of-00048.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a2068d388dedf90847ffaae7ae84f0cbd5eedd4145b7ad13200f764b6930e22c
|
3 |
+
size 1963019128
|
model-00031-of-00048.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f7d351d77228974c8c1c59219f0de34c1031b245a17aa2753d01a185b7dfe122
|
3 |
+
size 1996507568
|
model-00032-of-00048.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:32ddec6457bab7746960298f03951982b29a928c9325eeaf2524a0718c6ba823
|
3 |
+
size 1963002512
|
model-00033-of-00048.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2bd5782125a0aa13c7537e643b4f147e3cac8238e97e0bdae2a88ca38b4c9a99
|
3 |
+
size 1963019120
|
model-00034-of-00048.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eb7acf34db7ac038304541d117653749098c8d5a7c6ff8a40b047913e1103e00
|
3 |
+
size 1963019128
|
model-00035-of-00048.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e5e14c1a6d8d9ad4aaeac31624f8578c6ecd921051346452113add32acb03202
|
3 |
+
size 1996490952
|
model-00036-of-00048.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:55f3dca68d64588e82543a930ccd4b2e429ea14bccf84ba37875edbe8a9f747c
|
3 |
+
size 1963019120
|
model-00037-of-00048.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8b2a79efc9bf145d7d773936ab0903f8825e66296773810fb93b0f1ce259c619
|
3 |
+
size 1963019128
|
model-00038-of-00048.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:106ac8363e050ceb404e5b1b952c5f3f5ef301d5e1dcaeea6a6e2a665949c5ff
|
3 |
+
size 1996490952
|
model-00039-of-00048.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a7960ee2cc2aac5ae348dfe3e0a87e6870daf00064d8edaa841e1481821742d6
|
3 |
+
size 1963019120
|
model-00040-of-00048.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f882c4f02a50586501a81f02ef883980faa3cffc9350854264347e81611b6930
|
3 |
+
size 1963019128
|
model-00041-of-00048.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3947e4d3f5fdca6fec49912a79d4974a1e3ebcee2e25f4432b72ba9af5eeb723
|
3 |
+
size 1996490952
|
model-00042-of-00048.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1991f6bc563c64355da98abdd06293786ffb55f876295b8b8047f741704edc5a
|
3 |
+
size 1963019120
|
model-00043-of-00048.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dfdb65c494099290f33359bd3cb5d3738e897e6bbfc5ea729dfe60657bafe312
|
3 |
+
size 1963019128
|
model-00044-of-00048.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0797690eb32e46142981dcbd2e7cc846fe2cca05ab550ac11288c0f0881112dc
|
3 |
+
size 1996490952
|
model-00045-of-00048.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a1b31016919d9401a2ec85f046cd3fb5d53de1cc4d68580c95f1690eb9a5a9f9
|
3 |
+
size 1963019120
|
model-00046-of-00048.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4813f2708f504871068afb86dbc0287815c8fff7fab7350df27a7842e465b83e
|
3 |
+
size 1963019128
|
model-00047-of-00048.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7aa7a53968446315499f5b39a49535fd3a4c56c9e371544e227c32ef29ac85e0
|
3 |
+
size 1996490952
|
model-00048-of-00048.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2cf655b1361dd6bd5e750871412a209b72574e062874dc9c2488812d97b4996b
|
3 |
+
size 614490944
|