BertilBraun committed on
Commit
f4e0887
1 Parent(s): 88ebdf9

Add files using upload-large-folder tool

Browse files
This view is limited to 50 files because it contains too many changes. See raw diff
Files changed (50) hide show
  1. config.json +4 -2
  2. generation_config.json +1 -1
  3. model-00001-of-00048.safetensors +3 -0
  4. model-00002-of-00048.safetensors +3 -0
  5. model-00003-of-00048.safetensors +3 -0
  6. model-00004-of-00048.safetensors +3 -0
  7. model-00005-of-00048.safetensors +3 -0
  8. model-00006-of-00048.safetensors +3 -0
  9. model-00007-of-00048.safetensors +3 -0
  10. model-00008-of-00048.safetensors +3 -0
  11. model-00009-of-00048.safetensors +3 -0
  12. model-00010-of-00048.safetensors +3 -0
  13. model-00011-of-00048.safetensors +3 -0
  14. model-00012-of-00048.safetensors +3 -0
  15. model-00013-of-00048.safetensors +3 -0
  16. model-00014-of-00048.safetensors +3 -0
  17. model-00015-of-00048.safetensors +3 -0
  18. model-00016-of-00048.safetensors +3 -0
  19. model-00017-of-00048.safetensors +3 -0
  20. model-00018-of-00048.safetensors +3 -0
  21. model-00019-of-00048.safetensors +3 -0
  22. model-00020-of-00048.safetensors +3 -0
  23. model-00021-of-00048.safetensors +3 -0
  24. model-00022-of-00048.safetensors +3 -0
  25. model-00023-of-00048.safetensors +3 -0
  26. model-00024-of-00048.safetensors +3 -0
  27. model-00025-of-00048.safetensors +3 -0
  28. model-00026-of-00048.safetensors +3 -0
  29. model-00027-of-00048.safetensors +3 -0
  30. model-00028-of-00048.safetensors +3 -0
  31. model-00029-of-00048.safetensors +3 -0
  32. model-00030-of-00048.safetensors +3 -0
  33. model-00031-of-00048.safetensors +3 -0
  34. model-00032-of-00048.safetensors +3 -0
  35. model-00033-of-00048.safetensors +3 -0
  36. model-00034-of-00048.safetensors +3 -0
  37. model-00035-of-00048.safetensors +3 -0
  38. model-00036-of-00048.safetensors +3 -0
  39. model-00037-of-00048.safetensors +3 -0
  40. model-00038-of-00048.safetensors +3 -0
  41. model-00039-of-00048.safetensors +3 -0
  42. model-00040-of-00048.safetensors +3 -0
  43. model-00041-of-00048.safetensors +3 -0
  44. model-00042-of-00048.safetensors +3 -0
  45. model-00043-of-00048.safetensors +3 -0
  46. model-00044-of-00048.safetensors +3 -0
  47. model-00045-of-00048.safetensors +3 -0
  48. model-00046-of-00048.safetensors +3 -0
  49. model-00047-of-00048.safetensors +3 -0
  50. model-00048-of-00048.safetensors +3 -0
config.json CHANGED
@@ -1,4 +1,5 @@
1
  {
 
2
  "architectures": [
3
  "MixtralForCausalLM"
4
  ],
@@ -20,10 +21,11 @@
20
  "rms_norm_eps": 1e-05,
21
  "rope_theta": 1000000.0,
22
  "router_aux_loss_coef": 0.02,
 
23
  "sliding_window": null,
24
  "tie_word_embeddings": false,
25
- "torch_dtype": "bfloat16",
26
- "transformers_version": "4.36.0.dev0",
27
  "use_cache": true,
28
  "vocab_size": 32000
29
  }
 
1
  {
2
+ "_name_or_path": "./dpo_output/current-finetuned-model_run_3",
3
  "architectures": [
4
  "MixtralForCausalLM"
5
  ],
 
21
  "rms_norm_eps": 1e-05,
22
  "rope_theta": 1000000.0,
23
  "router_aux_loss_coef": 0.02,
24
+ "router_jitter_noise": 0.0,
25
  "sliding_window": null,
26
  "tie_word_embeddings": false,
27
+ "torch_dtype": "float16",
28
+ "transformers_version": "4.46.3",
29
  "use_cache": true,
30
  "vocab_size": 32000
31
  }
generation_config.json CHANGED
@@ -2,5 +2,5 @@
2
  "_from_model_config": true,
3
  "bos_token_id": 1,
4
  "eos_token_id": 2,
5
- "transformers_version": "4.36.0.dev0"
6
  }
 
2
  "_from_model_config": true,
3
  "bos_token_id": 1,
4
  "eos_token_id": 2,
5
+ "transformers_version": "4.46.3"
6
  }
model-00001-of-00048.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:feb719023821e172fe77931fc3c2cf9b45095586f710543bef1d6040f8cd82a8
3
+ size 1990265312
model-00002-of-00048.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:adf296b59faf4d0c8e53889dac0f98fc3e3ed3bb44f3aca8da58a525c60fb189
3
+ size 1963019104
model-00003-of-00048.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bf1802a3f1400ec3d64488d527351e0444bd9c9615de15cb3bfeb58f78eeee92
3
+ size 1996490936
model-00004-of-00048.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1d3383358b4cf5552251b7f36ce97c21b4dc72e89a9d1b94398916760b7589f6
3
+ size 1963019096
model-00005-of-00048.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4b440f206c570fe9c434fcd1dbbc31975e639a98f69b5ce10b76855169cbc6bd
3
+ size 1963019104
model-00006-of-00048.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ef7cf8f6a0494b176293389f2041d0dc16660836695deb37a70512f05e12aed1
3
+ size 1996507544
model-00007-of-00048.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:08030cbdabadd9dd3db16b84d128156e1c6c2a7ed8157a6e80daca5a0ffdbdcb
3
+ size 1963002488
model-00008-of-00048.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:68eba6958bb48316665ae46e13c2b5337655fef2d1a82dd18a22c905535e0d79
3
+ size 1963019096
model-00009-of-00048.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ae6441dbba66cfaaae74a5a9e477bde8c640b9268bbf36ccaf0221514c2774b4
3
+ size 1963019104
model-00010-of-00048.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b1f833617ca3e05135417bc8af1d4e1e9a5a207019d5e158a9235c5a41fbe378
3
+ size 1996490936
model-00011-of-00048.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f380dd48f7a66fef422c6985dd7b0bd4d5e63234a02d01b6f3ca7ee12fc478f0
3
+ size 1963019096
model-00012-of-00048.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:78b77ee8f2ab77e2d47378cc4508c3a229e4f3ddb6598c2d525797ec20512511
3
+ size 1963019104
model-00013-of-00048.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:61d67a054422175d293380fa978f9db5a2f49c8e8461bceb74623f6de6f9b577
3
+ size 1996490936
model-00014-of-00048.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:149decbaca6bdac9b3abe75423e6380856d2035acc212117fd2bfb464acbfa28
3
+ size 1963019096
model-00015-of-00048.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:11c287782276e608952c91b71f1830da3d2cef08234a313fafc871b8535fb842
3
+ size 1963019104
model-00016-of-00048.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:840813c1f23cd529cfa8e39ebd1bbf5578964fb853f280f7c477d7f911b31ff7
3
+ size 1996490952
model-00017-of-00048.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fc6249a4fc240f53b7f3c2dfc3a863a6e002c8a73e9472895f2b79b9762cf113
3
+ size 1963019120
model-00018-of-00048.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d0afe4c3afc0e274c55bd50a9dd06e732e26251f6617fd399a998f975ca7ee53
3
+ size 1963019128
model-00019-of-00048.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:78065d429d815fa8dc871ee9c490a5634364be643b3624c514c857eb4c1a8142
3
+ size 1996490952
model-00020-of-00048.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aaa34e072e18bbd2592740805a60c148f359fb26b02f7c88514bdeeac5827485
3
+ size 1963019120
model-00021-of-00048.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0dff03ddd8698feaac0786457efe5a1a398d25d8e468562a5235f07181ca33fc
3
+ size 1963019128
model-00022-of-00048.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bc5a604692d778e25302999640d1feebb2877d2518124203bb4c5ee88e0d5ca4
3
+ size 1996490952
model-00023-of-00048.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:378fd4aab0ef8bee4cc5819c6c330b03a485b01b77b80f3300f1cee447ce2371
3
+ size 1963019120
model-00024-of-00048.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:af576db4d79f04350b35b488d2ceddf82df9137c233ca9f78a0af42c93f03477
3
+ size 1963019128
model-00025-of-00048.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eb4da379a85458e81ae2802ab200b76c5b0a1449f49eba55aeb9c92dcec26b69
3
+ size 1996490952
model-00026-of-00048.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3979feb295e71e8d90b89954e6786630541d9c3ec307eb0fa34f00b2515e40fa
3
+ size 1963019120
model-00027-of-00048.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ed12b8f97e3966ea33b24aab33ad1a6112fcbe8679d727bcac7646a302a2bd85
3
+ size 1963019128
model-00028-of-00048.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2b2f104de711c7453ec15304c2dc33b13cd1835fca1106387a5c5c182b0e18cd
3
+ size 1996490952
model-00029-of-00048.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e758ddda5761052e3c23990d735f7fe62f7fd18d27a8c4d3aefdf7a7817e3ecf
3
+ size 1963019120
model-00030-of-00048.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a2068d388dedf90847ffaae7ae84f0cbd5eedd4145b7ad13200f764b6930e22c
3
+ size 1963019128
model-00031-of-00048.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f7d351d77228974c8c1c59219f0de34c1031b245a17aa2753d01a185b7dfe122
3
+ size 1996507568
model-00032-of-00048.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:32ddec6457bab7746960298f03951982b29a928c9325eeaf2524a0718c6ba823
3
+ size 1963002512
model-00033-of-00048.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2bd5782125a0aa13c7537e643b4f147e3cac8238e97e0bdae2a88ca38b4c9a99
3
+ size 1963019120
model-00034-of-00048.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eb7acf34db7ac038304541d117653749098c8d5a7c6ff8a40b047913e1103e00
3
+ size 1963019128
model-00035-of-00048.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e5e14c1a6d8d9ad4aaeac31624f8578c6ecd921051346452113add32acb03202
3
+ size 1996490952
model-00036-of-00048.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:55f3dca68d64588e82543a930ccd4b2e429ea14bccf84ba37875edbe8a9f747c
3
+ size 1963019120
model-00037-of-00048.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8b2a79efc9bf145d7d773936ab0903f8825e66296773810fb93b0f1ce259c619
3
+ size 1963019128
model-00038-of-00048.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:106ac8363e050ceb404e5b1b952c5f3f5ef301d5e1dcaeea6a6e2a665949c5ff
3
+ size 1996490952
model-00039-of-00048.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a7960ee2cc2aac5ae348dfe3e0a87e6870daf00064d8edaa841e1481821742d6
3
+ size 1963019120
model-00040-of-00048.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f882c4f02a50586501a81f02ef883980faa3cffc9350854264347e81611b6930
3
+ size 1963019128
model-00041-of-00048.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3947e4d3f5fdca6fec49912a79d4974a1e3ebcee2e25f4432b72ba9af5eeb723
3
+ size 1996490952
model-00042-of-00048.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1991f6bc563c64355da98abdd06293786ffb55f876295b8b8047f741704edc5a
3
+ size 1963019120
model-00043-of-00048.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dfdb65c494099290f33359bd3cb5d3738e897e6bbfc5ea729dfe60657bafe312
3
+ size 1963019128
model-00044-of-00048.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0797690eb32e46142981dcbd2e7cc846fe2cca05ab550ac11288c0f0881112dc
3
+ size 1996490952
model-00045-of-00048.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a1b31016919d9401a2ec85f046cd3fb5d53de1cc4d68580c95f1690eb9a5a9f9
3
+ size 1963019120
model-00046-of-00048.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4813f2708f504871068afb86dbc0287815c8fff7fab7350df27a7842e465b83e
3
+ size 1963019128
model-00047-of-00048.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7aa7a53968446315499f5b39a49535fd3a4c56c9e371544e227c32ef29ac85e0
3
+ size 1996490952
model-00048-of-00048.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2cf655b1361dd6bd5e750871412a209b72574e062874dc9c2488812d97b4996b
3
+ size 614490944