Trained with Unsloth
Browse files
- config.json +4 -3
- generation_config.json +2 -2
- pytorch_model-00001-of-00004.bin +2 -2
- pytorch_model-00002-of-00004.bin +2 -2
- pytorch_model-00003-of-00004.bin +1 -1
- pytorch_model-00004-of-00004.bin +1 -1
config.json
CHANGED
@@ -1,5 +1,5 @@
|
|
1 |
{
|
2 |
-
"_name_or_path": "unsloth/
|
3 |
"architectures": [
|
4 |
"LlamaForCausalLM"
|
5 |
],
|
@@ -31,8 +31,9 @@
|
|
31 |
"rope_theta": 500000.0,
|
32 |
"tie_word_embeddings": false,
|
33 |
"torch_dtype": "float16",
|
34 |
-
"transformers_version": "4.
|
35 |
-
"
|
|
|
36 |
"use_cache": true,
|
37 |
"vocab_size": 128256
|
38 |
}
|
|
|
1 |
{
|
2 |
+
"_name_or_path": "unsloth/DeepSeek-R1-Distill-Llama-8B-unsloth-bnb-4bit",
|
3 |
"architectures": [
|
4 |
"LlamaForCausalLM"
|
5 |
],
|
|
|
31 |
"rope_theta": 500000.0,
|
32 |
"tie_word_embeddings": false,
|
33 |
"torch_dtype": "float16",
|
34 |
+
"transformers_version": "4.48.3",
|
35 |
+
"unsloth_fixed": true,
|
36 |
+
"unsloth_version": "2025.2.12",
|
37 |
"use_cache": true,
|
38 |
"vocab_size": 128256
|
39 |
}
|
generation_config.json
CHANGED
@@ -6,6 +6,6 @@
|
|
6 |
"max_length": 131072,
|
7 |
"pad_token_id": 128004,
|
8 |
"temperature": 0.6,
|
9 |
-
"top_p": 0.
|
10 |
-
"transformers_version": "4.
|
11 |
}
|
|
|
6 |
"max_length": 131072,
|
7 |
"pad_token_id": 128004,
|
8 |
"temperature": 0.6,
|
9 |
+
"top_p": 0.95,
|
10 |
+
"transformers_version": "4.48.3"
|
11 |
}
|
pytorch_model-00001-of-00004.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:127f56c2f3de7b09aa00835187acfb7726271bc9bb6ad3d17bafc173b6542376
|
3 |
+
size 4976717570
|
pytorch_model-00002-of-00004.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:df7eaf90b0ec46cc35db7d639dadd03c1ba8a21c6c66e90107f95421e70bd94e
|
3 |
+
size 4999826566
|
pytorch_model-00003-of-00004.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4915939082
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9f9953cd48ecf7c142216db5d4c2855ad47e427df2f3fd8fc6e6a2f387d45884
|
3 |
size 4915939082
|
pytorch_model-00004-of-00004.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1168140873
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0d10301b034a5ea9f1ba82e6a93201ba0a8a8c25196d95ef0bfcc051673f0124
|
3 |
size 1168140873
|