flozi00 committed on
Commit
bde1efc
1 Parent(s): e137217

Upload folder using huggingface_hub

Browse files
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "VAGOsolutions/SauerkrautLM-1.5b",
3
  "architectures": [
4
  "Qwen2ForCausalLM"
5
  ],
@@ -19,7 +19,7 @@
19
  "rope_theta": 1000000.0,
20
  "sliding_window": 32768,
21
  "tie_word_embeddings": true,
22
- "torch_dtype": "float32",
23
  "transformers_version": "4.41.2",
24
  "use_cache": false,
25
  "use_sliding_window": false,
 
1
  {
2
+ "_name_or_path": "../educlassifier/checkpoint-500",
3
  "architectures": [
4
  "Qwen2ForCausalLM"
5
  ],
 
19
  "rope_theta": 1000000.0,
20
  "sliding_window": 32768,
21
  "tie_word_embeddings": true,
22
+ "torch_dtype": "bfloat16",
23
  "transformers_version": "4.41.2",
24
  "use_cache": false,
25
  "use_sliding_window": false,
model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4d71009c8fed2e4c4c5d680199215b792fce20c0ea5f451cb5cefced062a9c6c
3
+ size 3087467144
optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:635d436cc8d5e7a2a2efe1ed2a6519275a69bf2704b79004c45ffe40c45b243f
3
- size 3094642882
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e9e6b05b5ca8a53e109b703c2ff556cd4d00a1cb2ff28b873130b90335bd3813
3
+ size 3094642562
scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8596e8e763631f6218be973d23c17f87c5de1b18960b384dbd7a76dc1dcbe692
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c4ea9708d47e60611ed3386f558874c7068fae4997b858668f0cf5d746ffebff
3
  size 1064
trainer_state.json CHANGED
The diff for this file is too large to render. See raw diff
 
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e837a34ab4844742aedf3dd3e7300b434f2db8149439013ddd4cef5ab4cee401
3
  size 5240
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:10d99ede934118bbe755d4b85611af314494d173ca7cbfab325549136045e1d7
3
  size 5240