sanchit-gandhi HF staff committed on
Commit
e3cb80d
1 Parent(s): 9f851e8

Saving final weights of step 100000

Browse files
config.json CHANGED
@@ -20,7 +20,7 @@
20
  "rope_theta": 1000000.0,
21
  "sliding_window": null,
22
  "tie_word_embeddings": false,
23
- "torch_dtype": "float32",
24
  "transformers_version": "4.40.0.dev0",
25
  "use_cache": true,
26
  "vocab_size": 32000
 
20
  "rope_theta": 1000000.0,
21
  "sliding_window": null,
22
  "tie_word_embeddings": false,
23
+ "torch_dtype": "bfloat16",
24
  "transformers_version": "4.40.0.dev0",
25
  "use_cache": true,
26
  "vocab_size": 32000
distil-mistral/events.out.tfevents.1713805939.ip-26-0-163-236.1916906.0 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c988fd1ef9a524107cde9c9e766e2f9f4f91037347eef45173eecf22e09c740b
3
- size 1322494
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8ce92e09e8b23eeceadbba3f76817518dcd28bb8fe60b844c45de153d8f4dc7c
3
+ size 1325784
model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:596b562d4f09fcf74cce13b5ced4392bcd772221c4e56955a5fbbba5e8f56f0b
3
+ size 3141646744