justheuristic
committed on
Commit
•
ee14737
1
Parent(s):
7b2bd6d
1bit
Browse files- config.json +3 -3
- generation_config.json +1 -1
- model-00001-of-00005.safetensors → model-00001-of-00003.safetensors +2 -2
- model-00002-of-00005.safetensors → model-00002-of-00003.safetensors +2 -2
- model-00003-of-00005.safetensors → model-00003-of-00003.safetensors +2 -2
- model-00004-of-00005.safetensors +0 -3
- model-00005-of-00005.safetensors +0 -3
- model.safetensors.index.json +0 -0
config.json
CHANGED
@@ -1,5 +1,5 @@
|
|
1 |
{
|
2 |
-
"_name_or_path": "
|
3 |
"architectures": [
|
4 |
"LlamaForCausalLM"
|
5 |
],
|
@@ -18,7 +18,7 @@
|
|
18 |
"num_key_value_heads": 8,
|
19 |
"pretraining_tp": 1,
|
20 |
"quantization_config": {
|
21 |
-
"in_group_size":
|
22 |
"linear_weights_not_to_quantize": [
|
23 |
"model.layers.0.input_layernorm.weight",
|
24 |
"model.layers.0.post_attention_layernorm.weight",
|
@@ -194,7 +194,7 @@
|
|
194 |
"rope_theta": 500000.0,
|
195 |
"tie_word_embeddings": false,
|
196 |
"torch_dtype": "float16",
|
197 |
-
"transformers_version": "4.
|
198 |
"use_cache": true,
|
199 |
"vocab_size": 128256
|
200 |
}
|
|
|
1 |
{
|
2 |
+
"_name_or_path": "/extra_disk_1/jheuristic/llama-3-70b-hf",
|
3 |
"architectures": [
|
4 |
"LlamaForCausalLM"
|
5 |
],
|
|
|
18 |
"num_key_value_heads": 8,
|
19 |
"pretraining_tp": 1,
|
20 |
"quantization_config": {
|
21 |
+
"in_group_size": 16,
|
22 |
"linear_weights_not_to_quantize": [
|
23 |
"model.layers.0.input_layernorm.weight",
|
24 |
"model.layers.0.post_attention_layernorm.weight",
|
|
|
194 |
"rope_theta": 500000.0,
|
195 |
"tie_word_embeddings": false,
|
196 |
"torch_dtype": "float16",
|
197 |
+
"transformers_version": "4.40.1",
|
198 |
"use_cache": true,
|
199 |
"vocab_size": 128256
|
200 |
}
|
generation_config.json
CHANGED
@@ -2,5 +2,5 @@
|
|
2 |
"_from_model_config": true,
|
3 |
"bos_token_id": 128000,
|
4 |
"eos_token_id": 128001,
|
5 |
-
"transformers_version": "4.
|
6 |
}
|
|
|
2 |
"_from_model_config": true,
|
3 |
"bos_token_id": 128000,
|
4 |
"eos_token_id": 128001,
|
5 |
+
"transformers_version": "4.40.1"
|
6 |
}
|
model-00001-of-00005.safetensors → model-00001-of-00003.safetensors
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:83e2adc347f408d6a3601dad3248bc6df5a6aec729a085309e0f4fad56198e8a
|
3 |
+
size 4996053968
|
model-00002-of-00005.safetensors → model-00002-of-00003.safetensors
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dc5f1dd16df466ad4b5e78caafbb570aa253dbb42ef6dafba609d96324a5d416
|
3 |
+
size 4995365800
|
model-00003-of-00005.safetensors → model-00003-of-00003.safetensors
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:aaf649e098013e6ca25359b240f3434b58c9c6c06867742713152f7f4581b2da
|
3 |
+
size 3958346080
|
model-00004-of-00005.safetensors
DELETED
@@ -1,3 +0,0 @@
|
|
1 |
-
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:91c5cda1023d16ae85b195773c6463205f400db892067197e7b2a4b03411dde5
|
3 |
-
size 4870931440
|
|
|
|
|
|
|
|
model-00005-of-00005.safetensors
DELETED
@@ -1,3 +0,0 @@
|
|
1 |
-
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:959d1058dd3372a4b636b0d900b3b35b2549a0d283e978f64f84743a9ae30bef
|
3 |
-
size 2101346432
|
|
|
|
|
|
|
|
model.safetensors.index.json
CHANGED
The diff for this file is too large to render.
See raw diff
|
|