Commit
•
0b80d89
1
Parent(s):
f3c8733
修改tie_emb_prj_weight为tie_word_embeddings
Browse files
- bert-base-chinese/bert4torch_config.json +1 -1
- bloom-560m/bert4torch_config.json +1 -1
- bloomz-560m/bert4torch_config.json +1 -1
- chatglm-6b-int4/bert4torch_config.json +1 -1
- chatglm-6b-int8/bert4torch_config.json +1 -1
- chatglm-6b-v0.1.0/bert4torch_config.json +1 -1
- chatglm-6b/bert4torch_config.json +1 -1
- chatglm2-6b-32k/bert4torch_config.json +1 -1
- chatglm2-6b-int4/bert4torch_config.json +1 -1
- chatglm2-6b/bert4torch_config.json +1 -1
- chatglm3-6b-32k/bert4torch_config.json +1 -1
- chatglm3-6b/bert4torch_config.json +1 -1
bert-base-chinese/bert4torch_config.json
CHANGED
@@ -13,5 +13,5 @@
|
|
13 |
"pad_token_id": 0,
|
14 |
"type_vocab_size": 2,
|
15 |
"vocab_size": 21128,
|
16 |
-
"tie_emb_prj_weight": true
|
17 |
}
|
|
|
13 |
"pad_token_id": 0,
|
14 |
"type_vocab_size": 2,
|
15 |
"vocab_size": 21128,
|
16 |
+
"tie_word_embeddings": true
|
17 |
}
|
bloom-560m/bert4torch_config.json
CHANGED
@@ -22,6 +22,6 @@
|
|
22 |
"vocab_size": 250880,
|
23 |
"segment_vocab_size": 0,
|
24 |
"pre_layernorm": true,
|
25 |
-
"
|
26 |
"model": "bloom"
|
27 |
}
|
|
|
22 |
"vocab_size": 250880,
|
23 |
"segment_vocab_size": 0,
|
24 |
"pre_layernorm": true,
|
25 |
+
"tie_word_embeddings": true,
|
26 |
"model": "bloom"
|
27 |
}
|
bloomz-560m/bert4torch_config.json
CHANGED
@@ -22,6 +22,6 @@
|
|
22 |
"vocab_size": 250880,
|
23 |
"segment_vocab_size": 0,
|
24 |
"pre_layernorm": true,
|
25 |
-
"
|
26 |
"model": "bloom"
|
27 |
}
|
|
|
22 |
"vocab_size": 250880,
|
23 |
"segment_vocab_size": 0,
|
24 |
"pre_layernorm": true,
|
25 |
+
"tie_word_embeddings": true,
|
26 |
"model": "bloom"
|
27 |
}
|
chatglm-6b-int4/bert4torch_config.json
CHANGED
@@ -18,7 +18,7 @@
|
|
18 |
"segment_vocab_size": 0,
|
19 |
"skip_init": true,
|
20 |
"rope_rank": "updown",
|
21 |
-
"
|
22 |
"quantization_bit": 4,
|
23 |
"quantization_method": "cpm_kernels",
|
24 |
"target_modules": ["q", "k", "v", "o", "intermediateDense", "outputDense"],
|
|
|
18 |
"segment_vocab_size": 0,
|
19 |
"skip_init": true,
|
20 |
"rope_rank": "updown",
|
21 |
+
"tie_word_embeddings": false,
|
22 |
"quantization_bit": 4,
|
23 |
"quantization_method": "cpm_kernels",
|
24 |
"target_modules": ["q", "k", "v", "o", "intermediateDense", "outputDense"],
|
chatglm-6b-int8/bert4torch_config.json
CHANGED
@@ -21,6 +21,6 @@
|
|
21 |
"quantization_bit": 8,
|
22 |
"quantization_method": "cpm_kernels",
|
23 |
"target_modules": ["q", "k", "v", "o", "intermediateDense", "outputDense"],
|
24 |
-
"
|
25 |
"generation_config": {"max_length": 2048}
|
26 |
}
|
|
|
21 |
"quantization_bit": 8,
|
22 |
"quantization_method": "cpm_kernels",
|
23 |
"target_modules": ["q", "k", "v", "o", "intermediateDense", "outputDense"],
|
24 |
+
"tie_word_embeddings": false,
|
25 |
"generation_config": {"max_length": 2048}
|
26 |
}
|
chatglm-6b-v0.1.0/bert4torch_config.json
CHANGED
@@ -18,6 +18,6 @@
|
|
18 |
"segment_vocab_size": 0,
|
19 |
"skip_init": true,
|
20 |
"rope_rank": "updown",
|
21 |
-
"
|
22 |
"generation_config": {"max_length": 2048}
|
23 |
}
|
|
|
18 |
"segment_vocab_size": 0,
|
19 |
"skip_init": true,
|
20 |
"rope_rank": "updown",
|
21 |
+
"tie_word_embeddings": false,
|
22 |
"generation_config": {"max_length": 2048}
|
23 |
}
|
chatglm-6b/bert4torch_config.json
CHANGED
@@ -18,6 +18,6 @@
|
|
18 |
"segment_vocab_size": 0,
|
19 |
"skip_init": true,
|
20 |
"rope_rank": "updown",
|
21 |
-
"
|
22 |
"generation_config": {"max_length": 2048}
|
23 |
}
|
|
|
18 |
"segment_vocab_size": 0,
|
19 |
"skip_init": true,
|
20 |
"rope_rank": "updown",
|
21 |
+
"tie_word_embeddings": false,
|
22 |
"generation_config": {"max_length": 2048}
|
23 |
}
|
chatglm2-6b-32k/bert4torch_config.json
CHANGED
@@ -11,7 +11,7 @@
|
|
11 |
"segment_vocab_size": 0,
|
12 |
"multi_query_group_num": 2,
|
13 |
"skip_init": true,
|
14 |
-
"
|
15 |
"eos_token_id": 2,
|
16 |
"pad_token_id": 2,
|
17 |
"rmsnorm": true,
|
|
|
11 |
"segment_vocab_size": 0,
|
12 |
"multi_query_group_num": 2,
|
13 |
"skip_init": true,
|
14 |
+
"tie_word_embeddings": false,
|
15 |
"eos_token_id": 2,
|
16 |
"pad_token_id": 2,
|
17 |
"rmsnorm": true,
|
chatglm2-6b-int4/bert4torch_config.json
CHANGED
@@ -11,7 +11,7 @@
|
|
11 |
"segment_vocab_size": 0,
|
12 |
"multi_query_group_num": 2,
|
13 |
"skip_init": true,
|
14 |
-
"
|
15 |
"eos_token_id": 2,
|
16 |
"pad_token_id": 2,
|
17 |
"rmsnorm": true,
|
|
|
11 |
"segment_vocab_size": 0,
|
12 |
"multi_query_group_num": 2,
|
13 |
"skip_init": true,
|
14 |
+
"tie_word_embeddings": false,
|
15 |
"eos_token_id": 2,
|
16 |
"pad_token_id": 2,
|
17 |
"rmsnorm": true,
|
chatglm2-6b/bert4torch_config.json
CHANGED
@@ -11,7 +11,7 @@
|
|
11 |
"segment_vocab_size": 0,
|
12 |
"multi_query_group_num": 2,
|
13 |
"skip_init": true,
|
14 |
-
"
|
15 |
"eos_token_id": 2,
|
16 |
"pad_token_id": 2,
|
17 |
"rmsnorm": true,
|
|
|
11 |
"segment_vocab_size": 0,
|
12 |
"multi_query_group_num": 2,
|
13 |
"skip_init": true,
|
14 |
+
"tie_word_embeddings": false,
|
15 |
"eos_token_id": 2,
|
16 |
"pad_token_id": 2,
|
17 |
"rmsnorm": true,
|
chatglm3-6b-32k/bert4torch_config.json
CHANGED
@@ -11,7 +11,7 @@
|
|
11 |
"segment_vocab_size": 0,
|
12 |
"multi_query_group_num": 2,
|
13 |
"skip_init": true,
|
14 |
-
"
|
15 |
"eos_token_id": 2,
|
16 |
"pad_token_id": 2,
|
17 |
"rmsnorm": true,
|
|
|
11 |
"segment_vocab_size": 0,
|
12 |
"multi_query_group_num": 2,
|
13 |
"skip_init": true,
|
14 |
+
"tie_word_embeddings": false,
|
15 |
"eos_token_id": 2,
|
16 |
"pad_token_id": 2,
|
17 |
"rmsnorm": true,
|
chatglm3-6b/bert4torch_config.json
CHANGED
@@ -11,7 +11,7 @@
|
|
11 |
"segment_vocab_size": 0,
|
12 |
"multi_query_group_num": 2,
|
13 |
"skip_init": true,
|
14 |
-
"
|
15 |
"eos_token_id": 2,
|
16 |
"pad_token_id": 0,
|
17 |
"rmsnorm": true,
|
|
|
11 |
"segment_vocab_size": 0,
|
12 |
"multi_query_group_num": 2,
|
13 |
"skip_init": true,
|
14 |
+
"tie_word_embeddings": false,
|
15 |
"eos_token_id": 2,
|
16 |
"pad_token_id": 0,
|
17 |
"rmsnorm": true,
|