11104491 committed on
Commit
1999ad4
1 Parent(s): 637ee30

Update for vllm

Browse files
Files changed (2) hide show
  1. config.json +6 -2
  2. configuration_bluelm.py +3 -3
config.json CHANGED
@@ -20,12 +20,16 @@
20
  "pad_token_id": 3,
21
  "pretraining_tp": 1,
22
  "rms_norm_eps": 1e-06,
23
- "rope_scaling": null,
24
  "rope_theta": 10000.0,
25
  "tie_word_embeddings": false,
26
  "torch_dtype": "bfloat16",
27
  "transformers_version": "4.30.1",
28
  "use_cache": true,
29
  "use_stable_embedding": true,
30
- "vocab_size": 100096
 
 
 
 
 
31
  }
 
20
  "pad_token_id": 3,
21
  "pretraining_tp": 1,
22
  "rms_norm_eps": 1e-06,
 
23
  "rope_theta": 10000.0,
24
  "tie_word_embeddings": false,
25
  "torch_dtype": "bfloat16",
26
  "transformers_version": "4.30.1",
27
  "use_cache": true,
28
  "use_stable_embedding": true,
29
+ "vocab_size": 100096,
30
+ "rope_scaling": {
31
+ "type": "ntkmixed",
32
+ "factor": 16.0,
33
+ "power": 0.3
34
+ }
35
  }
configuration_bluelm.py CHANGED
@@ -149,14 +149,14 @@ class BlueLMConfig(PretrainedConfig):
149
  if self.rope_scaling is None:
150
  return
151
 
152
- if not isinstance(self.rope_scaling, dict) or len(self.rope_scaling) != 2:
153
  raise ValueError(
154
- "`rope_scaling` must be a dictionary with with two fields, `type` and `factor`, "
155
  f"got {self.rope_scaling}"
156
  )
157
  rope_scaling_type = self.rope_scaling.get("type", None)
158
  rope_scaling_factor = self.rope_scaling.get("factor", None)
159
- if rope_scaling_type is None or rope_scaling_type not in ["linear", "dynamic"]:
160
  raise ValueError(
161
  f"`rope_scaling`'s type field must be one of ['linear', 'dynamic'], got {rope_scaling_type}"
162
  )
 
149
  if self.rope_scaling is None:
150
  return
151
 
152
+ if not isinstance(self.rope_scaling, dict) or len(self.rope_scaling) != 3:
153
  raise ValueError(
154
+ "`rope_scaling` must be a dictionary with with three fields, `type` , `factor` , `power`, "
155
  f"got {self.rope_scaling}"
156
  )
157
  rope_scaling_type = self.rope_scaling.get("type", None)
158
  rope_scaling_factor = self.rope_scaling.get("factor", None)
159
+ if rope_scaling_type is None or rope_scaling_type not in ["linear", "dynamic","ntkmixed"]:
160
  raise ValueError(
161
  f"`rope_scaling`'s type field must be one of ['linear', 'dynamic'], got {rope_scaling_type}"
162
  )