not-lain committed on
Commit
71e2f68
1 Parent(s): d66ce0c

change config

Browse files
Files changed (2) hide show
  1. config.json +1 -1
  2. configuration_gemma.py +2 -9
config.json CHANGED
@@ -23,7 +23,7 @@
23
  "mm_projector_lr": null,
24
  "mm_projector_type": "mlp2x_gelu",
25
  "mm_vision_tower": "google/siglip-so400m-patch14-384",
26
- "model_type": "cerule-gemma",
27
  "num_attention_heads": 8,
28
  "num_hidden_layers": 18,
29
  "num_key_value_heads": 1,
 
23
  "mm_projector_lr": null,
24
  "mm_projector_type": "mlp2x_gelu",
25
  "mm_vision_tower": "google/siglip-so400m-patch14-384",
26
+ "model_type": "phi-msft",
27
  "num_attention_heads": 8,
28
  "num_hidden_layers": 18,
29
  "num_key_value_heads": 1,
configuration_gemma.py CHANGED
@@ -25,8 +25,8 @@ GEMMA_PRETRAINED_CONFIG_ARCHIVE_MAP = {
25
  }
26
 
27
 
28
- class GemmaConfig(PretrainedConfig):
29
- model_type = "gemma"
30
  keys_to_ignore_at_inference = ["past_key_values"]
31
 
32
  def __init__(
@@ -162,10 +162,3 @@ class SigLipVisionConfig(PretrainedConfig):
162
 
163
  return cls.from_dict(config_dict, **kwargs)
164
 
165
-
166
- class CeruleGemmaConfig(GemmaConfig):
167
- model_type = "cerule-gemma"
168
-
169
- def __init__(self, **kwargs):
170
- self.gemma_config = GemmaConfig(**kwargs)
171
- super().__init__(**kwargs)
 
25
  }
26
 
27
 
28
+ class CeruleGemmaConfig(PretrainedConfig):
29
+ model_type = "phi-msft"
30
  keys_to_ignore_at_inference = ["past_key_values"]
31
 
32
  def __init__(
 
162
 
163
  return cls.from_dict(config_dict, **kwargs)
164