File size: 376 Bytes
69c51a4
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
from transformers.models.qwen2.configuration_qwen2 import Qwen2Config

class MiMoConfig(Qwen2Config):
    """Configuration for MiMo models, built on top of ``Qwen2Config``.

    Adds one extra option, ``num_nextn_predict_layers``, and hands every
    other positional and keyword argument to ``Qwen2Config`` unchanged.

    Args:
        *args: Positional arguments forwarded to ``Qwen2Config.__init__``.
        num_nextn_predict_layers: Keyword-only value stored on the instance
            under the same name. Defaults to ``0``.
            NOTE(review): presumably the number of additional next-token
            prediction layers -- confirm against the modeling code.
        **kwargs: Keyword arguments forwarded to ``Qwen2Config.__init__``.
    """

    model_type = "mimo"

    def __init__(self, *args, num_nextn_predict_layers=0, **kwargs):
        # Record the MiMo-specific field first, then let the parent
        # initializer process everything else.
        self.num_nextn_predict_layers = num_nextn_predict_layers
        super().__init__(*args, **kwargs)