from transformers import PretrainedConfig


class HformerConfig(PretrainedConfig):
    """Configuration container for the ``hformer`` model type.

    The constructor records the hyper-parameters below as instance
    attributes and then hands every remaining keyword argument to
    ``PretrainedConfig.__init__``.

    Args:
        num_query_token: Stored as ``self.num_query_token``.
            Presumably the number of query tokens -- confirm against
            the model code that consumes this config.
        visual_hidden_size: Stored as ``self.visual_hidden_size``.
            Presumably the width of the visual features -- confirm.
        llm_hidden_size: Stored as ``self.llm_hidden_size``.
            Presumably the width of the language-model embeddings -- confirm.
        cross_attention_freq: Stored as ``self.cross_attention_freq``.
            Presumably how often cross-attention layers occur -- confirm.
        bert: Stored as ``self.bert``; defaults to ``"bert-base-uncased"``.
            Presumably a BERT checkpoint name or path -- confirm.
        bias: Stored as ``self.bias``.
        qformer_pth: Stored as ``self.qformer_pth``; ``None`` by default.
            Presumably a path to pretrained Q-Former weights -- confirm.
        **kwargs: Passed through unchanged to ``PretrainedConfig.__init__``.
    """

    model_type = 'hformer'
    _auto_class = 'AutoConfig'

    def __init__(
        self,
        num_query_token=32,
        visual_hidden_size=4096,
        llm_hidden_size=768,
        cross_attention_freq=2,
        bert="bert-base-uncased",
        bias=True,
        qformer_pth=None,
        **kwargs,
    ):
        # Model-specific fields, listed in signature order.
        self.num_query_token = num_query_token
        self.visual_hidden_size = visual_hidden_size
        self.llm_hidden_size = llm_hidden_size
        self.cross_attention_freq = cross_attention_freq
        self.bert = bert
        self.bias = bias
        self.qformer_pth = qformer_pth

        # The base-class initializer runs last, after the fields above are set.
        super().__init__(**kwargs)