Llama-3.1-8B-Vision / modeling_llamavision.py
kadirnar's picture
Create modeling_llamavision.py
73f1049 verified
raw
history blame
475 Bytes
# https://huggingface.co/qresearch/llama-3.1-8B-vision-378/blob/main/configuration_llamavision.py
from transformers import PretrainedConfig, LlamaConfig, SiglipVisionConfig
class LlamavisionConfig(PretrainedConfig):
    """Composite configuration holding a text config and a vision config.

    The two sub-configurations are taken from the ``text_config`` and
    ``vision_config`` keyword arguments and stored as attributes of the
    same names. Every remaining keyword argument is forwarded unchanged to
    ``PretrainedConfig.__init__``.

    Args:
        **kwargs: May contain ``text_config`` and/or ``vision_config``.
            Each may be a mapping of constructor arguments (for
            ``LlamaConfig`` and ``SiglipVisionConfig`` respectively), an
            already-built instance of that class, or ``None``/absent to
            use that class's defaults.

    Raises:
        TypeError: If a sub-config value is neither ``None``, a mapping,
            nor an instance of the expected config class.
    """

    model_type = "llamavision"

    def __init__(self, **kwargs):
        # The sub-configs are popped before delegating so that the base
        # class does not also receive them among the generic kwargs.
        self.text_config = self._coerce_sub_config(
            LlamaConfig, kwargs.pop("text_config", None)
        )
        self.vision_config = self._coerce_sub_config(
            SiglipVisionConfig, kwargs.pop("vision_config", None)
        )
        super().__init__(**kwargs)

    @staticmethod
    def _coerce_sub_config(config_cls, value):
        """Return ``value`` as an instance of ``config_cls``.

        ``None`` yields a default-constructed config, an existing
        ``config_cls`` instance is returned as-is, and anything else is
        expanded as keyword arguments to ``config_cls``.
        """
        if value is None:
            # An explicit None (e.g. a null entry) previously reached
            # ``**None`` and raised TypeError; treat it like "absent".
            return config_cls()
        if isinstance(value, config_cls):
            return value
        return config_cls(**value)