{ "encoder": "apple/DFN5B-CLIP-ViT-H-14", "tokenizer": "miguelcarv/phi-1_5-slimorca", "decoder": "miguelcarv/phi-1_5-slimorca", "first_level": true, "level": 2, "cross_interval": 2, "from_layer": 0, "reduce": 1, "encoder_dtype": "torch.float32", "decoder_dtype": "torch.float32", "other_params_dtype": "torch.float32" }