{ "architectures": [ "FLASHTransformerForPretrained" ], "auto_map": { "AutoConfig": "dnaflash.FLASHTransformerConfig", "AutoModel": "dnaflash.FLASHTransformerForPretrained", "AutoModelForSequenceClassification": "dnaflash.FLASHTransformerForSequenceClassification" }, "attn_dropout": 0.0, "causal": false, "expansion_factor": 2.0, "group_size": 256, "hidden_size": 1024, "laplace_attn_fn": false, "model_type": "flash_transformer", "norm_type": "scalenorm", "num_layers": 36, "query_key_dim": 128, "reduce_group_non_causal_attn": true, "shift_tokens": true, "torch_dtype": "float32", "transformers_version": "4.39.3", "vocab_size": 4096 }