# Flat mapping of model / diffusion hyperparameters, one key per line.
# NOTE(review): the meaning of each key is defined by the consuming code, which
# is not visible here; the hedged notes below are assumptions to confirm.

# presumably the number of stacked model layers — TODO confirm
depth: 28

# Diffusion process settings.
diffusion_noise_schedule: cosine
diffusion_steps: 500

# NOTE(review): looks like a condition-dropout rate and a guidance scale;
# verify against the training / sampling code.
drop_condition: 0.0
ensure_connected: false
guide_scale: 2

hidden_size: 1024

# Two-element list; presumably per-term loss weights — TODO confirm order.
lambda_train:
  - 1
  - 10

mlp_ratio: 4
model: graph_dit
num_heads: 16
transition: marginal