# Settings for the configuration named "plym_all_2".
# Flat mapping: one key per line, every key at the top level.
# NOTE(review): the consumer of this file is not visible from here; the
# hedged notes below are inferred from key names only -- confirm them against
# the code that loads this config.
name: plym_all_2
type: discrete
transition: marginal
model: graph_dit
diffusion_noise_schedule: cosine
guide_scale: 2  # presumably a guidance strength applied at sampling -- verify
hidden_size: 1152
diffusion_steps: 500
depth: 8
num_heads: 16
mlp_ratio: 4
drop_condition: 0.1  # presumably a probability in [0, 1] -- verify
# Two-element sequence; what each position means is defined by the consumer.
lambda_train:
  - 1
  - 10