{ "_class_name": "ZImageControlTransformer2DModel", "_diffusers_version": "0.37.0", "add_control_noise_refiner": true, "add_control_noise_refiner_correctly": true, "all_f_patch_size": [ 1 ], "all_patch_size": [ 2 ], "axes_dims": [ 32, 48, 48 ], "axes_lens": [ 1536, 512, 512 ], "cap_feat_dim": 2560, "control_in_dim": 33, "control_layers_places": [ 0, 2, 4, 6, 8, 10, 12, 14, 16, 18, 20, 22, 24, 26, 28 ], "control_refiner_layers_places": [ 0, 1 ], "dim": 3840, "in_channels": 16, "n_heads": 30, "n_kv_heads": 30, "n_layers": 30, "n_refiner_layers": 2, "norm_eps": 1e-05, "qk_norm": true, "rope_theta": 256.0, "siglip_feat_dim": null, "t_scale": 1000.0 }