{
  "sample_size": 128,
  "patch_size": 2,
  "in_channels": 16,
  "num_layers": 24,
  "attention_head_dim": 64,
  "num_attention_heads": 24,
  "joint_attention_dim": 4096,
  "caption_projection_dim": 1536,
  "pooled_projection_dim": 2048,
  "out_channels": 16,
  "pos_embed_max_size": 192,
  "attention_type": "layout",
  "max_boxes_per_image": 10,
  "_use_default_values": [
    "max_boxes_per_image"
  ],
  "_class_name": "SD3Transformer2DModel",
  "_diffusers_version": "0.29.0.dev0",
  "_name_or_path": "/mnt/bn/zhanghui-test-yg/ai_product_models/stable-diffusion-3-medium-diffusers-layout"
}