Bagheera Bghira
v1: from ptx0/coco-xltest, 36000 + 21800 + 14200 steps on a mixed LAION/MJ dataset, offset noise with input perturbation at a probability of 25%, 10% caption dropout, cosine LR 4e-7 to 8e-7 every 3200 steps
90816e1
{
  "_class_name": "AutoencoderKL",
  "_diffusers_version": "0.22.0.dev0",
  "_name_or_path": "madebyollin/sdxl-vae-fp16-fix",
  "act_fn": "silu",
  "block_out_channels": [
    128,
    256,
    512,
    512
  ],
  "down_block_types": [
    "DownEncoderBlock2D",
    "DownEncoderBlock2D",
    "DownEncoderBlock2D",
    "DownEncoderBlock2D"
  ],
  "force_upcast": false,
  "in_channels": 3,
  "latent_channels": 4,
  "layers_per_block": 2,
  "norm_num_groups": 32,
  "out_channels": 3,
  "sample_size": 512,
  "scaling_factor": 0.13025,
  "up_block_types": [
    "UpDecoderBlock2D",
    "UpDecoderBlock2D",
    "UpDecoderBlock2D",
    "UpDecoderBlock2D"
  ]
}