# Path: blob/master/configs/sd_xl_inpaint.yaml
#
# Model configuration tree. Each component node names a `target` (a dotted
# import path) and, where needed, a `params` mapping for that target.
# NOTE(review): nesting was rebuilt from the target/params pattern after the
# original indentation was lost — confirm against the consuming loader.
model:
  target: sgm.models.diffusion.DiffusionEngine
  params:
    scale_factor: 0.13025
    disable_first_stage_autocast: true

    denoiser_config:
      target: sgm.modules.diffusionmodules.denoiser.DiscreteDenoiser
      params:
        num_idx: 1000

        weighting_config:
          target: sgm.modules.diffusionmodules.denoiser_weighting.EpsWeighting
        scaling_config:
          target: sgm.modules.diffusionmodules.denoiser_scaling.EpsScaling
        discretization_config:
          target: sgm.modules.diffusionmodules.discretizer.LegacyDDPMDiscretization

    network_config:
      target: sgm.modules.diffusionmodules.openaimodel.UNetModel
      params:
        adm_in_channels: 2816
        num_classes: sequential
        use_checkpoint: false
        # NOTE(review): 9 input channels vs. 4 output channels — presumably the
        # extra inputs carry the inpainting mask and masked image; confirm.
        in_channels: 9
        out_channels: 4
        model_channels: 320
        attention_resolutions: [4, 2]
        num_res_blocks: 2
        channel_mult: [1, 2, 4]
        num_head_channels: 64
        use_spatial_transformer: true
        use_linear_in_transformer: true
        # note: the first is unused (due to attn_res starting at 2)
        # 32, 16, 8 --> 64, 32, 16
        transformer_depth: [1, 2, 10]
        context_dim: 2048
        spatial_transformer_attn_type: softmax-xformers
        legacy: false

    conditioner_config:
      target: sgm.modules.GeneralConditioner
      params:
        emb_models:
          # crossattn cond
          - is_trainable: false
            input_key: txt
            target: sgm.modules.encoders.modules.FrozenCLIPEmbedder
            params:
              layer: hidden
              layer_idx: 11
          # crossattn and vector cond
          - is_trainable: false
            input_key: txt
            target: sgm.modules.encoders.modules.FrozenOpenCLIPEmbedder2
            params:
              arch: ViT-bigG-14
              version: laion2b_s39b_b160k
              freeze: true
              layer: penultimate
              always_return_pooled: true
              legacy: false
          # vector cond
          - is_trainable: false
            input_key: original_size_as_tuple
            target: sgm.modules.encoders.modules.ConcatTimestepEmbedderND
            params:
              outdim: 256  # multiplied by two
          # vector cond
          - is_trainable: false
            input_key: crop_coords_top_left
            target: sgm.modules.encoders.modules.ConcatTimestepEmbedderND
            params:
              outdim: 256  # multiplied by two
          # vector cond
          - is_trainable: false
            input_key: target_size_as_tuple
            target: sgm.modules.encoders.modules.ConcatTimestepEmbedderND
            params:
              outdim: 256  # multiplied by two

    first_stage_config:
      target: sgm.models.autoencoder.AutoencoderKLInferenceWrapper
      params:
        embed_dim: 4
        monitor: val/rec_loss
        ddconfig:
          attn_type: vanilla-xformers
          double_z: true
          z_channels: 4
          resolution: 256
          in_channels: 3
          out_ch: 3
          ch: 128
          ch_mult: [1, 2, 4, 4]
          num_res_blocks: 2
          attn_resolutions: []
          dropout: 0.0
        # Loss is set to an identity module in this config.
        lossconfig:
          target: torch.nn.Identity