-
-
Save madrang/c82840db02c9b07ba82f8ba55a7940b1 to your computer and use it in GitHub Desktop.
Custom model config for Stable Diffusion 2.0 models. It adds an `extra: {attn_precision: "fp32"}` field to the end of the model config; this `extra` field is recognized by SDKit (https://github.com/easydiffusion/sdkit).
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
# Inference config for Stable Diffusion 2.0 models (parameterization: "v"),
# extended with a trailing `extra` section that carries `attn_precision`.
#
# NOTE(review): the nesting below was reconstructed from a copy whose
# indentation had been stripped, following the `target` / `params` convention
# used by every component in this file. Confirm against the upstream
# Stable Diffusion 2.0 v-prediction inference config before relying on it.
model:
  base_learning_rate: 1.0e-4
  target: ldm.models.diffusion.ddpm.LatentDiffusion
  params:
    parameterization: "v"
    linear_start: 0.00085
    linear_end: 0.0120
    num_timesteps_cond: 1
    log_every_t: 200
    timesteps: 1000
    first_stage_key: "jpg"
    cond_stage_key: "txt"
    image_size: 64
    channels: 4
    cond_stage_trainable: false
    conditioning_key: crossattn
    monitor: val/loss_simple_ema
    scale_factor: 0.18215
    use_ema: False # we set this to false because this is an inference only config

    # Denoising network.
    unet_config:
      target: ldm.modules.diffusionmodules.openaimodel.UNetModel
      params:
        use_checkpoint: True
        use_fp16: True
        image_size: 32 # unused
        in_channels: 4
        out_channels: 4
        model_channels: 320
        attention_resolutions: [ 4, 2, 1 ]
        num_res_blocks: 2
        channel_mult: [ 1, 2, 4, 4 ]
        num_head_channels: 64 # need to fix for flash-attn
        use_spatial_transformer: True
        use_linear_in_transformer: True
        transformer_depth: 1
        context_dim: 1024
        legacy: False

    # First-stage autoencoder.
    first_stage_config:
      target: ldm.models.autoencoder.AutoencoderKL
      params:
        embed_dim: 4
        monitor: val/rec_loss
        ddconfig:
          #attn_type: "vanilla-xformers"
          double_z: true
          z_channels: 4
          resolution: 256
          in_channels: 3
          out_ch: 3
          ch: 128
          ch_mult:
            - 1
            - 2
            - 4
            - 4
          num_res_blocks: 2
          attn_resolutions: []
          dropout: 0.0
        # Identity is used as the loss target, i.e. no real loss module is configured.
        lossconfig:
          target: torch.nn.Identity

    # Conditioning-stage (text) encoder.
    cond_stage_config:
      target: ldm.modules.encoders.modules.FrozenOpenCLIPEmbedder
      params:
        freeze: True
        layer: "penultimate"

# Extra section appended after the model config.
# NOTE(review): placed at the top level, as a sibling of `model` — confirm that
# this is where the SDKit loader looks for `extra.attn_precision`.
extra:
  attn_precision: "fp32"
Sign up for free
to join this conversation on GitHub.
Already have an account?
Sign in to comment