diff options
| author | Zac Liu <liuguang@baai.ac.cn> | 2022-12-06 16:16:29 +0800 | 
|---|---|---|
| committer | GitHub <noreply@github.com> | 2022-12-06 16:16:29 +0800 | 
| commit | 9a5c689c4960259f32cf627384ef5691ded5c017 (patch) | |
| tree | 67ff3ae6cbe774c40ade0aa440ca1e4e15eca06e /v2-inference-v.yaml | |
| parent | a25dfebeed5b3411f2dc0f558c2b87a7c1cda420 (diff) | |
| parent | 965fc5ac5a6ccdf38342e21c97183011a04e799e (diff) | |
| download | stable-diffusion-webui-gfx803-9a5c689c4960259f32cf627384ef5691ded5c017.tar.gz | |
Merge pull request #4 from 920232796/master
add hash and fix undo hijack bug
Diffstat (limited to 'v2-inference-v.yaml')
| -rw-r--r-- | v2-inference-v.yaml | 68 | 
1 files changed, 68 insertions, 0 deletions
```diff
diff --git a/v2-inference-v.yaml b/v2-inference-v.yaml
new file mode 100644
index 00000000..513cd635
--- /dev/null
+++ b/v2-inference-v.yaml
@@ -0,0 +1,68 @@
+model:
+  base_learning_rate: 1.0e-4
+  target: ldm.models.diffusion.ddpm.LatentDiffusion
+  params:
+    parameterization: "v"
+    linear_start: 0.00085
+    linear_end: 0.0120
+    num_timesteps_cond: 1
+    log_every_t: 200
+    timesteps: 1000
+    first_stage_key: "jpg"
+    cond_stage_key: "txt"
+    image_size: 64
+    channels: 4
+    cond_stage_trainable: false
+    conditioning_key: crossattn
+    monitor: val/loss_simple_ema
+    scale_factor: 0.18215
+    use_ema: False # we set this to false because this is an inference only config
+
+    unet_config:
+      target: ldm.modules.diffusionmodules.openaimodel.UNetModel
+      params:
+        use_checkpoint: True
+        use_fp16: True
+        image_size: 32 # unused
+        in_channels: 4
+        out_channels: 4
+        model_channels: 320
+        attention_resolutions: [ 4, 2, 1 ]
+        num_res_blocks: 2
+        channel_mult: [ 1, 2, 4, 4 ]
+        num_head_channels: 64 # need to fix for flash-attn
+        use_spatial_transformer: True
+        use_linear_in_transformer: True
+        transformer_depth: 1
+        context_dim: 1024
+        legacy: False
+
+    first_stage_config:
+      target: ldm.models.autoencoder.AutoencoderKL
+      params:
+        embed_dim: 4
+        monitor: val/rec_loss
+        ddconfig:
+          #attn_type: "vanilla-xformers"
+          double_z: true
+          z_channels: 4
+          resolution: 256
+          in_channels: 3
+          out_ch: 3
+          ch: 128
+          ch_mult:
+          - 1
+          - 2
+          - 4
+          - 4
+          num_res_blocks: 2
+          attn_resolutions: []
+          dropout: 0.0
+        lossconfig:
+          target: torch.nn.Identity
+
+    cond_stage_config:
+      target: ldm.modules.encoders.modules.FrozenOpenCLIPEmbedder
+      params:
+        freeze: True
+        layer: "penultimate"
\ No newline at end of file
```
