File size: 884 Bytes
3e8b723
f8a240c
 
3e8b723
 
 
 
 
529c646
3e8b723
 
 
 
 
 
529c646
3e8b723
 
 
529c646
f29faf1
529c646
 
3e8b723
529c646
3e8b723
 
 
 
 
 
 
034d18c
3e8b723
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35

# based on https://github.com/CompVis/stable-diffusion/blob/main/configs/autoencoder/autoencoder_kl_32x32x4.yaml

# Single-channel autoencoder config: in_channels, out_ch, embed_dim,
# z_channels and disc_in_channels are all 1; the inline notes record which of
# them have to stay equal to each other.
model:
  base_learning_rate: 4.5e-6
  # Dotted path of the model class. NOTE(review): `params` is presumably handed
  # to that class by the config loader -- confirm against the consumer.
  target: ldm.models.autoencoder.AutoencoderKL
  params:
    monitor: "val/rec_loss"
    embed_dim: 1  # = in_channels
    lossconfig:
      target: ldm.modules.losses.LPIPSWithDiscriminator
      params:
        # NOTE(review): presumably the training step at which the
        # discriminator term becomes active -- confirm in the loss class.
        disc_start: 50001
        kl_weight: 0.000001
        disc_weight: 0.5
        disc_in_channels: 1  # = out_ch

    ddconfig:
      double_z: true
      z_channels: 1  # must = embed_dim due to HF limitation
      resolution: 256  # overridden by input image size
      in_channels: 1
      out_ch: 1
      ch: 128
      ch_mult: [1, 2, 4, 4]  # num_down = len(ch_mult)-1, i.e. 3 here
      num_res_blocks: 2
      attn_resolutions: []
      dropout: 0.0

# Trainer settings: a single device on the `gpu` accelerator, with the
# trainer's `benchmark` flag switched on.
lightning:
  trainer:
    benchmark: true
    accelerator: gpu
    devices: 1