lmzjms committed on
Commit
12a5bc8
1 Parent(s): e613657

Upload txt2audio_args.yaml

Browse files
Files changed (1) hide show
  1. configs/inpaint/txt2audio_args.yaml +68 -0
configs/inpaint/txt2audio_args.yaml ADDED
@@ -0,0 +1,68 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ model:
2
+ base_learning_rate: 1.0e-05
3
+ target: ldm.models.diffusion.ddpm_audio.LatentDiffusion_audio
4
+ params:
5
+ linear_start: 0.0015
6
+ linear_end: 0.0205
7
+ log_every_t: 100
8
+ timesteps: 1000
9
+ loss_type: l1
10
+ first_stage_key: image
11
+ cond_stage_key: masked_image
12
+ image_size: 32 # unused
13
+ mel_dim: 10 # 80 // 2^3
14
+ mel_length: 106 # 848 // 2^3
15
+ channels: 4
16
+ concat_mode: true
17
+ monitor: val/loss
18
+ use_ema: False
19
+
20
+ scheduler_config:
21
+ target: ldm.lr_scheduler.LambdaWarmUpCosineScheduler
22
+ params:
23
+ verbosity_interval: 0
24
+ warm_up_steps: 1000
25
+ max_decay_steps: 50000
26
+ lr_start: 0.001
27
+ lr_max: 0.1
28
+ lr_min: 0.0001
29
+
30
+ unet_config:
31
+ target: ldm.modules.diffusionmodules.openaimodel.UNetModel
32
+ params:
33
+ image_size: 32 # unused
34
+ in_channels: 9 # 4 + 1 + 4
35
+ out_channels: 4
36
+ model_channels: 320
37
+ attention_resolutions:
38
+ - 1
39
+ - 2
40
+ num_res_blocks: 2
41
+ channel_mult: # num_down = len(ch_mult)-1
42
+ - 1
43
+ - 2
44
+ num_heads: 8
45
+ resblock_updown: true
46
+
47
+ first_stage_config:
48
+ target: ldm.models.autoencoder.AutoencoderKL
49
+ params:
50
+ embed_dim: 4
51
+ monitor: val/rec_loss
52
+ ckpt_path: # /apdcephfs/share_1316500/nlphuang/results/Text_to_audio/ae15/2022-12-15T22-24-00_mixdata_kl_4_tile/epoch=000009-v2.ckpt
53
+ ddconfig:
54
+ double_z: true
55
+ z_channels: 4
56
+ resolution: 848
57
+ in_channels: 1
58
+ out_ch: 1
59
+ ch: 128
60
+ ch_mult: [ 1, 2, 2, 4 ] # num_down = len(ch_mult)-1
61
+ num_res_blocks: 2
62
+ attn_resolutions: [106, 212]
63
+ dropout: 0.0
64
+ lossconfig:
65
+ target: torch.nn.Identity
66
+
67
+ cond_stage_config: __is_first_stage__
68
+