j-min committed on
Commit
4c54f90
·
1 Parent(s): bcd3a81

Upload 2 files

Browse files
clevr_data2023-03-02T11-07-16-lightning.yaml ADDED
@@ -0,0 +1,32 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ lightning:
2
+ find_unused_parameters: false
3
+ modelcheckpoint:
4
+ params:
5
+ monitor: train/loss_simple
6
+ save_top_k: -1
7
+ every_n_train_steps: 405
8
+ callbacks:
9
+ image_logger:
10
+ target: main.ImageLogger
11
+ params:
12
+ batch_frequency: 10000000
13
+ log_on_batch_idx: true
14
+ max_images: 4
15
+ increase_log_steps: false
16
+ log_images_kwargs:
17
+ inpaint: false
18
+ plot_denoise_rows: false
19
+ plot_progressive_rows: false
20
+ plot_diffusion_rows: false
21
+ 'N': 4
22
+ ddim_steps: 50
23
+ trainer:
24
+ benchmark: true
25
+ max_steps: 20000
26
+ check_val_every_n_epoch: 1000
27
+ num_sanity_val_steps: 0
28
+ accumulate_grad_batches: 8
29
+ accelerator: gpu
30
+ strategy: ddp
31
+ num_nodes: 2
32
+ gpus: 0,1,2,3,4,5,6,7
clevr_data2023-03-02T11-07-16-project.yaml ADDED
@@ -0,0 +1,116 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ model:
2
+ base_learning_rate: 0.0001
3
+ target: ldm.models.diffusion.ddpm.LatentInpaintDiffusion
4
+ params:
5
+ linear_start: 0.00085
6
+ linear_end: 0.012
7
+ num_timesteps_cond: 1
8
+ log_every_t: 200
9
+ timesteps: 1000
10
+ first_stage_key: image
11
+ cond_stage_key: caption
12
+ image_size: 64
13
+ channels: 4
14
+ cond_stage_trainable: true
15
+ conditioning_key: hybrid
16
+ monitor: val/loss_simple_ema
17
+ scale_factor: 0.18215
18
+ finetune_keys: null
19
+ scheduler_config:
20
+ target: ldm.lr_scheduler.LambdaLinearScheduler
21
+ params:
22
+ warm_up_steps:
23
+ - 1
24
+ cycle_lengths:
25
+ - 10000000000000
26
+ f_start:
27
+ - 1.0e-06
28
+ f_max:
29
+ - 1.0
30
+ f_min:
31
+ - 1.0
32
+ unet_config:
33
+ target: ldm.modules.diffusionmodules.openaimodel.UNetModel
34
+ params:
35
+ image_size: 32
36
+ in_channels: 9
37
+ out_channels: 4
38
+ model_channels: 320
39
+ attention_resolutions:
40
+ - 4
41
+ - 2
42
+ - 1
43
+ num_res_blocks: 2
44
+ channel_mult:
45
+ - 1
46
+ - 2
47
+ - 4
48
+ - 4
49
+ num_heads: 8
50
+ use_spatial_transformer: true
51
+ transformer_depth: 1
52
+ context_dim: 768
53
+ use_checkpoint: true
54
+ legacy: false
55
+ first_stage_config:
56
+ target: ldm.models.autoencoder.AutoencoderKL
57
+ params:
58
+ embed_dim: 4
59
+ monitor: val/rec_loss
60
+ ddconfig:
61
+ double_z: true
62
+ z_channels: 4
63
+ resolution: 512
64
+ in_channels: 3
65
+ out_ch: 3
66
+ ch: 128
67
+ ch_mult:
68
+ - 1
69
+ - 2
70
+ - 4
71
+ - 4
72
+ num_res_blocks: 2
73
+ attn_resolutions: []
74
+ dropout: 0.0
75
+ lossconfig:
76
+ target: torch.nn.Identity
77
+ cond_stage_config:
78
+ target: ldm.modules.encoders.modules.FrozenCLIPEmbedder
79
+ params:
80
+ with_bbox: true
81
+ num_bins: 1000
82
+ extend_outputlen: 616
83
+ max_length: 616
84
+ ckpt_path: preload_model_checkpoints/SD_checkpoints/sd-v1-5-inpainting.ckpt
85
+ data:
86
+ target: main.DataModuleFromConfig
87
+ params:
88
+ batch_size: 1
89
+ num_workers: 8
90
+ wrap: false
91
+ train:
92
+ target: ldm.data.clevr.CLEVRDataset
93
+ params:
94
+ size: 512
95
+ old_clevr: true
96
+ set: train
97
+ with_bbox: true
98
+ num_bins: 1000
99
+ flip_p: 0.5
100
+ box_descp: caption
101
+ max_src_length: 616
102
+ has_global_caption: false
103
+ inpaint: iterative
104
+ validation:
105
+ target: ldm.data.clevr.CLEVRDataset
106
+ params:
107
+ size: 512
108
+ old_clevr: true
109
+ set: test
110
+ with_bbox: true
111
+ num_bins: 1000
112
+ flip_p: 0.5
113
+ box_descp: caption
114
+ max_src_length: 616
115
+ has_global_caption: false
116
+ inpaint: iterative