hdparmar committed on
Commit
e2b4f23
·
1 Parent(s): bbfeb9e

Upload folder using huggingface_hub

Browse files
configs/2023-10-22T14-53-45-lightning.yaml ADDED
@@ -0,0 +1,32 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ lightning:
2
+ find_unused_parameters: false
3
+ modelcheckpoint:
4
+ params:
5
+ every_n_train_steps: 2000
6
+ save_top_k: -1
7
+ monitor: null
8
+ callbacks:
9
+ image_logger:
10
+ target: main.ImageLogger
11
+ params:
12
+ batch_frequency: 2000
13
+ max_images: 4
14
+ increase_log_steps: false
15
+ log_first_step: true
16
+ log_all_val: true
17
+ log_images_kwargs:
18
+ use_ema_scope: true
19
+ inpaint: false
20
+ plot_progressive_rows: false
21
+ plot_diffusion_rows: false
22
+ 'N': 4
23
+ unconditional_guidance_scale: 3.0
24
+ unconditional_guidance_label:
25
+ - ''
26
+ trainer:
27
+ benchmark: true
28
+ num_sanity_val_steps: 0
29
+ accumulate_grad_batches: 2
30
+ accelerator: ddp
31
+ check_val_every_n_epoch: 6
32
+ gpus: 0,1,
configs/2023-10-22T14-53-45-project.yaml ADDED
@@ -0,0 +1,99 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ model:
2
+ base_learning_rate: 0.0001
3
+ target: ldm.models.diffusion.ddpm.LatentDiffusion
4
+ params:
5
+ linear_start: 0.00085
6
+ linear_end: 0.012
7
+ num_timesteps_cond: 1
8
+ log_every_t: 200
9
+ timesteps: 1000
10
+ first_stage_key: image
11
+ cond_stage_key: txt
12
+ image_size: 64
13
+ channels: 4
14
+ cond_stage_trainable: false
15
+ conditioning_key: crossattn
16
+ scale_factor: 0.18215
17
+ scheduler_config:
18
+ target: ldm.lr_scheduler.LambdaLinearScheduler
19
+ params:
20
+ warm_up_steps:
21
+ - 10000
22
+ cycle_lengths:
23
+ - 10000000000000
24
+ f_start:
25
+ - 1.0e-06
26
+ f_max:
27
+ - 1.0
28
+ f_min:
29
+ - 1.0
30
+ unet_config:
31
+ target: ldm.modules.diffusionmodules.openaimodel.UNetModel
32
+ params:
33
+ image_size: 32
34
+ in_channels: 4
35
+ out_channels: 4
36
+ model_channels: 320
37
+ attention_resolutions:
38
+ - 4
39
+ - 2
40
+ - 1
41
+ num_res_blocks: 2
42
+ channel_mult:
43
+ - 1
44
+ - 2
45
+ - 4
46
+ - 4
47
+ num_heads: 8
48
+ use_spatial_transformer: true
49
+ transformer_depth: 1
50
+ context_dim: 768
51
+ use_checkpoint: true
52
+ legacy: false
53
+ first_stage_config:
54
+ target: ldm.models.autoencoder.AutoencoderKL
55
+ ckpt_path: models/first_stage_models/kl-f8/model.ckpt
56
+ params:
57
+ embed_dim: 4
58
+ monitor: val/rec_loss
59
+ ddconfig:
60
+ double_z: true
61
+ z_channels: 4
62
+ resolution: 256
63
+ in_channels: 3
64
+ out_ch: 3
65
+ ch: 128
66
+ ch_mult:
67
+ - 1
68
+ - 2
69
+ - 4
70
+ - 4
71
+ num_res_blocks: 2
72
+ attn_resolutions: []
73
+ dropout: 0.0
74
+ lossconfig:
75
+ target: torch.nn.Identity
76
+ cond_stage_config:
77
+ target: ldm.modules.encoders.modules.FrozenCLIPEmbedder
78
+ data:
79
+ target: main.DataModuleFromConfig
80
+ params:
81
+ batch_size: 4
82
+ num_workers: 4
83
+ num_val_workers: 0
84
+ train:
85
+ target: ldm.data.simple.hf_dataset
86
+ params:
87
+ name: hdparmar/irish-traditional-tunes
88
+ image_transforms:
89
+ - target: torchvision.transforms.RandomHorizontalFlip
90
+ validation:
91
+ target: ldm.data.simple.TextOnly
92
+ params:
93
+ captions:
94
+ - An Irish Traditional tune with vibrant bouzouki strums
95
+ - An Irish Traditional Tune
96
+ - A traditional Irish slip jig rhythm
97
+ - A lively Irish Traditional Tune with a prominent fiddle lead
98
+ output_size: 512
99
+ n_gpus: 2