yuntian-deng committed on
Commit
801f7e1
·
1 Parent(s): 3026a03

Create config_csllm.yaml

Browse files
Files changed (1) hide show
  1. config_csllm.yaml +90 -0
config_csllm.yaml ADDED
@@ -0,0 +1,90 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ model:
2
+ base_learning_rate: 8.0e-05
3
+ target: ldm.models.diffusion.ddpm.LatentDiffusion
4
+ params:
5
+ linear_start: 0.0015
6
+ linear_end: 0.0195
7
+ num_timesteps_cond: 1
8
+ log_every_t: 200
9
+ timesteps: 1000
10
+ first_stage_key: image
11
+ cond_stage_key: caption
12
+ hybrid_key: c_concat
13
+ image_size: 64
14
+ channels: 3
15
+ cond_stage_trainable: true
16
+ conditioning_key: hybrid
17
+ monitor: val/loss_simple_ema
18
+
19
+ unet_config:
20
+ target: ldm.modules.diffusionmodules.openaimodel.UNetModel
21
+ params:
22
+ image_size: 64
23
+ in_channels: 24
24
+ out_channels: 3
25
+ model_channels: 192
26
+ attention_resolutions:
27
+ - 8
28
+ - 4
29
+ - 2
30
+ num_res_blocks: 2
31
+ channel_mult:
32
+ - 1
33
+ - 2
34
+ - 3
35
+ - 5
36
+ num_head_channels: 32
37
+ use_spatial_transformer: true
38
+ transformer_depth: 1
39
+ context_dim: 640
40
+ first_stage_config:
41
+ target: ldm.models.autoencoder.VQModelInterface
42
+ params:
43
+ embed_dim: 3
44
+ n_embed: 8192
45
+ monitor: val/rec_loss
46
+
47
+ ddconfig:
48
+ double_z: false
49
+ z_channels: 3
50
+ resolution: 256
51
+ in_channels: 3
52
+ out_ch: 3
53
+ ch: 128
54
+ ch_mult:
55
+ - 1
56
+ - 2
57
+ - 4
58
+ num_res_blocks: 2
59
+ attn_resolutions: []
60
+ dropout: 0.0
61
+ lossconfig:
62
+ target: torch.nn.Identity
63
+
64
+ cond_stage_config:
65
+ target: ldm.modules.encoders.modules.BERTEmbedder
66
+ params:
67
+ n_embed: 640
68
+ n_layer: 32
69
+
70
+ data:
71
+ target: data.datasets.CsllmTrainSeq
72
+ params:
73
+ batch_size: 8
74
+ num_workers: 12
75
+ wrap: false
76
+ train:
77
+ target: data.datasets.CsllmTrainSeq
78
+ params:
79
+ config:
80
+ size: 256
81
+
82
+ lightning:
83
+ trainer:
84
+ benchmark: False
85
+ max_epochs: 200
86
+ accelerator: gpu
87
+ gpus: 1
88
+ gradient_clip_val: 1
89
+ checkpoint_callback: False
90
+ callbacks: []