yuntian-deng committed on
Commit
f24cce5
·
1 Parent(s): 21afa57

Upload pssearch_bsz64_acc1_lr8e5_512_leftclick.yaml

Browse files
pssearch_bsz64_acc1_lr8e5_512_leftclick.yaml ADDED
@@ -0,0 +1,101 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ save_path: saved_bsz64_acc1_lr8e5_512_leftclick
2
+
3
+ model:
4
+ base_learning_rate: 8.0e-05
5
+ target: latent_diffusion.ldm.models.diffusion.ddpm.LatentDiffusion
6
+ params:
7
+ linear_start: 0.0015
8
+ linear_end: 0.0195
9
+ num_timesteps_cond: 1
10
+ log_every_t: 200
11
+ timesteps: 1000
12
+ first_stage_key: image
13
+ cond_stage_key: action_
14
+ scheduler_sampling_rate: 0.0
15
+ hybrid_key: c_concat
16
+ image_size: 64
17
+ channels: 3
18
+ cond_stage_trainable: true
19
+ conditioning_key: hybrid
20
+ monitor: val/loss_simple_ema
21
+
22
+ unet_config:
23
+ target: latent_diffusion.ldm.modules.diffusionmodules.openaimodel.UNetModel
24
+ params:
25
+ image_size: 64
26
+ in_channels: 34
27
+ out_channels: 4
28
+ model_channels: 192
29
+ attention_resolutions:
30
+ - 8
31
+ - 4
32
+ - 2
33
+ num_res_blocks: 2
34
+ channel_mult:
35
+ - 1
36
+ - 2
37
+ - 3
38
+ - 5
39
+ num_head_channels: 32
40
+ use_spatial_transformer: true
41
+ transformer_depth: 1
42
+ context_dim: 768
43
+ first_stage_config:
44
+ target: latent_diffusion.ldm.models.autoencoder.AutoencoderKL
45
+ params:
46
+ embed_dim: 4
47
+ monitor: val/rec_loss
48
+ ddconfig:
49
+ double_z: true
50
+ z_channels: 4
51
+ resolution: 256
52
+ in_channels: 3
53
+ out_ch: 3
54
+ ch: 128
55
+ ch_mult:
56
+ - 1
57
+ - 2
58
+ - 4
59
+ - 4
60
+ num_res_blocks: 2
61
+ attn_resolutions: []
62
+ dropout: 0.0
63
+ lossconfig:
64
+ target: torch.nn.Identity
65
+
66
+ cond_stage_config:
67
+ target: latent_diffusion.ldm.modules.encoders.modules.GPTEmbedder
68
+ params:
69
+ n_embed: 768
70
+ n_layer: 12
71
+
72
+ data:
73
+ target: data.data_processing.datasets.DataModule
74
+ params:
75
+ batch_size: 64
76
+ num_workers: 4
77
+ wrap: false
78
+ shuffle: True
79
+ drop_last: True
80
+ pin_memory: True
81
+ prefetch_factor: 2
82
+ persistent_workers: True
83
+ train:
84
+ target: data.data_processing.datasets.ActionsData
85
+ params:
86
+ data_csv_path: train_dataset/train_dataset_14frames_firstframe_allframes.csv
87
+ #validation:
88
+ # target: data.data_processing.datasets.ActionsData
89
+ # params:
90
+ # data_csv_path: train_dataset/train_dataset_14frames_firstframe_allframes.csv
91
+
92
+ lightning:
93
+ trainer:
94
+ benchmark: False
95
+ max_epochs: 64
96
+ limit_val_batches: 0
97
+ accelerator: gpu
98
+ gpus: 1
99
+ accumulate_grad_batches: 1
100
+ gradient_clip_val: 1
101
+ checkpoint_callback: True