da03 committed
Commit · 837289b
1 Parent(s): f2aec00
- config_rnn_measure_latency.yaml +108 -0
- main.py +1 -1
- utils.py +7 -7
config_rnn_measure_latency.yaml
ADDED
@@ -0,0 +1,108 @@
+save_path: saved_standard_challenging_context32_nocond_cont_cont_all_cont_eval
+
+model:
+  base_learning_rate: 8.0e-05
+  target: ldm.models.diffusion.ddpm.LatentDiffusion
+  params:
+    linear_start: 0.0015
+    linear_end: 0.0195
+    num_timesteps_cond: 1
+    log_every_t: 200
+    timesteps: 1000
+    first_stage_key: image
+    cond_stage_key: action_
+    scheduler_sampling_rate: 0.0
+    hybrid_key: c_concat
+    image_size: [64, 48]
+    channels: 3
+    cond_stage_trainable: false
+    conditioning_key: hybrid
+    monitor: val/loss_simple_ema
+
+    unet_config:
+      target: ldm.modules.diffusionmodules.openaimodel.UNetModel
+      params:
+        image_size: [64, 48]
+        in_channels: 8
+        out_channels: 4
+        model_channels: 192
+        attention_resolutions:
+        - 8
+        - 4
+        - 2
+        num_res_blocks: 2
+        channel_mult:
+        - 1
+        - 2
+        - 3
+        num_head_channels: 32
+        use_spatial_transformer: false
+        transformer_depth: 1
+
+    temporal_encoder_config:
+      target: ldm.modules.encoders.temporal_encoder.TemporalEncoder
+      params:
+        input_channels: 6
+        hidden_size: 1024
+        num_layers: 1
+        dropout: 0.1
+        output_channels: 4
+        output_height: 48
+        output_width: 64
+
+    first_stage_config:
+      target: ldm.models.autoencoder.AutoencoderKL
+      params:
+        embed_dim: 4
+        monitor: val/rec_loss
+        ddconfig:
+          double_z: true
+          z_channels: 4
+          resolution: 256
+          in_channels: 3
+          out_ch: 3
+          ch: 128
+          ch_mult:
+          - 1
+          - 2
+          - 4
+          - 4
+          num_res_blocks: 2
+          attn_resolutions: []
+          dropout: 0.0
+        lossconfig:
+          target: torch.nn.Identity
+
+    cond_stage_config: __is_unconditional__
+
+data:
+  target: data.data_processing.datasets.DataModule
+  params:
+    batch_size: 8
+    num_workers: 1
+    wrap: false
+    shuffle: True
+    drop_last: True
+    pin_memory: True
+    prefetch_factor: 2
+    persistent_workers: True
+    train:
+      target: data.data_processing.datasets.ActionsData
+      params:
+        data_csv_path: desktop_sequences_filtered_with_desktop_1.5k.challenging.train.target_frames.csv
+        normalization: standard
+        context_length: 32
+    #validation:
+    #  target: data.data_processing.datasets.ActionsData
+    #  params:
+
+lightning:
+  trainer:
+    benchmark: False
+    max_epochs: 6400
+    limit_val_batches: 0
+    accelerator: gpu
+    gpus: 1
+    accumulate_grad_batches: 999999
+    gradient_clip_val: 1
+    checkpoint_callback: True
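
For orientation, a minimal sketch of how a config like this is consumed, mirroring the OmegaConf.load and instantiate_from_config calls visible in utils.py below. The ldm.util import path is an assumption (the actual imports fall outside this diff).

# Sketch only: build the LatentDiffusion model described by the new config.
# Assumes instantiate_from_config lives in ldm.util, as in the upstream
# latent-diffusion codebase; this repo's real import is not shown in the diff.
from omegaconf import OmegaConf
from ldm.util import instantiate_from_config

config = OmegaConf.load("config_rnn_measure_latency.yaml")
model = instantiate_from_config(config.model)  # target: ldm.models.diffusion.ddpm.LatentDiffusion
print(sum(p.numel() for p in model.parameters()), "parameters")
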
main.py
CHANGED
@@ -27,7 +27,7 @@ LATENT_DIMS = (4, SCREEN_HEIGHT // 8, SCREEN_WIDTH // 8)
 device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')
 # Initialize the model at the start of your application
 #model = initialize_model("config_csllm.yaml", "yuntian-deng/computer-model")
-model = initialize_model("
+model = initialize_model("config_rnn_measure_latency.yaml", "yuntian-deng/computer-model")
 
 device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')
 model = model.to(device)
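
Given the config's measure_latency name, a hedged sketch of timing the initialization path main.py now exercises. The module that provides initialize_model is an assumption; its definition is outside this diff.

# Illustrative only: time model construction plus device transfer with the new config.
import time
import torch
from utils import initialize_model  # assumption: initialize_model is importable from utils

start = time.perf_counter()
model = initialize_model("config_rnn_measure_latency.yaml", "yuntian-deng/computer-model")
model = model.to(torch.device('cuda' if torch.cuda.is_available() else 'cpu'))
print(f"init + transfer: {time.perf_counter() - start:.2f}s")
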
utils.py
CHANGED
@@ -10,7 +10,7 @@ import os
 import time
 DEBUG = False
 
-def load_model_from_config(config_path, model_name, device='cuda'):
+def load_model_from_config(config_path, model_name, device='cuda', load=False):
     # Load the config file
     config = OmegaConf.load(config_path)
 
@@ -18,12 +18,12 @@ def load_model_from_config(config_path, model_name, device='cuda'):
     model = instantiate_from_config(config.model)
 
     # Download the model file from Hugging Face
-
-
-
-
-
-
+    if load:
+        model_file = hf_hub_download(repo_id=model_name, filename="model.safetensors", token=os.getenv('HF_TOKEN'))
+        print(f"Loading model from {model_name}")
+        # Load the state dict
+        state_dict = torch.load(model_file, map_location='cpu')
+        model.load_state_dict(state_dict, strict=True)
 
     model.to(device)
     model.eval()
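
A hedged usage sketch of the updated signature, assuming load_model_from_config returns the constructed model (the return statement falls outside this hunk). With load=False, the new default, only the architecture described by the config is built, which is enough for latency measurement; load=True additionally downloads model.safetensors from the Hub, using HF_TOKEN if the repo is gated.

from utils import load_model_from_config  # assumption: utils.py is importable as a module

# Architecture only (new default): no download, random weights -- sufficient for latency tests.
model = load_model_from_config("config_rnn_measure_latency.yaml",
                               "yuntian-deng/computer-model", device='cpu')

# With pretrained weights pulled from the Hugging Face Hub:
# model = load_model_from_config("config_rnn_measure_latency.yaml",
#                                "yuntian-deng/computer-model", device='cuda', load=True)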