xizaoqu committed on
Commit
e8305b5
·
1 Parent(s): 0f2b975
Files changed (2)
  1. algorithms/worldmem/df_video.py +3 -0
  2. app.py +9 -11
algorithms/worldmem/df_video.py CHANGED
@@ -797,13 +797,16 @@ class WorldMemMinecraft(DiffusionForcingBase):
797
  condition_similar_length = self.condition_similar_length
798
 
799
  if self_frames is None:
 
800
  first_frame_encode = self.encode(first_frame[None, None].to(device))
801
  self_frames = first_frame_encode.cpu()
 
802
  self.actions = curr_actions[None, None].to(device)
803
  self_poses = first_pose[None, None].to(device)
804
  new_c2w_mat = euler_to_camera_to_world_matrix(first_pose)
805
  self_memory_c2w = new_c2w_mat[None, None].to(device)
806
  self_frame_idx = torch.tensor([[context_frames_idx]]).to(device)
 
807
  return first_frame, self_frames, self_poses, self_memory_c2w, self_frame_idx
808
  else:
809
  last_frame = self_frames[-1].clone()
 
797
  condition_similar_length = self.condition_similar_length
798
 
799
  if self_frames is None:
800
+ print("inside1", device)
801
  first_frame_encode = self.encode(first_frame[None, None].to(device))
802
  self_frames = first_frame_encode.cpu()
803
+ print("inside2", device)
804
  self.actions = curr_actions[None, None].to(device)
805
  self_poses = first_pose[None, None].to(device)
806
  new_c2w_mat = euler_to_camera_to_world_matrix(first_pose)
807
  self_memory_c2w = new_c2w_mat[None, None].to(device)
808
  self_frame_idx = torch.tensor([[context_frames_idx]]).to(device)
809
+ print("inside3")
810
  return first_frame, self_frames, self_poses, self_memory_c2w, self_frame_idx
811
  else:
812
  last_frame = self_frames[-1].clone()
app.py CHANGED
@@ -257,7 +257,6 @@ def reset():
257
  global self_memory_c2w
258
  global self_frame_idx
259
 
260
- print("self_frame_idx:", self_frame_idx)
261
  # worldmem.reset()
262
  self_frames = None
263
  self_poses = None
@@ -268,16 +267,15 @@ def reset():
268
  memory_curr_frame = 0
269
  input_history = ""
270
 
271
- self_frame_idx = 1
272
- # _, self_frames, self_poses, self_memory_c2w, self_frame_idx = run_interactive(memory_frames[0],
273
- # actions[0],
274
- # poses[0],
275
- # memory_curr_frame,
276
- # device=device,
277
- # self_frames=self_frames,
278
- # self_poses=self_poses,
279
- # self_memory_c2w=self_memory_c2w,
280
- # self_frame_idx=self_frame_idx)
281
 
282
 
283
 
 
257
  global self_memory_c2w
258
  global self_frame_idx
259
 
 
260
  # worldmem.reset()
261
  self_frames = None
262
  self_poses = None
 
267
  memory_curr_frame = 0
268
  input_history = ""
269
 
270
+ _, self_frames, self_poses, self_memory_c2w, self_frame_idx = run_interactive(memory_frames[0],
271
+ actions[0],
272
+ poses[0],
273
+ memory_curr_frame,
274
+ device=device,
275
+ self_frames=self_frames,
276
+ self_poses=self_poses,
277
+ self_memory_c2w=self_memory_c2w,
278
+ self_frame_idx=self_frame_idx)
 
279
 
280
 
281