xizaoqu
committed on
Commit
·
e8305b5
1
Parent(s):
0f2b975
update
Browse files
- algorithms/worldmem/df_video.py +3 -0
- app.py +9 -11
algorithms/worldmem/df_video.py
CHANGED
@@ -797,13 +797,16 @@ class WorldMemMinecraft(DiffusionForcingBase):
|
|
797 |
condition_similar_length = self.condition_similar_length
|
798 |
|
799 |
if self_frames is None:
|
|
|
800 |
first_frame_encode = self.encode(first_frame[None, None].to(device))
|
801 |
self_frames = first_frame_encode.cpu()
|
|
|
802 |
self.actions = curr_actions[None, None].to(device)
|
803 |
self_poses = first_pose[None, None].to(device)
|
804 |
new_c2w_mat = euler_to_camera_to_world_matrix(first_pose)
|
805 |
self_memory_c2w = new_c2w_mat[None, None].to(device)
|
806 |
self_frame_idx = torch.tensor([[context_frames_idx]]).to(device)
|
|
|
807 |
return first_frame, self_frames, self_poses, self_memory_c2w, self_frame_idx
|
808 |
else:
|
809 |
last_frame = self_frames[-1].clone()
|
|
|
797 |
condition_similar_length = self.condition_similar_length
|
798 |
|
799 |
if self_frames is None:
|
800 |
+
print("inside1", device)
|
801 |
first_frame_encode = self.encode(first_frame[None, None].to(device))
|
802 |
self_frames = first_frame_encode.cpu()
|
803 |
+
print("inside2", device)
|
804 |
self.actions = curr_actions[None, None].to(device)
|
805 |
self_poses = first_pose[None, None].to(device)
|
806 |
new_c2w_mat = euler_to_camera_to_world_matrix(first_pose)
|
807 |
self_memory_c2w = new_c2w_mat[None, None].to(device)
|
808 |
self_frame_idx = torch.tensor([[context_frames_idx]]).to(device)
|
809 |
+
print("inside3")
|
810 |
return first_frame, self_frames, self_poses, self_memory_c2w, self_frame_idx
|
811 |
else:
|
812 |
last_frame = self_frames[-1].clone()
|
app.py
CHANGED
@@ -257,7 +257,6 @@ def reset():
|
|
257 |
global self_memory_c2w
|
258 |
global self_frame_idx
|
259 |
|
260 |
-
print("self_frame_idx:", self_frame_idx)
|
261 |
# worldmem.reset()
|
262 |
self_frames = None
|
263 |
self_poses = None
|
@@ -268,16 +267,15 @@ def reset():
|
|
268 |
memory_curr_frame = 0
|
269 |
input_history = ""
|
270 |
|
271 |
-
self_frame_idx =
|
272 |
-
|
273 |
-
|
274 |
-
|
275 |
-
|
276 |
-
|
277 |
-
|
278 |
-
|
279 |
-
|
280 |
-
# self_frame_idx=self_frame_idx)
|
281 |
|
282 |
|
283 |
|
|
|
257 |
global self_memory_c2w
|
258 |
global self_frame_idx
|
259 |
|
|
|
260 |
# worldmem.reset()
|
261 |
self_frames = None
|
262 |
self_poses = None
|
|
|
267 |
memory_curr_frame = 0
|
268 |
input_history = ""
|
269 |
|
270 |
+
_, self_frames, self_poses, self_memory_c2w, self_frame_idx = run_interactive(memory_frames[0],
|
271 |
+
actions[0],
|
272 |
+
poses[0],
|
273 |
+
memory_curr_frame,
|
274 |
+
device=device,
|
275 |
+
self_frames=self_frames,
|
276 |
+
self_poses=self_poses,
|
277 |
+
self_memory_c2w=self_memory_c2w,
|
278 |
+
self_frame_idx=self_frame_idx)
|
|
|
279 |
|
280 |
|
281 |
|