87 changes: 87 additions & 0 deletions egomimic/rldb/embodiment/embodiment.py
@@ -1,7 +1,12 @@
import copy
from abc import ABC
from enum import Enum

import numpy as np
import torch

from egomimic.rldb.zarr.action_chunk_transforms import Transform
from egomimic.utils.type_utils import _to_numpy


class EMBODIMENT(Enum):
@@ -53,3 +58,85 @@ def viz_transformed_batch(batch):
    def get_keymap():
        """Returns a dictionary mapping from the raw keys in the dataset to the canonical keys used by the model."""
        raise NotImplementedError

    @classmethod
    def viz_gt_preds(
        cls,
        predictions,
        batch,
        image_key,
        action_key,
        transform_list=None,
        mode="cartesian",
        **kwargs,
    ):
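        """Overlay ground-truth and predicted actions on each image in the batch.

        Ground truth is drawn in red and predictions in green; returns the
        annotated images stacked along the batch dimension.
        """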
        embodiment_id = batch["embodiment"][0].item()
        embodiment_name = get_embodiment(embodiment_id).lower()

        # TODO: make this work with groundtruth, clone batch and replace
        # actions_keypoints with pred_actions
        pred_actions = predictions[f"{embodiment_name}_{action_key}"]
        if transform_list is not None:
            pred_batch = copy.deepcopy(batch)
            pred_batch[action_key] = pred_actions
            batch = cls.apply_transform(batch, transform_list)
            pred_batch = cls.apply_transform(pred_batch, transform_list)
            pred_actions = pred_batch[action_key]

        images = _to_numpy(batch[image_key])
        actions = _to_numpy(batch[action_key])
        pred_actions = _to_numpy(pred_actions)

        ims_list = []
        for i in range(images.shape[0]):
            image = images[i]
            action = actions[i]
            pred_action = pred_actions[i]
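            # Draw ground truth in red first, then predictions in green on the
            # same frame so the two trajectories can be compared directly.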
            ims = cls.viz(image, action, mode=mode, color="Reds", **kwargs)
            ims = cls.viz(ims, pred_action, mode=mode, color="Greens", **kwargs)
            ims_list.append(ims)
        return np.stack(ims_list, axis=0)

    @classmethod
    def apply_transform(cls, batch, transform_list: list[Transform]):
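        """Apply each Transform in `transform_list` to `batch`.

        Transforms are applied per-sample when a batch size can be inferred,
        mirroring how ZarrDataset applies them; numpy arrays are converted to
        float32 torch tensors before returning.
        """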
        if transform_list:
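            # Infer the batch size from the first array-valued entry.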
            batch_size = None
            for v in batch.values():
                if isinstance(v, (np.ndarray, torch.Tensor)):
                    batch_size = v.shape[0]
                    break

            if batch_size is not None:
                # Apply transforms per-sample (matching how ZarrDataset applies them)
                results = []
                for i in range(batch_size):
                    sample = {
                        k: (v[i].cpu().numpy() if isinstance(v, torch.Tensor) else v[i])
                        if isinstance(v, (np.ndarray, torch.Tensor))
                        else v
                        for k, v in batch.items()
                    }
                    for transform in transform_list:
                        sample = transform.transform(sample)
                    results.append(sample)

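                # Re-collate the per-sample results back into a batch dict.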
                batch = {}
                for k in results[0]:
                    vals = [r[k] for r in results]
                    if isinstance(vals[0], np.ndarray):
                        batch[k] = np.stack(vals, axis=0)
                    elif isinstance(vals[0], torch.Tensor):
                        batch[k] = torch.stack(vals, dim=0)
                    else:
                        batch[k] = vals
            else:
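                # No array-valued entries found: transform the batch dict as-is.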
                for transform in transform_list:
                    batch = transform.transform(batch)

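        # Convert any numpy arrays to float32 torch tensors for the model.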
        for k, v in batch.items():
            if isinstance(v, np.ndarray):
                batch[k] = torch.from_numpy(v).to(torch.float32)

        return batch
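
For reference, a minimal sketch of how these classmethods might be driven from an evaluation loop. `AlohaEmbodiment`, the key names, and `build_eval_transforms` are illustrative assumptions, not part of this PR:

# Hypothetical usage sketch; every name below is an assumption, not from this diff.
predictions = model(batch)  # assumed: dict with f"{embodiment}_{action_key}" entries

imgs = AlohaEmbodiment.viz_gt_preds(  # assumed concrete embodiment subclass
    predictions,
    batch,  # raw batch containing an "embodiment" id tensor
    image_key="front_img_1",  # assumed camera key
    action_key="actions_keypoints",
    transform_list=build_eval_transforms(),  # assumed helper returning list[Transform]
    mode="cartesian",
)
# imgs: numpy array of annotated frames, ground truth in red, predictions in green.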