87 changes: 87 additions & 0 deletions egomimic/rldb/embodiment/embodiment.py
@@ -1,7 +1,12 @@
import copy
from abc import ABC
from enum import Enum

import numpy as np
import torch

from egomimic.rldb.zarr.action_chunk_transforms import Transform
from egomimic.utils.type_utils import _to_numpy


class EMBODIMENT(Enum):
@@ -53,3 +58,85 @@ def viz_transformed_batch(batch):
    def get_keymap():
        """Returns a dictionary mapping from the raw keys in the dataset to the canonical keys used by the model."""
        raise NotImplementedError

    @classmethod
    def viz_gt_preds(
        cls,
        predictions,
        batch,
        image_key,
        action_key,
        transform_list=None,
        mode="cartesian",
        **kwargs,
    ):
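        """Overlay ground-truth and predicted actions on each image in the batch.

        Ground truth is drawn in red and predictions in green; returns the
        annotated images stacked along the batch dimension.
        """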
        embodiment_id = batch["embodiment"][0].item()
        embodiment_name = get_embodiment(embodiment_id).lower()

        # TODO: make this work with groundtruth, clone batch and replace
        # actions_keypoints with pred_actions
        pred_actions = predictions[f"{embodiment_name}_{action_key}"]
        if transform_list is not None:
            pred_batch = copy.deepcopy(batch)
            pred_batch[action_key] = pred_actions
            batch = cls.apply_transform(batch, transform_list)
            pred_batch = cls.apply_transform(pred_batch, transform_list)
            pred_actions = pred_batch[action_key]

        images = _to_numpy(batch[image_key])
        actions = _to_numpy(batch[action_key])
        pred_actions = _to_numpy(pred_actions)

        ims_list = []
        for i in range(images.shape[0]):
            image = images[i]
            action = actions[i]
            pred_action = pred_actions[i]
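            # Draw ground truth in red first, then predictions in green on the
            # same frame so the two trajectories can be compared directly.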
            ims = cls.viz(image, action, mode=mode, color="Reds", **kwargs)
            ims = cls.viz(ims, pred_action, mode=mode, color="Greens", **kwargs)
            ims_list.append(ims)
        return np.stack(ims_list, axis=0)

    @classmethod
    def apply_transform(cls, batch, transform_list: list[Transform]):
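        """Apply each Transform in `transform_list` to `batch`.

        Transforms are applied per-sample when a batch size can be inferred,
        mirroring how ZarrDataset applies them; numpy arrays are converted to
        float32 torch tensors before returning.
        """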
        if transform_list:
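            # Infer the batch size from the first array-valued entry.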
            batch_size = None
            for v in batch.values():
                if isinstance(v, (np.ndarray, torch.Tensor)):
                    batch_size = v.shape[0]
                    break

            if batch_size is not None:
                # Apply transforms per-sample (matching how ZarrDataset applies them)
                results = []
                for i in range(batch_size):
                    sample = {
                        k: (v[i].cpu().numpy() if isinstance(v, torch.Tensor) else v[i])
                        if isinstance(v, (np.ndarray, torch.Tensor))
                        else v
                        for k, v in batch.items()
                    }
                    for transform in transform_list:
                        sample = transform.transform(sample)
                    results.append(sample)

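                # Re-collate the per-sample results back into a batch dict.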
                batch = {}
                for k in results[0]:
                    vals = [r[k] for r in results]
                    if isinstance(vals[0], np.ndarray):
                        batch[k] = np.stack(vals, axis=0)
                    elif isinstance(vals[0], torch.Tensor):
                        batch[k] = torch.stack(vals, dim=0)
                    else:
                        batch[k] = vals
            else:
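                # No array-valued entries found: transform the batch dict as-is.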
                for transform in transform_list:
                    batch = transform.transform(batch)

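        # Convert any numpy arrays to float32 torch tensors for the model.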
        for k, v in batch.items():
            if isinstance(v, np.ndarray):
                batch[k] = torch.from_numpy(v).to(torch.float32)

        return batch
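
For reference, a minimal sketch of how these classmethods might be driven from an evaluation loop. `AlohaEmbodiment`, the key names, and `build_eval_transforms` are illustrative assumptions, not part of this PR:

# Hypothetical usage sketch; every name below is an assumption, not from this diff.
predictions = model(batch)  # assumed: dict with f"{embodiment}_{action_key}" entries

imgs = AlohaEmbodiment.viz_gt_preds(  # assumed concrete embodiment subclass
    predictions,
    batch,  # raw batch containing an "embodiment" id tensor
    image_key="front_img_1",  # assumed camera key
    action_key="actions_keypoints",
    transform_list=build_eval_transforms(),  # assumed helper returning list[Transform]
    mode="cartesian",
)
# imgs: numpy array of annotated frames, ground truth in red, predictions in green.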