Frame
dreem.io.Frame
Data structure containing metadata for a single frame of a video.
Attributes:

Name | Type | Description |
---|---|---|
video_id | Tensor | The video index in the dataset. |
frame_id | Tensor | The index of the frame in a video. |
vid_file | str | The path to the video the frame is from. |
img_shape | Tensor | The shape of the original frame (not the crop). |
instances | list['Instance'] | A list of Instance objects that appear in the frame. |
asso_output | 'AssociationMatrix' | The association matrix between instances output directly from the transformer. |
matches | tuple | Matches from the LSA algorithm between the instances and available trajectories during tracking. |
traj_score | dict | Either a dict containing the association matrices between instances and trajectories at each stage of the postprocessing pipeline, or a single association matrix. |
device | str | The device the frame should be moved to. |
Source code in dreem/io/frame.py
@attrs.define(eq=False)
class Frame:
"""Data structure containing metadata for a single frame of a video.
Attributes:
video_id: The video index in the dataset.
frame_id: The index of the frame in a video.
vid_file: The path to the video the frame is from.
img_shape: The shape of the original frame (not the crop).
instances: A list of Instance objects that appear in the frame.
asso_output: The association matrix between instances
output directly from the transformer.
matches: matches from LSA algorithm between the instances and
available trajectories during tracking.
traj_score: Either a dict containing the association matrix
between instances and trajectories along postprocessing pipeline
or a single association matrix.
device: The device the frame should be moved to.
"""
_video_id: int = attrs.field(alias="video_id", converter=_to_tensor)
_frame_id: int = attrs.field(alias="frame_id", converter=_to_tensor)
_video: str = attrs.field(alias="vid_file", default="")
_img_shape: ArrayLike = attrs.field(
alias="img_shape", converter=_to_tensor, factory=list
)
_instances: list["Instance"] = attrs.field(alias="instances", factory=list)
_asso_output: "AssociationMatrix" | None = attrs.field(
alias="asso_output", default=None
)
_matches: tuple = attrs.field(alias="matches", factory=tuple)
_traj_score: dict = attrs.field(alias="traj_score", factory=dict)
_device: str | torch.device | None = attrs.field(alias="device", default=None)
def __attrs_post_init__(self) -> None:
"""Handle more intricate default initializations and moving to device."""
if len(self.img_shape) == 0:
self.img_shape = torch.tensor([0, 0, 0])
for instance in self.instances:
instance.frame = self
self.to(self.device)
def __repr__(self) -> str:
"""Return String representation of the Frame.
Returns:
The string representation of the frame.
"""
return (
"Frame("
f"video={self._video.filename if isinstance(self._video, sio.Video) else self._video}, "
f"video_id={self._video_id.item()}, "
f"frame_id={self._frame_id.item()}, "
f"img_shape={self._img_shape}, "
f"num_detected={self.num_detected}, "
f"asso_output={self._asso_output}, "
f"traj_score={self._traj_score}, "
f"matches={self._matches}, "
f"instances={self._instances}, "
f"device={self._device}"
")"
)
def to(self, map_location: str | torch.device) -> Self:
"""Move frame to different device or dtype (See `torch.to` for more info).
Args:
map_location: A string representing the device to move to.
Returns:
The frame moved to a different device/dtype.
"""
self._video_id = self._video_id.to(map_location)
self._frame_id = self._frame_id.to(map_location)
self._img_shape = self._img_shape.to(map_location)
if isinstance(self._asso_output, torch.Tensor):
self._asso_output = self._asso_output.to(map_location)
if isinstance(self._matches, torch.Tensor):
self._matches = self._matches.to(map_location)
for key, val in self._traj_score.items():
if isinstance(val, torch.Tensor):
self._traj_score[key] = val.to(map_location)
for instance in self.instances:
instance = instance.to(map_location)
if isinstance(map_location, (str, torch.device)):
self._device = map_location
return self
@classmethod
def from_slp(
cls,
lf: sio.LabeledFrame,
video_id: int = 0,
device: str | None = None,
**kwargs,
) -> Self:
"""Convert `sio.LabeledFrame` to `dreem.io.Frame`.
Args:
lf: A sio.LabeledFrame object
Returns:
A dreem.io.Frame object
"""
from dreem.io import Instance
img_shape = lf.image.shape
if len(img_shape) == 2:
img_shape = (1, *img_shape)
elif len(img_shape) > 2 and img_shape[-1] <= 3:
img_shape = (lf.image.shape[-1], lf.image.shape[0], lf.image.shape[1])
return cls(
video_id=video_id,
frame_id=(
lf.frame_idx.astype(np.int32)
if isinstance(lf.frame_idx, np.number)
else lf.frame_idx
),
vid_file=lf.video.filename,
img_shape=img_shape,
instances=[Instance.from_slp(instance, **kwargs) for instance in lf],
device=device,
)
def to_slp(
self,
track_lookup: dict[int, sio.Track] | None = None,
video: sio.Video | None = None,
) -> tuple[sio.LabeledFrame, dict[int, sio.Track]]:
"""Convert Frame to sleap_io.LabeledFrame object.
Args:
track_lookup: A lookup dictionary containing the track_id and sio.Track for persistence
video: An sio.Video object used for overriding.
Returns: A tuple containing a LabeledFrame object with necessary metadata and
a lookup dictionary containing the track_id and sio.Track for persistence
"""
if track_lookup is None:
track_lookup = {}
slp_instances = []
for instance in self.instances:
slp_instance, track_lookup = instance.to_slp(track_lookup=track_lookup)
slp_instances.append(slp_instance)
if video is None:
video = (
self.video
if isinstance(self.video, sio.Video)
else sio.load_video(self.video)
)
return (
sio.LabeledFrame(
video=video,
frame_idx=self.frame_id.item(),
instances=slp_instances,
),
track_lookup,
)
def to_h5(
self,
clip_group: h5py.Group,
instance_labels: list | None = None,
save: dict[str, bool] | None = None,
) -> h5py.Group:
"""Convert frame to h5py group.
Args:
clip_group: the h5py group representing the clip (e.g batch/video) the frame belongs to
instance_labels: the labels used to create instance group names
save: whether to save crops, features and embeddings for the instance
Returns:
An h5py group containing the frame
"""
if save is None:
save = {"crop": False, "features": False, "embeddings": False}
frame_group = clip_group.require_group(f"frame_{self.frame_id.item()}")
frame_group.attrs.create("frame_id", self.frame_id.item())
frame_group.attrs.create("vid_id", self.video_id.item())
frame_group.attrs.create("vid_name", self.vid_name)
frame_group.create_dataset(
"asso_matrix",
data=self.asso_output.numpy() if self.asso_output is not None else [],
)
asso_group = frame_group.require_group("traj_scores")
for key, value in self.get_traj_score().items():
asso_group.create_dataset(
key, data=value.to_numpy() if value is not None else []
)
if instance_labels is None:
instance_labels = self.get_gt_track_ids().cpu().numpy()
for instance_label, instance in zip(instance_labels, self.instances):
kwargs = {}
if save.get("crop", False):
kwargs["crop"] = instance.crop.cpu().numpy()
if save.get("features", False):
kwargs["features"] = instance.features.cpu().numpy()
if save.get("embeddings", False):
for key, val in instance.get_embedding().items():
kwargs[f"{key}_emb"] = val.cpu().numpy()
_ = instance.to_h5(frame_group, f"instance_{instance_label}", **kwargs)
return frame_group
@property
def device(self) -> str:
"""The device the frame is on.
Returns:
The string representation of the device the frame is on.
"""
return self._device
@device.setter
def device(self, device: str) -> None:
"""Set the device.
Note: Do not set `frame.device = device` normally. Use `frame.to(device)` instead.
Args:
device: the device the function should be on.
"""
self._device = device
@property
def video_id(self) -> torch.Tensor:
"""The index of the video the frame comes from.
Returns:
A tensor containing the video index.
"""
return self._video_id
@video_id.setter
def video_id(self, video_id: int) -> None:
"""Set the video index.
Note: Generally the video_id should be immutable after initialization.
Args:
video_id: an int representing the index of the video that the frame came from.
"""
self._video_id = torch.tensor([video_id])
@property
def frame_id(self) -> torch.Tensor:
"""The index of the frame in a full video.
Returns:
A torch tensor containing the index of the frame in the video.
"""
return self._frame_id
@frame_id.setter
def frame_id(self, frame_id: int) -> None:
"""Set the frame index of the frame.
Note: The frame_id should generally be immutable after initialization.
Args:
frame_id: The int index of the frame in the full video.
"""
self._frame_id = torch.tensor([frame_id])
@property
def video(self) -> sio.Video | str:
"""Get the video associated with the frame.
Returns: An sio.Video object representing the video or a placeholder string
if it is not possible to create the sio.Video
"""
return self._video
@video.setter
def video(self, video: sio.Video | str) -> None:
"""Set the video associated with the frame.
Note: we try to store the video in an sio.Video object.
However, if this is not possible (e.g. incompatible format or missing filepath)
then we simply store the string.
Args:
video: sio.Video containing the vid reader or string path to video_file
"""
if isinstance(video, sio.Video):
self._video = video
else:
try:
self._video = sio.load_video(video)
except ValueError:
self._video = video
@property
def vid_name(self) -> str:
"""Get the path to the video corresponding to this frame.
Returns: A str file path corresponding to the frame.
"""
if isinstance(self.video, str):
return self.video
else:
return self.video.name
@property
def img_shape(self) -> torch.Tensor:
"""The shape of the pre-cropped frame.
Returns:
A torch tensor containing the shape of the frame. Should generally be (c, h, w)
"""
return self._img_shape
@img_shape.setter
def img_shape(self, img_shape: ArrayLike) -> None:
"""Set the shape of the frame image.
Note: the img_shape should generally be immutable after initialization.
Args:
img_shape: an ArrayLike object containing the shape of the frame image.
"""
self._img_shape = _to_tensor(img_shape)
@property
def instances(self) -> list["Instance"]:
"""A list of instances in the frame.
Returns:
The list of instances that appear in the frame.
"""
return self._instances
@instances.setter
def instances(self, instances: list["Instance"]) -> None:
"""Set the frame's instance.
Args:
instances: A list of Instances that appear in the frame.
"""
for instance in instances:
instance.frame = self
self._instances = instances
def has_instances(self) -> bool:
"""Determine whether there are instances in the frame.
Returns:
True if there are instances in the frame, otherwise False.
"""
if self.num_detected == 0:
return False
return True
@property
def num_detected(self) -> int:
"""The number of instances in the frame.
Returns:
the number of instances in the frame.
"""
return len(self.instances)
@property
def asso_output(self) -> "AssociationMatrix":
"""The association matrix between instances outputed directly by transformer.
Returns:
An arraylike (n_query, n_nonquery) association matrix between instances.
"""
return self._asso_output
def has_asso_output(self) -> bool:
"""Determine whether the frame has an association matrix computed.
Returns:
True if the frame has an association matrix otherwise, False.
"""
if self._asso_output is None or len(self._asso_output.matrix) == 0:
return False
return True
@asso_output.setter
def asso_output(self, asso_output: "AssociationMatrix") -> None:
"""Set the association matrix of a frame.
Args:
asso_output: An arraylike (n_query, n_nonquery) association matrix between instances.
"""
self._asso_output = asso_output
@property
def matches(self) -> tuple:
"""Matches between frame instances and availabel trajectories.
Returns:
A tuple containing the instance idx and trajectory idx for the matched instance.
"""
return self._matches
@matches.setter
def matches(self, matches: tuple) -> None:
"""Set the frame matches.
Args:
matches: A tuple containing the instance idx and trajectory idx for the matched instance.
"""
self._matches = matches
def has_matches(self) -> bool:
"""Check whether or not matches have been computed for frame.
Returns:
True if frame contains matches otherwise False.
"""
if self._matches is not None and len(self._matches) > 0:
return True
return False
def get_traj_score(self, key: str | None = None) -> dict | ArrayLike | None:
"""Get dictionary containing association matrix between instances and trajectories along postprocessing pipeline.
Args:
key: The key of the trajectory score to be accessed.
Can be one of {None, 'initial', 'decay_time', 'max_center_dist', 'iou', 'final'}
Returns:
- dictionary containing all trajectory scores if key is None
- trajectory score associated with key
- None if the key is not found
"""
if key is None:
return self._traj_score
else:
try:
return self._traj_score[key]
except KeyError as e:
logger.exception(f"Could not access {key} traj_score due to {e}")
return None
def add_traj_score(self, key: str, traj_score: ArrayLike) -> None:
"""Add trajectory score to dictionary.
Args:
key: key associated with traj score to be used in dictionary
traj_score: association matrix between instances and trajectories
"""
self._traj_score[key] = traj_score
def has_traj_score(self) -> bool:
"""Check if any trajectory association matrix has been saved.
Returns:
True if there is at least one association matrix, otherwise False.
"""
if len(self._traj_score) == 0:
return False
return True
def has_gt_track_ids(self) -> bool:
"""Check if any of frames instances has a gt track id.
Returns:
True if at least 1 instance has a gt track id otherwise False.
"""
if self.has_instances():
return any([instance.has_gt_track_id() for instance in self.instances])
return False
def get_gt_track_ids(self) -> torch.Tensor:
"""Get the gt track ids of all instances in the frame.
Returns:
an (N,) shaped tensor with the gt track ids of each instance in the frame.
"""
if not self.has_instances():
return torch.tensor([])
return torch.cat([instance.gt_track_id for instance in self.instances])
def has_pred_track_ids(self) -> bool:
"""Check if any of frames instances has a pred track id.
Returns:
True if at least 1 instance has a pred track id otherwise False.
"""
if self.has_instances():
return any([instance.has_pred_track_id() for instance in self.instances])
return False
def get_pred_track_ids(self) -> torch.Tensor:
"""Get the pred track ids of all instances in the frame.
Returns:
an (N,) shaped tensor with the pred track ids of each instance in the frame.
"""
if not self.has_instances():
return torch.tensor([])
return torch.cat([instance.pred_track_id for instance in self.instances])
def has_bboxes(self) -> bool:
"""Check if any of frames instances has a bounding box.
Returns:
True if at least 1 instance has a bounding box otherwise False.
"""
if self.has_instances():
return any([instance.has_bboxes() for instance in self.instances])
return False
def get_bboxes(self) -> torch.Tensor:
"""Get the bounding boxes of all instances in the frame.
Returns:
an (N,4) shaped tensor with bounding boxes of each instance in the frame.
"""
if not self.has_instances():
return torch.empty(0, 4)
return torch.cat([instance.bbox for instance in self.instances], dim=0)
def has_crops(self) -> bool:
"""Check if any of frames instances has a crop.
Returns:
True if at least 1 instance has a crop otherwise False.
"""
if self.has_instances():
return any([instance.has_crop() for instance in self.instances])
return False
def get_crops(self) -> torch.Tensor:
"""Get the crops of all instances in the frame.
Returns:
an (N, C, H, W) shaped tensor with crops of each instance in the frame.
"""
if not self.has_instances():
return torch.tensor([])
return torch.cat([instance.crop for instance in self.instances], dim=0)
def has_features(self) -> bool:
"""Check if any of frames instances has reid features already computed.
Returns:
True if at least 1 instance has reid features otherwise False.
"""
if self.has_instances():
return any([instance.has_features() for instance in self.instances])
return False
def get_features(self) -> torch.Tensor:
"""Get the reid feature vectors of all instances in the frame.
Returns:
an (N, D) shaped tensor with reid feature vectors of each instance in the frame.
"""
if not self.has_instances():
return torch.tensor([])
return torch.cat([instance.features for instance in self.instances], dim=0)
def get_anchors(self) -> list[str]:
"""Get the anchor names of instances in the frame.
Returns:
A list of anchor names used by the instances to get the crop.
"""
return [instance.anchor for instance in self.instances]
def get_centroids(self) -> tuple[list[str], ArrayLike]:
"""Get the centroids around which each instance's crop was formed.
Returns:
anchors: the node names for the corresponding point
points: an n_instances x 2 array containing the centroids
"""
anchors = [
anchor for instance in self.instances for anchor in instance.centroid.keys()
]
points = np.array(
[
point
for instance in self.instances
for point in instance.centroid.values()
]
)
return (anchors, points)
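
As a quick orientation, here is a minimal construction sketch with placeholder values; in practice frames are usually built via `from_slp` or the dataset loaders rather than by hand:

import torch
from dreem.io import Frame

# Placeholder values for illustration; ints are converted to tensors on init.
frame = Frame(
    video_id=0,
    frame_id=42,
    vid_file="video.mp4",
    img_shape=[1, 512, 512],  # (c, h, w)
    instances=[],
)
print(frame.num_detected)  # 0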
asso_output: 'AssociationMatrix'
property writable

The association matrix between instances output directly by the transformer.

Returns:

Type | Description |
---|---|
'AssociationMatrix' | An arraylike (n_query, n_nonquery) association matrix between instances. |

device: str
property writable

The device the frame is on.

Returns:

Type | Description |
---|---|
str | The string representation of the device the frame is on. |

frame_id: torch.Tensor
property writable

The index of the frame in a full video.

Returns:

Type | Description |
---|---|
Tensor | A torch tensor containing the index of the frame in the video. |

img_shape: torch.Tensor
property writable

The shape of the pre-cropped frame.

Returns:

Type | Description |
---|---|
Tensor | A torch tensor containing the shape of the frame. Should generally be (c, h, w). |

instances: list['Instance']
property writable

A list of instances in the frame.

Returns:

Type | Description |
---|---|
list['Instance'] | The list of instances that appear in the frame. |

matches: tuple
property writable

Matches between frame instances and available trajectories.

Returns:

Type | Description |
---|---|
tuple | A tuple containing the instance idx and trajectory idx for each matched instance. |

num_detected: int
property

The number of instances in the frame.

Returns:

Type | Description |
---|---|
int | The number of instances in the frame. |

vid_name: str
property

Get the path to the video corresponding to this frame.

Returns: A str file path corresponding to the frame.

video: sio.Video | str
property writable

Get the video associated with the frame.

Returns: An sio.Video object representing the video, or a placeholder string if it is not possible to create the sio.Video.

video_id: torch.Tensor
property writable

The index of the video the frame comes from.

Returns:

Type | Description |
---|---|
Tensor | A tensor containing the video index. |
__attrs_post_init__()

Handle more intricate default initializations and moving to device.

__repr__()

Return the string representation of the Frame.

Returns:

Type | Description |
---|---|
str | The string representation of the frame. |
Source code in dreem/io/frame.py
def __repr__(self) -> str:
"""Return String representation of the Frame.
Returns:
The string representation of the frame.
"""
return (
"Frame("
f"video={self._video.filename if isinstance(self._video, sio.Video) else self._video}, "
f"video_id={self._video_id.item()}, "
f"frame_id={self._frame_id.item()}, "
f"img_shape={self._img_shape}, "
f"num_detected={self.num_detected}, "
f"asso_output={self._asso_output}, "
f"traj_score={self._traj_score}, "
f"matches={self._matches}, "
f"instances={self._instances}, "
f"device={self._device}"
")"
)
add_traj_score(key, traj_score)

Add trajectory score to dictionary.

Parameters:

Name | Type | Description | Default |
---|---|---|---|
key | str | key associated with traj score to be used in dictionary | required |
traj_score | ArrayLike | association matrix between instances and trajectories | required |
Source code in dreem/io/frame.py
def add_traj_score(self, key: str, traj_score: ArrayLike) -> None:
    """Add trajectory score to dictionary.
    Args:
        key: key associated with traj score to be used in dictionary
        traj_score: association matrix between instances and trajectories
    """
    self._traj_score[key] = traj_score
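
A one-line usage sketch; `initial_scores` is a hypothetical association matrix produced earlier in the tracking step:

frame.add_traj_score("initial", initial_scores)  # retrievable via frame.get_traj_score("initial")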
from_slp(lf, video_id=0, device=None, **kwargs)
classmethod

Convert sio.LabeledFrame to dreem.io.Frame.

Parameters:

Name | Type | Description | Default |
---|---|---|---|
lf | LabeledFrame | A sio.LabeledFrame object | required |
video_id | int | The index of the video in the dataset. | 0 |
device | str | None | The device the frame should be moved to. | None |
**kwargs | | Keyword arguments passed through to Instance.from_slp for each instance. | {} |

Returns:

Type | Description |
---|---|
Self | A dreem.io.Frame object |
Source code in dreem/io/frame.py
@classmethod
def from_slp(
cls,
lf: sio.LabeledFrame,
video_id: int = 0,
device: str | None = None,
**kwargs,
) -> Self:
"""Convert `sio.LabeledFrame` to `dreem.io.Frame`.
Args:
lf: A sio.LabeledFrame object
Returns:
A dreem.io.Frame object
"""
from dreem.io import Instance
img_shape = lf.image.shape
if len(img_shape) == 2:
img_shape = (1, *img_shape)
elif len(img_shape) > 2 and img_shape[-1] <= 3:
img_shape = (lf.image.shape[-1], lf.image.shape[0], lf.image.shape[1])
return cls(
video_id=video_id,
frame_id=(
lf.frame_idx.astype(np.int32)
if isinstance(lf.frame_idx, np.number)
else lf.frame_idx
),
vid_file=lf.video.filename,
img_shape=img_shape,
instances=[Instance.from_slp(instance, **kwargs) for instance in lf],
device=device,
)
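
A brief usage sketch, assuming a SLEAP labels file at an illustrative path:

import sleap_io as sio
from dreem.io import Frame

labels = sio.load_slp("labels.slp")  # hypothetical path
frames = [Frame.from_slp(lf, video_id=0) for lf in labels.labeled_frames]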
get_anchors()

Get the anchor names of instances in the frame.

Returns:

Type | Description |
---|---|
list[str] | A list of anchor names used by the instances to get the crop. |
get_bboxes()

Get the bounding boxes of all instances in the frame.

Returns:

Type | Description |
---|---|
Tensor | an (N, 4) shaped tensor with bounding boxes of each instance in the frame. |
Source code in dreem/io/frame.py
def get_bboxes(self) -> torch.Tensor:
"""Get the bounding boxes of all instances in the frame.
Returns:
an (N,4) shaped tensor with bounding boxes of each instance in the frame.
"""
if not self.has_instances():
return torch.empty(0, 4)
return torch.cat([instance.bbox for instance in self.instances], dim=0)
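
A minimal usage sketch, assuming `frame` is a populated Frame:

boxes = frame.get_bboxes()  # (N, 4) tensor; an empty (0, 4) tensor when the frame has no instances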
get_centroids()

Get the centroids around which each instance's crop was formed.

Returns:

Name | Type | Description |
---|---|---|
anchors | list[str] | the node names for the corresponding points |
points | ArrayLike | an n_instances x 2 array containing the centroids |
Source code in dreem/io/frame.py
def get_centroids(self) -> tuple[list[str], ArrayLike]:
"""Get the centroids around which each instance's crop was formed.
Returns:
anchors: the node names for the corresponding point
points: an n_instances x 2 array containing the centroids
"""
anchors = [
anchor for instance in self.instances for anchor in instance.centroid.keys()
]
points = np.array(
[
point
for instance in self.instances
for point in instance.centroid.values()
]
)
return (anchors, points)
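
A short sketch of unpacking the return value (again assuming `frame` is a populated Frame):

anchors, points = frame.get_centroids()
# anchors: one node name per centroid; points: (n_instances, 2) array of centroid coordinates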
get_crops()

Get the crops of all instances in the frame.

Returns:

Type | Description |
---|---|
Tensor | an (N, C, H, W) shaped tensor with crops of each instance in the frame. |
Source code in dreem/io/frame.py
def get_crops(self) -> torch.Tensor:
    """Get the crops of all instances in the frame.
    Returns:
        an (N, C, H, W) shaped tensor with crops of each instance in the frame.
    """
    if not self.has_instances():
        return torch.tensor([])
    return torch.cat([instance.crop for instance in self.instances], dim=0)
get_features()

Get the reid feature vectors of all instances in the frame.

Returns:

Type | Description |
---|---|
Tensor | an (N, D) shaped tensor with reid feature vectors of each instance in the frame. |
Source code in dreem/io/frame.py
def get_features(self) -> torch.Tensor:
"""Get the reid feature vectors of all instances in the frame.
Returns:
an (N, D) shaped tensor with reid feature vectors of each instance in the frame.
"""
if not self.has_instances():
return torch.tensor([])
return torch.cat([instance.features for instance in self.instances], dim=0)
get_gt_track_ids()

Get the gt track ids of all instances in the frame.

Returns:

Type | Description |
---|---|
Tensor | an (N,) shaped tensor with the gt track ids of each instance in the frame. |
Source code in dreem/io/frame.py
def get_gt_track_ids(self) -> torch.Tensor:
"""Get the gt track ids of all instances in the frame.
Returns:
an (N,) shaped tensor with the gt track ids of each instance in the frame.
"""
if not self.has_instances():
return torch.tensor([])
return torch.cat([instance.gt_track_id for instance in self.instances])
get_pred_track_ids()

Get the pred track ids of all instances in the frame.

Returns:

Type | Description |
---|---|
Tensor | an (N,) shaped tensor with the pred track ids of each instance in the frame. |
Source code in dreem/io/frame.py
def get_pred_track_ids(self) -> torch.Tensor:
"""Get the pred track ids of all instances in the frame.
Returns:
an (N,) shaped tensor with the pred track ids of each instance in the frame.
"""
if not self.has_instances():
return torch.tensor([])
return torch.cat([instance.pred_track_id for instance in self.instances])
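
A small evaluation-style sketch comparing predicted ids against ground truth, assuming both are populated and aligned by instance order:

gt = frame.get_gt_track_ids()      # (N,) tensor of ground-truth ids
pred = frame.get_pred_track_ids()  # (N,) tensor of predicted ids
frame_accuracy = (gt == pred).float().mean().item()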
get_traj_score(key=None)

Get dictionary containing the association matrices between instances and trajectories along the postprocessing pipeline.

Parameters:

Name | Type | Description | Default |
---|---|---|---|
key | str | None | The key of the trajectory score to be accessed. Can be one of {None, 'initial', 'decay_time', 'max_center_dist', 'iou', 'final'} | None |

Returns:

Type | Description |
---|---|
dict | ArrayLike | None | The dict of all trajectory scores if key is None, the trajectory score associated with key, or None if the key is not found. |
Source code in dreem/io/frame.py
def get_traj_score(self, key: str | None = None) -> dict | ArrayLike | None:
"""Get dictionary containing association matrix between instances and trajectories along postprocessing pipeline.
Args:
key: The key of the trajectory score to be accessed.
Can be one of {None, 'initial', 'decay_time', 'max_center_dist', 'iou', 'final'}
Returns:
- dictionary containing all trajectory scores if key is None
- trajectory score associated with key
- None if the key is not found
"""
if key is None:
return self._traj_score
else:
try:
return self._traj_score[key]
except KeyError as e:
logger.exception(f"Could not access {key} traj_score due to {e}")
return None
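
A short access sketch, assuming tracking has already populated the frame's trajectory scores:

all_scores = frame.get_traj_score()           # dict keyed by pipeline stage
final_scores = frame.get_traj_score("final")  # one stage's matrix, or None if the key is absent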
has_asso_output()

Determine whether the frame has an association matrix computed.

Returns:

Type | Description |
---|---|
bool | True if the frame has an association matrix, otherwise False. |
Source code in dreem/io/frame.py
def has_asso_output(self) -> bool:
    """Determine whether the frame has an association matrix computed.
    Returns:
        True if the frame has an association matrix otherwise, False.
    """
    if self._asso_output is None or len(self._asso_output.matrix) == 0:
        return False
    return True
has_bboxes()

Check if any of the frame's instances has a bounding box.

Returns:

Type | Description |
---|---|
bool | True if at least 1 instance has a bounding box, otherwise False. |
Source code in dreem/io/frame.py
def has_bboxes(self) -> bool:
    """Check if any of the frame's instances has a bounding box.
    Returns:
        True if at least 1 instance has a bounding box otherwise False.
    """
    if self.has_instances():
        return any([instance.has_bboxes() for instance in self.instances])
    return False
has_crops()

Check if any of the frame's instances has a crop.

Returns:

Type | Description |
---|---|
bool | True if at least 1 instance has a crop, otherwise False. |
has_features()

Check if any of the frame's instances has reid features already computed.

Returns:

Type | Description |
---|---|
bool | True if at least 1 instance has reid features, otherwise False. |
Source code in dreem/io/frame.py
def has_features(self) -> bool:
    """Check if any of the frame's instances has reid features already computed.
    Returns:
        True if at least 1 instance has reid features otherwise False.
    """
    if self.has_instances():
        return any([instance.has_features() for instance in self.instances])
    return False
has_gt_track_ids()

Check if any of the frame's instances has a gt track id.

Returns:

Type | Description |
---|---|
bool | True if at least 1 instance has a gt track id, otherwise False. |
Source code in dreem/io/frame.py
def has_gt_track_ids(self) -> bool:
    """Check if any of the frame's instances has a gt track id.
    Returns:
        True if at least 1 instance has a gt track id otherwise False.
    """
    if self.has_instances():
        return any([instance.has_gt_track_id() for instance in self.instances])
    return False
has_instances()

Determine whether there are instances in the frame.

Returns:

Type | Description |
---|---|
bool | True if there are instances in the frame, otherwise False. |
has_matches()

Check whether or not matches have been computed for the frame.

Returns:

Type | Description |
---|---|
bool | True if the frame contains matches, otherwise False. |
has_pred_track_ids()

Check if any of the frame's instances has a pred track id.

Returns:

Type | Description |
---|---|
bool | True if at least 1 instance has a pred track id, otherwise False. |
Source code in dreem/io/frame.py
def has_pred_track_ids(self) -> bool:
    """Check if any of the frame's instances has a pred track id.
    Returns:
        True if at least 1 instance has a pred track id otherwise False.
    """
    if self.has_instances():
        return any([instance.has_pred_track_id() for instance in self.instances])
    return False
has_traj_score()

Check if any trajectory association matrix has been saved.

Returns:

Type | Description |
---|---|
bool | True if there is at least one association matrix, otherwise False. |
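
The has_* methods are intended as cheap guards before reading tracking outputs; a typical (illustrative) pattern:

if frame.has_instances() and frame.has_traj_score():
    final_scores = frame.get_traj_score("final")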
to(map_location)

Move frame to a different device or dtype (see torch.to for more info).

Parameters:

Name | Type | Description | Default |
---|---|---|---|
map_location | str | device | A string representing the device to move to. | required |

Returns:

Type | Description |
---|---|
Self | The frame moved to a different device/dtype. |
Source code in dreem/io/frame.py
def to(self, map_location: str | torch.device) -> Self:
"""Move frame to different device or dtype (See `torch.to` for more info).
Args:
map_location: A string representing the device to move to.
Returns:
The frame moved to a different device/dtype.
"""
self._video_id = self._video_id.to(map_location)
self._frame_id = self._frame_id.to(map_location)
self._img_shape = self._img_shape.to(map_location)
if isinstance(self._asso_output, torch.Tensor):
self._asso_output = self._asso_output.to(map_location)
if isinstance(self._matches, torch.Tensor):
self._matches = self._matches.to(map_location)
for key, val in self._traj_score.items():
if isinstance(val, torch.Tensor):
self._traj_score[key] = val.to(map_location)
for instance in self.instances:
instance = instance.to(map_location)
if isinstance(map_location, (str, torch.device)):
self._device = map_location
return self
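
A minimal device-move sketch; note that `to` mutates the frame in place and also returns it:

import torch

frame = frame.to("cuda" if torch.cuda.is_available() else "cpu")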
to_h5(clip_group, instance_labels=None, save=None)

Convert frame to h5py group.

Parameters:

Name | Type | Description | Default |
---|---|---|---|
clip_group | Group | the h5py group representing the clip (e.g. batch/video) the frame belongs to | required |
instance_labels | list | None | the labels used to create instance group names | None |
save | dict[str, bool] | None | whether to save crops, features and embeddings for the instance | None |

Returns: An h5py group containing the frame
Source code in dreem/io/frame.py
def to_h5(
self,
clip_group: h5py.Group,
instance_labels: list | None = None,
save: dict[str, bool] | None = None,
) -> h5py.Group:
"""Convert frame to h5py group.
Args:
clip_group: the h5py group representing the clip (e.g batch/video) the frame belongs to
instance_labels: the labels used to create instance group names
save: whether to save crops, features and embeddings for the instance
Returns:
An h5py group containing the frame
"""
if save is None:
save = {"crop": False, "features": False, "embeddings": False}
frame_group = clip_group.require_group(f"frame_{self.frame_id.item()}")
frame_group.attrs.create("frame_id", self.frame_id.item())
frame_group.attrs.create("vid_id", self.video_id.item())
frame_group.attrs.create("vid_name", self.vid_name)
frame_group.create_dataset(
"asso_matrix",
data=self.asso_output.numpy() if self.asso_output is not None else [],
)
asso_group = frame_group.require_group("traj_scores")
for key, value in self.get_traj_score().items():
asso_group.create_dataset(
key, data=value.to_numpy() if value is not None else []
)
if instance_labels is None:
instance_labels = self.get_gt_track_ids().cpu().numpy()
for instance_label, instance in zip(instance_labels, self.instances):
kwargs = {}
if save.get("crop", False):
kwargs["crop"] = instance.crop.cpu().numpy()
if save.get("features", False):
kwargs["features"] = instance.features.cpu().numpy()
if save.get("embeddings", False):
for key, val in instance.get_embedding().items():
kwargs[f"{key}_emb"] = val.cpu().numpy()
_ = instance.to_h5(frame_group, f"instance_{instance_label}", **kwargs)
return frame_group
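
A usage sketch; the file name and per-video clip-group layout here are illustrative, not prescribed by the API:

import h5py

with h5py.File("results.h5", "w") as f:
    clip_group = f.require_group(f"video_{frame.video_id.item()}")
    frame.to_h5(clip_group, save={"crop": True, "features": False, "embeddings": False})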
to_slp(track_lookup=None, video=None)

Convert Frame to sleap_io.LabeledFrame object.

Parameters:

Name | Type | Description | Default |
---|---|---|---|
track_lookup | dict[int, Track] | None | A lookup dictionary containing the track_id and sio.Track for persistence | None |
video | Video | None | An sio.Video object used for overriding. | None |

Returns: A tuple containing a LabeledFrame object with necessary metadata and a lookup dictionary containing the track_id and sio.Track for persistence
Source code in dreem/io/frame.py
def to_slp(
self,
track_lookup: dict[int, sio.Track] | None = None,
video: sio.Video | None = None,
) -> tuple[sio.LabeledFrame, dict[int, sio.Track]]:
"""Convert Frame to sleap_io.LabeledFrame object.
Args:
track_lookup: A lookup dictionary containing the track_id and sio.Track for persistence
video: An sio.Video object used for overriding.
Returns: A tuple containing a LabeledFrame object with necessary metadata and
a lookup dictionary containing the track_id and sio.Track for persistence
"""
if track_lookup is None:
track_lookup = {}
slp_instances = []
for instance in self.instances:
slp_instance, track_lookup = instance.to_slp(track_lookup=track_lookup)
slp_instances.append(slp_instance)
if video is None:
video = (
self.video
if isinstance(self.video, sio.Video)
else sio.load_video(self.video)
)
return (
sio.LabeledFrame(
video=video,
frame_idx=self.frame_id.item(),
instances=slp_instances,
),
track_lookup,
)
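
A round-trip sketch converting a list of tracked frames back into a SLEAP labels file; `frames` is an assumed list of Frame objects, and the shared `track_lookup` keeps track identities consistent across frames:

import sleap_io as sio

track_lookup: dict = {}
labeled_frames = []
for frame in frames:  # frames: list[Frame], assumed
    lf, track_lookup = frame.to_slp(track_lookup=track_lookup)
    labeled_frames.append(lf)
labels = sio.Labels(labeled_frames=labeled_frames)
sio.save_slp(labels, "tracked.slp")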