iterative · dreadatour · Feb 11, 2025 · shcheklein · Feb 13, 2025 · dreadatour
diff --git a/src/datachain/model/bbox.py b/src/datachain/model/bbox.py
diff --git a/src/datachain/model/pose.py b/src/datachain/model/pose.py
@@ -1,7 +1,12 @@
+from collections.abc import Sequence
+from typing import Optional
+
 from pydantic import Field
 
 from datachain.lib.data_model import DataModel
 
+from .utils import validate_img_size
+
 
 class Pose(DataModel):
     """
@@ -19,22 +24,76 @@ class Pose(DataModel):
     y: list[int] = Field(default=[])
 
     @staticmethod
-    def from_list(points: list[list[float]]) -> "Pose":
+    def from_list(
+        points: Sequence[Sequence[float]],
+        normalized_to: Optional[Sequence[int]] = None,
+    ) -> "Pose":
+        """
+        Create a Pose instance from a list of x and y coordinates.
+
+        If the input coordinates are normalized (i.e., floats between 0 and 1),
+        they will be converted to absolute pixel values based on the provided
+        image size. The image size should be given as a tuple (width, height)
+        via the `normalized_to` argument.
+
+        Args:
+            points (Sequence[Sequence[float]]): The x and y coordinates
+                of the keypoints. List of 2 lists: x and y coordinates,
+                each holding exactly 17 values.
+            normalized_to (Sequence[int], optional): The reference image size
+                (width, height) for denormalizing the keypoints. If None (default),
+                the coordinates are assumed to be absolute pixel values.
+
+        Returns:
+            Pose: A Pose object with every coordinate rounded to an integer.
+
+        Raises:
+            AssertionError: If `points` does not have the expected structure,
+                if normalized coordinates fall outside the 0..1 range, or if
+                `normalized_to` is not a valid image size.
+        """
+        assert isinstance(points, (tuple, list)), "Pose must be a list of 2 lists."
         assert len(points) == 2, "Pose must be a list of 2 lists: x and y coordinates."
         points_x, points_y = points
+        assert isinstance(points_x, (tuple, list)) and isinstance(
+            points_y, (tuple, list)
+        ), "Pose must be a list of 2 lists."
         assert len(points_x) == len(points_y) == 17, (
             "Pose x and y coordinates must have the same length of 17."
         )
         assert all(
             isinstance(value, (int, float)) for value in [*points_x, *points_y]
         ), "Pose coordinates must be floats or integers."
+
+        if normalized_to is not None:
+            assert all(0 <= coord <= 1 for coord in [*points_x, *points_y]), (
+                "Normalized coordinates must be floats between 0 and 1."
+            )
+            width, height = validate_img_size(normalized_to)
+            points_x = [coord * width for coord in points_x]
+            points_y = [coord * height for coord in points_y]
+
         return Pose(
             x=[round(coord) for coord in points_x],
             y=[round(coord) for coord in points_y],
         )
 
+    def to_normalized(self, img_size: Sequence[int]) -> tuple[list[float], list[float]]:
+        """
+        Return the pose keypoints in normalized coordinates.
+
+        Normalized coordinates are floats between 0 and 1, representing the
+        relative position of the pixels in the image.
+
+        Args:
+            img_size (Sequence[int]): The reference image size (width, height)
+                the keypoints are divided by.
+
+        Returns:
+            tuple[list[float], list[float]]: The pose keypoints
+                with normalized coordinates.
+
+        Raises:
+            AssertionError: If `img_size` is not a valid image size or if any
+                keypoint is negative or exceeds the image width or height.
+        """
+        width, height = validate_img_size(img_size)
+        # Check the lower bound as well: a negative pixel value would otherwise
+        # normalize to a value below 0 and break the documented 0..1 range.
+        assert all(
+            0 <= x <= width and 0 <= y <= height for x, y in zip(self.x, self.y)
+        ), "Pose keypoints are out of image size."
+        return (
+            [coord / width for coord in self.x],
+            [coord / height for coord in self.y],
+        )
+
     @staticmethod
-    def from_dict(points: dict[str, list[float]]) -> "Pose":
+    def from_dict(points: dict[str, Sequence[float]]) -> "Pose":
         assert isinstance(points, dict) and set(points) == {
             "x",
             "y",
@@ -60,22 +119,86 @@ class Pose3D(DataModel):
     visible: list[float] = Field(default=[])
 
     @staticmethod
-    def from_list(points: list[list[float]]) -> "Pose3D":
+    def from_list(
+        points: Sequence[Sequence[float]],
+        normalized_to: Optional[Sequence[int]] = None,
+    ) -> "Pose3D":
+        """
+        Create a Pose3D instance from a list of x, y coordinates and visibility values.
+
+        If the input coordinates are normalized (i.e., floats between 0 and 1),
+        they will be converted to absolute pixel values based on the provided
+        image size. The image size should be given as a tuple (width, height)
+        via the `normalized_to` argument. Visibility values are never scaled
+        and are not range-checked; they are stored as given.
+
+        Args:
+            points (Sequence[Sequence[float]]): The x and y coordinates
+                of the keypoints. List of 3 lists: x, y coordinates
+                and visibility values, each holding exactly 17 values.
+            normalized_to (Sequence[int], optional): The reference image size
+                (width, height) for denormalizing the keypoints. If None (default),
+                the coordinates are assumed to be absolute pixel values.
+
+        Returns:
+            Pose3D: A Pose3D object with x and y rounded to integers.
+
+        Raises:
+            AssertionError: If `points` does not have the expected structure,
+                if normalized x or y coordinates fall outside the 0..1 range,
+                or if `normalized_to` is not a valid image size.
+
+        """
+        assert isinstance(points, (tuple, list)), (
+            "Pose3D must be a tuple or list of 3 lists."
+        )
         assert len(points) == 3, (
             "Pose3D must be a list of 3 lists: x, y coordinates and visible."
         )
         points_x, points_y, points_v = points
+        assert (
+            isinstance(points_x, (tuple, list))
+            and isinstance(points_y, (tuple, list))
+            and isinstance(points_v, (tuple, list))
+        ), "Pose3D must be a tuple or list of 3 lists."
         assert len(points_x) == len(points_y) == len(points_v) == 17, (
             "Pose3D x, y coordinates and visible must have the same length of 17."
         )
         assert all(
             isinstance(value, (int, float))
             for value in [*points_x, *points_y, *points_v]
         ), "Pose3D coordinates must be floats or integers."
+
+        if normalized_to is not None:
+            assert all(0 <= coord <= 1 for coord in [*points_x, *points_y]), (
+                "Normalized coordinates must be floats between 0 and 1."
+            )
+            width, height = validate_img_size(normalized_to)
+            points_x = [coord * width for coord in points_x]
+            points_y = [coord * height for coord in points_y]
+
         return Pose3D(
             x=[round(coord) for coord in points_x],
             y=[round(coord) for coord in points_y],
-            visible=points_v,
+            visible=list(points_v),
+        )
+
+    def to_normalized(
+        self,
+        img_size: Sequence[int],
+    ) -> tuple[list[float], list[float], list[float]]:
+        """
+        Return the pose 3D keypoints in normalized coordinates.
+
+        Normalized coordinates are floats between 0 and 1, representing the
+        relative position of the pixels in the image.
+
+        Args:
+            img_size (Sequence[int]): The reference image size (width, height)
+                the x and y keypoints are divided by.
+
+        Returns:
+            tuple[list[float], list[float], list[float]]: The pose keypoints
+                with normalized coordinates and visibility values. The
+                visibility list is a copy and is not rescaled.
+
+        Raises:
+            AssertionError: If `img_size` is not a valid image size or if any
+                keypoint is negative or exceeds the image width or height.
+        """
+        width, height = validate_img_size(img_size)
+        # Check the lower bound as well: a negative pixel value would otherwise
+        # normalize to a value below 0 and break the documented 0..1 range.
+        assert all(
+            0 <= x <= width and 0 <= y <= height for x, y in zip(self.x, self.y)
+        ), "Pose3D keypoints are out of image size."
+        return (
+            [coord / width for coord in self.x],
+            [coord / height for coord in self.y],
+            # Copy so callers cannot mutate the model's own visibility list.
+            list(self.visible),
         )
 
     @staticmethod

diff --git a/src/datachain/model/segment.py b/src/datachain/model/segment.py
@@ -1,7 +1,12 @@
+from collections.abc import Sequence
+from typing import Optional
+
 from pydantic import Field
 
 from datachain.lib.data_model import DataModel
 
+from .utils import validate_img_size
+
 
 class Segment(DataModel):
     """
@@ -21,23 +26,78 @@ class Segment(DataModel):
     y: list[int] = Field(default=[])
 
     @staticmethod
-    def from_list(points: list[list[float]], title: str = "") -> "Segment":
+    def from_list(
+        points: Sequence[Sequence[float]],
+        title: str = "",
+        normalized_to: Optional[Sequence[int]] = None,
+    ) -> "Segment":
+        """
+        Create a Segment object from a list of x and y coordinates.
+
+        If the input coordinates are normalized (i.e., floats between 0 and 1),
+        they will be converted to absolute pixel values based on the provided
+        image size. The image size should be given as a tuple (width, height)
+        via the `normalized_to` argument.
+
+        Args:
+            points (Sequence[Sequence[float]]): The x and y coordinates
+                of the segment points. List of 2 lists of equal length:
+                x and y coordinates.
+            title (str, optional): The title or label for the segment. Defaults to "".
+            normalized_to (Sequence[int], optional): The reference image size
+                (width, height) for denormalizing the segment points. If None
+                (default), the coordinates are assumed to be absolute pixel values.
+
+        Returns:
+            Segment: A Segment object with every coordinate rounded to an integer.
+
+        Raises:
+            AssertionError: If `points` does not have the expected structure,
+                if normalized coordinates fall outside the 0..1 range, or if
+                `normalized_to` is not a valid image size.
+        """
+        assert isinstance(points, (tuple, list)), "Segment must be a list of 2 lists."
         assert len(points) == 2, (
             "Segment must be a list of 2 lists: x and y coordinates."
         )
         points_x, points_y = points
+        assert isinstance(points_x, (tuple, list)) and isinstance(
+            points_y, (tuple, list)
+        ), "Segment must be a list of 2 lists."
         assert len(points_x) == len(points_y), (
             "Segment x and y coordinates must have the same length."
         )
         assert all(
             isinstance(value, (int, float)) for value in [*points_x, *points_y]
         ), "Segment coordinates must be floats or integers."
+
+        if normalized_to is not None:
+            assert all(0 <= coord <= 1 for coord in [*points_x, *points_y]), (
+                "Normalized coordinates must be floats between 0 and 1."
+            )
+            width, height = validate_img_size(normalized_to)
+            points_x = [coord * width for coord in points_x]
+            points_y = [coord * height for coord in points_y]
+
         return Segment(
             title=title,
             x=[round(coord) for coord in points_x],
             y=[round(coord) for coord in points_y],
         )
 
+    def to_normalized(self, img_size: Sequence[int]) -> tuple[list[float], list[float]]:
+        """
+        Return the segment in normalized coordinates.
+
+        Normalized coordinates are floats between 0 and 1, representing the
+        relative position of the pixels in the image.
+
+        Args:
+            img_size (Sequence[int]): The reference image size (width, height)
+                the segment points are divided by.
+
+        Returns:
+            tuple[list[float], list[float]]: The segment with normalized coordinates.
+
+        Raises:
+            AssertionError: If `img_size` is not a valid image size or if any
+                point is negative or exceeds the image width or height.
+        """
+        width, height = validate_img_size(img_size)
+        # Check the lower bound as well: a negative pixel value would otherwise
+        # normalize to a value below 0 and break the documented 0..1 range.
+        assert all(
+            0 <= x <= width and 0 <= y <= height for x, y in zip(self.x, self.y)
+        ), "Segment keypoints are out of image size."
+        return (
+            [coord / width for coord in self.x],
+            [coord / height for coord in self.y],
+        )
+
     @staticmethod
     def from_dict(points: dict[str, list[float]], title: str = "") -> "Segment":
         assert isinstance(points, dict) and set(points) == {

diff --git a/src/datachain/model/utils.py b/src/datachain/model/utils.py
@@ -0,0 +1,76 @@
+from collections.abc import Sequence
+
+
+def validate_img_size(img_size: Sequence[int]) -> Sequence[int]:
+    """
+    Check that an image size is a pair of positive integers.
+
+    Args:
+        img_size (Sequence[int]): The image size to check.
+
+    Returns:
+        Sequence[int]: The very same `img_size` object, unchanged.
+
+    Raises:
+        AssertionError: If `img_size` is not a tuple or list, does not hold
+            exactly two items, or holds anything but positive integers.
+    """
+    assert isinstance(img_size, (list, tuple)), "Image size must be a tuple or list."
+    assert 2 == len(img_size), "Image size must be a tuple or list of 2 integers."
+    # Type check comes first so the positivity check only ever compares ints.
+    assert all(isinstance(dimension, int) for dimension in img_size), (
+        "Image size must be integers."
+    )
+    assert min(img_size) > 0, "Image size must be positive integers."
+    return img_size
+
+
+def validate_bbox(coords: Sequence[float]) -> Sequence[float]:
+    """
+    Check that bounding box coordinates are four non-negative numbers.
+
+    Args:
+        coords (Sequence[float]): The bounding box coordinates to check.
+
+    Returns:
+        Sequence[float]: The very same `coords` object, unchanged.
+
+    Raises:
+        AssertionError: If `coords` is not a tuple or list, does not hold
+            exactly four items, or holds a non-numeric or negative value.
+    """
+    assert isinstance(coords, (list, tuple)), "Bounding box must be a tuple or list."
+    assert 4 == len(coords), "Bounding box must be a tuple or list of 4 coordinates."
+    assert all(isinstance(number, (int, float)) for number in coords), (
+        "Bounding box coordinates must be floats or integers."
+    )
+    # Zero is accepted; only values below zero are rejected.
+    assert all(0 <= number for number in coords), (
+        "Bounding box coordinates must be positive."
+    )
+    return coords
+
+
+def validate_bbox_normalized(
+    coords: Sequence[float], img_size: Sequence[int]
+) -> Sequence[float]:
+    """
+    Validate normalized bounding box coordinates and scale them to an image size.
+
+    The first and third values are multiplied by the image width, the second
+    and fourth by the image height.
+
+    Args:
+        coords (Sequence[float]): Four floats, each between 0 and 1.
+        img_size (Sequence[int]): The reference image size (width, height).
+
+    Returns:
+        Sequence[float]: A new list with the four scaled coordinates.
+
+    Raises:
+        AssertionError: If `coords` is not a tuple or list of four floats
+            between 0 and 1, or if `img_size` is not a valid image size.
+    """
+    assert isinstance(coords, (list, tuple)), "Bounding box must be a tuple or list."
+    assert 4 == len(coords), "Bounding box must be a tuple or list of 4 coordinates."
+    # Integers are rejected here on purpose of the check below: floats only.
+    assert all(isinstance(fraction, float) for fraction in coords), (
+        "Bounding box normalized coordinates must be floats."
+    )
+    assert all(0 <= fraction <= 1 for fraction in coords), (
+        "Bounding box normalized coordinates must be floats between 0 and 1."
+    )
+
+    width, height = validate_img_size(img_size)
+
+    # Scale factor for each of the four positions, in order.
+    factors = (width, height, width, height)
+    return [coords[index] * factor for index, factor in enumerate(factors)]
+
+
+def normalize_coords(
+    coords: Sequence[int],
+    img_size: Sequence[int],
+) -> list[float]:
+    """
+    Divide four integer coordinates by the image size.
+
+    The first and third values are divided by the image width, the second
+    and fourth by the image height.
+
+    Args:
+        coords (Sequence[int]): Four integer coordinates lying within the image.
+        img_size (Sequence[int]): The reference image size (width, height).
+
+    Returns:
+        list[float]: The four coordinates divided by width or height.
+
+    Raises:
+        AssertionError: If `coords` is not a tuple or list of four ints, if
+            `img_size` is not a valid image size, or if any coordinate is
+            negative or exceeds the matching image dimension.
+    """
+    assert isinstance(coords, (list, tuple)), "Coords must be a tuple or list."
+    assert 4 == len(coords), "Coords must be a tuple or list of 4 coordinates."
+    assert all(isinstance(pixel, int) for pixel in coords), (
+        "Coords must be a tuple or list of 4 ints."
+    )
+
+    width, height = validate_img_size(img_size)
+
+    # Upper limit (and divisor) for each of the four positions, in order.
+    limits = (width, height, width, height)
+    assert all(0 <= coords[index] <= limit for index, limit in enumerate(limits)), (
+        "Bounding box coordinates are out of image size"
+    )
+
+    return [coords[index] / limit for index, limit in enumerate(limits)]