From 976b5fd1b27d33f40fc25d88a96cc5ddeda378cd Mon Sep 17 00:00:00 2001
From: Ivan Shcheklein <shcheklein@gmail.com>
Date: Mon, 18 Nov 2024 19:07:39 -0800
Subject: [PATCH] Revert "Update ultralytics models (#592)" (#610)

This reverts commit b62d091062187aa8720f00e67756cb12c6be4005.
---
 src/datachain/lib/models/__init__.py          |   7 +-
 src/datachain/lib/models/bbox.py              | 121 +++--------
 src/datachain/lib/models/pose.py              |  87 +-------
 src/datachain/lib/models/segment.py           |  53 -----
 .../lib/models/ultralytics/__init__.py        |  14 --
 src/datachain/lib/models/ultralytics/bbox.py  | 189 ------------------
 src/datachain/lib/models/ultralytics/pose.py  | 126 ------------
 .../lib/models/ultralytics/segment.py         | 121 -----------
 src/datachain/lib/models/yolo.py              |  39 ++++
 tests/unit/lib/test_models.py                 | 168 ++++------------
 10 files changed, 113 insertions(+), 812 deletions(-)
 delete mode 100644 src/datachain/lib/models/segment.py
 delete mode 100644 src/datachain/lib/models/ultralytics/__init__.py
 delete mode 100644 src/datachain/lib/models/ultralytics/bbox.py
 delete mode 100644 src/datachain/lib/models/ultralytics/pose.py
 delete mode 100644 src/datachain/lib/models/ultralytics/segment.py
 create mode 100644 src/datachain/lib/models/yolo.py

diff --git a/src/datachain/lib/models/__init__.py b/src/datachain/lib/models/__init__.py
index 398bd1a8a..b4335237b 100644
--- a/src/datachain/lib/models/__init__.py
+++ b/src/datachain/lib/models/__init__.py
@@ -1,6 +1,5 @@
-from . import ultralytics
-from .bbox import BBox, OBBox
+from . import yolo
+from .bbox import BBox
 from .pose import Pose, Pose3D
-from .segment import Segments
 
-__all__ = ["BBox", "OBBox", "Pose", "Pose3D", "Segments", "ultralytics"]
+__all__ = ["BBox", "Pose", "Pose3D", "yolo"]
diff --git a/src/datachain/lib/models/bbox.py b/src/datachain/lib/models/bbox.py
index cefc5181d..501ed6296 100644
--- a/src/datachain/lib/models/bbox.py
+++ b/src/datachain/lib/models/bbox.py
@@ -1,3 +1,5 @@
+from typing import Optional
+
 from pydantic import Field
 
 from datachain.lib.data_model import DataModel
@@ -9,7 +11,10 @@ class BBox(DataModel):
 
     Attributes:
         title (str): The title of the bounding box.
-        coords (list[int]): The coordinates of the bounding box.
+        x1 (float): The x-coordinate of the top-left corner of the bounding box.
+        y1 (float): The y-coordinate of the top-left corner of the bounding box.
+        x2 (float): The x-coordinate of the bottom-right corner of the bounding box.
+        y2 (float): The y-coordinate of the bottom-right corner of the bounding box.
 
     The bounding box is defined by two points:
         - (x1, y1): The top-left corner of the box.
@@ -17,100 +22,24 @@ class BBox(DataModel):
     """
 
     title: str = Field(default="")
-    coords: list[int] = Field(default=None)
-
-    @staticmethod
-    def from_list(coords: list[float], title: str = "") -> "BBox":
-        assert len(coords) == 4, "Bounding box coordinates must be a list of 4 floats."
-        assert all(
-            isinstance(value, (int, float)) for value in coords
-        ), "Bounding box coordinates must be integers or floats."
-        return BBox(
-            title=title,
-            coords=[round(c) for c in coords],
-        )
-
-    @staticmethod
-    def from_dict(coords: dict[str, float], title: str = "") -> "BBox":
-        assert (
-            len(coords) == 4
-        ), "Bounding box coordinates must be a dictionary of 4 floats."
-        assert set(coords) == {
-            "x1",
-            "y1",
-            "x2",
-            "y2",
-        }, "Bounding box coordinates must contain keys with coordinates."
-        assert all(
-            isinstance(value, (int, float)) for value in coords.values()
-        ), "Bounding box coordinates must be integers or floats."
-        return BBox(
-            title=title,
-            coords=[
-                round(coords["x1"]),
-                round(coords["y1"]),
-                round(coords["x2"]),
-                round(coords["y2"]),
-            ],
-        )
-
-
-class OBBox(DataModel):
-    """
-    A data model for representing oriented bounding boxes.
-
-    Attributes:
-        title (str): The title of the oriented bounding box.
-        coords (list[int]): The coordinates of the oriented bounding box.
-
-    The oriented bounding box is defined by four points:
-        - (x1, y1): The first corner of the box.
-        - (x2, y2): The second corner of the box.
-        - (x3, y3): The third corner of the box.
-        - (x4, y4): The fourth corner of the box.
-    """
-
-    title: str = Field(default="")
-    coords: list[int] = Field(default=None)
-
-    @staticmethod
-    def from_list(coords: list[float], title: str = "") -> "OBBox":
-        assert (
-            len(coords) == 8
-        ), "Oriented bounding box coordinates must be a list of 8 floats."
-        assert all(
-            isinstance(value, (int, float)) for value in coords
-        ), "Oriented bounding box coordinates must be integers or floats."
-        return OBBox(
-            title=title,
-            coords=[round(c) for c in coords],
-        )
+    x1: float = Field(default=0)
+    y1: float = Field(default=0)
+    x2: float = Field(default=0)
+    y2: float = Field(default=0)
 
     @staticmethod
-    def from_dict(coords: dict[str, float], title: str = "") -> "OBBox":
-        assert set(coords) == {
-            "x1",
-            "y1",
-            "x2",
-            "y2",
-            "x3",
-            "y3",
-            "x4",
-            "y4",
-        }, "Oriented bounding box coordinates must contain keys with coordinates."
-        assert all(
-            isinstance(value, (int, float)) for value in coords.values()
-        ), "Oriented bounding box coordinates must be integers or floats."
-        return OBBox(
-            title=title,
-            coords=[
-                round(coords["x1"]),
-                round(coords["y1"]),
-                round(coords["x2"]),
-                round(coords["y2"]),
-                round(coords["x3"]),
-                round(coords["y3"]),
-                round(coords["x4"]),
-                round(coords["y4"]),
-            ],
-        )
+    def from_xywh(bbox: list[float], title: Optional[str] = None) -> "BBox":
+        """
+        Converts a bounding box in (x, y, width, height) format
+        to a BBox data model instance.
+
+        Args:
+            bbox (list[float]): A bounding box, represented as a list
+                                of four floats [x, y, width, height].
+
+        Returns:
+            BBox2D: An instance of the BBox data model.
+        """
+        assert len(bbox) == 4, f"Bounding box must have 4 elements, got f{len(bbox)}"
+        x, y, w, h = bbox
+        return BBox(title=title or "", x1=x, y1=y, x2=x + w, y2=y + h)
diff --git a/src/datachain/lib/models/pose.py b/src/datachain/lib/models/pose.py
index c4926b463..5cb95a29b 100644
--- a/src/datachain/lib/models/pose.py
+++ b/src/datachain/lib/models/pose.py
@@ -8,48 +8,15 @@ class Pose(DataModel):
     A data model for representing pose keypoints.
 
     Attributes:
-        x (list[int]): The x-coordinates of the keypoints.
-        y (list[int]): The y-coordinates of the keypoints.
+        x (list[float]): The x-coordinates of the keypoints.
+        y (list[float]): The y-coordinates of the keypoints.
 
     The keypoints are represented as lists of x and y coordinates, where each index
     corresponds to a specific body part.
     """
 
-    x: list[int] = Field(default=None)
-    y: list[int] = Field(default=None)
-
-    @staticmethod
-    def from_list(points: list[list[float]]) -> "Pose":
-        assert len(points) == 2, "Pose coordinates must be a list of 2 lists."
-        points_x, points_y = points
-        assert (
-            len(points_x) == len(points_y) == 17
-        ), "Pose x and y coordinates must have the same length of 17."
-        assert all(
-            isinstance(value, (int, float)) for value in [*points_x, *points_y]
-        ), "Pose coordinates must be integers or floats."
-        return Pose(
-            x=[round(coord) for coord in points_x],
-            y=[round(coord) for coord in points_y],
-        )
-
-    @staticmethod
-    def from_dict(points: dict[str, list[float]]) -> "Pose":
-        assert set(points) == {
-            "x",
-            "y",
-        }, "Pose coordinates must contain keys 'x' and 'y'."
-        points_x, points_y = points["x"], points["y"]
-        assert (
-            len(points_x) == len(points_y) == 17
-        ), "Pose x and y coordinates must have the same length of 17."
-        assert all(
-            isinstance(value, (int, float)) for value in [*points_x, *points_y]
-        ), "Pose coordinates must be integers or floats."
-        return Pose(
-            x=[round(coord) for coord in points_x],
-            y=[round(coord) for coord in points_y],
-        )
+    x: list[float] = Field(default=None)
+    y: list[float] = Field(default=None)
 
 
 class Pose3D(DataModel):
@@ -57,52 +24,14 @@ class Pose3D(DataModel):
     A data model for representing 3D pose keypoints.
 
     Attributes:
-        x (list[int]): The x-coordinates of the keypoints.
-        y (list[int]): The y-coordinates of the keypoints.
+        x (list[float]): The x-coordinates of the keypoints.
+        y (list[float]): The y-coordinates of the keypoints.
         visible (list[float]): The visibility of the keypoints.
 
     The keypoints are represented as lists of x, y, and visibility values,
     where each index corresponds to a specific body part.
     """
 
-    x: list[int] = Field(default=None)
-    y: list[int] = Field(default=None)
+    x: list[float] = Field(default=None)
+    y: list[float] = Field(default=None)
     visible: list[float] = Field(default=None)
-
-    @staticmethod
-    def from_list(points: list[list[float]]) -> "Pose3D":
-        assert len(points) == 3, "Pose coordinates must be a list of 3 lists."
-        points_x, points_y, points_v = points
-        assert (
-            len(points_x) == len(points_y) == len(points_v) == 17
-        ), "Pose x, y, and visibility coordinates must have the same length of 17."
-        assert all(
-            isinstance(value, (int, float))
-            for value in [*points_x, *points_y, *points_v]
-        ), "Pose coordinates must be integers or floats."
-        return Pose3D(
-            x=[round(coord) for coord in points_x],
-            y=[round(coord) for coord in points_y],
-            visible=points_v,
-        )
-
-    @staticmethod
-    def from_dict(points: dict[str, list[float]]) -> "Pose3D":
-        assert set(points) == {
-            "x",
-            "y",
-            "visible",
-        }, "Pose coordinates must contain keys 'x', 'y', and 'visible'."
-        points_x, points_y, points_v = points["x"], points["y"], points["visible"]
-        assert (
-            len(points_x) == len(points_y) == len(points_v) == 17
-        ), "Pose x, y, and visibility coordinates must have the same length of 17."
-        assert all(
-            isinstance(value, (int, float))
-            for value in [*points_x, *points_y, *points_v]
-        ), "Pose coordinates must be integers or floats."
-        return Pose3D(
-            x=[round(coord) for coord in points_x],
-            y=[round(coord) for coord in points_y],
-            visible=points_v,
-        )
diff --git a/src/datachain/lib/models/segment.py b/src/datachain/lib/models/segment.py
deleted file mode 100644
index 04e4dec05..000000000
--- a/src/datachain/lib/models/segment.py
+++ /dev/null
@@ -1,53 +0,0 @@
-from pydantic import Field
-
-from datachain.lib.data_model import DataModel
-
-
-class Segments(DataModel):
-    """
-    A data model for representing segments.
-
-    Attributes:
-        title (str): The title of the segments.
-        x (list[int]): The x-coordinates of the segments.
-        y (list[int]): The y-coordinates of the segments.
-
-    The segments are represented as lists of x and y coordinates, where each index
-    corresponds to a specific segment.
-    """
-
-    title: str = Field(default="")
-    x: list[int] = Field(default=None)
-    y: list[int] = Field(default=None)
-
-    @staticmethod
-    def from_list(points: list[list[float]], title: str = "") -> "Segments":
-        assert len(points) == 2, "Segments coordinates must be a list of 2 lists."
-        points_x, points_y = points
-        assert len(points_x) == len(
-            points_y
-        ), "Segments x and y coordinates must have the same length."
-        assert all(
-            isinstance(value, (int, float)) for value in [*points_x, *points_y]
-        ), "Segments coordinates must be integers or floats."
-        return Segments(
-            title=title,
-            x=[round(coord) for coord in points_x],
-            y=[round(coord) for coord in points_y],
-        )
-
-    @staticmethod
-    def from_dict(points: dict[str, list[float]], title: str = "") -> "Segments":
-        assert set(points) == {
-            "x",
-            "y",
-        }, "Segments coordinates must contain keys 'x' and 'y'."
-        points_x, points_y = points["x"], points["y"]
-        assert all(
-            isinstance(value, (int, float)) for value in [*points_x, *points_y]
-        ), "Segments coordinates must be integers or floats."
-        return Segments(
-            title=title,
-            x=[round(coord) for coord in points_x],
-            y=[round(coord) for coord in points_y],
-        )
diff --git a/src/datachain/lib/models/ultralytics/__init__.py b/src/datachain/lib/models/ultralytics/__init__.py
deleted file mode 100644
index 504dccc91..000000000
--- a/src/datachain/lib/models/ultralytics/__init__.py
+++ /dev/null
@@ -1,14 +0,0 @@
-from .bbox import YoloBBox, YoloBBoxes, YoloOBBox, YoloOBBoxes
-from .pose import YoloPose, YoloPoses
-from .segment import YoloSegment, YoloSegments
-
-__all__ = [
-    "YoloBBox",
-    "YoloBBoxes",
-    "YoloOBBox",
-    "YoloOBBoxes",
-    "YoloPose",
-    "YoloPoses",
-    "YoloSegment",
-    "YoloSegments",
-]
diff --git a/src/datachain/lib/models/ultralytics/bbox.py b/src/datachain/lib/models/ultralytics/bbox.py
deleted file mode 100644
index b5fa939ad..000000000
--- a/src/datachain/lib/models/ultralytics/bbox.py
+++ /dev/null
@@ -1,189 +0,0 @@
-"""
-This module contains the YOLO models.
-
-YOLO stands for "You Only Look Once", a family of object detection models that
-are designed to be fast and accurate. The models are trained to detect objects
-in images by dividing the image into a grid and predicting the bounding boxes
-and class probabilities for each grid cell.
-
-More information about YOLO can be found here:
-- https://pjreddie.com/darknet/yolo/
-- https://docs.ultralytics.com/
-"""
-
-from io import BytesIO
-from typing import TYPE_CHECKING
-
-from PIL import Image
-from pydantic import Field
-
-from datachain.lib.data_model import DataModel
-from datachain.lib.models.bbox import BBox, OBBox
-
-if TYPE_CHECKING:
-    from ultralytics.engine.results import Results
-    from ultralytics.models import YOLO
-
-    from datachain.lib.file import File
-
-
-class YoloBBox(DataModel):
-    """
-    A class representing a bounding box detected by a YOLO model.
-
-    Attributes:
-        cls: The class of the detected object.
-        name: The name of the detected object.
-        confidence: The confidence score of the detection.
-        box: The bounding box of the detected object
-    """
-
-    cls: int = Field(default=-1)
-    name: str = Field(default="")
-    confidence: float = Field(default=0)
-    box: BBox = Field(default=None)
-
-    @staticmethod
-    def from_file(yolo: "YOLO", file: "File") -> "YoloBBox":
-        results = yolo(Image.open(BytesIO(file.read())))
-        if len(results) == 0:
-            return YoloBBox()
-        return YoloBBox.from_result(results[0])
-
-    @staticmethod
-    def from_result(result: "Results") -> "YoloBBox":
-        summary = result.summary()
-        if not summary:
-            return YoloBBox()
-        name = summary[0].get("name", "")
-        box = (
-            BBox.from_dict(summary[0]["box"], title=name)
-            if "box" in summary[0]
-            else BBox()
-        )
-        return YoloBBox(
-            cls=summary[0]["class"],
-            name=name,
-            confidence=summary[0]["confidence"],
-            box=box,
-        )
-
-
-class YoloBBoxes(DataModel):
-    """
-    A class representing a list of bounding boxes detected by a YOLO model.
-
-    Attributes:
-        cls: A list of classes of the detected objects.
-        name: A list of names of the detected objects.
-        confidence: A list of confidence scores of the detections.
-        box: A list of bounding boxes of the detected objects
-    """
-
-    cls: list[int]
-    name: list[str]
-    confidence: list[float]
-    box: list[BBox]
-
-    @staticmethod
-    def from_file(yolo: "YOLO", file: "File") -> "YoloBBoxes":
-        results = yolo(Image.open(BytesIO(file.read())))
-        return YoloBBoxes.from_results(results)
-
-    @staticmethod
-    def from_results(results: list["Results"]) -> "YoloBBoxes":
-        cls, names, confidence, box = [], [], [], []
-        for r in results:
-            for s in r.summary():
-                name = s.get("name", "")
-                cls.append(s["class"])
-                names.append(name)
-                confidence.append(s["confidence"])
-                box.append(BBox.from_dict(s.get("box", {}), title=name))
-        return YoloBBoxes(
-            cls=cls,
-            name=names,
-            confidence=confidence,
-            box=box,
-        )
-
-
-class YoloOBBox(DataModel):
-    """
-    A class representing an oriented bounding box detected by a YOLO model.
-
-    Attributes:
-        cls: The class of the detected object.
-        name: The name of the detected object.
-        confidence: The confidence score of the detection.
-        box: The oriented bounding box of the detected object.
-    """
-
-    cls: int = Field(default=-1)
-    name: str = Field(default="")
-    confidence: float = Field(default=0)
-    box: OBBox = Field(default=None)
-
-    @staticmethod
-    def from_file(yolo: "YOLO", file: "File") -> "YoloOBBox":
-        results = yolo(Image.open(BytesIO(file.read())))
-        if len(results) == 0:
-            return YoloOBBox()
-        return YoloOBBox.from_result(results[0])
-
-    @staticmethod
-    def from_result(result: "Results") -> "YoloOBBox":
-        summary = result.summary()
-        if not summary:
-            return YoloOBBox()
-        name = summary[0].get("name", "")
-        box = (
-            OBBox.from_dict(summary[0]["box"], title=name)
-            if "box" in summary[0]
-            else OBBox()
-        )
-        return YoloOBBox(
-            cls=summary[0]["class"],
-            name=name,
-            confidence=summary[0]["confidence"],
-            box=box,
-        )
-
-
-class YoloOBBoxes(DataModel):
-    """
-    A class representing a list of oriented bounding boxes detected by a YOLO model.
-
-    Attributes:
-        cls: A list of classes of the detected objects.
-        name: A list of names of the detected objects.
-        confidence: A list of confidence scores of the detections.
-        box: A list of oriented bounding boxes of the detected objects.
-    """
-
-    cls: list[int]
-    name: list[str]
-    confidence: list[float]
-    box: list[OBBox]
-
-    @staticmethod
-    def from_file(yolo: "YOLO", file: "File") -> "YoloOBBoxes":
-        results = yolo(Image.open(BytesIO(file.read())))
-        return YoloOBBoxes.from_results(results)
-
-    @staticmethod
-    def from_results(results: list["Results"]) -> "YoloOBBoxes":
-        cls, names, confidence, box = [], [], [], []
-        for r in results:
-            for s in r.summary():
-                name = s.get("name", "")
-                cls.append(s["class"])
-                names.append(name)
-                confidence.append(s["confidence"])
-                box.append(OBBox.from_dict(s.get("box", {}), title=name))
-        return YoloOBBoxes(
-            cls=cls,
-            name=names,
-            confidence=confidence,
-            box=box,
-        )
diff --git a/src/datachain/lib/models/ultralytics/pose.py b/src/datachain/lib/models/ultralytics/pose.py
deleted file mode 100644
index e97d48c2f..000000000
--- a/src/datachain/lib/models/ultralytics/pose.py
+++ /dev/null
@@ -1,126 +0,0 @@
-"""
-This module contains the YOLO models.
-
-YOLO stands for "You Only Look Once", a family of object detection models that
-are designed to be fast and accurate. The models are trained to detect objects
-in images by dividing the image into a grid and predicting the bounding boxes
-and class probabilities for each grid cell.
-
-More information about YOLO can be found here:
-- https://pjreddie.com/darknet/yolo/
-- https://docs.ultralytics.com/
-"""
-
-from typing import TYPE_CHECKING
-
-from pydantic import Field
-
-from datachain.lib.data_model import DataModel
-from datachain.lib.models.bbox import BBox
-from datachain.lib.models.pose import Pose3D
-
-if TYPE_CHECKING:
-    from ultralytics.engine.results import Results
-
-
-class YoloPoseBodyPart:
-    """An enumeration of body parts for YOLO pose keypoints."""
-
-    nose = 0
-    left_eye = 1
-    right_eye = 2
-    left_ear = 3
-    right_ear = 4
-    left_shoulder = 5
-    right_shoulder = 6
-    left_elbow = 7
-    right_elbow = 8
-    left_wrist = 9
-    right_wrist = 10
-    left_hip = 11
-    right_hip = 12
-    left_knee = 13
-    right_knee = 14
-    left_ankle = 15
-    right_ankle = 16
-
-
-class YoloPose(DataModel):
-    """
-    A data model for YOLO pose keypoints.
-
-    Attributes:
-        cls: The class of the pose.
-        name: The name of the pose.
-        confidence: The confidence score of the pose.
-        box: The bounding box of the pose.
-        keypoints: The 3D pose keypoints.
-    """
-
-    cls: int = Field(default=-1)
-    name: str = Field(default="")
-    confidence: float = Field(default=0)
-    box: BBox = Field(default=None)
-    keypoints: Pose3D = Field(default=None)
-
-    @staticmethod
-    def from_result(result: "Results") -> "YoloPose":
-        summary = result.summary()
-        if not summary:
-            return YoloPose()
-        name = summary[0].get("name", "")
-        box = (
-            BBox.from_dict(summary[0]["box"], title=name)
-            if "box" in summary[0]
-            else BBox()
-        )
-        keypoints = (
-            Pose3D.from_dict(summary[0]["keypoints"])
-            if "keypoints" in summary[0]
-            else Pose3D()
-        )
-        return YoloPose(
-            cls=summary[0]["class"],
-            name=name,
-            confidence=summary[0]["confidence"],
-            box=box,
-            keypoints=keypoints,
-        )
-
-
-class YoloPoses(DataModel):
-    """
-    A data model for a list of YOLO pose keypoints.
-
-    Attributes:
-        cls: The classes of the poses.
-        name: The names of the poses.
-        confidence: The confidence scores of the poses.
-        box: The bounding boxes of the poses.
-        keypoints: The 3D pose keypoints of the poses.
-    """
-
-    cls: list[int]
-    name: list[str]
-    confidence: list[float]
-    box: list[BBox]
-    keypoints: list[Pose3D]
-
-    @staticmethod
-    def from_results(results: list["Results"]) -> "YoloPoses":
-        cls, names, confidence, box, keypoints = [], [], [], [], []
-        for r in results:
-            for s in r.summary():
-                name = s.get("name", "")
-                cls.append(s["class"])
-                names.append(name)
-                confidence.append(s["confidence"])
-                box.append(BBox.from_dict(s.get("box", {}), title=name))
-                keypoints.append(Pose3D.from_dict(s.get("keypoints", {})))
-        return YoloPoses(
-            cls=cls,
-            name=names,
-            confidence=confidence,
-            box=box,
-            keypoints=keypoints,
-        )
diff --git a/src/datachain/lib/models/ultralytics/segment.py b/src/datachain/lib/models/ultralytics/segment.py
deleted file mode 100644
index 0614e7ed8..000000000
--- a/src/datachain/lib/models/ultralytics/segment.py
+++ /dev/null
@@ -1,121 +0,0 @@
-"""
-This module contains the YOLO models.
-
-YOLO stands for "You Only Look Once", a family of object detection models that
-are designed to be fast and accurate. The models are trained to detect objects
-in images by dividing the image into a grid and predicting the bounding boxes
-and class probabilities for each grid cell.
-
-More information about YOLO can be found here:
-- https://pjreddie.com/darknet/yolo/
-- https://docs.ultralytics.com/
-"""
-
-from io import BytesIO
-from typing import TYPE_CHECKING
-
-from PIL import Image
-from pydantic import Field
-
-from datachain.lib.data_model import DataModel
-from datachain.lib.models.bbox import BBox
-from datachain.lib.models.segment import Segments
-
-if TYPE_CHECKING:
-    from ultralytics.engine.results import Results
-    from ultralytics.models import YOLO
-
-    from datachain.lib.file import File
-
-
-class YoloSegment(DataModel):
-    """
-    A data model for a single YOLO segment.
-
-    Attributes:
-        cls (int): The class of the segment.
-        name (str): The name of the segment.
-        confidence (float): The confidence of the segment.
-        box (BBox): The bounding box of the segment.
-        segments (Segments): The segments of the segment.
-    """
-
-    cls: int = Field(default=-1)
-    name: str = Field(default="")
-    confidence: float = Field(default=0)
-    box: BBox = Field(default=None)
-    segments: Segments = Field(default=None)
-
-    @staticmethod
-    def from_file(yolo: "YOLO", file: "File") -> "YoloSegment":
-        results = yolo(Image.open(BytesIO(file.read())))
-        if len(results) == 0:
-            return YoloSegment()
-        return YoloSegment.from_result(results[0])
-
-    @staticmethod
-    def from_result(result: "Results") -> "YoloSegment":
-        summary = result.summary()
-        if not summary:
-            return YoloSegment()
-        name = summary[0].get("name", "")
-        box = (
-            BBox.from_dict(summary[0]["box"], title=name)
-            if "box" in summary[0]
-            else BBox()
-        )
-        segments = (
-            Segments.from_dict(summary[0]["segments"], title=name)
-            if "segments" in summary[0]
-            else Segments()
-        )
-        return YoloSegment(
-            cls=summary[0]["class"],
-            name=summary[0]["name"],
-            confidence=summary[0]["confidence"],
-            box=box,
-            segments=segments,
-        )
-
-
-class YoloSegments(DataModel):
-    """
-    A data model for a list of YOLO segments.
-
-    Attributes:
-        cls (list[int]): The classes of the segments.
-        name (list[str]): The names of the segments.
-        confidence (list[float]): The confidences of the segments.
-        box (list[BBox]): The bounding boxes of the segments.
-        segments (list[Segments]): The segments of the segments.
-    """
-
-    cls: list[int]
-    name: list[str]
-    confidence: list[float]
-    box: list[BBox]
-    segments: list[Segments]
-
-    @staticmethod
-    def from_file(yolo: "YOLO", file: "File") -> "YoloSegments":
-        results = yolo(Image.open(BytesIO(file.read())))
-        return YoloSegments.from_results(results)
-
-    @staticmethod
-    def from_results(results: list["Results"]) -> "YoloSegments":
-        cls, names, confidence, box, segments = [], [], [], [], []
-        for r in results:
-            for s in r.summary():
-                name = s.get("name", "")
-                cls.append(s["class"])
-                names.append(name)
-                confidence.append(s["confidence"])
-                box.append(BBox.from_dict(s.get("box", {}), title=name))
-                segments.append(Segments.from_dict(s.get("segments", {}), title=name))
-        return YoloSegments(
-            cls=cls,
-            name=names,
-            confidence=confidence,
-            box=box,
-            segments=segments,
-        )
diff --git a/src/datachain/lib/models/yolo.py b/src/datachain/lib/models/yolo.py
new file mode 100644
index 000000000..4231240a6
--- /dev/null
+++ b/src/datachain/lib/models/yolo.py
@@ -0,0 +1,39 @@
+"""
+This module contains the YOLO models.
+
+YOLO stands for "You Only Look Once", a family of object detection models that
+are designed to be fast and accurate. The models are trained to detect objects
+in images by dividing the image into a grid and predicting the bounding boxes
+and class probabilities for each grid cell.
+
+More information about YOLO can be found here:
+- https://pjreddie.com/darknet/yolo/
+- https://docs.ultralytics.com/
+"""
+
+
+class PoseBodyPart:
+    """
+    An enumeration of body parts for YOLO pose keypoints.
+
+    More information about the body parts can be found here:
+    https://docs.ultralytics.com/tasks/pose/
+    """
+
+    nose = 0
+    left_eye = 1
+    right_eye = 2
+    left_ear = 3
+    right_ear = 4
+    left_shoulder = 5
+    right_shoulder = 6
+    left_elbow = 7
+    right_elbow = 8
+    left_wrist = 9
+    right_wrist = 10
+    left_hip = 11
+    right_hip = 12
+    left_knee = 13
+    right_knee = 14
+    left_ankle = 15
+    right_ankle = 16
diff --git a/tests/unit/lib/test_models.py b/tests/unit/lib/test_models.py
index f090f31dd..c3ea2b463 100644
--- a/tests/unit/lib/test_models.py
+++ b/tests/unit/lib/test_models.py
@@ -1,142 +1,50 @@
-import pytest
-
 from datachain.lib import models
-from datachain.lib.models.ultralytics.pose import YoloPoseBodyPart
 
 
-@pytest.mark.parametrize(
-    "bbox",
-    [
-        models.BBox(title="BBox", coords=[0, 1, 2, 3]),
-        models.BBox.from_list([0.3, 1.1, 1.7, 3.4], title="BBox"),
-        models.BBox.from_dict({"x1": 0, "y1": 0.8, "x2": 2.2, "y2": 2.9}, title="BBox"),
-    ],
-)
-def test_bbox(bbox):
+def test_bbox():
+    bbox = models.BBox(title="BBox", x1=0.5, y1=1.5, x2=2.5, y2=3.5)
     assert bbox.model_dump() == {
         "title": "BBox",
-        "coords": [0, 1, 2, 3],
-    }
-
-
-@pytest.mark.parametrize(
-    "obbox",
-    [
-        models.OBBox(title="OBBox", coords=[0, 1, 2, 3, 4, 5, 6, 7]),
-        models.OBBox.from_list([0.3, 1.1, 1.7, 3.4, 4.0, 4.9, 5.6, 7.0], title="OBBox"),
-        models.OBBox.from_dict(
-            {
-                "x1": 0,
-                "y1": 0.8,
-                "x2": 2.2,
-                "y2": 2.9,
-                "x3": 3.9,
-                "y3": 5.4,
-                "x4": 6.0,
-                "y4": 7.4,
-            },
-            title="OBBox",
-        ),
-    ],
-)
-def test_obbox(obbox):
-    assert obbox.model_dump() == {
-        "title": "OBBox",
-        "coords": [0, 1, 2, 3, 4, 5, 6, 7],
+        "x1": 0.5,
+        "y1": 1.5,
+        "x2": 2.5,
+        "y2": 3.5,
     }
 
 
-@pytest.mark.parametrize(
-    "pose",
-    [
-        models.Pose(x=list(range(17)), y=[y * 2 for y in range(17)]),
-        models.Pose.from_list([list(range(17)), [y * 2 for y in range(17)]]),
-        models.Pose.from_dict({"x": list(range(17)), "y": [y * 2 for y in range(17)]}),
-    ],
-)
-def test_pose(pose):
-    assert pose.model_dump() == {
-        "x": [0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16],
-        "y": [0, 2, 4, 6, 8, 10, 12, 14, 16, 18, 20, 22, 24, 26, 28, 30, 32],
-    }
-
+def test_bbox_from_xywh():
+    bbox = models.BBox.from_xywh([0.5, 1.5, 2.5, 3.5])
+    assert bbox.model_dump() == {"title": "", "x1": 0.5, "y1": 1.5, "x2": 3, "y2": 5}
 
-@pytest.mark.parametrize(
-    "pose",
-    [
-        models.Pose3D(
-            x=list(range(17)), y=[y * 2 for y in range(17)], visible=[0.2] * 17
-        ),
-        models.Pose3D.from_list(
-            [list(range(17)), [y * 2 for y in range(17)], [0.2] * 17]
-        ),
-        models.Pose3D.from_dict(
-            {
-                "x": list(range(17)),
-                "y": [y * 2 for y in range(17)],
-                "visible": [0.2] * 17,
-            }
-        ),
-    ],
-)
-def test_pose3d(pose):
-    assert pose.model_dump() == {
-        "x": [0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16],
-        "y": [0, 2, 4, 6, 8, 10, 12, 14, 16, 18, 20, 22, 24, 26, 28, 30, 32],
-        "visible": [
-            0.2,
-            0.2,
-            0.2,
-            0.2,
-            0.2,
-            0.2,
-            0.2,
-            0.2,
-            0.2,
-            0.2,
-            0.2,
-            0.2,
-            0.2,
-            0.2,
-            0.2,
-            0.2,
-            0.2,
-        ],
-    }
-
-
-@pytest.mark.parametrize(
-    "segments",
-    [
-        models.Segments(x=[0, 1, 2], y=[2, 3, 5], title="Segments"),
-        models.Segments.from_list([[0, 1, 2], [2, 3, 5]], title="Segments"),
-        models.Segments.from_dict({"x": [0, 1, 2], "y": [2, 3, 5]}, title="Segments"),
-    ],
-)
-def test_segments(segments):
-    assert segments.model_dump() == {
-        "title": "Segments",
-        "x": [0, 1, 2],
-        "y": [2, 3, 5],
+    bbox = models.BBox.from_xywh([0.5, 1.5, 2.5, 3.5], title="BBox")
+    assert bbox.model_dump() == {
+        "title": "BBox",
+        "x1": 0.5,
+        "y1": 1.5,
+        "x2": 3,
+        "y2": 5,
     }
 
 
-def test_yolo_pose_body_parts():
-    pose = models.Pose(x=list(range(17)), y=list(range(17)))
-    assert pose.x[YoloPoseBodyPart.nose] == 0
-    assert pose.x[YoloPoseBodyPart.left_eye] == 1
-    assert pose.x[YoloPoseBodyPart.right_eye] == 2
-    assert pose.x[YoloPoseBodyPart.left_ear] == 3
-    assert pose.x[YoloPoseBodyPart.right_ear] == 4
-    assert pose.x[YoloPoseBodyPart.left_shoulder] == 5
-    assert pose.x[YoloPoseBodyPart.right_shoulder] == 6
-    assert pose.x[YoloPoseBodyPart.left_elbow] == 7
-    assert pose.x[YoloPoseBodyPart.right_elbow] == 8
-    assert pose.x[YoloPoseBodyPart.left_wrist] == 9
-    assert pose.x[YoloPoseBodyPart.right_wrist] == 10
-    assert pose.x[YoloPoseBodyPart.left_hip] == 11
-    assert pose.x[YoloPoseBodyPart.right_hip] == 12
-    assert pose.x[YoloPoseBodyPart.left_knee] == 13
-    assert pose.x[YoloPoseBodyPart.right_knee] == 14
-    assert pose.x[YoloPoseBodyPart.left_ankle] == 15
-    assert pose.x[YoloPoseBodyPart.right_ankle] == 16
+def test_pose():
+    x = [x * 0.5 for x in range(17)]
+    y = [y * 1.5 for y in range(17)]
+    pose = models.Pose(x=x, y=y)
+    assert pose.model_dump() == {"x": x, "y": y}
+    assert pose.x[models.yolo.PoseBodyPart.nose] == 0
+    assert pose.x[models.yolo.PoseBodyPart.left_eye] == 0.5
+    assert pose.x[models.yolo.PoseBodyPart.right_eye] == 1
+    assert pose.x[models.yolo.PoseBodyPart.left_ear] == 1.5
+    assert pose.x[models.yolo.PoseBodyPart.right_ear] == 2
+    assert pose.x[models.yolo.PoseBodyPart.left_shoulder] == 2.5
+    assert pose.x[models.yolo.PoseBodyPart.right_shoulder] == 3
+    assert pose.x[models.yolo.PoseBodyPart.left_elbow] == 3.5
+    assert pose.x[models.yolo.PoseBodyPart.right_elbow] == 4
+    assert pose.x[models.yolo.PoseBodyPart.left_wrist] == 4.5
+    assert pose.x[models.yolo.PoseBodyPart.right_wrist] == 5
+    assert pose.x[models.yolo.PoseBodyPart.left_hip] == 5.5
+    assert pose.x[models.yolo.PoseBodyPart.right_hip] == 6
+    assert pose.x[models.yolo.PoseBodyPart.left_knee] == 6.5
+    assert pose.x[models.yolo.PoseBodyPart.right_knee] == 7
+    assert pose.x[models.yolo.PoseBodyPart.left_ankle] == 7.5
+    assert pose.x[models.yolo.PoseBodyPart.right_ankle] == 8