Merge branch 'main' into main

2 weeks ago · 4dc4700ce4
parent 0f640086dd cece2ee2cf
commit 4dc4700ce4
55 changed files with 790 additions and 583 deletions
--- a/.github/ISSUE_TEMPLATE/bug-report.yml
+++ b/.github/ISSUE_TEMPLATE/bug-report.yml
@ -52,9 +52,9 @@ body:
  - type: textarea
    attributes:
      label: Environment
-      description: Many issues are often related to dependency versions and hardware. Please provide the output of `yolo checks` or `ultralytics.checks()` command to help us diagnose the problem.
+      description: Many issues are often related to dependency versions and hardware. Please provide the output of `yolo checks` (CLI) or `ultralytics.utils.checks.collect_system_info()` (Python) command to help us diagnose the problem.
      placeholder: |
-        Paste output of `yolo checks` or `ultralytics.checks()` command, i.e.:
+        Paste output of `yolo checks` (CLI) or `ultralytics.utils.checks.collect_system_info()` (Python) command, i.e.:
        ```
        Ultralytics 8.3.2 🚀 Python-3.11.2 torch-2.4.1 CPU (Apple M3)
        Setup complete ✅ (8 CPUs, 16.0 GB RAM, 266.5/460.4 GB disk)
--- a/.github/workflows/docker.yaml
+++ b/.github/workflows/docker.yaml
@ -134,12 +134,12 @@ jobs:
      - name: Build Image
        if: github.event_name == 'push' || github.event.inputs[matrix.dockerfile] == 'true'
-        uses: nick-invision/retry@v3
+        uses: ultralytics/actions/retry@main
        with:
          timeout_minutes: 120
-          retry_wait_seconds: 60
+          retry_delay_seconds: 60
-          max_attempts: 3 # retry twice
+          retries: 2
-          command: |
+          run: |
            docker build \
            --platform ${{ matrix.platforms }} \
            -f docker/${{ matrix.dockerfile }} \
@ -172,7 +172,7 @@ jobs:
          fi
          if [[ "${{ matrix.tags }}" == "latest-python" ]]; then
            t=ultralytics/ultralytics:latest-jupyter
-            v=ultralytics/ultralytics:${{ steps.get_version.outputs.version_tag }}-jupyter
+            v=ultralytics/ultralytics:${{ steps.get_version.outputs.version }}-jupyter
            docker build -f docker/Dockerfile-jupyter -t $t -t $v .
            docker push $t
            if [[ "${{ steps.check_tag.outputs.new_release }}" == "true" ]]; then
--- a/.github/workflows/links.yml
+++ b/.github/workflows/links.yml
@ -29,12 +29,12 @@ jobs:
          sudo mv lychee /usr/local/bin
      - name: Test Markdown and HTML links with retry
-        uses: nick-invision/retry@v3
+        uses: ultralytics/actions/retry@main
        with:
-          timeout_minutes: 5
+          timeout_minutes: 60
-          retry_wait_seconds: 60
+          retry_delay_seconds: 300
-          max_attempts: 3
+          retries: 2
-          command: |
+          run: |
            lychee \
            --scheme https \
            --timeout 60 \
@ -59,12 +59,12 @@ jobs:
      - name: Test Markdown, HTML, YAML, Python and Notebook links with retry
        if: github.event_name == 'workflow_dispatch'
-        uses: nick-invision/retry@v3
+        uses: ultralytics/actions/retry@main
        with:
-          timeout_minutes: 5
+          timeout_minutes: 60
-          retry_wait_seconds: 60
+          retry_delay_seconds: 300
-          max_attempts: 3
+          retries: 2
-          command: |
+          run: |
            lychee \
            --scheme https \
            --timeout 60 \
--- a/.gitignore
+++ b/.gitignore
@ -163,6 +163,7 @@ weights/
 *_openvino_model/
 *_paddle_model/
 *_ncnn_model/
 *_imx_model/
 pnnx*
 # Autogenerated files for tests
--- a/README.md
+++ b/README.md
@ -8,7 +8,7 @@
 <div>
    <a href="https://github.com/ultralytics/ultralytics/actions/workflows/ci.yaml"><img src="https://github.com/ultralytics/ultralytics/actions/workflows/ci.yaml/badge.svg" alt="Ultralytics CI"></a>
-    <a href="https://pepy.tech/project/ultralytics"><img src="https://static.pepy.tech/badge/ultralytics" alt="Ultralytics Downloads"></a>
+    <a href="https://www.pepy.tech/projects/ultralytics"><img src="https://static.pepy.tech/badge/ultralytics" alt="Ultralytics Downloads"></a>
    <a href="https://zenodo.org/badge/latestdoi/264818686"><img src="https://zenodo.org/badge/264818686.svg" alt="Ultralytics YOLO Citation"></a>
    <a href="https://discord.com/invite/ultralytics"><img alt="Ultralytics Discord" src="https://img.shields.io/discord/1089800235347353640?logo=discord&logoColor=white&label=Discord&color=blue"></a>
    <a href="https://community.ultralytics.com/"><img alt="Ultralytics Forums" src="https://img.shields.io/discourse/users?server=https%3A%2F%2Fcommunity.ultralytics.com&logo=discourse&label=Forums&color=blue"></a>
@ -55,7 +55,7 @@ See below for a quickstart install and usage examples, and see our [Docs](https:
 Pip install the ultralytics package including all [requirements](https://github.com/ultralytics/ultralytics/blob/main/pyproject.toml) in a [**Python>=3.8**](https://www.python.org/) environment with [**PyTorch>=1.8**](https://pytorch.org/get-started/locally/).
-[![PyPI - Version](https://img.shields.io/pypi/v/ultralytics?logo=pypi&logoColor=white)](https://pypi.org/project/ultralytics/) [![Ultralytics Downloads](https://static.pepy.tech/badge/ultralytics)](https://pepy.tech/project/ultralytics) [![PyPI - Python Version](https://img.shields.io/pypi/pyversions/ultralytics?logo=python&logoColor=gold)](https://pypi.org/project/ultralytics/)
+[![PyPI - Version](https://img.shields.io/pypi/v/ultralytics?logo=pypi&logoColor=white)](https://pypi.org/project/ultralytics/) [![Ultralytics Downloads](https://static.pepy.tech/badge/ultralytics)](https://www.pepy.tech/projects/ultralytics) [![PyPI - Python Version](https://img.shields.io/pypi/pyversions/ultralytics?logo=python&logoColor=gold)](https://pypi.org/project/ultralytics/)
 ```bash
 pip install ultralytics
--- a/README.zh-CN.md
+++ b/README.zh-CN.md
@ -8,7 +8,7 @@
 <div>
    <a href="https://github.com/ultralytics/ultralytics/actions/workflows/ci.yaml"><img src="https://github.com/ultralytics/ultralytics/actions/workflows/ci.yaml/badge.svg" alt="Ultralytics CI"></a>
-    <a href="https://pepy.tech/project/ultralytics"><img src="https://static.pepy.tech/badge/ultralytics" alt="Ultralytics Downloads"></a>
+    <a href="https://www.pepy.tech/projects/ultralytics"><img src="https://static.pepy.tech/badge/ultralytics" alt="Ultralytics Downloads"></a>
    <a href="https://zenodo.org/badge/latestdoi/264818686"><img src="https://zenodo.org/badge/264818686.svg" alt="Ultralytics YOLO Citation"></a>
    <a href="https://discord.com/invite/ultralytics"><img alt="Ultralytics Discord" src="https://img.shields.io/discord/1089800235347353640?logo=discord&logoColor=white&label=Discord&color=blue"></a>
    <a href="https://community.ultralytics.com/"><img alt="Ultralytics Forums" src="https://img.shields.io/discourse/users?server=https%3A%2F%2Fcommunity.ultralytics.com&logo=discourse&label=Forums&color=blue"></a>
@ -55,7 +55,7 @@
 在 [**Python>=3.8**](https://www.python.org/) 环境中使用 [**PyTorch>=1.8**](https://pytorch.org/get-started/locally/) 通过 pip 安装包含所有[依赖项](https://github.com/ultralytics/ultralytics/blob/main/pyproject.toml) 的 ultralytics 包。
-[![PyPI - Version](https://img.shields.io/pypi/v/ultralytics?logo=pypi&logoColor=white)](https://pypi.org/project/ultralytics/) [![Ultralytics Downloads](https://static.pepy.tech/badge/ultralytics)](https://pepy.tech/project/ultralytics) [![PyPI - Python Version](https://img.shields.io/pypi/pyversions/ultralytics?logo=python&logoColor=gold)](https://pypi.org/project/ultralytics/)
+[![PyPI - Version](https://img.shields.io/pypi/v/ultralytics?logo=pypi&logoColor=white)](https://pypi.org/project/ultralytics/) [![Ultralytics Downloads](https://static.pepy.tech/badge/ultralytics)](https://www.pepy.tech/projects/ultralytics) [![PyPI - Python Version](https://img.shields.io/pypi/pyversions/ultralytics?logo=python&logoColor=gold)](https://pypi.org/project/ultralytics/)
 ```bash
 pip install ultralytics
--- a/docker/Dockerfile-jupyter
+++ b/docker/Dockerfile-jupyter
@ -17,7 +17,7 @@ RUN mkdir /data/weights && /usr/local/bin/yolo settings weights_dir="/data/weigh
 RUN mkdir /data/runs && /usr/local/bin/yolo settings runs_dir="/data/runs"
 # Start JupyterLab with tutorial notebook
-ENTRYPOINT ["/usr/local/bin/jupyter", "lab", "--allow-root", "/ultralytics/examples/tutorial.ipynb"]
+ENTRYPOINT ["/usr/local/bin/jupyter", "lab", "--allow-root", "--ip=*", "/ultralytics/examples/tutorial.ipynb"]
 # Usage Examples -------------------------------------------------------------------------------------------------------
--- a/docs/README.md
+++ b/docs/README.md
@ -15,7 +15,7 @@
 ## 🛠️ Installation
 [![PyPI - Version](https://img.shields.io/pypi/v/ultralytics?logo=pypi&logoColor=white)](https://pypi.org/project/ultralytics/)
-[![Downloads](https://static.pepy.tech/badge/ultralytics)](https://pepy.tech/project/ultralytics)
+[![Downloads](https://static.pepy.tech/badge/ultralytics)](https://www.pepy.tech/projects/ultralytics)
 [![PyPI - Python Version](https://img.shields.io/pypi/pyversions/ultralytics?logo=python&logoColor=gold)](https://pypi.org/project/ultralytics/)
 To install the ultralytics package in developer mode, ensure you have Git and Python 3 installed on your system. Then, follow these steps:
--- a/docs/en/guides/analytics.md
+++ b/docs/en/guides/analytics.md
@ -45,126 +45,15 @@ This guide provides a comprehensive overview of three fundamental types of [data
        # generate the pie chart
        yolo solutions analytics analytics_type="pie" show=True
        ```
    === "Python"
        ```python
        import cv2
        from ultralytics import solutions
        cap = cv2.VideoCapture("Path/to/video/file.mp4")
        assert cap.isOpened(), "Error reading video file"
        w, h, fps = (int(cap.get(x)) for x in (cv2.CAP_PROP_FRAME_WIDTH, cv2.CAP_PROP_FRAME_HEIGHT, cv2.CAP_PROP_FPS))
        out = cv2.VideoWriter(
            "ultralytics_analytics.avi",
            cv2.VideoWriter_fourcc(*"MJPG"),
            fps,
            (1920, 1080),  # This is fixed
        )
        analytics = solutions.Analytics(
            analytics_type="line",
            show=True,
        )
        frame_count = 0
        while cap.isOpened():
            success, im0 = cap.read()
            if success:
                frame_count += 1
                im0 = analytics.process_data(im0, frame_count)  # update analytics graph every frame
                out.write(im0)  # write the video file
            else:
                break
        cap.release()
        out.release()
        cv2.destroyAllWindows()
        ```
    === "Pie Chart"
        ```python
        import cv2
        from ultralytics import solutions
        cap = cv2.VideoCapture("Path/to/video/file.mp4")
        assert cap.isOpened(), "Error reading video file"
        w, h, fps = (int(cap.get(x)) for x in (cv2.CAP_PROP_FRAME_WIDTH, cv2.CAP_PROP_FRAME_HEIGHT, cv2.CAP_PROP_FPS))
        out = cv2.VideoWriter(
            "ultralytics_analytics.avi",
            cv2.VideoWriter_fourcc(*"MJPG"),
            fps,
            (1920, 1080),  # This is fixed
        )
-        analytics = solutions.Analytics(
+        # generate the bar plots
-            analytics_type="pie",
+        yolo solutions analytics analytics_type="bar" show=True
            show=True,
        )
        frame_count = 0
        while cap.isOpened():
            success, im0 = cap.read()
            if success:
                frame_count += 1
                im0 = analytics.process_data(im0, frame_count)  # update analytics graph every frame
                out.write(im0)  # write the video file
            else:
                break
        cap.release()
        out.release()
        cv2.destroyAllWindows()
        ```
    === "Bar Plot"
        ```python
        import cv2
        from ultralytics import solutions
        cap = cv2.VideoCapture("Path/to/video/file.mp4")
        assert cap.isOpened(), "Error reading video file"
        w, h, fps = (int(cap.get(x)) for x in (cv2.CAP_PROP_FRAME_WIDTH, cv2.CAP_PROP_FRAME_HEIGHT, cv2.CAP_PROP_FPS))
        out = cv2.VideoWriter(
            "ultralytics_analytics.avi",
            cv2.VideoWriter_fourcc(*"MJPG"),
            fps,
            (1920, 1080),  # This is fixed
        )
-        analytics = solutions.Analytics(
+        # generate the area plots
-            analytics_type="bar",
+        yolo solutions analytics analytics_type="area" show=True
            show=True,
        )
        frame_count = 0
        while cap.isOpened():
            success, im0 = cap.read()
            if success:
                frame_count += 1
                im0 = analytics.process_data(im0, frame_count)  # update analytics graph every frame
                out.write(im0)  # write the video file
            else:
                break
        cap.release()
        out.release()
        cv2.destroyAllWindows()
        ```
-    === "Area chart"
+    === "Python"
        ```python
        import cv2
@ -173,9 +62,9 @@ This guide provides a comprehensive overview of three fundamental types of [data
        cap = cv2.VideoCapture("Path/to/video/file.mp4")
        assert cap.isOpened(), "Error reading video file"
        w, h, fps = (int(cap.get(x)) for x in (cv2.CAP_PROP_FRAME_WIDTH, cv2.CAP_PROP_FRAME_HEIGHT, cv2.CAP_PROP_FPS))
        # Video writer
        out = cv2.VideoWriter(
            "ultralytics_analytics.avi",
            cv2.VideoWriter_fourcc(*"MJPG"),
@ -183,11 +72,15 @@ This guide provides a comprehensive overview of three fundamental types of [data
            (1920, 1080),  # This is fixed
        )
        # Init analytics
        analytics = solutions.Analytics(
-            analytics_type="area",
+            show=True,  # Display the output
-            show=True,
+            analytics_type="line",  # Pass the analytics type, could be "pie", "bar" or "area".
            model="yolo11n.pt",  # Path to the YOLO11 model file
            # classes=[0, 2],  # If you want to count specific classes i.e person and car with COCO pretrained model.
        )
        # Process video
        frame_count = 0
        while cap.isOpened():
            success, im0 = cap.read()
--- a/docs/en/guides/distance-calculation.md
+++ b/docs/en/guides/distance-calculation.md
@ -55,6 +55,7 @@ Measuring the gap between two objects is known as distance calculation within a
        # Init distance-calculation obj
        distance = solutions.DistanceCalculation(model="yolo11n.pt", show=True)
        # Process video
        while cap.isOpened():
            success, im0 = cap.read()
            if not success:
--- a/docs/en/guides/heatmaps.md
+++ b/docs/en/guides/heatmaps.md
@ -47,119 +47,12 @@ A heatmap generated with [Ultralytics YOLO11](https://github.com/ultralytics/ult
        # Pass a custom colormap
        yolo solutions heatmap colormap=cv2.COLORMAP_INFERNO
        ```
    === "Python"
        ```python
        import cv2
        from ultralytics import solutions
        cap = cv2.VideoCapture("Path/to/video/file.mp4")
        assert cap.isOpened(), "Error reading video file"
        w, h, fps = (int(cap.get(x)) for x in (cv2.CAP_PROP_FRAME_WIDTH, cv2.CAP_PROP_FRAME_HEIGHT, cv2.CAP_PROP_FPS))
        # Video writer
        video_writer = cv2.VideoWriter("heatmap_output.avi", cv2.VideoWriter_fourcc(*"mp4v"), fps, (w, h))
        # Init heatmap
        heatmap = solutions.Heatmap(
            show=True,
            model="yolo11n.pt",
            colormap=cv2.COLORMAP_PARULA,
        )
        while cap.isOpened():
            success, im0 = cap.read()
            if not success:
                print("Video frame is empty or video processing has been successfully completed.")
                break
            im0 = heatmap.generate_heatmap(im0)
            video_writer.write(im0)
        cap.release()
        video_writer.release()
        cv2.destroyAllWindows()
        ```
    === "Line Counting"
        ```python
        import cv2
        from ultralytics import solutions
        cap = cv2.VideoCapture("Path/to/video/file.mp4")
        assert cap.isOpened(), "Error reading video file"
        w, h, fps = (int(cap.get(x)) for x in (cv2.CAP_PROP_FRAME_WIDTH, cv2.CAP_PROP_FRAME_HEIGHT, cv2.CAP_PROP_FPS))
        # Video writer
        video_writer = cv2.VideoWriter("heatmap_output.avi", cv2.VideoWriter_fourcc(*"mp4v"), fps, (w, h))
-        # line for object counting
+        # Heatmaps + object counting
-        line_points = [(20, 400), (1080, 404)]
+        yolo solutions heatmap region=[(20, 400), (1080, 404), (1080, 360), (20, 360)]
        # Init heatmap
        heatmap = solutions.Heatmap(
            show=True,
            model="yolo11n.pt",
            colormap=cv2.COLORMAP_PARULA,
            region=line_points,
        )
        while cap.isOpened():
            success, im0 = cap.read()
            if not success:
                print("Video frame is empty or video processing has been successfully completed.")
                break
            im0 = heatmap.generate_heatmap(im0)
            video_writer.write(im0)
        cap.release()
        video_writer.release()
        cv2.destroyAllWindows()
        ```
-    === "Polygon Counting"
+    === "Python"
        ```python
        import cv2
        from ultralytics import solutions
        cap = cv2.VideoCapture("Path/to/video/file.mp4")
        assert cap.isOpened(), "Error reading video file"
        w, h, fps = (int(cap.get(x)) for x in (cv2.CAP_PROP_FRAME_WIDTH, cv2.CAP_PROP_FRAME_HEIGHT, cv2.CAP_PROP_FPS))
        # Video writer
        video_writer = cv2.VideoWriter("heatmap_output.avi", cv2.VideoWriter_fourcc(*"mp4v"), fps, (w, h))
        # Define polygon points
        region_points = [(20, 400), (1080, 404), (1080, 360), (20, 360), (20, 400)]
        # Init heatmap
        heatmap = solutions.Heatmap(
            show=True,
            model="yolo11n.pt",
            colormap=cv2.COLORMAP_PARULA,
            region=region_points,
        )
        while cap.isOpened():
            success, im0 = cap.read()
            if not success:
                print("Video frame is empty or video processing has been successfully completed.")
                break
            im0 = heatmap.generate_heatmap(im0)
            video_writer.write(im0)
        cap.release()
        video_writer.release()
        cv2.destroyAllWindows()
        ```
    === "Region Counting"
        ```python
        import cv2
@ -173,51 +66,24 @@ A heatmap generated with [Ultralytics YOLO11](https://github.com/ultralytics/ult
        # Video writer
        video_writer = cv2.VideoWriter("heatmap_output.avi", cv2.VideoWriter_fourcc(*"mp4v"), fps, (w, h))
-        # Define region points
+        # In case you want to apply object counting + heatmaps, you can pass region points.
-        region_points = [(20, 400), (1080, 404), (1080, 360), (20, 360)]
+        # region_points = [(20, 400), (1080, 404)]  # Define line points
-
+        # region_points = [(20, 400), (1080, 404), (1080, 360), (20, 360)]  # Define region points
-        # Init heatmap
+        # region_points = [(20, 400), (1080, 404), (1080, 360), (20, 360), (20, 400)]  # Define polygon points
        heatmap = solutions.Heatmap(
            show=True,
            model="yolo11n.pt",
            colormap=cv2.COLORMAP_PARULA,
            region=region_points,
        )
        while cap.isOpened():
            success, im0 = cap.read()
            if not success:
                print("Video frame is empty or video processing has been successfully completed.")
                break
            im0 = heatmap.generate_heatmap(im0)
            video_writer.write(im0)
        cap.release()
        video_writer.release()
        cv2.destroyAllWindows()
        ```
    === "Specific Classes"
        ```python
        import cv2
        from ultralytics import solutions
        cap = cv2.VideoCapture("Path/to/video/file.mp4")
        assert cap.isOpened(), "Error reading video file"
        w, h, fps = (int(cap.get(x)) for x in (cv2.CAP_PROP_FRAME_WIDTH, cv2.CAP_PROP_FRAME_HEIGHT, cv2.CAP_PROP_FPS))
        # Video writer
        video_writer = cv2.VideoWriter("heatmap_output.avi", cv2.VideoWriter_fourcc(*"mp4v"), fps, (w, h))
        # Init heatmap
        heatmap = solutions.Heatmap(
-            show=True,
+            show=True,  # Display the output
-            model="yolo11n.pt",
+            model="yolo11n.pt",  # Path to the YOLO11 model file
-            classes=[0, 2],
+            colormap=cv2.COLORMAP_PARULA,  # Colormap of heatmap
            # region=region_points,  # If you want to do object counting with heatmaps, you can pass region_points
            # classes=[0, 2],  # If you want to generate heatmap for specific classes i.e person and car.
            # show_in=True,  # Display in counts
            # show_out=True,  # Display out counts
            # line_width=2,  # Adjust the line width for bounding boxes and text display
        )
        # Process video
        while cap.isOpened():
            success, im0 = cap.read()
            if not success:
--- a/docs/en/guides/object-counting.md
+++ b/docs/en/guides/object-counting.md
@ -19,7 +19,7 @@ Object counting with [Ultralytics YOLO11](https://github.com/ultralytics/ultraly
        allowfullscreen>
      </iframe>
      <br>
-      <strong>Watch:</strong> Object Counting using Ultralytics YOLO11
+      <strong>Watch:</strong> Object Counting using Ultralytics YOLOv8
    </td>
    <td align="center">
      <iframe loading="lazy" width="720" height="405" src="https://www.youtube.com/embed/Fj9TStNBVoY"
@ -73,165 +73,22 @@ Object counting with [Ultralytics YOLO11](https://github.com/ultralytics/ultraly
        w, h, fps = (int(cap.get(x)) for x in (cv2.CAP_PROP_FRAME_WIDTH, cv2.CAP_PROP_FRAME_HEIGHT, cv2.CAP_PROP_FPS))
        # Define region points
-        region_points = [(20, 400), (1080, 404), (1080, 360), (20, 360)]
+        # region_points = [(20, 400), (1080, 400)]  # For line counting
-
+        region_points = [(20, 400), (1080, 404), (1080, 360), (20, 360)]  # For rectangle region counting
-        # Video writer
+        # region_points = [(20, 400), (1080, 404), (1080, 360), (20, 360), (20, 400)]  # For polygon region counting
        video_writer = cv2.VideoWriter("object_counting_output.avi", cv2.VideoWriter_fourcc(*"mp4v"), fps, (w, h))
        # Init Object Counter
        counter = solutions.ObjectCounter(
            show=True,
            region=region_points,
            model="yolo11n.pt",
        )
        # Process video
        while cap.isOpened():
            success, im0 = cap.read()
            if not success:
                print("Video frame is empty or video processing has been successfully completed.")
                break
            im0 = counter.count(im0)
            video_writer.write(im0)
        cap.release()
        video_writer.release()
        cv2.destroyAllWindows()
        ```
    === "OBB Object Counting"
        ```python
        import cv2
        from ultralytics import solutions
        cap = cv2.VideoCapture("path/to/video/file.mp4")
        assert cap.isOpened(), "Error reading video file"
        w, h, fps = (int(cap.get(x)) for x in (cv2.CAP_PROP_FRAME_WIDTH, cv2.CAP_PROP_FRAME_HEIGHT, cv2.CAP_PROP_FPS))
        # line or region points
        line_points = [(20, 400), (1080, 400)]
        # Video writer
        video_writer = cv2.VideoWriter("object_counting_output.avi", cv2.VideoWriter_fourcc(*"mp4v"), fps, (w, h))
        # Init Object Counter
        counter = solutions.ObjectCounter(
            show=True,
            region=line_points,
            model="yolo11n-obb.pt",
        )
        # Process video
        while cap.isOpened():
            success, im0 = cap.read()
            if not success:
                print("Video frame is empty or video processing has been successfully completed.")
                break
            im0 = counter.count(im0)
            video_writer.write(im0)
        cap.release()
        video_writer.release()
        cv2.destroyAllWindows()
        ```
    === "Count in Polygon"
        ```python
        import cv2
        from ultralytics import solutions
        cap = cv2.VideoCapture("path/to/video/file.mp4")
        assert cap.isOpened(), "Error reading video file"
        w, h, fps = (int(cap.get(x)) for x in (cv2.CAP_PROP_FRAME_WIDTH, cv2.CAP_PROP_FRAME_HEIGHT, cv2.CAP_PROP_FPS))
        # Define region points
        region_points = [(20, 400), (1080, 404), (1080, 360), (20, 360), (20, 400)]
        # Video writer
        video_writer = cv2.VideoWriter("object_counting_output.avi", cv2.VideoWriter_fourcc(*"mp4v"), fps, (w, h))
        # Init Object Counter
        counter = solutions.ObjectCounter(
            show=True,
            region=region_points,
            model="yolo11n.pt",
        )
        # Process video
        while cap.isOpened():
            success, im0 = cap.read()
            if not success:
                print("Video frame is empty or video processing has been successfully completed.")
                break
            im0 = counter.count(im0)
            video_writer.write(im0)
        cap.release()
        video_writer.release()
        cv2.destroyAllWindows()
        ```
    === "Count in Line"
        ```python
        import cv2
        from ultralytics import solutions
        cap = cv2.VideoCapture("path/to/video/file.mp4")
        assert cap.isOpened(), "Error reading video file"
        w, h, fps = (int(cap.get(x)) for x in (cv2.CAP_PROP_FRAME_WIDTH, cv2.CAP_PROP_FRAME_HEIGHT, cv2.CAP_PROP_FPS))
        # Define region points
        line_points = [(20, 400), (1080, 400)]
        # Video writer
        video_writer = cv2.VideoWriter("object_counting_output.avi", cv2.VideoWriter_fourcc(*"mp4v"), fps, (w, h))
        # Init Object Counter
        counter = solutions.ObjectCounter(
            show=True,
            region=line_points,
            model="yolo11n.pt",
        )
        # Process video
        while cap.isOpened():
            success, im0 = cap.read()
            if not success:
                print("Video frame is empty or video processing has been successfully completed.")
                break
            im0 = counter.count(im0)
            video_writer.write(im0)
        cap.release()
        video_writer.release()
        cv2.destroyAllWindows()
        ```
    === "Specific Classes"
        ```python
        import cv2
        from ultralytics import solutions
        cap = cv2.VideoCapture("path/to/video/file.mp4")
        assert cap.isOpened(), "Error reading video file"
        w, h, fps = (int(cap.get(x)) for x in (cv2.CAP_PROP_FRAME_WIDTH, cv2.CAP_PROP_FRAME_HEIGHT, cv2.CAP_PROP_FPS))
        # Video writer
        video_writer = cv2.VideoWriter("object_counting_output.avi", cv2.VideoWriter_fourcc(*"mp4v"), fps, (w, h))
        # Init Object Counter
        counter = solutions.ObjectCounter(
-            show=True,
+            show=True,  # Display the output
-            model="yolo11n.pt",
+            region=region_points,  # Pass region points
-            classes=[0, 1],
+            model="yolo11n.pt",  # model="yolo11n-obb.pt" for object counting using YOLO11 OBB model.
            # classes=[0, 2],  # If you want to count specific classes i.e person and car with COCO pretrained model.
            # show_in=True,  # Display in counts
            # show_out=True,  # Display out counts
            # line_width=2,  # Adjust the line width for bounding boxes and text display
        )
        # Process video
--- a/docs/en/guides/queue-management.md
+++ b/docs/en/guides/queue-management.md
@ -60,53 +60,23 @@ Queue management using [Ultralytics YOLO11](https://github.com/ultralytics/ultra
        assert cap.isOpened(), "Error reading video file"
        w, h, fps = (int(cap.get(x)) for x in (cv2.CAP_PROP_FRAME_WIDTH, cv2.CAP_PROP_FRAME_HEIGHT, cv2.CAP_PROP_FPS))
        # Video writer
        video_writer = cv2.VideoWriter("queue_management.avi", cv2.VideoWriter_fourcc(*"mp4v"), fps, (w, h))
-        queue_region = [(20, 400), (1080, 404), (1080, 360), (20, 360)]
+        # Define queue region points
        queue_region = [(20, 400), (1080, 404), (1080, 360), (20, 360)]  # Define queue region points
        # queue_region = [(20, 400), (1080, 404), (1080, 360), (20, 360), (20, 400)]  # Define queue polygon points
        # Init Queue Manager
        queue = solutions.QueueManager(
-            model="yolo11n.pt",
+            show=True,  # Display the output
-            region=queue_region,
+            model="yolo11n.pt",  # Path to the YOLO11 model file
-        )
+            region=queue_region,  # Pass queue region points
-
+            # classes=[0, 2],  # If you want to count specific classes i.e person and car with COCO pretrained model.
-        while cap.isOpened():
+            # line_width=2,  # Adjust the line width for bounding boxes and text display
            success, im0 = cap.read()
            if success:
                out = queue.process_queue(im0)
                video_writer.write(im0)
                if cv2.waitKey(1) & 0xFF == ord("q"):
                    break
                continue
            print("Video frame is empty or video processing has been successfully completed.")
            break
        cap.release()
        cv2.destroyAllWindows()
        ```
    === "Queue Manager Specific Classes"
        ```python
        import cv2
        from ultralytics import solutions
        cap = cv2.VideoCapture("Path/to/video/file.mp4")
        assert cap.isOpened(), "Error reading video file"
        w, h, fps = (int(cap.get(x)) for x in (cv2.CAP_PROP_FRAME_WIDTH, cv2.CAP_PROP_FRAME_HEIGHT, cv2.CAP_PROP_FPS))
        video_writer = cv2.VideoWriter("queue_management.avi", cv2.VideoWriter_fourcc(*"mp4v"), fps, (w, h))
        queue_region = [(20, 400), (1080, 404), (1080, 360), (20, 360)]
        queue = solutions.QueueManager(
            model="yolo11n.pt",
            classes=3,
        )
        # Process video
        while cap.isOpened():
            success, im0 = cap.read()
--- a/docs/en/guides/speed-estimation.md
+++ b/docs/en/guides/speed-estimation.md
@ -61,16 +61,24 @@ keywords: Ultralytics YOLO11, speed estimation, object tracking, computer vision
        from ultralytics import solutions
        cap = cv2.VideoCapture("Path/to/video/file.mp4")
        assert cap.isOpened(), "Error reading video file"
        w, h, fps = (int(cap.get(x)) for x in (cv2.CAP_PROP_FRAME_WIDTH, cv2.CAP_PROP_FRAME_HEIGHT, cv2.CAP_PROP_FPS))
        # Video writer
        video_writer = cv2.VideoWriter("speed_management.avi", cv2.VideoWriter_fourcc(*"mp4v"), fps, (w, h))
        # Define speed region points
        speed_region = [(20, 400), (1080, 404), (1080, 360), (20, 360)]
-        speed = solutions.SpeedEstimator(model="yolo11n.pt", region=speed_region, show=True)
+        speed = solutions.SpeedEstimator(
            show=True,  # Display the output
            model="yolo11n-pose.pt",  # Path to the YOLO11 model file.
            region=speed_region,  # Pass region points
            # classes=[0, 2],  # If you want to estimate speed of specific classes.
            # line_width=2,  # Adjust the line width for bounding boxes and text display
        )
        # Process video
        while cap.isOpened():
            success, im0 = cap.read()
--- a/docs/en/guides/streamlit-live-inference.md
+++ b/docs/en/guides/streamlit-live-inference.md
@ -40,6 +40,12 @@ Streamlit makes it simple to build and deploy interactive web applications. Comb
 !!! example "Streamlit Application"
    === "CLI"
        ```bash
        yolo streamlit-predict
        ```
    === "Python"
        ```python
@ -50,12 +56,6 @@ Streamlit makes it simple to build and deploy interactive web applications. Comb
        ### Make sure to run the file using command `streamlit run <file-name.py>`
        ```
    === "CLI"
        ```bash
        yolo streamlit-predict
        ```
 This will launch the Streamlit application in your default web browser. You will see the main title, subtitle, and the sidebar with configuration options. Select your desired YOLO11 model, set the confidence and NMS thresholds, and click the "Start" button to begin the real-time object detection.
 You can optionally supply a specific model in Python:
--- a/docs/en/guides/workouts-monitoring.md
+++ b/docs/en/guides/workouts-monitoring.md
@ -60,40 +60,18 @@ Monitoring workouts through pose estimation with [Ultralytics YOLO11](https://gi
        assert cap.isOpened(), "Error reading video file"
        w, h, fps = (int(cap.get(x)) for x in (cv2.CAP_PROP_FRAME_WIDTH, cv2.CAP_PROP_FRAME_HEIGHT, cv2.CAP_PROP_FPS))
-        gym = solutions.AIGym(
+        # Video writer
            model="yolo11n-pose.pt",
            show=True,
            kpts=[6, 8, 10],
        )
        while cap.isOpened():
            success, im0 = cap.read()
            if not success:
                print("Video frame is empty or video processing has been successfully completed.")
                break
            im0 = gym.monitor(im0)
        cv2.destroyAllWindows()
        ```
    === "Workouts Monitoring with Save Output"
        ```python
        import cv2
        from ultralytics import solutions
        cap = cv2.VideoCapture("path/to/video/file.mp4")
        assert cap.isOpened(), "Error reading video file"
        w, h, fps = (int(cap.get(x)) for x in (cv2.CAP_PROP_FRAME_WIDTH, cv2.CAP_PROP_FRAME_HEIGHT, cv2.CAP_PROP_FPS))
        video_writer = cv2.VideoWriter("workouts.avi", cv2.VideoWriter_fourcc(*"mp4v"), fps, (w, h))
        # Init AIGym
        gym = solutions.AIGym(
-            show=True,
+            show=True,  # Display the frame
-            kpts=[6, 8, 10],
+            kpts=[6, 8, 10],  # keypoints index of person for monitoring specific exercise, by default it's for pushup
            model="yolo11n-pose.pt",  # Path to the YOLO11 pose estimation model file
            # line_width=2,  # Adjust the line width for bounding boxes and text display
        )
        # Process video
        while cap.isOpened():
            success, im0 = cap.read()
            if not success:
--- a/docs/en/index.md
+++ b/docs/en/index.md
@ -20,7 +20,7 @@ keywords: Ultralytics, YOLO, YOLO11, object detection, image segmentation, deep
 <br>
 <br>
    <a href="https://github.com/ultralytics/ultralytics/actions/workflows/ci.yaml"><img src="https://github.com/ultralytics/ultralytics/actions/workflows/ci.yaml/badge.svg" alt="Ultralytics CI"></a>
-    <a href="https://pepy.tech/project/ultralytics"><img src="https://static.pepy.tech/badge/ultralytics" alt="Ultralytics Downloads"></a>
+    <a href="https://www.pepy.tech/projects/ultralytics"><img src="https://static.pepy.tech/badge/ultralytics" alt="Ultralytics Downloads"></a>
    <a href="https://zenodo.org/badge/latestdoi/264818686"><img src="https://zenodo.org/badge/264818686.svg" alt="Ultralytics YOLO Citation"></a>
    <a href="https://discord.com/invite/ultralytics"><img alt="Ultralytics Discord" src="https://img.shields.io/discord/1089800235347353640?logo=discord&logoColor=white&label=Discord&color=blue"></a>
    <a href="https://community.ultralytics.com/"><img alt="Ultralytics Forums" src="https://img.shields.io/discourse/users?server=https%3A%2F%2Fcommunity.ultralytics.com&logo=discourse&label=Forums&color=blue"></a>
--- a/docs/en/integrations/albumentations.md
+++ b/docs/en/integrations/albumentations.md
@ -158,3 +158,42 @@ If you are interested in learning more about Albumentations, check out the follo
 In this guide, we explored the key aspects of Albumentations, a great Python library for image augmentation. We discussed its wide range of transformations, optimized performance, and how you can use it in your next YOLO11 project.
 Also, if you'd like to know more about other Ultralytics YOLO11 integrations, visit our [integration guide page](../integrations/index.md). You'll find valuable resources and insights there.
 ## FAQ
 ### How can I integrate Albumentations with YOLO11 for improved data augmentation?
 Albumentations integrates seamlessly with YOLO11 and applies automatically during training if you have the package installed. Here's how to get started:
 ```python
 # Install required packages
 # !pip install albumentations ultralytics
 from ultralytics import YOLO
 # Load and train model with automatic augmentations
 model = YOLO("yolo11n.pt")
 model.train(data="coco8.yaml", epochs=100)
 ```
 The integration includes optimized augmentations like blur, median blur, grayscale conversion, and CLAHE with carefully tuned probabilities to enhance model performance.
 ### What are the key benefits of using Albumentations over other augmentation libraries?
 Albumentations stands out for several reasons:
 1. Performance: Built on OpenCV and NumPy with SIMD optimization for superior speed
 2. Flexibility: Supports 70+ transformations across pixel-level, spatial-level, and mixing-level augmentations
 3. Compatibility: Works seamlessly with popular frameworks like [PyTorch](../integrations/torchscript.md) and [TensorFlow](../integrations/tensorboard.md)
 4. Reliability: Extensive test suite prevents silent data corruption
 5. Ease of use: Single unified API for all augmentation types
 ### What types of computer vision tasks can benefit from Albumentations augmentation?
 Albumentations enhances various [computer vision tasks](../tasks/index.md) including:
 - [Object Detection](../tasks/detect.md): Improves model robustness to lighting, scale, and orientation variations
 - [Instance Segmentation](../tasks/segment.md): Enhances mask prediction accuracy through diverse transformations
 - [Classification](../tasks/classify.md): Increases model generalization with color and geometric augmentations
 - [Pose Estimation](../tasks/pose.md): Helps models adapt to different viewpoints and lighting conditions
 The library's diverse augmentation options make it valuable for any vision task requiring robust model performance.
--- a/docs/en/integrations/index.md
+++ b/docs/en/integrations/index.md
@ -61,6 +61,8 @@ Welcome to the Ultralytics Integrations page! This page provides an overview of
 - [Albumentations](albumentations.md): Enhance your Ultralytics models with powerful image augmentations to improve model robustness and generalization.
 - [SONY IMX500](sony-imx500.md): Optimize and deploy [Ultralytics YOLOv8](https://docs.ultralytics.com/models/yolov8/) models on Raspberry Pi AI Cameras with the IMX500 sensor for fast, low-power performance.
 ## Deployment Integrations
 - [CoreML](coreml.md): CoreML, developed by [Apple](https://www.apple.com/), is a framework designed for efficiently integrating machine learning models into applications across iOS, macOS, watchOS, and tvOS, using Apple's hardware for effective and secure [model deployment](https://www.ultralytics.com/glossary/model-deployment).
--- a/docs/en/integrations/sony-imx500.md
+++ b/docs/en/integrations/sony-imx500.md
@ -0,0 +1,325 @@
 ---
 comments: true
 description: Learn to export Ultralytics YOLOv8 models to Sony's IMX500 format to optimize your models for efficient deployment.
 keywords: Sony, IMX500, IMX 500, Atrios, MCT, model export, quantization, pruning, deep learning optimization, Raspberry Pi AI Camera, edge AI, PyTorch, IMX
 ---
 # Sony IMX500 Export for Ultralytics YOLOv8
 This guide covers exporting and deploying Ultralytics YOLOv8 models to Raspberry Pi AI Cameras that feature the Sony IMX500 sensor.
 Deploying computer vision models on devices with limited computational power, such as [Raspberry Pi AI Camera](https://www.raspberrypi.com/products/ai-camera/), can be tricky. Using a model format optimized for faster performance makes a huge difference.
 The IMX500 model format is designed to use minimal power while delivering fast performance for neural networks. It allows you to optimize your [Ultralytics YOLOv8](https://github.com/ultralytics/ultralytics) models for high-speed and low-power inferencing. In this guide, we'll walk you through exporting and deploying your models to the IMX500 format while making it easier for your models to perform well on the [Raspberry Pi AI Camera](https://www.raspberrypi.com/products/ai-camera/).
 <p align="center">
  <img width="100%" src="https://github.com/ultralytics/assets/releases/download/v8.3.0/ai-camera.avif" alt="Raspberry Pi AI Camera">
 </p>
 ## Why Should You Export to IMX500
 Sony's [IMX500 Intelligent Vision Sensor](https://developer.aitrios.sony-semicon.com/en/raspberrypi-ai-camera) is a game-changing piece of hardware in edge AI processing. It's the world's first intelligent vision sensor with on-chip AI capabilities. This sensor helps overcome many challenges in edge AI, including data processing bottlenecks, privacy concerns, and performance limitations.  
 While other sensors merely pass along images and frames, the IMX500 tells a whole story. It processes data directly on the sensor, allowing devices to generate insights in real-time.
 ## Sony's IMX500 Export for YOLOv8 Models
 The IMX500 is designed to transform how devices handle data directly on the sensor, without needing to send it off to the cloud for processing.
 The IMX500 works with quantized models. Quantization makes models smaller and faster without losing much [accuracy](https://www.ultralytics.com/glossary/accuracy). It is ideal for the limited resources of edge computing, allowing applications to respond quickly by reducing latency and allowing for quick data processing locally, without cloud dependency. Local processing also keeps user data private and secure since it's not sent to a remote server.
 **IMX500 Key Features:**
 - **Metadata Output:** Instead of transmitting full images, the IMX500 outputs only metadata, minimizing data size, reducing bandwidth, and lowering costs.
 - **Addresses Privacy Concerns:** By processing data on the device, the IMX500 addresses privacy concerns, ideal for human-centric applications like person counting and occupancy tracking.
 - **Real-time Processing:** Fast, on-sensor processing supports real-time decisions, perfect for edge AI applications such as autonomous systems.
 **Before You Begin:** For best results, ensure your YOLOv8 model is well-prepared for export by following our [Model Training Guide](https://docs.ultralytics.com/modes/train/), [Data Preparation Guide](https://docs.ultralytics.com/datasets/), and [Hyperparameter Tuning Guide](https://docs.ultralytics.com/guides/hyperparameter-tuning/).
 ## Usage Examples
 Export an Ultralytics YOLOv8 model to IMX500 format and run inference with the exported model.
 !!! note
    Here we perform inference just to make sure the model works as expected. However, for deployment and inference on the Raspberry Pi AI Camera, please jump to [Using IMX500 Export in Deployment](#using-imx500-export-in-deployment) section.
 !!! example
    === "Python"
         ```python
         from ultralytics import YOLO
         # Load a YOLOv8n PyTorch model
         model = YOLO("yolov8n.pt")
         # Export the model
         model.export(format="imx")  # exports with PTQ quantization by default
         # Load the exported model
         imx_model = YOLO("yolov8n_imx_model")
         # Run inference
         results = imx_model("https://ultralytics.com/images/bus.jpg")
         ```
    === "CLI"
         ```bash
         # Export a YOLOv8n PyTorch model to imx format with Post-Training Quantization (PTQ)
         yolo export model=yolov8n.pt format=imx
         # Run inference with the exported model
         yolo predict model=yolov8n_imx_model source='https://ultralytics.com/images/bus.jpg'
         ```
 The export process will create an ONNX model for quantization validation, along with a directory named `<model-name>_imx_model`. This directory will include the `packerOut.zip` file, which is essential for packaging the model for deployment on the IMX500 hardware. Additionally, the `<model-name>_imx_model` folder will contain a text file (`labels.txt`) listing all the labels associated with the model.
 ```bash
 yolov8n_imx_model
 ├── dnnParams.xml
 ├── labels.txt
 ├── packerOut.zip
 ├── yolov8n_imx.onnx
 ├── yolov8n_imx500_model_MemoryReport.json
 └── yolov8n_imx500_model.pbtxt
 ```
 ## Arguments
 When exporting a model to IMX500 format, you can specify various arguments:
 | Key      | Value  | Description                                              |
 | -------- | ------ | -------------------------------------------------------- |
 | `format` | `imx`  | Format to export to (imx)                                |
 | `int8`   | `True` | Enable INT8 quantization for the model (default: `True`) |
 | `imgsz`  | `640`  | Image size for the model input (default: `640`)          |
 ## Using IMX500 Export in Deployment
 After exporting Ultralytics YOLOv8n model to IMX500 format, it can be deployed to Raspberry Pi AI Camera for inference.
 ### Hardware Prerequisites
 Make sure you have the below hardware:
 1. Raspberry Pi 5 or Raspberry Pi 4 Model B
 2. Raspberry Pi AI Camera
 Connect the Raspberry Pi AI camera to the 15-pin MIPI CSI connector on the Raspberry Pi and power on the Raspberry Pi
 ### Software Prerequisites
 !!! note
    This guide has been tested with Raspberry Pi OS Bookworm running on a Raspberry Pi 5
 Step 1: Open a terminal window and execute the following commands to update the Raspberry Pi software to the latest version.
 ```bash
 sudo apt update && sudo apt full-upgrade
 ```
 Step 2: Install IMX500 firmware which is required to operate the IMX500 sensor along with a packager tool.
 ```bash
 sudo apt install imx500-all imx500-tools
 ```
 Step 3: Install prerequisites to run `picamera2` application. We will use this application later for the deployment process.
 ```bash
 sudo apt install python3-opencv python3-munkres
 ```
 Step 4: Reboot Raspberry Pi for the changes to take into effect
 ```bash
 sudo reboot
 ```
 ### Package Model and Deploy to AI Camera
 After obtaining `packerOut.zip` from the IMX500 conversion process, you can pass this file into the packager tool to obtain an RPK file. This file can then be deployed directly to the AI Camera using `picamera2`.
 Step 1: Package the model into RPK file
 ```bash
 imx500-package -i <path to packerOut.zip> -o <output folder>
 ```
 The above will generate a `network.rpk` file inside the specified output folder.
 Step 2: Clone `picamera2` repository, install it and navigate to the imx500 examples
 ```bash
 git clone -b next https://github.com/raspberrypi/picamera2
 cd picamera2
 pip install -e .  --break-system-packages
 cd examples/imx500
 ```
 Step 3: Run YOLOv8 object detection, using the labels.txt file that has been generated during the IMX500 export.
 ```bash
 python imx500_object_detection_demo.py --model <path to network.rpk> --fps 25 --bbox-normalization --ignore-dash-labels --bbox-order xy –labels <path to labels.txt>
 ```
 Then you will be able to see live inference output as follows
 <p align="center">
  <img width="100%" src="https://github.com/ultralytics/assets/releases/download/v8.3.0/imx500-inference-rpi.avif" alt="Inference on Raspberry Pi AI Camera">
 </p>
 ## Benchmarks
 YOLOv8 benchmarks below were run by the Ultralytics team on Raspberry Pi AI Camera with `imx` model format measuring speed and accuracy.
 | Model   | Format | Status | Size (MB) | mAP50-95(B) | Inference time (ms/im) |
 | ------- | ------ | ------ | --------- | ----------- | ---------------------- |
 | YOLOv8n | imx    | ✅     | 2.9       | 0.522       | 66.66                  |
 !!! note
    Validation for the above benchmark was done using coco8 dataset
 ## What's Under the Hood?
 <p align="center">
  <img width="640" src="https://github.com/ultralytics/assets/releases/download/v8.3.0/imx500-deploy.avif" alt="IMX500 deployment">
 </p>
 ### Sony Model Compression Toolkit (MCT)
 [Sony's Model Compression Toolkit (MCT)](https://github.com/sony/model_optimization) is a powerful tool for optimizing deep learning models through quantization and pruning. It supports various quantization methods and provides advanced algorithms to reduce model size and computational complexity without significantly sacrificing accuracy. MCT is particularly useful for deploying models on resource-constrained devices, ensuring efficient inference and reduced latency.
 ### Supported Features of MCT
 Sony's MCT offers a range of features designed to optimize neural network models:
 1. **Graph Optimizations**: Transforms models into more efficient versions by folding layers like batch normalization into preceding layers.
 2. **Quantization Parameter Search**: Minimizes quantization noise using metrics like Mean-Square-Error, No-Clipping, and Mean-Average-Error.
 3. **Advanced Quantization Algorithms**:
    - **Shift Negative Correction**: Addresses performance issues from symmetric activation quantization.
    - **Outliers Filtering**: Uses z-score to detect and remove outliers.
    - **Clustering**: Utilizes non-uniform quantization grids for better distribution matching.
    - **Mixed-Precision Search**: Assigns different quantization bit-widths per layer based on sensitivity.
 4. **Visualization**: Use TensorBoard to observe model performance insights, quantization phases, and bit-width configurations.
 #### Quantization
 MCT supports several quantization methods to reduce model size and improve inference speed:
 1. **Post-Training Quantization (PTQ)**:
    - Available via Keras and PyTorch APIs.
    - Complexity: Low
    - Computational Cost: Low (CPU minutes)
 2. **Gradient-based Post-Training Quantization (GPTQ)**:
    - Available via Keras and PyTorch APIs.
    - Complexity: Medium
    - Computational Cost: Moderate (2-3 GPU hours)
 3. **Quantization-Aware Training (QAT)**:
    - Complexity: High
    - Computational Cost: High (12-36 GPU hours)
 MCT also supports various quantization schemes for weights and activations:
 1. Power-of-Two (hardware-friendly)
 2. Symmetric
 3. Uniform
 #### Structured Pruning
 MCT introduces structured, hardware-aware model pruning designed for specific hardware architectures. This technique leverages the target platform's Single Instruction, Multiple Data (SIMD) capabilities by pruning SIMD groups. This reduces model size and complexity while optimizing channel utilization, aligned with the SIMD architecture for targeted resource utilization of weights memory footprint. Available via Keras and PyTorch APIs.
 ### IMX500 Converter Tool (Compiler)
 The IMX500 Converter Tool is integral to the IMX500 toolset, allowing the compilation of models for deployment on Sony's IMX500 sensor (for instance, Raspberry Pi AI Cameras). This tool facilitates the transition of Ultralytics YOLOv8 models processed through Ultralytics software, ensuring they are compatible and perform efficiently on the specified hardware. The export procedure following model quantization involves the generation of binary files that encapsulate essential data and device-specific configurations, streamlining the deployment process on the Raspberry Pi AI Camera.
 ## Real-World Use Cases
 Export to IMX500 format has wide applicability across industries. Here are some examples:
 - **Edge AI and IoT**: Enable object detection on drones or security cameras, where real-time processing on low-power devices is essential.
 - **Wearable Devices**: Deploy models optimized for small-scale AI processing on health-monitoring wearables.
 - **Smart Cities**: Use IMX500-exported YOLOv8 models for traffic monitoring and safety analysis with faster processing and minimal latency.
 - **Retail Analytics**: Enhance in-store monitoring by deploying optimized models in point-of-sale systems or smart shelves.
 ## Conclusion
 Exporting Ultralytics YOLOv8 models to Sony's IMX500 format allows you to deploy your models for efficient inference on IMX500-based cameras. By leveraging advanced quantization and pruning techniques, you can reduce model size and improve inference speed without significantly compromising accuracy.
 For more information and detailed guidelines, refer to Sony's [IMX500 website](https://developer.aitrios.sony-semicon.com/en/raspberrypi-ai-camera).
 ## FAQ
 ### How do I export a YOLOv8 model to IMX500 format for Raspberry Pi AI Camera?
 To export a YOLOv8 model to IMX500 format, use either the Python API or CLI command:
 ```python
 from ultralytics import YOLO
 model = YOLO("yolov8n.pt")
 model.export(format="imx")  # Exports with PTQ quantization by default
 ```
 The export process will create a directory containing the necessary files for deployment, including `packerOut.zip` which can be used with the IMX500 packager tool on Raspberry Pi.
 ### What are the key benefits of using the IMX500 format for edge AI deployment?
 The IMX500 format offers several important advantages for edge deployment:
 - On-chip AI processing reduces latency and power consumption
 - Outputs metadata instead of full images, minimizing bandwidth usage
 - Enhanced privacy by processing data locally without cloud dependency
 - Real-time processing capabilities ideal for time-sensitive applications
 - Optimized quantization for efficient model deployment on resource-constrained devices
 ### What hardware and software prerequisites are needed for IMX500 deployment?
 For deploying IMX500 models, you'll need:
 Hardware:
 - Raspberry Pi 5 or Raspberry Pi 4 Model B
 - Raspberry Pi AI Camera with IMX500 sensor
 Software:
 - Raspberry Pi OS Bookworm
 - IMX500 firmware and tools (`sudo apt install imx500-all imx500-tools`)
 - Python packages for `picamera2` (`sudo apt install python3-opencv python3-munkres`)
 ### What performance can I expect from YOLOv8 models on the IMX500?
 Based on Ultralytics benchmarks on Raspberry Pi AI Camera:
 - YOLOv8n achieves 66.66ms inference time per image
 - mAP50-95 of 0.522 on COCO8 dataset
 - Model size of only 2.9MB after quantization
 This demonstrates that IMX500 format provides efficient real-time inference while maintaining good accuracy for edge AI applications.
 ### How do I package and deploy my exported model to the Raspberry Pi AI Camera?
 After exporting to IMX500 format:
 1. Use the packager tool to create an RPK file:
    ```bash
    imx500-package -i <path to packerOut.zip> -o <output folder>
    ```
 2. Clone and install picamera2:
    ```bash
    git clone -b next https://github.com/raspberrypi/picamera2
    cd picamera2 && pip install -e . --break-system-packages
    ```
 3. Run inference using the generated RPK file:
    ```bash
    python imx500_object_detection_demo.py --model <path to network.rpk> --fps 25 --bbox-normalization --labels <path to labels.txt>
    ```
--- a/docs/en/macros/export-table.md
+++ b/docs/en/macros/export-table.md
@ -14,3 +14,4 @@
 | [PaddlePaddle](../integrations/paddlepaddle.md)   | `paddle`          | `{{ model_name or "yolo11n" }}_paddle_model/`   | ✅       | `imgsz`, `batch`                                                     |
 | [MNN](../integrations/mnn.md)                     | `mnn`             | `{{ model_name or "yolo11n" }}.mnn`             | ✅       | `imgsz`, `batch`, `int8`, `half`                                     |
 | [NCNN](../integrations/ncnn.md)                   | `ncnn`            | `{{ model_name or "yolo11n" }}_ncnn_model/`     | ✅       | `imgsz`, `half`, `batch`                                             |
 | [IMX500](../integrations/sony-imx500.md)          | `imx`             | `{{ model_name or "yolo11n" }}_imx_model/`      | ✅       | `imgsz`, `int8`                                                      |
--- a/docs/en/macros/validation-args.md
+++ b/docs/en/macros/validation-args.md
@ -12,7 +12,7 @@
 | `device`      | `str`   | `None`  | Specifies the device for validation (`cpu`, `cuda:0`, etc.). Allows flexibility in utilizing CPU or GPU resources.                                                                                                                    |
 | `dnn`         | `bool`  | `False` | If `True`, uses the [OpenCV](https://www.ultralytics.com/glossary/opencv) DNN module for ONNX model inference, offering an alternative to [PyTorch](https://www.ultralytics.com/glossary/pytorch) inference methods.                  |
 | `plots`       | `bool`  | `False` | When set to `True`, generates and saves plots of predictions versus ground truth for visual evaluation of the model's performance.                                                                                                    |
-| `rect`        | `bool`  | `False` | If `True`, uses rectangular inference for batching, reducing padding and potentially increasing speed and efficiency.                                                                                                                 |
+| `rect`        | `bool`  | `True`  | If `True`, uses rectangular inference for batching, reducing padding and potentially increasing speed and efficiency.                                                                                                                 |
 | `split`       | `str`   | `val`   | Determines the dataset split to use for validation (`val`, `test`, or `train`). Allows flexibility in choosing the data segment for performance evaluation.                                                                           |
 | `project`     | `str`   | `None`  | Name of the project directory where validation outputs are saved.                                                                                                                                                                     |
 | `name`        | `str`   | `None`  | Name of the validation run. Used for creating a subdirectory within the project folder, where valdiation logs and outputs are stored.                                                                                                 |
--- a/docs/en/models/yolo11.md
+++ b/docs/en/models/yolo11.md
@ -130,7 +130,7 @@ Note that the example below is for YOLO11 [Detect](../tasks/detect.md) models fo
 !!! tip "Ultralytics YOLO11 Publication"
-    Ultralytics has not published a formal research paper for YOLO11 due to the rapidly evolving nature of the models. We focus on advancing the technology and making it easier to use, rather than producing static documentation. For the most up-to-date information on YOLO architecture, features, and usage, please refer to our [GitHub repository](https://github.com/ultralytics/ultralytics) and [documentation](https://docs.ultralytics.com).
+    Ultralytics has not published a formal research paper for YOLO11 due to the rapidly evolving nature of the models. We focus on advancing the technology and making it easier to use, rather than producing static documentation. For the most up-to-date information on YOLO architecture, features, and usage, please refer to our [GitHub repository](https://github.com/ultralytics/ultralytics) and [documentation](https://docs.ultralytics.com/).
 If you use YOLO11 or any other software from this repository in your work, please cite it using the following format:
--- a/docs/en/models/yolov5.md
+++ b/docs/en/models/yolov5.md
@ -94,7 +94,7 @@ This example provides simple YOLOv5 training and inference examples. For full do
 !!! tip "Ultralytics YOLOv5 Publication"
-    Ultralytics has not published a formal research paper for YOLOv5 due to the rapidly evolving nature of the models. We focus on advancing the technology and making it easier to use, rather than producing static documentation. For the most up-to-date information on YOLO architecture, features, and usage, please refer to our [GitHub repository](https://github.com/ultralytics/ultralytics) and [documentation](https://docs.ultralytics.com).
+    Ultralytics has not published a formal research paper for YOLOv5 due to the rapidly evolving nature of the models. We focus on advancing the technology and making it easier to use, rather than producing static documentation. For the most up-to-date information on YOLO architecture, features, and usage, please refer to our [GitHub repository](https://github.com/ultralytics/ultralytics) and [documentation](https://docs.ultralytics.com/).
 If you use YOLOv5 or YOLOv5u in your research, please cite the Ultralytics YOLOv5 repository as follows:
--- a/docs/en/models/yolov8.md
+++ b/docs/en/models/yolov8.md
@ -167,7 +167,7 @@ Note the below example is for YOLOv8 [Detect](../tasks/detect.md) models for obj
 !!! tip "Ultralytics YOLOv8 Publication"
-    Ultralytics has not published a formal research paper for YOLOv8 due to the rapidly evolving nature of the models. We focus on advancing the technology and making it easier to use, rather than producing static documentation. For the most up-to-date information on YOLO architecture, features, and usage, please refer to our [GitHub repository](https://github.com/ultralytics/ultralytics) and [documentation](https://docs.ultralytics.com).
+    Ultralytics has not published a formal research paper for YOLOv8 due to the rapidly evolving nature of the models. We focus on advancing the technology and making it easier to use, rather than producing static documentation. For the most up-to-date information on YOLO architecture, features, and usage, please refer to our [GitHub repository](https://github.com/ultralytics/ultralytics) and [documentation](https://docs.ultralytics.com/).
 If you use the YOLOv8 model or any other software from this repository in your work, please cite it using the following format:
--- a/docs/en/quickstart.md
+++ b/docs/en/quickstart.md
@ -28,7 +28,7 @@ Ultralytics provides various installation methods including pip, conda, and Dock
        Install the `ultralytics` package using pip, or update an existing installation by running `pip install -U ultralytics`. Visit the Python Package Index (PyPI) for more details on the `ultralytics` package: [https://pypi.org/project/ultralytics/](https://pypi.org/project/ultralytics/).
        [![PyPI - Version](https://img.shields.io/pypi/v/ultralytics?logo=pypi&logoColor=white)](https://pypi.org/project/ultralytics/)
-        [![Downloads](https://static.pepy.tech/badge/ultralytics)](https://pepy.tech/project/ultralytics)
+        [![Downloads](https://static.pepy.tech/badge/ultralytics)](https://www.pepy.tech/projects/ultralytics)
        ```bash
        # Install the ultralytics package from PyPI
--- a/docs/en/reference/utils/torch_utils.md
+++ b/docs/en/reference/utils/torch_utils.md
@ -19,6 +19,10 @@ keywords: Ultralytics, torch utils, model optimization, device selection, infere
 <br><br><hr><br>
 ## ::: ultralytics.utils.torch_utils.FXModel
 <br><br><hr><br>
 ## ::: ultralytics.utils.torch_utils.torch_distributed_zero_first
 <br><br><hr><br>
--- a/docs/mkdocs_github_authors.yaml
+++ b/docs/mkdocs_github_authors.yaml
@ -109,6 +109,9 @@ chr043416@gmail.com:
 davis.justin@mssm.org:
  avatar: https://avatars.githubusercontent.com/u/23462437?v=4
  username: justincdavis
 francesco.mttl@gmail.com:
  avatar: https://avatars.githubusercontent.com/u/3855193?v=4
  username: ambitious-octopus
 glenn.jocher@ultralytics.com:
  avatar: https://avatars.githubusercontent.com/u/26833433?v=4
  username: glenn-jocher
--- a/docs/overrides/javascript/extra.js
+++ b/docs/overrides/javascript/extra.js
@ -47,7 +47,9 @@ checkAutoTheme();
 document.addEventListener("DOMContentLoaded", () => {
  const autoThemeInput = document.getElementById("__palette_1");
  autoThemeInput?.addEventListener("click", () => {
-    if (autoThemeInput.checked) setTimeout(checkAutoTheme);
+    if (autoThemeInput.checked) {
      setTimeout(checkAutoTheme);
    }
  });
 });
@ -165,7 +167,9 @@ let chart = null;  // chart variable will hold the reference to the current char
 // This function is responsible for updating the benchmarks chart.
 function updateChart() {
    // If a chart instance already exists, destroy it.
-    if (chart) chart.destroy();
+    if (chart) {
      chart.destroy();
    }
    // Get the selected algorithms from the checkboxes.
    const selectedAlgorithms = [...document.querySelectorAll('input[name="algorithm"]:checked')].map(e => e.value);
@ -187,7 +191,9 @@ function updateChart() {
    }));
    // If there are no selected algorithms, return without creating a new chart.
-    if (datasets.length === 0) return;
+    if (datasets.length === 0) {
      return;
    }
    // Create a new chart instance.
    chart = new Chart(document.getElementById('chart').getContext('2d'), {
--- a/docs/overrides/javascript/giscus.js
+++ b/docs/overrides/javascript/giscus.js
@ -1,7 +1,9 @@
 // Giscus functionality
 function loadGiscus() {
  const giscusContainer = document.getElementById("giscus-container");
-  if (!giscusContainer || giscusContainer.querySelector("script")) return;
+  if (!giscusContainer || giscusContainer.querySelector("script")) {
    return;
  }
  const script = document.createElement("script");
  script.src = "https://giscus.app/client.js";
--- a/examples/heatmaps.ipynb
+++ b/examples/heatmaps.ipynb
@ -38,7 +38,7 @@
    "\n",
    "Pip install `ultralytics` and [dependencies](https://github.com/ultralytics/ultralytics/blob/main/pyproject.toml) and check software and hardware.\n",
    "\n",
-    "[![PyPI - Version](https://img.shields.io/pypi/v/ultralytics?logo=pypi&logoColor=white)](https://pypi.org/project/ultralytics/) [![Downloads](https://static.pepy.tech/badge/ultralytics)](https://pepy.tech/project/ultralytics) [![PyPI - Python Version](https://img.shields.io/pypi/pyversions/ultralytics?logo=python&logoColor=gold)](https://pypi.org/project/ultralytics/)"
+    "[![PyPI - Version](https://img.shields.io/pypi/v/ultralytics?logo=pypi&logoColor=white)](https://pypi.org/project/ultralytics/) [![Downloads](https://static.pepy.tech/badge/ultralytics)](https://www.pepy.tech/projects/ultralytics) [![PyPI - Python Version](https://img.shields.io/pypi/pyversions/ultralytics?logo=python&logoColor=gold)](https://pypi.org/project/ultralytics/)"
   ]
  },
  {
--- a/examples/hub.ipynb
+++ b/examples/hub.ipynb
@ -36,7 +36,7 @@
    "\n",
    "Pip install `ultralytics` and [dependencies](https://github.com/ultralytics/ultralytics/blob/main/pyproject.toml) and check software and hardware.\n",
    "\n",
-    "[![PyPI - Version](https://img.shields.io/pypi/v/ultralytics?logo=pypi&logoColor=white)](https://pypi.org/project/ultralytics/) [![Downloads](https://static.pepy.tech/badge/ultralytics)](https://pepy.tech/project/ultralytics) [![PyPI - Python Version](https://img.shields.io/pypi/pyversions/ultralytics?logo=python&logoColor=gold)](https://pypi.org/project/ultralytics/)"
+    "[![PyPI - Version](https://img.shields.io/pypi/v/ultralytics?logo=pypi&logoColor=white)](https://pypi.org/project/ultralytics/) [![Downloads](https://static.pepy.tech/badge/ultralytics)](https://www.pepy.tech/projects/ultralytics) [![PyPI - Python Version](https://img.shields.io/pypi/pyversions/ultralytics?logo=python&logoColor=gold)](https://pypi.org/project/ultralytics/)"
   ]
  },
  {
--- a/examples/object_counting.ipynb
+++ b/examples/object_counting.ipynb
@ -38,7 +38,7 @@
    "\n",
    "Pip install `ultralytics` and [dependencies](https://github.com/ultralytics/ultralytics/blob/main/pyproject.toml) and check software and hardware.\n",
    "\n",
-    "[![PyPI - Version](https://img.shields.io/pypi/v/ultralytics?logo=pypi&logoColor=white)](https://pypi.org/project/ultralytics/) [![Downloads](https://static.pepy.tech/badge/ultralytics)](https://pepy.tech/project/ultralytics) [![PyPI - Python Version](https://img.shields.io/pypi/pyversions/ultralytics?logo=python&logoColor=gold)](https://pypi.org/project/ultralytics/)"
+    "[![PyPI - Version](https://img.shields.io/pypi/v/ultralytics?logo=pypi&logoColor=white)](https://pypi.org/project/ultralytics/) [![Downloads](https://static.pepy.tech/badge/ultralytics)](https://www.pepy.tech/projects/ultralytics) [![PyPI - Python Version](https://img.shields.io/pypi/pyversions/ultralytics?logo=python&logoColor=gold)](https://pypi.org/project/ultralytics/)"
   ]
  },
  {
--- a/examples/object_tracking.ipynb
+++ b/examples/object_tracking.ipynb
@ -38,7 +38,7 @@
    "\n",
    "Pip install `ultralytics` and [dependencies](https://github.com/ultralytics/ultralytics/blob/main/pyproject.toml) and check software and hardware.\n",
    "\n",
-    "[![PyPI - Version](https://img.shields.io/pypi/v/ultralytics?logo=pypi&logoColor=white)](https://pypi.org/project/ultralytics/) [![Downloads](https://static.pepy.tech/badge/ultralytics)](https://pepy.tech/project/ultralytics) [![PyPI - Python Version](https://img.shields.io/pypi/pyversions/ultralytics?logo=python&logoColor=gold)](https://pypi.org/project/ultralytics/)"
+    "[![PyPI - Version](https://img.shields.io/pypi/v/ultralytics?logo=pypi&logoColor=white)](https://pypi.org/project/ultralytics/) [![Downloads](https://static.pepy.tech/badge/ultralytics)](https://www.pepy.tech/projects/ultralytics) [![PyPI - Python Version](https://img.shields.io/pypi/pyversions/ultralytics?logo=python&logoColor=gold)](https://pypi.org/project/ultralytics/)"
   ]
  },
  {
--- a/examples/tutorial.ipynb
+++ b/examples/tutorial.ipynb
@ -55,7 +55,7 @@
        "\n",
        "Pip install `ultralytics` and [dependencies](https://github.com/ultralytics/ultralytics/blob/main/pyproject.toml) and check software and hardware.\n",
        "\n",
-        "[![PyPI - Version](https://img.shields.io/pypi/v/ultralytics?logo=pypi&logoColor=white)](https://pypi.org/project/ultralytics/) [![Downloads](https://static.pepy.tech/badge/ultralytics)](https://pepy.tech/project/ultralytics) [![PyPI - Python Version](https://img.shields.io/pypi/pyversions/ultralytics?logo=python&logoColor=gold)](https://pypi.org/project/ultralytics/)"
+        "[![PyPI - Version](https://img.shields.io/pypi/v/ultralytics?logo=pypi&logoColor=white)](https://pypi.org/project/ultralytics/) [![Downloads](https://static.pepy.tech/badge/ultralytics)](https://www.pepy.tech/projects/ultralytics) [![PyPI - Python Version](https://img.shields.io/pypi/pyversions/ultralytics?logo=python&logoColor=gold)](https://pypi.org/project/ultralytics/)"
      ]
    },
    {
--- a/mkdocs.yml
+++ b/mkdocs.yml
@ -412,12 +412,14 @@ nav:
      - TF.js: integrations/tfjs.md
      - TFLite: integrations/tflite.md
      - TFLite Edge TPU: integrations/edge-tpu.md
      - Sony IMX500: integrations/sony-imx500.md
      - TensorBoard: integrations/tensorboard.md
      - TensorRT: integrations/tensorrt.md
      - TorchScript: integrations/torchscript.md
      - VS Code: integrations/vscode.md
      - Weights & Biases: integrations/weights-biases.md
      - Albumentations: integrations/albumentations.md
      - SONY IMX500: integrations/sony-imx500.md
  - HUB:
      - hub/index.md
      - Web:
@ -559,7 +561,6 @@ nav:
              - utils: reference/nn/modules/utils.md
          - tasks: reference/nn/tasks.md
      - solutions:
          - solutions: reference/solutions/solutions.md
          - ai_gym: reference/solutions/ai_gym.md
          - analytics: reference/solutions/analytics.md
          - distance_calculation: reference/solutions/distance_calculation.md
@ -567,6 +568,7 @@ nav:
          - object_counter: reference/solutions/object_counter.md
          - parking_management: reference/solutions/parking_management.md
          - queue_management: reference/solutions/queue_management.md
          - solutions: reference/solutions/solutions.md
          - speed_estimation: reference/solutions/speed_estimation.md
          - streamlit_inference: reference/solutions/streamlit_inference.md
      - trackers:
--- a/tests/test_exports.py
+++ b/tests/test_exports.py
@ -205,3 +205,12 @@ def test_export_ncnn():
    """Test YOLO exports to NCNN format."""
    file = YOLO(MODEL).export(format="ncnn", imgsz=32)
    YOLO(file)(SOURCE, imgsz=32)  # exported model inference
@pytest.mark.skipif(True, reason="Test disabled as keras and tensorflow version conflicts with tflite export.")
@pytest.mark.skipif(not LINUX or MACOS, reason="Skipping test on Windows and Macos")
 def test_export_imx():
    """Test YOLOv8n exports to IMX format."""
    model = YOLO("yolov8n.pt")
    file = model.export(format="imx", imgsz=32)
    YOLO(file)(SOURCE, imgsz=32)
--- a/ultralytics/init.py
+++ b/ultralytics/init.py
@ -1,6 +1,6 @@
 # Ultralytics YOLO 🚀, AGPL-3.0 license
-__version__ = "8.3.28"
+__version__ = "8.3.29"
 import os
--- a/ultralytics/data/converter.py
+++ b/ultralytics/data/converter.py
@ -577,7 +577,7 @@ def merge_multi_segment(segments):
    return s
-def yolo_bbox2segment(im_dir, save_dir=None, sam_model="sam_b.pt"):
+def yolo_bbox2segment(im_dir, save_dir=None, sam_model="sam_b.pt", device=None):
    """
    Converts existing object detection dataset (bounding boxes) to segmentation dataset or oriented bounding box (OBB)
    in YOLO format. Generates segmentation data using SAM auto-annotator as needed.
@ -587,6 +587,7 @@ def yolo_bbox2segment(im_dir, save_dir=None, sam_model="sam_b.pt"):
        save_dir (str | Path): Path to save the generated labels, labels will be saved
            into `labels-segment` in the same directory level of `im_dir` if save_dir is None. Default: None.
        sam_model (str): Segmentation model to use for intermediate segmentation data; optional.
        device (int | str): The specific device to run SAM models. Default: None.
    Notes:
        The input directory structure assumed for dataset:
@ -621,7 +622,7 @@ def yolo_bbox2segment(im_dir, save_dir=None, sam_model="sam_b.pt"):
        boxes[:, [0, 2]] *= w
        boxes[:, [1, 3]] *= h
        im = cv2.imread(label["im_file"])
-        sam_results = sam_model(im, bboxes=xywh2xyxy(boxes), verbose=False, save=False)
+        sam_results = sam_model(im, bboxes=xywh2xyxy(boxes), verbose=False, save=False, device=device)
        label["segments"] = sam_results[0].masks.xyn
    save_dir = Path(save_dir) if save_dir else Path(im_dir).parent / "labels-segment"
--- a/ultralytics/engine/exporter.py
+++ b/ultralytics/engine/exporter.py
@ -18,6 +18,7 @@ TensorFlow.js           | `tfjs`                    | yolo11n_web_model/
 PaddlePaddle            | `paddle`                  | yolo11n_paddle_model/
 MNN                     | `mnn`                     | yolo11n.mnn
 NCNN                    | `ncnn`                    | yolo11n_ncnn_model/
 IMX                     | `imx`                     | yolo11n_imx_model/
 Requirements:
    $ pip install "ultralytics[export]"
@ -44,6 +45,7 @@ Inference:
                         yolo11n_paddle_model       # PaddlePaddle
                         yolo11n.mnn                # MNN
                         yolo11n_ncnn_model         # NCNN
                         yolo11n_imx_model          # IMX
 TensorFlow.js:
    $ cd .. && git clone https://github.com/zldrobit/tfjs-yolov5-example.git && cd tfjs-yolov5-example
@ -94,7 +96,7 @@ from ultralytics.utils.checks import check_imgsz, check_is_path_safe, check_requ
 from ultralytics.utils.downloads import attempt_download_asset, get_github_assets, safe_download
 from ultralytics.utils.files import file_size, spaces_in_path
 from ultralytics.utils.ops import Profile
-from ultralytics.utils.torch_utils import TORCH_1_13, get_latest_opset, select_device, smart_inference_mode
+from ultralytics.utils.torch_utils import TORCH_1_13, get_latest_opset, select_device
 def export_formats():
@ -114,6 +116,7 @@ def export_formats():
        ["PaddlePaddle", "paddle", "_paddle_model", True, True],
        ["MNN", "mnn", ".mnn", True, True],
        ["NCNN", "ncnn", "_ncnn_model", True, True],
        ["IMX", "imx", "_imx_model", True, True],
    ]
    return dict(zip(["Format", "Argument", "Suffix", "CPU", "GPU"], zip(*x)))
@ -171,7 +174,6 @@ class Exporter:
        self.callbacks = _callbacks or callbacks.get_default_callbacks()
        callbacks.add_integration_callbacks(self)
    @smart_inference_mode()
    def __call__(self, model=None) -> str:
        """Returns list of exported files/dirs after running callbacks."""
        self.run_callbacks("on_export_start")
@ -194,9 +196,22 @@ class Exporter:
        flags = [x == fmt for x in fmts]
        if sum(flags) != 1:
            raise ValueError(f"Invalid export format='{fmt}'. Valid formats are {fmts}")
-        jit, onnx, xml, engine, coreml, saved_model, pb, tflite, edgetpu, tfjs, paddle, mnn, ncnn = (
+        (
-            flags  # export booleans
+            jit,
-        )
+            onnx,
            xml,
            engine,
            coreml,
            saved_model,
            pb,
            tflite,
            edgetpu,
            tfjs,
            paddle,
            mnn,
            ncnn,
            imx,
        ) = flags  # export booleans
        is_tf_format = any((saved_model, pb, tflite, edgetpu, tfjs))
        # Device
@ -210,6 +225,9 @@ class Exporter:
        self.device = select_device("cpu" if self.args.device is None else self.args.device)
        # Checks
        if imx and not self.args.int8:
            LOGGER.warning("WARNING ⚠️ IMX only supports int8 export, setting int8=True.")
            self.args.int8 = True
        if not hasattr(model, "names"):
            model.names = default_class_names()
        model.names = check_class_names(model.names)
@ -249,6 +267,7 @@ class Exporter:
            )
        if mnn and (IS_RASPBERRYPI or IS_JETSON):
            raise SystemError("MNN export not supported on Raspberry Pi and NVIDIA Jetson")
        # Input
        im = torch.zeros(self.args.batch, 3, *self.imgsz).to(self.device)
        file = Path(
@ -264,6 +283,11 @@ class Exporter:
        model.eval()
        model.float()
        model = model.fuse()
        if imx:
            from ultralytics.utils.torch_utils import FXModel
            model = FXModel(model)
        for m in model.modules():
            if isinstance(m, (Detect, RTDETRDecoder)):  # includes all Detect subclasses like Segment, Pose, OBB
                m.dynamic = self.args.dynamic
@ -273,6 +297,15 @@ class Exporter:
            elif isinstance(m, C2f) and not is_tf_format:
                # EdgeTPU does not support FlexSplitV while split provides cleaner ONNX graph
                m.forward = m.forward_split
            if isinstance(m, Detect) and imx:
                from ultralytics.utils.tal import make_anchors
                m.anchors, m.strides = (
                    x.transpose(0, 1)
                    for x in make_anchors(
                        torch.cat([s / m.stride.unsqueeze(-1) for s in self.imgsz], dim=1), m.stride, 0.5
                    )
                )
        y = None
        for _ in range(2):
@ -347,6 +380,8 @@ class Exporter:
            f[11], _ = self.export_mnn()
        if ncnn:  # NCNN
            f[12], _ = self.export_ncnn()
        if imx:
            f[13], _ = self.export_imx()
        # Finish
        f = [str(x) for x in f if x]  # filter out '' and None
@ -568,8 +603,7 @@ class Exporter:
        f = str(self.file.with_suffix(".mnn"))  # MNN model file
        args = ["", "-f", "ONNX", "--modelFile", f_onnx, "--MNNModel", f, "--bizCode", json.dumps(self.metadata)]
        if self.args.int8:
-            args.append("--weightQuantBits")
+            args.extend(("--weightQuantBits", "8"))
            args.append("8")
        if self.args.half:
            args.append("--fp16")
        mnnconvert.convert(args)
@ -1069,6 +1103,137 @@ class Exporter:
        yaml_save(Path(f) / "metadata.yaml", self.metadata)  # add metadata.yaml
        return f, None
    @try_export
    def export_imx(self, prefix=colorstr("IMX:")):
        """YOLO IMX export."""
        gptq = False
        assert LINUX, "export only supported on Linux. See https://developer.aitrios.sony-semicon.com/en/raspberrypi-ai-camera/documentation/imx500-converter"
        if getattr(self.model, "end2end", False):
            raise ValueError("IMX export is not supported for end2end models.")
        if "C2f" not in self.model.__str__():
            raise ValueError("IMX export is only supported for YOLOv8 detection models")
        check_requirements(("model-compression-toolkit==2.1.1", "sony-custom-layers==0.2.0", "tensorflow==2.12.0"))
        check_requirements("imx500-converter[pt]==3.14.3")  # Separate requirements for imx500-converter
        import model_compression_toolkit as mct
        import onnx
        from sony_custom_layers.pytorch.object_detection.nms import multiclass_nms
        try:
            out = subprocess.run(
                ["java", "--version"], check=True, capture_output=True
            )  # Java 17 is required for imx500-converter
            if "openjdk 17" not in str(out.stdout):
                raise FileNotFoundError
        except FileNotFoundError:
            subprocess.run(["sudo", "apt", "install", "-y", "openjdk-17-jdk", "openjdk-17-jre"], check=True)
        def representative_dataset_gen(dataloader=self.get_int8_calibration_dataloader(prefix)):
            for batch in dataloader:
                img = batch["img"]
                img = img / 255.0
                yield [img]
        tpc = mct.get_target_platform_capabilities(
            fw_name="pytorch", target_platform_name="imx500", target_platform_version="v1"
        )
        config = mct.core.CoreConfig(
            mixed_precision_config=mct.core.MixedPrecisionQuantizationConfig(num_of_images=10),
            quantization_config=mct.core.QuantizationConfig(concat_threshold_update=True),
        )
        resource_utilization = mct.core.ResourceUtilization(weights_memory=3146176 * 0.76)
        quant_model = (
            mct.gptq.pytorch_gradient_post_training_quantization(  # Perform Gradient-Based Post Training Quantization
                model=self.model,
                representative_data_gen=representative_dataset_gen,
                target_resource_utilization=resource_utilization,
                gptq_config=mct.gptq.get_pytorch_gptq_config(n_epochs=1000, use_hessian_based_weights=False),
                core_config=config,
                target_platform_capabilities=tpc,
            )[0]
            if gptq
            else mct.ptq.pytorch_post_training_quantization(  # Perform post training quantization
                in_module=self.model,
                representative_data_gen=representative_dataset_gen,
                target_resource_utilization=resource_utilization,
                core_config=config,
                target_platform_capabilities=tpc,
            )[0]
        )
        class NMSWrapper(torch.nn.Module):
            def __init__(
                self,
                model: torch.nn.Module,
                score_threshold: float = 0.001,
                iou_threshold: float = 0.7,
                max_detections: int = 300,
            ):
                """
                Wrapping PyTorch Module with multiclass_nms layer from sony_custom_layers.
                Args:
                    model (nn.Module): Model instance.
                    score_threshold (float): Score threshold for non-maximum suppression.
                    iou_threshold (float): Intersection over union threshold for non-maximum suppression.
                    max_detections (float): The number of detections to return.
                """
                super().__init__()
                self.model = model
                self.score_threshold = score_threshold
                self.iou_threshold = iou_threshold
                self.max_detections = max_detections
            def forward(self, images):
                # model inference
                outputs = self.model(images)
                boxes = outputs[0]
                scores = outputs[1]
                nms = multiclass_nms(
                    boxes=boxes,
                    scores=scores,
                    score_threshold=self.score_threshold,
                    iou_threshold=self.iou_threshold,
                    max_detections=self.max_detections,
                )
                return nms
        quant_model = NMSWrapper(
            model=quant_model,
            score_threshold=self.args.conf or 0.001,
            iou_threshold=self.args.iou,
            max_detections=self.args.max_det,
        ).to(self.device)
        f = Path(str(self.file).replace(self.file.suffix, "_imx_model"))
        f.mkdir(exist_ok=True)
        onnx_model = f / Path(str(self.file).replace(self.file.suffix, "_imx.onnx"))  # js dir
        mct.exporter.pytorch_export_model(
            model=quant_model, save_model_path=onnx_model, repr_dataset=representative_dataset_gen
        )
        model_onnx = onnx.load(onnx_model)  # load onnx model
        for k, v in self.metadata.items():
            meta = model_onnx.metadata_props.add()
            meta.key, meta.value = k, str(v)
        onnx.save(model_onnx, onnx_model)
        subprocess.run(
            ["imxconv-pt", "-i", str(onnx_model), "-o", str(f), "--no-input-persistency", "--overwrite-output"],
            check=True,
        )
        # Needed for imx models.
        with open(f / "labels.txt", "w") as file:
            file.writelines([f"{name}\n" for _, name in self.model.names.items()])
        return f, None
    def _add_tflite_metadata(self, file):
        """Add metadata to *.tflite models per https://www.tensorflow.org/lite/models/convert/metadata."""
        import flatbuffers
--- a/ultralytics/engine/model.py
+++ b/ultralytics/engine/model.py
@ -2,7 +2,7 @@
 import inspect
 from pathlib import Path
-from typing import List, Union
+from typing import Dict, List, Union
 import numpy as np
 import torch
@ -881,7 +881,7 @@ class Model(nn.Module):
        return self
    @property
-    def names(self) -> list:
+    def names(self) -> Dict[int, str]:
        """
        Retrieves the class names associated with the loaded model.
--- a/ultralytics/engine/results.py
+++ b/ultralytics/engine/results.py
@ -535,9 +535,9 @@ class Results(SimpleClass):
        # Plot Detect results
        if pred_boxes is not None and show_boxes:
            for i, d in enumerate(reversed(pred_boxes)):
-                c, conf, id = int(d.cls), float(d.conf) if conf else None, None if d.id is None else int(d.id.item())
+                c, d_conf, id = int(d.cls), float(d.conf) if conf else None, None if d.id is None else int(d.id.item())
                name = ("" if id is None else f"id:{id} ") + names[c]
-                label = (f"{name} {conf:.2f}" if conf else name) if labels else None
+                label = (f"{name} {d_conf:.2f}" if conf else name) if labels else None
                box = d.xyxyxyxy.reshape(-1, 4, 2).squeeze() if is_obb else d.xyxy.squeeze()
                annotator.box_label(
                    box,
--- a/ultralytics/engine/trainer.py
+++ b/ultralytics/engine/trainer.py
@ -792,7 +792,7 @@ class BaseTrainer:
                    g[0].append(param)
        optimizers = {"Adam", "Adamax", "AdamW", "NAdam", "RAdam", "RMSProp", "SGD", "auto"}
-        name = {x.lower(): x for x in optimizers}.get(name.lower(), None)
+        name = {x.lower(): x for x in optimizers}.get(name.lower())
        if name in {"Adam", "Adamax", "AdamW", "NAdam", "RAdam"}:
            optimizer = getattr(optim, name, optim.Adam)(g[2], lr=lr, betas=(momentum, 0.999), weight_decay=0.0)
        elif name == "RMSProp":
--- a/ultralytics/nn/autobackend.py
+++ b/ultralytics/nn/autobackend.py
@ -123,6 +123,7 @@ class AutoBackend(nn.Module):
            paddle,
            mnn,
            ncnn,
            imx,
            triton,
        ) = self._model_type(w)
        fp16 &= pt or jit or onnx or xml or engine or nn_module or triton  # FP16
@ -182,8 +183,8 @@ class AutoBackend(nn.Module):
            check_requirements("opencv-python>=4.5.4")
            net = cv2.dnn.readNetFromONNX(w)
-        # ONNX Runtime
+        # ONNX Runtime and IMX
-        elif onnx:
+        elif onnx or imx:
            LOGGER.info(f"Loading {w} for ONNX Runtime inference...")
            check_requirements(("onnx", "onnxruntime-gpu" if cuda else "onnxruntime"))
            if IS_RASPBERRYPI or IS_JETSON:
@ -199,7 +200,22 @@ class AutoBackend(nn.Module):
                device = torch.device("cpu")
                cuda = False
            LOGGER.info(f"Preferring ONNX Runtime {providers[0]}")
            if onnx:
                session = onnxruntime.InferenceSession(w, providers=providers)
            else:
                check_requirements(
                    ["model-compression-toolkit==2.1.1", "sony-custom-layers[torch]==0.2.0", "onnxruntime-extensions"]
                )
                w = next(Path(w).glob("*.onnx"))
                LOGGER.info(f"Loading {w} for ONNX IMX inference...")
                import mct_quantizers as mctq
                from sony_custom_layers.pytorch.object_detection import nms_ort  # noqa
                session = onnxruntime.InferenceSession(
                    w, mctq.get_ort_session_options(), providers=["CPUExecutionProvider"]
                )
                task = "detect"
            output_names = [x.name for x in session.get_outputs()]
            metadata = session.get_modelmeta().custom_metadata_map
            dynamic = isinstance(session.get_outputs()[0].shape[0], str)
@ -520,7 +536,7 @@ class AutoBackend(nn.Module):
            y = self.net.forward()
        # ONNX Runtime
-        elif self.onnx:
+        elif self.onnx or self.imx:
            if self.dynamic:
                im = im.cpu().numpy()  # torch to numpy
                y = self.session.run(self.output_names, {self.session.get_inputs()[0].name: im})
@ -537,6 +553,9 @@ class AutoBackend(nn.Module):
                )
                self.session.run_with_iobinding(self.io)
                y = self.bindings
            if self.imx:
                # boxes, conf, cls
                y = np.concatenate([y[0], y[1][:, :, None], y[2][:, :, None]], axis=-1)
        # OpenVINO
        elif self.xml:
--- a/ultralytics/nn/modules/block.py
+++ b/ultralytics/nn/modules/block.py
@ -240,7 +240,8 @@ class C2f(nn.Module):
    def forward_split(self, x):
        """Forward pass using split() instead of chunk()."""
-        y = list(self.cv1(x).split((self.c, self.c), 1))
+        y = self.cv1(x).split((self.c, self.c), 1)
        y = [y[0], y[1]]
        y.extend(m(y[-1]) for m in self.m)
        return self.cv2(torch.cat(y, 1))
--- a/ultralytics/nn/modules/head.py
+++ b/ultralytics/nn/modules/head.py
@ -23,6 +23,7 @@ class Detect(nn.Module):
    dynamic = False  # force grid reconstruction
    export = False  # export mode
    format = None  # export format
    end2end = False  # end2end
    max_det = 300  # max_det
    shape = None
@ -101,7 +102,7 @@ class Detect(nn.Module):
        # Inference path
        shape = x[0].shape  # BCHW
        x_cat = torch.cat([xi.view(shape[0], self.no, -1) for xi in x], 2)
-        if self.dynamic or self.shape != shape:
+        if self.format != "imx" and (self.dynamic or self.shape != shape):
            self.anchors, self.strides = (x.transpose(0, 1) for x in make_anchors(x, self.stride, 0.5))
            self.shape = shape
@ -119,6 +120,11 @@ class Detect(nn.Module):
            grid_size = torch.tensor([grid_w, grid_h, grid_w, grid_h], device=box.device).reshape(1, 4, 1)
            norm = self.strides / (self.stride[0] * grid_size)
            dbox = self.decode_bboxes(self.dfl(box) * norm, self.anchors.unsqueeze(0) * norm[:, :2])
        elif self.export and self.format == "imx":
            dbox = self.decode_bboxes(
                self.dfl(box) * self.strides, self.anchors.unsqueeze(0) * self.strides, xywh=False
            )
            return dbox.transpose(1, 2), cls.sigmoid().permute(0, 2, 1)
        else:
            dbox = self.decode_bboxes(self.dfl(box), self.anchors.unsqueeze(0)) * self.strides
@ -137,9 +143,9 @@ class Detect(nn.Module):
                a[-1].bias.data[:] = 1.0  # box
                b[-1].bias.data[: m.nc] = math.log(5 / m.nc / (640 / s) ** 2)  # cls (.01 objects, 80 classes, 640 img)
-    def decode_bboxes(self, bboxes, anchors):
+    def decode_bboxes(self, bboxes, anchors, xywh=True):
        """Decode bounding boxes."""
-        return dist2bbox(bboxes, anchors, xywh=not self.end2end, dim=1)
+        return dist2bbox(bboxes, anchors, xywh=xywh and (not self.end2end), dim=1)
    @staticmethod
    def postprocess(preds: torch.Tensor, max_det: int, nc: int = 80):
--- a/ultralytics/solutions/solutions.py
+++ b/ultralytics/solutions/solutions.py
@ -72,8 +72,7 @@ class BaseSolution:
        self.model = YOLO(self.CFG["model"])
        self.names = self.model.names
-        if IS_CLI:  # for CLI, download the source and init video writer
+        if IS_CLI and self.CFG["source"] is None:
            if self.CFG["source"] is None:
            d_s = "solutions_ci_demo.mp4" if "-pose" not in self.CFG["model"] else "solution_ci_pose_demo.mp4"
            LOGGER.warning(f"⚠️ WARNING: source not provided. using default source {ASSETS_URL}/{d_s}")
            from ultralytics.utils.downloads import safe_download
--- a/ultralytics/utils/benchmarks.py
+++ b/ultralytics/utils/benchmarks.py
@ -118,6 +118,11 @@ def benchmark(
                assert not IS_JETSON, "MNN export not supported on NVIDIA Jetson"
            if i == 13:  # NCNN
                assert not isinstance(model, YOLOWorld), "YOLOWorldv2 NCNN exports not supported yet"
            if i == 14:  # IMX
                assert not is_end2end
                assert not isinstance(model, YOLOWorld), "YOLOWorldv2 IMX exports not supported"
                assert model.task == "detect", "IMX only supported for detection task"
                assert "C2f" in model.__str__(), "IMX only supported for YOLOv8"
            if "cpu" in device.type:
                assert cpu, "inference not supported on CPU"
            if "cuda" in device.type:
--- a/ultralytics/utils/callbacks/comet.py
+++ b/ultralytics/utils/callbacks/comet.py
@ -291,7 +291,7 @@ def _log_plots(experiment, trainer):
            for plots in EVALUATION_PLOT_NAMES
            for prefix in POSE_METRICS_PLOT_PREFIX
        ]
-    elif isinstance(trainer.validator.metrics, DetMetrics) or isinstance(trainer.validator.metrics, OBBMetrics):
+    elif isinstance(trainer.validator.metrics, (DetMetrics, OBBMetrics)):
        plot_filenames = [trainer.save_dir / f"{plots}.png" for plots in EVALUATION_PLOT_NAMES]
    if plot_filenames is not None:
--- a/ultralytics/utils/callbacks/raytune.py
+++ b/ultralytics/utils/callbacks/raytune.py
@ -16,8 +16,7 @@ def on_fit_epoch_end(trainer):
    """Sends training metrics to Ray Tune at end of each epoch."""
    if ray.train._internal.session._get_session():  # replacement for deprecated ray.tune.is_session_enabled()
        metrics = trainer.metrics
-        metrics["epoch"] = trainer.epoch
+        session.report({**metrics, **{"epoch": trainer.epoch + 1}})
        session.report(metrics)
 callbacks = (
--- a/ultralytics/utils/tal.py
+++ b/ultralytics/utils/tal.py
@ -306,7 +306,7 @@ def make_anchors(feats, strides, grid_cell_offset=0.5):
    assert feats is not None
    dtype, device = feats[0].dtype, feats[0].device
    for i, stride in enumerate(strides):
-        _, _, h, w = feats[i].shape
+        h, w = feats[i].shape[2:] if isinstance(feats, list) else (int(feats[i][0]), int(feats[i][1]))
        sx = torch.arange(end=w, device=device, dtype=dtype) + grid_cell_offset  # shift x
        sy = torch.arange(end=h, device=device, dtype=dtype) + grid_cell_offset  # shift y
        sy, sx = torch.meshgrid(sy, sx, indexing="ij") if TORCH_1_10 else torch.meshgrid(sy, sx)
--- a/ultralytics/utils/torch_utils.py
+++ b/ultralytics/utils/torch_utils.py
@ -729,3 +729,48 @@ class EarlyStopping:
                f"i.e. `patience=300` or use `patience=0` to disable EarlyStopping."
            )
        return stop
 class FXModel(nn.Module):
    """
    A custom model class for torch.fx compatibility.
    This class extends `torch.nn.Module` and is designed to ensure compatibility with torch.fx for tracing and graph manipulation.
    It copies attributes from an existing model and explicitly sets the model attribute to ensure proper copying.
    Args:
        model (torch.nn.Module): The original model to wrap for torch.fx compatibility.
    """
    def __init__(self, model):
        """
        Initialize the FXModel.
        Args:
            model (torch.nn.Module): The original model to wrap for torch.fx compatibility.
        """
        super().__init__()
        copy_attr(self, model)
        # Explicitly set `model` since `copy_attr` somehow does not copy it.
        self.model = model.model
    def forward(self, x):
        """
        Forward pass through the model.
        This method performs the forward pass through the model, handling the dependencies between layers and saving intermediate outputs.
        Args:
            x (torch.Tensor): The input tensor to the model.
        Returns:
            (torch.Tensor): The output tensor from the model.
        """
        y = []  # outputs
        for m in self.model:
            if m.f != -1:  # if not from previous layer
                # from earlier layers
                x = y[m.f] if isinstance(m.f, int) else [x if j == -1 else y[j] for j in m.f]
            x = m(x)  # run
            y.append(x)  # save output
        return x