OpenVino support for yolov8 object detection #896
base: main
Changes to the base DetectionModel class (sahi.models.base):

@@ -9,6 +9,7 @@
 from sahi.utils.torch import select_device as select_torch_device


 class DetectionModel:
     def __init__(
         self,
@@ -49,6 +50,8 @@ def __init__(
         self.config_path = config_path
         self.model = None
         self.device = device
+        if ".xml" == self.model_path[-4:]:
+            self.device = "CPU"
         self.mask_threshold = mask_threshold
         self.confidence_threshold = confidence_threshold
         self.category_mapping = category_mapping

Reviewer comment (on the added lines): Please don't change the base class, move these operations to Yolov8OpenvinoDetectionModel class.
@@ -57,7 +60,8 @@ def __init__(
         self._original_predictions = None
         self._object_prediction_list_per_image = None

-        self.set_device()
+        if not ".xml" == self.model_path[-4:]:
+            self.set_device()

         # automatically load model if load_at_init is True
         if load_at_init:

Reviewer comment (on the added lines): Please don't change the base class, move these operations to Yolov8OpenvinoDetectionModel class.
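One way to satisfy this request without touching the base class (a sketch, not part of the PR) is to override set_device in the OpenVINO model class; the class name follows the reviewer's Yolov8OpenvinoDetectionModel suggestion, and the base class stays exactly as it is on main:

from sahi.models.base import DetectionModel


class Yolov8OpenvinoDetectionModel(DetectionModel):
    def set_device(self):
        # OpenVINO IR models (.xml) are compiled for an OpenVINO device string
        # such as "CPU", so skip the torch device selection for them.
        if self.model_path is not None and self.model_path.endswith(".xml"):
            self.device = "CPU"
        else:
            super().set_device()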
New file: Yolov8DetectionVinoModel (YOLOv8 OpenVINO detection model)

@@ -0,0 +1,223 @@
import logging
import time
from typing import Any, List, Optional, Tuple

import cv2
import numpy as np
import torch
from openvino.runtime import AsyncInferQueue, Core
from ultralytics.yolo.utils.ops import non_max_suppression, scale_boxes

from sahi.models.base import DetectionModel
from sahi.prediction import ObjectPrediction
from sahi.utils.compatibility import fix_full_shape_list, fix_shift_amount_list
from sahi.utils.import_utils import check_requirements

logger = logging.getLogger(__name__)

Reviewer comment (on the openvino.runtime import): these should be imported during function call.
class Yolov8DetectionVinoModel(DetectionModel):

Reviewer comment: Suggested change (on the class definition line).

    # def __init__(self):
    #     self.output = None

    def check_dependencies(self) -> None:
        check_requirements(["ultralytics"])

Reviewer comment: openvino req should be included.
    def load_model(self):
        """
        OpenVino IR model is initialized and set to self.model.
        """
        try:
            core = Core()
            ov_model = core.read_model(self.model_path)
            self.cls = ov_model.rt_info
            model = core.compile_model(ov_model, self.device)
            self.infer_queue = AsyncInferQueue(model, 2)
            self.infer_queue.set_callback(self.callback)
            self.set_model(model)
            self.output = None
        except Exception as e:
            raise TypeError("model_path is not a valid yolov8 OpenVino model path: ", e)
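A minimal sketch (not part of the PR) of how the two review comments above could be applied: declare openvino in check_dependencies and defer the openvino.runtime import into load_model (the module-level openvino import would then be dropped). Everything except the requirement list and the import placement is copied from the PR:

    def check_dependencies(self) -> None:
        # Declare openvino alongside ultralytics, as requested in review.
        check_requirements(["ultralytics", "openvino"])

    def load_model(self):
        """
        OpenVino IR model is initialized and set to self.model.
        """
        # Deferred import, as requested in review: openvino is only needed
        # once the model is actually loaded.
        from openvino.runtime import AsyncInferQueue, Core

        try:
            core = Core()
            ov_model = core.read_model(self.model_path)
            self.cls = ov_model.rt_info
            model = core.compile_model(ov_model, self.device)
            self.infer_queue = AsyncInferQueue(model, 2)
            self.infer_queue.set_callback(self.callback)
            self.set_model(model)
            self.output = None
        except Exception as e:
            raise TypeError("model_path is not a valid yolov8 OpenVino model path: ", e)

The remaining methods of the PR class continue unchanged below.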
    def set_model(self, model: Any):
        """
        Sets the underlying YOLOv8 model.
        Args:
            model: Any
                A YOLOv8 OpenVino IR model
        """
        self.model = model
        self.input_layer_ir = self.model.input(0)
        self.output_layer = self.model.output(0)

        # set category_mapping
        if not self.category_mapping:
            category_mapping = {str(ind): category_name for ind, category_name in enumerate(self.category_names)}
            self.category_mapping = category_mapping
    def callback(self, infer_request, info) -> None:
        """
        Callback used by the async infer queue for postprocessing.

        Args:
            infer_request: the InferRequest object
            info: a tuple of (input tensor, start time)
        Returns:
            None
        """
        result = infer_request.get_output_tensor(0).data

        input_hw = self.input_tensor.shape[2:]

        prediction_result = non_max_suppression(
            torch.from_numpy(result),
            conf_thres=self.confidence_threshold,
        )

        # scale the detected bboxes back to the original image size
        for i, pred in enumerate(prediction_result):
            shape = self.orig_image.shape
            pred[:, :4] = scale_boxes(input_hw, pred[:, :4], shape).round()

        if self.output is None:
            self.output = prediction_result
    def pad_resize_image(
        self,
        cv2_img: np.ndarray,
        new_size: Tuple[int, int] = (640, 640),
        color: Tuple[int, int, int] = (125, 125, 125),
    ) -> np.ndarray:
        """Resize and pad the image with color if necessary, maintaining the original aspect ratio.

        Args:
            cv2_img: numpy.ndarray = cv2 image
            new_size: tuple(int, int) = (width, height)
            color: tuple(int, int, int) = (B, G, R)
        """
        in_h, in_w = cv2_img.shape[:2]
        new_w, new_h = new_size
        # rescale down
        scale = min(new_w / in_w, new_h / in_h)
        # get new scaled widths and heights
        scale_new_w, scale_new_h = int(in_w * scale), int(in_h * scale)

        resized_img = cv2.resize(cv2_img, (scale_new_w, scale_new_h))

        # calculate deltas for padding
        d_w = max(new_w - scale_new_w, 0)
        d_h = max(new_h - scale_new_h, 0)
        # center image with padding on top/bottom or left/right
        top, bottom = d_h // 2, d_h - (d_h // 2)
        left, right = d_w // 2, d_w - (d_w // 2)
        pad_resized_img = cv2.copyMakeBorder(
            resized_img, top, bottom, left, right, cv2.BORDER_CONSTANT, value=color
        )
        return pad_resized_img
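As a quick check of the letterbox arithmetic above (illustrative numbers, not from the PR), a hypothetical 1280x720 frame resized to the default (640, 640) target is scaled by 0.5 and padded evenly on the top and bottom:

# Illustrative letterbox math for an assumed 1280x720 (W x H) input frame.
in_w, in_h = 1280, 720
new_w, new_h = 640, 640
scale = min(new_w / in_w, new_h / in_h)                          # 0.5
scale_new_w, scale_new_h = int(in_w * scale), int(in_h * scale)  # 640, 360
d_h = max(new_h - scale_new_h, 0)                                # 280
top, bottom = d_h // 2, d_h - d_h // 2                           # 140, 140
print(scale_new_w, scale_new_h, top, bottom)                     # 640 360 140 140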
    def perform_inference(self, image: np.ndarray):
        """
        Prediction is performed using self.model and the prediction result is set to self._original_predictions.
        Args:
            image: np.ndarray
                A numpy array that contains the image to be predicted. 3 channel image should be in RGB order.
        """
        self.orig_image = image.copy()

        # resize image and pad for detection
        image = self.pad_resize_image(image)

        # convert HWC to CHW
        image = image.transpose(2, 0, 1)

        # image to tensor
        image = np.ascontiguousarray(image)
        input_tensor = image.astype(np.float32)
        input_tensor /= 255.0
        if input_tensor.ndim == 3:
            input_tensor = np.expand_dims(input_tensor, 0)
        self.input_tensor = input_tensor.astype(np.float32)

        self.infer_queue.start_async({self.input_layer_ir.any_name: self.input_tensor}, (self.input_tensor, time.time()))
        self.infer_queue.wait_all()
        if self.output is not None:
            self._original_predictions = self.output
        self.output = None
    @property
    def category_names(self):
        return eval(self.cls["framework"]["names"].value).values()

    def _create_object_prediction_list_from_original_predictions(
        self,
        shift_amount_list: Optional[List[List[int]]] = [[0, 0]],
        full_shape_list: Optional[List[List[int]]] = None,
    ):
        """
        self._original_predictions is converted to a list of prediction.ObjectPrediction and set to
        self._object_prediction_list_per_image.
        Args:
            shift_amount_list: list of list
                To shift the box and mask predictions from sliced image to full sized image, should
                be in the form of List[[shift_x, shift_y],[shift_x, shift_y],...]
            full_shape_list: list of list
                Size of the full image after shifting, should be in the form of
                List[[height, width],[height, width],...]
        """
        original_predictions = self._original_predictions

        # compatibility for sahi v0.8.15
        shift_amount_list = fix_shift_amount_list(shift_amount_list)
        full_shape_list = fix_full_shape_list(full_shape_list)

        # handle all predictions
        object_prediction_list_per_image = []
        for image_ind, image_predictions_in_xyxy_format in enumerate(original_predictions):
            shift_amount = shift_amount_list[image_ind]
            full_shape = None if full_shape_list is None else full_shape_list[image_ind]
            object_prediction_list = []

            # process predictions
            for prediction in image_predictions_in_xyxy_format.cpu().detach().numpy():
                x1 = prediction[0]
                y1 = prediction[1]
                x2 = prediction[2]
                y2 = prediction[3]
                bbox = [x1, y1, x2, y2]
                score = prediction[4]
                category_id = int(prediction[5])
                category_name = self.category_mapping[str(category_id)]

                # fix negative box coords
                bbox[0] = max(0, bbox[0])
                bbox[1] = max(0, bbox[1])
                bbox[2] = max(0, bbox[2])
                bbox[3] = max(0, bbox[3])

                # fix out of image box coords
                if full_shape is not None:
                    bbox[0] = min(full_shape[1], bbox[0])
                    bbox[1] = min(full_shape[0], bbox[1])
                    bbox[2] = min(full_shape[1], bbox[2])
                    bbox[3] = min(full_shape[0], bbox[3])

                # ignore invalid predictions
                if not (bbox[0] < bbox[2]) or not (bbox[1] < bbox[3]):
                    logger.warning(f"ignoring invalid prediction with bbox: {bbox}")
                    continue

                object_prediction = ObjectPrediction(
                    bbox=bbox,
                    category_id=category_id,
                    score=score,
                    bool_mask=None,
                    category_name=category_name,
                    shift_amount=shift_amount,
                    full_shape=full_shape,
                )
                object_prediction_list.append(object_prediction)
            object_prediction_list_per_image.append(object_prediction_list)
        self._object_prediction_list_per_image = object_prediction_list_per_image
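With the class above in place, SAHI's sliced prediction can run on the compiled OpenVINO model. A minimal usage sketch (not part of the PR; the .xml and image paths are placeholders and the slicing parameters are arbitrary):

from sahi.predict import get_sliced_prediction

# Placeholder path to an exported YOLOv8 OpenVINO IR model.
detection_model = Yolov8DetectionVinoModel(
    model_path="yolov8n_openvino_model/yolov8n.xml",
    confidence_threshold=0.4,
    device="CPU",
)

result = get_sliced_prediction(
    "demo_image.jpg",  # placeholder image path
    detection_model,
    slice_height=512,
    slice_width=512,
    overlap_height_ratio=0.2,
    overlap_width_ratio=0.2,
)
print(len(result.object_prediction_list))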
Changes to the YOLOv8 utils module:

@@ -2,6 +2,7 @@
 from os import path
 from pathlib import Path
 from typing import Optional
+from ultralytics import YOLO


 class Yolov8TestConstants:

Reviewer comment (on the YOLO import): this import should be moved inside to test.

@@ -44,27 +45,36 @@ def download_yolov8s_model(destination_path: Optional[str] = None):
         )


-def download_yolov8m_model(destination_path: Optional[str] = None):
-    if destination_path is None:
-        destination_path = Yolov8TestConstants.YOLOV8M_MODEL_PATH
+def OpenVino_yolov8n_model(yolov8n_model_path: Optional[str] = None):
+    if yolov8n_model_path is None:
+        yolov8n_model_path = Yolov8TestConstants.YOLOV8S_MODEL_PATH
+
+    download_yolov8n_model(yolov8n_model_path)
+
+    destination_path = str(Path(yolov8n_model_path).parent) + "/" + "yolov8n_openvino_model" + "/" + "yolov8n.xml"
     Path(destination_path).parent.mkdir(parents=True, exist_ok=True)

-    if not path.exists(destination_path):
-        urllib.request.urlretrieve(
-            Yolov8TestConstants.YOLOV8M_MODEL_URL,
-            destination_path,
-        )
+    try:
+        det_model = YOLO(yolov8n_model_path)
+        det_model.export(format="openvino", dynamic=True, half=False)
+    except Exception as e:
+        raise TypeError("model_path is not a valid yolov8 model path: ", e)

Reviewer comment: Suggested change (on the OpenVino_yolov8n_model definition).


-def download_yolov8l_model(destination_path: Optional[str] = None):
-    if destination_path is None:
-        destination_path = Yolov8TestConstants.YOLOV8L_MODEL_PATH
+def OpenVino_yolov8s_model(yolov8s_model_path: Optional[str] = None):
+    if yolov8s_model_path is None:
+        yolov8s_model_path = Yolov8TestConstants.YOLOV8S_MODEL_PATH
+    download_yolov8s_model(yolov8s_model_path)
+
+    destination_path = str(Path(yolov8s_model_path).parent) + "/" + "yolov8s_openvino_model" + "/" + "yolov8s.xml"
     Path(destination_path).parent.mkdir(parents=True, exist_ok=True)

-    if not path.exists(destination_path):
-        urllib.request.urlretrieve(
-            Yolov8TestConstants.YOLOV8L_MODEL_URL,
-            destination_path,
-        )
+    try:
+        det_model = YOLO(yolov8s_model_path)
+        det_model.export(format="openvino", dynamic=True, half=False)
+    except Exception as e:
+        raise TypeError("model_path is not a valid yolov8 model path: ", e)

Reviewer comment: Suggested change (on the OpenVino_yolov8s_model definition).
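A usage sketch for the new export helpers (not part of the PR; the weights path is a placeholder and the module path sahi.utils.yolov8 is assumed): the helper downloads the .pt weights if they are missing and exports an OpenVINO IR next to them via ultralytics' YOLO(...).export(), and the resulting .xml is what the detection model's model_path expects.

from sahi.utils.yolov8 import OpenVino_yolov8n_model

# Placeholder location for the yolov8n weights; the helper downloads them if
# missing and exports the OpenVINO IR next to them.
OpenVino_yolov8n_model("models/yolov8n.pt")

# Per the path built inside the helper, the exported IR ends up at:
model_path = "models/yolov8n_openvino_model/yolov8n.xml"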