-
Notifications
You must be signed in to change notification settings - Fork 607
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
Add support for sparse YOLOv5 models (#848)
- Loading branch information
1 parent
7d63528
commit de68008
Showing
7 changed files
with
1,247 additions
and
0 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Large diffs are not rendered by default.
Oops, something went wrong.
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,220 @@ | ||
# OBSS SAHI Tool | ||
# Code written by Fatih C Akyon, 2020. | ||
# Using YOLOv5 sparse models from Neural Magic using DeepSparse | ||
# https://neuralmagic.com/deepsparse | ||
|
||
import logging | ||
from typing import Any, Dict, List, Optional | ||
|
||
import numpy as np | ||
|
||
from sahi.models.base import DetectionModel | ||
from sahi.prediction import ObjectPrediction | ||
from sahi.utils.compatibility import fix_full_shape_list, fix_shift_amount_list | ||
from sahi.utils.import_utils import check_package_minimum_version, check_requirements | ||
|
||
logger = logging.getLogger(__name__) | ||
|
||
|
||
class Yolov5SparseDetectionModel(DetectionModel): | ||
def check_dependencies(self) -> None: | ||
check_requirements(["deepsparse", "sparseml"]) | ||
|
||
def load_model(self): | ||
""" | ||
Detection model is initialized and set to self.model. | ||
""" | ||
|
||
from deepsparse import Pipeline | ||
|
||
try: | ||
model = Pipeline.create(task="yolo", model_path=self.model_path) | ||
self.set_model(model) | ||
except Exception as e: | ||
raise TypeError("Could not load the model: ", e) | ||
|
||
def set_model(self, model: Any): | ||
""" | ||
Sets the underlying YOLOv5 model. | ||
Args: | ||
model: Any | ||
A YOLOv5 model | ||
""" | ||
|
||
self.model = model | ||
|
||
# set category_mapping | ||
if not self.category_mapping: | ||
category_mapping = {str(ind): category_name for ind, category_name in enumerate(self.category_names)} | ||
self.category_mapping = category_mapping | ||
|
||
def perform_inference(self, image: np.ndarray): | ||
""" | ||
Prediction is performed using self.model and the prediction result is set to self._original_predictions. | ||
Args: | ||
image: np.ndarray | ||
A numpy array that contains the image to be predicted. 3 channel image should be in RGB order. | ||
""" | ||
|
||
# Confirm model is loaded | ||
if self.model is None: | ||
raise ValueError("Model is not loaded, load it by calling .load_model()") | ||
if self.image_size is not None: | ||
prediction_result = self.model( | ||
images=[image], conf_thres=self.confidence_threshold, image_size=self.image_size | ||
) | ||
else: | ||
prediction_result = self.model(images=[image], conf_thres=self.confidence_threshold) | ||
|
||
self._original_predictions = prediction_result | ||
|
||
@property | ||
def num_categories(self): | ||
""" | ||
Returns number of categories | ||
""" | ||
return 80 | ||
|
||
@property | ||
def category_names(self): | ||
return [ | ||
"person", | ||
"bicycle", | ||
"car", | ||
"motorcycle", | ||
"airplane", | ||
"bus", | ||
"train", | ||
"truck", | ||
"boat", | ||
"traffic light", | ||
"fire hydrant", | ||
"stop sign", | ||
"parking meter", | ||
"bench", | ||
"bird", | ||
"cat", | ||
"dog", | ||
"horse", | ||
"sheep", | ||
"cow", | ||
"elephant", | ||
"bear", | ||
"zebra", | ||
"giraffe" "backpack", | ||
"umbrella", | ||
"handbag", | ||
"tie", | ||
"suitcase", | ||
"frisbee", | ||
"skis", | ||
"snowboard", | ||
"sports ball", | ||
"kite", | ||
"baseball bat", | ||
"baseball glove", | ||
"skateboard", | ||
"surfboard", | ||
"tennis racket", | ||
"bottle", | ||
"wine glass", | ||
"cup", | ||
"fork", | ||
"knife", | ||
"spoon", | ||
"bowl", | ||
"banana", | ||
"apple", | ||
"sandwich", | ||
"orange", | ||
"broccoli", | ||
"carrot", | ||
"hot dog", | ||
"pizza", | ||
"donut", | ||
"cake", | ||
"chair", | ||
"couch", | ||
"potted plant", | ||
"bed", | ||
"dining table", | ||
"toilet", | ||
"tv", | ||
"laptop", | ||
"mouse", | ||
"remote", | ||
"keyboard", | ||
"cell phone", | ||
"microwave", | ||
"oven", | ||
"toaster", | ||
"sink", | ||
"refrigerator", | ||
"book", | ||
"clock", | ||
"vase", | ||
"scissors", | ||
"teddy bear", | ||
"hair drier", | ||
"toothbrush", | ||
] | ||
|
||
def _create_object_prediction_list_from_original_predictions( | ||
self, | ||
shift_amount_list: Optional[List[List[int]]] = [[0, 0]], | ||
full_shape_list: Optional[List[List[int]]] = None, | ||
): | ||
""" | ||
self._original_predictions is converted to a list of prediction.ObjectPrediction and set to | ||
self._object_prediction_list_per_image. | ||
Args: | ||
shift_amount_list: list of list | ||
To shift the box and mask predictions from sliced image to full sized image, should | ||
be in the form of List[[shift_x, shift_y],[shift_x, shift_y],...] | ||
full_shape_list: list of list | ||
Size of the full image after shifting, should be in the form of | ||
List[[height, width],[height, width],...] | ||
""" | ||
|
||
original_predictions = self._original_predictions | ||
# compatilibty for sahi v0.8.15 | ||
shift_amount_list = fix_shift_amount_list(shift_amount_list) | ||
full_shape_list = fix_full_shape_list(full_shape_list) | ||
|
||
# handle all predictions | ||
object_prediction_list_per_image = [] | ||
for image_ind, (prediction_bboxes, prediction_scores, prediction_categories) in enumerate(original_predictions): | ||
shift_amount = shift_amount_list[image_ind] | ||
full_shape = None if full_shape_list is None else full_shape_list[image_ind] | ||
object_prediction_list = [] | ||
|
||
# process predictions | ||
for bbox, score, category_id in zip(prediction_bboxes, prediction_scores, prediction_categories): | ||
category_id = int(float(category_id)) | ||
category_name = self.category_mapping[str(category_id)] | ||
|
||
# fix out of image box coords | ||
if full_shape is not None: | ||
bbox[0] = min(full_shape[1], bbox[0]) | ||
bbox[1] = min(full_shape[0], bbox[1]) | ||
bbox[2] = min(full_shape[1], bbox[2]) | ||
bbox[3] = min(full_shape[0], bbox[3]) | ||
|
||
# ignore invalid predictions | ||
if not (bbox[0] < bbox[2]) or not (bbox[1] < bbox[3]): | ||
logger.warning(f"ignoring invalid prediction with bbox: {bbox}") | ||
continue | ||
|
||
object_prediction = ObjectPrediction( | ||
bbox=bbox, | ||
category_id=category_id, | ||
score=score, | ||
bool_mask=None, | ||
category_name=category_name, | ||
shift_amount=shift_amount, | ||
full_shape=full_shape, | ||
) | ||
object_prediction_list.append(object_prediction) | ||
object_prediction_list_per_image.append(object_prediction_list) | ||
|
||
self._object_prediction_list_per_image = object_prediction_list_per_image |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,2 @@ | ||
class Yolov5TestConstants: | ||
YOLOV_MODEL_URL = "zoo:cv/detection/yolov5-s/pytorch/ultralytics/coco/pruned-aggressive_96" |
Oops, something went wrong.