DeepStack/intelligencelayer/shared/process.py at dev · fblgit/DeepStack

74 lines (61 loc) · 2.2 KB

import argparse
import platform
import shutil
import time
from pathlib import Path
import models
import numpy as np
import torch
import torch.backends.cudnn as cudnn
from models.experimental import attempt_load
from numpy import random
from PIL import Image
from utils.datasets import letterbox
from utils.general import (
    non_max_suppression,
    scale_coords
import torch.nn as nn
from utils.activations import Hardswish
class YOLODetector(object):
    def __init__(self, model_path: str, reso: int = 640, cuda: bool = False):
        self.device = torch.device("cuda:0" if cuda else "cpu")
        self.half = self.device.type != "cpu"
        self.reso = (reso, reso)
        self.cuda = cuda
        self.model = attempt_load(model_path, map_location=self.device)
        # Update model
        for k, m in self.model.named_modules():
            m._non_persistent_buffers_set = set()  # pytorch 1.6.0 compatability
            if isinstance(m, models.common.Conv) and isinstance(m.act, nn.Hardswish):
                m.act = Hardswish()  # assign activation
        self.names = (
            self.model.module.names
            if hasattr(self.model, "module")
            else self.model.names
        if self.half:
            self.model.half()
    def predict(self, img_path: str, confidence: float = 0.4):
        confidence = max(0.1,confidence)
        img0 = Image.open(img_path).convert("RGB")
        img = np.asarray(letterbox(img0, new_shape=self.reso)[0])
        img = img.transpose(2, 0, 1)
        img = np.ascontiguousarray(img)
        img = torch.from_numpy(img).to(self.device)
        img0 = np.asarray(img0)
        img = img.half() if self.half else img.float()  # uint8 to fp16/32
        img /= 255.0  # 0 - 255 to 0.0 - 1.0
        if img.ndimension() == 3:
            img = img.unsqueeze(0)
        pred = self.model(img, augment=False)[0]
        pred = non_max_suppression(
            pred, confidence, 0.45, classes=None, agnostic=False
        )[0]
        if pred is None:
            pred = []
        else:
            # Rescale boxes from img_size to im0 size
            pred[:, :4] = scale_coords(img.shape[2:], pred[:, :4], img0.shape).round()
        return pred

Provide feedback

Saved searches

Use saved searches to filter your results more quickly

FilesExpand file tree

process.py

Latest commit

History

process.py

File metadata and controls