RK3588_Detection/rknn_detect_yolov5_best.py

#from rknn.api import RKNN
from rknnlite.api import RKNNLite
import cv2
import numpy as np
import cv2
import time
import os
from PIL import Image
"""
yolov5 预测脚本 for rknn
"""

SIZE = (640, 640)
Width = 640
Height = 640
CLASSES = ("lighting")
OBJ_THRESH = 0.1
NMS_THRESH = 0.1
MASKS = [[0, 1, 2], [3, 4, 5], [6, 7, 8]]
ANCHORS = [[10, 13], [16, 30], [33, 23], [30, 61], [62, 45], [59, 119], [116, 90], [156, 198], [373, 326]]


IMAGE_EXT = [".jpg", "*.JPG", ".jpeg", ".webp", ".bmp", ".png"]

def sigmoid(x):
    return 1 / (1 + np.exp(-x))

def letterbox_image(image, size):
    iw, ih = image.size
    w, h = size
    scale = min(w / iw, h / ih)
    nw = int(iw * scale)
    nh = int(ih * scale)

    image = np.array(image)
    image = cv2.resize(image, (nw, nh), interpolation=cv2.INTER_LINEAR)
    image = Image.fromarray(image)
    new_image = Image.new('RGB', size, (128, 128, 128))
    new_image.paste(image, ((w - nw) // 2, (h - nh) // 2))
    return new_image

def get_image_list(path):
    image_names = []
    for maindir, subdir, file_name_list in os.walk(path):
        for filename in file_name_list:
            apath = os.path.join(maindir, filename)
            ext = os.path.splitext(apath)[1]
            if ext in IMAGE_EXT:
                image_names.append(apath)
    return image_names

def filter_boxes(boxes, box_confidences, box_class_probs) -> (np.ndarray, np.ndarray, np.ndarray):
    box_scores = box_confidences * box_class_probs  # 条件概率， 在该cell存在物体的概率的基础上是某个类别的概率
    box_classes = np.argmax(box_scores, axis=-1)  # 找出概率最大的类别索引
    box_class_scores = np.max(box_scores, axis=-1)  # 最大类别对应的概率值
    pos = np.where(box_class_scores >= OBJ_THRESH)  # 找出概率大于阈值的item
    # pos = box_class_scores >= OBJ_THRESH  # 找出概率大于阈值的item
    boxes = boxes[pos]
    classes = box_classes[pos]
    scores = box_class_scores[pos]
    return boxes, classes, scores


def nms_boxes(boxes, scores):
    x = boxes[:, 0]
    y = boxes[:, 1]
    w = boxes[:, 2]
    h = boxes[:, 3]

    areas = w * h
    order = scores.argsort()[::-1]

    keep = []
    while order.size > 0:
        i = order[0]
        keep.append(i)

        xx1 = np.maximum(x[i], x[order[1:]])
        yy1 = np.maximum(y[i], y[order[1:]])
        xx2 = np.minimum(x[i] + w[i], x[order[1:]] + w[order[1:]])
        yy2 = np.minimum(y[i] + h[i], y[order[1:]] + h[order[1:]])

        w1 = np.maximum(0.0, xx2 - xx1 + 0.00001)
        h1 = np.maximum(0.0, yy2 - yy1 + 0.00001)
        inter = w1 * h1

        ovr = inter / (areas[i] + areas[order[1:]] - inter)
        inds = np.where(ovr <= NMS_THRESH)[0]
        order = order[inds + 1]
    keep = np.array(keep)
    return keep


def load_rknn_model(PATH):
    # Create RKNN object
    rknn = RKNNLite()
    # Load tensorflow model
    print('--> Loading model')
    ret = rknn.load_rknn(PATH)
    if ret != 0:
        print('load rknn model failed')
        exit(ret)
    print('done')
    #ret = rknn.init_runtime(device_id='TS018083200400178', rknn2precompile=True)
    ret = rknn.init_runtime()
    if ret != 0:
        print('Init runtime environment failed')
        exit(ret)
    print('done')
    return rknn


def predict(img_src, rknn):

    img = letterbox_image(img_src, (Width, Height))
    img = np.array(img)

    t0 = time.time()
    #print("img shape               \t:", img.shape)
    pred_onx = rknn.inference(inputs=[img])
    print("--------------------time: \t", time.time() - t0)
    boxes, classes, scores = [], [], []
    for t in range(3):
        input0_data = sigmoid(pred_onx[t][0])
        input0_data = np.transpose(input0_data, (1, 2, 0, 3))
        grid_h, grid_w, channel_n, predict_n = input0_data.shape
        #print("-------------------input0_data.shape----------------",input0_data.shape)
        anchors = [ANCHORS[i] for i in MASKS[t]]
        box_confidence = input0_data[..., 4]
        box_confidence = np.expand_dims(box_confidence, axis=-1)
        box_class_probs = input0_data[..., 5:]
        box_xy = input0_data[..., :2]
        box_wh = input0_data[..., 2:4]
        col = np.tile(np.arange(0, grid_w), grid_h).reshape(-1, grid_w)
        row = np.tile(np.arange(0, grid_h).reshape(-1, 1), grid_w)
        col = col.reshape((grid_h, grid_w, 1, 1)).repeat(3, axis=-2)
        row = row.reshape((grid_h, grid_w, 1, 1)).repeat(3, axis=-2)
        grid = np.concatenate((col, row), axis=-1)
        box_xy = box_xy * 2 - 0.5 + grid
        box_wh = (box_wh * 2) ** 2 * anchors
        box_xy /= (grid_w, grid_h)  # 计算原尺寸的中心
        box_wh /= SIZE  # 计算原尺寸的宽高
        box_xy -= (box_wh / 2.)  # 计算原尺寸的xy
        box = np.concatenate((box_xy, box_wh), axis=-1)
        res = filter_boxes(box, box_confidence, box_class_probs)
        boxes.append(res[0])
        classes.append(res[1])
        scores.append(res[2])
    boxes, classes, scores = np.concatenate(boxes), np.concatenate(classes), np.concatenate(scores)
    #print("------------------------boxes, classes, scores-----------------------",boxes, classes, scores)
    nboxes, nclasses, nscores = [], [], []
    for c in set(classes):
        inds = np.where(classes == c)
        b = boxes[inds]
        c = classes[inds]
        s = scores[inds]
        keep = nms_boxes(b, s)
        #keep = [0,1,2]
        #print("--------------keep-------------",keep)
        nboxes.append(b[keep])
        nclasses.append(c[keep])
        nscores.append(s[keep])
    if len(nboxes) < 1:
        return [], [], []
    boxes = np.concatenate(nboxes)
    classes = np.concatenate(nclasses)
    scores = np.concatenate(nscores)
    #print("------------------------boxes, classes, scores-----------------------",boxes, classes, scores)
    return boxes, classes, scores


def clip_coords(boxes, img_shape):
    # Clip bounding xyxy bounding boxes to image shape (height, width)
    #boxes[:, 0].clp(0, img_shape[1])  # x1
    #boxes[:, 1].clp(0, img_shape[0])  # y1
    #boxes[:, 2].clp(0, img_shape[1])  # x2
    #boxes[:, 3].clp(0, img_shape[0])  # y2
    np.clip(boxes[:, 0],0,img_shape[1])
    np.clip(boxes[:, 1],0,img_shape[0])
    np.clip(boxes[:, 2],0,img_shape[1])
    np.clip(boxes[:, 3],0,img_shape[0])
    return boxes

def scale_coords(img1_shape, coords, img0_shape, ratio_pad=None):
    
    # Rescale coords (xyxy) from img1_shape to img0_shape
    if ratio_pad is None:  # calculate from img0_shape
        gain = min(img1_shape[0]/img0_shape[0], img1_shape[1]/img0_shape[1])  # gain  = old / new
        #print("------------gain-----------",gain)
        pad = (img1_shape[1] - img0_shape[1] * gain) / 2, (img1_shape[0] - img0_shape[0] * gain) / 2  # wh padding
    else:
        gain = ratio_pad[0][0]
        pad = ratio_pad[1]
    #print("-----------old-coords-----------",coords)
    coords[:, [2]] = (coords[:, [0]] + coords[:, [2]]) * img1_shape[1] - pad[0]  # x padding
    coords[:, [3]] = (coords[:, [1]] + coords[:, [3]]) * img1_shape[0] - pad[1]  # y padding
    coords[:, [0]] = coords[:, [0]] * img1_shape[1] - pad[0]  # x padding
    coords[:, [1]] = coords[:, [1]] * img1_shape[0] - pad[1]  # y padding
    #print("-----------new-coords-----------",coords)
    #print("------------pad-----------",pad)
    coords[:, :4] /= gain

    coords = clip_coords(coords, img0_shape)
    return coords


def display(boxes=None, classes=None, scores=None, image_src=None, input_size=(640, 640), line_thickness=None, text_bg_alpha=0.0):
    labels = classes
    boxs = boxes
    confs = scores

    h, w, c = image_src.shape
    if len(boxes) <= 0:
        return image_src
    boxs[:, :] = scale_coords(input_size, boxs[:, :], (h, w)).round()

    tl = line_thickness or round(0.002 * (w + h) / 2) + 1
    for i, box in enumerate(boxs):
        x1, y1, x2, y2 = box

        ratio = (y2-y1)/(x2-x1)

        x1, y1, x2, y2 = int(x1), int(y1), int(x2), int(y2)
        np.random.seed(int(labels[i]) + 2020)
        color = (np.random.randint(0, 255), 0, np.random.randint(0, 255))
        cv2.rectangle(image_src, (x1, y1), (x2, y2), color, max(int((w + h) / 600), 1), cv2.LINE_AA)
        label = '{0:.3f}'.format(confs[i])
        t_size = cv2.getTextSize(label, 0, fontScale=tl / 3, thickness=1)[0]
        c2 = x1 + t_size[0] + 3, y1 - t_size[1] - 5
        if text_bg_alpha == 0.0:
            cv2.rectangle(image_src, (x1 - 1, y1), c2, color, cv2.FILLED, cv2.LINE_AA)
        else:
            # 透明文本背景
            alphaReserve = text_bg_alpha  # 0：不透明 1：透明
            BChannel, GChannel, RChannel = color
            xMin, yMin = int(x1 - 1), int(y1 - t_size[1] - 3)
            xMax, yMax = int(x1 + t_size[0]), int(y1)
            image_src[yMin:yMax, xMin:xMax, 0] = image_src[yMin:yMax, xMin:xMax, 0] * alphaReserve + BChannel * (1 - alphaReserve)
            image_src[yMin:yMax, xMin:xMax, 1] = image_src[yMin:yMax, xMin:xMax, 1] * alphaReserve + GChannel * (1 - alphaReserve)
            image_src[yMin:yMax, xMin:xMax, 2] = image_src[yMin:yMax, xMin:xMax, 2] * alphaReserve + RChannel * (1 - alphaReserve)
        cv2.putText(image_src, label, (x1 + 3, y1 - 4), 0, tl / 3, [255, 255, 255],
                    thickness=1, lineType=cv2.LINE_AA)
    return image_src


if __name__ == '__main__':
    path = "./imgs/"
    save_folder = "./result/"
    RKNN_MODEL_PATH = r"23best_640x640.rknn"
    rknn = load_rknn_model(RKNN_MODEL_PATH)
    predict.__defaults__ = (None, rknn)
    files = get_image_list(path)
    current_time = time.localtime()
    for image_name in files:
        print("--------------------------image_name-----------------------", image_name)
        image_src = Image.open(image_name)
        boxes, classes, scores = predict(image_src)
        image = np.array(image_src)
        save_image = display(boxes, classes, scores, image)
        save_image = cv2.cvtColor(save_image, cv2.COLOR_BGR2RGB)
        save_file_name = os.path.join(save_folder, os.path.basename(image_name))
        cv2.imwrite(save_file_name,save_image)

        print("--------------------------res-----------------------",boxes, classes, scores)