I'd like to ask for some advice: I converted a YOLOv10 model to RKNN without quantization (the connected-board runtime accuracy check passes), and inference also works correctly under rknn_model_zoo/example/yolov10/, with the following command:
python yolov10.py --model_path /home/zionchu/Desktop/Engineering/RK3588_dev/model_calibration/models/nosigmoid.rknn --target Rk3588 --img_show --device_id 0973f07c156de1b4
But after porting this code to run on the RK3588 itself, inference on the same input image produces mismatched classification results and a large drop in accuracy. What could be causing this? The command is:
python yolov10.py --model_path /home/pi/zzh/metal_detection_rknn/weights/nosigmoid.rknn --img_save
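One way to narrow down this kind of PC-vs-board mismatch is to dump the raw output tensors for the exact same preprocessed input on both sides and diff them before any post-processing runs. A minimal sketch, assuming the outputs of model.run() were saved on each side with np.save() under the hypothetical names pc_out_*.npy / board_out_*.npy (not part of the zoo scripts; adjust the branch count to your export):

import numpy as np

# Hypothetical dump files: one .npy per model output tensor, saved on each side.
for i in range(6):  # adjust to the actual number of output branches
    pc = np.load('pc_out_{}.npy'.format(i))
    board = np.load('board_out_{}.npy'.format(i))
    print(i, np.abs(pc - board).max(), np.allclose(pc, board, atol=1e-3))

If the raw tensors already disagree, the problem is on the model/runtime side rather than in the post-processing code below.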
Code provided: 1. yolov10.py
import os
import cv2
import sys
import argparse
import torch

# add path
realpath = os.path.abspath(__file__)
_sep = os.path.sep
realpath = realpath.split(_sep)
sys.path.append(os.path.join(realpath[0]+_sep, *realpath[1:realpath.index('official_yolov10_python')+1]))

from py_utils.coco_utils import COCO_test_helper
import numpy as np

OBJ_THRESH = 0.25
NMS_THRESH = 0.45

# The following two params are for the mAP test
# OBJ_THRESH = 0.001
# NMS_THRESH = 0.65

IMG_SIZE = (640, 640)  # (width, height), such as (1280, 736)

CLASSES = ("1", "2", "3")
coco_id_list = [1, 2, 3]
def filter_boxes(boxes, box_confidences, box_class_probs):
    """Filter boxes with object threshold."""
    box_confidences = box_confidences.reshape(-1)
    candidate, class_num = box_class_probs.shape

    class_max_score = np.max(box_class_probs, axis=-1)
    classes = np.argmax(box_class_probs, axis=-1)

    _class_pos = np.where(class_max_score * box_confidences >= OBJ_THRESH)
    scores = (class_max_score * box_confidences)[_class_pos]

    boxes = boxes[_class_pos]
    classes = classes[_class_pos]

    return boxes, classes, scores
def nms_boxes(boxes, scores):
    """Suppress non-maximal boxes.
    # Returns
        keep: ndarray, index of effective boxes.
    """
    x = boxes[:, 0]
    y = boxes[:, 1]
    w = boxes[:, 2] - boxes[:, 0]
    h = boxes[:, 3] - boxes[:, 1]

    areas = w * h
    order = scores.argsort()[::-1]

    keep = []
    while order.size > 0:
        i = order[0]
        keep.append(i)

        xx1 = np.maximum(x[i], x[order[1:]])
        yy1 = np.maximum(y[i], y[order[1:]])
        xx2 = np.minimum(x[i] + w[i], x[order[1:]] + w[order[1:]])
        yy2 = np.minimum(y[i] + h[i], y[order[1:]] + h[order[1:]])

        w1 = np.maximum(0.0, xx2 - xx1 + 0.00001)
        h1 = np.maximum(0.0, yy2 - yy1 + 0.00001)
        inter = w1 * h1

        ovr = inter / (areas[i] + areas[order[1:]] - inter)
        inds = np.where(ovr <= NMS_THRESH)[0]
        order = order[inds + 1]
    keep = np.array(keep)
    return keep
def dfl(position):
    # Distribution Focal Loss (DFL); torch is already imported at the top
    x = torch.tensor(position)
    n, c, h, w = x.shape
    p_num = 4
    mc = c // p_num
    y = x.reshape(n, p_num, mc, h, w)
    y = y.softmax(2)
    acc_matrix = torch.tensor(range(mc)).float().reshape(1, 1, mc, 1, 1)
    y = (y * acc_matrix).sum(2)
    return y.numpy()
def box_process(position):
    grid_h, grid_w = position.shape[2:4]
    col, row = np.meshgrid(np.arange(0, grid_w), np.arange(0, grid_h))
    col = col.reshape(1, 1, grid_h, grid_w)
    row = row.reshape(1, 1, grid_h, grid_w)
    grid = np.concatenate((col, row), axis=1)
    stride = np.array([IMG_SIZE[1] // grid_h, IMG_SIZE[0] // grid_w]).reshape(1, 2, 1, 1)

    position = dfl(position)
    box_xy = grid + 0.5 - position[:, 0:2, :, :]
    box_xy2 = grid + 0.5 + position[:, 2:4, :, :]
    xyxy = np.concatenate((box_xy * stride, box_xy2 * stride), axis=1)

    return xyxy
def post_process(input_data):
    boxes, scores, classes_conf = [], [], []
    default_branch = 3
    pair_per_branch = len(input_data) // default_branch
    # The Python demo ignores the score_sum output
    for i in range(default_branch):
        boxes.append(box_process(input_data[pair_per_branch * i]))
        classes_conf.append(input_data[pair_per_branch * i + 1])
        scores.append(np.ones_like(input_data[pair_per_branch * i + 1][:, :1, :, :], dtype=np.float32))

    def sp_flatten(_in):
        ch = _in.shape[1]
        _in = _in.transpose(0, 2, 3, 1)
        return _in.reshape(-1, ch)

    boxes = [sp_flatten(_v) for _v in boxes]
    classes_conf = [sp_flatten(_v) for _v in classes_conf]
    scores = [sp_flatten(_v) for _v in scores]

    boxes = np.concatenate(boxes)
    classes_conf = np.concatenate(classes_conf)
    scores = np.concatenate(scores)

    # filter according to threshold
    boxes, classes, scores = filter_boxes(boxes, scores, classes_conf)

    # nms
    nboxes, nclasses, nscores = [], [], []
    for c in set(classes):
        inds = np.where(classes == c)
        b = boxes[inds]
        c = classes[inds]
        s = scores[inds]
        keep = nms_boxes(b, s)

        if len(keep) != 0:
            nboxes.append(b[keep])
            nclasses.append(c[keep])
            nscores.append(s[keep])

    if not nclasses and not nscores:
        return None, None, None

    boxes = np.concatenate(nboxes)
    classes = np.concatenate(nclasses)
    scores = np.concatenate(nscores)

    return boxes, classes, scores
def post_process_yolov10(input_data):
    max_det, nc = 300, len(CLASSES)
    boxes, scores = [], []
    default_branch = 3
    pair_per_branch = len(input_data) // default_branch
    # The Python demo ignores the score_sum output
    for i in range(default_branch):
        boxes.append(box_process(input_data[pair_per_branch * i]))
        scores.append(input_data[pair_per_branch * i + 1])

    def sp_flatten(_in):
        ch = _in.shape[1]
        _in = _in.transpose(0, 2, 3, 1)
        return _in.reshape(-1, ch)

    boxes = [sp_flatten(_v) for _v in boxes]
    scores = [sp_flatten(_v) for _v in scores]

    boxes = torch.from_numpy(np.expand_dims(np.concatenate(boxes), axis=0))
    scores = torch.from_numpy(np.expand_dims(np.concatenate(scores), axis=0))

    max_scores = scores.amax(dim=-1)
    max_scores, index = torch.topk(max_scores, max_det, dim=-1)
    index = index.unsqueeze(-1)
    boxes = torch.gather(boxes, dim=1, index=index.repeat(1, 1, boxes.shape[-1]))
    scores = torch.gather(scores, dim=1, index=index.repeat(1, 1, scores.shape[-1]))

    scores, index = torch.topk(scores.flatten(1), max_det, dim=-1)
    labels = index % nc
    index = index // nc
    boxes = boxes.gather(dim=1, index=index.unsqueeze(-1).repeat(1, 1, boxes.shape[-1]))

    preds = torch.cat([boxes, scores.unsqueeze(-1), labels.unsqueeze(-1)], dim=-1)
    mask = preds[..., 4] > OBJ_THRESH
    preds = [p[mask[idx]] for idx, p in enumerate(preds)][0]

    boxes = preds[..., :4].numpy()
    scores = preds[..., 4].numpy()
    classes = preds[..., 5].numpy().astype(np.int64)
    return boxes, classes, scores
def draw(image, boxes, scores, classes):
    for box, score, cl in zip(boxes, scores, classes):
        top, left, right, bottom = [int(_b) for _b in box]
        print("%s @ (%d %d %d %d) %.3f" % (CLASSES[cl], top, left, right, bottom, score))
        cv2.rectangle(image, (top, left), (right, bottom), (255, 0, 0), 2)
        cv2.putText(image, '{0} {1:.2f}'.format(CLASSES[cl], score),
                    (top, left - 6), cv2.FONT_HERSHEY_SIMPLEX, 0.6, (0, 0, 255), 2)
def setup_model(args):
    model_path = args.model_path
    if model_path.endswith('.pt') or model_path.endswith('.torchscript'):
        platform = 'pytorch'
        from py_utils.pytorch_executor import Torch_model_container
        model = Torch_model_container(args.model_path)
    elif model_path.endswith('.rknn'):
        platform = 'rknn'
        from py_utils.rknn_executor import RKNN_model_container
        model = RKNN_model_container(args.model_path)
    elif model_path.endswith('onnx'):
        platform = 'onnx'
        from py_utils.onnx_executor import ONNX_model_container
        model = ONNX_model_container(args.model_path)
    else:
        assert False, "{} is not rknn/pytorch/onnx model".format(model_path)
    print('Model-{} is {} model, starting val'.format(model_path, platform))
    return model, platform


def img_check(path):
    img_type = ['.jpg', '.jpeg', '.png', '.bmp']
    for _type in img_type:
        if path.endswith(_type) or path.endswith(_type.upper()):
            return True
    return False
if __name__ == '__main__':
    parser = argparse.ArgumentParser(description='Process some integers.')
    # basic params
    parser.add_argument('--model_path', type=str, required=True, help='model path, could be .pt or .rknn file')
    parser.add_argument('--target', type=str, default='rk3566', help='target RKNPU platform')
    parser.add_argument('--device_id', type=str, default=None, help='device id')

    parser.add_argument('--img_show', action='store_true', default=False, help='draw the result and show')
    parser.add_argument('--img_save', action='store_true', default=False, help='save the result')

    # data params
    parser.add_argument('--anno_json', type=str, default='../../../datasets/COCO/annotations/instances_val2017.json', help='coco annotation path')
    # coco val folder: '../../../datasets/COCO//val2017'
    parser.add_argument('--img_folder', type=str, default='../model', help='img folder path')
    parser.add_argument('--coco_map_test', action='store_true', help='enable coco map test')

    args = parser.parse_args()

    # init model
    model, platform = setup_model(args)

    file_list = sorted(os.listdir(args.img_folder))
    img_list = []
    for path in file_list:
        if img_check(path):
            img_list.append(path)
    co_helper = COCO_test_helper(enable_letter_box=True)

    # run test
    for i in range(len(img_list)):
        print('infer {}/{}'.format(i + 1, len(img_list)), end='\r')

        img_name = img_list[i]
        img_path = os.path.join(args.img_folder, img_name)
        if not os.path.exists(img_path):
            print("{} is not found".format(img_name))
            continue

        img_src = cv2.imread(img_path)
        if img_src is None:
            continue

        # Because rga inits with (0,0,0), we use pad_color (0,0,0) instead of (114, 114, 114)
        pad_color = (0, 0, 0)
        img = co_helper.letter_box(im=img_src.copy(), new_shape=(IMG_SIZE[1], IMG_SIZE[0]), pad_color=(0, 0, 0))
        img = cv2.cvtColor(img, cv2.COLOR_BGR2RGB)

        input_data = np.expand_dims(img, axis=0)

        outputs = model.run([input_data])
        boxes, classes, scores = post_process_yolov10(outputs)

        if args.img_show or args.img_save:
            print('\n\nIMG: {}'.format(img_name))
            img_p = img_src.copy()
            if boxes is not None:
                draw(img_p, co_helper.get_real_box(boxes), scores, classes)

            if args.img_save:
                if not os.path.exists('./result'):
                    os.mkdir('./result')
                result_path = os.path.join('./result', img_name)
                cv2.imwrite(result_path, img_p)
                print('Detection result save to {}'.format(result_path))

            if args.img_show:
                cv2.imshow("full post process result", img_p)
                cv2.waitKeyEx(0)

        # record maps
        if args.coco_map_test is True:
            if boxes is not None:
                for i in range(boxes.shape[0]):
                    co_helper.add_single_record(image_id=int(img_name.split('.')[0]),
                                                category_id=coco_id_list[int(classes[i])],
                                                bbox=boxes[i],
                                                score=round(scores[i], 5).item())

    # calculate maps
    if args.coco_map_test is True:
        pred_json = args.model_path.split('.')[-2] + '_{}'.format(platform) + '.json'
        pred_json = pred_json.split('/')[-1]
        pred_json = os.path.join('./', pred_json)
        co_helper.export_to_json(pred_json)

        from py_utils.coco_utils import coco_eval_with_json
        coco_eval_with_json(args.anno_json, pred_json)

    # release
    model.release()
2. rknn_executor.py

from rknnlite.api import RKNNLite


class RKNN_model_container():
    def __init__(self, model_path):
        rknn = RKNNLite()

        # Directly load the RKNN model
        rknn.load_rknn(model_path)

        print('--> Init runtime environment')
        rknn.init_runtime()
        print('done')

        self.rknn = rknn

    # def __del__(self):
    #     self.release()

    def run(self, inputs):
        if self.rknn is None:
            print("ERROR: rknn has been released")
            return []

        if not isinstance(inputs, (list, tuple)):
            inputs = [inputs]

        result = self.rknn.inference(inputs=inputs)
        return result

    def release(self):
        self.rknn.release()
        self.rknn = None
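For reference, the PC-side run goes through the zoo's py_utils/rknn_executor.py, which uses rknn.api.RKNN with init_runtime(target=..., device_id=...), while this board-side container uses RKNNLite with a bare init_runtime(). A minimal sketch of a more explicit board-side init, assuming a recent rknn-toolkit-lite2 (the core_mask constants exist on RK3588 builds of the library; check dir(RKNNLite) on your version):

from rknnlite.api import RKNNLite

rknn = RKNNLite()
ret = rknn.load_rknn('nosigmoid.rknn')
assert ret == 0, 'load_rknn failed'
# Optionally pin an NPU core on RK3588; NPU_CORE_AUTO is the default behavior.
ret = rknn.init_runtime(core_mask=RKNNLite.NPU_CORE_AUTO)
assert ret == 0, 'init_runtime failed'

Checking the return codes of load_rknn()/init_runtime() rules out a silently failed init; it does not by itself explain an accuracy drop, but it is cheap to verify.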