wenhongquan
/
dsh


			
				
					
						
						
							123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145
							#!/usr/bin/env python3
import cv2
import numpy as np
from rknnlite.api import RKNNLite
from dataclasses import dataclass
from typing import List, Tuple, Optional

@dataclass
class Detection:
    class_id: int
    class_name: str
    confidence: float
    bbox: Tuple[int, int, int, int]

LABEL_MAP = {0: '安全帽', 4: '安全衣', 3: '人'}
INPUT_SIZE = (640, 640)

def nms(dets, iou_threshold=0.45):
    if len(dets) == 0:
        return []
    
    boxes = np.array([[d.bbox[0], d.bbox[1], d.bbox[2], d.bbox[3], d.confidence] for d in dets])
    x1 = boxes[:, 0]
    y1 = boxes[:, 1]
    x2 = boxes[:, 2]
    y2 = boxes[:, 3]
    scores = boxes[:, 4]
    
    areas = (x2 - x1 + 1) * (y2 - y1 + 1)
    order = scores.argsort()[::-1]
    
    keep = []
    while order.size > 0:
        i = order[0]
        keep.append(i)
        
        xx1 = np.maximum(x1[i], x1[order[1:]])
        yy1 = np.maximum(y1[i], y1[order[1:]])
        xx2 = np.minimum(x2[i], x2[order[1:]])
        yy2 = np.minimum(y2[i], y2[order[1:]])
        
        w = np.maximum(0.0, xx2 - xx1 + 1)
        h = np.maximum(0.0, yy2 - yy1 + 1)
        inter = w * h
        ovr = inter / (areas[i] + areas[order[1:]] - inter)
        
        inds = np.where(ovr <= iou_threshold)[0]
        order = order[inds + 1]
    
    return [dets[i] for i in keep]

def letterbox(image, input_size=(640, 640)):
    h0, w0 = image.shape[:2]
    ih, iw = input_size
    scale = min(iw / w0, ih / h0)
    new_w, new_h = int(w0 * scale), int(h0 * scale)
    pad_w = (iw - new_w) // 2
    pad_h = (ih - new_h) // 2
    resized = cv2.resize(image, (new_w, new_h))
    canvas = np.full((ih, iw, 3), 114, dtype=np.uint8)
    canvas[pad_h:pad_h+new_h, pad_w:pad_w+new_w] = resized
    return canvas, scale, pad_w, pad_h, h0, w0

def test_model():
    model_path = "yolo11m_safety.rknn"
    conf_threshold_map = {3: 0.8, 0: 0.5, 4: 0.5}
    
    rknn = RKNNLite()
    
    ret = rknn.load_rknn(model_path)
    if ret != 0:
        print("[ERROR] load_rknn failed")
        return
    
    ret = rknn.init_runtime(core_mask=RKNNLite.NPU_CORE_0_1_2)
    if ret != 0:
        print("[ERROR] init_runtime failed")
        return
    
    image = cv2.imread("b.jpg")
    if image is None:
        print("无法读取测试图片")
        return
    
    canvas, scale, pad_w, pad_h, h0, w0 = letterbox(image)
    
    # RKNN expects NHWC input: (1, H, W, C), RGB, float32 normalized 0-1
    img = canvas[..., ::-1].astype(np.float32) / 255.0
    blob = img[None, ...]  # (1, 640, 640, 3)
    
    outputs = rknn.inference(inputs=[blob])
    
    if outputs:
        output = outputs[0]
        if len(output.shape) == 3:
            output = output[0]
        
        num_classes = 5
        dets = []
        for i in range(output.shape[1]):
            x_center = float(output[0, i])
            y_center = float(output[1, i])
            width = float(output[2, i])
            height = float(output[3, i])
            
            class_probs = output[4:4+num_classes, i]
            best_class = int(np.argmax(class_probs))
            confidence = float(class_probs[best_class])
            
            if best_class not in LABEL_MAP:
                continue
            
            conf_threshold = conf_threshold_map.get(best_class, 0.5)
            if confidence < conf_threshold:
                continue
            
            # Remove padding and scale to original image
            x1 = int(((x_center - width / 2) - pad_w) / scale)
            y1 = int(((y_center - height / 2) - pad_h) / scale)
            x2 = int(((x_center + width / 2) - pad_w) / scale)
            y2 = int(((y_center + height / 2) - pad_h) / scale)
            
            x1 = max(0, min(w0, x1))
            y1 = max(0, min(h0, y1))
            x2 = max(0, min(w0, x2))
            y2 = max(0, min(h0, y2))
            
            det = Detection(
                class_id=best_class,
                class_name=LABEL_MAP[best_class],
                confidence=confidence,
                bbox=(x1, y1, x2, y2)
            )
            dets.append(det)
        
        dets = nms(dets, iou_threshold=0.45)
        
        print(f"检测结果: {len(dets)} 个目标")
        for d in dets:
            print(f"  {d.class_name}: conf={d.confidence:.3f}, box={d.bbox}")
    
    rknn.release()

if __name__ == "__main__":
    test_model()