| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212 |
- """
- 通用推理后端
- 为 UltralyticsTracker 提供 RKNN / ONNX 模型的统一检测接口,
- 与安全检测(安全帽/反光衣)解耦。
- """
- import os
- import cv2
- import numpy as np
- from typing import List, Tuple, Dict, Any
- from dataclasses import dataclass
- @dataclass
- class Detection:
- """检测结果 (用于 RKNN/ONNX 模型)"""
- class_id: int
- class_name: str
- confidence: float
- bbox: Tuple[int, int, int, int]
- def nms(dets, iou_threshold=0.45):
- """非极大值抑制"""
- if len(dets) == 0:
- return []
- boxes = np.array([[d.bbox[0], d.bbox[1], d.bbox[2], d.bbox[3], d.confidence] for d in dets])
- x1 = boxes[:, 0]
- y1 = boxes[:, 1]
- x2 = boxes[:, 2]
- y2 = boxes[:, 3]
- scores = boxes[:, 4]
- areas = (x2 - x1 + 1) * (y2 - y1 + 1)
- order = scores.argsort()[::-1]
- keep = []
- while order.size > 0:
- i = order[0]
- keep.append(i)
- xx1 = np.maximum(x1[i], x1[order[1:]])
- yy1 = np.maximum(y1[i], y1[order[1:]])
- xx2 = np.minimum(x2[i], x2[order[1:]])
- yy2 = np.minimum(y2[i], y2[order[1:]])
- w = np.maximum(0.0, xx2 - xx1 + 1)
- h = np.maximum(0.0, yy2 - yy1 + 1)
- inter = w * h
- ovr = inter / (areas[i] + areas[order[1:]] - inter)
- inds = np.where(ovr <= iou_threshold)[0]
- order = order[inds + 1]
- return [dets[i] for i in keep]
- class BaseDetector:
- """检测器基类 (用于 RKNN/ONNX 模型)"""
- # 默认 COCO 类别映射;子类可覆盖
- LABEL_MAP = {0: 'person'}
- def __init__(self, label_map: Dict[int, str] = None):
- self.input_size = (640, 640)
- self.num_classes = len(label_map) if label_map else max(self.LABEL_MAP.keys()) + 1
- if label_map:
- self.LABEL_MAP = label_map
- def letterbox(self, image):
- """Letterbox 预处理,保持宽高比"""
- h0, w0 = image.shape[:2]
- ih, iw = self.input_size
- scale = min(iw / w0, ih / h0)
- new_w, new_h = int(w0 * scale), int(h0 * scale)
- pad_w = (iw - new_w) // 2
- pad_h = (ih - new_h) // 2
- resized = cv2.resize(image, (new_w, new_h))
- canvas = np.full((ih, iw, 3), 114, dtype=np.uint8)
- canvas[pad_h:pad_h+new_h, pad_w:pad_w+new_w] = resized
- return canvas, scale, pad_w, pad_h, h0, w0
- def postprocess(self, outputs, scale, pad_w, pad_h, h0, w0, conf_threshold_map):
- """后处理"""
- dets = []
- if not outputs:
- return dets
- output = outputs[0]
- if len(output.shape) == 3:
- output = output[0]
- num_boxes = output.shape[1]
- for i in range(num_boxes):
- x_center = float(output[0, i])
- y_center = float(output[1, i])
- width = float(output[2, i])
- height = float(output[3, i])
- class_probs = output[4:4+self.num_classes, i]
- best_class = int(np.argmax(class_probs))
- confidence = float(class_probs[best_class])
- if best_class not in self.LABEL_MAP:
- continue
- conf_threshold = conf_threshold_map.get(best_class, 0.5)
- if confidence < conf_threshold:
- continue
- # 移除 padding 并缩放到原始图像尺寸
- x1 = int(((x_center - width / 2) - pad_w) / scale)
- y1 = int(((y_center - height / 2) - pad_h) / scale)
- x2 = int(((x_center + width / 2) - pad_w) / scale)
- y2 = int(((y_center + height / 2) - pad_h) / scale)
- x1 = max(0, min(w0, x1))
- y1 = max(0, min(h0, y1))
- x2 = max(0, min(w0, x2))
- y2 = max(0, min(h0, y2))
- det = Detection(
- class_id=best_class,
- class_name=self.LABEL_MAP[best_class],
- confidence=confidence,
- bbox=(x1, y1, x2, y2)
- )
- dets.append(det)
- dets = nms(dets, iou_threshold=0.45)
- return dets
- def detect(self, image, conf_threshold_map):
- raise NotImplementedError
- def release(self):
- pass
- class RKNNDetector(BaseDetector):
- """RKNN 检测器 - 使用 NHWC 输入格式 (1, H, W, C)"""
- def __init__(self, model_path: str, label_map: Dict[int, str] = None):
- super().__init__(label_map=label_map)
- self.model_path = model_path
- self.rknn = None
- try:
- from rknnlite.api import RKNNLite
- self.rknn = RKNNLite()
- except ImportError:
- raise ImportError("未安装 rknnlite,请运行: pip install rknnlite2 或参考 testrk3588/setup_rknn.sh")
- ret = self.rknn.load_rknn(model_path)
- if ret != 0:
- raise RuntimeError(f"加载 RKNN 模型失败: {model_path}")
- ret = self.rknn.init_runtime(core_mask=RKNNLite.NPU_CORE_0_1_2)
- if ret != 0:
- raise RuntimeError("初始化 RKNN 运行时失败")
- print(f"RKNN 模型加载成功: {model_path}")
- def detect(self, image, conf_threshold_map):
- canvas, scale, pad_w, pad_h, h0, w0 = self.letterbox(image)
- # RKNN 期望 NHWC (1, H, W, C), RGB, 归一化 0-1
- img = canvas[..., ::-1].astype(np.float32) / 255.0
- blob = img[None, ...] # (1, 640, 640, 3)
- outs = self.rknn.inference(inputs=[blob])
- return self.postprocess(outs, scale, pad_w, pad_h, h0, w0, conf_threshold_map)
- def release(self):
- if self.rknn:
- self.rknn.release()
- self.rknn = None
- class ONNXDetector(BaseDetector):
- """ONNX 检测器 - 使用 NCHW 输入格式 (1, C, H, W)"""
- def __init__(self, model_path: str, label_map: Dict[int, str] = None):
- super().__init__(label_map=label_map)
- self.model_path = model_path
- try:
- import onnxruntime as ort
- self.session = ort.InferenceSession(model_path)
- self.input_name = self.session.get_inputs()[0].name
- self.output_name = self.session.get_outputs()[0].name
- print(f"ONNX 模型加载成功: {model_path}")
- except ImportError:
- raise ImportError("未安装 onnxruntime,请运行: pip install onnxruntime")
- except Exception as e:
- raise RuntimeError(f"加载 ONNX 模型失败: {e}")
- def detect(self, image, conf_threshold_map):
- canvas, scale, pad_w, pad_h, h0, w0 = self.letterbox(image)
- # ONNX 期望 NCHW (1, C, H, W), RGB, 归一化 0-1
- img = canvas[..., ::-1].astype(np.float32) / 255.0
- img = img.transpose(2, 0, 1)
- blob = img[None, ...] # (1, 3, 640, 640)
- outs = self.session.run([self.output_name], {self.input_name: blob})
- return self.postprocess(outs, scale, pad_w, pad_h, h0, w0, conf_threshold_map)
- def release(self):
- self.session = None
|