更新charge振捣判断

2026-03-10 16:51:57 +08:00
parent 235101b4d8
commit 5d79686ba0
15 changed files with 268873 additions and 0 deletions
--- a/1.txt
+++ b/1.txt
@ -0,0 +1,25 @@
+(zjsh) teamhd@teamhd:~/Downloads/rkmpp/build/linux/aarch64$ sudo apt install gcc-aarch64-linux-gnu
+Reading package lists... Done
+Building dependency tree... Done
+Reading state information... Done
+Note, selecting 'gcc' instead of 'gcc-aarch64-linux-gnu'
+Some packages could not be installed. This may mean that you have
+requested an impossible situation or if you are using the unstable
+distribution that some required packages have not yet been created
+or been moved out of Incoming.
+The following information may help to resolve the situation:
+
+The following packages have unmet dependencies:
+ gcc-11 : Depends: cpp-11 (= 11.4.0-1ubuntu1~22.04.3) but 11.4.0-1ubuntu1~22.04 is to be installed
+          Depends: gcc-11-base (= 11.4.0-1ubuntu1~22.04.3) but 11.4.0-1ubuntu1~22.04 is to be installed
+ libasan6 : Depends: gcc-11-base (= 11.4.0-1ubuntu1~22.04.3) but 11.4.0-1ubuntu1~22.04 is to be installed
+ libcc1-0 : Depends: gcc-12-base (= 12.3.0-1ubuntu1~22.04.3) but 12.3.0-1ubuntu1~22.04 is to be installed
+ libgcc-11-dev : Depends: gcc-11-base (= 11.4.0-1ubuntu1~22.04.3) but 11.4.0-1ubuntu1~22.04 is to be installed
+ libhwasan0 : Depends: gcc-12-base (= 12.3.0-1ubuntu1~22.04.3) but 12.3.0-1ubuntu1~22.04 is to be installed
+ libitm1 : Depends: gcc-12-base (= 12.3.0-1ubuntu1~22.04.3) but 12.3.0-1ubuntu1~22.04 is to be installed
+ liblsan0 : Depends: gcc-12-base (= 12.3.0-1ubuntu1~22.04.3) but 12.3.0-1ubuntu1~22.04 is to be installed
+ libtsan0 : Depends: gcc-11-base (= 11.4.0-1ubuntu1~22.04.3) but 11.4.0-1ubuntu1~22.04 is to be installed
+ libubsan1 : Depends: gcc-12-base (= 12.3.0-1ubuntu1~22.04.3) but 12.3.0-1ubuntu1~22.04 is to be installed
+E: Unable to correct problems, you have held broken packages.
+(zjsh) teamhd@teamhd:~/Downloads/rkmpp/build/linux/aarch64$ 
+
--- a/charge_3cls/charge_cls.rknn
+++ b/charge_3cls/charge_cls.rknn
--- a/charge_3cls/charge_cls_rknn.py
+++ b/charge_3cls/charge_cls_rknn.py
@ -0,0 +1,198 @@
+import os
+import cv2
+import numpy as np
+from rknnlite.api import RKNNLite
+from collections import deque
+
+class StableClassJudge:
+    """
+    连续三帧稳定判决器：
+    - class0 / class1 连续 3 帧 -> 输出
+    - class2 -> 清空计数，重新统计
+    """
+
+    def __init__(self, stable_frames=3, ignore_class=2):
+        self.stable_frames = stable_frames
+        self.ignore_class = ignore_class
+        self.buffer = deque(maxlen=stable_frames)
+
+    def reset(self):
+        self.buffer.clear()
+
+    def update(self, class_id):
+        """
+        输入单帧分类结果
+        返回：
+          - None：尚未稳定
+          - class_id：稳定输出结果
+        """
+
+        # 遇到 class2，直接清空重新计数
+        if class_id == self.ignore_class:
+            self.reset()
+            return None
+
+        self.buffer.append(class_id)
+
+        # 缓冲未满
+        if len(self.buffer) < self.stable_frames:
+            return None
+
+        # 三帧完全一致
+        if len(set(self.buffer)) == 1:
+            stable_class = self.buffer[0]
+            self.reset()   # 输出一次后重新计数（防止重复触发）
+            return stable_class
+
+        return None
+
+# ---------------------------
+# 三分类映射
+# ---------------------------
+CLASS_NAMES = {
+    0: "插好",
+    1: "未插好",
+    2: "有遮挡"
+}
+
+# ---------------------------
+# RKNN 全局实例（只加载一次）
+# ---------------------------
+_global_rknn = None
+
+
+def init_rknn_model(model_path):
+    global _global_rknn
+    if _global_rknn is not None:
+        return _global_rknn
+
+    rknn = RKNNLite(verbose=False)
+    ret = rknn.load_rknn(model_path)
+    if ret != 0:
+        raise RuntimeError(f"Load RKNN failed: {ret}")
+
+    ret = rknn.init_runtime(core_mask=RKNNLite.NPU_CORE_0)
+    if ret != 0:
+        raise RuntimeError(f"Init runtime failed: {ret}")
+
+    _global_rknn = rknn
+    print(f"[INFO] RKNN 模型加载成功：{model_path}")
+    return rknn
+
+
+# ---------------------------
+# 预处理
+# ---------------------------
+def letterbox(image, new_size=640, color=(114, 114, 114)):
+    h, w = image.shape[:2]
+    scale = min(new_size / h, new_size / w)
+    nh, nw = int(h * scale), int(w * scale)
+    resized = cv2.resize(image, (nw, nh))
+    new_img = np.full((new_size, new_size, 3), color, dtype=np.uint8)
+    top = (new_size - nh) // 2
+    left = (new_size - nw) // 2
+    new_img[top:top + nh, left:left + nw] = resized
+    return new_img
+
+
+def resize_stretch(image, size=640):
+    return cv2.resize(image, (size, size))
+
+
+def preprocess_image_for_rknn(
+        img,
+        size=640,
+        resize_mode="stretch",
+        to_rgb=True,
+        normalize=False,
+        layout="NHWC"
+):
+    if resize_mode == "letterbox":
+        img_box = letterbox(img, new_size=size)
+    else:
+        img_box = resize_stretch(img, size=size)
+
+    if to_rgb:
+        img_box = cv2.cvtColor(img_box, cv2.COLOR_BGR2RGB)
+
+    img_f = img_box.astype(np.float32)
+
+    if normalize:
+        img_f /= 255.0
+
+    if layout == "NHWC":
+        out = np.expand_dims(img_f, axis=0)
+    else:
+        out = np.expand_dims(np.transpose(img_f, (2, 0, 1)), axis=0)
+
+    return np.ascontiguousarray(out)
+
+
+# ---------------------------
+# 单次 RKNN 推理（三分类）
+# ---------------------------
+def rknn_classify_preprocessed(input_tensor, model_path):
+    rknn = init_rknn_model(model_path)
+
+    outs = rknn.inference([input_tensor])
+    logits = outs[0].reshape(-1).astype(np.float32)  # shape = (3,)
+
+    # softmax
+    exp = np.exp(logits - np.max(logits))
+    probs = exp / np.sum(exp)
+
+    class_id = int(np.argmax(probs))
+    return class_id, probs
+
+
+# ---------------------------
+# 单张图片推理（三分类）- 已移除 ROI 逻辑
+# ---------------------------
+def classify_single_image(
+        frame,
+        model_path,
+        size=640,
+        resize_mode="stretch",
+        to_rgb=True,
+        normalize=False,
+        layout="NHWC"
+):
+    if frame is None:
+        raise FileNotFoundError("❌ 输入帧为空")
+
+    # 直接使用整图，不再裁剪
+    input_tensor = preprocess_image_for_rknn(
+        frame,
+        size=size,
+        resize_mode=resize_mode,
+        to_rgb=to_rgb,
+        normalize=normalize,
+        layout=layout
+    )
+
+    class_id, probs = rknn_classify_preprocessed(input_tensor, model_path)
+    class_name = CLASS_NAMES.get(class_id, f"未知类别 ({class_id})")
+
+    return {
+        "class_id": class_id,
+        "class": class_name,
+        "score": round(float(probs[class_id]), 4),
+        "raw": probs.tolist()
+    }
+
+
+# ---------------------------
+# 示例调用
+# ---------------------------
+if __name__ == "__main__":
+    model_path = "charge_cls.rknn"
+    # roi_file 已移除
+    image_path = "class2.png"
+
+    frame = cv2.imread(image_path)
+    if frame is None:
+        raise FileNotFoundError(f"❌ 无法读取图片：{image_path}")
+
+    # 调用
+    result = classify_single_image(frame, model_path)
+    print("[RESULT]", result)
--- a/charge_3cls/class1.png
+++ b/charge_3cls/class1.png
--- a/charge_3cls/class2.png
+++ b/charge_3cls/class2.png
--- a/image_01.py
+++ b/image_01.py
@ -0,0 +1,170 @@
+import cv2
+import time
+import os
+import numpy as np
+from PIL import Image
+from skimage.metrics import structural_similarity as ssim
+
+# ================== Configuration ==================
+# NOTE(review): the camera username and password are embedded in this URL;
+# consider loading them from the environment instead of source control.
+RTSP_URL = "rtsp://admin:XJ123456@192.168.10.50:554/streaming/channels/101"
+
+SAVE_INTERVAL = 10     # process one frame out of every SAVE_INTERVAL frames
+DISPLAY_STREAM = False  # whether to show the stream in a window
+
+# --- Gray-frame filter ---
+GRAY_LOWER = 70
+GRAY_UPPER = 230
+GRAY_RATIO_THRESHOLD = 0.7  # a frame counts as gray when more than this fraction of pixels is in range
+
+# --- SSIM de-duplication ---
+SSIM_THRESHOLD = 0.9        # frames scoring above this against the last kept frame are duplicates
+
+# --- Output directory ---
+OUTPUT_DIR = "camera02_save"
+os.makedirs(OUTPUT_DIR, exist_ok=True)
+
+# ================== 辅助函数 ==================
+
+def is_large_gray(image):
+    """
+    检测图像是否为大面积灰图
+    image: PIL Image 对象 (RGB)
+    """
+    arr = np.array(image)
+    # 检查 R, G, B 三个通道是否都在灰色范围内
+    gray_mask = (
+        (arr[:, :, 0] >= GRAY_LOWER) & (arr[:, :, 0] <= GRAY_UPPER) &
+        (arr[:, :, 1] >= GRAY_LOWER) & (arr[:, :, 1] <= GRAY_UPPER) &
+        (arr[:, :, 2] >= GRAY_LOWER) & (arr[:, :, 2] <= GRAY_UPPER)
+    )
+    # 计算灰色像素占比
+    return np.mean(gray_mask) > GRAY_RATIO_THRESHOLD
+
+def open_camera(url):
+    cap = cv2.VideoCapture(url)
+    if not cap.isOpened():
+        return None
+    cap.set(cv2.CAP_PROP_BUFFERSIZE, 1)
+    cap.set(cv2.CAP_PROP_OPEN_TIMEOUT_MSEC, 5000)
+    cap.set(cv2.CAP_PROP_READ_TIMEOUT_MSEC, 5000)
+    return cap
+
+def get_valid_frame(cap):
+    """安全读取一帧"""
+    if cap is None or not cap.isOpened():
+        return None, False
+    
+    ret, frame = cap.read()
+    if not ret or frame is None or frame.size == 0:
+        return None, False
+    return frame, True
+
+# ================== 主程序 ==================
+
+# Capture loop: sample every SAVE_INTERVAL-th frame, drop gray frames and
+# near-duplicates of the last kept frame, and write the rest to OUTPUT_DIR.
+print(f"✅ 正在连接摄像头: {RTSP_URL} ...")
+cap = open_camera(RTSP_URL)
+
+if cap is None:
+    print(f"❌ 连接失败！请检查 IP、账号密码或网络。")
+    exit(1)
+
+print("📡 摄像头已连接，开始采集...")
+print(f"   - 保存目录: {os.path.abspath(OUTPUT_DIR)}")
+print(f"   - 灰度阈值: [{GRAY_LOWER}, {GRAY_UPPER}], 占比 > {GRAY_RATIO_THRESHOLD}")
+print(f"   - SSIM 去重阈值: > {SSIM_THRESHOLD}")
+print("   - 按 Ctrl+C 停止\n")
+
+frame_count = 0
+saved_count = 0
+last_gray_frame = None  # grayscale copy of the last kept frame, used as the SSIM reference
+
+try:
+    while True:
+        frame, ret = get_valid_frame(cap)
+
+        if not ret:
+            # Read failed: wait, drop the capture and try to reopen once.
+            print("⚠️ 读取帧失败，尝试重连...")
+            time.sleep(2)
+            cap.release()
+            cap = open_camera(RTSP_URL)
+            if cap is None:
+                print("❌ 重连失败，退出程序。")
+                break
+            last_gray_frame = None  # reset the comparison frame after reconnecting
+            continue
+
+        frame_count += 1
+
+        # Interval sampling: frames off the interval are skipped (optionally displayed).
+        if frame_count % SAVE_INTERVAL != 0:
+            if DISPLAY_STREAM:
+                cv2.imshow("Camera Stream", frame)
+                if cv2.waitKey(1) & 0xFF == ord('q'):
+                    break
+            continue
+
+        # --- Step 1: gray-frame detection ---
+        try:
+            # Convert to RGB for PIL.
+            img_rgb = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)
+            pil_img = Image.fromarray(img_rgb)
+
+            if is_large_gray(pil_img):
+                print(f"⏭️ 跳过：检测到灰图 (帧 {frame_count})")
+                continue
+        except Exception as e:
+            print(f"⚠️ 灰图检测异常: {e}")
+            continue
+
+        # --- Step 2: SSIM de-duplication ---
+        try:
+            gray_curr = cv2.cvtColor(frame, cv2.COLOR_BGR2GRAY)
+
+            if last_gray_frame is not None:
+                # Resize the reference so both images have the same shape
+                # (guards against the stream resolution changing).
+                if last_gray_frame.shape != gray_curr.shape:
+                    last_gray_frame = cv2.resize(last_gray_frame, (gray_curr.shape[1], gray_curr.shape[0]))
+
+                sim_score = ssim(last_gray_frame, gray_curr)
+
+                if sim_score > SSIM_THRESHOLD:
+                    print(f"⏭️ 跳过：画面重复 (SSIM={sim_score:.3f}, 帧 {frame_count})")
+                    continue
+
+            # Only reached for frames that are kept, so the reference is
+            # always the last kept frame.
+            last_gray_frame = gray_curr.copy()
+
+        except Exception as e:
+            print(f"⚠️ SSIM 计算异常: {e}")
+            # On a computation error the frame is skipped rather than saved.
+            continue
+
+        # --- Step 3: save the image ---
+        ts = time.strftime("%Y%m%d_%H%M%S")
+        ms = int((time.time() % 1) * 1000)
+        filename = f"img_{ts}_{ms:03d}.png"
+        save_path = os.path.join(OUTPUT_DIR, filename)
+
+        # Rotate/flip here if needed, e.g. cv2.flip(frame, -1).
+
+        cv2.imwrite(save_path, frame)
+        saved_count += 1
+        print(f"✅ [{saved_count}] 已保存有效图片: {filename}")
+
+        if DISPLAY_STREAM:
+            cv2.putText(frame, f"Saved: {filename}", (10, 30), 
+                        cv2.FONT_HERSHEY_SIMPLEX, 0.6, (0, 255, 0), 2)
+            cv2.imshow("Camera Stream", frame)
+            if cv2.waitKey(1) & 0xFF == ord('q'):
+                break
+
+except KeyboardInterrupt:
+    print("\n🛑 用户手动停止")
+
+finally:
+    # cap is None when a reconnect attempt failed.
+    if cap:
+        cap.release()
+    cv2.destroyAllWindows()
+    print(f"🔚 程序结束。共保存 {saved_count} 张图片。")
--- a/miniforge/Miniforge3-Linux-aarch64.sh
+++ b/miniforge/Miniforge3-Linux-aarch64.sh
--- a/rknn_save/yiliao_cls_60_0123.rknn
+++ b/rknn_save/yiliao_cls_60_0123.rknn
--- a/yemian_seg_diff_61/main.py
+++ b/yemian_seg_diff_61/main.py
@ -75,10 +75,12 @@ def largest_intersect_cc(mask_bin, bbox):
 # RANSAC 直线拟合（核心新增）
 # ---------------------------
 def fit_line_ransac(pts, max_dist=2.5, min_inliers_ratio=0.6, iters=100):
+
    """
    拟合 x = m*y + b
    pts: Nx2 -> [x,y]
    """
+    np.random.seed(42)
    if len(pts) < 10:
        return None

--- a/zdb_cls/main.py
+++ b/zdb_cls/main.py
@ -0,0 +1,117 @@
+import os
+import cv2
+from rknnlite.api import RKNNLite
+
+# classify_single_image, StableClassJudge and CLASS_NAMES are defined in zdb_cls_rknn
+from zdb_cls_rknn import classify_single_image, StableClassJudge, CLASS_NAMES
+
+
+def run_stable_classification_loop(
+    model_path,
+    roi_file,
+    image_source,
+    stable_frames=3,
+    display_scale=0.5,      # 显示缩放比例（0.5 = 显示为原来 50%）
+    show_window=False        # 是否显示窗口
+):
+    """
+    image_source: cv2.VideoCapture 对象
+    """
+
+    judge = StableClassJudge(
+        stable_frames=stable_frames,
+        ignore_class=2  # 忽略“有遮挡”类别参与稳定判断
+    )
+
+    cap = image_source
+    if not hasattr(cap, "read"):
+        raise TypeError("image_source 必须是 cv2.VideoCapture 实例")
+
+    # 可选：创建可缩放窗口
+    if show_window:
+        cv2.namedWindow("RTSP Stream - Press 'q' to quit", cv2.WINDOW_NORMAL)
+
+    while True:
+        ret, frame = cap.read()
+        if not ret:
+            print("无法读取视频帧（可能是流断开或结束）")
+            break
+
+        # ---------------------------
+        # 单帧推理
+        # ---------------------------
+        result = classify_single_image(frame, model_path, roi_file)
+
+        class_id = result["class_id"]
+        class_name = result["class"]
+        score = result["score"]
+
+        print(f"[FRAME] {class_name} | conf={score:.3f}")
+
+        # ---------------------------
+        # 稳定判断
+        # ---------------------------
+        stable_class_id = judge.update(class_id)
+
+        if stable_class_id is not None:
+            print(f"\n稳定输出: {CLASS_NAMES[stable_class_id]}\n")
+
+        # ---------------------------
+        # 显示画面（缩小窗口）
+        # ---------------------------
+        if show_window:
+            h, w = frame.shape[:2]
+            display_frame = cv2.resize(
+                frame,
+                (int(w * display_scale), int(h * display_scale)),
+                interpolation=cv2.INTER_AREA
+            )
+
+            cv2.imshow("RTSP Stream - Press 'q' to quit", display_frame)
+
+            if cv2.waitKey(1) & 0xFF == ord('q'):
+                break
+
+    cap.release()
+    cv2.destroyAllWindows()
+
+
+if __name__ == "__main__":
+    # ---------------------------
+    # 配置参数
+    # ---------------------------
+    MODEL_PATH = "zdb_cls.rknn"
+    ROI_FILE = "./roi_coordinates/zdb_roi.txt"
+    RTSP_URL = "rtsp://admin:XJ123456@192.168.250.60:554/streaming/channels/101"
+
+    STABLE_FRAMES = 3
+    DISPLAY_SCALE = 0.5     # 显示窗口缩放比例
+    SHOW_WINDOW = False      # 部署时改成 False，测试的时候打开
+
+    # ---------------------------
+    # 打开 RTSP 视频流
+    # ---------------------------
+    print(f"正在连接 RTSP 流: {RTSP_URL}")
+    cap = cv2.VideoCapture(RTSP_URL)
+
+    # 降低 RTSP 延迟（部分摄像头支持）
+    cap.set(cv2.CAP_PROP_BUFFERSIZE, 1)
+
+    if not cap.isOpened():
+        print("无法打开 RTSP 流，请检查网络、账号密码或 URL")
+        exit(1)
+
+    print("RTSP 流连接成功，开始推理...")
+
+    # ---------------------------
+    # 启动稳定分类循环三帧稳定判断
+    # ---------------------------
+    run_stable_classification_loop(
+        model_path=MODEL_PATH,
+        roi_file=ROI_FILE,
+        image_source=cap,
+        stable_frames=STABLE_FRAMES,
+        display_scale=DISPLAY_SCALE,
+        show_window=SHOW_WINDOW
+    )
+
--- a/zdb_cls/roi_coordinates/zdb_roi.txt
+++ b/zdb_cls/roi_coordinates/zdb_roi.txt
@ -0,0 +1 @@
+2,880,385,200
--- a/zdb_cls/test.png
+++ b/zdb_cls/test.png
--- a/zdb_cls/test_imagesave.py
+++ b/zdb_cls/test_imagesave.py
@ -0,0 +1,275 @@
+import os
+import cv2
+import time
+import numpy as np
+from datetime import datetime
+from collections import deque
+from rknnlite.api import RKNNLite
+
+# =====================================================
+# 稳定判决器
+# =====================================================
+class StableClassJudge:
+    """
+    连续 N 帧稳定判决：
+    - class0 / class1 连续 N 帧 -> 输出
+    - class2 -> 清空计数
+    """
+
+    def __init__(self, stable_frames=3, ignore_class=2):
+        self.stable_frames = stable_frames
+        self.ignore_class = ignore_class
+        self.buffer = deque(maxlen=stable_frames)
+
+    def reset(self):
+        self.buffer.clear()
+
+    def update(self, class_id):
+        if class_id == self.ignore_class:
+            self.reset()
+            return None
+
+        self.buffer.append(class_id)
+
+        if len(self.buffer) < self.stable_frames:
+            return None
+
+        if len(set(self.buffer)) == 1:
+            stable = self.buffer[0]
+            self.reset()
+            return stable
+
+        return None
+
+
+# =====================================================
+# 类别定义
+# =====================================================
+CLASS_NAMES = {
+    0: "未插入振捣棒",
+    1: "安全插入振捣棒",
+    2: "有遮挡"
+}
+
+
+# =====================================================
+# RKNN 全局实例
+# =====================================================
+_global_rknn = None
+
+
+def init_rknn_model(model_path):
+    global _global_rknn
+    if _global_rknn is not None:
+        return _global_rknn
+
+    rknn = RKNNLite(verbose=False)
+
+    ret = rknn.load_rknn(model_path)
+    if ret != 0:
+        raise RuntimeError(f"Load RKNN failed: {ret}")
+
+    ret = rknn.init_runtime(core_mask=RKNNLite.NPU_CORE_0)
+    if ret != 0:
+        raise RuntimeError(f"Init runtime failed: {ret}")
+
+    _global_rknn = rknn
+    print(f"[INFO] RKNN 模型加载成功: {model_path}")
+    return rknn
+
+
+# =====================================================
+# 图像预处理
+# =====================================================
+def letterbox(image, new_size=640, color=(114, 114, 114)):
+    h, w = image.shape[:2]
+    scale = min(new_size / h, new_size / w)
+    nh, nw = int(h * scale), int(w * scale)
+
+    resized = cv2.resize(image, (nw, nh))
+    canvas = np.full((new_size, new_size, 3), color, dtype=np.uint8)
+
+    top = (new_size - nh) // 2
+    left = (new_size - nw) // 2
+    canvas[top:top + nh, left:left + nw] = resized
+    return canvas
+
+
+def resize_stretch(image, size=640):
+    return cv2.resize(image, (size, size))
+
+
+def preprocess_image_for_rknn(
+        img,
+        size=640,
+        resize_mode="stretch",
+        to_rgb=True,
+        normalize=False,
+        layout="NHWC"
+):
+    if resize_mode == "letterbox":
+        img = letterbox(img, size)
+    else:
+        img = resize_stretch(img, size)
+
+    if to_rgb:
+        img = cv2.cvtColor(img, cv2.COLOR_BGR2RGB)
+
+    img = img.astype(np.float32)
+
+    if normalize:
+        img /= 255.0
+
+    if layout == "NHWC":
+        img = np.expand_dims(img, axis=0)
+    else:
+        img = np.expand_dims(np.transpose(img, (2, 0, 1)), axis=0)
+
+    return np.ascontiguousarray(img)
+
+
+# =====================================================
+# RKNN 单次推理
+# =====================================================
+def rknn_classify_preprocessed(input_tensor, model_path):
+    rknn = init_rknn_model(model_path)
+    outs = rknn.inference([input_tensor])
+    probs = outs[0].reshape(-1).astype(float)
+    class_id = int(np.argmax(probs))
+    return class_id, probs
+
+
+# =====================================================
+# ROI 处理
+# =====================================================
+def load_single_roi(txt_path):
+    if not os.path.exists(txt_path):
+        raise RuntimeError(f"ROI 文件不存在: {txt_path}")
+
+    with open(txt_path) as f:
+        for line in f:
+            line = line.strip()
+            if not line:
+                continue
+            x, y, w, h = map(int, line.split(","))
+            return (x, y, w, h)
+
+    raise RuntimeError("ROI 文件为空")
+
+
+def crop_and_return_roi(img, roi):
+    x, y, w, h = roi
+    H, W = img.shape[:2]
+
+    if x < 0 or y < 0 or x + w > W or y + h > H:
+        raise RuntimeError(f"ROI 超出图像范围: {roi}")
+
+    return img[y:y + h, x:x + w]
+
+
+# =====================================================
+# 单帧分类
+# =====================================================
+def classify_single_image(frame, model_path, roi_file):
+    roi = load_single_roi(roi_file)
+    roi_img = crop_and_return_roi(frame, roi)
+
+    input_tensor = preprocess_image_for_rknn(
+        roi_img,
+        size=640,
+        resize_mode="stretch",
+        to_rgb=True,
+        normalize=False,
+        layout="NHWC"
+    )
+
+    class_id, probs = rknn_classify_preprocessed(input_tensor, model_path)
+
+    return {
+        "class_id": class_id,
+        "class": CLASS_NAMES[class_id],
+        "score": round(float(probs[class_id]), 4),
+        "raw": probs.tolist()
+    }
+
+
+# =====================================================
+# RTSP 推理 + 保存分类结果
+# =====================================================
+def run_rtsp_classification_and_save(
+        model_path,
+        roi_file,
+        rtsp_url,
+        save_root="clsimg",
+        stable_frames=3,
+        save_mode="all"  # all / stable
+):
+    for cid in CLASS_NAMES.keys():
+        os.makedirs(os.path.join(save_root, f"class{cid}"), exist_ok=True)
+
+    cap = cv2.VideoCapture(rtsp_url)
+    if not cap.isOpened():
+        raise RuntimeError(f"无法打开 RTSP: {rtsp_url}")
+
+    judge = StableClassJudge(stable_frames=stable_frames, ignore_class=2)
+
+    print("[INFO] RTSP 推理开始")
+
+    while True:
+        ret, frame = cap.read()
+        if not ret:
+            print("[WARN] RTSP 读帧失败")
+            time.sleep(0.1)
+            continue
+
+        frame = cv2.flip(frame, -1)
+
+        result = classify_single_image(frame, model_path, roi_file)
+        class_id = result["class_id"]
+        score = result["score"]
+
+        print(f"[FRAME] {result['class']}  conf={score}")
+
+        stable = judge.update(class_id)
+
+        save_flag = False
+        save_class = class_id
+
+        if save_mode == "all":
+            save_flag = True
+        elif save_mode == "stable" and stable is not None:
+            save_flag = True
+            save_class = stable
+
+        if save_flag:
+            ts = datetime.now().strftime("%Y%m%d_%H%M%S_%f")
+            filename = f"{ts}_conf{score:.2f}.jpg"
+            save_dir = os.path.join(save_root, f"class{save_class}")
+            cv2.imwrite(os.path.join(save_dir, filename), frame)
+            print(f"[SAVE] class{save_class}/{filename}")
+
+        if cv2.waitKey(1) & 0xFF == ord('q'):
+            break
+
+    cap.release()
+    cv2.destroyAllWindows()
+
+
+# =====================================================
+# main
+# =====================================================
+if __name__ == "__main__":
+    model_path = "zdb_cls.rknn"
+    roi_file = "./roi_coordinates/zdb_roi.txt"
+
+    rtsp_url = "rtsp://admin:XJ123456@192.168.250.60:554/streaming/channels/101"
+
+    run_rtsp_classification_and_save(
+        model_path=model_path,
+        roi_file=roi_file,
+        rtsp_url=rtsp_url,
+        save_root="clsimg",
+        stable_frames=3,
+        save_mode="all"     # 改成 "stable" 只存稳定结果
+    )
+
--- a/zdb_cls/zdb_cls.rknn
+++ b/zdb_cls/zdb_cls.rknn
--- a/zdb_cls/zdb_cls_rknn.py
+++ b/zdb_cls/zdb_cls_rknn.py
@ -0,0 +1,282 @@
+import os
+import cv2
+import numpy as np
+from rknnlite.api import RKNNLite
+
+from collections import deque
+
+class StableClassJudge:
+    """
+    连续三帧稳定判决器：
+    - class0 / class1 连续 3 帧 -> 输出
+    - class2 -> 清空计数，重新统计
+    """
+
+    def __init__(self, stable_frames=3, ignore_class=2):
+        self.stable_frames = stable_frames
+        self.ignore_class = ignore_class
+        self.buffer = deque(maxlen=stable_frames)
+
+    def reset(self):
+        self.buffer.clear()
+
+    def update(self, class_id):
+        """
+        输入单帧分类结果
+        返回：
+          - None：尚未稳定
+          - class_id：稳定输出结果
+        """
+
+        # 遇到 class2，直接清空重新计数
+        if class_id == self.ignore_class:
+            self.reset()
+            return None
+
+        self.buffer.append(class_id)
+
+        # 缓冲未满
+        if len(self.buffer) < self.stable_frames:
+            return None
+
+        # 三帧完全一致
+        if len(set(self.buffer)) == 1:
+            stable_class = self.buffer[0]
+            self.reset()   # 输出一次后重新计数（防止重复触发）
+            return stable_class
+
+        return None
+
+# ---------------------------
+# 三分类映射，模具车1是小的，模具车2是大的
+# ---------------------------
+CLASS_NAMES = {
+    0: "模具车1",
+    1: "模具车2",
+    2: "有遮挡"
+}
+
+# ---------------------------
+# RKNN 全局实例（只加载一次）
+# ---------------------------
+_global_rknn = None
+
+
+def init_rknn_model(model_path):
+    global _global_rknn
+    if _global_rknn is not None:
+        return _global_rknn
+
+    rknn = RKNNLite(verbose=False)
+    ret = rknn.load_rknn(model_path)
+    if ret != 0:
+        raise RuntimeError(f"Load RKNN failed: {ret}")
+
+    ret = rknn.init_runtime(core_mask=RKNNLite.NPU_CORE_0)
+    if ret != 0:
+        raise RuntimeError(f"Init runtime failed: {ret}")
+
+    _global_rknn = rknn
+    print(f"[INFO] RKNN 模型加载成功: {model_path}")
+    return rknn
+
+
+# ---------------------------
+# 预处理
+# ---------------------------
+def letterbox(image, new_size=640, color=(114, 114, 114)):
+    h, w = image.shape[:2]
+    scale = min(new_size / h, new_size / w)
+    nh, nw = int(h * scale), int(w * scale)
+    resized = cv2.resize(image, (nw, nh))
+    new_img = np.full((new_size, new_size, 3), color, dtype=np.uint8)
+    top = (new_size - nh) // 2
+    left = (new_size - nw) // 2
+    new_img[top:top + nh, left:left + nw] = resized
+    return new_img
+
+
+def resize_stretch(image, size=640):
+    return cv2.resize(image, (size, size))
+
+
+def preprocess_image_for_rknn(
+        img,
+        size=640,
+        resize_mode="stretch",
+        to_rgb=True,
+        normalize=False,
+        layout="NHWC"
+):
+    if resize_mode == "letterbox":
+        img_box = letterbox(img, new_size=size)
+    else:
+        img_box = resize_stretch(img, size=size)
+
+    if to_rgb:
+        img_box = cv2.cvtColor(img_box, cv2.COLOR_BGR2RGB)
+
+    img_f = img_box.astype(np.float32)
+
+    if normalize:
+        img_f /= 255.0
+
+    if layout == "NHWC":
+        out = np.expand_dims(img_f, axis=0)
+    else:
+        out = np.expand_dims(np.transpose(img_f, (2, 0, 1)), axis=0)
+
+    return np.ascontiguousarray(out)
+
+
+# ---------------------------
+# 单次 RKNN 推理（三分类）
+# ---------------------------
+def rknn_classify_preprocessed(input_tensor, model_path):
+    rknn = init_rknn_model(model_path)
+
+    input_tensor = np.ascontiguousarray(input_tensor.astype(np.float32))
+    outs = rknn.inference([input_tensor])
+
+    pred = outs[0].reshape(-1).astype(float)  # shape = (3,)
+    class_id = int(np.argmax(pred))
+
+    return class_id, pred
+
+# ---------------------------
+# ROI
+# ---------------------------
+def load_single_roi(txt_path):
+    if not os.path.exists(txt_path):
+        raise RuntimeError(f"ROI 文件不存在: {txt_path}")
+
+    with open(txt_path) as f:
+        for line in f:
+            s = line.strip()
+            if not s:
+                continue
+            x, y, w, h = map(int, s.split(','))
+            return (x, y, w, h)
+
+    raise RuntimeError("ROI 文件为空")
+
+
+def crop_and_return_roi(img, roi):
+    x, y, w, h = roi
+    h_img, w_img = img.shape[:2]
+
+    if x < 0 or y < 0 or x + w > w_img or y + h > h_img:
+        raise RuntimeError(f"ROI 超出图像范围: {roi}")
+
+    return img[y:y + h, x:x + w]
+
+
+# ---------------------------
+# 单张图片推理（三分类）
+# ---------------------------
+def classify_single_image(
+        frame,
+        model_path,
+        roi_file,
+        size=640,
+        resize_mode="stretch",
+        to_rgb=True,
+        normalize=False,
+        layout="NHWC"
+):
+    if frame is None:
+        raise FileNotFoundError("输入帧为空")
+
+    roi = load_single_roi(roi_file)
+    roi_img = crop_and_return_roi(frame, roi)
+
+    input_tensor = preprocess_image_for_rknn(
+        roi_img,
+        size=size,
+        resize_mode=resize_mode,
+        to_rgb=to_rgb,
+        normalize=normalize,
+        layout=layout
+    )
+
+    class_id, probs = rknn_classify_preprocessed(input_tensor, model_path)
+    class_name = CLASS_NAMES.get(class_id, f"未知类别({class_id})")
+
+    return {
+        "class_id": class_id,
+        "class": class_name,
+        "score": round(float(probs[class_id]), 4),
+        "raw": probs.tolist()
+    }
+
+
+
+# ---------------------------
+# 示例调用
+# ---------------------------
+if __name__ == "__main__":
+    model_path = "zdb_cls.rknn"
+    roi_file = "./roi_coordinates/zdb_roi.txt"
+    image_path = "./test_image/test.png"
+
+    frame = cv2.imread(image_path)
+    if frame is None:
+        raise FileNotFoundError(f"无法读取图片: {image_path}")
+
+    result = classify_single_image(frame, model_path, roi_file)
+    print("[RESULT]", result)
+
+# ---------------------------
+# 示例判断逻辑
+'''
+import cv2
+from zdb_cls_rknn import classify_single_image,StableClassJudge,CLASS_NAMES
+
+def run_stable_classification_loop(
+        model_path,
+        roi_file,
+        image_source,
+        stable_frames=3
+):
+    """
+    image_source:
+      - cv2.VideoCapture
+    """
+    judge = StableClassJudge(
+        stable_frames=stable_frames,
+        ignore_class=2   # 有遮挡
+    )
+    
+    cap = image_source
+    if not hasattr(cap, "read"):
+        raise TypeError("image_source 必须是 cv2.VideoCapture")
+
+    while True:
+        ret, frame = cap.read()
+        if not ret:
+            print("读取帧失败，退出")
+            break
+
+        # Flip on both axes only after the read succeeded; frame may be None otherwise
+        frame = cv2.flip(frame, -1)
+
+        result = classify_single_image(frame, model_path, roi_file)
+
+        class_id = result["class_id"]
+        class_name = result["class"]
+        score = result["score"]
+
+        print(f"[FRAME] {class_name}  conf={score}")
+
+        stable = judge.update(class_id)
+
+        if stable is not None:
+            print(f"\n稳定输出: {CLASS_NAMES[stable]} \n")
+
+        if cv2.waitKey(1) & 0xFF == ord('q'):
+            break
+
+    cap.release()
+    cv2.destroyAllWindows()
+'''
+# ---------------------------