添加状态分类和液面分割

2025-09-01 14:14:18 +08:00
parent 6e553f6a20
commit ad52ab9125
2379 changed files with 102501 additions and 1465 deletions
--- a/angle_base_seg/pycache/test_seg_angle_f1.cpython-39-pytest-8.4.1.pyc
+++ b/angle_base_seg/pycache/test_seg_angle_f1.cpython-39-pytest-8.4.1.pyc
--- a/angle_base_seg/pycache/test_seg_angle_f2.cpython-39-pytest-8.4.1.pyc
+++ b/angle_base_seg/pycache/test_seg_angle_f2.cpython-39-pytest-8.4.1.pyc
--- a/angle_base_seg/angle_main.py
+++ b/angle_base_seg/angle_main.py
@ -4,7 +4,7 @@ import numpy as np
 import os

 # ------------------ 模型与路径配置 ------------------
-MODEL_PATH = '../ultralytics_yolo11-main/runs/train/exp4/weights/best.pt'
+MODEL_PATH = '../ultralytics_yolo11-main/runs/train/seg_j/exp/weights/best.pt'
 OUTPUT_DIR = '../test_image'
 os.makedirs(OUTPUT_DIR, exist_ok=True)

@ -34,7 +34,7 @@ def detect_jaw_angle(image_path, mode='show'):

    # 创建掩码并检测
    composite_mask = np.zeros((h, w), dtype=np.uint8)
-    results = model(image_path, imgsz=1280, conf=0.5)
+    results = model(image_path, imgsz=640, conf=0.5)

    jaws = []
    for r in results:
@ -143,13 +143,13 @@ def detect_jaw_angle(image_path, mode='show'):

 # ------------------ 主函数 ------------------
 if __name__ == '__main__':
-    # ✅ 设置输入图像路径
-    image_path = '/test_image/1.png'  # ← 修改为你自己的图片路径
+    # ✅ 设置输入图像路径
+    image_path = r"/home/hx/yolo/output_masks/2.jpg"  # ← 修改为你自己的图片路径

    # ✅ 模式选择：
    #   mode='show': 保存可视化图像
    #   mode='silent': 只返回角度
-    mode = 'silent'  # 或 'silent'
+    mode = 'show'  # 或 'silent'

    print(f"🔍 正在处理图像: {image_path}")
    angle = detect_jaw_angle(image_path, mode=mode)
--- a/angle_base_seg/angle_test.py
+++ b/angle_base_seg/angle_test.py
@ -6,7 +6,7 @@ import torch
 import torch.nn.functional as F

 # ------------------ 模型与路径配置 ------------------
-MODEL_PATH = '../ultralytics_yolo11-main/runs/train/exp4/weights/best.pt'
+MODEL_PATH = '../ultralytics_yolo11-main/runs/train/seg/exp2/weights/best.pt'
 OUTPUT_DIR = '../test_image'
 os.makedirs(OUTPUT_DIR, exist_ok=True)

@ -24,7 +24,7 @@ def detect_jaw_angle_fast(image_path, mode='silent'):
    name_only = os.path.splitext(filename)[0]

    # 推理（批量可进一步提速）
-    results = model(image_path, imgsz=1280, conf=0.5, device='cuda')
+    results = model(image_path, imgsz=1280, conf=0.15, device='cuda')
    r = results[0]

    if r.masks is None:
@ -100,9 +100,9 @@ def detect_jaw_angle_fast(image_path, mode='silent'):

 # ------------------ 测试 ------------------
 if __name__ == '__main__':
-    image_path = '/test_image/1.png'
+    image_path = '/home/hx/yolo/output_masks/1.jpg'
    print(f"🚀 处理: {image_path}")
-    angle = detect_jaw_angle_fast(image_path, mode='silent')
+    angle = detect_jaw_angle_fast(image_path, mode='show')
    if angle is not None:
        print(f"✅ 角度: {angle}°")
    else:
--- a/angle_base_seg/angle_test_1.py
+++ b/angle_base_seg/angle_test_1.py
@ -0,0 +1,109 @@
+from ultralytics import YOLO
+import cv2
+import numpy as np
+import os
+import torch
+import torch.nn.functional as F
+
+# ------------------ Model and path configuration ------------------
+# Weights file handed to YOLO() below (relative path).
+MODEL_PATH = '../ultralytics_yolo11-main/runs/train/seg/exp3/weights/best.pt'
+# Directory that receives the visualisations written by detect_jaw_angle_fast.
+OUTPUT_DIR = '../test_image'
+os.makedirs(OUTPUT_DIR, exist_ok=True)
+
+# The model is created once at import time and moved to the CUDA device.
+model = YOLO(MODEL_PATH)
+model.to('cuda')
+
+
+def detect_jaw_angle_fast(image_path, mode='silent'):
+    """Estimate the opening angle between the two largest segmented jaws.
+
+    Args:
+        image_path: Path of the image to analyse.
+        mode: 'show' additionally writes a visualisation to OUTPUT_DIR as
+            ``fast_<name>.png``; any other value only returns the angle.
+
+    Returns:
+        The opening angle in degrees (between 0 and 90) rounded to two
+        decimals, or None when the model yields no masks or fewer than two
+        usable jaw regions.
+
+    Raises:
+        FileNotFoundError: If the image cannot be read.
+    """
+    img = cv2.imread(image_path)
+    if img is None:
+        raise FileNotFoundError(f"无法读取图像: {image_path}")
+
+    h, w = img.shape[:2]
+    name_only = os.path.splitext(os.path.basename(image_path))[0]
+
+    # Inference on a single image (batching could speed this up further).
+    results = model(image_path, imgsz=640, conf=0.5, device='cuda')
+    r = results[0]
+
+    if r.masks is None:
+        return None
+
+    # Upsample all masks to the image size in a single call.
+    # NOTE(review): this resizes r.masks.data straight to (h, w); if the mask
+    # tensor includes letterbox padding the result is slightly distorted —
+    # confirm against the model's preprocessing.
+    boxes = r.boxes.xyxy.cpu().numpy()
+    masks = F.interpolate(
+        r.masks.data.unsqueeze(0).float(),
+        size=(h, w),
+        mode='bilinear',
+        align_corners=False,
+    )
+    masks = (masks[0] > 0.5).cpu().numpy().astype(np.uint8)  # [N, h, w]
+
+    jaws = []
+    for mask, box in zip(masks, boxes):
+        x1, y1, x2, y2 = map(int, box)
+
+        # Drop tiny boxes before doing any contour work.
+        if (x2 - x1) * (y2 - y1) < 100:
+            continue
+
+        # Restrict the mask to the detection box, clamped to the image.
+        x1c, y1c = max(0, x1), max(0, y1)
+        x2c, y2c = min(w, x2), min(h, y2)
+        mask_crop = mask[y1c:y2c, x1c:x2c]
+        if mask_crop.size == 0:
+            # A box lying fully outside the image leaves nothing to analyse.
+            continue
+
+        coords = cv2.findNonZero(mask_crop)
+        if coords is None or len(coords) < 5:
+            continue
+
+        # findNonZero returns coordinates relative to the crop; shift them
+        # back into image coordinates so the rectangle drawn in 'show' mode
+        # lands on the object (angle and area are translation-invariant).
+        coords = coords + np.array([x1c, y1c], dtype=coords.dtype)
+
+        hull = cv2.convexHull(coords)
+        area = cv2.contourArea(hull)
+        if area < 100:
+            continue
+
+        jaws.append({'rect': cv2.minAreaRect(hull), 'area': area})
+
+    if len(jaws) < 2:
+        return None
+
+    # Keep the two regions with the largest hull area.
+    jaws = sorted(jaws, key=lambda item: item['area'], reverse=True)[:2]
+    rect1, rect2 = jaws[0]['rect'], jaws[1]['rect']
+
+    def long_edge_angle(rect):
+        # Add 90 degrees when the rectangle's first side is the shorter one,
+        # so the returned angle always refers to the long side.
+        side_a, side_b = rect[1]
+        theta = rect[2]
+        return theta + 90 if side_a < side_b else theta
+
+    angle1 = long_edge_angle(rect1) % 180
+    angle2 = long_edge_angle(rect2) % 180
+    diff = abs(angle1 - angle2)
+    opening_angle = min(diff, 180 - diff)
+
+    # Optional visualisation.
+    if mode == 'show':
+        vis = np.zeros((h, w, 3), dtype=np.uint8)
+        box1 = cv2.boxPoints(rect1)
+        box2 = cv2.boxPoints(rect2)
+        cv2.drawContours(vis, [np.int32(box1)], 0, (0, 0, 255), 2)
+        cv2.drawContours(vis, [np.int32(box2)], 0, (255, 0, 0), 2)
+        # Hershey fonts only cover ASCII, so spell out the unit instead of
+        # using the degree sign (which would be drawn as '?').
+        cv2.putText(vis, f"{opening_angle:.1f} deg", (20, 50),
+                    cv2.FONT_HERSHEY_SIMPLEX, 1.0, (0, 255, 0), 2)
+        cv2.imwrite(os.path.join(OUTPUT_DIR, f"fast_{name_only}.png"), vis)
+
+    return round(opening_angle, 2)
+
+
+# ------------------ Test ------------------
+# Manual smoke test: run the detector on one hard-coded image in 'show'
+# mode and print the resulting angle, or a failure message when None is returned.
+if __name__ == '__main__':
+    image_path = '/home/hx/yolo/output_masks/2.jpg'
+    print(f"🚀 处理: {image_path}")
+    angle = detect_jaw_angle_fast(image_path, mode='show')
+    if angle is not None:
+        print(f"✅ 角度: {angle}°")
+    else:
+        print("❌ 未检测到两个夹具")
--- a/angle_base_seg/bushu.py
+++ b/angle_base_seg/bushu.py
@ -0,0 +1,206 @@
+#!/usr/bin/env python3
+# -*- coding: utf-8 -*-
+import os
+import cv2
+import numpy as np
+import argparse
+import torch
+import torch.nn.functional as F
+import torchvision
+
+# ---------------- Configuration ----------------
+# Minimum score a candidate must reach to survive filtering in post_process.
+OBJ_THRESH = 0.25
+# IoU threshold passed to torchvision.ops.nms in post_process.
+NMS_THRESH = 0.45
+# Upper bound on the number of detections kept after NMS.
+MAX_DETECT = 300
+# Model input size; main() resizes the source image to this before inference.
+IMG_SIZE = (640, 640)  # (W,H)
+
+# Directory where compute_angle saves its visualisations; created at import.
+OUTPUT_DIR = "result"
+os.makedirs(OUTPUT_DIR, exist_ok=True)
+
+
+# ---------------- Utility functions ----------------
+def sigmoid(x):
+    """Return the element-wise logistic function 1 / (1 + e^-x) of ``x``."""
+    decay = np.exp(-x)
+    return 1 / (1 + decay)
+
+def dfl(position):
+    """Collapse per-side bin logits into expected distances.
+
+    The channel axis of ``position`` (shape n, c, h, w) is split into 4
+    groups of c // 4 bins. Each group is soft-maxed and reduced to the
+    expectation of its bin index, giving an array of shape (n, 4, h, w).
+    """
+    logits = torch.tensor(position)
+    batch, channels, rows, cols = logits.shape
+    bins = channels // 4
+
+    probs = logits.reshape(batch, 4, bins, rows, cols).softmax(2)
+    # Bin indices 0..bins-1 act as the values being averaged.
+    bin_index = torch.arange(bins).float().reshape(1, 1, bins, 1, 1)
+    expected = (probs * bin_index).sum(2)
+    return expected.numpy()
+
+def box_process(position):
+    """Decode one branch of box-distribution output into xyxy boxes.
+
+    Args:
+        position: Array of shape (n, c, grid_h, grid_w) holding the raw
+            distance distributions; it is reduced by dfl() to four
+            distances per grid cell.
+
+    Returns:
+        Array of shape (n, 4, grid_h, grid_w) with x1, y1, x2, y2 scaled to
+        IMG_SIZE pixels.
+    """
+    grid_h, grid_w = position.shape[2:4]
+    col, row = np.meshgrid(np.arange(0, grid_w), np.arange(0, grid_h))
+    col, row = col.reshape(1, 1, grid_h, grid_w), row.reshape(1, 1, grid_h, grid_w)
+    grid = np.concatenate((col, row), axis=1)
+    # Channel 0 of the grid is the column (x) index and channel 1 the row (y)
+    # index, so the x stride comes from the width and the y stride from the
+    # height. IMG_SIZE is (W, H). The previous order was only correct for
+    # square inputs.
+    stride = np.array([IMG_SIZE[0] // grid_w, IMG_SIZE[1] // grid_h]).reshape(1, 2, 1, 1)
+
+    position = dfl(position)
+    # Distances are measured from the cell centre (grid + 0.5): the first two
+    # channels go towards the top-left, the last two towards the bottom-right.
+    box_xy = grid + 0.5 - position[:, 0:2, :, :]
+    box_xy2 = grid + 0.5 + position[:, 2:4, :, :]
+    xyxy = np.concatenate((box_xy * stride, box_xy2 * stride), axis=1)
+    return xyxy
+
+def _crop_mask(masks, boxes):
+    """Zero every mask outside its own xyxy box.
+
+    ``masks`` has shape (n, h, w) and ``boxes`` has shape (n, 4); a pixel is
+    kept when x1 <= column < x2 and y1 <= row < y2.
+    """
+    _, height, width = masks.shape
+    left, top, right, bottom = torch.chunk(boxes[:, :, None], 4, 1)
+    xs = torch.arange(width, device=masks.device, dtype=left.dtype)[None, None, :]
+    ys = torch.arange(height, device=masks.device, dtype=left.dtype)[None, :, None]
+    inside = (xs >= left) * (xs < right) * (ys >= top) * (ys < bottom)
+    return masks * inside
+
+def post_process(input_data):
+    """Decode raw segmentation-head outputs into boxes, scores and masks.
+
+    Args:
+        input_data: Sequence of model output arrays. The last entry is the
+            mask prototype tensor. The others are split evenly into three
+            branches; inside a branch, index 0 feeds box_process, index 1 is
+            used for the scores and index 3 holds the mask coefficients.
+
+    Returns:
+        Tuple ``(boxes, scores, seg_img)``: boxes is (K, 4) xyxy in IMG_SIZE
+        pixels, scores is (K, 1), and seg_img is a boolean array of shape
+        (K, IMG_SIZE[1], IMG_SIZE[0]). K is 0 when nothing passes OBJ_THRESH.
+    """
+    proto = input_data[-1]
+    boxes, scores, seg_part = [], [], []
+    default_branch = 3
+    pair_per_branch = len(input_data) // default_branch
+
+    for i in range(default_branch):
+        base = pair_per_branch * i
+        boxes.append(box_process(input_data[base]))
+        # Use the best class confidence per anchor as its score. Constant
+        # scores of 1.0 made the OBJ_THRESH filter a no-op and left NMS
+        # without a meaningful ordering.
+        # NOTE(review): assumes the tensor at base + 1 holds class
+        # confidences already in [0, 1] — confirm against the exported model.
+        class_conf = np.asarray(input_data[base + 1], dtype=np.float32)
+        scores.append(class_conf.max(axis=1, keepdims=True))
+        seg_part.append(input_data[base + 3])
+
+    def sp_flatten(_in):
+        # (n, ch, h, w) -> (n * h * w, ch)
+        ch = _in.shape[1]
+        _in = _in.transpose(0, 2, 3, 1)
+        return _in.reshape(-1, ch)
+
+    boxes = np.concatenate([sp_flatten(v) for v in boxes])
+    scores = np.concatenate([sp_flatten(v) for v in scores])
+    seg_part = np.concatenate([sp_flatten(v) for v in seg_part])
+
+    # Threshold filtering.
+    keep = np.where(scores.reshape(-1) >= OBJ_THRESH)
+    boxes, scores, seg_part = boxes[keep], scores[keep], seg_part[keep]
+
+    # IMG_SIZE is (W, H); array and tensor sizes are (H, W).
+    out_h, out_w = IMG_SIZE[1], IMG_SIZE[0]
+    if boxes.shape[0] == 0:
+        # Nothing survived the threshold: return empty, correctly shaped results.
+        return boxes, scores, np.zeros((0, out_h, out_w), dtype=bool)
+
+    # NMS — torchvision expects a 1-D score tensor, so flatten the column.
+    ids = torchvision.ops.nms(torch.tensor(boxes, dtype=torch.float32),
+                              torch.tensor(scores.reshape(-1), dtype=torch.float32), NMS_THRESH)
+    ids = ids.tolist()[:MAX_DETECT]
+    boxes, scores, seg_part = boxes[ids], scores[ids], seg_part[ids]
+
+    # Mask decode: coefficients x prototypes -> sigmoid -> upsample -> crop.
+    ph, pw = proto.shape[-2:]
+    proto = proto.reshape(seg_part.shape[-1], -1)
+    seg_img = np.matmul(seg_part, proto)
+    seg_img = sigmoid(seg_img)
+    seg_img = seg_img.reshape(-1, ph, pw)
+    seg_img = F.interpolate(torch.tensor(seg_img)[None], size=(out_h, out_w),
+                            mode='bilinear', align_corners=False)[0]
+    seg_img_t = _crop_mask(seg_img, torch.tensor(boxes))
+    seg_img = seg_img_t.numpy() > 0.5
+
+    return boxes, scores, seg_img
+
+
+# ---------------- Angle computation ----------------
+def compute_angle(boxes, seg_img, h, w, filename, mode="show"):
+    """Compute the opening angle between the two largest jaw masks.
+
+    Args:
+        boxes: Iterable of xyxy boxes in the IMG_SIZE model-input frame
+            (the frame post_process produces).
+        seg_img: Per-box binary masks, indexed in the same order as boxes.
+        h: Height of the original image in pixels.
+        w: Width of the original image in pixels.
+        filename: Name used for the saved visualisation (``angle_<filename>``).
+        mode: "show" writes a visualisation into OUTPUT_DIR; any other value
+            only returns the angle.
+
+    Returns:
+        The opening angle in degrees rounded to two decimals, or None when
+        fewer than two masks with a contour area of at least 100 are found.
+    """
+    composite_mask = np.zeros((h, w), dtype=np.uint8)
+    jaws = []
+
+    # Masks are resized to the original image below, so the boxes (given in
+    # model-input pixels) must be scaled into the same frame before they are
+    # used to slice those masks.
+    scale_x = w / IMG_SIZE[0]
+    scale_y = h / IMG_SIZE[1]
+
+    for i, box in enumerate(boxes):
+        bx1, by1, bx2, by2 = box
+        x1 = max(0, int(np.floor(bx1 * scale_x)))
+        y1 = max(0, int(np.floor(by1 * scale_y)))
+        x2 = min(w, int(np.ceil(bx2 * scale_x)))
+        y2 = min(h, int(np.ceil(by2 * scale_y)))
+
+        obj_mask = np.zeros((h, w), dtype=np.uint8)
+        mask_resized = cv2.resize(seg_img[i].astype(np.uint8), (w, h))
+        obj_mask[y1:y2, x1:x2] = mask_resized[y1:y2, x1:x2] * 255
+
+        contours, _ = cv2.findContours(obj_mask, cv2.RETR_EXTERNAL, cv2.CHAIN_APPROX_NONE)
+        if len(contours) == 0:
+            continue
+
+        largest_contour = max(contours, key=cv2.contourArea)
+        area = cv2.contourArea(largest_contour)
+        if area < 100:
+            continue
+
+        rect = cv2.minAreaRect(largest_contour)
+        jaws.append({'contour': largest_contour, 'rect': rect, 'area': area})
+        composite_mask = np.maximum(composite_mask, obj_mask)
+
+    if len(jaws) < 2:
+        print(f"❌ 检测到的夹具少于2个（共{len(jaws)}个）")
+        return None
+
+    # The two largest regions are taken to be the jaws.
+    jaws.sort(key=lambda x: x['area'], reverse=True)
+    jaw1, jaw2 = jaws[0], jaws[1]
+
+    def get_long_edge_vector(rect):
+        # Unit vector along the longer side of the min-area rectangle.
+        center, (w_, h_), angle = rect
+        rad = np.radians(angle + (0 if w_ >= h_ else 90))
+        return np.array([np.cos(rad), np.sin(rad)])
+
+    def get_center(contour):
+        # Contour centroid from image moments; (0, 0) for a degenerate contour.
+        M = cv2.moments(contour)
+        return np.array([M['m10']/M['m00'], M['m01']/M['m00']]) if M['m00'] != 0 else np.array([0, 0])
+
+    dir1, dir2 = get_long_edge_vector(jaw1['rect']), get_long_edge_vector(jaw2['rect'])
+    center1, center2 = get_center(jaw1['contour']), get_center(jaw2['contour'])
+    fixture_center = (center1 + center2) / 2
+
+    # Flip each direction so that it points towards the midpoint of the two jaws.
+    to_center1, to_center2 = fixture_center - center1, fixture_center - center2
+    if np.linalg.norm(to_center1) > 1e-6 and np.dot(dir1, to_center1) < 0:
+        dir1 = -dir1
+    if np.linalg.norm(to_center2) > 1e-6 and np.dot(dir2, to_center2) < 0:
+        dir2 = -dir2
+
+    # Clip guards arccos against rounding just outside [-1, 1].
+    cos_angle = np.clip(np.dot(dir1, dir2), -1.0, 1.0)
+    angle = np.degrees(np.arccos(cos_angle))
+    opening_angle = min(angle, 180 - angle)
+
+    if mode == "show":
+        vis_img = np.stack([composite_mask]*3, axis=-1)
+        vis_img[composite_mask > 0] = [255, 255, 255]
+
+        box1, box2 = np.int32(cv2.boxPoints(jaw1['rect'])), np.int32(cv2.boxPoints(jaw2['rect']))
+        cv2.drawContours(vis_img, [box1], 0, (0, 0, 255), 2)
+        cv2.drawContours(vis_img, [box2], 0, (255, 0, 0), 2)
+
+        # Arrow length in pixels for the direction indicators.
+        scale = 60
+        c1, c2 = tuple(np.int32(center1)), tuple(np.int32(center2))
+        end1, end2 = tuple(np.int32(center1 + scale * dir1)), tuple(np.int32(center2 + scale * dir2))
+        cv2.arrowedLine(vis_img, c1, end1, (0, 255, 0), 2, tipLength=0.3)
+        cv2.arrowedLine(vis_img, c2, end2, (0, 255, 0), 2, tipLength=0.3)
+
+        # Hershey fonts only cover ASCII, so spell out the unit instead of
+        # using the degree sign (which would be drawn as '?').
+        cv2.putText(vis_img, f"Angle: {opening_angle:.2f} deg", (20, 50),
+                    cv2.FONT_HERSHEY_SIMPLEX, 0.8, (0, 255, 0), 2)
+
+        save_path = os.path.join(OUTPUT_DIR, f'angle_{filename}')
+        cv2.imwrite(save_path, vis_img)
+        print(f"✅ 结果已保存: {save_path}")
+
+    return round(opening_angle, 2)
+
+
+# ---------------- Entry point ----------------
+def main():
+    """Run the RKNN model on one fixed image and print the jaw opening angle.
+
+    The model container is released on every exit path, including an
+    unreadable image or an exception during inference or post-processing.
+    """
+    # Fixed (hard-coded) deployment paths.
+    MODEL_PATH = "/userdata/bushu/seg.rknn"
+    IMG_PATH   = "/userdata/bushu/test.jpg"
+
+    from py_utils.rknn_executor import RKNN_model_container
+    model = RKNN_model_container(MODEL_PATH, target='rk3588', device_id=None)
+
+    try:
+        img_src = cv2.imread(IMG_PATH)
+        if img_src is None:
+            print("❌ 图片路径错误:", IMG_PATH)
+            return
+        h, w = img_src.shape[:2]
+        # The model consumes a fixed IMG_SIZE input; the original size is
+        # kept so compute_angle can work in source-image pixels.
+        img = cv2.resize(img_src, IMG_SIZE)
+
+        outputs = model.run([img])
+        boxes, scores, seg_img = post_process(outputs)
+
+        filename = os.path.basename(IMG_PATH)
+        angle = compute_angle(boxes, seg_img, h, w, filename, mode="show")
+        if angle is not None:
+            print(f"🎉 检测到的夹具开合角度: {angle}°")
+    finally:
+        # Previously skipped on the early return and on any exception.
+        model.release()
+
+
+if __name__ == "__main__":
+    main()
--- a/angle_base_seg/test_line_angle_f.py
+++ b/angle_base_seg/test_line_angle_f.py
@ -5,7 +5,7 @@ import os

 # ------------------ 配置 ------------------
 model_path = '../ultralytics_yolo11-main/runs/train/exp4/weights/best.pt'
-img_folder = '/home/hx/yolo/ultralytics_yolo11-main/dataset1/test'  # 你的图片文件夹路径
+img_folder = '/home/hx/yolo/test_image'  # 你的图片文件夹路径
 output_mask_dir = 'output_masks1'
 os.makedirs(output_mask_dir, exist_ok=True)

--- a/angle_base_seg/test_seg_angle_f1.py
+++ b/angle_base_seg/test_seg_angle_f1.py
@ -4,8 +4,8 @@ import numpy as np
 import os

 # ------------------ 配置 ------------------
-model_path = '../ultralytics_yolo11-main/runs/train/exp4/weights/best.pt'
-img_folder = '/home/hx/yolo/ultralytics_yolo11-main/dataset1/test'
+model_path = '/home/hx/yolo/ultralytics_yolo11-main/runs/train/seg/exp3/weights/best.pt'
+img_folder = '/media/hx/04e879fa-d697-4b02-ac7e-a4148876ebb0/dataset/seg/dataset2/test'
 output_mask_dir = 'output_masks1'
 os.makedirs(output_mask_dir, exist_ok=True)

@ -139,9 +139,9 @@ def process_image(img_path, output_dir):
                composite_mask = np.maximum(composite_mask, obj_mask)

    # 保存合并掩码
-    mask_save_path = os.path.join(output_dir, f'mask_{name_only}.png')
-    cv2.imwrite(mask_save_path, composite_mask)
-    print(f"✅ 掩码已保存: {mask_save_path}")
+    #mask_save_path = os.path.join(output_dir, f'mask_{name_only}.png')
+    #cv2.imwrite(mask_save_path, composite_mask)
+    #print(f"✅ 掩码已保存: {mask_save_path}")

    if len(rotated_rects) < 2:
        print(f"⚠️ 检测到的对象少于2个（共{len(rotated_rects)}个）: {filename}")
--- a/angle_base_seg/test_seg_angle_f2.py
+++ b/angle_base_seg/test_seg_angle_f2.py
@ -4,8 +4,8 @@ import numpy as np
 import os

 # ------------------ 配置 ------------------
-model_path = '../ultralytics_yolo11-main/runs/train/exp4/weights/best.pt'
-img_folder = '/home/hx/yolo/ultralytics_yolo11-main/dataset1/test'
+model_path = '/home/hx/yolo/ultralytics_yolo11-main/runs/train/seg/exp3/weights/best.pt'
+img_folder = '/media/hx/04e879fa-d697-4b02-ac7e-a4148876ebb0/dataset/seg/dataset2/test'
 output_mask_dir = 'output_masks1'
 os.makedirs(output_mask_dir, exist_ok=True)