bushu

2025-10-21 14:11:52 +08:00
parent 349449f2b7
commit df7c0730f5
363 changed files with 5386 additions and 578 deletions
--- a/angle_base_obb/view_E.py
+++ b/angle_base_obb/view_E.py
@ -0,0 +1,191 @@
+import os
+import cv2
+import numpy as np
+from ultralytics import YOLO
+import matplotlib.pyplot as plt
+
+# ================== 配置参数 ==================
+MODEL_PATH = r"obb.pt"
+IMAGE_SOURCE_DIR = r"/media/hx/04e879fa-d697-4b02-ac7e-a4148876ebb0/dataset/obb4/train"
+LABEL_SOURCE_DIR = IMAGE_SOURCE_DIR  # 假设标签和图像在同一目录
+OUTPUT_DIR = "./inference_results"
+VISUAL_DIR = os.path.join(OUTPUT_DIR, "visual_errors_gt5deg")  # 保存误差 >5° 的可视化图
+IMG_EXTENSIONS = {'.jpg', '.jpeg', '.png', '.bmp', '.tif', '.tiff', '.webp'}
+
+os.makedirs(OUTPUT_DIR, exist_ok=True)
+os.makedirs(VISUAL_DIR, exist_ok=True)
+
+# 加载模型
+print("🔄 加载 YOLO OBB 模型...")
+model = YOLO(MODEL_PATH)
+print("✅ 模型加载完成")
+
+# 获取图像列表
+image_files = [
+    f for f in os.listdir(IMAGE_SOURCE_DIR)
+    if os.path.splitext(f.lower())[1] in IMG_EXTENSIONS
+]
+
+if not image_files:
+    print(f"❌ 错误：未找到图像文件")
+    exit(1)
+print(f"📁 发现 {len(image_files)} 张图像待处理")
+
+all_angle_errors = []  # 存储每张图的夹角误差（度）
+
+# ================== 工具函数 ==================
+
+def parse_obb_label_file(label_path, img_shape):
+    """
+    解析 OBB 标签文件，并将归一化坐标转换为像素坐标
+    img_shape: (height, width) 用于去归一化
+    """
+    boxes = []
+    h, w = img_shape[:2]
+    if not os.path.exists(label_path):
+        print(f"⚠️  标签文件不存在: {label_path}")
+        return boxes
+    with open(label_path, 'r') as f:
+        for line in f:
+            parts = line.strip().split()
+            if len(parts) != 9:
+                print(f"⚠️  标签行格式错误 (期望9列): {parts}")
+                continue
+            cls_id = int(parts[0])
+            coords = list(map(float, parts[1:]))
+            points = np.array(coords).reshape(4, 2)
+            points[:, 0] *= w  # x * width
+            points[:, 1] *= h  # y * height
+            boxes.append({'cls': cls_id, 'points': points})
+    return boxes
+
+
+def compute_main_direction(points):
+    """根据四个顶点计算旋转框的主方向（长边方向），返回 [0, π) 范围内的弧度值"""
+    edges = []
+    for i in range(4):
+        p1 = points[i]
+        p2 = points[(i + 1) % 4]
+        vec = p2 - p1
+        length = np.linalg.norm(vec)
+        if length > 1e-6:
+            edges.append((length, vec))
+
+    if not edges:
+        return 0.0
+
+    longest_edge = max(edges, key=lambda x: x[0])[1]
+    angle_rad = np.arctan2(longest_edge[1], longest_edge[0])
+    angle_rad = angle_rad % np.pi
+    return angle_rad
+
+
+def compute_min_angle_between_two_dirs(dir1_rad, dir2_rad):
+    """计算两个方向之间的最小夹角（0 ~ 90°），返回角度制"""
+    diff = abs(dir1_rad - dir2_rad)
+    min_diff_rad = min(diff, np.pi - diff)
+    return np.degrees(min_diff_rad)
+
+
+def draw_boxes_on_image(image, pred_boxes=None, true_boxes=None):
+    """在图像上绘制预测框（绿色）和真实框（红色）"""
+    img_vis = image.copy()
+
+    # 绘制真实框（红色）
+    if true_boxes is not None:
+        for box in true_boxes:
+            pts = np.int32(box['points']).reshape((-1, 1, 2))
+            cv2.polylines(img_vis, [pts], isClosed=True, color=(0, 0, 255), thickness=2)
+
+    # 绘制预测框（绿色）
+    if pred_boxes is not None:
+        for box in pred_boxes:
+            xyxyxyxy = box.xyxyxyxy.cpu().numpy()[0]
+            pts = xyxyxyxy.reshape(4, 2).astype(int)
+            pts = pts.reshape((-1, 1, 2))
+            cv2.polylines(img_vis, [pts], isClosed=True, color=(0, 255, 0), thickness=2)
+
+    return img_vis
+
+# ================== 主循环 ==================
+for img_filename in image_files:
+    img_path = os.path.join(IMAGE_SOURCE_DIR, img_filename)
+    label_path = os.path.join(LABEL_SOURCE_DIR, os.path.splitext(img_filename)[0] + ".txt")
+
+    print(f"\n🖼️ 处理: {img_filename}")
+
+    # 读图
+    img = cv2.imread(img_path)
+    if img is None:
+        print("❌ 无法读取图像")
+        continue
+
+    # 推理
+    results = model(img, imgsz=640, conf=0.15, verbose=False)
+    result = results[0]
+    pred_boxes = result.obb
+
+    # === 提取预测框主方向 ===
+    pred_dirs = []
+    if pred_boxes is not None and len(pred_boxes) >= 2:
+        for box in pred_boxes[:2]:
+            xywhr = box.xywhr.cpu().numpy()[0]
+            cx, cy, w, h, r_rad = xywhr
+            main_dir = r_rad if w >= h else r_rad + np.pi / 2
+            pred_dirs.append(main_dir % np.pi)
+        pred_angle = compute_min_angle_between_two_dirs(pred_dirs[0], pred_dirs[1])
+    else:
+        print("❌ 预测框不足两个")
+        continue
+
+    # === 提取真实框主方向 ===
+    true_boxes = parse_obb_label_file(label_path, img.shape)
+    if len(true_boxes) < 2:
+        print("❌ 标签框不足两个")
+        continue
+
+    true_dirs = []
+    for tb in true_boxes[:2]:
+        d = compute_main_direction(tb['points'])
+        true_dirs.append(d)
+    true_angle = compute_min_angle_between_two_dirs(true_dirs[0], true_dirs[1])
+
+    # === 计算夹角误差 ===
+    error_deg = abs(pred_angle - true_angle)
+    all_angle_errors.append(error_deg)
+
+    print(f"  🔹 预测夹角: {pred_angle:.2f}°")
+    print(f"  🔹 真实夹角: {true_angle:.2f}°")
+    print(f"  🔺 夹角误差: {error_deg:.2f}°")
+
+    # === 可视化误差 >5° 的情况 ===
+    if error_deg > 3:
+        print(f"  🎯 误差 >5°，生成可视化图像...")
+        img_with_boxes = draw_boxes_on_image(img, pred_boxes=pred_boxes, true_boxes=true_boxes)
+        # 添加文字
+        cv2.putText(img_with_boxes, f"Error: {error_deg:.2f}°", (20, 50),
+                    cv2.FONT_HERSHEY_SIMPLEX, 1, (255, 255, 255), 2, cv2.LINE_AA)
+        vis_output_path = os.path.join(VISUAL_DIR, f"error_{error_deg:.2f}deg_{img_filename}")
+        cv2.imwrite(vis_output_path, img_with_boxes)
+        print(f"  ✅ 已保存可视化图像: {vis_output_path}")
+
+# ================== 输出统计 ==================
+print("\n" + "=" * 60)
+print("📊 夹角误差统计（基于两框间最小夹角）")
+print("=" * 60)
+if all_angle_errors:
+    mean_error = np.mean(all_angle_errors)
+    std_error = np.std(all_angle_errors)
+    max_error = np.max(all_angle_errors)
+    min_error = np.min(all_angle_errors)
+
+    print(f"有效图像数: {len(all_angle_errors)}")
+    print(f"平均夹角误差: {mean_error:.2f}°")
+    print(f"标准差: {std_error:.2f}°")
+    print(f"最大误差: {max_error:.2f}°")
+    print(f"最小误差: {min_error:.2f}°")
+else:
+    print("❌ 无有效数据用于统计")
+
+print("=" * 60)
+print("🎉 所有图像处理完成！")