#!/usr/bin/env python # -*- coding: UTF-8 -*- ''' @Project :AutoControlSystem-master @File :camera_coordinate_dete.py @IDE :PyCharm @Author :hjw @Date :2024/8/27 14:24 ''' import numpy as np import cv2 import open3d as o3d from .tool.CameraRVC import camera from .yolo.yolov8_pt_seg import yolov8_segment class Detection: def __init__(self, model_path, device): self.camera_rvc = camera() self.model = yolov8_segment() self.model.load_model(model_path, device) if self.camera_rvc.caminit_isok == True: print("RVC X Camera is opened!") else: print("RVC X Camera is not opened!") def get_position(self): "" ''' :param api: None :return: ret , img, (x,y,z), (nx, ny, nz) ''' ret, img, pm = self.camera_rvc.get_img_and_point_map() # 拍照,获取图像及 if self.camera_rvc.caminit_isok == True: if ret == 1: flag, det_cpu, dst_img, masks, category_names = self.model.model_inference(img, 0) if flag == 1: xyz = [] nx_ny_nz = [] for i, item in enumerate(det_cpu): # 画box box_x1, box_y1, box_x2, box_y2 = item[0:4].astype(np.int32) label = category_names[int(item[5])] rand_color = (0, 255, 255) score = item[4] org = (int((box_x1 + box_x2) / 2), int((box_y1 + box_y2) / 2)) x_center = int((box_x1 + box_x2) / 2) y_center = int((box_y1 + box_y2) / 2) text = '{}|{:.2f}'.format(label, score) cv2.putText(img, text, org=org, fontFace=cv2.FONT_HERSHEY_SIMPLEX, fontScale=0.8, color=rand_color, thickness=2) # 画mask # mask = masks[i].cpu().numpy().astype(int) mask = masks[i].cpu().data.numpy().astype(int) # mask = masks[i].numpy().astype(int) bbox_image = img[box_y1:box_y2, box_x1:box_x2] h, w = box_y2 - box_y1, box_x2 - box_x1 mask_colored = np.zeros((h, w, 3), dtype=np.uint8) mask_colored[np.where(mask)] = rand_color ################################## imgray = cv2.cvtColor(mask_colored, cv2.COLOR_BGR2GRAY) # cv2.imshow('mask',imgray) # cv2.waitKey(1) # 2、二进制图像 ret, binary = cv2.threshold(imgray, 10, 255, 0) # 阈值 二进制图像 # cv2.imshow('bin',binary) # cv2.waitKey(1) contours, hierarchy = cv2.findContours(binary, cv2.RETR_TREE, cv2.CHAIN_APPROX_NONE) # all_piont_list = contours_in(contours) # print(len(all_piont_list)) max_contour = None max_perimeter = 0 for contour in contours: # 排除小分割区域或干扰区域 perimeter = cv2.arcLength(contour, True) if perimeter > max_perimeter: max_perimeter = perimeter max_contour = contour ''' 提取区域范围内的(x, y) ''' mask_inside = np.zeros(binary.shape, np.uint8) cv2.drawContours(mask_inside, [max_contour], 0, 255, -1) pixel_point2 = cv2.findNonZero(mask_inside) # result = np.zeros_like(color_image) select_point = [] for i in range(pixel_point2.shape[0]): # k = pixel_point2[i] select_point.append(pm[pixel_point2[i][0][1], pixel_point2[i][0][0]]) select_point = np.array(select_point) pm_seg = select_point.reshape(-1, 3) pm_seg = pm_seg[~np.isnan(pm_seg).all(axis=-1), :] # 剔除 nan # cv2.imshow('result', piont_result) ''' 拟合平面,计算法向量 ''' pcd = o3d.geometry.PointCloud() pcd.points = o3d.utility.Vector3dVector(pm_seg) # pcd = o3d.io.read_point_cloud("./Data/seg_point.xyz") plane_model, inliers = pcd.segment_plane(distance_threshold=0.1, ransac_n=3, num_iterations=100) [a, b, c, d] = plane_model print(f"Plane equation: {a:.2f}x + {b:.2f}y + {c:.2f}z + {d:.2f} = 0") # inlier_cloud = pcd.select_by_index(inliers) # 点云可视化 # inlier_cloud.paint_uniform_color([1.0, 0, 0]) # outlier_cloud = pcd.select_by_index(inliers, invert=True) # outlier_cloud.paint_uniform_color([0, 1, 0]) # o3d.visualization.draw_geometries([inlier_cloud, outlier_cloud]) ''' 拟合最小外接矩形,计算矩形中心 ''' rect = cv2.minAreaRect(max_contour) # cv2.boxPoints可以将轮廓点转换为四个角点坐标 box = cv2.boxPoints(rect) # 这一步不影响后面的画图,但是可以保证四个角点坐标为顺时针 startidx = box.sum(axis=1).argmin() box = np.roll(box, 4 - startidx, 0) # 在原图上画出预测的外接矩形 box = box.reshape((-1, 1, 2)).astype(np.int32) box = box + [[[box_x1, box_y1]], [[box_x1, box_y1]], [[box_x1, box_y1]], [[box_x1, box_y1]]] x_rotation_center = int((box[0][0][0] + box[1][0][0] + box[2][0][0] + box[3][0][0]) / 4) y_rotation_center = int((box[0][0][1] + box[1][0][1] + box[2][0][1] + box[3][0][1]) / 4) point_x, point_y, point_z =pm[x_rotation_center, y_rotation_center] cv2.circle(img, (x_rotation_center, y_rotation_center), 4, (255, 255, 255), 5) # 标出中心点 x1, y1, z1, = pm[x_rotation_center+1, y_rotation_center+1] print('x1 y1 z1 :', x1, y1, z1) #print('像素坐标(x, y):', x_rotation_center,y_rotation_center) print('x y z :', point_x, point_y, point_z) # point_x=point_x*1000 # point_y=point_y*1000 # point_z=point_z*1000 print('nx ny nz :', a, b, c) # getPosition(x, y, z, a, b, c) if(point_x == np.nan): continue else: xyz.append([x1*1000, y1*1000, z1*1000]) nx_ny_nz.append([a, b, c]) cv2.polylines(img, [box], True, (0, 255, 0), 2) return 1, img, xyz, nx_ny_nz else: return 1, img, None, None else: print("RVC X Camera capture failed!") return 0, None, None, None else: print("RVC X Camera is not opened!") return 0, None, None, None