PythonOpenCV实战从零构建ArUco视觉测距系统计算机视觉正在重塑我们与物理世界的交互方式。想象一下你的设备能够像人类一样理解周围物体的位置和方向——这正是ArUco码结合OpenCV实现的魔法。本文将带你从零开始构建一个完整的视觉测距系统不仅能识别特定标记还能精确计算相机与标记之间的三维空间关系。1. 环境配置与基础准备任何优秀的项目都始于稳固的基础。我们需要确保开发环境配置正确避免后续出现难以排查的问题。推荐使用Python 3.7和OpenCV 4.5版本这是经过验证的稳定组合。安装核心依赖只需一行命令pip install opencv-contrib-python numpy为什么选择opencv-contrib而不是基础版因为ArUco模块包含在contrib扩展包中。安装后验证是否成功import cv2 print(cv2.__version__) # 应显示4.5.x硬件准备同样重要相机选择普通USB摄像头即可但建议使用分辨率至少720p的型号打印ArUco标记使用标准DICT_5X5_100字典生成尺寸建议10x10cm以上标定棋盘建议使用8x11内角点的棋盘格实际角点数为7x10注意相机分辨率一旦确定整个项目流程中必须保持一致。这是影响精度的关键因素之一。2. 相机标定精度之源相机标定是后续所有工作的基石。这个过程相当于为相机建立视力档案记录它如何将三维世界映射到二维图像。2.1 数据采集最佳实践采集20-30张棋盘格图像覆盖相机视野的各个区域。注意棋盘格应占据图像1/3到1/2面积包含各种倾斜角度但避免极端角度确保光照均匀避免反光和阴影import cv2 import glob # 设置视频流分辨率与后续使用一致 cap cv2.VideoCapture(0) cap.set(cv2.CAP_PROP_FRAME_WIDTH, 1280) cap.set(cv2.CAP_PROP_FRAME_HEIGHT, 720) count 0 while True: ret, frame cap.read() cv2.imshow(Calibration, frame) key cv2.waitKey(1) if key ord(s): # 按s保存 cv2.imwrite(fcalib_{count}.jpg, frame) count 1 elif key ord(q): # 按q退出 break cap.release() cv2.destroyAllWindows()2.2 标定流程与质量优化标定质量直接影响最终精度。我们采用重投影误差筛选法提升标定结果误差阈值保留图像数平均重投影误差无筛选250.42像素0.3像素180.21像素0.2像素120.15像素优化后的标定代码def calibrate_camera(images_path, board_size(7,10)): # 准备对象点 objp np.zeros((board_size[0]*board_size[1],3), np.float32) objp[:,:2] np.mgrid[0:board_size[0],0:board_size[1]].T.reshape(-1,2) # 收集所有图像的点 objpoints [] # 3D点 imgpoints [] # 2D点 images glob.glob(f{images_path}/*.jpg) for fname in images: img cv2.imread(fname) gray cv2.cvtColor(img, cv2.COLOR_BGR2GRAY) # 查找角点 ret, corners cv2.findChessboardCorners(gray, board_size, None) if ret: objpoints.append(objp) corners2 cv2.cornerSubPix(gray,corners,(11,11),(-1,-1), (cv2.TERM_CRITERIA_EPS cv2.TERM_CRITERIA_MAX_ITER, 30, 0.001)) imgpoints.append(corners2) # 初次标定 ret, mtx, dist, rvecs, tvecs cv2.calibrateCamera(objpoints, imgpoints, gray.shape[::-1], None, None) # 误差筛选 new_objpoints [] new_imgpoints [] for i in range(len(objpoints)): imgpoints2, _ cv2.projectPoints(objpoints[i], rvecs[i], tvecs[i], mtx, dist) error cv2.norm(imgpoints[i], imgpoints2, cv2.NORM_L2)/len(imgpoints2) if error 0.3: # 筛选阈值 new_objpoints.append(objpoints[i]) new_imgpoints.append(imgpoints[i]) # 最终标定 ret, mtx, dist, rvecs, tvecs cv2.calibrateCamera(new_objpoints, new_imgpoints, gray.shape[::-1], None, None) return mtx, dist保存标定结果供后续使用import pickle with open(camera_calib.pkl, wb) as f: pickle.dump({mtx:mtx, dist:dist}, f)3. ArUco检测与位姿估计3.1 检测流程全解析ArUco检测看似简单实则包含多个关键步骤图像预处理转换为灰度图可能应用自适应阈值标记检测寻找候选四边形验证内部编码位姿估计利用PnP算法求解相机姿态def detect_aruco(frame, mtx, dist): gray cv2.cvtColor(frame, cv2.COLOR_BGR2GRAY) aruco_dict cv2.aruco.Dictionary_get(cv2.aruco.DICT_5X5_100) parameters cv2.aruco.DetectorParameters_create() # 核心检测函数 corners, ids, rejected cv2.aruco.detectMarkers( gray, aruco_dict, parametersparameters, cameraMatrixmtx, distCoeffdist) return corners, ids, rejected3.2 位姿估计数学原理estimatePoseSingleMarkers函数返回的rvec和tvec表示标记在相机坐标系中的位置。但实际应用中我们通常需要相机在标记坐标系中的位姿——这需要进行坐标系转换。转换关系推导旋转向量 → 旋转矩阵R_marker_to_cam, _ cv2.Rodrigues(rvec)相机在标记坐标系中的旋转R_cam_to_marker R_marker_to_cam.T相机在标记坐标系中的位置t_cam_to_marker -R_cam_to_marker tvec.reshape(3,1)完整位姿估计函数def estimate_pose(frame, mtx, dist, marker_length0.1): corners, ids, _ detect_aruco(frame, mtx, dist) if ids is not None: rvecs, tvecs, _ cv2.aruco.estimatePoseSingleMarkers( corners, marker_length, mtx, dist) for i in range(len(ids)): # 绘制坐标系 cv2.aruco.drawDetectedMarkers(frame, corners) cv2.drawFrameAxes(frame, mtx, dist, rvecs[i], tvecs[i], 0.05) # 坐标系转换 R, _ cv2.Rodrigues(rvecs[i]) R_inv R.T tvec tvecs[i].reshape(3,1) camera_pos -R_inv tvec # 计算距离和角度 distance np.linalg.norm(camera_pos) angle np.degrees(np.arctan2(camera_pos[0,0], camera_pos[2,0])) # 显示信息 cv2.putText(frame, fDist: {distance[0]:.2f}m, (10,30), cv2.FONT_HERSHEY_SIMPLEX, 0.7, (0,255,0), 2) cv2.putText(frame, fAngle: {angle:.1f}deg, (10,70), cv2.FONT_HERSHEY_SIMPLEX, 0.7, (0,255,0), 2) return frame4. 实战优化与性能提升4.1 常见问题解决方案问题1检测不稳定原因光照变化或标记部分遮挡解决添加卡尔曼滤波平滑输出from pykalman import KalmanFilter class PoseFilter: def __init__(self): self.kf KalmanFilter(transition_matricesnp.eye(6), observation_matricesnp.eye(6)) self.state_means None self.state_covariances None def update(self, pose): if self.state_means is None: self.state_means pose self.state_covariances np.eye(6) else: self.state_means, self.state_covariances ( self.kf.filter_update(self.state_means, self.state_covariances, observationpose)) return self.state_means问题2测距误差大检查清单标定质量重投影误差0.3像素标记物理尺寸测量准确分辨率一致性采集、标定、检测阶段相同4.2 多标记协同定位单个标记的视野有限多标记系统可扩展工作范围def multi_marker_pose(frame, mtx, dist): corners, ids, _ detect_aruco(frame, mtx, dist) if ids is None or len(ids) 2: return frame # 构建3D-2D对应点 obj_points [] img_points [] marker_length 0.1 # 实际尺寸 for i in range(len(ids)): # 假设标记在XY平面Z0 corners3d np.array([ [-marker_length/2, marker_length/2, 0], [marker_length/2, marker_length/2, 0], [marker_length/2, -marker_length/2, 0], [-marker_length/2, -marker_length/2, 0] ]) # 根据ID设置不同位置 corners3d [ids[i][0]*0.2, 0, 0] obj_points.extend(corners3d) img_points.extend(corners[i][0]) # 使用所有标记求解位姿 _, rvec, tvec cv2.solvePnP( np.array(obj_points), np.array(img_points), mtx, dist) # 可视化 cv2.drawFrameAxes(frame, mtx, dist, rvec, tvec, 0.1) return frame4.3 性能优化技巧实时性优化降低分辨率保持精度前提下使用ROI限制检测区域多线程处理采集与计算分离from threading import Thread import queue class VideoStream: def __init__(self, src0): self.stream cv2.VideoCapture(src) self.stream.set(cv2.CAP_PROP_FRAME_WIDTH, 1280) self.stream.set(cv2.CAP_PROP_FRAME_HEIGHT, 720) self.stopped False self.queue queue.Queue(maxsize1) def start(self): Thread(targetself.update, args()).start() return self def update(self): while True: if self.stopped: return if not self.queue.full(): ret, frame self.stream.read() if ret: self.queue.put(frame) def read(self): return self.queue.get() def stop(self): self.stopped True5. 应用扩展与高级功能5.1 三维测量实践利用已知尺寸的ArUco标记可以测量其他物体的尺寸def measure_object(frame, mtx, dist, marker_length0.1): # 检测标记 corners, ids, _ detect_aruco(frame, mtx, dist) if ids is None: return frame # 估计标记位姿 rvec, tvec, _ cv2.aruco.estimatePoseSingleMarkers( corners, marker_length, mtx, dist) # 选择要测量的点示例鼠标点击 def click_event(event, x, y, flags, params): if event cv2.EVENT_LBUTTONDOWN: # 将2D点转换为3D射线 point_2d np.array([[[x, y]]], dtypenp.float32) undistorted cv2.undistortPoints(point_2d, mtx, dist) # 计算在标记坐标系中的3D坐标 R, _ cv2.Rodrigues(rvec[0]) point_3d R.T (undistorted[0,0] * tvec[0,0,2] - tvec[0,0]) cv2.putText(frame, fPosition: {point_3d.T[0]:.2f}m, (x,y), cv2.FONT_HERSHEY_SIMPLEX, 0.5, (0,0,255), 2) cv2.imshow(Measurement, frame) cv2.setMouseCallback(Measurement, click_event) return frame5.2 与ROS集成对于机器人应用可将位姿信息发布到ROS话题#!/usr/bin/env python import rospy from geometry_msgs.msg import PoseStamped import tf def publish_pose(mtx, dist): rospy.init_node(aruco_pose_publisher) pub rospy.Publisher(aruco_pose, PoseStamped, queue_size10) cap cv2.VideoCapture(0) rate rospy.Rate(30) # 30Hz while not rospy.is_shutdown(): ret, frame cap.read() if not ret: continue corners, ids, _ detect_aruco(frame, mtx, dist) if ids is None: continue rvec, tvec, _ cv2.aruco.estimatePoseSingleMarkers( corners, 0.1, mtx, dist) # 创建ROS消息 pose_msg PoseStamped() pose_msg.header.stamp rospy.Time.now() pose_msg.header.frame_id camera # 转换坐标系 R cv2.Rodrigues(rvec[0])[0] quat tf.transformations.quaternion_from_matrix( np.vstack((np.hstack((R, tvec[0].T)), [0,0,0,1]))) pose_msg.pose.position.x tvec[0][0][0] pose_msg.pose.position.y tvec[0][0][1] pose_msg.pose.position.z tvec[0][0][2] pose_msg.pose.orientation.x quat[0] pose_msg.pose.orientation.y quat[1] pose_msg.pose.orientation.z quat[2] pose_msg.pose.orientation.w quat[3] pub.publish(pose_msg) rate.sleep()5.3 增强现实应用结合OpenGL或Unity3D可以实现基于ArUco的AR场景import pyglet from pyglet.gl import * def ar_demo(mtx, dist): window pyglet.window.Window(1280, 720) cap cv2.VideoCapture(0) cap.set(cv2.CAP_PROP_FRAME_WIDTH, 1280) cap.set(cv2.CAP_PROP_FRAME_HEIGHT, 720) window.event def on_draw(): ret, frame cap.read() if not ret: return # 检测标记 corners, ids, _ detect_aruco(frame, mtx, dist) if ids is None: return # 估计位姿 rvec, tvec, _ cv2.aruco.estimatePoseSingleMarkers( corners, 0.1, mtx, dist) # 设置OpenGL投影矩阵 glMatrixMode(GL_PROJECTION) glLoadIdentity() fx, fy mtx[0,0], mtx[1,1] cx, cy mtx[0,2], mtx[1,2] glFrustum(-cx/fx, (1280-cx)/fx, -(720-cy)/fy, cy/fy, 1, 100) # 设置模型视图矩阵 glMatrixMode(GL_MODELVIEW) glLoadIdentity() R cv2.Rodrigues(rvec[0])[0] T tvec[0][0] glLoadMatrixf([R[0,0], R[1,0], R[2,0], 0, R[0,1], R[1,1], R[2,1], 0, R[0,2], R[1,2], R[2,2], 0, T[0], T[1], T[2], 1]) # 绘制3D内容 glBegin(GL_TRIANGLES) glColor3f(1,0,0) glVertex3f(0,0,0) glVertex3f(0.1,0,0) glVertex3f(0,0.1,0) glEnd() pyglet.app.run()6. 完整项目架构对于实际应用建议采用模块化设计aruco_vision_system/ ├── calibration/ # 标定相关 │ ├── calibrate.py # 标定脚本 │ └── calib_images/ # 标定图像 ├── config/ │ └── camera_params.pkl # 相机参数 ├── detection/ # 检测模块 │ ├── detector.py # ArUco检测 │ └── pose_estimator.py # 位姿估计 ├── utils/ │ ├── filters.py # 卡尔曼滤波 │ └── visualizer.py # 可视化工具 └── main.py # 主程序主程序示例import cv2 import pickle from detection.detector import ArucoDetector from detection.pose_estimator import PoseEstimator from utils.filters import PoseFilter def main(): # 加载相机参数 with open(config/camera_params.pkl, rb) as f: params pickle.load(f) # 初始化各模块 detector ArucoDetector() estimator PoseEstimator(params[mtx], params[dist]) pose_filter PoseFilter() # 视频流 cap cv2.VideoCapture(0) cap.set(cv2.CAP_PROP_FRAME_WIDTH, 1280) cap.set(cv2.CAP_PROP_FRAME_HEIGHT, 720) while True: ret, frame cap.read() if not ret: break # 处理流程 corners, ids detector.detect(frame) if ids is not None: rvecs, tvecs estimator.estimate(corners, marker_length0.1) filtered_pose pose_filter.update(np.concatenate([rvecs[0], tvecs[0]])) # 可视化 frame estimator.draw_axes(frame, rvecs[0], tvecs[0]) cv2.putText(frame, fDistance: {filtered_pose[5]:.2f}m, (10,30), cv2.FONT_HERSHEY_SIMPLEX, 1, (0,255,0), 2) cv2.imshow(ARUCO Vision, frame) if cv2.waitKey(1) ord(q): break cap.release() cv2.destroyAllWindows() if __name__ __main__: main()在真实项目中我们遇到的最棘手问题往往是标定质量不稳定。有次为了获得最佳标定结果我们专门制作了高精度棋盘格并使用三脚架固定相机最终将重投影误差控制在0.15像素以下测距精度达到了毫米级。这告诉我们在计算机视觉领域前期的基础工作质量直接决定了最终效果的上限。
保姆级教程:用Python+OpenCV玩转ArUco码,实现相机位姿估计与测距(附完整代码)
发布时间:2026/5/24 2:04:15
PythonOpenCV实战从零构建ArUco视觉测距系统计算机视觉正在重塑我们与物理世界的交互方式。想象一下你的设备能够像人类一样理解周围物体的位置和方向——这正是ArUco码结合OpenCV实现的魔法。本文将带你从零开始构建一个完整的视觉测距系统不仅能识别特定标记还能精确计算相机与标记之间的三维空间关系。1. 环境配置与基础准备任何优秀的项目都始于稳固的基础。我们需要确保开发环境配置正确避免后续出现难以排查的问题。推荐使用Python 3.7和OpenCV 4.5版本这是经过验证的稳定组合。安装核心依赖只需一行命令pip install opencv-contrib-python numpy为什么选择opencv-contrib而不是基础版因为ArUco模块包含在contrib扩展包中。安装后验证是否成功import cv2 print(cv2.__version__) # 应显示4.5.x硬件准备同样重要相机选择普通USB摄像头即可但建议使用分辨率至少720p的型号打印ArUco标记使用标准DICT_5X5_100字典生成尺寸建议10x10cm以上标定棋盘建议使用8x11内角点的棋盘格实际角点数为7x10注意相机分辨率一旦确定整个项目流程中必须保持一致。这是影响精度的关键因素之一。2. 相机标定精度之源相机标定是后续所有工作的基石。这个过程相当于为相机建立视力档案记录它如何将三维世界映射到二维图像。2.1 数据采集最佳实践采集20-30张棋盘格图像覆盖相机视野的各个区域。注意棋盘格应占据图像1/3到1/2面积包含各种倾斜角度但避免极端角度确保光照均匀避免反光和阴影import cv2 import glob # 设置视频流分辨率与后续使用一致 cap cv2.VideoCapture(0) cap.set(cv2.CAP_PROP_FRAME_WIDTH, 1280) cap.set(cv2.CAP_PROP_FRAME_HEIGHT, 720) count 0 while True: ret, frame cap.read() cv2.imshow(Calibration, frame) key cv2.waitKey(1) if key ord(s): # 按s保存 cv2.imwrite(fcalib_{count}.jpg, frame) count 1 elif key ord(q): # 按q退出 break cap.release() cv2.destroyAllWindows()2.2 标定流程与质量优化标定质量直接影响最终精度。我们采用重投影误差筛选法提升标定结果误差阈值保留图像数平均重投影误差无筛选250.42像素0.3像素180.21像素0.2像素120.15像素优化后的标定代码def calibrate_camera(images_path, board_size(7,10)): # 准备对象点 objp np.zeros((board_size[0]*board_size[1],3), np.float32) objp[:,:2] np.mgrid[0:board_size[0],0:board_size[1]].T.reshape(-1,2) # 收集所有图像的点 objpoints [] # 3D点 imgpoints [] # 2D点 images glob.glob(f{images_path}/*.jpg) for fname in images: img cv2.imread(fname) gray cv2.cvtColor(img, cv2.COLOR_BGR2GRAY) # 查找角点 ret, corners cv2.findChessboardCorners(gray, board_size, None) if ret: objpoints.append(objp) corners2 cv2.cornerSubPix(gray,corners,(11,11),(-1,-1), (cv2.TERM_CRITERIA_EPS cv2.TERM_CRITERIA_MAX_ITER, 30, 0.001)) imgpoints.append(corners2) # 初次标定 ret, mtx, dist, rvecs, tvecs cv2.calibrateCamera(objpoints, imgpoints, gray.shape[::-1], None, None) # 误差筛选 new_objpoints [] new_imgpoints [] for i in range(len(objpoints)): imgpoints2, _ cv2.projectPoints(objpoints[i], rvecs[i], tvecs[i], mtx, dist) error cv2.norm(imgpoints[i], imgpoints2, cv2.NORM_L2)/len(imgpoints2) if error 0.3: # 筛选阈值 new_objpoints.append(objpoints[i]) new_imgpoints.append(imgpoints[i]) # 最终标定 ret, mtx, dist, rvecs, tvecs cv2.calibrateCamera(new_objpoints, new_imgpoints, gray.shape[::-1], None, None) return mtx, dist保存标定结果供后续使用import pickle with open(camera_calib.pkl, wb) as f: pickle.dump({mtx:mtx, dist:dist}, f)3. ArUco检测与位姿估计3.1 检测流程全解析ArUco检测看似简单实则包含多个关键步骤图像预处理转换为灰度图可能应用自适应阈值标记检测寻找候选四边形验证内部编码位姿估计利用PnP算法求解相机姿态def detect_aruco(frame, mtx, dist): gray cv2.cvtColor(frame, cv2.COLOR_BGR2GRAY) aruco_dict cv2.aruco.Dictionary_get(cv2.aruco.DICT_5X5_100) parameters cv2.aruco.DetectorParameters_create() # 核心检测函数 corners, ids, rejected cv2.aruco.detectMarkers( gray, aruco_dict, parametersparameters, cameraMatrixmtx, distCoeffdist) return corners, ids, rejected3.2 位姿估计数学原理estimatePoseSingleMarkers函数返回的rvec和tvec表示标记在相机坐标系中的位置。但实际应用中我们通常需要相机在标记坐标系中的位姿——这需要进行坐标系转换。转换关系推导旋转向量 → 旋转矩阵R_marker_to_cam, _ cv2.Rodrigues(rvec)相机在标记坐标系中的旋转R_cam_to_marker R_marker_to_cam.T相机在标记坐标系中的位置t_cam_to_marker -R_cam_to_marker tvec.reshape(3,1)完整位姿估计函数def estimate_pose(frame, mtx, dist, marker_length0.1): corners, ids, _ detect_aruco(frame, mtx, dist) if ids is not None: rvecs, tvecs, _ cv2.aruco.estimatePoseSingleMarkers( corners, marker_length, mtx, dist) for i in range(len(ids)): # 绘制坐标系 cv2.aruco.drawDetectedMarkers(frame, corners) cv2.drawFrameAxes(frame, mtx, dist, rvecs[i], tvecs[i], 0.05) # 坐标系转换 R, _ cv2.Rodrigues(rvecs[i]) R_inv R.T tvec tvecs[i].reshape(3,1) camera_pos -R_inv tvec # 计算距离和角度 distance np.linalg.norm(camera_pos) angle np.degrees(np.arctan2(camera_pos[0,0], camera_pos[2,0])) # 显示信息 cv2.putText(frame, fDist: {distance[0]:.2f}m, (10,30), cv2.FONT_HERSHEY_SIMPLEX, 0.7, (0,255,0), 2) cv2.putText(frame, fAngle: {angle:.1f}deg, (10,70), cv2.FONT_HERSHEY_SIMPLEX, 0.7, (0,255,0), 2) return frame4. 实战优化与性能提升4.1 常见问题解决方案问题1检测不稳定原因光照变化或标记部分遮挡解决添加卡尔曼滤波平滑输出from pykalman import KalmanFilter class PoseFilter: def __init__(self): self.kf KalmanFilter(transition_matricesnp.eye(6), observation_matricesnp.eye(6)) self.state_means None self.state_covariances None def update(self, pose): if self.state_means is None: self.state_means pose self.state_covariances np.eye(6) else: self.state_means, self.state_covariances ( self.kf.filter_update(self.state_means, self.state_covariances, observationpose)) return self.state_means问题2测距误差大检查清单标定质量重投影误差0.3像素标记物理尺寸测量准确分辨率一致性采集、标定、检测阶段相同4.2 多标记协同定位单个标记的视野有限多标记系统可扩展工作范围def multi_marker_pose(frame, mtx, dist): corners, ids, _ detect_aruco(frame, mtx, dist) if ids is None or len(ids) 2: return frame # 构建3D-2D对应点 obj_points [] img_points [] marker_length 0.1 # 实际尺寸 for i in range(len(ids)): # 假设标记在XY平面Z0 corners3d np.array([ [-marker_length/2, marker_length/2, 0], [marker_length/2, marker_length/2, 0], [marker_length/2, -marker_length/2, 0], [-marker_length/2, -marker_length/2, 0] ]) # 根据ID设置不同位置 corners3d [ids[i][0]*0.2, 0, 0] obj_points.extend(corners3d) img_points.extend(corners[i][0]) # 使用所有标记求解位姿 _, rvec, tvec cv2.solvePnP( np.array(obj_points), np.array(img_points), mtx, dist) # 可视化 cv2.drawFrameAxes(frame, mtx, dist, rvec, tvec, 0.1) return frame4.3 性能优化技巧实时性优化降低分辨率保持精度前提下使用ROI限制检测区域多线程处理采集与计算分离from threading import Thread import queue class VideoStream: def __init__(self, src0): self.stream cv2.VideoCapture(src) self.stream.set(cv2.CAP_PROP_FRAME_WIDTH, 1280) self.stream.set(cv2.CAP_PROP_FRAME_HEIGHT, 720) self.stopped False self.queue queue.Queue(maxsize1) def start(self): Thread(targetself.update, args()).start() return self def update(self): while True: if self.stopped: return if not self.queue.full(): ret, frame self.stream.read() if ret: self.queue.put(frame) def read(self): return self.queue.get() def stop(self): self.stopped True5. 应用扩展与高级功能5.1 三维测量实践利用已知尺寸的ArUco标记可以测量其他物体的尺寸def measure_object(frame, mtx, dist, marker_length0.1): # 检测标记 corners, ids, _ detect_aruco(frame, mtx, dist) if ids is None: return frame # 估计标记位姿 rvec, tvec, _ cv2.aruco.estimatePoseSingleMarkers( corners, marker_length, mtx, dist) # 选择要测量的点示例鼠标点击 def click_event(event, x, y, flags, params): if event cv2.EVENT_LBUTTONDOWN: # 将2D点转换为3D射线 point_2d np.array([[[x, y]]], dtypenp.float32) undistorted cv2.undistortPoints(point_2d, mtx, dist) # 计算在标记坐标系中的3D坐标 R, _ cv2.Rodrigues(rvec[0]) point_3d R.T (undistorted[0,0] * tvec[0,0,2] - tvec[0,0]) cv2.putText(frame, fPosition: {point_3d.T[0]:.2f}m, (x,y), cv2.FONT_HERSHEY_SIMPLEX, 0.5, (0,0,255), 2) cv2.imshow(Measurement, frame) cv2.setMouseCallback(Measurement, click_event) return frame5.2 与ROS集成对于机器人应用可将位姿信息发布到ROS话题#!/usr/bin/env python import rospy from geometry_msgs.msg import PoseStamped import tf def publish_pose(mtx, dist): rospy.init_node(aruco_pose_publisher) pub rospy.Publisher(aruco_pose, PoseStamped, queue_size10) cap cv2.VideoCapture(0) rate rospy.Rate(30) # 30Hz while not rospy.is_shutdown(): ret, frame cap.read() if not ret: continue corners, ids, _ detect_aruco(frame, mtx, dist) if ids is None: continue rvec, tvec, _ cv2.aruco.estimatePoseSingleMarkers( corners, 0.1, mtx, dist) # 创建ROS消息 pose_msg PoseStamped() pose_msg.header.stamp rospy.Time.now() pose_msg.header.frame_id camera # 转换坐标系 R cv2.Rodrigues(rvec[0])[0] quat tf.transformations.quaternion_from_matrix( np.vstack((np.hstack((R, tvec[0].T)), [0,0,0,1]))) pose_msg.pose.position.x tvec[0][0][0] pose_msg.pose.position.y tvec[0][0][1] pose_msg.pose.position.z tvec[0][0][2] pose_msg.pose.orientation.x quat[0] pose_msg.pose.orientation.y quat[1] pose_msg.pose.orientation.z quat[2] pose_msg.pose.orientation.w quat[3] pub.publish(pose_msg) rate.sleep()5.3 增强现实应用结合OpenGL或Unity3D可以实现基于ArUco的AR场景import pyglet from pyglet.gl import * def ar_demo(mtx, dist): window pyglet.window.Window(1280, 720) cap cv2.VideoCapture(0) cap.set(cv2.CAP_PROP_FRAME_WIDTH, 1280) cap.set(cv2.CAP_PROP_FRAME_HEIGHT, 720) window.event def on_draw(): ret, frame cap.read() if not ret: return # 检测标记 corners, ids, _ detect_aruco(frame, mtx, dist) if ids is None: return # 估计位姿 rvec, tvec, _ cv2.aruco.estimatePoseSingleMarkers( corners, 0.1, mtx, dist) # 设置OpenGL投影矩阵 glMatrixMode(GL_PROJECTION) glLoadIdentity() fx, fy mtx[0,0], mtx[1,1] cx, cy mtx[0,2], mtx[1,2] glFrustum(-cx/fx, (1280-cx)/fx, -(720-cy)/fy, cy/fy, 1, 100) # 设置模型视图矩阵 glMatrixMode(GL_MODELVIEW) glLoadIdentity() R cv2.Rodrigues(rvec[0])[0] T tvec[0][0] glLoadMatrixf([R[0,0], R[1,0], R[2,0], 0, R[0,1], R[1,1], R[2,1], 0, R[0,2], R[1,2], R[2,2], 0, T[0], T[1], T[2], 1]) # 绘制3D内容 glBegin(GL_TRIANGLES) glColor3f(1,0,0) glVertex3f(0,0,0) glVertex3f(0.1,0,0) glVertex3f(0,0.1,0) glEnd() pyglet.app.run()6. 完整项目架构对于实际应用建议采用模块化设计aruco_vision_system/ ├── calibration/ # 标定相关 │ ├── calibrate.py # 标定脚本 │ └── calib_images/ # 标定图像 ├── config/ │ └── camera_params.pkl # 相机参数 ├── detection/ # 检测模块 │ ├── detector.py # ArUco检测 │ └── pose_estimator.py # 位姿估计 ├── utils/ │ ├── filters.py # 卡尔曼滤波 │ └── visualizer.py # 可视化工具 └── main.py # 主程序主程序示例import cv2 import pickle from detection.detector import ArucoDetector from detection.pose_estimator import PoseEstimator from utils.filters import PoseFilter def main(): # 加载相机参数 with open(config/camera_params.pkl, rb) as f: params pickle.load(f) # 初始化各模块 detector ArucoDetector() estimator PoseEstimator(params[mtx], params[dist]) pose_filter PoseFilter() # 视频流 cap cv2.VideoCapture(0) cap.set(cv2.CAP_PROP_FRAME_WIDTH, 1280) cap.set(cv2.CAP_PROP_FRAME_HEIGHT, 720) while True: ret, frame cap.read() if not ret: break # 处理流程 corners, ids detector.detect(frame) if ids is not None: rvecs, tvecs estimator.estimate(corners, marker_length0.1) filtered_pose pose_filter.update(np.concatenate([rvecs[0], tvecs[0]])) # 可视化 frame estimator.draw_axes(frame, rvecs[0], tvecs[0]) cv2.putText(frame, fDistance: {filtered_pose[5]:.2f}m, (10,30), cv2.FONT_HERSHEY_SIMPLEX, 1, (0,255,0), 2) cv2.imshow(ARUCO Vision, frame) if cv2.waitKey(1) ord(q): break cap.release() cv2.destroyAllWindows() if __name__ __main__: main()在真实项目中我们遇到的最棘手问题往往是标定质量不稳定。有次为了获得最佳标定结果我们专门制作了高精度棋盘格并使用三脚架固定相机最终将重投影误差控制在0.15像素以下测距精度达到了毫米级。这告诉我们在计算机视觉领域前期的基础工作质量直接决定了最终效果的上限。