工业场景视觉测距实战：AGV 导航与避障

1. AGV 视觉导航需求

复制代码

AGV 视觉导航功能：
├── 定位：视觉 SLAM / 二维码定位
├── 测距：障碍物距离检测
├── 避障：实时障碍物规避
├── 导航：路径规划与跟踪
└── 装载：货物对接与装卸

2. 障碍物距离检测

python 复制代码

#!/usr/bin/env python3
"""agv_obstacle.py - AGV 障碍物检测"""
import cv2
import numpy as np
from ultralytics import YOLO

class AGVObstacleDetector:
    """AGV 障碍物检测器"""
    
    def __init__(self, model_path, camera_matrix, safety_distance=2.0):
        self.model = YOLO(model_path)
        self.camera_matrix = camera_matrix
        self.safety_distance = safety_distance  # 安全距离（米）
        self.fx = camera_matrix[0, 0]
        self.fy = camera_matrix[1, 1]
        
        # 已知物体尺寸
        self.known_sizes = {
            'person': 1.7,
            'forklift': 2.0,
            'pallet': 0.15,
            'box': 0.4,
            'obstacle': 1.0,
        }
    
    def detect_obstacles(self, image):
        """检测障碍物并估算距离"""
        results = self.model.predict(image, conf=0.3, verbose=False)
        
        obstacles = []
        for r in results:
            for box in r.boxes:
                cls_name = self.model.names[int(box.cls)]
                bbox = box.xyxy[0].tolist()
                conf = float(box.conf)
                
                # 估算距离
                distance = self._estimate_distance(bbox, cls_name)
                
                # 判断是否在安全距离内
                is_danger = distance < self.safety_distance
                
                obstacles.append({
                    'class': cls_name,
                    'bbox': bbox,
                    'confidence': conf,
                    'distance': distance,
                    'is_danger': is_danger,
                })
        
        return obstacles
    
    def _estimate_distance(self, bbox, cls_name):
        """估算距离"""
        x1, y1, x2, y2 = bbox
        pixel_height = y2 - y1
        
        if cls_name in self.known_sizes:
            real_height = self.known_sizes[cls_name]
            distance = (real_height * self.fy) / pixel_height
        else:
            # 默认估算
            distance = 500 / pixel_height
        
        return distance
    
    def get_navigation_command(self, obstacles):
        """根据障碍物生成导航命令"""
        # 检查前方障碍物
        front_obstacles = [o for o in obstacles if o['is_danger']]
        
        if not front_obstacles:
            return {'action': 'forward', 'speed': 'normal'}
        
        # 计算障碍物方向
        for obs in front_obstacles:
            cx = (obs['bbox'][0] + obs['bbox'][2]) / 2
            img_center = self.camera_matrix[0, 2]
            
            if cx < img_center - 100:
                return {'action': 'turn_right', 'reason': obs['class']}
            elif cx > img_center + 100:
                return {'action': 'turn_left', 'reason': obs['class']}
            else:
                return {'action': 'stop', 'reason': obs['class']}
        
        return {'action': 'stop', 'reason': 'obstacle'}

if __name__ == "__main__":
    calib = np.load("calibration.npz")
    detector = AGVObstacleDetector("yolo26n.pt", calib["camera_matrix"])
    
    cap = cv2.VideoCapture(0)
    
    while True:
        ret, frame = cap.read()
        if not ret:
            break
        
        obstacles = detector.detect_obstacles(frame)
        command = detector.get_navigation_command(obstacles)
        
        # 绘制
        for obs in obstacles:
            x1, y1, x2, y2 = map(int, obs['bbox'])
            color = (0, 0, 255) if obs['is_danger'] else (0, 255, 0)
            cv2.rectangle(frame, (x1, y1), (x2, y2), color, 2)
            label = f"{obs['class']} {obs['distance']:.1f}m"
            cv2.putText(frame, label, (x1, y1-10),
                       cv2.FONT_HERSHEY_SIMPLEX, 0.6, color, 2)
        
        # 显示导航命令
        cv2.putText(frame, f"CMD: {command['action']}", (10, 30),
                   cv2.FONT_HERSHEY_SIMPLEX, 1, (0, 255, 255), 2)
        
        cv2.imshow("AGV", frame)
        if cv2.waitKey(1) & 0xFF == ord('q'):
            break
    
    cap.release()
    cv2.destroyAllWindows()

3. 深度相机避障

python 复制代码

#!/usr/bin/env python3
"""depth_avoidance.py - 深度相机避障"""
import cv2
import numpy as np
import pyrealsense2 as rs

class DepthAvoidance:
    """深度相机避障"""
    
    def __init__(self, safety_distance=1.0):
        self.pipeline = rs.pipeline()
        config = rs.config()
        config.enable_stream(rs.stream.depth, 640, 480, rs.format.z16, 30)
        self.pipeline.start(config)
        
        self.safety_distance = safety_distance * 1000  # m → mm
    
    def check_obstacles(self):
        """检查障碍物"""
        frames = self.pipeline.wait_for_frames()
        depth_frame = frames.get_depth_frame()
        depth = np.asanyarray(depth_frame.get_data())
        
        # 分区域检查
        h, w = depth.shape
        regions = {
            'left': depth[:, :w//3],
            'center': depth[:, w//3:2*w//3],
            'right': depth[:, 2*w//3:],
        }
        
        obstacles = {}
        for name, region in regions.items():
            # 忽略 0 值（无效深度）
            valid = region[region > 0]
            if len(valid) > 0:
                min_distance = np.percentile(valid, 5)  # 5% 分位数
                obstacles[name] = {
                    'min_distance': min_distance / 1000,  # mm → m
                    'is_safe': min_distance > self.safety_distance,
                }
        
        return obstacles, depth
    
    def get_avoidance_command(self, obstacles):
        """避障命令"""
        left_safe = obstacles.get('left', {}).get('is_safe', True)
        center_safe = obstacles.get('center', {}).get('is_safe', True)
        right_safe = obstacles.get('right', {}).get('is_safe', True)
        
        if center_safe:
            return {'action': 'forward'}
        elif left_safe:
            return {'action': 'turn_left'}
        elif right_safe:
            return {'action': 'turn_right'}
        else:
            return {'action': 'stop'}

if __name__ == "__main__":
    avoidance = DepthAvoidance(safety_distance=1.0)
    
    while True:
        obstacles, depth = avoidance.check_obstacles()
        command = avoidance.get_avoidance_command(obstacles)
        
        print(f"障碍物: {obstacles}")
        print(f"命令: {command}")

4. 货物对接测距

python 复制代码

#!/usr/bin/env python3
"""docking.py - 货物对接"""
import cv2
import numpy as np

class CargoDocking:
    """货物对接"""
    
    def __init__(self, camera_matrix):
        self.fx = camera_matrix[0, 0]
        self.fy = camera_matrix[1, 1]
        self.cx = camera_matrix[0, 2]
        self.cy = camera_matrix[1, 2]
    
    def detect_docking_target(self, image, marker_size=0.1):
        """检测对接目标（ArUco 标记）"""
        aruco_dict = cv2.aruco.getPredefinedDictionary(cv2.aruco.DICT_4X4_50)
        detector = cv2.aruco.ArucoDetector(aruco_dict)
        
        corners, ids, _ = detector.detectMarkers(image)
        
        targets = []
        if ids is not None:
            for i, (corner, marker_id) in enumerate(zip(corners, ids.flatten())):
                # 估计位姿
                rvec, tvec, _ = cv2.aruco.estimatePoseSingleMarkers(
                    corner, marker_size, np.eye(3), np.zeros(5)
                )
                
                distance = np.linalg.norm(tvec[0][0])
                x_offset = tvec[0][0][0]
                y_offset = tvec[0][0][1]
                
                targets.append({
                    'id': marker_id,
                    'distance': distance,
                    'x_offset': x_offset,
                    'y_offset': y_offset,
                    'rvec': rvec[0][0],
                    'tvec': tvec[0][0],
                })
        
        return targets
    
    def get_docking_command(self, target):
        """生成对接命令"""
        if target is None:
            return {'action': 'search'}
        
        distance = target['distance']
        x_offset = target['x_offset']
        
        # 对接精度
        distance_threshold = 0.05  # 5cm
        angle_threshold = 0.05  # ~3°
        
        if distance < distance_threshold and abs(x_offset) < angle_threshold:
            return {'action': 'dock', 'status': 'aligned'}
        elif distance < distance_threshold:
            return {'action': 'adjust_lateral', 'offset': x_offset}
        elif abs(x_offset) > angle_threshold:
            return {'action': 'rotate', 'angle': x_offset}
        else:
            return {'action': 'approach', 'distance': distance}

if __name__ == "__main__":
    calib = np.load("calibration.npz")
    docking = CargoDocking(calib["camera_matrix"])
    
    cap = cv2.VideoCapture(0)
    
    while True:
        ret, frame = cap.read()
        if not ret:
            break
        
        targets = docking.detect_docking_target(frame)
        
        if targets:
            command = docking.get_docking_command(targets[0])
            print(f"目标: {targets[0]['id']}, 距离: {targets[0]['distance']:.3f}m")
            print(f"命令: {command}")
        
        cv2.imshow("Docking", frame)
        if cv2.waitKey(1) & 0xFF == ord('q'):
            break
    
    cap.release()
    cv2.destroyAllWindows()

总结

功能	传感器	精度	响应时间
障碍物检测	单目+YOLO	±10%	30ms
避障	深度相机	±2%	30ms
货物对接	ArUco+深度	±1cm	50ms
路径跟踪	视觉 SLAM	±5cm	100ms