基于 SIFT / ORB 特征匹配的 Homography estimation(注:下面的代码实际使用 cv2.estimateAffinePartial2D 估计 2×3 的部分仿射矩阵,而不是 3×3 的单应性矩阵)

SIFT

ORB

python 复制代码
import copy
import time

import cv2
import numpy as np


def draw_kpts(image0, image1, mkpts0, mkpts1, margin=10):
    """Render two grayscale images side by side and mark their keypoints.

    Both images are pasted onto a white canvas, ``image0`` on the left and
    ``image1`` on the right, separated by ``margin`` white columns. Every
    keypoint is drawn as a small filled green dot; the two point sets are
    walked in lockstep, and no connecting lines are drawn.

    Args:
        image0: Left image; must be 2-D, since its shape is unpacked as
            ``(height, width)``.
        image1: Right image; must be 2-D as well.
        mkpts0: ``(x, y)`` keypoints in ``image0`` pixel coordinates.
        mkpts1: ``(x, y)`` keypoints in ``image1`` pixel coordinates,
            paired by index with ``mkpts0``.
        margin: Width in pixels of the white gap between the two images.

    Returns:
        A ``(max(H0, H1), W0 + W1 + margin, 3)`` ``uint8`` array holding the
        annotated side-by-side view.
    """
    height0, width0 = image0.shape
    height1, width1 = image1.shape
    # Column at which the right-hand image starts on the canvas.
    right_start = width0 + margin

    canvas = np.full(
        (max(height0, height1), right_start + width1), 255, dtype=np.uint8
    )
    canvas[:height0, :width0] = image0
    canvas[:height1, right_start:] = image1
    # Replicate the single gray channel three times so colour can be drawn.
    out = np.repeat(canvas[:, :, np.newaxis], 3, axis=2)

    # Drawing needs integer pixel coordinates.
    left_pts = np.round(mkpts0).astype(int)
    right_pts = np.round(mkpts1).astype(int)

    green = (0, 255, 0)
    for left_pt, right_pt in zip(left_pts, right_pts):
        x0, y0 = left_pt.ravel()
        x1, y1 = right_pt.ravel()
        cv2.circle(out, (x0, y0), 2, green, -1, lineType=cv2.LINE_AA)
        # Shift the second point into the right-hand image's canvas region.
        cv2.circle(out, (x1 + right_start, y1), 2, green, -1,
                   lineType=cv2.LINE_AA)

    return out

if __name__ == "__main__":
    # Demo script: match SIFT features between two frames, discard
    # implausible matches, estimate the partial-affine motion between the
    # frames with RANSAC, and save a side-by-side keypoint visualisation.
    img0Path = "/training/datasets/orchard/orchard_imgs_/000130.jpg"
    img1Path = "/training/datasets/orchard/orchard_imgs_/000132.jpg"

    # Flag 0 loads the images as single-channel grayscale.
    img0 = cv2.imread(img0Path, 0)
    img1 = cv2.imread(img1Path, 0)
    # cv2.imread signals failure by returning None instead of raising, so
    # fail here with a clear message rather than later on `.shape`.
    for path, img in ((img0Path, img0), (img1Path, img1)):
        if img is None:
            raise FileNotFoundError(f"could not read image: {path}")
    h, w = img0.shape

    # Detection mask that ignores a 2% border on every side.
    # NOTE(review): the same mask is applied to img1, which assumes both
    # frames have the same resolution — confirm for other inputs.
    mask = np.zeros_like(img0)
    mask[int(0.02 * h): int(0.98 * h), int(0.02 * w): int(0.98 * w)] = 255

    # SIFT descriptors are float vectors, hence the L2 brute-force matcher.
    # (For a FAST + ORB variant, use cv2.FastFeatureDetector_create as the
    # detector, cv2.ORB_create as the extractor and cv2.NORM_HAMMING here.)
    detector = cv2.SIFT_create(nOctaveLayers=3, contrastThreshold=0.02, edgeThreshold=20)
    extractor = cv2.SIFT_create(nOctaveLayers=3, contrastThreshold=0.02, edgeThreshold=20)
    matcher = cv2.BFMatcher(cv2.NORM_L2)

    # Find keypoints in both frames.
    prev_keypoints = detector.detect(img0, mask)
    keypoints = detector.detect(img1, mask)

    # Compute the descriptors.
    prev_keypoints, prev_descriptors = extractor.compute(img0, prev_keypoints)
    keypoints, descriptors = extractor.compute(img1, keypoints)

    # Match descriptors (two nearest neighbours each, for the ratio test).
    # Skip matching when either frame produced no descriptors.
    if prev_descriptors is None or descriptors is None:
        knnMatches = ()
    else:
        knnMatches = matcher.knnMatch(prev_descriptors, descriptors, k=2)

    # Keep matches that pass the ratio test and whose displacement is below
    # a quarter of the image size along each axis.
    matches = []
    spatial_distances = []
    max_spatial_distance = 0.25 * np.array([w, h])

    for pair in knnMatches:
        # Fewer than two neighbours can come back when the second frame has
        # a single descriptor; the ratio test is undefined in that case.
        if len(pair) < 2:
            continue
        m, n = pair
        if m.distance >= 0.9 * n.distance:
            continue

        prevKeyPointLocation = prev_keypoints[m.queryIdx].pt
        currKeyPointLocation = keypoints[m.trainIdx].pt
        spatial_distance = (prevKeyPointLocation[0] - currKeyPointLocation[0],
                            prevKeyPointLocation[1] - currKeyPointLocation[1])

        if (abs(spatial_distance[0]) < max_spatial_distance[0]
                and abs(spatial_distance[1]) < max_spatial_distance[1]):
            spatial_distances.append(spatial_distance)
            matches.append(m)

    # Reject matches whose displacement deviates from the mean displacement
    # by more than 2.5 standard deviations on either axis. The deviation is
    # taken in absolute value so outliers on BOTH sides are rejected, and
    # `<=` keeps the matches when all displacements are identical (std 0).
    goodMatches = []
    if matches:
        displacements = np.asarray(spatial_distances, dtype=np.float64)
        deviation = np.abs(displacements - displacements.mean(axis=0))
        inliers = np.all(deviation <= 2.5 * displacements.std(axis=0), axis=1)
        goodMatches = [match for match, keep in zip(matches, inliers) if keep]

    # reshape(-1, 2) keeps a well-formed (0, 2) array when nothing survives.
    prevPoints = np.array(
        [prev_keypoints[match.queryIdx].pt for match in goodMatches],
        dtype=np.float64,
    ).reshape(-1, 2)
    currPoints = np.array(
        [keypoints[match.trainIdx].pt for match in goodMatches],
        dtype=np.float64,
    ).reshape(-1, 2)

    # Find the rigid (partial-affine) matrix. Start from the identity so H
    # is always defined, even when estimation is skipped or fails.
    H = np.eye(2, 3)
    if len(prevPoints) > 4 and len(prevPoints) == len(currPoints):
        # `method` must be passed by keyword: the third positional parameter
        # of the Python binding is the `inliers` output, not the method.
        estimate, _ransac_inliers = cv2.estimateAffinePartial2D(
            prevPoints, currPoints, method=cv2.RANSAC)
        if estimate is not None:
            H = estimate
        else:
            print('Warning: not enough matching points')
    else:
        print('Warning: not enough matching points')

    print(f"H : {H}")

    out = draw_kpts(img0, img1, prevPoints, currPoints)
    cv2.imwrite("keypoints.jpg", out)
相关推荐
武子康2 小时前
调查研究-198 Agent 到底该记住什么?读懂《What Must Generalist Agents Remember?》
人工智能·openai·agent
aqi002 小时前
15天学会AI应用开发(九)利用Chroma持久化向量数据
人工智能·python·大模型·ai编程·ai应用
武子康4 小时前
调查研究-197 FAISS vs Elasticsearch 全面对比:从向量检索、全文搜索到 RAG 选型指南
人工智能·elasticsearch·agent
青禾网络4 小时前
Web 前端如何接入 AI 音效生成:从零到可用的完整方案
人工智能·设计模式
用户252736278144 小时前
【技术实战】用 Spring Boot + Vue3 + LM Studio 在本地跑通 RAG 知识库
人工智能
用户5191495848454 小时前
VBScript随机数生成器内部机制:从时间种子到密码令牌破解
人工智能·aigc
米小虾4 小时前
Context Engineering —— 知识与记忆的窗口
人工智能·agent
IT_陈寒5 小时前
Python里这个赋值坑,连老司机都能翻车
前端·人工智能·后端
Shockang15 小时前
AI 设计工作流全景拆解:Figma MCP / Claude Design / Codex / Google Stitch
人工智能