python - 对极几何姿态估计 : Epipolar lines look good but wrong pose-6ren

python - 对极几何姿态估计 : Epipolar lines look good but wrong pose

转载作者：太空宇宙更新时间：2023-11-03 20:53:36

我正在尝试使用 OpenCV 来估计一台相机相对于另一台相机的位姿，方法是使用 SIFT 特征跟踪、FLANN 匹配，随后计算基础矩阵（fundamental matrix）和本质矩阵（essential matrix）。分解本质矩阵后，我检查退化配置并获得“正确的”R 和 t。

问题是，他们似乎从来都不是对的。我包括几个图像对:

图像 2 绕 Y 轴旋转了 45 度，位置与图像 1 相同。

图像对

结果

图像 2 的拍摄位置大约在沿负 X 方向几米远处，并在负 Y 方向有轻微位移。相机姿态绕 Y 轴旋转了大约 45-60 度。

图像对

结果

第二种情况下的平移向量似乎高估了 Y 方向的运动而低估了 X 方向的运动。在这两种情况下，将旋转矩阵转换为欧拉角后得到的结果都是错误的。许多其他数据集也会出现这种情况。我已经尝试在 RANSAC、LMEDS 等之间切换基础矩阵的计算方法，现在我先用 RANSAC 进行计算，然后仅用内点通过 8 点法进行第二次计算。更改特征检测方法也无济于事。对极线看起来是正确的，并且基础矩阵满足 x'.F.x = 0

我是否遗漏了一些根本性的错误？如果程序正确理解对极几何，可能会发生什么导致完全错误的姿势？我正在检查以确保点位于两个摄像头前面。任何想法/建议都会非常有帮助。谢谢!

编辑:对两台间隔一定距离的不同已标定相机拍摄的图片尝试了相同的方法，并将本质矩阵计算为 K2'.F.K1，但平移和旋转仍然有很大偏差。

Code供引用

import cv2
import numpy as np

from matplotlib import pyplot as plt

# K2 = np.float32([[1357.3, 0, 441.413], [0, 1355.9, 259.393], [0, 0, 1]]).reshape(3,3)
# K1 = np.float32([[1345.8, 0, 394.9141], [0, 1342.9, 291.6181], [0, 0, 1]]).reshape(3,3)

# K1_inv = np.linalg.inv(K1)
# K2_inv = np.linalg.inv(K2)

# 3x3 intrinsic matrix used to turn the fundamental matrix into an essential
# matrix, and its inverse used to normalise pixel coordinates.
# NOTE(review): the principal point (2088.8, 1161.4) suggests these values
# were calibrated at full image resolution, while the script later halves the
# images with cv2.resize -- confirm K matches the resolution actually matched.
K = np.array(
    [
        [3541.5, 0.0, 2088.8],
        [0.0, 3546.9, 1161.4],
        [0.0, 0.0, 1.0],
    ],
    dtype=np.float32,
)
K_inv = np.linalg.inv(K)

def in_front_of_both_cameras(first_points, second_points, rot, trans):
    """Check that every correspondence triangulates in front of both cameras.

    The second camera is modelled as ``X2 = rot . X1 + trans`` (camera matrix
    ``[R | t]`` with the first camera at ``[I | 0]``), which is the convention
    of the (R, t) candidates obtained from the SVD of an essential matrix.

    For each pair the two viewing rays are intersected in the least-squares
    sense, i.e. depths ``z1`` and ``z2`` are chosen to minimise
    ``|z1 * rot.p1 - z2 * p2 + trans|``.

    Args:
        first_points: iterable of normalised homogeneous points ``(x, y, 1)``
            in the first image.
        second_points: matching points in the second image, same format.
        rot: 3x3 rotation matrix candidate.
        trans: length-3 translation candidate.

    Returns:
        ``False`` as soon as one correspondence has a negative depth in either
        camera, ``True`` otherwise (including for empty input).
    """
    rot = np.asarray(rot, dtype=float)
    trans = np.asarray(trans, dtype=float).ravel()

    for first, second in zip(first_points, second_points):
        # Direction of the first ray expressed in the second camera frame.
        ray1 = rot.dot(np.asarray(first, dtype=float))
        ray2 = np.asarray(second, dtype=float)

        # Normal equations of the 3x2 system [ray1, -ray2] . [z1, z2] = -trans.
        a11 = ray1.dot(ray1)
        a22 = ray2.dot(ray2)
        a12 = ray1.dot(ray2)
        det = a11 * a22 - a12 * a12
        if det <= np.finfo(float).eps * a11 * a22:
            # Parallel rays carry no depth information; dividing by det here
            # would only yield inf/nan, so the pair is ignored.
            continue

        b1 = ray1.dot(trans)
        b2 = ray2.dot(trans)
        first_z = (a12 * b2 - a22 * b1) / det
        second_z = (a11 * b2 - a12 * b1) / det

        if first_z < 0 or second_z < 0:
            return False

    return True

def drawlines(img1,img2,lines,pts1,pts2):
    """Draw epilines on img1 and mark the matched points on both images.

    Args:
        img1: single-channel image on which the epilines are drawn.
        img2: single-channel image on which only the points are marked.
        lines: iterable of epilines for img1, each ``(a, b, c)`` describing
            ``a*x + b*y + c = 0``.
        pts1: points in img1, one per line.
        pts2: corresponding points in img2.

    Returns:
        ``(img1, img2)`` as BGR copies with the drawings applied.
    """
    pts1 = np.int32(pts1)
    pts2 = np.int32(pts2)
    rows, cols = img1.shape
    img1 = cv2.cvtColor(img1, cv2.COLOR_GRAY2BGR)
    img2 = cv2.cvtColor(img2, cv2.COLOR_GRAY2BGR)
    for line, pt1, pt2 in zip(lines, pts1, pts2):
        color = tuple(np.random.randint(0, 255, 3).tolist())
        a, b, c = line
        if b != 0:
            # Intersect the line with the left (x = 0) and right (x = cols) borders.
            start = (0, int(-c / b))
            end = (cols, int(-(c + a * cols) / b))
        elif a != 0:
            # Vertical epiline: y is unconstrained, so span top to bottom.
            x = int(-c / a)
            start, end = (x, 0), (x, rows)
        else:
            # a == b == 0 does not describe a line; only the points are drawn.
            start = end = None
        if start is not None:
            cv2.line(img1, start, end, color, 1)
        # Plain Python ints keep the point tuples acceptable to the drawing calls.
        cv2.circle(img1, tuple(int(v) for v in pt1), 10, color, -1)
        cv2.circle(img2, tuple(int(v) for v in pt2), 10, color, -1)
    return img1, img2


# Load both views as single-channel images (flag 0).
img1 = cv2.imread('C:\\Users\\Sai\\Desktop\\room1.jpg', 0)
img2 = cv2.imread('C:\\Users\\Sai\\Desktop\\room0.jpg', 0)
if img1 is None or img2 is None:
    # cv2.imread reports a missing/unreadable file by returning None.
    raise IOError("could not read one of the input images")

# Halve the resolution of both images before feature extraction.
# NOTE(review): the intrinsics used later must describe these resized images.
img1 = cv2.resize(img1, (0, 0), fx=0.5, fy=0.5)
img2 = cv2.resize(img2, (0, 0), fx=0.5, fy=0.5)

# cv2.SIFT() only exists in the OpenCV 2.4 bindings; newer builds expose the
# detector through the SIFT_create factory.
if hasattr(cv2, 'SIFT_create'):
    sift = cv2.SIFT_create()
else:
    sift = cv2.SIFT()

# find the keypoints and descriptors with SIFT
kp1, des1 = sift.detectAndCompute(img1, None)
kp2, des2 = sift.detectAndCompute(img2, None)

# FLANN parameters
FLANN_INDEX_KDTREE = 0
index_params = dict(algorithm=FLANN_INDEX_KDTREE, trees=5)
search_params = dict(checks=50)   # or pass empty dictionary

flann = cv2.FlannBasedMatcher(index_params, search_params)

# Two nearest neighbours per descriptor, needed for the ratio test below.
matches = flann.knnMatch(des1, des2, k=2)

good = []
pts1 = []
pts2 = []

# ratio test as per Lowe's paper
for pair in matches:
    if len(pair) < 2:
        # Without a second neighbour the ratio test cannot be evaluated.
        continue
    m, n = pair
    if m.distance < 0.7 * n.distance:
        good.append(m)
        pts2.append(kp2[m.trainIdx].pt)
        pts1.append(kp1[m.queryIdx].pt)

pts2 = np.float32(pts2)
pts1 = np.float32(pts1)
# First pass: RANSAC estimate, used only to separate inliers from outliers.
F, mask = cv2.findFundamentalMat(pts1, pts2, cv2.FM_RANSAC)

# Selecting only the inliers
inlier_flags = mask.ravel() == 1
pts1 = pts1[inlier_flags]
pts2 = pts2[inlier_flags]

# Second pass: 8-point estimate on the inliers only.
F, mask = cv2.findFundamentalMat(pts1, pts2, cv2.FM_8POINT)

print("Fundamental matrix is")
print("")
print(F)

# Epipolar constraint pt2 . F . pt1 evaluated on the first correspondence.
pt1 = np.array([[pts1[0][0]], [pts1[0][1]], [1]])
pt2 = np.array([[pts2[0][0], pts2[0][1], 1]])

# The product is a 1x1 array; .item() extracts the scalar explicitly instead
# of relying on implicit array-to-float conversion inside the % formatting.
print("Fundamental matrix error check: %f" % np.dot(np.dot(pt2, F), pt1).item())
print(" ")


# drawing lines on left image
lines1 = cv2.computeCorrespondEpilines(pts2.reshape(-1, 1, 2), 2, F)
lines1 = lines1.reshape(-1, 3)
img5, img6 = drawlines(img1, img2, lines1, pts1, pts2)

# drawing lines on right image
lines2 = cv2.computeCorrespondEpilines(pts1.reshape(-1, 1, 2), 1, F)
lines2 = lines2.reshape(-1, 3)
img3, img4 = drawlines(img2, img1, lines2, pts2, pts1)

# Essential matrix from the fundamental matrix and the shared intrinsics.
# NOTE(review): K has to describe the images that were actually matched (they
# are resized earlier in this script) -- confirm before trusting R and T.
E = K.T.dot(F).dot(K)

print("The essential matrix is")
print(E)
print("")

U, S, Vt = np.linalg.svd(E)
# E is only defined up to sign, so either SVD factor may be negated freely.
# Forcing det(U) = det(Vt) = +1 guarantees that U.W.Vt and U.Wt.Vt below are
# proper rotations (det = +1) rather than reflections.
if np.linalg.det(U) < 0:
    U = -U
if np.linalg.det(Vt) < 0:
    Vt = -Vt
W = np.array([[0.0, -1.0, 0.0],
              [1.0, 0.0, 0.0],
              [0.0, 0.0, 1.0]])

# normalize and homogenize the image coordinates
first_inliers = [K_inv.dot([x, y, 1.0]) for x, y in pts1]
second_inliers = [K_inv.dot([x, y, 1.0]) for x, y in pts2]

# Determine the correct choice of second camera matrix
# only in one of the four configurations will all the points be in front of
# both cameras (see Hartley & Zisserman, Result 9.19)
candidates = [
    (U.dot(W).dot(Vt), U[:, 2]),      # first choice:  R = U * W * Vt,  T = +u_3
    (U.dot(W).dot(Vt), -U[:, 2]),     # second choice: R = U * W * Vt,  T = -u_3
    (U.dot(W.T).dot(Vt), U[:, 2]),    # third choice:  R = U * Wt * Vt, T = +u_3
    (U.dot(W.T).dot(Vt), -U[:, 2]),   # fourth choice: R = U * Wt * Vt, T = -u_3
]
for R, T in candidates:
    if in_front_of_both_cameras(first_inliers, second_inliers, R, T):
        break
else:
    # No candidate passed; R and T keep the fourth choice, as before, but the
    # fall-through is now reported instead of being silent.
    print("Warning: no candidate pose puts all points in front of both cameras")
# Computing Euler angles
# NOTE(review): the three angles are labelled pitch/yaw/roll in the printout;
# which axis order/convention this decomposition assumes is not stated in the
# script -- confirm against the expected ground truth.

thetaX = np.arctan2(R[1][2], R[2][2])
c2 = np.sqrt(R[0][0] * R[0][0] + R[0][1] * R[0][1])

thetaY = np.arctan2(-R[0][2], c2)

s1 = np.sin(thetaX)
c1 = np.cos(thetaX)

thetaZ = np.arctan2(s1 * R[2][0] - c1 * R[1][0], c1 * R[1][1] - s1 * R[2][1])

# np.degrees converts with full-precision pi rather than a truncated 3.1415.
print("Pitch: %f, Yaw: %f, Roll: %f" % (np.degrees(thetaX), np.degrees(thetaY), np.degrees(thetaZ)))

print("Rotation matrix:")
print(R)
print("")
print("Translation vector:")
print(T)

# Show the two images annotated with epilines side by side.
plt.subplot(121)
plt.imshow(img5)
plt.subplot(122)
plt.imshow(img3)
plt.show()

最佳答案

有很多因素会导致根据点对应关系对相机位姿的估计不准确。您必须考虑的一些因素:-

(*) 8 点法最小化代数误差 ( x'.F.x = 0)。通常最好找到一个能最小化有意义的几何误差的解决方案。例如，您可以在 RANSAC 实现中使用重新投影误差。

(*) 用 8 点法求解基础矩阵的线性算法对噪声敏感。亚像素级精确的点匹配、适当的数据归一化和精确的相机标定对于获得更好的结果都很重要。

(*) 特征点定位和匹配会产生带噪声的点匹配，因此通过求解代数方程 x'Fx = 0 得到的解实际上只应作为初始估计，还需要进一步的步骤(例如参数优化)来改进该解。

(*) 某些双视图相机配置可能导致解存在歧义，因此需要进一步的方法(例如借助第三个视图消歧)才能获得可靠的结果。

关于python - 对极几何姿态估计 : Epipolar lines look good but wrong pose，我们在Stack Overflow上找到一个类似的问题： https://stackoverflow.com/questions/31737688/

文章推荐： c# - 在递归中使用 Math.Pow() 时超出了 c# 的执行时间限制

文章推荐： javascript - 坚持到顶部然后放入 css - [我有示例网站]

文章推荐： c# - 使用 ML.NET 的动态训练/测试类

wpf - 我如何将简单的形状位图转换为矢量(几何)
我想知道是否可以将简单的位图转换为几何对象最佳答案是的，您可以使用跟踪。 Potrace是一个开源的位图到矢量跟踪器库。然而，位图追踪并不完美。对于高质量的矢量图像，line tracer 一般
math - 几何:找到点两点之间的特定距离
这类似于this question，但是却相反。我有两个地理位置(纬度，经度)A和B。假设它们相距40海里。我想计算在A和B之间的直线上，从A点起10海里处的坐标。数学(我每天使用的其他一些数学)，
javascript - 几何 - 计算点到线的距离
我想计算一个点到由 2 个点定义的直线的距离。我正在使用 javascript，这就是我使用维基百科得出的结论:https://en.wikipedia.org/wiki/Distance_from
c++ - boost 、几何
我对 boost::geomentry 有疑问。 #include #include #include #include int main(){ typedef boost::geometry
c++ - 几何、交集
我有一个问题。我想将四边形与四边形相交。 int main(){ typedef boost::geometry::model::point_xy TBoostPoint; typedef b
c++ - 几何 -> OpenGL
我无法在 OpleGL 中获得正确的转换。我有 point3D - P(X,Y,Z) 和投影矩阵 M，它等于 K*(R|T) 其中 K - 相机标定矩阵 (R|T)——点(物)坐标系变换(R——旋转
algorithm - 几何 - 两侧为凸面的两个圆围绕几何中心旋转
我想做一个凸面(由一些直线或圆弧组成)围绕它的几何中心(Cx,Cy)旋转。同时凸面两侧有两个圆(由半径给出:R 和左中心:(Lx,Cy)，右中心:(Rx,Cy))。表示与几何(Cy) X 轴相同的圆心
.net - 几何 HitTest 中的错误
我有一个 DrawingVisual表示路径的元素，该路径的几何描述由此 syntax : "m106,59.3c0-1.98,0,0-4.95,0.989-3.96,0.989-13.8,3.96-
python - 如何创建图神经网络数据集？ (pytorch 几何)
如何将我自己的数据集转换为可供 pytorch 几何图形神经网络使用的数据集？所有教程都使用已转换为 pytorch 可用的现有数据集。例如，如果我有自己的点云数据集，我如何使用它来训练图神经网络的
python - 无法从类传递调整大小的 QLabel 几何
我正在使用 PyQt5 和 OpenCV。我想创建一个读取视频帧并执行橡皮筋拉伸(stretch)以生成几何图形的类，该几何图形将由不同的类用于裁剪视频流(此示例中不包括第二类)。在此示例中，从网络
database - 最近的(几何)点作为外键
我们有两个 (PostgreSQL 9.2) 表。第一城市: loc_id | integer | not null name | character
sql - Postgis 几何 where 条件
我有一张 table : create table if not exists places( id bigserial not null constraint places_pkey primary
postgresql - 在不查询数据库的情况下将经纬度转换为 PostGIS 几何
我在 postgresql 中有一个带有 PostGIS geometry(point, 4326) 列(位置，使用 SRID 4326)的表，我有一个使用 SQL Alchemy 更新表(其余列)的
C++ 11和 boost 几何
我开始使用 c++11 并尝试使用 boost geometry 运行一些示例代码 #include #include #include #include BOOST_GEOMETRY_REG
python - 将一列多边形从字符串转换为 GeoPandas 几何
我有一个存储为 csv 文件的数据框，其中一列是多边形对象。但是，此列存储为字符串而不是 GeoPandas 几何对象。如何将此列转换为 Geopandas 几何对象以便执行地理分析？这是我的数据的
opencv - 多 View 几何
我从两台相同品牌的相机拍摄的两张图像相距一定距离，拍摄相同的场景。我想计算两个相机之间的真实世界旋转和平移。为了实现这一点，我首先提取了两个图像的 SIFT 特征并匹配它们。我现在有了基本矩阵以及单
c++ - boost 几何/空间查询形状
我目前正在使用 boost 几何/空间索引库，以便对 3d 边界框执行范围查询。例如，我能够获得与查询边界框重叠的所有边界框的列表。文档 ( http://www.boost.org/doc/lib
c++ - 使用运行时指定尺寸的 boost 几何
boost::geometry::model::point 将点的维度作为编译时参数。例如， typedef bg::model::point point; 有没有什么方法可以在运行时指定维度，比如说
javascript - 将纹理添加到自定义 three.js 几何
我一直在寻找一种在 three.js 中将 uv 映射添加到我的自定义几何体的方法。我找到了这样做的方法，但我找到的解决方案都没有用。谁能解释一下 uv-mapping 的工作原理以及如何正确使用它？
iphone - 数学(几何): Rectangle projection?
在我的应用程序中，用户可以使用 iPhone 的 GPS 定义足球场的三个角落，方法是一个接一个地走到角落，然后点击按钮。这很好用，我可以在屏幕上绘制生成的矩形，类似于它在 Google map 中的

太空宇宙

个人简介

我是一名优秀的程序员,十分优秀！

作者热门文章

滴滴打车优惠券免费领取

全站热门文章

首页

博学

6Ren·AI

商城

python - 对极几何姿态估计 : Epipolar lines look good but wrong pose