ProReRansac.py

import numpy as np
import torch as t

import cv2
import random
from ReDefineError import angle_error
from ReDefineError import reprojection_error
from ReDefineError import end_iter_thresh
import time

def init():
    Pic= np.load('scenes_coordinate1.npy')   ##大小为1×3×480×640
    Pic = np.squeeze(Pic)   #压缩掉第一维1
    Pic = np.array(Pic, dtype=np.float32)
    #Pic=t.Tensor(Pic)
    distCoeffs = np.zeros(5, dtype=np.float32)
    #distCoeffs=t.Tensor(distCoeffs)
    CameraMatrix = np.array([[525, 0, 324],
                             [0, 525, 244],
                             [0, 0, 1]], dtype=np.float32)
    #CameraMatrix=t.Tensor(CameraMatrix)
    return Pic,distCoeffs,CameraMatrix

def Ran_Stard_test(Pic,CameraMatrix,distCoeffs):
    RanPw=[]
    RanPc=[]
    for i in range(Pic.shape[1]):
        for j in range(Pic.shape[2]):
            a=np.array(Pic[:, i, j])
            RanPw.append(a)
            RanPc.append(np.array([j,i]))

    RanPw=np.array(RanPw,dtype=np.float32)   #变为307200×3
    RanPc=np.array(RanPc,dtype=np.float32)

    _,R,trans,inliers=cv2.solvePnPRansac(RanPw,RanPc,CameraMatrix,distCoeffs,reprojectionError=10)
    r,_=cv2.Rodrigues(R)
    print('旋转平移的GT值为')
    print('R=',r)
    print('t=',trans)
    T=np.zeros((4,4),dtype=np.float32)
    T[0:3,0:3]=r
    T[0:3,3:4]=trans
    T[3][3]=1
    T_ni=np.linalg.inv(T)
    print('Tni=',T_ni)


    ra=random.randint(0,4799)
    pos_world=np.expand_dims((RanPw[ra]),axis=1)
    print('pos_world=',pos_world)
    zer=np.zeros((3,1),dtype=np.float32)

    pos_world=t.from_numpy(pos_world)
    pos_image=np.expand_dims(RanPc[ra],axis=1)
    pos_image=t.from_numpy(pos_image)
    CameraMatrix_tensor=t.from_numpy(CameraMatrix)

    Tni_tensor=t.from_numpy(T_ni)
    T_tensor=t.from_numpy(T)
    reloss = reprojection_error(Pose_Trans=T_tensor, Pos_world=pos_world, Internal_ref=CameraMatrix_tensor, GT=pos_image)

    anloss=angel_error(Pose_Trans=T_tensor,Pos_world=pos_world,Internal_ref=CameraMatrix_tensor,GT=pos_image)
    print('re_loss=',reloss)
    print('anloss=',anloss)


def Get_World_Pos(PointSet,WH_3Pw):
    '从选出的点中得到点对应的世界坐标系下的坐标'
    long=PointSet.shape[0]
    Point=np.zeros((long,3),dtype=np.float32)
    for i in range(long):
        x=int(PointSet[i][1])
        y=int(PointSet[i][0])      ##由于图像颠倒,ij换位
        pw = WH_3Pw[:,x,y]
        Point[i]=pw
    return Point

def Select256Rt(WH_3Pw,CameraMatrix,repro_threshold,distCoeffs):
    '选择256个重投影超过阈值的位姿:  WH_3Pw:numpy或tensor,3×w/8×h/8;  CameraMatrix: numpy，3×3；distCoeffs：numpy'
    CameraMatrix_np=np.array(CameraMatrix,dtype=np.float32)
    CameraMatrix_tensor= t.from_numpy(CameraMatrix_np)
    distCoeffs_np=np.array(distCoeffs,dtype=np.float32)
    distCoeffs_tensor=t.from_numpy(distCoeffs_np)
    Pic_width = WH_3Pw.shape[1]
    Pic_height = WH_3Pw.shape[2]

    Choose_point = np.zeros((Pic_width, Pic_height), dtype=np.int)  ##创建初始全0矩阵480×640，选过的点记为1
    Rt_set = []
    num_Rt = 0
    while (num_Rt != 256):  ##选256个Rt
        choose1 = random.randint(0, Pic_width - 1)     #0~479
        choose2 = random.randint(0, Pic_height - 1)    #0~639
        Four_point_set = []
        Num_of_Fourset = 0
        while (Num_of_Fourset < 4):  # 选4个点
            if (Choose_point[choose1][choose2] == 0):  ##点还未选过，可以用
                Four_point_set.append([choose2, choose1])    ##  由于图像颠倒，i,j 换位
                Num_of_Fourset = Num_of_Fourset + 1  ##四点组中组数+1
            choose1 = random.randint(0, Pic_width - 1)
            choose2 = random.randint(0, Pic_height - 1)
        ##到此为止 未重复的四点组合已经选入FourPointSet中，大小为4×2  等待确认是否可用

        P4image = np.array(Four_point_set, dtype=np.float32)  # 把四点组的图像坐标转变为numpy格式
        P4w = Get_World_Pos(P4image, WH_3Pw)  # 得到四点组的世界坐标，大小为4×3

        # 计算位姿
        bool, Rotate, trans = cv2.solvePnP(P4w, P4image, CameraMatrix_np, distCoeffs_np)
        #bool, Rotate, trans = cv2.solvePnP(P4w, P4image, CameraMatrix, distCoeffs,flags=cv2.SOLVEPNP_P3P)
        P4w = np.squeeze(P4w)
        P4image = np.squeeze(P4image)

        #得到大T矩阵
        Rotate, _ = cv2.Rodrigues(Rotate)
        TensorRotate = t.from_numpy(Rotate)
        TensorTrans = t.from_numpy(trans)
        TensorTT = t.zeros(4, 4)
        TensorTT[0:3, 0:3] = TensorRotate
        TensorTT[0:3, 3:4] = TensorTrans
        TensorTT[3][3] = 1

        Ok_flag = True
        for pw,pp in zip(P4w,P4image):
            pw=np.expand_dims(pw,axis=1)  ##把一个点的世界坐标系变为3×1的大小
            pw=t.from_numpy(pw)

            pp=np.expand_dims(pp,axis=1)  ##把一个点的图像坐标系变为2×1的大小
            pp=t.from_numpy(pp)

            RepreError = reprojection_error(TensorTT, pw, CameraMatrix_tensor, pp)
            print(RepreError)
            if ( RepreError > repro_threshold):
                Ok_flag = False
                print("大于阈值"+str(repro_threshold)+",跳过重选")
                break     ##四点组要是有一个小于阈值，则重新来,退出 for pw,pp in zip(……)，之后的全部写在flag==True里面

        # 在阈值范围内，保存Rt，修改初始记点矩阵
        if (Ok_flag == True):
            Rt_set.append(TensorTT)  ##保存T
            num_Rt = num_Rt + 1  # 保存了一个Rt
            print('重投影阈值设置为' + str(repro_threshold) +' 四点重投影误差均小于阈值，已被记录，当前共' + str(num_Rt) + '个Rt位姿')
            for pp in Four_point_set:
                x = int(pp[0])
                y = int(pp[1])
                Choose_point[y][x] = 1  ##记为四个点已经用过,xy调换
    print('256个位姿已经选择完成！')
    show=random.randint(0,255)
    print('随机取第'+str(show)+'个位姿展示：（该位姿未必正确）')
    print(np.linalg.inv(Rt_set[show]))   ##本身Rt为tensor类型，为显示更多的位数，拿np显示，取随机展示观察,该位姿未必正确
    return Rt_set


def Rt_compute_Dsample_Point(WH_3Pw,CameraMatrix,repro_threshold,distCoeffs):
    '输入np和tensor都可以，但最好是tensor：WH_3Pw: [3,w/8,h/8]; CameraMatrix:内参,3×3; repro_threshold：重投影阈值,常数'
    Numof_downsampe=int(8)   ##采样指数，算480*640则改成int(1)，算60*80则用int(8)
    CameraMatrix_np=np.array(CameraMatrix,dtype=np.float32)
    CameraMatrix_tensor=t.Tensor(CameraMatrix)
    Rt_set=Select256Rt(WH_3Pw=WH_3Pw,CameraMatrix=CameraMatrix_np,repro_threshold=repro_threshold,distCoeffs=distCoeffs)

    Pic_world=[]
    Pic_image=[]
    height=WH_3Pw.shape[1]/Numof_downsampe
    height=int(height)
    width=WH_3Pw.shape[2]/Numof_downsampe
    width=int(width)
    for x in range(height):
        for y in range(width):
            Pic_world.append(t.Tensor(np.expand_dims(WH_3Pw[:, Numof_downsampe*x, Numof_downsampe*y], axis=1)))  ##WH_3Pw[:, x, y]为大小为3的数组，加一个轴变为3×1大小
            Pic_image.append(t.from_numpy(np.array([[Numof_downsampe*y],
                                       [Numof_downsampe*x]],dtype=np.float32)))
    Num_RT=0 # 用来为输入第几个位姿变换计数，不输出可以删掉
    InThres=[]  ##用来存放不同位姿下的内点的数目
    Rt_inliers=[]  #用来存放不同位姿的内点图
    startt=time.time()
    for Rt in Rt_set:
        In_thresh=0 #内点数初始记为0
        inliers_map = []  ##用来存放某一位姿具体的内点，计划放在Rt_inliers里
        for pos_world,pos_img in zip(Pic_world,Pic_image):
            loss=reprojection_error(Pose_Trans=Rt,Pos_world=pos_world,Internal_ref=CameraMatrix_tensor,GT=pos_img)
            if(loss < repro_threshold):
                In_thresh=In_thresh+1    ##用来存放Rt的内点个数
                x=pos_img[0][0]
                y=pos_img[1][0]
                inliers_map.append([x,y])    #记录内点图

        Num_RT=Num_RT+1    # 用来为输入第几个位姿变换计数，不需要输出可以删掉
        print('当前正在计算第'+str(Num_RT)+'个位姿变换的重投影误差在阈值内的个数，个数为'+str(In_thresh)+'个')
        InThres.append(In_thresh)  ##将当前Rt的内点个数存入列表
        Rt_inliers.append(inliers_map) ##将当前Rt的内点图存入列表

    endd=time.time()
    print('256个位姿变换及其对应内点计算完成,共耗时:',endd-startt)
    MAXRt=InThres.index(max(InThres))
    print('第'+str(MAXRt)+'个位姿在阈值内的个数最多，最多为：'+str(max(InThres)))
    print('对应位姿为:',np.linalg.inv(Rt_set[MAXRt]))

    Inlier=np.array(Rt_inliers[MAXRt],dtype=np.float32)
    print('\n内点图大小为:',Inlier.shape)

    return Rt_set[MAXRt],Inlier    ##Rt为tensor类型，Inlier为numpy类型

def Custom_Ransac(WH_3Pw,CameraMatrix,repro_threshold,distCoeffs,finish_iter_threshold):
    '输入np和tensor都可以：WH_3Pw: [3,w/8,h/8]; CameraMatrix:内参,3×3; repro_threshold：重投影阈值,常数'
    CameraMatrix_np = np.array(CameraMatrix, dtype=np.float32)
    CameraMatrix_tensor = t.from_numpy(CameraMatrix_np)
    distCoeffs_np = np.array(distCoeffs, dtype=np.float32)
    distCoeffs_tensor= t.from_numpy(distCoeffs_np)
    Numof_downsampe = 8  ##采样指数，算480*640则改成int(1)，算60*80则用int(8)

    Rt,Inlier=Rt_compute_Dsample_Point(WH_3Pw=WH_3Pw,CameraMatrix=CameraMatrix,repro_threshold=repro_threshold,
                                        distCoeffs=distCoeffs)   #获取256个位姿下内点最多的位姿及其对应内点
    Orign_Rt=t.Tensor(Rt)
    Pw=Get_World_Pos(Inlier, WH_3Pw)  #获取对应内点的世界坐标系

    Pw=np.ascontiguousarray(Pw)
    Inlier=np.ascontiguousarray(Inlier)


    bool_,Rotate,trans=cv2.solvePnP(Pw,Inlier,CameraMatrix_np,distCoeffs_np)
    Rotate, _ = cv2.Rodrigues(Rotate)
    TensorRotate = t.from_numpy(Rotate)
    TensorTrans = t.from_numpy(trans)
    new_Rt = t.zeros(4, 4)
    new_Rt[0:3, 0:3] = TensorRotate
    new_Rt[0:3, 3:4] = TensorTrans
    new_Rt[3][3] = 1
    print('求出新的位姿变换：')
    print(new_Rt)

    diff=end_iter_thresh(Orign_Rt,new_Rt)
    print('与前一位姿差值为：',diff)
    Num=0
    while(diff > finish_iter_threshold): #开始迭代
        Num=Num+1
        print('设置终止阈值为',finish_iter_threshold,',该差值大于终止阈值，循环继续，当前正在进行第%s轮循环。'%Num)
        Orign_Rt=t.Tensor(new_Rt)
        Pic_world = []
        Pic_image = []
        height = WH_3Pw.shape[1] / Numof_downsampe
        height = int(height)
        width = WH_3Pw.shape[2] / Numof_downsampe
        width = int(width)
        for x in range(height):
            for y in range(width):
                Pic_world.append(t.Tensor(np.expand_dims(WH_3Pw[:, Numof_downsampe * x, Numof_downsampe * y],
                                                         axis=1)))  ##WH_3Pw[:, x, y]为大小为3的数组，加一个轴变为3×1大小
                Pic_image.append(t.from_numpy(np.array([[Numof_downsampe * y],
                                                        [Numof_downsampe * x]], dtype=np.float32)))
        inliers_map = []  ##用来存放某一位姿具体的内点，计划放在Rt_inliers里
        for pos_world, pos_img in zip(Pic_world, Pic_image):
            loss = reprojection_error(Pose_Trans=Rt, Pos_world=pos_world, Internal_ref=CameraMatrix_tensor,
                                      GT=pos_img)
            if (loss < repro_threshold):
                x = pos_img[0][0]
                y = pos_img[1][0]
                inliers_map.append([x, y])  # 记录内点图

        Inlier = np.array(inliers_map,dtype=np.float32)
        Pw = Get_World_Pos(Inlier, WH_3Pw)  # 获取对应内点的世界坐标系

        Pw1 = np.ascontiguousarray(Pw)
        Inlier1 = np.ascontiguousarray(Inlier)


        bool_, Rotate, trans = cv2.solvePnP(Pw1, Inlier1, CameraMatrix_np, distCoeffs_np)
        Rotate, _ = cv2.Rodrigues(Rotate)
        TensorRotate = t.from_numpy(Rotate)
        TensorTrans = t.from_numpy(trans)
        new_Rt = t.zeros(4, 4)
        new_Rt[0:3, 0:3] = TensorRotate
        new_Rt[0:3, 3:4] = TensorTrans
        new_Rt[3][3] = 1
        print('求出新的位姿变换：')
        print(np.linalg.inv(new_Rt))
        diff = end_iter_thresh(Orign_Rt, new_Rt)
        print('与前一位姿差值为：', diff.item())
    print('与前一时刻位姿相差小于阈值',finish_iter_threshold,',循环结束,求出位姿。')
    print('最终位姿为：')
    print(np.linalg.inv(new_Rt))


if __name__=='__main__':
    start=time.time()
    Pic,distCoeffs, CameraMatrix=init()
    #Pic,distCoeffs, CameraMatrix=init()
    #Ran_Stard_test(Pic=Pic, CameraMatrix=CameraMatrix, distCoeffs=distCoeffs)   #此句用来验证标准PnPRansac输出,测试完成
    #Rt_set=Select256Rt(WH_3Pw=Pic, CameraMatrix=CameraMatrix, repro_threshold=10, distCoeffs=distCoeffs)  ##此句用来验证选择256位姿正确性，测试完成
    #Rt_compute_Dsample_Point(WH_3Pw=Pic, CameraMatrix=CameraMatrix, repro_threshold=10, distCoeffs=distCoeffs)##此句用来验证选择内点最多的256位姿之一算法，测试完成
    Custom_Ransac(WH_3Pw=Pic, CameraMatrix=CameraMatrix, repro_threshold=10, distCoeffs=distCoeffs, finish_iter_threshold=1.2008e-07)
    end=time.time()
    print("时间=%s"%(end-start))