修复一份SfM（Structure from Motion）代码（可运行）

环境：Python、OpenCV（cv2）、NumPy、SciPy、Matplotlib；mayavi 需自行安装。

config.py(参数配置文件)：


import os
import numpy as np
 
# Directory that holds the input images (replace the placeholder text).
image_dir = '设置图片目录路径'

# Ratio threshold for the Lowe matching-ratio test applied in main.py.
MRT = 0.7

# Camera intrinsic matrix: K[0][0] and K[1][1] are the focal lengths,
# K[0][2] and K[1][2] are the pixel coordinates of the image centre.
K = np.array([
    [2362.12, 0.0, 720.0],
    [0.0, 2362.12, 578.0],
    [0.0, 0.0, 1.0],
])

# Range used when selectively discarding points: main.py compares the
# horizontal / vertical reprojection error against x / y respectively.
x = 0.5
y = 1

main.py(主文件)：


'''
原理可参考https://zhuanlan.zhihu.com/p/30033898
'''
import os
import cv2
import sys
import math
import config
import collections
import numpy as np
import matplotlib.pyplot as plt
from mayavi import mlab
from scipy.linalg import lstsq
from mpl_toolkits.mplot3d import Axes3D
from scipy.optimize import least_squares
 
##########################
#两张图之间的特征提取及匹配
##########################
def extract_features(image_names):
    """Detect SIFT key points, descriptors and key-point colours per image.

    Images that cannot be read, or that yield 10 or fewer key points, are
    skipped, so the results may hold fewer entries than ``image_names``.

    Args:
        image_names: iterable of image file paths.

    Returns:
        Three 1-D object arrays with one entry per kept image: the key
        points, the descriptor matrix, and a ``(n, 3)`` float array with the
        pixel value sampled under every key point (channel order as
        delivered by ``cv2.imread``).
    """
    def _as_object_array(items):
        # Every image yields a different number of key points, so the
        # per-image results are ragged.  np.array() on ragged input raises
        # ValueError on recent NumPy releases; filling an object array
        # element by element works on every version.
        packed = np.empty(len(items), dtype=object)
        for index, item in enumerate(items):
            packed[index] = item
        return packed

    # SIFT lives in the main module on newer OpenCV builds and in
    # xfeatures2d on older contrib builds.
    if hasattr(cv2, 'SIFT_create'):
        sift = cv2.SIFT_create(0, 3, 0.04, 10)
    else:
        sift = cv2.xfeatures2d.SIFT_create(0, 3, 0.04, 10)

    key_points_for_all = []
    descriptor_for_all = []
    colors_for_all = []
    for image_name in image_names:
        image = cv2.imread(image_name)
        if image is None:
            # Unreadable or non-image file.
            continue

        gray = cv2.cvtColor(image, cv2.COLOR_BGR2GRAY)
        key_points, descriptor = sift.detectAndCompute(gray, None)
        if len(key_points) <= 10:
            # Too few features to be useful for matching.
            continue

        # Sample the pixel under every key point (pt is (x, y), the image is
        # indexed [row, column]).
        colors = np.zeros((len(key_points), 3))
        for i, key_point in enumerate(key_points):
            px, py = key_point.pt
            colors[i] = image[int(py)][int(px)]

        key_points_for_all.append(key_points)
        descriptor_for_all.append(descriptor)
        colors_for_all.append(colors)

    return (
        _as_object_array(key_points_for_all),
        _as_object_array(descriptor_for_all),
        _as_object_array(colors_for_all),
    )
 
def match_features(query, train):
    """Match two descriptor sets with brute-force kNN and a ratio test.

    Args:
        query: descriptor matrix of the first image.
        train: descriptor matrix of the second image.

    Returns:
        NumPy array of the best matches whose distance is smaller than
        ``config.MRT`` times the distance of the second-best match.
    """
    bf = cv2.BFMatcher(cv2.NORM_L2)
    knn_matches = bf.knnMatch(query, train, k=2)
    matches = []
    # Lowe's matching ratio test (MRT).  There is no single standard form of
    # this filter; it can be adapted to the data at hand.
    for candidates in knn_matches:
        if len(candidates) < 2:
            # knnMatch may return fewer than k neighbours (e.g. when the
            # train set has fewer than two descriptors); the ratio test
            # cannot be evaluated then.
            continue
        best, second = candidates
        if best.distance < config.MRT * second.distance:
            matches.append(best)

    return np.array(matches)
 
def match_all_features(descriptor_for_all):
    """Match the descriptors of every pair of consecutive images.

    Args:
        descriptor_for_all: sequence of per-image descriptor matrices.

    Returns:
        1-D object array with ``len(descriptor_for_all) - 1`` entries; entry
        ``i`` is the result of ``match_features`` for images ``i`` and
        ``i + 1``.
    """
    pair_count = max(len(descriptor_for_all) - 1, 0)
    # The number of matches differs per pair; np.array() on such ragged
    # input raises ValueError on recent NumPy releases, so the object array
    # is filled explicitly.
    matches_for_all = np.empty(pair_count, dtype=object)
    for i in range(pair_count):
        matches_for_all[i] = match_features(descriptor_for_all[i], descriptor_for_all[i + 1])
    return matches_for_all
        
######################
#寻找图与图之间的对应相机旋转角度以及相机平移
######################
def find_transform(K, p1, p2):
    """Estimate the relative rotation and translation between two views.

    The essential matrix is estimated with RANSAC from the matched points,
    using the mean of the two focal lengths in ``K`` and its principal
    point; the pose is then recovered from it.

    Args:
        K: 3x3 camera intrinsic matrix.
        p1: matched image points of the first view.
        p2: matched image points of the second view.

    Returns:
        ``(R, T, mask)`` as returned by ``cv2.recoverPose``.
    """
    focal = (K[0, 0] + K[1, 1]) * 0.5
    center = (K[0, 2], K[1, 2])
    essential, inlier_mask = cv2.findEssentialMat(p1, p2, focal, center, cv2.RANSAC, 0.999, 1.0)

    # Intrinsics rebuilt with the averaged focal length used above.
    intrinsics = np.array([
        [focal, 0, center[0]],
        [0, focal, center[1]],
        [0, 0, 1],
    ])
    _, R, T, inlier_mask = cv2.recoverPose(essential, p1, p2, intrinsics, inlier_mask)

    return R, T, inlier_mask
 
def get_matched_points(p1, p2, matches):
    """Collect the image coordinates of both ends of every match.

    Args:
        p1: key points of the query image (indexed by ``queryIdx``).
        p2: key points of the train image (indexed by ``trainIdx``).
        matches: matches between the two images.

    Returns:
        ``(src_pts, dst_pts)``: arrays holding the ``pt`` of the matched key
        points, in match order.
    """
    src_pts = []
    dst_pts = []
    for match in matches:
        src_pts.append(p1[match.queryIdx].pt)
        dst_pts.append(p2[match.trainIdx].pt)

    return np.asarray(src_pts), np.asarray(dst_pts)
 
def get_matched_colors(c1, c2, matches):
    """Collect the colours of both ends of every match.

    Args:
        c1: per-key-point colours of the query image.
        c2: per-key-point colours of the train image.
        matches: matches between the two images.

    Returns:
        ``(color_src_pts, color_dst_pts)``: arrays of the colours at the
        matched key points, in match order.
    """
    color_src_pts = []
    color_dst_pts = []
    for match in matches:
        color_src_pts.append(c1[match.queryIdx])
        color_dst_pts.append(c2[match.trainIdx])

    return np.asarray(color_src_pts), np.asarray(color_dst_pts)
 
#选择重合的点
def maskout_points(p1, mask):
    """Keep only the entries of ``p1`` whose mask value is positive.

    Args:
        p1: sequence of points (or colours), aligned with ``mask``.
        mask: per-entry flags; entries with a value greater than 0 are kept.

    Returns:
        NumPy array with the kept entries, in their original order.
    """
    kept = [p1[index] for index, flag in enumerate(mask) if flag > 0]
    return np.array(kept)
    
def init_structure(K, key_points_for_all, colors_for_all, matches_for_all):
    """Build the initial point cloud from the first two images.

    The first camera is the reference frame (identity rotation, zero
    translation); the second camera pose comes from ``find_transform``.

    Args:
        K: 3x3 camera intrinsic matrix.
        key_points_for_all: per-image key points.
        colors_for_all: per-image key-point colours.
        matches_for_all: matches between consecutive images; only entry 0
            is used here.

    Returns:
        ``(structure, correspond_struct_idx, colors, rotations, motions)``:
        the triangulated points, a 1-D object array holding for every image
        an array that maps key-point index to structure index (-1 when the
        key point has no 3-D point), the colours of the points, and the
        rotation / translation lists for the first two cameras.
    """
    matches = matches_for_all[0]
    p1, p2 = get_matched_points(key_points_for_all[0], key_points_for_all[1], matches)
    c1, _ = get_matched_colors(colors_for_all[0], colors_for_all[1], matches)

    # Estimate the pose exactly once.  The previous code ran the RANSAC
    # estimation twice and tested the truthiness of the returned tuple,
    # which is always true.
    R, T, mask = find_transform(K, p1, p2)

    p1 = maskout_points(p1, mask)
    p2 = maskout_points(p2, mask)
    colors = maskout_points(c1, mask)

    # The first camera is the reference for all other camera transforms.
    R0 = np.eye(3, 3)
    T0 = np.zeros((3, 1))
    structure = reconstruct(K, R0, T0, R, T, p1, p2)
    rotations = [R0, R]
    motions = [T0, T]

    # One index array per image, initialised to -1.  The per-image lengths
    # differ, so an object array is filled explicitly (np.array() on ragged
    # input raises ValueError on recent NumPy releases).
    correspond_struct_idx = np.empty(len(key_points_for_all), dtype=object)
    for image_idx, key_p in enumerate(key_points_for_all):
        correspond_struct_idx[image_idx] = np.full(len(key_p), -1.0)

    idx = 0
    print("####################init_structure:queryIdx & trainIdx")
    for i, match in enumerate(matches):
        if mask[i] == 0:
            # Rejected by the pose estimation; no 3-D point exists for it.
            continue
        # Both ends of an inlier match refer to the same structure point.
        correspond_struct_idx[0][int(match.queryIdx)] = idx
        print(match.queryIdx," & ", match.trainIdx)
        correspond_struct_idx[1][int(match.trainIdx)] = idx
        idx += 1
    print("")
    return structure, correspond_struct_idx, colors, rotations, motions
    
#############
#三维重建
#############
def reconstruct(K, R1, T1, R2, T2, p1, p2):
    """Triangulate matched image points seen by two cameras.

    Args:
        K: 3x3 camera intrinsic matrix.
        R1, T1: rotation matrix and translation of the first camera.
        R2, T2: rotation matrix and translation of the second camera.
        p1, p2: matched image points in the first / second view; their
            transposes are handed to ``cv2.triangulatePoints``.

    Returns:
        NumPy array with one ``[x, y, z]`` row per triangulated point.
    """
    intrinsics = np.float32(K)

    def projection(rotation, translation):
        # 3x4 projection matrix K [R | t].
        extrinsic = np.zeros((3, 4))
        extrinsic[0:3, 0:3] = np.float32(rotation)
        extrinsic[:, 3] = np.float32(translation.T)
        return np.dot(intrinsics, extrinsic)

    homogeneous = cv2.triangulatePoints(projection(R1, T1), projection(R2, T2), p1.T, p2.T)

    structure = []
    for column in homogeneous.T:
        # Divide by the fourth (homogeneous) coordinate.
        scaled = column / column[3]
        structure.append([scaled[0], scaled[1], scaled[2]])

    return np.array(structure)
 
###########################
#将已作出的点云进行融合
###########################
def fusion_structure(matches, struct_indices, next_struct_indices, structure, next_structure, colors, next_colors):
    """Merge newly triangulated points into the existing point cloud.

    For every match, if the query key point already has a structure point,
    the train key point is linked to the same point.  Otherwise the newly
    triangulated point (and its colour) is appended to the cloud and both
    key points are linked to it.

    Args:
        matches: matches between the current and the next image.
        struct_indices: key-point -> structure index map of the current
            image (-1 = none); updated in place.
        next_struct_indices: same map for the next image; updated in place.
        structure: existing 3-D points.
        next_structure: points triangulated from ``matches`` (same order).
        colors: colours of the existing points.
        next_colors: colours aligned with ``matches``.

    Returns:
        ``(struct_indices, next_struct_indices, structure, colors)``.
    """
    added_points = []
    added_colors = []
    next_id = len(structure)

    for i, match in enumerate(matches):
        query_idx = match.queryIdx
        train_idx = match.trainIdx
        struct_idx = struct_indices[query_idx]
        if struct_idx >= 0:
            # Already reconstructed: only propagate the link.
            next_struct_indices[train_idx] = struct_idx
            continue
        added_points.append(next_structure[i])
        added_colors.append(next_colors[i])
        struct_indices[query_idx] = next_struct_indices[train_idx] = next_id
        next_id += 1

    # Append once instead of once per match: every np.append call copies the
    # whole array, which made the original loop quadratic.
    if added_points:
        structure = np.append(structure, added_points, axis=0)
        colors = np.append(colors, added_colors, axis=0)
    return struct_indices, next_struct_indices, structure, colors
 
#制作图像点以及空间点
def get_objpoints_and_imgpoints(matches, struct_indices, structure, key_points):
    """Pair known 3-D points with their 2-D observations in the next image.

    Args:
        matches: matches between the current image (query) and the next
            image (train).
        struct_indices: key-point -> structure index map of the query image
            (-1 = no 3-D point).  Either the flat per-image array, or a
            nested sequence whose first entry is that array (the form the
            previous implementation required).
        structure: array of 3-D points.
        key_points: key points of the train image.

    Returns:
        ``(object_points, image_points)``: the 3-D points and the matching
        ``pt`` coordinates, one row per usable match.
    """
    # The previous code hard-coded struct_indices[0].  Accept the flat
    # per-image map as well, so callers can pass the map of any image.
    if len(struct_indices) > 0 and np.ndim(struct_indices[0]) > 0:
        indices = struct_indices[0]
    else:
        indices = struct_indices

    object_points = []
    image_points = []
    print("####################get_objpoints_and_imgpoints:queryIdx & trainIdx:")
    for match in matches:
        query_idx = match.queryIdx
        train_idx = match.trainIdx
        print(query_idx," & ",train_idx)
        struct_idx = indices[query_idx]
        if struct_idx < 0:
            # The query key point has not been reconstructed.
            continue
        object_points.append(structure[int(struct_idx)])
        image_points.append(key_points[train_idx].pt)
    print("")
    return np.array(object_points), np.array(image_points)
 
########################
#bundle adjustment
########################
 
# 这部分中，函数get_3dpos是原方法中对某些点的调整，而get_3dpos2是根据笔者的需求进行的修正，即将原本需要修正的点全部删除。
# bundle adjustment请参见https://www.cnblogs.com/zealousness/archive/2018/12/21/10156733.html
 
def get_3dpos(pos, ob, r, t, K):
    """Refine one 3-D point by minimising its reprojection error.

    Args:
        pos: initial 3-D position.
        ob: observed 2-D image point.
        r, t: rotation and translation handed to ``cv2.projectPoints``.
        K: 3x3 camera intrinsic matrix.

    Returns:
        The position found by ``scipy.optimize.least_squares``.
    """
    def reprojection_residual(candidate):
        projected, _ = cv2.projectPoints(candidate.reshape(1, 1, 3), r, t, K, np.array([]))
        return ob - projected.reshape(2)

    return least_squares(reprojection_residual, pos).x
 
def get_3dpos_v1(pos,ob,r,t,K):
    """Reject a 3-D point whose reprojection error is too large.

    Args:
        pos: 3-D position to check.
        ob: observed 2-D image point.
        r, t: rotation and translation handed to ``cv2.projectPoints``.
        K: 3x3 camera intrinsic matrix.

    Returns:
        ``pos`` unchanged, or ``None`` when the horizontal error exceeds
        ``config.x`` or the vertical error exceeds ``config.y``.
    """
    projected, _ = cv2.projectPoints(pos.reshape(1, 1, 3), r, t, K, np.array([]))
    residual = ob - projected.reshape(2)
    too_far = abs(residual[0]) > config.x or abs(residual[1]) > config.y
    return None if too_far else pos
 
def bundle_adjustment(rotations, motions, K, correspond_struct_idx, key_points_for_all, structure):
    """Invalidate structure points with a large reprojection error.

    Every observed 3-D point is checked with ``get_3dpos_v1`` in each camera
    that sees it; points rejected there are overwritten with NaN so the
    caller can filter them out.

    Args:
        rotations: per-camera rotation matrices (left unmodified).
        motions: per-camera translations.
        K: 3x3 camera intrinsic matrix.
        correspond_struct_idx: per-image key-point -> structure index maps
            (-1 = no 3-D point).
        key_points_for_all: per-image key points.
        structure: array of 3-D points; modified in place.

    Returns:
        ``structure`` with rejected points set to NaN.
    """
    # Convert into a new list: the previous code overwrote the caller's
    # rotation matrices with their Rodrigues vectors.
    rotation_vectors = [cv2.Rodrigues(rotation)[0] for rotation in rotations]

    # zip() stops at the shortest input, so images without a registered
    # camera are skipped instead of raising IndexError.
    cameras = zip(correspond_struct_idx, key_points_for_all, rotation_vectors, motions)
    for point3d_ids, key_points, r, t in cameras:
        for j, raw_id in enumerate(point3d_ids):
            point3d_id = int(raw_id)
            if point3d_id < 0:
                continue
            new_point = get_3dpos_v1(structure[point3d_id], key_points[j].pt, r, t, K)
            # Mark rejected points explicitly rather than relying on NumPy
            # converting None to NaN on assignment.
            structure[point3d_id] = np.nan if new_point is None else new_point

    return structure
 
#######################
#作图
#######################
 
# 这里有两种方式作图，其中一个是matplotlib做的，但是第二个是基于mayavi做的，效果上看，fig_v1效果更好。fig_v2是mayavi加颜色的效果。
 
def fig(structure, colors):
    """Show the point cloud as a coloured matplotlib 3-D scatter plot.

    Args:
        structure: ``(n, 3)`` array of 3-D points.
        colors: ``(n, 3)`` float array of per-point colours.  It is scaled
            by 1/255 and its channel order reversed IN PLACE, so the caller
            sees the converted values afterwards (``main`` passes the same
            array on to ``fig_v2``).
    """
    colors /= 255
    if len(colors):
        # Reverse the channel order ([2, 1, 0]) in place; the copy avoids
        # reading from the memory that is being written.
        colors[:] = colors[:, ::-1].copy()

    figure = plt.figure()
    figure.suptitle('3d')
    # Figure.gca(projection=...) was removed in Matplotlib 3.6;
    # add_subplot accepts the projection on old and new versions alike.
    ax = figure.add_subplot(111, projection = '3d')
    # A single scatter call instead of one artist per point.
    ax.scatter(
        structure[:, 0], structure[:, 1], structure[:, 2],
        c = colors[:len(structure)], s = 5, depthshade = False,
    )
    ax.set_xlabel('x axis')
    ax.set_ylabel('y axis')
    ax.set_zlabel('z axis')
    ax.view_init(elev = 135, azim = 90)
    plt.show()
 
def fig_v1(structure):
    """Show the point cloud with mayavi, without colours.

    Args:
        structure: array of 3-D points; columns 0, 1 and 2 are plotted as
            x, y and z.
    """
    xs, ys, zs = structure[:, 0], structure[:, 1], structure[:, 2]
    mlab.points3d(xs, ys, zs, mode = 'point', name = 'dinosaur')
    mlab.show()
 
def fig_v2(structure, colors):
    """Show the point cloud with mayavi, one coloured glyph per point.

    Args:
        structure: sequence of 3-D points.
        colors: per-point colours; the three components are passed to
            mayavi unchanged as the ``color`` tuple.
            NOTE(review): presumably they must already be normalised to
            0..1 -- confirm against the mayavi documentation.
    """
    for index, point in enumerate(structure):
        rgb = colors[index]
        mlab.points3d(
            point[0], point[1], point[2],
            mode = 'point', name = 'dinosaur', color = (rgb[0], rgb[1], rgb[2]),
        )

    mlab.show()
    
def main():
    """Run the incremental SfM pipeline on the images in ``config.image_dir``.

    Steps: extract and match features, initialise the structure from the
    first two images, register each further image with PnP and fuse its
    triangulated points, drop points with a large reprojection error, then
    display the result.

    Raises:
        ValueError: when fewer than two images yield usable features.
    """
    imgdir = config.image_dir
    # os.path.join works whether or not image_dir ends with a separator
    # (plain string concatenation silently built wrong paths without one).
    img_names = [os.path.join(imgdir, name) for name in sorted(os.listdir(imgdir))]

    # K is the camera intrinsic matrix.
    K = config.K

    key_points_for_all, descriptor_for_all, colors_for_all = extract_features(img_names)
    if len(key_points_for_all) < 2:
        raise ValueError('at least two images with usable features are required')
    matches_for_all = match_all_features(descriptor_for_all)
    structure, correspond_struct_idx, colors, rotations, motions = init_structure(
        K, key_points_for_all, colors_for_all, matches_for_all)

    for i in range(1, len(matches_for_all)):
        # 2D-3D correspondences for image i + 1 come from the matches
        # between image i and image i + 1 together with the structure
        # indices of image i.  The previous code always used image pair 0,
        # pairing 3-D points with key points of the wrong image.  The index
        # map is wrapped in a list because get_objpoints_and_imgpoints reads
        # entry 0 of its second argument.
        object_points, image_points = get_objpoints_and_imgpoints(
            matches_for_all[i], [correspond_struct_idx[i]], structure, key_points_for_all[i + 1])

        if len(image_points) == 0:
            # Without correspondences this camera cannot be registered.
            # Later images chain from it, so stop here; skipping only this
            # image would leave rotations/motions out of step with the
            # image indices.
            print('no 2D-3D correspondences for image %d; stopping registration' % (i + 1),
                  file=sys.stderr)
            break

        # solvePnPRansac needs a minimum number of points; smaller sets are
        # padded by repeating the first point until there are 7.
        while len(image_points) < 7:
            object_points = np.append(object_points, [object_points[0]], axis = 0)
            image_points = np.append(image_points, [image_points[0]], axis = 0)

        object_points = np.asarray(object_points, dtype = np.float64)
        image_points = np.asarray(image_points, dtype = np.float64)
        success, r, T, _ = cv2.solvePnPRansac(object_points, image_points, K, np.array([]))
        if not success:
            print('pose estimation failed for image %d; stopping registration' % (i + 1),
                  file=sys.stderr)
            break

        R, _ = cv2.Rodrigues(r)
        rotations.append(R)
        motions.append(T)
        p1, p2 = get_matched_points(key_points_for_all[i], key_points_for_all[i + 1], matches_for_all[i])
        c1, c2 = get_matched_colors(colors_for_all[i], colors_for_all[i + 1], matches_for_all[i])
        next_structure = reconstruct(K, rotations[i], motions[i], R, T, p1, p2)

        correspond_struct_idx[i], correspond_struct_idx[i + 1], structure, colors = fusion_structure(
            matches_for_all[i], correspond_struct_idx[i], correspond_struct_idx[i + 1],
            structure, next_structure, colors, c1)

    # Only images with a registered camera take part in the adjustment.
    registered = len(rotations)
    structure = bundle_adjustment(
        rotations, motions, K,
        correspond_struct_idx[:registered], key_points_for_all[:registered], structure)

    # bundle_adjustment marks rejected points with NaN; drop them together
    # with their colours in one pass.
    if len(structure):
        keep = ~np.isnan(structure[:, 0])
        structure = structure[keep]
        colors = colors[keep]

    print(len(structure))
    print(len(motions))

    # fig converts the colours in place before fig_v2 receives them.
    fig(structure,colors)
    fig_v2(structure, colors)
   
if __name__ == '__main__':
    main()

原始代码来源：adnappp/Sfm-python: 三维重建算法Structure from Motion(Sfm)的python实现 (github.com)
虽然可以运行，但最终结果和理想不太一样，希望有跑出好的结果的朋友交流一下~

相关阅读:
Python多线程教程
 doris手动添加分区自动消失的问题
 Android不带电池设备文件系统配置
 SpringFramework：Spring 概述
 Android 获取设备内存和外存
 每日一题： leetcode1726 同积元组
 .NET程序配置文件
 `算法知识` 最大公约数GCD
使用DIV+CSS技术设计的非遗文化网页与实现制作（web前端网页制作课作业）
炒冷饭、语雀崩、领会员-我最主观的一段文字
原文地址：https://blog.csdn.net/weixin_45647721/article/details/126869327