Add examples for 'Solving Problems'

sunglok · sunglok · commit 27dca0c12890 · 2022-09-26T11:10:03.000+09:00
diff --git a/examples/affine_estimation.py b/examples/affine_estimation.py
@@ -0,0 +1,29 @@
+import cv2 as cv
+import numpy as np
+
+def getAffineTransform(src, dst):
+    """Estimate the 2x3 affine transformation that maps `src` points onto `dst` points.
+
+    Every correspondence (p, q) adds two rows to the linear system 'Ax = b',
+    whose unknowns are ordered as (a, b, c, d, tx, ty). The system is solved
+    with the pseudo-inverse, so more than three pairs are also accepted.
+
+    Returns the matrix [[a, b, tx], [c, d, ty]], or None if `src` and `dst`
+    do not contain the same number of points.
+    """
+    if len(src) != len(dst):
+        return None
+
+    # Build and solve 'Ax = b'
+    rows, rhs = [], []
+    for p, q in zip(src, dst):
+        rows += [[p[0], p[1], 0, 0, 1, 0],
+                 [0, 0, p[0], p[1], 0, 1]]
+        rhs += [q[0], q[1]]
+    a, b, c, d, tx, ty = np.linalg.pinv(rows) @ rhs
+
+    # Reorganize the six parameters as 'H'
+    return np.array([[a, b, tx], [c, d, ty]])
+
+if __name__ == '__main__':
+    # Three corresponding point pairs (the minimum for an affine transformation)
+    pts_src = np.array([[115, 401], [776, 180], [330, 793]], dtype=np.float32)
+    pts_dst = np.array([[0, 0], [900, 0], [0, 500]], dtype=np.float32)
+
+    # Estimate the transformation with both implementations
+    # Note) cv.getAffineTransform() accepts only 3 pairs of points.
+    results = [('\n### My Affine Transformation', getAffineTransform(pts_src, pts_dst)),
+               ('\n### OpenCV Affine Transformation', cv.getAffineTransform(pts_src, pts_dst))]
+
+    for title, H in results:
+        print(title)
+        print(H)
diff --git a/examples/camera_calibration_implement.py b/examples/camera_calibration_implement.py
@@ -0,0 +1,44 @@
+import numpy as np
+from scipy.optimize import least_squares
+from pose_estimation_implement import project_no_distort
+
+def fcxcy_to_K(f, cx, cy):
+    """Build the 3x3 camera matrix from one focal length `f` and the principal point (`cx`, `cy`)."""
+    K = np.array([[f, 0, cx],
+                  [0, f, cy],
+                  [0, 0, 1]])
+    return K
+
+def reproject_error_calib(unknown, Xs, xs):
+    """Return the flattened reprojection residuals of all images.
+
+    `unknown` is read as (f, cx, cy) followed by six values per image: a
+    rotation vector (3) and a translation vector (3). `Xs[i]` holds the 3D
+    points and `xs[i]` the observed 2D points of image `i`.
+    """
+    K = fcxcy_to_K(*unknown[0:3])
+    residuals = []
+    for i, x in enumerate(xs):
+        # The pose of image 'i' starts right after the three intrinsic parameters
+        pose = unknown[3 + 6 * i:9 + 6 * i]
+        xp = project_no_distort(Xs[i], pose[:3], pose[3:], K)
+        residuals.append(x - xp)
+    return np.vstack(residuals).ravel()
+
+def calibrateCamera(obj_pts, img_pts, img_size):
+    """Estimate (f, cx, cy) and one pose per image by minimizing the reprojection error.
+
+    `obj_pts[i]` and `img_pts[i]` are the 3D points and their 2D observations
+    in image `i`; `img_size` is indexed as (width, height) for the initial guess.
+
+    Returns (cost, K, zeros(5), rvecs, tvecs). The zero vector is presumably a
+    placeholder for distortion coefficients, which are not estimated here.
+    """
+    img_n = len(img_pts)
+
+    # Initial guess; sequence: f, cx, cy, img_n * (rvec, tvec)
+    intrinsic_init = [img_size[0], img_size[0]/2, img_size[1]/2]
+    pose_init = [0, 0, 0, 0, 0, 1.]
+    unknown_init = np.array(intrinsic_init + img_n * pose_init)
+    result = least_squares(reproject_error_calib, unknown_init, args=(obj_pts, img_pts))
+
+    # Split the solution into the camera matrix and the per-image poses
+    solution = result['x']
+    K = fcxcy_to_K(*solution[0:3])
+    rvecs, tvecs = [], []
+    for i in range(img_n):
+        offset = 6 * i + 3
+        rvecs.append(solution[offset:offset+3])
+        tvecs.append(solution[offset+3:offset+6])
+    return result['cost'], K, np.zeros(5), rvecs, tvecs
+
+if __name__ == '__main__':
+    img_size = (640, 480)
+    img_files = ['../bin/data/image_formation1.xyz', '../bin/data/image_formation2.xyz']
+
+    # Load the image points of every file (only the first two columns are used)
+    # Note) Each entry of 'img_files' must be read; loading a fixed path here
+    #       would feed identical observations to the calibration for all images.
+    img_pts = []
+    for img_file in img_files:
+        pts = np.loadtxt(img_file, dtype=np.float32)
+        img_pts.append(pts[:,:2])
+
+    pts = np.loadtxt('../bin/data/box.xyz', dtype=np.float32)
+    obj_pts = [pts] * len(img_pts) # Copy the object point as much as the number of image observation
+
+    # Calibrate the camera
+    _, K, *_ = calibrateCamera(obj_pts, img_pts, img_size)
+
+    print('\n### Ground Truth')
+    print('* f, cx, cy = 1000, 320, 240')
+    print('\n### My Calibration')
+    print(f'* f, cx, cy = {K[0,0]:.1f}, {K[0,2]:.1f}, {K[1,2]:.1f}')
diff --git a/examples/fundamental_mat_estimation.py b/examples/fundamental_mat_estimation.py
@@ -0,0 +1,36 @@
+import cv2 as cv
+import numpy as np
+
+def findFundamentalMat(pts1, pts2):
+    """Estimate the fundamental matrix 'F' from point correspondences by solving 'Ax = 0'.
+
+    `pts1` and `pts2` are arrays with one point per row; rows with two columns
+    are extended to homogeneous coordinates. Every pair (p, q) from
+    (`pts1`, `pts2`) contributes one row of the constraint 'q^T F p = 0'.
+    No coordinate normalization is applied before solving.
+
+    Returns the rank-2 matrix scaled so that its last element is 1, or None
+    if the two point sets differ in length.
+    """
+    if len(pts1) != len(pts2):
+        return None
+
+    # Make homogeneous coordinates if necessary
+    def to_homogeneous(pts):
+        if pts.shape[1] == 2:
+            return np.hstack((pts, np.ones((len(pts), 1), dtype=pts.dtype)))
+        return pts
+    pts1, pts2 = to_homogeneous(pts1), to_homogeneous(pts2)
+
+    # Solve 'Ax = 0' (the solution is the last row of 'Vt')
+    A = [[q[i] * p[j] for i in range(3) for j in range(3)] for p, q in zip(pts1, pts2)]
+    Vt = np.linalg.svd(A, full_matrices=True)[2]
+    F = Vt[-1].reshape(3, -1)
+
+    # Enforce 'rank(F) = 2' by removing the smallest singular value
+    U, S, Vt = np.linalg.svd(F)
+    S[-1] = 0
+    F = U @ np.diag(S) @ Vt
+    return F / F[-1,-1] # Normalize the last element as 1
+
+if __name__ == '__main__':
+    # Load the corresponding points of the two views
+    pts_a = np.loadtxt('../bin/data/image_formation0.xyz')
+    pts_b = np.loadtxt('../bin/data/image_formation1.xyz')
+
+    # Estimate the fundamental matrix with both implementations
+    # Note) The results are slightly different because OpenCV considers normalization.
+    my_F = findFundamentalMat(pts_a, pts_b)
+    cv_F, _ = cv.findFundamentalMat(pts_a, pts_b, cv.FM_8POINT)
+
+    for title, F in (('\n### My Fundamental Matrix', my_F),
+                     ('\n### OpenCV Fundamental Matrix', cv_F)):
+        print(title)
+        print(F)
diff --git a/examples/homography_estimation.py b/examples/homography_estimation.py
@@ -0,0 +1,34 @@
+import cv2 as cv
+import numpy as np
+
+def getPerspectiveTransform(src, dst):
+    """Estimate the 3x3 planar homography 'H' that maps `src` points onto `dst` points.
+
+    `src` and `dst` are arrays with one point per row; rows with two columns
+    are extended to homogeneous coordinates. Every pair contributes two rows
+    to the homogeneous system 'Ax = 0', which is solved by SVD.
+
+    Returns 'H' scaled so that its last element is 1, or None if the two
+    point sets differ in length.
+    """
+    if len(src) != len(dst):
+        return None
+
+    # Make homogeneous coordinates if necessary
+    def to_homogeneous(pts):
+        if pts.shape[1] == 2:
+            return np.hstack((pts, np.ones((len(pts), 1), dtype=pts.dtype)))
+        return pts
+    src, dst = to_homogeneous(src), to_homogeneous(dst)
+
+    # Solve 'Ax = 0' (the solution is the last row of 'Vt')
+    A = []
+    for p, q in zip(src, dst):
+        p3 = [p[0], p[1], p[2]]
+        wp = [q[2] * v for v in p3]
+        yp = [-q[1] * v for v in p3]
+        xp = [-q[0] * v for v in p3]
+        A.append([0, 0, 0] + wp + yp)
+        A.append(wp + [0, 0, 0] + xp)
+    x = np.linalg.svd(A, full_matrices=True)[2][-1]
+
+    # Reorganize 'H' and normalize the last element as 1
+    return x.reshape(3, -1) / x[-1]
+
+if __name__ == '__main__':
+    # Four corresponding point pairs (the minimum for a planar homography)
+    pts_src = np.array([[115, 401], [776, 180], [330, 793], [1080, 383]], dtype=np.float32)
+    pts_dst = np.array([[0, 0], [900, 0], [0, 500], [900, 500]], dtype=np.float32)
+
+    # Estimate the homography with both implementations
+    # Note) cv.getPerspectiveTransform() accepts only 4 pairs of points.
+    results = [('\n### My Planar Homography', getPerspectiveTransform(pts_src, pts_dst)),
+               ('\n### OpenCV Planar Homography', cv.getPerspectiveTransform(pts_src, pts_dst))]
+
+    for title, H in results:
+        print(title)
+        print(H)
diff --git a/examples/image_warping.py b/examples/image_warping.py
@@ -0,0 +1,52 @@
+import cv2 as cv
+import numpy as np
+from homography_estimation import getPerspectiveTransform
+
+def warpPerspective1(src, H, dst_size):
+    """Warp `src` by the homography `H` using forward mapping (source -> destination).
+
+    Every pixel of `src` is projected through `H` and copied to the nearest
+    destination pixel, so destination pixels that no source pixel lands on
+    stay zero.
+
+    `dst_size` is (width, height). The result always has three dimensions,
+    (height, width, channel), with one channel for a 2D `src`.
+    """
+    # Generate an empty image
+    width, height = dst_size
+    channel = src.shape[2] if src.ndim > 2 else 1
+    dst = np.zeros((height, width, channel), dtype=src.dtype)
+
+    # Copy a pixel from 'src' to 'dst'
+    # Note) The loop range comes from 'src' itself, not from a global image.
+    src_height, src_width = src.shape[:2]
+    for py in range(src_height):
+        for px in range(src_width):
+            q = H @ [px, py, 1]
+            # Round to the nearest pixel with floor(); int() alone truncates toward zero
+            # and would move coordinates slightly outside the image onto its border.
+            qx, qy = int(np.floor(q[0]/q[-1] + 0.5)), int(np.floor(q[1]/q[-1] + 0.5))
+            if 0 <= qx < width and 0 <= qy < height:
+                dst[qy, qx] = src[py, px]
+    return dst
+
+def warpPerspective2(src, H, dst_size):
+    """Warp `src` by the homography `H` using backward mapping (destination -> source).
+
+    Every destination pixel is projected through the inverse of `H` and takes
+    the value of the nearest source pixel; it stays zero if that position is
+    outside `src`.
+
+    `dst_size` is (width, height). The result always has three dimensions,
+    (height, width, channel), with one channel for a 2D `src`.
+    """
+    # Generate an empty image
+    width, height = dst_size
+    channel = src.shape[2] if src.ndim > 2 else 1
+    dst = np.zeros((height, width, channel), dtype=src.dtype)
+
+    # Copy a pixel from 'src' to 'dst'
+    # Note) The bounds come from 'src' itself, not from a global image.
+    src_height, src_width = src.shape[:2]
+    H_inv = np.linalg.inv(H)
+    for qy in range(height):
+        for qx in range(width):
+            p = H_inv @ [qx, qy, 1]
+            # Round to the nearest pixel with floor(); int() alone truncates toward zero
+            # and would read the border pixel for positions slightly outside 'src'.
+            px, py = int(np.floor(p[0]/p[-1] + 0.5)), int(np.floor(p[1]/p[-1] + 0.5))
+            if 0 <= px < src_width and 0 <= py < src_height:
+                dst[qy, qx] = src[py, px]
+    return dst
+
+if __name__ == '__main__':
+    # Load the input image and set the output size as (width, height)
+    img = cv.imread('../bin/data/sunglok_desk.jpg')
+    wnd_name = '3DV Tutorial: Image Warping'
+    card_size = (900, 500)
+    # Four points on the input image ('src') and where they should go ('dst'):
+    # the rectangle from (0, 0) to 'card_size'
+    src = np.array([[115, 401], [776, 180], [330, 793], [1080, 383]], dtype=np.float32)
+    dst = np.array([[0, 0], [card_size[0], 0], [0, card_size[1]], card_size], dtype=np.float32)
+
+    # Find planar homography and transform the original image
+    # (Method 1 loops over source pixels, Method 2 loops over destination pixels)
+    H = getPerspectiveTransform(src, dst)
+    warp1 = warpPerspective1(img, H, card_size)
+    warp2 = warpPerspective2(img, H, card_size)
+
+    # Show images generated from two methods
+    cv.imshow(wnd_name + ' (Method 1)', warp1)
+    cv.imshow(wnd_name + ' (Method 2)', warp2)
+    # Wait for a key press before closing the windows
+    cv.waitKey(0)
+    cv.destroyAllWindows()
diff --git a/examples/line_fitting_m_estimation.cpp b/examples/line_fitting_m_estimation.cpp
diff --git a/examples/line_fitting_m_estimation.py b/examples/line_fitting_m_estimation.py
diff --git a/examples/pose_estimation_implement.py b/examples/pose_estimation_implement.py
@@ -0,0 +1,51 @@
+import cv2 as cv
+import numpy as np
+from scipy.optimize import least_squares
+from scipy.spatial.transform import Rotation
+
+def project_no_distort(X, rvec, t, K):
+    """Project the 3D points `X` (one per row) onto the image without lens distortion.
+
+    `rvec` is a rotation vector, `t` a translation, and `K` the 3x3 camera
+    matrix. Returns the projected 2D points, one per row.
+    """
+    rot = Rotation.from_rotvec(rvec.flatten()).as_matrix()
+    cam_pts = X @ rot.T + t          # Row-wise form of 'X = R @ X + t'
+    homog = cam_pts @ K.T            # Row-wise form of 'x = KX'
+    homog = homog / homog[:, -1:]    # Normalize by the last column
+    return homog[:, :2]
+
+def reproject_error_pnp(unknown, X, x, K):
+    """Return the flattened difference between the observed points `x` and the projection of `X`.
+
+    `unknown` holds the pose: its first three values are used as the rotation
+    vector and the rest as the translation vector.
+    """
+    xp = project_no_distort(X, unknown[:3], unknown[3:], K)
+    return (x - xp).ravel()
+
+def solvePnP(obj_pts, img_pts, K):
+    """Estimate the camera pose by minimizing the reprojection error with least_squares().
+
+    Returns (success, rvec, tvec), where `success` is the flag reported by the optimizer.
+    """
+    pose_init = np.array([0, 0, 0, 0, 0, 1.]) # Sequence: rvec(3), tvec(3)
+    result = least_squares(reproject_error_pnp, pose_init, args=(obj_pts, img_pts, K))
+    rvec, tvec = result['x'][:3], result['x'][3:]
+    return result['success'], rvec, tvec
+
+if __name__ == '__main__':
+    # Camera parameters and the given 3D-2D correspondences
+    f, cx, cy = 1000., 320., 240.
+    K = np.array([[f, 0, cx], [0, f, cy], [0, 0, 1]])
+    dist_coeff = np.zeros(4)
+    obj_pts = np.loadtxt('../bin/data/box.xyz')
+    img_pts = np.loadtxt('../bin/data/image_formation1.xyz')[:,:2].copy()
+
+    # Estimate camera pose
+    _, my_rvec, my_tvec = solvePnP(obj_pts, img_pts, K) # Note) Ignore lens distortion
+    my_R = Rotation.from_rotvec(my_rvec.flatten()).as_matrix()
+    my_ori = Rotation.from_matrix(my_R.T).as_euler('xyz')
+    my_pos = -my_R.T @ my_tvec
+
+    # Estimate camera pose using OpenCV
+    _, cv_rvec, cv_tvec = cv.solvePnP(obj_pts, img_pts, K, dist_coeff)
+    cv_R = Rotation.from_rotvec(cv_rvec.flatten()).as_matrix()
+    cv_ori = Rotation.from_matrix(cv_R.T).as_euler('xyz')
+    cv_pos = -cv_R.T @ cv_tvec.flatten()
+
+    # Report the ground truth and both estimates
+    print('\n### Ground Truth')
+    print('* Camera orientation: [-15, 15, 0] [deg]')
+    print('* Camera position   : [-2, -2, 0] [m]')
+    for title, ori, pos in (('\n### My Camera Pose', my_ori, my_pos),
+                            ('\n### OpenCV Camera Pose', cv_ori, cv_pos)):
+        print(title)
+        print(f'* Camera orientation: {np.rad2deg(ori)} [deg]')
+        print(f'* Camera position   : {pos} [m]')
diff --git a/examples/triangulation.py b/examples/triangulation.py
@@ -1,40 +1,25 @@
-
-import cv2
+import cv2 as cv
 import numpy as np
 
-def main():
-    input0, input1 =  "../bin/data/image_formation0.xyz", "../bin/data/image_formation1.xyz"
-    points0, points1 = None, None
-    file0, file1 = open(input0, 'rt'), open(input1, 'rt')
-    
-    with open(input0,'rt') as file0: 
-        points0 = [ list(xyz.split(' '))[:2] for xyz in file0.read().splitlines() if xyz != None ]
-        points0 = np.array(points0, dtype=np.float32)
-    with open(input1,'rt') as file0: 
-        points1 = [ list(xyz.split(' '))[:2] for xyz in file1.read().splitlines() if xyz != None ]
-        points1 = np.array(points1, dtype=np.float32)
-
-    f, cx, cy = 1000, 320, 240
-    # print(points0.shape)
-    if len(points0) != len(points1): raise Exception("Not matching!")
+if __name__ == '__main__':
+    f, cx, cy = 1000., 320., 240.
+    pts0 = np.loadtxt('../bin/data/image_formation0.xyz')[:,:2]
+    pts1 = np.loadtxt('../bin/data/image_formation1.xyz')[:,:2]
+    output_file = '../bin/triangulation.xyz'
 
-    # # Estimate relative pose of two view
-    F,_ = cv2.findFundamentalMat(points0, points1, cv2.FM_8POINT)
-    K = np.array([[f,0,cx],[0,f,cy],[0,0,1]])
+    # Estimate the relative pose of the two views
+    F, _ = cv.findFundamentalMat(pts0, pts1, cv.FM_8POINT)
+    K = np.array([[f, 0, cx], [0, f, cy], [0, 0, 1]])
     E = K.T @ F @ K
-    _, R, t, _ = cv2.recoverPose(E, points0, points1)
+    # Note) 'pts0' and 'pts1' are in pixels, so 'K' must be given; otherwise
+    #       cv.recoverPose() assumes focal = 1 and principal point = (0, 0).
+    _, R, t, _ = cv.recoverPose(E, pts0, pts1, K)
 
     # Reconstruct 3D points (triangulation)
-    P0 = K @ np.eye(3,4, dtype=np.float32)
+    P0 = K @ np.eye(3, 4, dtype=np.float32)
     Rt = np.hstack((R, t))
     P1 = K @ Rt
-    X = cv2.triangulatePoints(P0, P1, points0.T, points1.T)
+    X = cv.triangulatePoints(P0, P1, pts0.T, pts1.T)
+    # Normalize the homogeneous coordinates, then store one point per row
     X /= X[3]
     X = X.T
-    
-    triangular_file = "../bin/data/triangulation.xyz"
-    with open(triangular_file, 'wt') as f:
-        f.write(str(X[:,:3]))
 
-if __name__=="__main__":
-    main()
+    # Write the reconstructed 3D points
+    np.savetxt(output_file, X)
diff --git a/examples/triangulation_implement.py b/examples/triangulation_implement.py
@@ -0,0 +1,37 @@
+import cv2 as cv
+import numpy as np
+
+def triangulatePoints(P0, P1, pts0, pts1):
+    """Triangulate 3D points from two views by solving 'AX = 0' for every correspondence.
+
+    `P0` and `P1` are the projection matrices (their first three rows are
+    used); `pts0` and `pts1` hold one 2D point per column.
+
+    Returns the homogeneous solutions, one per column. They are not
+    normalized here.
+    """
+    def solve(p, q):
+        # Two equations per view; the solution is the last row of 'Vt'
+        A = np.vstack((p[0] * P0[2] - P0[0],
+                       p[1] * P0[2] - P0[1],
+                       q[0] * P1[2] - P1[0],
+                       q[1] * P1[2] - P1[1]))
+        return np.linalg.svd(A, full_matrices=True)[2][-1]
+
+    return np.vstack([solve(p, q) for p, q in zip(pts0.T, pts1.T)]).T
+
+if __name__ == '__main__':
+    f, cx, cy = 1000., 320., 240.
+    pts0 = np.loadtxt('../bin/data/image_formation0.xyz')[:,:2]
+    pts1 = np.loadtxt('../bin/data/image_formation1.xyz')[:,:2]
+    output_file = '../bin/triangulation_implement.xyz'
+
+    # Estimate the relative pose of the two views
+    F, _ = cv.findFundamentalMat(pts0, pts1, cv.FM_8POINT)
+    K = np.array([[f, 0, cx], [0, f, cy], [0, 0, 1]])
+    E = K.T @ F @ K
+    # Note) 'pts0' and 'pts1' are in pixels, so 'K' must be given; otherwise
+    #       cv.recoverPose() assumes focal = 1 and principal point = (0, 0).
+    _, R, t, _ = cv.recoverPose(E, pts0, pts1, K)
+
+    # Reconstruct 3D points (triangulation)
+    P0 = K @ np.eye(3, 4, dtype=np.float32)
+    Rt = np.hstack((R, t))
+    P1 = K @ Rt
+    # Note) triangulatePoints() takes one point per column, hence the transposes
+    X = triangulatePoints(P0, P1, pts0.T, pts1.T)
+    # Normalize the homogeneous coordinates, then store one point per row
+    X /= X[3]
+    X = X.T
+
+    # Write the reconstructed 3D points
+    np.savetxt(output_file, X)
diff --git a/msvs/3dv_tutorial.sln b/msvs/3dv_tutorial.sln
@@ -31,7 +31,7 @@ Project("{8BC9CEB8-8B4A-11D0-8D11-00A0C91BC942}") = "distortion_correction", "di
 EndProject
 Project("{8BC9CEB8-8B4A-11D0-8D11-00A0C91BC942}") = "camera_calibration", "camera_calibration\camera_calibration.vcxproj", "{8FE6C6CB-6D5D-4745-A4CE-0621BC8633B9}"
 EndProject
-Project("{8BC9CEB8-8B4A-11D0-8D11-00A0C91BC942}") = "line_fitting_m_est", "line_fitting_m_est\line_fitting_m_est.vcxproj", "{AFC78990-4FCF-40A8-AD20-39EA569AD2F2}"
+Project("{8BC9CEB8-8B4A-11D0-8D11-00A0C91BC942}") = "line_fitting_m_estimation", "line_fitting_m_estimation\line_fitting_m_estimation.vcxproj", "{AFC78990-4FCF-40A8-AD20-39EA569AD2F2}"
 EndProject
 Project("{8BC9CEB8-8B4A-11D0-8D11-00A0C91BC942}") = "bundle_adjustment_global", "bundle_adjustment_global\bundle_adjustment_global.vcxproj", "{64E65811-6F72-479E-BEAB-1DADE0952A7B}"
 EndProject
diff --git a/msvs/line_fitting_m_estimation/line_fitting_m_estimation.vcxproj b/msvs/line_fitting_m_estimation/line_fitting_m_estimation.vcxproj
@@ -92,7 +92,7 @@
     </Link>
   </ItemDefinitionGroup>
   <ItemGroup>
-    <ClCompile Include="..\..\examples\line_fitting_m_est.cpp" />
+    <ClCompile Include="..\..\examples\line_fitting_m_estimation.cpp" />
   </ItemGroup>
   <Import Project="$(VCTargetsPath)\Microsoft.Cpp.targets" />
   <ImportGroup Label="ExtensionTargets">
diff --git a/msvs/line_fitting_m_estimation/line_fitting_m_estimation.vcxproj.user b/msvs/line_fitting_m_estimation/line_fitting_m_estimation.vcxproj.user