Image formation and pinhole camera model

Faisal Qureshi
Professor
Faculty of Science
Ontario Tech University
Oshawa ON Canada
http://vclab.science.ontariotechu.ca

© Faisal Qureshi

In [4]:
import numpy as np
import math
from scipy import linalg

Outline

  • Pinhole camera model
  • Homogeneous coordinates
  • Intrinsic and extrinsic camera matrices
  • Lens effects
  • Camera calibration
Drawing
Drawing

Camera Obscura

Known during the Classical Period (e.g., China, c. 470 BC)

Drawing

An outside scene imaged on a wall in Prague Castle. This probably occurred due to a small crack in the opposite wall.

Drawing
From Wikipedia.

Pinhole Camera Model

In 2D

Drawing

Given $Y$, the height of the object, $Z$, its distance from the pinhole, and $f$, the distance between the pinhole and the image plane (also known as the focal length), we want to estimate $y$, the height of the image of this object.

Using the similar triangles argument, we get

$$ Y / Z = y / f. $$

Re-arranging the above expression yields

$$ y = f Y / Z. $$
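
As a quick sanity check, here is a minimal sketch of this computation (the numbers are hypothetical, chosen only for illustration):

In [ ]:
# Hypothetical example: a 2 m tall object, 10 m from the pinhole,
# imaged through a 0.05 m focal length
Y, Z, f = 2.0, 10.0, 0.05
y = f * Y / Z
print(f'Image height y = {y} m')  # 0.01 m, i.e., 1 cm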

In 3D

Drawing

The pinhole model describes the relationship between a 3D point $(X,Y,Z)$ and its imaging location $(x,y)$. Here $f$ is the distance between the image plane and the pinhole, also known as the focal length, and $Z$ is the distance of the point from the pinhole. This formulation assumes that the pinhole is situated at the origin $(0,0,0)$ and that the camera's optical axis is aligned with the global $z$-axis.

$$ \left( \begin{array}{c} X \\ Y \\ Z \end{array} \right) \longmapsto \left( \begin{array}{c} fX/Z \\ fY/Z \\ f \end{array} \right) \leadsto \left( \begin{array}{c} fX/Z \\ fY/Z \end{array} \right) $$

Homogeneous Coordinates

From Cartesian Coordinates to Homogeneous Coordinates

$$ \begin{array}{rcl} (x,y) & \to & (x,y,1) \\ (x,y,z) & \to & (x,y,z,1) \\ \end{array} $$

Example

$$ \begin{array}{rcl} (2,3) & \to & (2,3,1) \\ (10,-4,-2) & \to & (10,-4,-2,1) \\ \end{array} $$

From Homogeneous Coordinates to Cartesian Coordinates

$$ \begin{array}{rcl} (x,y,w) & \to & \left( x/w,y/w \right) \\ (x,y,z,w) & \to & \left( x/w,y/w,z/w \right) \\ \end{array} $$

Example

$$ \begin{array}{rcl} (6,-2,2) & \to & (3,-1) \\ (9,-24,-3,-3) & \to & (-3,8,1) \\ \end{array} $$
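
These conversions are easy to express in code. Below is a minimal sketch; the helper names to_homogeneous and to_cartesian are our own, not from any library:

In [ ]:
def to_homogeneous(p):
    # Append w = 1 to a Cartesian point
    return np.append(np.asarray(p, dtype=float), 1.0)

def to_cartesian(ph):
    # Divide through by the last (homogeneous) coordinate
    ph = np.asarray(ph, dtype=float)
    return ph[:-1] / ph[-1]

print(to_homogeneous([2, 3]))          # [2. 3. 1.]
print(to_cartesian([6, -2, 2]))        # [ 3. -1.]
print(to_cartesian([9, -24, -3, -3]))  # [-3.  8.  1.]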

Homogeneous Coordinates Properties

Invariant to scaling, i.e., $(x,y,w) \equiv (kx,ky,kw)$ for any $k \neq 0$. Both $(x,y,w)$ and $(kx, ky, kw)$ represent the same 2D Cartesian point $(x/w, y/w)$.

Constructing a Line

Consider two 2D Cartesian points $(x_1,y_1)$ and $(x_2,y_2)$. We can find the line that passes through these points using cross-product in homogeneous coordinates.

Recall that the equation of a line is $ax + by + c = 0$. Then $$ (a,b,c) = (x_1,y_1,1) \times (x_2,y_2,1). $$

Proof

If the line $a x + b y + c = 0$ passes through the points $(x_1, y_1)$ and $(x_2, y_2)$, then the following must be true

$$ \begin{align} a x_1 + b y_1 + c &= 0 \\ a x_2 + b y_2 + c &= 0 \\ \end{align} $$

We can re-write these equations in terms of the dot product of two vectors $\left[ \begin{array}{ccc} a & b & c \end{array} \right] \left[ \begin{array}{c} x_1 \\ y_1 \\ 1 \end{array} \right] = 0$ and $\left[ \begin{array}{ccc} a & b & c \end{array} \right] \left[ \begin{array}{c} x_2 \\ y_2 \\ 1 \end{array} \right] = 0$. The dot product of two non-zero vectors is zero only if the vectors are perpendicular to each other. This suggests that the vector $\left[ \begin{array}{ccc} a & b & c \end{array} \right]$ is perpendicular to both $\left[ \begin{array}{ccc} x_1 & y_1 & 1 \end{array} \right]$ and $\left[ \begin{array}{ccc} x_2 & y_2 & 1 \end{array} \right]$.

Given two vectors, their cross-product returns a vector that is perpendicular to both vectors. Consequently, we can compute $\left[ \begin{array}{ccc} a & b & c \end{array} \right]$ by taking a cross-product of vectors $\left[ \begin{array}{ccc} x_1 & y_1 & 1 \end{array} \right]$ and $\left[ \begin{array}{ccc} x_2 & y_2 & 1 \end{array} \right]$.

Cross-Product

The cross-product of two vectors $(d,e,f)$ and $(r,s,t)$ is computed as follows.

$$ (d,e,f) \times (r,s,t) = \mathrm{det} \left[\begin{array}{ccc} \hat{i} & \hat{j} & \hat{k}\\ d & e & f \\ r & s & t \end{array} \right] $$
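
Before attempting the exercise below, here is the pattern in code, with a different pair of points (np.cross computes the determinant expansion above):

In [ ]:
# Line through the 2D points (0, 0) and (1, 1)
p1 = np.array([0, 0, 1])  # homogeneous representation of (0, 0)
p2 = np.array([1, 1, 1])  # homogeneous representation of (1, 1)
line = np.cross(p1, p2)
print('(a, b, c) = {}'.format(line))  # [-1  1  0], i.e., the line -x + y = 0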

Exercise: computing a representation of a line from homogeneous coordinates

Find a representation of the line between points $\mathbf{a}=(1,2)$ and $\mathbf{b}=(4,3)$ using homogeneous coordinates.

In [5]:
# Your solution here
In [6]:
# %load solutions/image-formation/solution_01.py

Intersecting Lines

Given two lines $a_1 x + b_1 y + c_1=0$ and $a_2 x + b_2 y + c_2=0$, we can compute their intersection using cross-product as follows:

Step 1: Find intersection point in homogeneous coordinates

$$ (x,y,w) = (a_1,b_1,c_1) \times (a_2,b_2,c_2) $$

Step 2: Compute Cartesian coordinates from homogeneous coordinates

Intersection point is then $(x/w,y/w)$

Proof

Along similar lines as before.

Example: finding the intersection of two lines using homogeneous coordinates

Use homogeneous coordinates to determine the intersection location for the following two lines.

$$ \begin{align} 3x - y + 7 & = 0 \\ 2x - y + 1 & = 0 \end{align} $$

In [7]:
l1 = np.array([3,-1,7])
l2 = np.array([2,-1,1])

ph = np.cross(l1, l2)
print('ph = {}'.format(ph))

p = ph[:2] / ph[2]
print('p = {}'.format(p))
print('Point p sits on l1: {}'.format(math.isclose(np.dot(l1, np.append(p,[1])), 0.0)))
print('Point p sits on l2: {}'.format(math.isclose(np.dot(l2, np.append(p,[1])), 0.0)))
ph = [ 6 11 -1]
p = [ -6. -11.]
Point p sits on l1: True
Point p sits on l2: True

Exercise: finding the intersection of two lines using homogeneous coordinates

Find the intersection location for the following two lines.

$$ \begin{align} 3x - y + 7 & = 0 \\ 3x - y - 3 & = 0 \end{align} $$

In [8]:
# Your solution here
In [9]:
# %load solutions/image-formation/solution_02.py

Parallel Lines

$w=0$ when the two lines are parallel. We say that such lines intersect at infinity. This suggests that it is possible to represent points at infinity in homogeneous coordinates: just set the homogeneous coordinate to $0$.

Points at Infinity

We can represent a point at infinity by setting its $w=0$. E.g., the homogeneous coordinate $(3,-1,3,0)$ represents a point at infinity in the direction $(3,-1,3)$.
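
A quick demonstration with a hypothetical pair of parallel lines:

In [ ]:
# Two parallel lines: x + y + 1 = 0 and x + y - 5 = 0
l1 = np.array([1, 1, 1])
l2 = np.array([1, 1, -5])
ph = np.cross(l1, l2)
print('ph = {}'.format(ph))  # [-6  6  0]: w = 0, a point at infinity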

Back to Pinhole Model

We now develop a mathematical model for pinhole cameras. This discussion follows Ch. 6 of Multiple View Geometry in Computer Vision (2nd Ed.) by Hartley and Zisserman. In what follows we assume the camera geometry shown below.

Drawing
Picture from Multiple View Geometry in Computer Vision, Second Edition.

This assumes that the image plane sits in front of the pinhole. Obviously, no physical camera has this property. Nevertheless, it is mathematically convenient (and equivalent) to model pinhole cameras this way.

  • Camera centre sits at the origin of the Euclidean coordinate system. The camera centre is also known as the centre of projection or the optical centre
  • Image plane (also known as the focal plane) sits at $Z = f$
  • Point in 3D space $$ \mathbf{X} = (X, Y, Z)^T $$
  • This point is mapped to $$ \left( f X / Z, f Y / Z, f \right) $$
  • Image coordinates are obtained by dropping the third coordinate, $f$: $$ \left( f X / Z, f Y / Z \right) $$
  • Principal axis or principal ray is the line perpendicular to the image plane and passing through the centre of projection
  • Principal point is the intersection of the image plane with the principal axis
  • Principal plane is the plane parallel to the image plane that passes through the centre of projection

Using Homogeneous Coordinates

We can describe the pinhole camera model using homogeneous coordinates as follows

$$ \begin{align} \left( \begin{array}{c} X \\ Y \\ Z \\ 1 \end{array} \right) \longmapsto \left( \begin{array}{c} fX \\ fY \\ Z \end{array} \right) & = \left[ \begin{array}{cccc} f & & & 0 \\ & f & & 0 \\ & & 1 & 0 \end{array} \right] \left( \begin{array}{c} X \\ Y \\ Z \\ 1 \end{array} \right) \\ & = \mathrm{diag}(f,f,1)\left[\mathbf{I}\ |\ \mathbf{0}\right] \left( \begin{array}{c} X \\ Y \\ Z \\ 1 \end{array} \right) \end{align} $$

We set

$$ \mathtt{P} = \mathrm{diag}(f,f,1)\left[\mathbf{I}\ |\ \mathbf{0}\right] $$

to denote the projection matrix. Specifically, we use $\mathtt{P}$ to map 3D points $\mathbf{X}$ to image points $\mathbf{x}$:

$$ \mathbf{x} = \mathtt{P} \mathbf{X}. $$

Under these assumptions, $\mathtt{P}$ has one degree-of-freedom, namely, the parameter $f$.

Principal Point Offset

Drawing
Figure from Multiple View Geometry in Computer Vision, Second Edition

The above discussion assumes that the principal point sits at the origin of the image-plane coordinate system. Let's relax this assumption. Say $(p_x, p_y)$ are the coordinates of the principal point. Then

$$ \begin{align} \left( \begin{array}{c} X \\ Y \\ Z \\ 1 \end{array} \right) \longmapsto \left( \begin{array}{c} fX + p_x Z \\ fY + p_y Z \\ Z \end{array} \right) & = \left[ \begin{array}{cccc} f & & p_x & 0 \\ & f & p_y & 0 \\ & & 1 & 0 \end{array} \right] \left( \begin{array}{c} X \\ Y \\ Z \\ 1 \end{array} \right) \\ & = \mathbf{K} \left[\mathbf{I}\ |\ \mathbf{0}\right] \mathbf{X}_{\mathtt{cam}} \end{align} $$

Note $\mathbf{X}_{\mathtt{cam}}$. This captures our assumption that the camera centre is located at the origin of the Euclidean coordinate system (we can think of this as the world coordinate system), with the camera pointing straight down the $z$-axis. $\mathbf{X}_{\mathtt{cam}}$ denotes that the point is expressed in the camera coordinate system.

In this case, we set the projection matrix to

$$ \mathtt{P} = \mathbf{K} \left[\mathbf{I}\ |\ \mathbf{0}\right] $$

Exercise: Degrees of freedom of a projection matrix

How many degrees of freedom does a projection matrix have when the camera centre is assumed to be fixed at the origin with the camera pointing straight down the $z$-axis? That is, how many parameters are required to specify a projection matrix $\mathtt{P}$ uniquely under these assumptions?

In [10]:
%%markdown
**Answer:** Your solution here:


In [11]:
# %load solutions/image-formation/solution_03.md

Camera Rotation and Translation

Drawing
Figure from Multiple View Geometry in Computer Vision, Second Edition

Now we relax our assumption that the camera centre is located at the origin of the Euclidean coordinate system (we can think of this as the world coordinate system) with the camera pointing straight down the $z$-axis.

Say the camera centre in inhomogeneous coordinates is $\tilde{\mathbf{C}}$ and the camera rotation is represented by the matrix $\mathbf{R}$. Then we can transform an inhomogeneous point $\tilde{\mathbf{X}}$ in the world coordinate system to an inhomogeneous point $\tilde{\mathbf{X}}_{\mathtt{cam}}$ in the camera coordinate system as follows

$$ \tilde{\mathbf{X}}_{\mathtt{cam}} = \mathbf{R} \left( \tilde{\mathbf{X}} - \tilde{\mathbf{C}} \right) $$

We can re-write this as follows

$$ \mathbf{X}_{\mathtt{cam}} = \left[ \begin{array}{cc} \mathbf{R} & - \mathbf{R} \tilde{\mathbf{C}} \\ \mathbf{0}^T & 1 \end{array} \right] \left( \begin{array}{c} X \\ Y \\ Z \\ 1 \end{array} \right) $$

Putting it all together

$$ \mathbf{x} = \mathbf{K} \mathbf{R} \left[\mathbf{I}\ |\ -\tilde{\mathbf{C}}\right] \mathbf{X} $$

It is often convenient to set $\mathbf{t} = -\mathbf{R} \tilde{\mathbf{C}}$. Then we can rewrite the above as follows

$$ \mathbf{x} = \mathbf{K} \left[\mathbf{R}\ |\ \mathbf{t} \right] \mathbf{X} $$

In this case, we set the projection matrix to

$$ \mathtt{P} = \mathbf{K} \left[\mathbf{R}\ |\ \mathbf{t} \right] $$
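
The following sketch (all intrinsics and pose values hypothetical) composes such a $\mathtt{P}$ and checks that the camera centre maps to the zero vector, as expected since $\mathbf{R}\tilde{\mathbf{C}} + \mathbf{t} = \mathbf{0}$:

In [ ]:
# Hypothetical camera: f = 500, principal point (320, 240),
# rotated 30 degrees about the y-axis, centred at (1, 2, -10)
f, px, py = 500.0, 320.0, 240.0
K = np.array([[f, 0, px],
              [0, f, py],
              [0, 0,  1]])

theta = np.deg2rad(30)
R = np.array([[ np.cos(theta), 0, np.sin(theta)],
              [ 0,             1, 0            ],
              [-np.sin(theta), 0, np.cos(theta)]])

C_tilde = np.array([1.0, 2.0, -10.0])
t = -np.dot(R, C_tilde)

P = np.dot(K, np.hstack([R, t.reshape(3, 1)]))
print('P C = {}'.format(np.dot(P, np.append(C_tilde, 1.0))))  # ~ [0. 0. 0.]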

Exercise: Degrees of freedom of a projection matrix

How many degrees of freedom does a projection matrix have when the camera centre is assumed to be fixed at $\tilde{\mathbf{C}}$ and the camera's rotation is represented by matrix $\mathbf{R}$? That is, how many parameters are required to specify a projection matrix $\mathtt{P}$ uniquely under these assumptions?

In [12]:
%%markdown
**Answer:** Your solution here:


In [13]:
# %load solutions/image-formation/solution_04.md

CCD Pixel Sizes and Skew

Thus far we have assumed that image coordinates have equal scales in the $x$ and $y$ directions. If the number of pixels per unit distance in image coordinates is $m_x$ in the $x$ direction and $m_y$ in the $y$ direction, then we re-write $\mathbf{K}$ as follows

$$ \mathbf{K} = \left[ \begin{array}{ccc} \alpha_x & s & x_0 \\ & \alpha_y & y_0 \\ & & 1 \end{array} \right] $$

where $\alpha_x = f m_x$, $\alpha_y = f m_y$, $x_0 = m_x p_x$, $y_0 = m_y p_y$, and $s$ is the skew term, which is often $0$. Note that $x_0$ and $y_0$ are the coordinates of the principal point in terms of pixel dimensions in the $x$ and $y$ directions. $s$ becomes non-zero under special circumstances when the lens is not aligned with the image plane.
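
A minimal sketch of assembling such a $\mathbf{K}$ (all numbers hypothetical):

In [ ]:
# Hypothetical sensor: focal length in metres, pixel densities in pixels/metre
f = 0.05                 # focal length
m_x, m_y = 20000, 25000  # non-square pixels
p_x, p_y = 0.016, 0.012  # principal point, in metres
s = 0.0                  # skew, usually zero

K = np.array([[f * m_x, s,       m_x * p_x],
              [0,       f * m_y, m_y * p_y],
              [0,       0,       1        ]])
print(f'K =\n{K}')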

Exercise: Degrees of freedom of a projection matrix

How many degrees of freedom does a projection matrix have when the camera centre is assumed to be fixed at $\tilde{\mathbf{C}}$ and the camera's rotation is represented by matrix $\mathbf{R}$ when the pixels are non-uniformly scaled as just described? That is, how many parameters are required to specify a projection matrix $\mathtt{P}$ uniquely under these assumptions?

In [14]:
%%markdown
**Answer:** Your solution here:


In [15]:
# %load solutions/image-formation/solution_05.md

Putting it all together

We get the following equation that describes the mapping from world points to image points.

$$ \begin{align} \mathbf{x} & = \mathtt{P} \mathbf{X} \\ & = \mathbf{K} \left[ \mathbf{R}\ |\ \mathbf{t} \right] \mathbf{X} \end{align} $$

Note that $\mathtt{P}$ is a homogeneous $3 \times 4$ matrix of rank 3, defined up to an arbitrary scale. Projection matrices of rank less than 3 do not span the image plane; the projections degenerate to a line or a point.

Extrinsic and Intrinsic matrices

We refer to $\mathbf{K}$ as the intrinsic matrix and to $\left[ \mathbf{R}\ |\ \mathbf{t} \right]$ as the extrinsic matrix.

Properties of $\mathtt{P}$

To make the following discussion easier, let's express $\mathtt{P}$ as

$$ \mathtt{P} = \left[ \mathtt{M}\ |\ \mathbf{p}_4 \right] $$

Here $\mathtt{M}$ is the top-left $3 \times 3$ submatrix of $\mathtt{P}$ and $\mathbf{p}_4$ is the last column of $\mathtt{P}$. Furthermore, let $\mathbf{p}^{iT}$ and $\mathbf{p}_j$ represent the $i$-th row and $j$-th column of $\mathtt{P}$, respectively. We can similarly denote rows and columns of $\mathtt{M}$.

Matrix $\mathtt{M}$

Recall that $ \mathtt{P} = \left[ \begin{array}{cccc} p_{11} & p_{12} & p_{13} & p_{14} \\ p_{21} & p_{22} & p_{23} & p_{24} \\ p_{31} & p_{32} & p_{33} & p_{34} \end{array} \right]. $ Let $ \mathtt{M} = \left[ \begin{array}{ccc} p_{11} & p_{12} & p_{13} \\ p_{21} & p_{22} & p_{23} \\ p_{31} & p_{32} & p_{33} \end{array} \right] $ and $ \mathbf{p}_4 = \left[ \begin{array}{c} p_{14} \\ p_{24} \\ p_{34} \end{array} \right]. $ Then $\mathtt{P} = \left[ \mathtt{M}\ |\ \mathbf{p}_4 \right].$

Finite Projective Camera

If $\mathtt{M}$ is non-singular then we have a finite projective camera. There are cases when $\mathtt{M}$ is singular; these are referred to as general projective cameras.

Thought experiment: what value of $x$ satisfies the following equation?

$$ 2x - 8 = 0 $$

Camera Center

In general, the camera centre $\mathbf{C}$ is the 1-dimensional right null space of the matrix $\mathtt{P}$, since $\mathtt{P} \mathbf{C} = \mathbf{0}$.

Alternatively, we can use the following to find the camera centre

$$ \tilde{\mathbf{C}} = - \mathtt{M}^{-1} \left( \begin{array}{c} p_{14} \\ p_{24} \\ p_{34} \end{array} \right) $$

Recall that

$$ \mathbf{C} = \left( \tilde{\mathbf{C}}^T, 1 \right)^T $$

Aside 1:

If $\mathtt{M}$ is singular (in the case of general projective cameras), the camera centre (at infinity) is the right null space of $\mathtt{M}$, i.e., $\mathtt{M} \mathbf{d} = \mathbf{0}$. In this case,

$$ \mathbf{C} = \left( \mathbf{d}^T, 0 \right)^T $$

Aside 2:

The singular value decomposition (SVD) of a matrix $\mathtt{P}$ may be written as

$$ \mathtt{P} = \mathtt{U} \mathtt{\Sigma} \mathtt{V}^T $$

Then the (right) null space of $\mathtt{P}$ is spanned by the columns of $\mathtt{V}$ corresponding to singular values equal to zero.
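
The sketch below uses this fact to recover the camera centre of a toy camera (with $\mathbf{K} = \mathbf{R} = \mathbf{I}$ and a hypothetical centre) from the SVD of $\mathtt{P}$:

In [ ]:
# Toy camera with centre at (1, 2, 3): P = [I | -C~]
C_tilde = np.array([1.0, 2.0, 3.0])
P_toy = np.hstack([np.eye(3), -C_tilde.reshape(3, 1)])

U, S, Vt = np.linalg.svd(P_toy)
C = Vt[-1]         # right singular vector for the smallest singular value
C = C / C[-1]      # normalize the homogeneous coordinate
print(f'C = {C}')  # [1. 2. 3. 1.]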

Columns and rows of $\mathtt{P}$

Matrix $$ \mathtt{P} = \left[ \begin{array}{cccc} p_{11} & p_{12} & p_{13} & p_{14} \\ p_{21} & p_{22} & p_{23} & p_{24} \\ p_{31} & p_{32} & p_{33} & p_{34} \end{array} \right] $$ consists of 4 columns $$ \mathbf{p}_1 = \left[ \begin{array}{c} p_{11} \\ p_{21} \\ p_{31} \end{array} \right],\ \mathbf{p}_2 = \left[ \begin{array}{c} p_{12} \\ p_{22} \\ p_{32} \end{array} \right],\ \mathbf{p}_3 = \left[ \begin{array}{c} p_{13} \\ p_{23} \\ p_{33} \end{array} \right],\mathrm{\ and\ } \mathbf{p}_4 = \left[ \begin{array}{c} p_{14} \\ p_{24} \\ p_{34} \end{array} \right] $$

and 3 rows

$$ \begin{align} \mathbf{p}^{1T} & = \left[ \begin{array}{cccc} p_{11} & p_{12} & p_{13} & p_{14} \end{array} \right], \\ \mathbf{p}^{2T} &= \left[ \begin{array}{cccc} p_{21} & p_{22} & p_{23} & p_{24} \end{array} \right],\mathrm{\ and} \\ \mathbf{p}^{3T} &= \left[ \begin{array}{cccc} p_{31} & p_{32} & p_{33} & p_{34} \end{array} \right] \end{align} $$

Columns of $\mathtt{P}$

$\mathbf{p}_1$, $\mathbf{p}_2$ and $\mathbf{p}_3$ represent vanishing points in the $x$, $y$, and $z$ directions.

$\mathbf{p}_4$ is the image of the world origin.

Aside:

The homogeneous point $\mathbf{D} = (1,0,0,0)^T$ represents the direction of the $x$-axis. Then $\mathtt{P} \mathbf{D} = \mathbf{p}_1$ is the vanishing point in the $x$-direction.


Figure from Hartley and Zisserman

Rows of $\mathtt{P}$

$\mathbf{p}^{1T}$ and $\mathbf{p}^{2T}$ represent the planes defined by the camera centre and the image plane coordinate axes $x$ and $y$, respectively.

$\mathbf{p}^{3T}$ represents the principal plane.


Figure from Hartley and Zisserman

One way to convince ourselves that $\mathbf{p}^{3T}$ represents the principal plane is to see that the only way a point $\mathbf{X}$ maps to $(x,y,0)$ is if $\mathbf{p}^{3T} \mathbf{X} = 0$. Similar arguments can be made for $\mathbf{p}^{1T}$ and $\mathbf{p}^{2T}$ representing the planes defined by the camera centre and the image plane coordinate axes $x$ and $y$, respectively.

Principal Point

The principal point is given by $\mathtt{M} \mathbf{m}^{3}$, where $\mathbf{m}^{3T}$ is the third row of $\mathtt{M}$.

Aside:

Notice that the principal plane is given by $\mathbf{p}^{3T}$. The normal to this plane is $(p_{31}, p_{32}, p_{33})$, and using this information we can write a point at infinity in homogeneous coordinates as follows

$$ \hat{\mathbf{p}}^{3} = (p_{31}, p_{32}, p_{33}, 0)^T $$

Now project this point using $\mathtt{P}$ and we get the principal point.

Principal Axis Vector

$\mathbf{v} = \mathrm{det}(\mathtt{M}) \mathbf{m}^3$ is a vector in the direction of the principal axis, directed towards the front of the camera.

Action of $\mathtt{P}$ on points

Forward Projection

Points in the world are mapped to image coordinates using

$$ \mathbf{x} = \mathtt{P} \mathbf{X} $$

Points $\mathbf{D}=(\mathbf{d}^T,0)^T$ on the plane at infinity map to vanishing points in the image: $\mathbf{x} = \mathtt{M} \mathbf{d}$.

Back-projection of points to rays

Given a point $\mathbf{x}$ in the image, we seek the set of points in space that map to it. This set is a ray passing through the point $\mathtt{P}^+ \mathbf{x}$ and the camera centre.

$$ \mathbf{X}(\lambda) = \mathtt{P^+} \mathbf{x} + \lambda \mathbf{C} $$

Here $\mathtt{P}^+ = \mathtt{P}^T \left( \mathtt{P} \mathtt{P}^T \right)^{-1}$ is the pseudo-inverse of $\mathtt{P}$. Note that $\mathtt{P} \mathtt{P}^+ = \mathbf{I}$.

For finite cameras, we can develop a simpler expression. Recall that the camera centre for these cameras is given by $\tilde{\mathbf{C}} = - \mathtt{M}^{-1} \mathbf{p}_4$. An image point $\mathbf{x}$ back-projects to a ray intersecting the plane at infinity at the point $\mathbf{D} = \left( \left( \mathtt{M}^{-1} \mathbf{x} \right)^T, 0 \right)^T$. Using the camera centre and $\mathbf{D}$, we get

$$ \mathbf{X}(\mu) = \mu \left( \begin{array}{c} \mathtt{M}^{-1} \mathbf{x} \\ 0 \end{array} \right) + \left( \begin{array}{c} - \mathtt{M}^{-1} \mathbf{p}_4 \\ 1 \end{array} \right) $$
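
A short sketch of back-projection for the same toy camera as before ($\mathbf{K} = \mathbf{R} = \mathbf{I}$, hypothetical centre): every point on the recovered ray reprojects to the original image point.

In [ ]:
# Toy finite camera with centre at (1, 2, 3)
C_tilde = np.array([1.0, 2.0, 3.0])
P_toy = np.hstack([np.eye(3), -C_tilde.reshape(3, 1)])
C = np.append(C_tilde, 1.0)      # homogeneous camera centre

P_plus = np.linalg.pinv(P_toy)   # pseudo-inverse of P
x = np.array([0.5, 0.25, 1.0])   # a homogeneous image point

# Every lambda gives the same image point (up to scale)
for lam in [0.0, 1.0, 5.0]:
    X = np.dot(P_plus, x) + lam * C  # a point on the back-projected ray
    x_reproj = np.dot(P_toy, X)
    print('lambda = {}: {}'.format(lam, x_reproj / x_reproj[-1]))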

Decomposition of the camera matrix

Given a camera matrix $\mathtt{P}$, we often wish to find the camera centre, the camera rotation, and the camera intrinsic parameters.

Camera centre

We can find the camera centre using $\mathtt{P} \mathbf{C} = \mathbf{0}$ as discussed earlier, i.e., by finding a null vector of the projection matrix.

Camera rotation and intrinsic parameters

Recall that

$$ \mathtt{P} = \left[ \mathtt{M}\ |\ -\mathtt{M} \tilde{\mathbf{C}} \right] = \mathtt{K} \left[ \mathtt{R}\ |\ - \mathtt{R} \tilde{\mathbf{C}} \right]. $$

We can find $\mathtt{K}$ (camera intrinsic parameters) and $\mathtt{R}$ (camera rotation) using the RQ-decomposition of $\mathtt{M}$. We require that the diagonal entries of $\mathtt{K}$ be positive to remove the ambiguity in the decomposition.

Why RQ-decomposition?

We can use RQ decomposition to find the $\mathbf{K}$ and $\mathbf{R}$ matrices from $\mathtt{M}$

$$ \begin{align} \mathbf{x} & = \mathtt{P} \mathbf{X} \\ & = \mathbf{K} \left[ \mathbf{R}\ |\ \mathbf{t} \right] \mathbf{X} \\ & = \left[ \mathbf{K} \mathbf{R}\ |\ \mathbf{K} \mathbf{t} \right] \mathbf{X} \end{align} $$

This suggests that

$$ \mathtt{M} = \mathbf{K} \mathbf{R}, $$

where $\mathbf{K}$ is an upper-triangular matrix and $\mathbf{R}$ is an orthogonal matrix.

Make $\mathbf{K}$ diagonal entries positive

Use the fact that

FOO = np.diag(np.sign(np.diag(K)))

is a diagonal matrix with entries $\pm 1$, and is therefore its own inverse: np.dot(FOO, FOO) equals np.eye(3).

Exercise: determining camera parameters from a projection matrix

(This is example 6.2 from Multiple View Geometry in Computer Vision (2nd Ed.) by Hartley and Zisserman)

Suppose we are given a projection matrix $\mathtt{P}$ as follows:

$$ \mathtt{P} = \begin{bmatrix} 3.53553\times10^{2} & 3.39645\times10^{2} & 2.77744\times10^{2} & -1.44946\times10^{6} \\ -1.03528\times10^{2} & 2.33212\times10^{1} & 4.59607\times10^{2} &-6.32525\times10^{5} \\ 7.07107\times10^{-1} & -3.53553\times10^{-1} & 6.12372\times10^{-1} & -9.18559\times10^{2} \end{bmatrix} $$

Use $\mathtt{P}$ as given above to find the camera centre, the rotation, and the intrinsic parameters.

In [18]:
P = np.array([[3.53553e2, 3.39645e2, 2.77744e2, -1.44946e6],
              [-1.03528e2, 2.33212e1, 4.59607e2, -6.32525e5],
              [7.07107e-1, -3.53553e-1, 6.12372e-1, -9.18559e2]]) 
In [19]:
# %load solutions/image-formation/solution_06.py
In [20]:
M = P[:3,:3]
print(f'M = {M}')

M_inv = np.linalg.inv(M)
print(f'M_inv = {M_inv}')

p_4 = P[:,-1]
print(f'p_4 = {p_4}')

C = - np.dot(M_inv, p_4)
print(f'Center of this camera is {C}')
M = [[ 3.53553e+02  3.39645e+02  2.77744e+02]
 [-1.03528e+02  2.33212e+01  4.59607e+02]
 [ 7.07107e-01 -3.53553e-01  6.12372e-01]]
M_inv = [[ 8.83882084e-04 -1.53092925e-03  7.48128351e-01]
 [ 1.94194195e-03  1.00556004e-04 -9.56247129e-01]
 [ 1.00560104e-04  1.82582265e-03  2.17039911e-01]]
p_4 = [-1.44946e+06 -6.32525e+05 -9.18559e+02]
Center of this camera is [1000.00073079 2000.001952   1500.00028314]

M is given; how do we find K and R? Answer: RQ decomposition.

In [21]:
K, R = linalg.rq(M)

print(f'K = {K}')
print(f'R = {R}')
K = [[ 468.16467128  -91.22505222 -300.00001631]
 [   0.         -427.20086371 -199.99985412]
 [   0.            0.           -0.99999975]]
R = [[ 0.41380237  0.90914861  0.04707869]
 [ 0.57338211 -0.22011137 -0.78916661]
 [-0.70710718  0.35355309 -0.61237215]]
In [22]:
np.isclose(np.dot(R[:,0], R[:,1]), 0)
Out[22]:
True
In [23]:
np.dot(R, R.T)
Out[23]:
array([[ 1.00000000e+00, -2.71323943e-16, -4.13630351e-17],
       [-2.71323943e-16,  1.00000000e+00,  1.80002593e-16],
       [-4.13630351e-17,  1.80002593e-16,  1.00000000e+00]])
In [24]:
K
Out[24]:
array([[ 468.16467128,  -91.22505222, -300.00001631],
       [   0.        , -427.20086371, -199.99985412],
       [   0.        ,    0.        ,   -0.99999975]])
In [25]:
np.diag(K)
Out[25]:
array([ 468.16467128, -427.20086371,   -0.99999975])
In [26]:
np.sign(np.diag(K))
Out[26]:
array([ 1., -1., -1.])
In [27]:
FOO = np.diag(np.sign(np.diag(K)))
print(f'FOO = {FOO}')
FOO = [[ 1.  0.  0.]
 [ 0. -1.  0.]
 [ 0.  0. -1.]]
In [28]:
np.dot(FOO, FOO) # FOO is its own inverse
Out[28]:
array([[1., 0., 0.],
       [0., 1., 0.],
       [0., 0., 1.]])

M = K R = (K FOO) (FOO R), since FOO FOO = I

In [29]:
new_K = np.dot(K, FOO)
print(f'new_K = {new_K}')
new_K = [[468.16467128  91.22505222 300.00001631]
 [  0.         427.20086371 199.99985412]
 [  0.           0.           0.99999975]]
In [30]:
new_R = np.dot(FOO, R)
print(f'new_R = {new_R}')
new_R = [[ 0.41380237  0.90914861  0.04707869]
 [-0.57338211  0.22011137  0.78916661]
 [ 0.70710718 -0.35355309  0.61237215]]

Camera Calibration

We have established that projective matrix

$$ \mathtt{P} = \left[ \begin{array}{cccc} p_{11} & p_{12} & p_{13} & p_{14} \\ p_{21} & p_{22} & p_{23} & p_{24} \\ p_{31} & p_{32} & p_{33} & p_{34} \end{array} \right] $$

encodes useful properties about the camera. This matrix controls the imaging process: $ \mathbf{x} = \mathtt{P} \mathbf{X}. $

We can also use this matrix to back-project a point in the image, which can be used to perform metric scene analysis. The question remains, however: given a camera, how do we actually find this matrix? The process of finding $\mathtt{P}$, or its constituent components, is referred to as camera calibration.

A detailed treatment of this subject is left as a self-study exercise. Here we present the basic idea. Say we have a number of point correspondences $\mathbf{X}_i \longleftrightarrow \mathbf{x}_i$ between 3D points $\mathbf{X}_i$ and 2D image points $\mathbf{x}_i$. We are interested in finding the camera matrix $\mathtt{P}$ such that for all $i$

$$ \mathbf{x}_i = \mathtt{P} \mathbf{X}_i. $$

With some patience, we can re-arrange the above as follows

$$ \left[ \begin{array}{ccc} \mathbf{0}^T & -w_i \mathbf{X}_i^T & y_i \mathbf{X}_i^T \\ w_i \mathbf{X}_i^T & \mathbf{0}^T & - x_i \mathbf{X}_i^T \\ - y_i \mathbf{X}_i^T & x_i \mathbf{X}_i^T & \mathbf{0}^T \end{array} \right] \left( \begin{array}{c} \mathbf{p}^1 \\ \mathbf{p}^2 \\ \mathbf{p}^3 \\ \end{array} \right) = \mathbf{0}. $$

Here each $\mathbf{p}^{iT}$ is a 4-vector, the $i$-th row of $\mathtt{P}$. The three equations are linearly dependent, so we often use just the first two. Specifically, we use

$$ \left[ \begin{array}{ccc} \mathbf{0}^T & -w_i \mathbf{X}_i^T & y_i \mathbf{X}_i^T \\ w_i \mathbf{X}_i^T & \mathbf{0}^T & - x_i \mathbf{X}_i^T \end{array} \right] \left( \begin{array}{c} \mathbf{p}^1 \\ \mathbf{p}^2 \\ \mathbf{p}^3 \\ \end{array} \right) = \mathbf{0}. $$

From a set of $n$ point correspondences, we obtain a $2n \times 12$ matrix. Recall that $\mathtt{P}$ has 11 degrees of freedom, so we need 11 equations (five and a half point correspondences; we only need either the $x$ or the $y$ equation for the sixth correspondence).

Over-determined solution

We often use more than five and a half points to compute $\mathtt{P}$. In this case the goal is to minimize $\| \mathtt{A} \mathbf{p} \|$ subject to a suitable constraint. A possible choice for this constraint is $\| \mathbf{p} \| = 1$.
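
A sketch of this procedure on synthetic data (the ground-truth $\mathtt{P}$ and the 3D points below are made up): build the $2n \times 12$ matrix $\mathtt{A}$ from the correspondences, then take $\mathbf{p}$ as the right singular vector of $\mathtt{A}$ with the smallest singular value, which minimizes $\| \mathtt{A} \mathbf{p} \|$ subject to $\| \mathbf{p} \| = 1$:

In [ ]:
np.random.seed(0)

# Hypothetical ground-truth camera and six 3D points
P_true = np.hstack([np.eye(3), np.array([[1.0], [2.0], [3.0]])])
X_world = np.random.rand(6, 3) * 10

# Two equations per correspondence
rows = []
for Xw in X_world:
    X = np.append(Xw, 1.0)
    x, y, w = np.dot(P_true, X)
    rows.append(np.hstack([np.zeros(4), -w * X,  y * X]))
    rows.append(np.hstack([ w * X, np.zeros(4), -x * X]))
A = np.array(rows)

# p is the right singular vector with the smallest singular value
_, _, Vt = np.linalg.svd(A)
P_est = Vt[-1].reshape(3, 4)
P_est = P_est * (P_true[2, 3] / P_est[2, 3])  # fix the arbitrary scale
print(f'P_est =\n{np.round(P_est, 6)}')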

Aside:

We will return to camera calibration at the end of this discussion.

Orthographic cameras

Drawing
  • A special case of perspective projection
  • Center of projection (optical center) is at an infinite distance from the image plane
$$ \left( \begin{array}{c} X \\ Y \\ 1 \end{array} \right) = \left[ \begin{array}{cccc} 1 & 0 & 0 & 0 \\ 0 & 1 & 0 & 0 \\ 0 & 0 & 0 & 1 \end{array} \right] \left( \begin{array}{c} X \\ Y \\ Z \\ 1 \end{array} \right) $$

Cameras exhibiting weak perspective

Drawing
Picture from Multiple View Geometry in Computer Vision, Second Edition.
  • Object dimensions are much smaller than the object's distance from the camera, e.g., satellite imagery
$$ \left( \begin{array}{c} x \\ y \\ \lambda \end{array} \right) = \left[ \begin{array}{cccc} 1 & 0 & 0 & 0 \\ 0 & 1 & 0 & 0 \\ 0 & 0 & 0 & \lambda \end{array} \right] \left( \begin{array}{c} X \\ Y \\ Z \\ 1 \end{array} \right) $$

Pushbroom cameras

The pushbroom camera is an abstraction for the type of sensor often used in satellite imaging (e.g., the SPOT satellite). Here the camera is a linear sensor array that captures one row of the image at a time; the full image is constructed by moving the camera. As the sensor moves, the sensor plane sweeps out a region of space.

Let $\mathbf{X}$ be a point in space and assume the camera matrix is $\mathtt{P}$. Suppose that $\mathtt{P} \mathbf{X} = (x, y, w)^T$. Then the corresponding inhomogeneous image point is $(x, y/w)$. This assumes that the camera motion is along the $x$ direction of the image.

Projective Geometry (Lessons)

  1. Distant objects appear smaller.
  2. The same object, when imaged using different focal lengths, appears to have different sizes.
  3. Parallel lines meet.
  4. Angles are not maintained, i.e., perpendicular lines may appear to meet at angles other than 90 degrees.

Distant Objects Appear Smaller

Drawing

Focal Lengths

Drawing

Angles are Not Preserved

Drawing

Parallel Lines Meet

Drawing

Vanishing Points

  • Each set of parallel lines meets at a different point on the image plane. This point is called the vanishing point for that direction.

  • Sets of parallel lines in the same plane lead to collinear vanishing points. The line formed by these vanishing points is called the horizon for that plane.

  • Vanishing points can be used for 3D scene analysis.

  • They can also be used to spot fake images, e.g., where scale or perspective doesn't work out.

Is this a perspective image of four identical buildings? If not, why not?

Drawing
Figure credit: "Computer Vision: A Modern Approach" 2e by D.A. Forsyth

Lens Effects

Drawing

Images captured by pinhole cameras are generally too dark. To allow more light to reach the sensor plane, we need to increase the size of the pinhole. This has the effect of making the image blurry. We can counteract this by using a lens that focuses the light onto the image plane. Lenses, however, introduce radial and chromatic distortions.

Drawing
Figure credit http://www.solidrop.net

Modeling radial distortion to capture (and undo) lens effects

This discussion follows Ch. 7 of Multiple View Geometry in Computer Vision, Second Edition.

  • $(\tilde{x}, \tilde{y})$ is the ideal image position (which obeys linear projection)
  • $(x_d, y_d)$ is the actual image position (after radial distortion)
  • $\tilde{r}$ is the radial distance $\sqrt{\tilde{x}^2 + \tilde{y}^2}$ from the centre
  • $L(\tilde{r})$ is the distortion factor (we make the simplifying assumption that the distortion is a function of radius only)

Then we can write

$$ \left( \begin{array}{c} x_d \\ y_d \end{array} \right) = L(\tilde{r}) \left( \begin{array}{c} \tilde{x} \\ \tilde{y} \end{array} \right) $$

Correction of distortion

In pixel coordinates, the correction is written as

$$ \begin{align} \hat{x} & = x_c + L(r) (x - x_c) \\ \hat{y} & = y_c + L(r) (y - y_c) \end{align} $$

Here $(x, y)$ are the measured coordinates, $(\hat{x},\hat{y})$ are the corrected coordinates, $(x_c, y_c)$ is the centre of radial distortion, and $r = \sqrt{(x-x_c)^2 + (y-y_c)^2}$.

We often use the Taylor expansion $L(r) = 1 + \kappa_1 r + \kappa_2 r^2 + \cdots$. The coefficients of radial distortion $\{\kappa_1, \kappa_2, x_c, y_c \}$ are considered part of the intrinsic matrix $\mathtt{K}$. These parameters are often estimated during the camera calibration process. $L(r)$ can be estimated by minimizing the deviation from a linear mapping, e.g., the distances of the end-points of a line to its mid-point.
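
A minimal sketch of applying this correction, assuming known (hypothetical) distortion coefficients and centre:

In [ ]:
# Hypothetical distortion parameters
kappa_1, kappa_2 = 1e-4, 1e-7
x_c, y_c = 320.0, 240.0

def undistort(x, y):
    # Correct a measured pixel coordinate (x, y) for radial distortion
    r = np.sqrt((x - x_c)**2 + (y - y_c)**2)
    L = 1 + kappa_1 * r + kappa_2 * r**2  # truncated Taylor expansion of L(r)
    return x_c + L * (x - x_c), y_c + L * (y - y_c)

print(undistort(100.0, 80.0))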

For further information, we refer the reader to Ch. 7 of Multiple View Geometry in Computer Vision (2nd Ed.) by Hartley and Zisserman.

Camera calibration in OpenCV

Check out the camera-calibration notebook.
