Local features¶
Faisal Qureshi
Professor
Faculty of Science
Ontario Tech University
Oshawa ON Canada
http://vclab.science.ontariotechu.ca
Copyright information¶
© Faisal Qureshi
License¶
This work is licensed under a Creative Commons Attribution-NonCommercial 4.0 International License.
Lesson Plan¶
- Characteristics of a good local feature
- Raw patches as local features
- SIFT descriptor
- Feature detection and matching in OpenCV
- Blob detection
- MSER in OpenCV
- Applications of local features
Motivation¶
Consider image stitching. It requires that we find corresponding "locations" in two images. Given these correspondences, we can compute a homography, which allows us to stitch the two images together into a panorama.
Review: Characteristics of a Good Feature¶
- Repeatability — the feature should be invariant to geometric and photometric (e.g., lighting) changes
- Saliency or distinctiveness
- Compactness — efficiency, many fewer features than the number of pixels in the image
- Locality — robustness to clutter and occlusion, a feature should only occupy a small area of an image
Repeatability¶
We need to find at least some of the same points in two images to have any chance of finding true matches. There is little chance of finding corresponding locations given the following two images.
The detection process, run independently on the two images, should return at least some of the corresponding locations, as seen below.
Recall that we have attempted to address this issue by interest point detection. These are locations in the image that are (somewhat) "invariant" to geometric and photometric changes. Specifically, we identified corner locations as those that are covariant to translation and rotation and partially invariant to changes in intensity. Recall also that corner detection is not invariant to changes in scale.
Observation 1: identify interest point locations (say, through corner detection) and construct local features around these locations.
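As a quick refresher, here is a minimal sketch of interest point detection with OpenCV's Harris corner detector (the input file and the response threshold are illustrative choices, not prescribed values).
import cv2 as cv
import numpy as np
# Hypothetical input image; substitute your own file.
img = cv.imread('data/box.png', cv.IMREAD_GRAYSCALE)
# Harris response; blockSize, ksize, and k are typical settings.
response = cv.cornerHarris(np.float32(img), blockSize=2, ksize=3, k=0.04)
# Keep locations whose response exceeds a fraction of the maximum response.
ys, xs = np.where(response > 0.01 * response.max())
print(f'Found {len(xs)} candidate corner locations')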
Interest point detectors¶
Available interest point detectors
- Hessian & Harris [Beaudet 78], [Harris 88]
- Laplacian, Difference of Gaussian (DoG) [Lindeberg 98], [Lowe 99]
- Harris-/Hessian-Laplace [Mikolajczyk & Schmid 01]
- Harris-/Hessian-Affine [Mikolajczyk & Schmid 04]
- Edge-based Region Detector (EBR) and Intensity Extrema Based Region Detector (IBR) [Tuytelaars & Van Gool 04]
- Maximally Stable Extremal Regions (MSER) [Matas 02]
- Salient Regions [Kadir & Brady 01]
- and many others
Which interest point detector should you choose?¶
What do you want it for?
- Precise localization in x-y: Harris
- Good localization in scale: DoG
- Flexible region shape: MSER
Best choice often application dependent
- Harris-/Hessian-Laplace/DoG work well for many natural categories
- MSER works well for buildings and printed things
Take home lesson
- There have been extensive evaluations/comparisons [Mikolajczyk et al., IJCV 05, PAMI 05]. Best to check these out and select the best interest point detector for your application.
- It is sometimes useful to use multiple detectors simultaneously to help with matching over a range of image categories
Saliency¶
We want to reliably determine which location in one image goes with which location in the second image. The computed features should be invariant to geometric and photometric differences between the two images. Consider the following figure.
Our task is to find the corresponding locations in the two images. This means that we need to figure out which of the two locations in the image on the right matches with the location shown in the image on the left.
Observation 2: compute descriptors that encode the area surrounding an interest point. These descriptors should be compact (for computational reasons), have local support, and be invariant to geometric and photometric changes.
Why do we want to encode only the local region around an interest point? Why not encode the entire image?
Local feature descriptors¶
Encode the area around each interest point as a vector. We can then match these features to identify corresponding locations between the two images. The following figure illustrates this idea: the local area around three interest point locations (one in the left image, two in the right image) is encoded as $d$-dimensional vectors.
We can find the corresponding locations by matching these $d$-dimensional vectors. There are many options for doing so: e.g., we can use sum-of-squared differences (SSD) or cosine similarity, among many other techniques for comparing vectors.
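As a toy example, here is a minimal sketch that compares two descriptor vectors using SSD and cosine similarity (the two vectors below are made up for illustration).
import numpy as np
# Two hypothetical d-dimensional descriptors.
d1 = np.array([0.2, 0.8, 0.1, 0.5])
d2 = np.array([0.3, 0.7, 0.0, 0.6])
ssd = np.sum((d1 - d2) ** 2)  # smaller means more similar
cos = np.dot(d1, d2) / (np.linalg.norm(d1) * np.linalg.norm(d2))  # closer to 1 means more similar
print(f'SSD = {ssd:.3f}, cosine similarity = {cos:.3f}')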
Computing local feature descriptors¶
Invariance to translation, rotation, and scale.
Invariance to changes in intensity and color.
(Figures courtesy T. Tuytelaars ECCV 2006 tutorial)
Raw patches as local descriptors¶
The simplest way to describe the neighborhood around an interest point is to write down the list of intensities to form a feature vector.
Consider the figure below.
The image patches around the interest point locations (depicted by the red circles) are shown below.
Let's write down the list of intensities in these patches to form feature vectors.
import numpy as np
import cv2 as cv
import matplotlib.pyplot as plt
left_patch = cv.imread('data/local-features-construction-2.jpg')
left_patch = cv.cvtColor(left_patch, cv.COLOR_BGR2RGB)
left_patch = cv.resize(left_patch, (32, 32), interpolation=cv.INTER_NEAREST)
right_patch = cv.imread('data/local-features-construction-1.jpg')
right_patch = cv.cvtColor(right_patch, cv.COLOR_BGR2RGB)
right_patch = cv.resize(right_patch, (32, 32), interpolation=cv.INTER_NEAREST)
plt.figure(figsize=(10,5))
plt.subplot(121)
plt.imshow(left_patch)
plt.subplot(122)
plt.imshow(right_patch);
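Continuing the example above, here is a minimal sketch that flattens each patch into a vector of raw intensities and compares the two vectors with SSD (it assumes the left_patch and right_patch arrays from the previous cell).
# Flatten each 32x32 patch into a single vector of grayscale intensities.
left_vec = cv.cvtColor(left_patch, cv.COLOR_RGB2GRAY).astype(np.float32).ravel()
right_vec = cv.cvtColor(right_patch, cv.COLOR_RGB2GRAY).astype(np.float32).ravel()
print(f'Descriptor length: {left_vec.shape[0]}')  # 32 x 32 = 1024
# Sum-of-squared differences between the two raw-intensity descriptors.
ssd = np.sum((left_vec - right_vec) ** 2)
print(f'SSD between the two patches: {ssd:.1f}')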
Notice that a raw list of intensities is very sensitive to changes in rotation, scale, intensity, etc. Raw patches therefore make poor feature descriptors.
Scale Invariant Feature Transform (SIFT) [Lowe 2004]¶
Description taken from various places, including https://sbme-tutorials.github.io/2019/cv/notes/7_week7.html
SIFT Pyramid¶
Construct the SIFT pyramid, which consists of octaves and scales. Octaves are different image resolutions (pyramid levels), and scales are different amounts of Gaussian blurring within each octave (different $\sigma$ of the Gaussian window).
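A minimal sketch of building such a pyramid with OpenCV (the number of octaves, number of scales, base $\sigma$, and scale factor $k$ below are illustrative, not Lowe's exact settings).
import cv2 as cv
import numpy as np
img = cv.imread('data/box.png', cv.IMREAD_GRAYSCALE).astype(np.float32)
n_octaves, n_scales, sigma0, k = 3, 4, 1.6, 2 ** (1 / 3)
pyramid = []  # pyramid[o][s] holds octave o blurred at scale s
for o in range(n_octaves):
    # Within an octave, increase the Gaussian blur; across octaves, halve the resolution.
    octave = [cv.GaussianBlur(img, (0, 0), sigma0 * k ** s) for s in range(n_scales)]
    pyramid.append(octave)
    img = cv.resize(img, (img.shape[1] // 2, img.shape[0] // 2))
print([[im.shape for im in octave] for octave in pyramid])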
Key-point localization in scale¶
At each scale, compare the cornerness value with the neighbouring scales (the scales above and below) and pick the scale with the maximum cornerness value. Not all corners in an image are localized at the same scale.
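To sketch the idea: a location at scale $s$ is kept only if its response is an extremum with respect to its $3 \times 3$ spatial neighbours at scale $s$ and at the two adjacent scales. The response stack below is random, purely for illustration.
import numpy as np
# Hypothetical response stack of shape (n_scales, height, width).
responses = np.random.rand(5, 64, 64)
s, y, x = 2, 30, 30  # a candidate location at scale index 2
neighbourhood = responses[s-1:s+2, y-1:y+2, x-1:x+2]  # 3x3x3 block across scales
is_max = responses[s, y, x] >= neighbourhood.max()
print(f'Local scale-space maximum: {is_max}')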
Computing the SIFT descriptor¶
- Use image gradients instead of raw intensities
- Use histograms to bin pixels (gradients) within sub-patches according to their orientation.
- Use of image gradients provides partial invariance to changes in illumination
- Using subpatches maintains spatial structure.
Achieving rotation invariance¶
Rotate the patch according to its dominant gradient orientation. This puts the patches into a canonical orientation.
(Image from Matthew Brown.)
See below for how to find the dominant gradient orientation.
128-dimensional SIFT Descriptors¶
After localizing a key-point in scale space, we can compute its SIFT descriptor as follows:
- Extract a $16 \times 16$ window centered at this point.
- Compute the gradient magnitudes and weight them by a $16 \times 16$ Gaussian window with $\sigma = 1.5$.
- Compute the gradient orientations.
- Adjust orientation (for rotation invariance): quantize the gradient orientations of the window into 36 bins $(0, 10, 20, \cdots, 350)$.
- Locate the dominant direction, i.e., the angle with the maximum value in the 36-bin orientation histogram, and subtract it from all gradient orientations.
- Divide the window into sixteen $4 \times 4$ blocks. For each block, compute a magnitude-weighted orientation histogram with 8 bins $(0, 45, \cdots, 315)$ and normalize it (divide by the total gradient magnitude); each gradient contributes its magnitude to its orientation bin (e.g., the value of the $0$ bin is the sum of all magnitudes with orientation $0$). Concatenating the sixteen 8-bin histograms gives the 128-dimensional descriptor. A simplified sketch is given below.
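Here is a heavily simplified, illustrative sketch of these steps. It skips scale selection, sub-pixel interpolation, trilinear binning, and clamping, so it is not Lowe's exact algorithm; the image path and key-point coordinates are placeholders.
import numpy as np
import cv2 as cv
def sift_like_descriptor(gray, x, y):
    # 16x16 window around the key-point.
    win = gray[y - 8:y + 8, x - 8:x + 8].astype(np.float32)
    gx = cv.Sobel(win, cv.CV_32F, 1, 0)  # image gradients
    gy = cv.Sobel(win, cv.CV_32F, 0, 1)
    g = cv.getGaussianKernel(16, 1.5)
    mag = np.sqrt(gx ** 2 + gy ** 2) * (g @ g.T)  # Gaussian-weighted magnitudes
    ang = np.rad2deg(np.arctan2(gy, gx)) % 360    # gradient orientations in degrees
    # Dominant orientation from a 36-bin histogram; subtract it for rotation invariance.
    hist36, _ = np.histogram(ang, bins=36, range=(0, 360), weights=mag)
    ang = (ang - hist36.argmax() * 10) % 360
    # Sixteen 4x4 blocks with 8 orientation bins each -> 16 * 8 = 128 values.
    desc = []
    for by in range(0, 16, 4):
        for bx in range(0, 16, 4):
            h, _ = np.histogram(ang[by:by + 4, bx:bx + 4], bins=8, range=(0, 360),
                                weights=mag[by:by + 4, bx:bx + 4])
            desc.append(h)
    desc = np.concatenate(desc)
    return desc / (np.linalg.norm(desc) + 1e-8)  # normalize
gray = cv.imread('data/box.png', cv.IMREAD_GRAYSCALE)
print(sift_like_descriptor(gray, 100, 100).shape)  # (128,)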
SIFT properties¶
- Extraordinarily robust matching technique
- Can handle changes in viewpoint of up to about 60 degrees of out-of-plane rotation
- Can handle significant changes in illumination
(Image from Steve Seitz)
- Fast and efficient—can run in real time
NASA Mars Rover images with SIFT feature matches. (Figure by Noah Snavely.)
SIFT summary¶
- Invariant to scale and rotation
- Partially invariant to illumination changes, camera viewpoint, occlusion, and clutter
SIFT Code¶
SIFT was originally included in OpenCV but was later moved out of the main distribution because it was patented. The patent has since expired (March 2020), and recent OpenCV versions (4.4 and newer) ship SIFT again as cv.SIFT_create(). Another option is the VLFeat library, which includes a SIFT implementation. VLFeat currently doesn't have a "stable" Python binding, but you are welcome to try it using pip install pyvlfeat.
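Assuming a recent OpenCV build (4.4 or newer), here is a minimal usage sketch.
import cv2 as cv
img = cv.imread('data/box.png', cv.IMREAD_GRAYSCALE)
sift = cv.SIFT_create()  # back in the main OpenCV distribution since 4.4
keypoints, descriptors = sift.detectAndCompute(img, None)
print(len(keypoints), descriptors.shape)  # each descriptor is 128-dimensional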
Matching local features¶
Consider the figures below. "SIFT patches" are overlaid on the two images. Our goal is to generate candidate matches.
Classical feature descriptors, such as SIFT, SURF, etc., are usually compared and matched using the Euclidean distance (or L2-norm). Other techniques for matching these features are Cosine similarity, Earth Mover's Distance (also known as Wasserstein Distance), etc.
Exercise 1¶
Compute the cosine and Euclidean distance matrices between the four vectors $[1,0,0]$, $[0,1,0]$, $[1,1,0]$, and $[10,-2,1]$.
Solution:
# %load solutions/local-features/solution-01.py
# Local features - Exercise 01
from scipy.spatial import distance
import numpy as np
a = np.array([1,0,0])
b = np.array([0,1,0])
c = np.array([1,1,0])
d = np.array([10,-2,1])
# Set up an m-by-n matrix, where m is the number of
# data items and n is the dimension
X = np.vstack((a,b,c,d))
#print(f'Shape of X is {X.shape}')
# D is condensed matrix
metric = ['cosine', 'euclidean']
i = 0
D = distance.pdist(X, metric[i])
# Lets convert it into square form
print(f'{metric[i]} distance:')
print(distance.squareform(D))
cosine distance:
[[0.         1.         0.29289322 0.02409993]
 [1.         0.         0.29289322 1.19518001]
 [0.29289322 0.29289322 0.         0.44794755]
 [0.02409993 1.19518001 0.44794755 0.        ]]
From distance to similarity¶
How do we convert distance values to similarity values? For cosine distance, simply subtract the distance from 1.0. In general, if your distance metric returns values between 0 and 1, you can use this trick.
Exercise 2¶
Compute the cosine similarity matrix between $[1,0,0]$, $[0,1,0]$, $[1,1,0]$, and $[10,-2,1]$.
Solution:
# %load solutions/local-features/solution-02.py
# Local features - Exercise 02
from scipy.spatial import distance
import numpy as np
a = np.array([1,0,0])
b = np.array([0,1,0])
c = np.array([1,1,0])
d = np.array([10,-2,1])
# Set up an m-by-n matrix, where m is the number of
# data items and n is the dimension
X = np.vstack((a,b,c,d))
#print(f'Shape of X is {X.shape}')
# D is condensed matrix
metric = ['cosine', 'euclidean']
i = 0
D = distance.pdist(X, metric[i])
# Lets convert it into square form
print(f'{metric[i]} similarity:')
print(1.0 - distance.squareform(D))
cosine similarity:
[[ 1.          0.          0.70710678  0.97590007]
 [ 0.          1.          0.70710678 -0.19518001]
 [ 0.70710678  0.70710678  1.          0.55205245]
 [ 0.97590007 -0.19518001  0.55205245  1.        ]]
Gaussian kernel to convert distance to similarity¶
For other distances, we can use, say, a Gaussian kernel as follows:
$$ K(d) = \exp \left( -\frac{d^2} {2 \sigma^2} \right), $$
where $d$ is the distance between two vectors $\mathbf{x}_1$ and $\mathbf{x}_2$, and $\sigma$ is a tuning (or scaling) parameter. If $\sigma$ is large, $K(d)$ stays close to $1$ (i.e., high similarity) even for large values of $d$. If $\sigma$ is small, even a small $d$ pushes the similarity score towards $0$.
Exercise 3¶
Compute the similarity matrix between $[1,0,0]$, $[0,1,0]$, $[1,1,0]$, and $[10,-2,1]$. Assume the Euclidean distance metric.
Solution:
# %load solutions/local-features/solution-03.py
# Local features - Solution 03
from scipy.spatial import distance
import numpy as np
a = np.array([1,0,0])
b = np.array([0,1,0])
c = np.array([1,1,0])
d = np.array([10,-2,1])
# Set up an m-by-n matrix, where m is the number of
# data items and n is the dimension
X = np.vstack((a,b,c,d))
#print(f'Shape of X is {X.shape}')
# D is condensed matrix
metric = ['cosine', 'euclidean']
i = 1
D = distance.squareform(distance.pdist(X, metric[i]))
print('Distance:\n', D)
# Lets convert it into square form
sigma = 0.0001
scaling = 2 * (sigma ** 2)
print(f'{metric[i]} similarity:')
np.set_printoptions(formatter={'float': lambda x: "{0:0.1e}".format(x)})
S = np.exp(-D**2 / (scaling))
print('Similarity:\n', S)
np.set_printoptions() # To not mess with other printing
Distance:
 [[ 0.          1.41421356  1.          9.2736185 ]
 [ 1.41421356  0.          1.         10.48808848]
 [ 1.          1.          0.          9.53939201]
 [ 9.2736185  10.48808848  9.53939201  0.        ]]
euclidean similarity:
Similarity:
 [[1.0e+00 0.0e+00 0.0e+00 0.0e+00]
 [0.0e+00 1.0e+00 0.0e+00 0.0e+00]
 [0.0e+00 0.0e+00 1.0e+00 0.0e+00]
 [0.0e+00 0.0e+00 0.0e+00 1.0e+00]]
Wasserstein distance¶
The Wasserstein distance is computed between two probability distributions (below represented as histograms). Check out the scipy.stats module for methods for computing the Wasserstein distance.
from scipy.stats import wasserstein_distance
wasserstein_distance([0, 1, 3], [5, 6, 8])
5.0
Hamming distance¶
We now also have binary feature descriptors, such as ORB and BRISK, which are matched using the Hamming distance.
$$ d_{\mathrm{hamming}} (\mathbf{a}, \mathbf{b}) = \sum_{i=0}^{n-1} (a_i \oplus b_i) $$
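For instance, ORB descriptors are stored as arrays of bytes, so the Hamming distance between two descriptors can be computed by XOR-ing them and counting the set bits. The random descriptors below are placeholders.
import numpy as np
# Two hypothetical 32-byte binary descriptors (the size ORB produces).
a = np.random.randint(0, 256, 32, dtype=np.uint8)
b = np.random.randint(0, 256, 32, dtype=np.uint8)
# XOR the descriptors, then count the differing bits.
hamming = int(np.unpackbits(np.bitwise_xor(a, b)).sum())
print(f'Hamming distance: {hamming}')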
Aside:
- SIFT descriptors represent the histogram of oriented gradient in a neighbourhood
- SURF descriptors represent the histogram of the Haar wavelet responses in a neighborhood
- See the original paper for more information about Binary Robust Independent Elementary Features (BRIEF)
- Oriented FAST and Rotated BRIEF (ORB) [Ethan Rublee et al. 2011]
Bruteforce matching¶
Compare them all, take the closest (or closest $k$, or within a thresholded distance).
import numpy as np
import cv2 as cv
import matplotlib.pyplot as plt
img1 = cv.imread('data/box.png',cv.IMREAD_GRAYSCALE)
img2 = cv.imread('data/box_in_scene.png',cv.IMREAD_GRAYSCALE)
print(img1.shape)
(223, 324)
orb = cv.ORB_create()
kp1, des1 = orb.detectAndCompute(img1, None) # locations and descriptor
kp2, des2 = orb.detectAndCompute(img2, None)
bf = cv.BFMatcher(cv.NORM_HAMMING, crossCheck=True)
matches = bf.match(des1, des2)
matches = sorted(matches, key = lambda x:x.distance)
img3 = cv.drawMatches(img1, kp1, img2, kp2, matches[:10], None, flags=cv.DrawMatchesFlags_NOT_DRAW_SINGLE_POINTS)
plt.figure(figsize=(10,10))
plt.imshow(img3)
plt.show()
Aside: for large sets of descriptors, brute-force matching can be slow. A k-d tree speeds up nearest-neighbour search; the following example uses scipy's KDTree.
# %load solutions/local-features/kdtree.py
# Local Features - kdtree.py
import numpy as np
from scipy.spatial import KDTree
rng = np.random.RandomState(0)
X = rng.random_sample((10, 3))
print(X)
T = KDTree(X, leafsize=3)
distance, index = T.query(X[0,:]) # Try to perturb the query vector +[0.01,0.01,0]
print(f'distance={distance}, data={X[index,:]}')
[[0.5488135  0.71518937 0.60276338]
 [0.54488318 0.4236548  0.64589411]
 [0.43758721 0.891773   0.96366276]
 [0.38344152 0.79172504 0.52889492]
 [0.56804456 0.92559664 0.07103606]
 [0.0871293  0.0202184  0.83261985]
 [0.77815675 0.87001215 0.97861834]
 [0.79915856 0.46147936 0.78052918]
 [0.11827443 0.63992102 0.14335329]
 [0.94466892 0.52184832 0.41466194]]
distance=0.0, data=[0.5488135  0.71518937 0.60276338]
Ambiguous matches¶
Let's consider the SSD metric for finding matches. How do we threshold on SSD? One approach is to compute the ratio of the distance to the best match to the distance to the second-best match. If this ratio is low, the best match is a good candidate. If this ratio is high, the best match could be ambiguous.
(Figure from Lowe 2004)
(From OpenCV documentation) FLANN stands for Fast Library for Approximate Nearest Neighbors. It contains a collection of algorithms, such as KDTree, Locality Sensitive Hashing, etc., optimized for fast nearest neighbor search in large datasets and for high dimensional features. It works faster than BFMatcher for large datasets.
For OpenCV implementation, possible values are:
FLANN_INDEX_LINEAR = 0
FLANN_INDEX_KDTREE = 1
FLANN_INDEX_KMEANS = 2
FLANN_INDEX_COMPOSITE = 3
FLANN_INDEX_KDTREE_SINGLE = 4
FLANN_INDEX_HIERARCHICAL = 5
FLANN_INDEX_LSH = 6
FLANN_INDEX_SAVED = 254
FLANN_INDEX_AUTOTUNED = 255
import numpy as np
import cv2 as cv
import matplotlib.pyplot as plt
img1 = cv.imread('data/box.png',cv.IMREAD_GRAYSCALE)
img2 = cv.imread('data/box_in_scene.png',cv.IMREAD_GRAYSCALE)
orb = cv.ORB_create()
kp1, des1 = orb.detectAndCompute(img1, None) # locations and descriptor
kp2, des2 = orb.detectAndCompute(img2, None)
FLANN_INDEX_LSH = 6
index_params = dict(algorithm = FLANN_INDEX_LSH, table_number = 6)
search_params = dict(checks=50)
flann = cv.FlannBasedMatcher(index_params, search_params)
matches = flann.knnMatch(des1, des2, k=2)
good = []
for match in matches:
    if len(match) < 2: continue
    m, n = match[0], match[1]
    if m.distance < 0.75*n.distance:
        good.append([m])
img3 = cv.drawMatchesKnn(img1, kp1, img2, kp2, good, None, flags=cv.DrawMatchesFlags_NOT_DRAW_SINGLE_POINTS)
plt.figure(figsize=(10,10))
plt.imshow(img3)
plt.show()
Blob detection¶
Edge detection review¶
(Figure from Steve Seitz).
Second derivative of Gaussian (Laplacian)¶
(Figure from Steve Seitz).
From edges to blobs¶
(Figure from Lana Lazebnik).
- Edge = ripple
- Blob = superposition of two ripples
- Spatial selection: the magnitude of the Laplacian response will achieve a maximum at the center of the blob, provided the scale of the Laplacian is "matched" to the scale of the blob
Blob detection in 2D¶
The Laplacian of Gaussian is a circularly symmetric operator for blob detection in 2D.
$$ \nabla^2 g = \frac{\partial^2 g}{\partial x^2} + \frac{\partial^2 g}{\partial y^2} $$
(Figure from Lana Lazebnik).
Characteristic scale¶
We define the characteristic scale as the scale that produces the peak of the (scale-normalized) Laplacian response.
(Figure from Lana Lazebnik).
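A small sketch, assuming scipy is available: build a synthetic disc of known radius, evaluate the scale-normalized Laplacian response $\sigma^2 \nabla^2 G$ at its centre over a range of $\sigma$, and pick the $\sigma$ with the strongest response. For a disc of radius $r$, the peak occurs near $\sigma = r / \sqrt{2}$.
import numpy as np
from scipy.ndimage import gaussian_laplace
# Synthetic image containing a single bright disc of radius 10 pixels.
yy, xx = np.mgrid[0:101, 0:101]
img = (((xx - 50) ** 2 + (yy - 50) ** 2) <= 10 ** 2).astype(np.float32)
# Scale-normalized Laplacian response at the disc centre for a range of sigmas.
sigmas = np.linspace(2, 16, 29)
responses = [s ** 2 * gaussian_laplace(img, s)[50, 50] for s in sigmas]
best = sigmas[np.argmax(np.abs(responses))]
print(f'Characteristic scale: sigma = {best:.2f} (theory: 10 / sqrt(2) = 7.07)')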
Difference of Gaussian¶
We can approximate the Laplacian of Gaussian with a Difference of Gaussians (DoG), which is much more efficient to compute.
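A quick sketch, again assuming scipy: the difference of two Gaussian-smoothed images, at scales $\sigma$ and $k\sigma$, closely tracks $(k - 1)\,\sigma^2 \nabla^2 G$, the scale-normalized Laplacian.
import numpy as np
from scipy.ndimage import gaussian_filter, gaussian_laplace
img = np.random.rand(128, 128).astype(np.float32)
sigma, k = 2.0, 1.6
dog = gaussian_filter(img, k * sigma) - gaussian_filter(img, sigma)  # Difference of Gaussians
log = (k - 1) * sigma ** 2 * gaussian_laplace(img, sigma)  # scale-normalized Laplacian of Gaussian
print(np.corrcoef(dog.ravel(), log.ravel())[0, 1])  # should be close to 1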
Blob detection example in OpenCV¶
The relevant parameters are described below:
- Area: filter the blobs based on size
- Circularity: a measure of how close the blob is to a circle. Circularity is defined as $\frac{4 \pi\, \mathrm{area}}{\mathrm{perimeter}^2}$.
- Convexity: the ratio of the area of the blob to the area of its convex hull. Convexity values lie between $0$ and $1$, inclusive.
- Inertia: the measure of "ellipseness" of a shape. A circle has inertia of $1$ and a line has inertia of $0$. The inertia of an ellipse lies somewhere between $0$ and $1$.
import cv2 as cv
import numpy as np
import matplotlib.pyplot as plt
filename = "data/butterfly.jpg"
#filename = "data/BlobTest.jpg"
im = cv.imread(filename)
im = cv.cvtColor(im, cv.COLOR_BGR2RGB)
params = cv.SimpleBlobDetector_Params()
params.minThreshold = 10 # Change thresholds
params.maxThreshold = 250
params.filterByArea = False # Filter by Area.
params.minArea = 100
params.filterByCircularity = False # Filter by Circularity
params.minCircularity = 0.1
params.filterByConvexity = False # Filter by Convexity
params.minConvexity = 0.9
params.filterByInertia = False # Filter by Inertia
params.minInertiaRatio = 0.9
detector = cv.SimpleBlobDetector_create(params)
keypoints = detector.detect(im)
im_with_keypoints = cv.drawKeypoints(im, keypoints, np.array([]), (255,0,0), cv.DRAW_MATCHES_FLAGS_DRAW_RICH_KEYPOINTS)
plt.figure(figsize=(15,15))
plt.imshow(im_with_keypoints);
Maximally Stable Extremal Region (MSER)¶
MSER detects homogeneous regions. We can use the centroids of these regions as keypoint locations.
MSERs are affine invariant, which means that image skew or warping doesn't affect them. MSERs are also "partially" invariant to changes in image intensity. In addition, MSERs have the following useful properties:
- Multi-scale detection without any smoothing involved; both fine and large structures are detected
- Only regions whose support is nearly the same over a range of thresholds are selected, which leads to stability
- The set of all extremal regions can be enumerated in worst-case $\mathcal{O} (n)$, where $n$ is the number of pixels in the image.
- Covariance to adjacency-preserving (continuous) transformations $T: D \to D$
For more information, check this wiki article.
MSER in OpenCV¶
#im = cv.imread('data/apple.jpg');
im = cv.imread('data/box.png');
im = cv.cvtColor(im, cv.COLOR_BGR2RGB)
vis = im.copy()
mser = cv.MSER_create()
regions, bboxes = mser.detectRegions(im)
hulls = [cv.convexHull(p.reshape(-1, 1, 2)) for p in regions]
cv.polylines(vis, hulls, 1, (255, 0, 255), 1)
plt.figure(figsize=(10,10))
plt.imshow(vis);
Applications of local invariant features¶
- Wide baseline stereo
- Motion tracking
- Panoramas
- Mobile robot navigation
- 3D reconstruction
- Recognition
Panoramas¶
(Figure from UBC AutoStitch)
Wide baseline stereo¶
(Image from T. Tuytelaars ECCV 2006 tutorial)
Object recognition¶
(Figure from Kristen Grauman)