Manta Fingerprint Identification with Principal Computer Vision Algorithms¶
I've been searching for a project on pattern matching with computer vision fundamentals for a while. I threw around some ideas in my head, like detecting different machine bolts, nuts, and screws to categorize them, detecting and identifying playing cards, or looking at human fingerprint detection. As usual, I had to turn to the ocean for inspiration.
As I was doing a night scuba dive with manta rays with a friend of mine, I couldn't help but think about how cool it would be to identify manta rays by their unique patterns. I noticed that the underside of a manta ray carries what appears to be a unique set of black splotches. If I could apply the same principles of human fingerprint identification to manta rays, perhaps I could uniquely identify an individual!
Turns out, I was definitely onto something. Manta rays do indeed have a unique pattern on their underside that scientists have used to identify individuals. In fact, the original researchers behind this idea created an organization called Manta Matcher that has compiled a database of 12,658 different animals from around the world!
The original research paper, Manta Matcher: automated photographic identification of manta rays using keypoint features, provides a very comprehensive overview of the algorithm the authors implemented using a combination of basic computer vision algorithms. Since the paper was published in 2013, many of the modern deep learning techniques developed since weren't available at the time. So, pulling techniques described in the paper, I will reimplement their approach and see if I can automate some of the steps they took to identify manta rays.
import matplotlib.pyplot as plt
import cv2
frame_1 = cv2.imread('manta_1.jpg')
frame_2 = cv2.imread('manta_2.jpg')
frame_3 = cv2.imread('manta_3.jpg')
fig, ax = plt.subplots(1, 3, figsize=(20, 8))
ax[0].imshow(cv2.cvtColor(frame_1, cv2.COLOR_BGR2RGB))
ax[0].axis('off')
ax[1].imshow(cv2.cvtColor(frame_2, cv2.COLOR_BGR2RGB))
ax[1].axis('off')
ax[2].imshow(cv2.cvtColor(frame_3, cv2.COLOR_BGR2RGB))
ax[2].axis('off')
plt.show()
The Plan¶
The original paper lays out the algorithm very simply:
Manually align the orientation of the manta ray in the image to a standard.
Manually select a region of interest (ROI) around the manta ray's belly.
Enhance the image by applying noise removal and adaptive contrast equalization.
Identify unique features from the spotted patterns on the manta ray's belly.
Match the features to a database of known manta rays.
Obviously, since the first two are manual steps, this is where we might apply some automation. The rest are still very applicable principal computer vision algorithms, even in the world of AI and deep learning.
For the first two steps, we can automate the process in two stages. First, we identify the manta in the image using an object detection model. If we can detect the manta, we then run a pose estimation model to capture the orientation of the animal. This allows us to do two things: 1) rotate the image to a standard orientation, and 2) crop the image to the region of interest.
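To make the plan concrete, here is a rough sketch of what the automated pipeline could look like once those models exist. Every function parameter here (detect_mantas, estimate_pose, rotate_to_standard, crop_belly, extract_fingerprint) is a hypothetical placeholder, not a real model or library call:

```python
# Hypothetical end-to-end pipeline for the plan above. None of these models
# exist yet in this notebook; the callables passed in are placeholders for
# the detection, pose, alignment, cropping, and fingerprinting steps.
def identify_mantas(frame, detect_mantas, estimate_pose,
                    rotate_to_standard, crop_belly, extract_fingerprint,
                    fingerprint_index):
    matches = []
    for box in detect_mantas(frame):                        # object detection
        x, y, w, h = box
        crop = frame[int(y):int(y + h), int(x):int(x + w)]
        keypoints = estimate_pose(crop)                      # pose estimation
        aligned, keypoints = rotate_to_standard(crop, keypoints)
        roi = crop_belly(aligned, keypoints)                 # region of interest
        descriptors = extract_fingerprint(roi)               # enhancement + features
        matches.append(fingerprint_index.search(descriptors))
    return matches
```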
Now, in this notebook, I don't have a large enough dataset to train the object detection or pose estimation models (not yet, anyway). Instead, we can manually annotate the above 3 images and use them as a stand-in while implementing the rest of the algorithm.
import json
import numpy as np
mantas = []
keypoints_coco = json.load(open('keypoints_coco.json'))
instances_coco = json.load(open('instances_coco.json'))
keypoint_colors = [(np.random.rand(3) * 255).astype(int) for _ in range(9)]
fig, axes = plt.subplots(1, 3, figsize=(20, 8))
for image, ax in zip(instances_coco['images'], axes):
    frame = cv2.imread(image['file_name'])
    image_size = (image['width'], image['height'])
    line_width = int(min(image_size) * 0.005)
    circle_radius = int(min(image_size) * 0.02)
    instance_annos = [a for a in instances_coco['annotations'] if a['image_id'] == image['id']]
    keypoint_annos = [a for a in keypoints_coco['annotations'] if a['image_id'] == image['id']]
    for instance, keypoints in zip(instance_annos, keypoint_annos):
        manta = {
            'image': image['file_name'],
            'box': instance['bbox'],
            'keypoints': np.array(keypoints['keypoints']).reshape(-1, 3)[:, :2]
        }
        mantas.append(manta)
        x, y, w, h = manta['box']
        cv2.rectangle(frame, (int(x), int(y)), (int(x+w), int(y+h)), (0, 255, 0), line_width)
        for i, (x, y) in enumerate(manta['keypoints']):
            color = keypoint_colors[i]
            cv2.circle(frame, (int(x), int(y)), circle_radius, color.tolist(), -1)
    ax.imshow(cv2.cvtColor(frame, cv2.COLOR_BGR2RGB))
    ax.axis('off')
plt.show()
Using object detection provides a few benefits in the context of this implementation.
For the sake of computational efficiency, we only want to run the pose estimation if we have a high confidence that a manta ray exists in the image. In combination with certain brightness filters, we can greatly increase efficiency.
We can use the bounding box from the object detection to crop the image to a certain region of interest. This allows us to focus on an individual manta ray while also reducing the size of the image that needs to be processed. In marine environments, studying animals that are social and congregate in groups often results in multiple animals captured in the same image, which increases the possibility of false positives both in the pose estimation and in attributing the unique fingerprint of one animal to another.
Using the object detection as a filter, we can then run the pose estimation model, and this model again provides several benefits.
We now know the standard orientation of the manta ray. We can now rotate the animal in the frame to a standard: head facing to the top of the image with the rear facing to the bottom.
In this particular animal, we have selected 9 keypoints: the 2 eyes, the outside points of the top gill flaps, the outside points of the bottom gill flaps, the tips of the pectoral fins, and the base of the tail or bottom of the pelvic fins. Generally speaking, we don't need all of these keypoints to determine the unique fingerprint, or even the orientation of the animal; we could rely on a subset. But using them all adds a layer of robustness that serves, again, several purposes. 1) We can use the gill keypoints with the tail keypoint to crop a region (similar to the region in the original paper) around the belly of the manta ray. 2) With all of these keypoints, we can be more confident that we have captured a manta ray that is only translated or rotated within the 2D image plane, not rotated out of it. The biomarkers will not match nearly as well if the manta ray is rotated out of plane. And finally, 3) we can identify the manta ray even more reliably if we know the sex of the animal, since the pelvic fins look distinctly different depending on the sex.
Okay, with all that background, we can work on reimplementation. Let's start with orientation alignment for the manta.
# translate keypoints to be relative to the bounding box,
# since we are going to crop out the rest of the image
for manta in mantas:
    x, y, w, h = manta['box']
    keypoints = manta['keypoints']
    for i in range(len(keypoints)):
        keypoints[i][0] -= x
        keypoints[i][1] -= y
def get_body_part(part, keypoints):
    mapp = {"eye_1": 0, "eye_2": 1, "gill_1": 2, "gill_2": 3, "gill_3": 4,
            "gill_4": 5, "pectoral_1": 6, "pectoral_2": 7, "pelvic": 8}
    return keypoints[mapp[part]]

def manta_orientation(manta):
    # use all the keypoints to compute the orientation
    points = manta['keypoints']
    # PCA is used to compute the orientation of the points
    # https://docs.opencv.org/4.x/d1/dee/tutorial_introduction_to_pca.html
    mean, eigen_vec, eigen_val = cv2.PCACompute2(points, np.array([]))
    center = (int(mean[0, 0]), int(mean[0, 1]))
    axis_1 = (center[0] + eigen_vec[0, 0] * eigen_val[0, 0], center[1] + eigen_vec[0, 1] * eigen_val[0, 0])
    axis_2 = (center[0] - eigen_vec[1, 0] * eigen_val[1, 0], center[1] - eigen_vec[1, 1] * eigen_val[1, 0])
    angle = np.arctan2(eigen_vec[0, 1], eigen_vec[0, 0])
    return center, angle, axis_1, axis_2
fig, axes = plt.subplots(2, 2, figsize=(10, 10))
for manta, ax in zip(mantas, axes.flatten()):
    frame = cv2.imread(manta['image'])
    # crop the frame to the bounding box of the manta
    x, y, w, h = manta['box']
    frame = frame[int(y):int(y+h), int(x):int(x+w)]
    manta['orientation'] = manta_orientation(manta)
    center, angle, axis_1, axis_2 = manta['orientation']
    image_size = (frame.shape[1], frame.shape[0])
    line_width = max(int(min(image_size) * 0.005), 1)
    circle_radius = max(int(min(image_size) * 0.02), 1)
    cv2.line(frame, center, (int(axis_1[0]), int(axis_1[1])), (255, 0, 0), line_width)
    cv2.line(frame, center, (int(axis_2[0]), int(axis_2[1])), (0, 255, 0), line_width)
    cv2.circle(frame, center, circle_radius, (0, 0, 255), -1)
    angle = np.rad2deg(angle)
    for i in range(len(manta['keypoints'])):
        x, y = manta['keypoints'][i]
        color = keypoint_colors[i]
        cv2.circle(frame, (int(x), int(y)), circle_radius, color.tolist(), -1)
    rows, cols, _ = frame.shape
    frame_matrix = cv2.getRotationMatrix2D(center, angle, 1)
    frame = cv2.warpAffine(frame, frame_matrix, (cols, rows))
    ax.imshow(cv2.cvtColor(frame, cv2.COLOR_BGR2RGB))
    ax.set_title('Angle: {:.2f}'.format(angle))
    ax.axis('off')
plt.show()
Wow! Alright, a lot of information to digest. Let's break it down.
First, given the keypoints detected, we assume that there are geometric properties natural to the skeleton of the manta ray that let us orient the animal in a standard direction. We assume that spatially the manta ray is longer than it is wide. This gives us two axes: one running from the head to the tail, the other from left to right. As long as we select the right axis, we can then rotate the image so the head points towards the top of the image.
This method is not perfect, as 3D rotations are still present that orient the skeleton in a different direction. But with the sample images, we see that the green axis pierces the head in every one. The bottom-left image is nearly perfect, as it is probably the best-captured 2D representation of the underside.
To find this special geometric axis of the manta, we use the keypoints provided by the pose estimation model and calculate the "axis of least second moment", or "axis of least inertia". This axis passes through the centroid of the points (in physics terms, the center of mass) and is the direction about which the second moment of the points is smallest. A fair amount of linear algebra and calculus is involved in this calculation. A very good explanation can be found here: Geometric Properties | Binary Images.
Computationally, we use PCA (Principal Component Analysis) to calculate the eigenvectors of the covariance matrix of the keypoints. If you are familiar with PCA, you know that it is a method of projecting a dataset onto fewer dimensions such that the retained variance is maximized. In a machine learning regression context, we use this to filter out features that are not important. In this context, we want to know the overall direction, and center position, of the keypoints. Since the keypoints are distributed over the entire body, this should be close to the overall orientation of the animal. OpenCV provides a comprehensive tutorial on this, Introduction to Principal Component Analysis (PCA), from which I pulled reference code.
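If you'd like to see roughly what cv2.PCACompute2 is doing under the hood, here is a minimal NumPy sketch (my own, not from the paper) that derives the body axis from the covariance of the keypoints. The resulting angle should agree with the PCA step above up to a 180° flip, since an eigenvector's sign is arbitrary:

```python
def orientation_from_points(points):
    # Center the keypoints, compute their 2x2 covariance matrix, and take the
    # eigenvector with the largest eigenvalue as the body (major) axis.
    points = np.asarray(points, dtype=np.float64)
    center = points.mean(axis=0)
    cov = np.cov((points - center).T)
    eig_val, eig_vec = np.linalg.eigh(cov)   # eigenvalues in ascending order
    major = eig_vec[:, -1]                   # direction of greatest spread
    angle = np.arctan2(major[1], major[0])
    return center, angle

# e.g. orientation_from_points(mantas[0]['keypoints'])
```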
Now, admittedly, we could improve on this. A more accurate way to compute the center of mass would be to segment the manta and use a binary mask of the animal to determine the overall orientation. We could further improve the algorithm by adding additional checks to ensure that the axis is correct: for example, making sure the axis passes through the head and tail, and ensuring that the distances from the left eye and the right eye to the axis are similar.
Regardless, given how much the body of a manta ray bends and twists, this method will give variable centers of mass, throwing the axis off. We make the assumption here that the pose estimation model is trained on a dataset of well-taken images where the manta ray's underside is mostly parallel to the image plane.
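As a taste of what such a check could look like, here is a small sketch (my own addition, not from the paper) that tests whether the two eyes sit at roughly equal perpendicular distances from the computed axis; the tolerance value is an arbitrary placeholder:

```python
def axis_looks_plausible(manta, tol=0.25):
    # Perpendicular distance of each eye from the body axis should be roughly
    # equal if the underside is parallel to the image plane.
    center, angle, _, _ = manta['orientation']
    direction = np.array([np.cos(angle), np.sin(angle)])

    def dist_to_axis(point):
        v = np.asarray(point, dtype=np.float64) - np.asarray(center, dtype=np.float64)
        return abs(v[0] * direction[1] - v[1] * direction[0])  # 2D cross product

    d1 = dist_to_axis(get_body_part("eye_1", manta['keypoints']))
    d2 = dist_to_axis(get_body_part("eye_2", manta['keypoints']))
    return abs(d1 - d2) <= tol * max(d1, d2, 1e-6)
```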
With all this out of the way, we can continue to the next step and select the region of interest. This should be straightforward now.
for manta in mantas:
    center, angle, axis_1, axis_2 = manta['orientation']
    points = manta['keypoints'].copy()
    for i in range(len(points)):
        x, y = points[i]
        x -= center[0]
        y -= center[1]
        x_new = x * np.cos(-angle) - y * np.sin(-angle)
        y_new = x * np.sin(-angle) + y * np.cos(-angle)
        points[i] = [x_new + center[0], y_new + center[1]]
    manta['rotated_keypoints'] = points
First we need to rotate the keypoints about the center of mass to align the points with the standard orientation. If we recall from trigonometry, we can rotate a point about the origin by the following formula:
x' = x * cos(theta) - y * sin(theta)
y' = x * sin(theta) + y * cos(theta)
A refresher for this math can be found here Rotation of a point about another point. And to consider it in a matrix operation, check this out: Rotation Matrix for Coordinate Transformation
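For reference, the per-point loop above can also be written as a single matrix multiplication; here is a minimal NumPy sketch of that equivalent form:

```python
def rotate_points(points, center, angle):
    # Rotate an (N, 2) array of points about `center` by -angle,
    # mirroring the element-wise formulas used in the loop above.
    c, s = np.cos(-angle), np.sin(-angle)
    R = np.array([[c, -s],
                  [s,  c]])
    center = np.asarray(center, dtype=np.float64)
    return (np.asarray(points, dtype=np.float64) - center) @ R.T + center
```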
We can then construct a convex hull from the keypoints, and crop out the region of interest of the manta ray body.
fig, axes = plt.subplots(2, 2, figsize=(10, 10))
for manta, ax in zip(mantas, axes.flatten()):
    frame = cv2.imread(manta['image'])
    # crop the frame to the bounding box of the manta
    x, y, w, h = manta['box']
    frame = frame[int(y):int(y+h), int(x):int(x+w)]
    image_size = (frame.shape[1], frame.shape[0])
    line_width = max(int(min(image_size) * 0.005), 1)
    circle_radius = int(min(image_size) * 0.02)
    center, angle, axis_1, axis_2 = manta['orientation']
    rows, cols, _ = frame.shape
    frame_matrix = cv2.getRotationMatrix2D(center, np.rad2deg(angle), 1)
    frame = cv2.warpAffine(frame, frame_matrix, (cols, rows))
    # we discard the pectoral fin keypoints to focus
    # on the central body of the manta
    hull = np.array([
        get_body_part("eye_1", manta['rotated_keypoints']),
        get_body_part("eye_2", manta['rotated_keypoints']),
        get_body_part("gill_1", manta['rotated_keypoints']),
        get_body_part("gill_2", manta['rotated_keypoints']),
        get_body_part("gill_3", manta['rotated_keypoints']),
        get_body_part("gill_4", manta['rotated_keypoints']),
        get_body_part("pelvic", manta['rotated_keypoints']),
    ]).astype(np.int32)
    hull = cv2.convexHull(hull)
    mask = np.zeros_like(frame)
    cv2.fillPoly(mask, [hull], (255, 255, 255))
    frame = cv2.bitwise_and(frame, mask)
    hull_box = cv2.boundingRect(hull)
    x, y, w, h = hull_box
    frame = frame[y:y+h, x:x+w]
    manta['cropped_hull'] = frame.copy()
    ax.imshow(cv2.cvtColor(frame, cv2.COLOR_BGR2RGB))
    ax.axis('off')
plt.show()
Amazing! The selection of the keypoints to use in the convex hull is very important, and it largely depends on the biology of the animal. Looking to expert opinion on this, we know that the original research paper simply selects a 2D bounding box with the manta's midsection centered. This midsection covers the body from the top gills to just above the pelvic fins. But others have also deployed a technique very similar to the one we are choosing, which is described here: Manta Trust - Manta Base.
Either way, we can be confident that this selected region will have enough unique features to identify the manta ray. We can now progress to the next step of image enhancement.
In the original paper, they found that the best enhancement technique was a combination of median blur, to reduce noise, with contrast-limited adaptive histogram equalization, or CLAHE.
Median blur is a simple filter that replaces each pixel with the median value of its kernel neighborhood. The larger the kernel, the more noise is removed, but the more detail is lost. Median blur is very commonly used to remove "salt and pepper" noise in images, but it is not the most robust at retaining detail. Bilateral filtering is a more advanced, non-linear technique that is better at retaining detail: it applies a Gaussian blur kernel where only pixels that are similar in intensity are considered. Intuition would tell us that this may be better suited for our task, since we want to preserve as much detail in the black splotches as possible. For this tutorial, we will stick with median blur, but a quick comparison is sketched below.
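To see the trade-off for yourself, here is a side-by-side sketch of the two filters on one of our crops; the kernel size and sigma values are placeholder choices to experiment with, not tuned parameters:

```python
# Compare median blur against bilateral filtering on the first cropped manta.
sample = cv2.cvtColor(mantas[0]['cropped_hull'], cv2.COLOR_BGR2GRAY)
median = cv2.medianBlur(sample, 5)                  # median of each 5x5 neighborhood
bilateral = cv2.bilateralFilter(sample, 9, 75, 75)  # edge-preserving smoothing

fig, ax = plt.subplots(1, 3, figsize=(15, 5))
panels = [(sample, 'original'), (median, 'median blur'), (bilateral, 'bilateral filter')]
for a, (img, title) in zip(ax, panels):
    a.imshow(img, cmap='gray')
    a.set_title(title)
    a.axis('off')
plt.show()
```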
As usual, OpenCV provides a very good tutorial on image filtering: 2D Convolution (Image Filtering)
CLAHE is a different technique, used for contrast adjustment. In plain histogram equalization, the intensity histogram of a grayscale image is analyzed and its values are redistributed to spread the contrast across the full intensity range. CLAHE makes that technique "adaptive" by applying it across local tiles of the image, with a clip limit that keeps noise from being over-amplified. The paper describes this as useful since images of mantas feature a wide range of lighting conditions due to camera flashes, sunlight, and water clarity. This is a very good tutorial on CLAHE: Histogram Equalization
fig, axes = plt.subplots(2, 2, figsize=(10, 10))
for manta, ax in zip(mantas, axes.flatten()):
    frame = manta['cropped_hull'].copy()
    # convert the image to grayscale
    gray = cv2.cvtColor(frame, cv2.COLOR_BGR2GRAY)
    # apply a median filter to reduce noise
    gray = cv2.medianBlur(gray, 5)
    # apply CLAHE for adaptive contrast equalization
    clahe = cv2.createCLAHE(clipLimit=2.0, tileGridSize=(8, 8))
    gray = clahe.apply(gray)
    manta['gray'] = gray
    ax.imshow(gray, cmap='gray')
    ax.axis('off')
plt.show()
Trying different hyperparameters for the blur filter and CLAHE will be important, and further tuning will be required to find the best combination once we collect a larger dataset. For now, this works pretty well!
Now, we can get to the final step of identifying the unique features of the manta ray. We will deploy a technique called SIFT (Scale-Invariant Feature Transform) for this problem. After applying contrast equalization, noise removal, and rotating the image to a standard orientation, there still won't be perfect continuity from one image to the next. SIFT is a very robust algorithm that can find blobs in the image that are invariant to these minor changes (assuming the changes are not too drastic).
SIFT is a very mathematical algorithm: it works by identifying keypoint blobs and calculating their local gradients from the intensities of the pixels around each blob. These keypoints and their gradient histograms (descriptors) are then used to create a unique set of markers that can be matched against other images when similar keypoints are found.
OpenCV has a great tutorial here: Introduction to SIFT (Scale-Invariant Feature Transform). And an amazing YouTube series on the math is available here: Edge Detection | Boundary Detection | SIFT Detector
fig, axes = plt.subplots(2, 2, figsize=(10, 10))
for manta, ax in zip(mantas, axes.flatten()):
    gray = manta['gray'].copy()
    sift = cv2.SIFT_create()
    keypoints, descriptors = sift.detectAndCompute(gray, None)
    manta["sift"] = {
        "keypoints": keypoints,
        "descriptors": descriptors
    }
    gray = cv2.drawKeypoints(gray, keypoints, gray, flags=cv2.DRAW_MATCHES_FLAGS_DRAW_RICH_KEYPOINTS)
    ax.imshow(gray, cmap='gray')
    ax.axis('off')
plt.show()
These plots show the blob keypoints detected and the overall direction of the gradient in each blob. Depending on the clarity of the image, we may get more or fewer keypoints than we would like. Multiple images of the same animal should be captured so we have descriptors at different scales, angles, and lighting conditions. You can see that the bottom-right image was the most difficult for feature detection, as the brightness and focus are very poor.
Let's take a look at the features to get a better understanding of what we are looking at.
keypoint = mantas[0]['sift']['keypoints'][0]
keypoint.pt, keypoint.size, keypoint.angle, keypoint.response, keypoint.octave
((7.386290073394775, 213.12411499023438), 4.260604381561279, 98.21598052978516, 0.031134868040680885, 12321024)
The keypoints represent the markers drawn on the image: we see the center point, the size of the blob, and its dominant angle, along with the detector response and the octave (scale level) at which it was found.
descriptor = mantas[0]['sift']['descriptors'][0]
descriptor.shape, descriptor
((128,), array([ 1., 36., 38., 0., 0., 0., 0., 0., 16., 38., 31., 1., 1., 9., 4., 6., 63., 7., 1., 0., 0., 6., 26., 138., 3., 0., 0., 0., 0., 11., 99., 79., 12., 54., 64., 0., 0., 0., 1., 9., 83., 68., 22., 0., 0., 0., 13., 31., 138., 42., 10., 3., 0., 0., 7., 75., 31., 7., 58., 64., 3., 12., 34., 33., 82., 138., 26., 0., 0., 0., 4., 32., 104., 35., 1., 2., 7., 17., 111., 111., 132., 65., 138., 59., 15., 14., 27., 23., 9., 13., 138., 138., 0., 0., 0., 0., 25., 71., 7., 0., 0., 0., 0., 1., 44., 24., 0., 1., 4., 8., 9., 11., 0., 1., 18., 17., 9., 7., 3., 0., 0., 0., 16., 20., 0., 0., 0., 0.], dtype=float32))
The descriptors represent the vector of binned gradients around the blob. A 16x16 region is taken around the keypoint and divided into 4x4 sub-blocks; for each sub-block, an 8-bin histogram of gradient orientations is computed, and concatenating these histograms gives the 128-dimensional descriptor (4 x 4 x 8 = 128). A better description of the method is found in the YouTube lecture series above.
Effectively, these descriptors represent a unique fingerprint for that specific blob and can be compared against blobs in other images. A comparison is made, and based on the similarity of the descriptors, a match is found. Many different methods are available to compare these descriptors, employing distance metrics like Euclidean distance or cosine similarity. These methods deserve their own tutorial series, as they cover a wide range of topics in machine learning and computer vision, but a tiny illustration follows below.
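As a tiny illustration of those metrics, here is how you might compare a single descriptor from the first manta against one from the second (purely to show the arithmetic, not a matching strategy):

```python
d1 = mantas[0]['sift']['descriptors'][0].astype(np.float32)
d2 = mantas[1]['sift']['descriptors'][0].astype(np.float32)

euclidean = np.linalg.norm(d1 - d2)                                   # L2 distance
cosine = np.dot(d1, d2) / (np.linalg.norm(d1) * np.linalg.norm(d2))   # cosine similarity
print('Euclidean distance:', euclidean)
print('Cosine similarity:', cosine)
```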
A robust library for different methods of vector similarity is made available by Facebook, called FAISS. It provides Python bindings to C++ code that can even be deployed on GPUs.
OpenCV also provides its own feature matching algorithms that can be used to compare descriptors. You can review them here: Feature Matching. They rely on similar vector similarity methods to FAISS.
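For completeness, here is a small sketch of what that OpenCV route could look like, using a brute-force matcher with Lowe's ratio test (the 0.75 ratio is a conventional placeholder, not a tuned value):

```python
# Match the first manta's descriptors against the second's with OpenCV's
# brute-force matcher, keeping only matches that pass the ratio test.
bf = cv2.BFMatcher(cv2.NORM_L2)
raw_matches = bf.knnMatch(mantas[0]['sift']['descriptors'],
                          mantas[1]['sift']['descriptors'], k=2)
good = [pair[0] for pair in raw_matches
        if len(pair) == 2 and pair[0].distance < 0.75 * pair[1].distance]
print('Matches passing the ratio test:', len(good))
```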
But I wanted to use a more popular choice for arbitrary vector search to show how a potential database of hundreds or even millions of manta ray fingerprints could be stored and searched. Let's try to reformat the keypoints and descriptors to see how they could be embedded into a search index for a database.
import faiss
indicies = []
embeddings = []
index_s = 0
for manta in mantas:
    descriptors = manta['sift']['descriptors']
    for descriptor in descriptors:
        embeddings.append(descriptor)
    # we store the inclusive range of indicies for each manta; the position
    # in the array is the index of the manta in our list
    index_e = index_s + len(descriptors) - 1
    indicies.append((index_s, index_e))
    index_s = index_e + 1
indicies = np.array(indicies)
embeddings = np.array(embeddings).astype(np.float32)
dimensions = embeddings.shape[1]
index = faiss.IndexFlatL2(dimensions)
index.add(embeddings)
print('Indicies:', indicies.shape)
print('Embeddings:', embeddings.shape)
Indicies: (4, 2) Embeddings: (1087, 128)
indicies
array([[ 0, 674], [ 675, 911], [ 912, 1068], [1069, 1086]])
FAISS is an incredibly complex library with many optimizations for searching very large datasets. Anything that can be represented as a vector, where you need to search for similar vectors, can be used with FAISS. So I won't go too far into the details (maybe in another tutorial). For starters, a wonderful tutorial series on YouTube can be found here: Vector Similarity Search and Faiss Course
What I have done is take each of the descriptors and compile them into one large matrix. To keep track of which descriptors belong to which manta ray, I created a second array (indicies) that stores the inclusive index range for each manta.
Next, I create a FAISS index called faiss.IndexFlatL2. Its base implementation uses a brute-force search with L2, or Euclidean, distance. This is a very simple method and not the most efficient, but it is a good starting point for our tutorial.
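Conceptually, the search it performs is nothing more exotic than the following NumPy sketch:

```python
# What IndexFlatL2 does in spirit: compute the squared L2 distance from one
# query vector to every stored vector and take the smallest.
query = embeddings[0]
squared_distances = np.sum((embeddings - query) ** 2, axis=1)
print('Closest index:', np.argmin(squared_distances))  # 0, the query itself
```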
Using any set of descriptors, we can then search for the most similar descriptors in that index. If we use the descriptors of the first manta, let's examine the results.
embeddings = mantas[0]['sift']['descriptors']
embeddings = np.array(embeddings).astype(np.float32)
k = 5
distances, neighbors = index.search(embeddings[0].reshape(1, -1), k)
print('Neighbors:', neighbors)
print('Distances:', distances)
Neighbors: [[ 0 1078 1077 649 1058]] Distances: [[ 0. 142767. 148252. 153261. 168205.]]
Searching the index, we can pass in a k parameter, which returns the k most similar vectors. For the first descriptor blob of the first manta, we can see the top result is 0, which is literally an exact match to itself! In addition, we see that the distance to the next most similar vector is much higher than the first.
Now let's pass in all the descriptors of the first manta, and view the single top result.
distances, neighbors = index.search(embeddings, 1)
for i, (start, end) in enumerate(indicies):
    matches = np.sum((neighbors >= start) & (neighbors <= end))
    print(f'Total descriptor for manta {i}: {matches}')
Total descriptor for manta 0: 675 Total descriptor for manta 1: 0 Total descriptor for manta 2: 0 Total descriptor for manta 3: 0
And we see exactly the result we are looking for: all of the descriptors of the first manta match back to the first manta's vectors in the FAISS index. It worked out here that there were 0 matches to any other mantas, but since we have such a small index, that is not surprising. With a larger index (more mantas), we could expect to see more spurious matches. In addition, more advanced methods of indexing and searching could be used that come with a trade-off between speed and accuracy; a small sketch follows below.
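As an example of one of those more advanced options, here is a sketch of an IVF index in FAISS, which clusters the vectors and only searches the few clusters nearest the query; the nlist and nprobe values here are placeholders sized for our tiny toy index:

```python
# Rebuild the full descriptor matrix and index it with an IVF (inverted file)
# index: vectors are grouped into nlist clusters, and only the nprobe closest
# clusters are scanned at query time.
all_embeddings = np.array(
    [d for m in mantas for d in m['sift']['descriptors']], dtype=np.float32)

nlist = 4                                        # number of clusters
quantizer = faiss.IndexFlatL2(dimensions)        # used to assign vectors to clusters
ivf_index = faiss.IndexIVFFlat(quantizer, dimensions, nlist)
ivf_index.train(all_embeddings)                  # learn cluster centroids
ivf_index.add(all_embeddings)
ivf_index.nprobe = 2                             # clusters searched per query

distances, neighbors = ivf_index.search(all_embeddings[:1], 5)
print('Neighbors:', neighbors)
```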
Conclusion¶
What a fun project to work on. The ocean will continue to be a source of inspiration for me, and I hope to keep working on projects like this in the future. I hope this tutorial and project were as fun to read as they were to write.