Exploring Different Algorithms for Dominant Color Extraction
In the AinaScan Project we have been exploring the classification of leaves into the categories of "defective" and "healthy". These categories are intentionally broad because "defective" could mean many things: disease, pests, deficiencies, algae, fungi, or all of the above. The goal is to quickly classify the leaves using a lightweight model so the defective leaves can be further analyzed by more sophisticated models.
One way we have approached this is by classifying the leaf by its dominant color. When manually annotating, it becomes very clear that the color of the leaf alone is a good indicator of its health. Blotches of yellow, brown, black, and even white could be many things, but on coffee they are very often a defect!
In this notebook, we will explore two different algorithms and see which one is lightweight, fast, and accurate enough for our purposes!
Extracting the Mask
First we need a leaf. Specifically, we need the mask of a diseased leaf. As a test, we can pull some images from a coffee disease dataset I found on Kaggle, then use a simple HSV color filter to extract the leaf from the background. No need for a big ole instance segmentation model here! I had to play with the thresholds a bit, but it was pretty easy to get a good mask.
import matplotlib.pyplot as plt
import numpy as np
import cv2

frame = cv2.imread('/home/jack/Mounts/DiskOne/kona_coffee/external/mendeley_rust_miner/rust/name39.jpg')
frame = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)

# threshold in HSV space to separate the leaf from the background
lower_color = np.array([2, 40, 40])
upper_color = np.array([250, 255, 255])
mask = cv2.inRange(cv2.cvtColor(frame, cv2.COLOR_RGB2HSV), lower_color, upper_color)

# smooth and shrink the mask to clean up noise at the edges
mask = cv2.blur(mask, (11, 11))
mask = cv2.erode(mask, None, iterations=5)
mask[mask > 0] = 1

# keep only the largest contour: the leaf itself
visual = frame.copy()
contours = cv2.findContours(mask, cv2.RETR_EXTERNAL, cv2.CHAIN_APPROX_SIMPLE)[0]
contour = max(contours, key=cv2.contourArea)

# overlay the filled contour on the original image for visualization
alpha = np.zeros_like(visual)
cv2.drawContours(alpha, [contour], -1, (255, 0, 0), -1)
visual = cv2.addWeighted(visual, 1, alpha, 0.2, 0)
visual = cv2.drawContours(visual, [contour], -1, (255, 0, 0), 2)

# crop everything down to the leaf's bounding box
bbox = cv2.boundingRect(contour)
cropped_mask = mask[bbox[1]:bbox[1]+bbox[3], bbox[0]:bbox[0]+bbox[2]]
cropped_frame = frame[bbox[1]:bbox[1]+bbox[3], bbox[0]:bbox[0]+bbox[2]]
visual = visual[bbox[1]:bbox[1]+bbox[3], bbox[0]:bbox[0]+bbox[2]]

plt.figure(figsize=(10, 10))
plt.imshow(visual)
plt.axis('off')
plt.show()
Extracting the Dominant Colors
Now that we have the mask, we can start extracting the dominant colors. There are a multitude of ways to do this, but we can start off with a very naive approach and use the KMeans algorithm.
KMeans Extraction
Everyone is familiar with KMeans (if you're not, I suggest you read about it! Very useful algorithm). Once we have the mask, we flatten the image and run it through the algorithm. KMeans gives us a list of centroids, which are the colors the algorithm converged on as separate clusters.
import time
from sklearn.cluster import KMeans

start_time = time.time()
# we only want to cluster the pixels inside the mask
x = cropped_frame[cropped_mask == 1]
# reshape to be 3 features: R, G, B
x = x.reshape(-1, 3) / 255
cluster = KMeans(n_clusters=50)
cluster.fit(x)
dominant_colors = cluster.cluster_centers_
print(f'Elapsed {time.time() - start_time:.2f} seconds')

# render each centroid as a 100x100 swatch for inspection
colors_image = np.zeros((100, 100 * len(dominant_colors), 3), dtype=np.uint8)
for i, color in enumerate(dominant_colors):
    colors_image[:, i*100:(i+1)*100] = color * 255
plt.figure(figsize=(10, 10))
plt.imshow(colors_image)
plt.axis('off')
plt.show()
Elapsed 2.56 seconds
We can see that the dominant colors were certainly extracted. Many of the oranges, browns, and yellows from the mask are present, which is the desired outcome. This is certainly a promising start! But at around 2.5 seconds per image, this is not going to be fast enough for our purposes. This should be milliseconds, not seconds! Compressing the image first would certainly help us achieve faster clustering times. We could also explore other clustering libraries like Faiss, or try different distance metrics.
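Before switching libraries, here is a quick sketch of the subsampling idea: cluster only a random subset of the masked pixels, and use MiniBatchKMeans, which fits on small random batches instead of the full pixel set. Both MiniBatchKMeans and the 10,000-pixel cap are my own choices here, not something tuned for this dataset; x is the masked pixel array from the cell above.

from sklearn.cluster import MiniBatchKMeans

start_time = time.time()
# cluster a random subset of the masked pixels instead of all of them;
# the 10,000-pixel cap is an arbitrary, untuned choice
rng = np.random.default_rng(42)
sample_size = min(10_000, len(x))
sample = x[rng.choice(len(x), sample_size, replace=False)]
cluster = MiniBatchKMeans(n_clusters=50)
cluster.fit(sample)
print(f'Elapsed {time.time() - start_time:.2f} seconds')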
Utilizing PIL to Compress the Image
The Image module in PIL has a convert method with built-in color quantization that we can take advantage of. Perhaps the library has already optimized the speed for us!
from PIL import Image

pil_image = cropped_frame.copy()
start_time = time.time()
# set the background to white; this is the best we can do to minimize
# including the background in the clustering
pil_image[np.logical_not(cropped_mask)] = 255
pil_image = Image.fromarray(pil_image)
# 'P' mode quantizes the image down to an adaptive 50-color palette
paletted = pil_image.convert('P', palette=Image.ADAPTIVE, colors=50)
palette = paletted.getpalette()
color_idxs = paletted.getcolors()
dominant_colors = [palette[idx*3:idx*3+3] for _, idx in color_idxs]
print(f'Elapsed {time.time() - start_time:.2f} seconds')

colors_image = np.zeros((100, 100 * len(dominant_colors), 3), dtype=np.uint8)
for i, color in enumerate(dominant_colors):
    colors_image[:, i*100:(i+1)*100] = color
plt.figure(figsize=(10, 10))
plt.imshow(colors_image)
plt.axis('off')
plt.show()
Elapsed 0.17 seconds
Wow! The speed is much faster at around 0.15 seconds per image. But since we have no way to restrict the quantization to only the pixels within the mask, the returned colors include the white background. This is not ideal, but it is something regularization can account for when we train our model: since these white colors carry no signal, we hope the model learns to ignore them. Further, the dominant colors it returns are much more muted than those from the KMeans approach. Without fine-tuning a model, it is hard to say whether that is good or bad; what looks informative to our eyes is not always what the model needs in order to learn the patterns.
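Alternatively, if the background ends up confusing a downstream model, one hypothetical mitigation is to drop near-white palette entries before building the feature vector. This is only a sketch, not something validated here; the per-channel threshold of 250 is an arbitrary assumption.

# Hypothetical post-filter: drop palette entries close to the white background
# fill. The >250 per-channel threshold is an untuned assumption.
palette_colors = np.array(dominant_colors)
is_background = np.all(palette_colors > 250, axis=1)
filtered_colors = palette_colors[~is_background]
print(f'Kept {len(filtered_colors)} of {len(palette_colors)} colors')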
Training A Model on the Extracted Colors
Now that we have established our two extraction methods, we can train a model on these features and see which one tends to perform better. We need a lot more data to do this, but fortunately I have already generated masks (stored as contours) for the full dataset. We can load the data, extract the features with the two methods, and train a simple model to see which one performs better. This process is very computationally heavy, so I am resizing the images and using a thread pool to speed things up.
import pandas as pd
df = pd.read_parquet('dataset.parquet')
source_dir = df.iloc[0].source_dir
df = df.drop(columns=['source_dir'])
df
| | image | contour | defect | defective |
|---|---|---|---|---|
| 3015 | miner/41.jpg | [1147, 241, 1146, 242, 1142, 242, 1141, 243, 1... | miner | True |
| 4698 | phoma/279.jpg | [1056, 88, 1055, 89, 1043, 89, 1042, 90, 1034,... | phoma | True |
| 5404 | rust/1579.jpg | [1202, 186, 1201, 187, 1194, 187, 1193, 188, 1... | rust | True |
| 6309 | phoma/551.jpg | [1284, 229, 1283, 230, 1279, 230, 1278, 231, 1... | phoma | True |
| 4456 | phoma/320.jpg | [331, 226, 330, 227, 330, 237, 331, 238, 331, ... | phoma | True |
| ... | ... | ... | ... | ... |
| 6194 | nodisease/1197.jpg | [958, 141, 957, 142, 944, 142, 943, 143, 936, ... | nodisease | False |
| 6195 | nodisease/1197.jpg | [958, 141, 957, 142, 944, 142, 943, 143, 936, ... | nodisease | False |
| 6197 | nodisease/1209.jpg | [1010, 154, 1009, 155, 1001, 155, 1000, 156, 9... | nodisease | False |
| 6198 | nodisease/1209.jpg | [1010, 154, 1009, 155, 1001, 155, 1000, 156, 9... | nodisease | False |
| 6199 | nodisease/1209.jpg | [1010, 154, 1009, 155, 1001, 155, 1000, 156, 9... | nodisease | False |

1694 rows × 4 columns
from tqdm import tqdm
from concurrent.futures import ThreadPoolExecutor

def get_features(row):
    image_path = f'{source_dir}/{row.image}'
    frame = cv2.imread(image_path)
    frame = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)
    # rebuild the mask from the stored contour
    contour = np.array(row.contour).reshape(-1, 2)
    mask = np.zeros(frame.shape[:2], dtype=np.uint8)
    cv2.drawContours(mask, [contour], -1, 1, -1)
    # crop to the leaf's bounding box
    bbox = cv2.boundingRect(contour)
    frame = frame[bbox[1]:bbox[1]+bbox[3], bbox[0]:bbox[0]+bbox[2]]
    mask = mask[bbox[1]:bbox[1]+bbox[3], bbox[0]:bbox[0]+bbox[2]]
    # resize to 512x512 for faster computation; nearest-neighbor keeps the mask binary
    frame = cv2.resize(frame, (512, 512))
    mask = cv2.resize(mask, (512, 512), interpolation=cv2.INTER_NEAREST)
    # kmeans clustering
    x = frame[mask == 1]
    x = x.reshape(-1, 3) / 255
    model = KMeans(n_clusters=50)
    model.fit(x)
    kmeans_dominant_colors = model.cluster_centers_
    # PIL computation
    pil_image = frame.copy()
    pil_image[np.logical_not(mask)] = 255
    pil_image = Image.fromarray(pil_image)
    paletted = pil_image.convert('P', palette=Image.ADAPTIVE, colors=50)
    palette = paletted.getpalette()
    color_idxs = paletted.getcolors()
    pil_dominant_colors = np.array([palette[idx*3:idx*3+3] for _, idx in color_idxs]) / 255
    return pil_dominant_colors.flatten(), kmeans_dominant_colors.flatten()

pool = ThreadPoolExecutor(8)
futures = []
columns = []
loader = tqdm(total=len(df), desc='Processing Frames')
for row in df.itertuples():
    futures.append(pool.submit(get_features, row))
# collect results in submission order so the features stay aligned with the rows of df
for future in futures:
    columns.append(future.result())
    loader.update(1)
columns = np.array(columns)
loader.close()
df['pil_method'] = list(columns[:, 0])
df['kmeans_method'] = list(columns[:, 1])
df.to_parquet('features.parquet')
Processing Frames: 100%|ββββββββββ| 1694/1694 [05:01<00:00, 5.62it/s]
A very expensive operation, but we save the result so we don't have to run it again. We can now look at the two feature sets side by side by building an image from a sample of the extracted colors.
sample_size = 100
features = 50
s1 = df[df.defective==True].sample(sample_size // 2)
s2 = df[df.defective==False].sample(sample_size // 2)
samples = pd.concat([s1, s2])
shape = (sample_size, features, 3)
pil_colors = np.zeros(shape, dtype=np.uint8)
kms_colors = np.zeros(shape, dtype=np.uint8)
for y, row in enumerate(samples.itertuples()):
    pil_method = np.array(row.pil_method).reshape(-1, 3) * 255
    kms_method = np.array(row.kmeans_method).reshape(-1, 3) * 255
    # sort the colors by their norm to make the comparison easier to distinguish;
    # this gives less randomness to the order of the colors
    pil_method = pil_method[np.argsort(np.linalg.norm(pil_method, axis=1))]
    kms_method = kms_method[np.argsort(np.linalg.norm(kms_method, axis=1))]
    for x in range(features):
        pil_colors[y:y+1, x:(x+1)] = pil_method[x]
        kms_colors[y:y+1, x:(x+1)] = kms_method[x]
pil_colors = cv2.copyMakeBorder(pil_colors, 1, 1, 1, 1, cv2.BORDER_CONSTANT, value=255)
kms_colors = cv2.copyMakeBorder(kms_colors, 1, 1, 1, 1, cv2.BORDER_CONSTANT, value=255)
fig, ax = plt.subplots(1, 2, figsize=(5, 5))
ax[0].imshow(kms_colors)
ax[0].axis('off')
ax[1].imshow(pil_colors)
ax[1].axis('off')
plt.show()
With the top rows being defective leaves and the bottom rows healthy ones, we can see that the KMeans approach looks very different from the PIL approach when the results are visualized side by side. The KMeans approach seems to pick up a lot more of the defect colors (the browns and oranges), whereas the PIL approach filters more of those colors out. Intuitively, we need our feature extractor to pick up on even minor color changes if we want a very sensitive model. That would logically suggest KMeans is the better approach, but we can't know for sure until we train a model.
We will start with a logistic regression model, as it is the de facto standard baseline classification model to explore.
from sklearn.metrics import f1_score, precision_recall_curve, roc_curve, confusion_matrix
import seaborn as sns
sns.set_theme(style='whitegrid')

def plot_classifier(model, x_test, y_test, title):
    y_pred = model.predict(x_test)
    f1 = f1_score(y_test, y_pred)
    # curves are computed from the positive-class probabilities
    proba = model.predict_proba(x_test)[:, 1]
    precision, recall, _ = precision_recall_curve(y_test, proba)
    fpr, tpr, _ = roc_curve(y_test, proba)
    conf_matrix = confusion_matrix(y_test, y_pred)
    fig, ax = plt.subplots(1, 3, figsize=(20, 5))
    # padding at top
    plt.subplots_adjust(top=0.85)
    ax[0].set_title('Confusion Matrix')
    ax[0].set_xlabel('Predicted')
    ax[0].set_ylabel('Actual')
    sns.heatmap(conf_matrix, annot=True, fmt='d', cmap='Blues', ax=ax[0])
    ax[1].plot(recall, precision, color='b')
    ax[1].fill_between(recall, precision, alpha=0.2, color='b')
    ax[1].set_xlabel('Recall')
    ax[1].set_ylabel('Precision')
    ax[1].set_title('Precision Recall Curve')
    ax[2].plot(fpr, tpr, color='b')
    ax[2].fill_between(fpr, tpr, alpha=0.2, color='b')
    ax[2].set_xlabel('False Positive Rate')
    ax[2].set_ylabel('True Positive Rate')
    ax[2].set_title('ROC Curve')
    plt.suptitle(f'{title} | F1 {f1:.2f}')
    plt.show()
from sklearn.model_selection import train_test_split
from sklearn.linear_model import LogisticRegression
from sklearn.preprocessing import MinMaxScaler
from sklearn.pipeline import Pipeline

df = df.reset_index()
model = Pipeline([
    ('scaler', MinMaxScaler()),
    ('classifier', LogisticRegression())
])
y = df['defective'].astype(int)

# PIL features: sort each sample's colors by norm, flatten to 150 values (50 colors x RGB)
x = df.pil_method.apply(lambda v: np.array(v).reshape(-1, 3) * 255)
x = np.array(x.apply(lambda v: v[np.argsort(np.linalg.norm(v, axis=1))]).tolist()).reshape(-1, 150)
x_train, x_test, y_train, y_test = train_test_split(x, y, test_size=0.2, random_state=42)
model.fit(x_train, y_train)
plot_classifier(model, x_test, y_test, 'PIL Method')

# same treatment for the KMeans features
x = df.kmeans_method.apply(lambda v: np.array(v).reshape(-1, 3) * 255)
x = np.array(x.apply(lambda v: v[np.argsort(np.linalg.norm(v, axis=1))]).tolist()).reshape(-1, 150)
x_train, x_test, y_train, y_test = train_test_split(x, y, test_size=0.2, random_state=42)
model.fit(x_train, y_train)
plot_classifier(model, x_test, y_test, 'KMeans Method')
Even though I somewhat doubted the method, the PIL approach actually performed quite well compared to the KMeans approach. Both approaches give us nearly a 0.9 F1 score, but it's clear the PIL approach produces more false positives.
We could explore other models and other scoring methodologies, and we could add more data, since this is a rather small dataset to work with. But if this were the production dataset and no further tests were conducted, we would conclude that the PIL method does degrade accuracy slightly, while being much faster and more lightweight. Have to pick your poison!
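As a sketch of what one such follow-up could look like, we might cross-validate both feature sets with the same pipeline rather than relying on a single train/test split. The 5-fold choice is arbitrary, and sorted_features below is just a hypothetical helper that rebuilds the sorted feature matrices used above.

from sklearn.model_selection import cross_val_score

def sorted_features(series):
    # rebuild the sorted (N, 150) feature matrix used above
    arrs = series.apply(lambda v: np.array(v).reshape(-1, 3) * 255)
    arrs = arrs.apply(lambda v: v[np.argsort(np.linalg.norm(v, axis=1))])
    return np.array(arrs.tolist()).reshape(-1, 150)

for name, column in [('PIL', df.pil_method), ('KMeans', df.kmeans_method)]:
    scores = cross_val_score(model, sorted_features(column), y, cv=5, scoring='f1')
    print(f'{name}: F1 {scores.mean():.2f} +/- {scores.std():.2f}')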
Conclusion
A few important notes to consider from what we explored in this notebook:
This is a very basic binary classification problem: why not just use a convolutional neural network? CNNs are computationally expensive and typically require GPUs to run. Would it not save your organization thousands on cloud GPUs if you could solve the problem (with ~90% accuracy) with a simple logistic regression model?
Utilizing the PIL library to extract features, we went from about 2.5 seconds per image to 0.15 seconds per image: roughly a 17x speedup! This is a huge improvement, and could be the difference between a model that runs on a local machine and one that requires a cloud GPU. We save costs and time for our organization and for our users.
Yes, we can classify healthy and defective leaves with a very simple model. We just need an intelligent feature extractor and an understanding of the domain we are working in. We could use a CNN to extract features automatically, but at the cost of speed and complexity.
We shouldn't underestimate the power of simplicity. With this approach we have a simple model whose internals are easy to explain. We can dive into the feature space and understand why the model makes the decisions it makes. In this case, it could very well be important to understand why a leaf is classified as defective.
Finally, although intuition and logic are great at helping us make decisions, they shouldn't necessarily be the decision makers. We initially thought the PIL approach would be worse than the KMeans approach (admittedly, I thought it would be much worse), but the results showed it was only slightly worse. With more data, more tuning, and a series of oversampling and cross-validation runs, we may even find that the PIL approach is equal to or better than the KMeans approach! Statistics is fascinating in that way.