import numpy as np
from matplotlib import pyplot as plt
import sklearn
from sklearn import datasets
import cv2
def plot_images(images, rows, cols, titles=None, figsize=(20,7)):
    fig, axarr = plt.subplots(rows, cols, figsize=figsize)
    axarr = np.array(axarr).reshape(-1)
    for i, ax in enumerate(axarr):
        ax.imshow(images[i], cmap='gray')
        ax.axis('off')
        if titles:
            ax.set_title(titles[i])
    plt.tight_layout()
    plt.show()
#All rights reserved to n0acar (github username)
def plot_portraits(images, n_row, n_col, titles, h, w):
    plt.figure(figsize=(2.2 * n_col, 2.2 * n_row))
    plt.subplots_adjust(bottom=0, left=.01, right=.99, top=.90, hspace=.20)
    for i in range(n_row * n_col):
        plt.subplot(n_row, n_col, i + 1)
        plt.imshow(images[i].real.reshape((h, w)), cmap=plt.cm.gray)
        plt.title(titles[i])
        plt.xticks(())
        plt.yticks(())
#Taking a picture of you:
camera = cv2.VideoCapture(1)   #device index may differ; 0 is usually the built-in camera
ret, frame = camera.read()
if ret:
    bgrFace = np.array(frame)  #OpenCV returns images in BGR channel order
else:
    print("Failed to capture frame")
camera.release()
cv2.destroyAllWindows()
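If you don't have a camera available (or the capture fails), you can load a saved photo from disk instead. This is a minimal sketch, and 'my_photo.jpg' is a hypothetical filename you should replace with your own:
#Hypothetical fallback: read a photo from disk instead of using the camera
#frame = cv2.imread('my_photo.jpg')   #replace with the path to your own image
#ret = frame is not None
#if ret:
#    bgrFace = np.array(frame)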
plt.figure(figsize=(10,10))
plt.imshow(cv2.cvtColor(frame, cv2.COLOR_BGR2RGB))
plt.show()
#Converting to grayscale and plotting new image:
gsFace = cv2.cvtColor(bgrFace, cv2.COLOR_BGR2GRAY)
plt.figure(figsize=(10,10))
plt.imshow(gsFace, cmap = 'gray')
#Next, we convert this image into a 64x64 pixel array:
height, width = gsFace.shape
#Cropping the sides:
croppedFace = gsFace[0 : height, (width-height)//2 : width - (width-height)//2]
#Note that this assumes width > height. If your camera produces an image with height > width,
#Comment out the last line and use this instead:
# croppedFace = gsFace[(height-width)//2 : height - (height-width)//2, 0:width]
#Scaling it down (taking the average of neighboring pixels):
scaledFace = np.zeros(shape=(64,64))
div = height//64
k, q = 0, 0
for i in range(64):
    for j in range(64):
        scaledFace[i,j] = np.mean(croppedFace[k : k + div, q : q + div])
        q += div
    k += div
    q = 0
#As a last step, we normalize the array to match the dataset we'll use:
scaledFaceNormalized = (scaledFace - np.min(scaledFace))/np.ptp(scaledFace)
#Note that this approach is very rudimentary: we just crop the sides until the image is square and scale it down.
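If you'd rather not write the downscaling loop by hand, OpenCV can do the same shrink in one call. This is a minimal alternative sketch, not part of the original pipeline; cv2.INTER_AREA averages over pixel areas, much like the loop above:
#Equivalent one-liner using OpenCV (assumes croppedFace from above):
#resized = cv2.resize(croppedFace, (64, 64), interpolation=cv2.INTER_AREA)
#resizedNormalized = (resized - np.min(resized)) / np.ptp(resized)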
#We now have an appropriate array to work with!
plt.figure(figsize=(5,5))
plt.imshow(scaledFaceNormalized, cmap = 'gray')
Onto SVD!
#Getting the dataset we'll use to perform SVD:
olivetti = sklearn.datasets.fetch_olivetti_faces()
faces = olivetti['data']
'faces' is a 400x4096 array: 400 instances of 64x64 face images, each flattened and stored as a row. We'll call the faces dataset $F$. We want to perform the following decomposition:
$$F = U \Sigma V^T$$
We can do this with a numpy function, or we can do it manually.
We know the columns of $U$ are the unit eigenvectors of $FF^T$.
We know the columns of $V$ are the unit eigenvectors of $F^TF$.
We know $\Sigma$ is a 'pseudo-diagonal' matrix whose diagonal entries are the singular values of $F$, i.e. the square roots of the (shared) nonzero eigenvalues of $FF^T$ and $F^TF$.
We also know the singular values in $\Sigma$ must be sorted consistently with the eigenvectors in $U$ and $V$ (conventionally in descending order).
With this in mind, we can find these values:
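Before running numpy's built-in routine on the full dataset, here is a minimal sketch of the manual route on a tiny random matrix (a small addition, not part of the original demo). Up to sign ambiguity in the eigenvectors, the eigendecomposition of $AA^T$ recovers the singular values:
#Minimal sketch: recovering singular values manually from the eigenvalues of AA^T
A = np.random.rand(3, 5)
evalsU, Umanual = np.linalg.eigh(A @ A.T)             #eigh: eigendecomposition of a symmetric matrix
orderU = np.argsort(evalsU)[::-1]                     #sort in descending order
singvals = np.sqrt(np.clip(evalsU[orderU], 0, None))  #singular values = sqrt of eigenvalues
print(np.allclose(singvals, np.linalg.svd(A, compute_uv=False)))  #True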
SVD with numpy:
#The numpy function returns a list of the singular values, so we need to put them into S:
U, s, VT = np.linalg.svd(faces, compute_uv=True)
S = np.zeros(shape=(400,4096))
for i in range(400):
    S[i,i] = s[i]
Sanity check: Let's reconstruct the matrix $F$ using the formula above and the values returned by numpy, and check that the resulting images match those of the original dataset:
SVDTest = U@S@VT
face_0_SVD = SVDTest[0].reshape(64,64)
face_0_original = faces[0].reshape(64,64)
plot_images([face_0_SVD, face_0_original], 1, 2, titles=['From SVD', 'Original'], figsize=(8,8))
Math doesn't lie!
What's happening?
Recall that SVD can be expressed as a sum of rank 1 matrices:
$$A = \sigma_1 u_1 v_1^T + \sigma_2 u_2 v_2^T + \cdots + \sigma_r u_r v_r^T + \cdots + \sigma_n u_n v_n^T$$
As such, we can cut this sum off at any term, which is exactly what the demonstration above does. To build more conceptual understanding of what is going on, let's look at what the faces actually look like when we stop the sum at a given term.
The rank of 'faces' is 400. Let's look at what happens when we add more terms to the sum of rank 1 matrices, getting closer to the full rank:
SVDfaces = []
for i in range(0, 400, 50):
    SVDfaces.append((U[:, 0:i]@S[0:i, 0:i]@VT[0:i, :])[0].reshape(64,64))
titles = ["Face with %d s.v." %i for i in range(0, 400, 50)]
plot_images(SVDfaces, 2, 4, titles=titles, figsize=(10,5))
As you can see, the image already looks somewhat recognizable with only 50 singular values, and almost identical to the original with 200! This shows that the 'importance' of the singular values is not uniformly distributed: with just a few important descriptors of our data, we can capture the original dataset with high fidelity.
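We can see this dropoff directly by plotting the singular values themselves (a small addition to the original demo, sometimes called a 'scree plot'):
#Plotting the singular values to see how quickly their magnitude decays:
plt.figure(figsize=(8,4))
plt.semilogy(s)
plt.xlabel("Index")
plt.ylabel("Singular value (log scale)")
plt.title("Singular values of the faces dataset")
plt.show()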
If you're wondering how this translates into the real world, with some simple statistics we can turn SVD into an even more useful tool...
Data Science and Rudimentary Facial Reconstruction and Recognition (PCA)
We will now slightly adjust the original demonstration, and our goal changes as well: we'll use SVD for dimensionality reduction on a dataset and build a very rudimentary facial reconstruction and recognition pipeline.
Most (if not all) of the work ahead comes from Matthew Turk and Alex Pentland's 'Eigenfaces for Recognition', a paper I highly recommend you read!
The idea:
By decomposing our dataset of faces into its intrinsic components, which we'll call 'eigenfaces', we can express each face as a collection of 'weights': the coefficients we get from projecting the image onto a lower-dimensional 'face space'.
This in turn allows us to project new images onto this space and find the closest image to it in the dataset, making a prediction of whose face we have.
In practice:
We start by again collecting the 'faces' dataset (this step is not strictly necessary since 'faces' is already in scope, but it keeps things clear).
olivetti = sklearn.datasets.fetch_olivetti_faces()
faces = olivetti['data']
Next, we need to normalize the dataset: we compute the 'average' instance (here, a face) and subtract it from every row of the matrix. We do this so we can apply some statistical knowledge and tools later.
avgFace = np.average(faces, axis=0)
Let's take a look at what the 'average' face looks like in this dataset!
plt.figure(figsize=(5,5))
plt.imshow(avgFace.reshape(64,64), cmap='gray')
We now subtract it from all faces in the dataset:
normFaces = faces - avgFace
Let's take a look at what a 'normalized' face looks like:
plt.figure(figsize=(5,5))
plt.imshow(normFaces[0].reshape(64,64), cmap='gray')
We can now very simply compute the covariance matrix of the dataset. Call it $C$, where $C_{ij} = \mathrm{cov}(\text{pixel } i, \text{pixel } j) = \frac{1}{400} \sum_{k=1}^{400}(F_{ki}-\mu_i)(F_{kj}-\mu_j)$ and $\mu_i$ is the average value of pixel $i$ over the 400 faces. Since we already subtracted the average face, $C$ is simply proportional to $F^TF$, convenient!
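As a quick check of that claim (a small addition, not in the original demo), we can compare a small block of $F^TF/400$ against numpy's own covariance routine:
#Sanity check on a few pixel columns: F^T F / 400 should match np.cov (bias=True divides by N):
block = normFaces[:, :5]   #first 5 pixel columns of the mean-subtracted dataset
print(np.allclose(block.T @ block / 400, np.cov(faces[:, :5].T, bias=True)))  #True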
We now compute the eigendecomposition of the covariance matrix $F^TF$ (since it is symmetric, this gives us the same information as its SVD):
Cov = normFaces.T@normFaces
eigvals, eigvecs = np.linalg.eig(Cov)   #np.linalg.eigh would be faster here, since Cov is symmetric
This time we're doing the decomposition by hand (note how much slower this is!). In fact, what we're doing is known as PCA: Principal Component Analysis.
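For reference (a small aside, not used below), scikit-learn packages this same computation, mean-centering, decomposition, and sorting, into one class:
#Sketch: the same eigenfaces via scikit-learn's PCA; components_ rows are the v_i's, already sorted
from sklearn.decomposition import PCA
pca = PCA(n_components=200)
pca.fit(faces)
#pca.components_ has shape (200, 4096): the top 200 eigenfaces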
The next step is to sort the eigenvectors of the covariance matrix by their corresponding eigenvalues in descending order:
order = np.argsort(eigvals)[::-1]
sorted_eigvals = eigvals[order]
sorted_eigvecs = eigvecs[:, order]
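Since the covariance matrix is symmetric, its eigenvectors should form an orthonormal basis; a quick check (another small addition) confirms this, and it's what lets us treat projections as simple dot products below:
#The leading eigenvectors should be orthonormal: V^T V close to the identity
Vtop = sorted_eigvecs.real[:, :400]               #the 400 leading eigenvectors
print(np.abs(Vtop.T @ Vtop - np.eye(400)).max())  #should be tiny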
Recall that the principal components are the $v_i$'s. Let's look at what they actually look like:
eigvecs.shape
(4096, 4096)
eigtitles = ["Eigenface %d" %i for i in range(4096)]
plot_portraits(sorted_eigvecs.real.T, 6, 10, eigtitles, 64, 64)
This gives us a very interesting view of what is going on when we do PCA on a dataset. We are expressing the instances of the original dataset as linear combinations of the $v_i$'s, in our case, the eigenfaces:
$$\text{face} = f = (f^T v_1) v_1 +\cdots + (f^T v_n) v_n$$
That means we can find out how an image in the faces dataset breaks down into eigenfaces. We do this by projecting the image onto the subspace spanned by the eigenfaces to get the coefficients of the linear combination. Combining the eigenfaces into a single matrix $E$, whose rows are the eigenfaces, we get
$$Ef = (f^T v_1,\ldots, f^T v_n)$$
a vector of the coefficients used in the linear combination.
Let's do another sanity check, this time explicitly extracting all the coefficients and multiplying each one by its corresponding eigenface:
E = sorted_eigvecs.T
coeffs0 = E@faces[0]
testReconstruction = np.zeros(shape=(4096))
for i in range(4096):
    testReconstruction += coeffs0[i]*E[i]
plt.figure(figsize=(5,5))
plt.imshow(testReconstruction.reshape(64,64), cmap='gray')
We have seen before that we can cut this sum at any point. Indeed, if we stop adding terms after 200 principal components, for example, we get:
testReconstruction_200 = np.zeros(shape=(4096))
for i in range(200):
    testReconstruction_200 += coeffs0[i]*E[i]
plt.figure(figsize=(5,5))
plt.imshow(testReconstruction_200.reshape(64,64), cmap='gray')
Now, nothing is stopping us from using a new, completely different image! This is where we can really begin to have some fun with image reconstruction. Let's project our own picture onto the 'eigenfaces' and see what we get!
myCoeffs = E@scaledFaceNormalized.reshape(4096)
Let's take a look...
myCoeffs
array([-38.57019476, 11.10955009, 8.2167536 , ..., -0.10252883, 0.10202647, 0.06904295])
myReconstruction = np.zeros(4096)
#We can project the original image with simpler matrix multiplications, but let's be explicit and see exactly what we're doing:
for i in range(4096):
    myReconstruction += myCoeffs[i]*E[i]
plt.figure(figsize=(5,5))
plt.imshow(myReconstruction.reshape(64,64), cmap='gray')
This is pretty amazing! In fact, the reconstruction error between the reconstructed image and the original is only
np.linalg.norm(myReconstruction-scaledFaceNormalized.flatten())
3.0069485983971723e-06
This number is tiny! That makes sense: with all 4096 eigenfaces we have a full orthonormal basis of $\mathbb{R}^{4096}$, so projecting onto the 'face space' and reconstructing recovers the image exactly, up to floating point error.
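To put that number in scale (a small addition), we can compare it to the norm of the image itself:
#Relative reconstruction error: should be on the order of machine precision
relError = np.linalg.norm(myReconstruction - scaledFaceNormalized.flatten()) / np.linalg.norm(scaledFaceNormalized)
print(relError)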
Let's look at what happens when we don't use all the components, though:
components = np.linspace(1, 4096, 12, dtype=int)
reconstructed_images = []
for comp in components:
    reconstruction = E[:comp].T @ myCoeffs[:comp]   #more efficient matrix multiplication
    reconstructed_images.append(reconstruction.reshape(64,64))
titles = ["Reconstructed with %d components" % comp for comp in components]
plot_images(reconstructed_images, 3, 4, titles=titles, figsize=(15,10))
We can see that it takes a high number of components to get a good representation of the original image.
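We can quantify this (a small addition to the demo) by plotting the reconstruction error against the number of components we keep:
#Reconstruction error versus number of components kept:
errors = [np.linalg.norm(E[:c].T @ myCoeffs[:c] - scaledFaceNormalized.flatten())
          for c in components]
plt.figure(figsize=(8,4))
plt.plot(components, errors, marker='o')
plt.xlabel("Number of components")
plt.ylabel("Reconstruction error")
plt.show()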
We can perform rudimentary recognition by finding the face in the dataset whose projection is closest to our projected image, i.e. the $v$ minimizing
$$\lVert Ev - Ef \rVert$$
Since the eigenfaces are orthonormal, we can make our lives easier and compare the coefficient vectors directly. We first need to collect the coefficients of every face in the dataset:
coeffsMatrix = E@normFaces.T
#For a fair comparison, we project the mean-subtracted version of our image,
#since the dataset coefficients above come from the mean-subtracted faces:
myCoeffsCentered = E@(scaledFaceNormalized.reshape(4096) - avgFace)
#Now, find the face in the dataset whose coefficient vector is closest to ours:
distances = np.linalg.norm(coeffsMatrix - np.reshape(myCoeffsCentered, (4096,1)), axis=0)
closestFaceIndex = np.argmin(distances)
# Let's see the closest face in the dataset to our image
plt.figure(figsize=(5,5))
plt.imshow(faces[closestFaceIndex].reshape(64,64), cmap='gray')
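The Olivetti dataset also ships with subject labels (40 people, 10 images each), so we can see which subject was matched:
#fetch_olivetti_faces also returns integer labels in 'target' (subject ids 0-39):
print("Closest match is subject", olivetti['target'][closestFaceIndex])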
Well, we can see that this is not very good, but keep in mind that this dataset is tiny compared to what is usually used in the real world. It is also worth noting that the 400 faces in it come from only 40 people (mostly white men), so its representativeness isn't great. Even with this in mind, it is amazing to see just how powerful PCA is: we were able to reconstruct a face not present in the original dataset fairly decently (all things considered) with just a handful of principal components.
I hope you have enjoyed this demo and that it sets you on a voyage of discovery through the many more advanced algorithms in data science! I also hope it has helped you develop some intuition for the topic. Happy studying!