MODULE 1: MAKING SENSE OF UNSTRUCTURED DATA¶
CASE STUDY - FACE IDENTIFICATION¶
Faculty Name: Stefanie Jegelka
In this document, we walk through some helpful tips to get you started with building your own application for classifying faces in photo images using Principal Component Analysis (PCA).
Importing libraries¶
# Connect to Google Drive
from google.colab import drive
drive.mount('/content/drive/')
Mounted at /content/drive/
import os
os.chdir('/content/drive/MyDrive/Colab Notebooks/Case Study - Face Identification')
import numpy as np
from glob import glob
from PIL import Image
import matplotlib.pyplot as plt
import copy
!pip install utils
import utils
Image Dataset¶
You are encouraged to try this example using your own collection of images. You should save each image separately and they should all have the following characteristics:
- The face should cover a large section of the image area.
- As much as possible, the person in the image should be looking directly at the camera.
For reference, we provide the images of the instructors of this course. These images are all in jpg format and named “1.jpg”, “2.jpg”, …, “14.jpg”. Ensure that they are placed in a directory called “instructors”.
Because the raw images come in different dimensions and in RGB format, we need to pre-process them so that they all share the same dimensions and are converted to grayscale.
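The helper function utils.loadFaces takes care of this pre-processing for you. Purely as an illustration of the idea (not the actual implementation), converting an image to grayscale and resizing it with PIL could look like the sketch below, where the 300 x 300 target size is an assumption based on the reshape used later in this notebook:
# Illustrative sketch only: utils.loadFaces performs the actual pre-processing.
# The 300 x 300 size is an assumption based on the reshape used later in this notebook.
from PIL import Image
import numpy as np

def preprocess_face(path, size=(300, 300)):
    img = Image.open(path).convert('L')  # convert RGB to grayscale
    img = img.resize(size)               # resize to a common shape
    return np.asarray(img)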
# Number of images in the training set
M = 14

# Read the images (jpg); S will store all the faces
# Ensure the "instructors" folder is in the same directory and has not been moved
S, all_faces = utils.loadFaces('instructors/')
grid_im = utils.gray_images_square_grid(np.array(all_faces))
plt.imshow(grid_im, cmap='gray')
<matplotlib.image.AxesImage at 0x7de532ae8160>
The images of the instructors are loaded in grayscale.
Steps in PCA¶
1: Standardize the data¶
PCA works by maximizing variance: it projects the original data onto the directions along which the variance is largest. We should standardize the variables before applying PCA because, otherwise, variables with high variances dominate variables with very low variances when the principal components are identified. Once the data are standardized, all variables have the same standard deviation, so they carry equal weight and PCA finds the relevant axes.
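As a small standalone illustration (not part of the face pipeline), standardizing a toy data matrix with NumPy looks like this:
import numpy as np

# Toy data: 5 samples, 3 features on very different scales
X = np.array([[170.0, 65.0, 0.2],
              [160.0, 70.0, 0.5],
              [180.0, 80.0, 0.1],
              [175.0, 60.0, 0.9],
              [165.0, 75.0, 0.4]])

# Standardize: zero mean and unit standard deviation per feature (column)
X_std = (X - X.mean(axis=0)) / X.std(axis=0)
print(X_std.mean(axis=0))  # approximately 0 for every feature
print(X_std.std(axis=0))   # 1 for every feature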
2: Calculate the Covariance Matrix¶
Variance and covariance measure the spread of data around the mean. For PCA, we need to study the relationships between the variables in the dataset so that we can create new variables which reduce the number of original ones without losing the information they contain; these new variables are formed from the correlations between the original variables. A covariance matrix expresses these relationships: the covariance between two variables (for example, discount and number of sales) tells us whether they vary together, and the covariance of a variable with itself is simply its variance.
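Continuing the toy example above, the covariance matrix can be computed directly with NumPy:
# Covariance matrix of the standardized toy data (features are columns, hence rowvar=False)
cov = np.cov(X_std, rowvar=False)
print(cov.shape)  # (3, 3): one row and one column per feature
# For standardized data this is equivalent to X_std.T @ X_std / (n_samples - 1)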
3: Compute Eigenvalues and Eigenvectors of the covariance matrix¶
The covariance matrix we have calculated is then decomposed into eigenvalues and eigenvectors. Eigenvectors are vectors whose direction does not change when the linear transformation is applied to them; they are only scaled up or down. The factor by which an eigenvector is scaled is called its eigenvalue, usually denoted by lambda.
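Still with the toy example, np.linalg.eig decomposes the covariance matrix, and we can verify the defining property C v = lambda v for each eigenpair:
eigen_values, eigen_vectors = np.linalg.eig(cov)

# Each column of eigen_vectors is an eigenvector; check that C @ v equals lambda * v
for i in range(len(eigen_values)):
    v = eigen_vectors[:, i]
    assert np.allclose(cov @ v, eigen_values[i] * v)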
4: Selecting the Number of Components using Explained Variance¶
The goal is to reduce a d-dimensional dataset by projecting it onto a k-dimensional subspace, increasing computational efficiency while retaining most of the information. So the important question is: what value of k represents the data well? Having obtained the eigenvalues and eigenvectors, we look for the number of components k that explains the maximum amount of variance.
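One common way to choose k, shown here on the toy example, is the cumulative explained variance (the face pipeline later in this notebook instead keeps every eigenvector whose eigenvalue exceeds a small threshold):
# Sort eigenvalues in descending order and compute the explained-variance ratio
order = np.argsort(eigen_values)[::-1]
sorted_vals = eigen_values[order]
explained_ratio = sorted_vals / sorted_vals.sum()
cumulative = np.cumsum(explained_ratio)

# Smallest k that explains at least 95% of the variance (95% is a common choice, not a rule)
k = int(np.searchsorted(cumulative, 0.95) + 1)
print(explained_ratio, cumulative, k)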
5: Projecting the data into lower dimensions¶
The last step is to re-express the original data in the low-dimensional space of the selected principal components, which capture the most significant information in the dataset. To replace the original data axes with the newly formed principal components, you simply multiply the standardized data by the matrix whose columns are the selected eigenvectors.
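Continuing the toy example, the projection is a single matrix product between the standardized data and the top-k eigenvectors, and multiplying back by their transpose gives an approximate reconstruction:
# Keep the k eigenvectors with the largest eigenvalues (as columns)
W = eigen_vectors[:, order[:k]]

# Project the standardized data onto the k-dimensional subspace
X_reduced = X_std @ W
print(X_reduced.shape)  # (n_samples, k)

# Approximate reconstruction back in the standardized feature space
X_approx = X_reduced @ W.T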
Computing Eigenfaces¶
In order to compute all Eigenfaces, we need to perform several processing steps.
We first need to normalize each image. Note that the normalized, square, grayscale images are saved in the same location as the script and will be reused several times. (A conceptual sketch of these helper steps follows the list below.)
Compute a Mean (Average) face from all the normalized faces.
Now, we can compute the Eigenfaces (Eigenvectors).
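The helpers utils.normalizeImages and utils.computeAverageFace are provided with the course material, so their exact implementation is not shown here. Conceptually (this is only a sketch of the idea, not the provided code), they do something like the following:
# Conceptual sketch only; the notebook uses the provided utils functions.
import numpy as np

def normalize_images_sketch(S):
    # S: list of flattened grayscale face images (one vector per face)
    out = []
    for img in S:
        img = np.asarray(img, dtype=float)
        out.append((img - img.mean()) / (img.std() + 1e-8))  # zero mean, unit variance
    return out

def compute_average_face_sketch(S):
    # Element-wise mean over all normalized face vectors
    return np.mean(np.asarray(S), axis=0)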
The function computeEigenFaces(S) below takes all of the normalized images (S) as input. Earlier, the images were stored in a list; here they are converted into a NumPy array and stored in the variable dbx.
In PCA, once the data are normalized, the next step is to calculate the covariance matrix, i.e. the data matrix multiplied by its transpose. We use np.matmul to compute the product of A and A transpose; because A has one row per image, this produces a small matrix (number of images by number of images) whose eigenvectors can later be mapped back to eigenvectors of the full pixel covariance.
After calculating the covariance matrix, the next step is to compute its eigenvalues and eigenvectors, which can be done with np.linalg.eig. This function takes the covariance matrix as input and returns both the eigenvalues and the eigenvectors.
Next, we do not need all of the eigenvectors; we keep only the few that explain the maximum amount of variance. The selection is based on a threshold of 1e-4 (which you may change according to your requirements): we keep the eigenvectors whose eigenvalues are greater than the threshold. This fixes the number of eigenvalues and eigenvectors we consider.
The next step maps the selected eigenvectors back into image space to obtain the eigenfaces: each one is the product of the transposed data (dbx) and an eigenvector (v), and the results are stored in a list. The last block of code normalizes each of these eigenfaces to unit length.
The following code computes all the components needed to build the Eigenfaces, then saves them (under the directory “eigenfaces”) and displays them:¶
def computeEigenFaces(S):
    dbx = np.array(S)  # convert the list of normalized images into a NumPy array
    A = dbx  # note that dbx here is transposed compared to the original MATLAB script

    # Covariance matrix trick: C = A'A is huge (pixels x pixels), so we work with
    # the much smaller L = AA' (images x images) and map its eigenvectors back later
    covariance_matrix = np.matmul(A, A.T)
    A = None

    # Compute the eigenvalues and eigenvectors of the (small) covariance matrix
    eigen_values, eigen_vectors = np.linalg.eig(covariance_matrix)

    # Eliminate components whose eigenvalue is small, based on the threshold
    nonzero_eigenvals = eigen_values > 1e-4
    v = eigen_vectors[:, nonzero_eigenvals]
    d = eigen_values[nonzero_eigenvals]

    # np.linalg.eig does not guarantee any ordering, so sort the eigenvalues
    # (and the matching eigenvectors) in descending order
    order = np.argsort(d)[::-1]
    d = d[order]
    v = v[:, order]

    # Map each small-matrix eigenvector back into image space to get an eigenface;
    # dividing by sqrt(eigenvalue) rescales the result
    u = []
    for i in range(len(d)):
        temp = np.sqrt(d[i])
        u.append(np.matmul(dbx.T, v[:, i]) / temp)

    # Normalize each eigenface to unit length
    for i in range(len(u)):
        kk = u[i]
        temp = np.sqrt(np.sum(np.square(kk)))
        u[i] = u[i] / temp

    return u
Processing and Visualization¶
# Normalize the images
S = utils.normalizeImages(S)
# Compute average face
avg_face = utils.computeAverageFace(S)
# Call the function defined above, which returns the eigenfaces
EigenFaces = computeEigenFaces(S)
# Now render the eigenfaces
EigenFacesIm = []
# Make sure the output directory exists before saving
os.makedirs('eigenfaces', exist_ok=True)
# Visualizing the eigenfaces
for i in range(len(EigenFaces)):
    img = np.reshape(EigenFaces[i], (300, 300))
    img = img.T
    # Scale the image to the 0-255 range
    img = utils.convertImageToU8bit(img)
    # Convert and save
    im = Image.fromarray(img)
    im.convert('RGB').save('eigenfaces/eigen_{}.jpeg'.format(i + 1))
    EigenFacesIm.append(img)
_, eigen_faces = utils.loadFaces('./eigenfaces/')
grid_im = utils.gray_images_square_grid(np.array(eigen_faces))
plt.imshow(grid_im, cmap='gray')
<matplotlib.image.AxesImage at 0x7de521209540>
Reconstruct Image from EigenFaces¶
Given an unknown face new_image.jpg, we first need to preprocess and normalize it. We can then reconstruct the face using the eigenfaces: each face is just a weighted combination of the eigenfaces, and we obtain the weights by multiplying the normalized image with the eigenfaces.
Finally, to reconstruct the face, we multiply the weights by the eigenfaces and add the mean face.
Save the image you want to test as new_image.jpg in the working directory; it should have the same dimensions as the training images (300 x 300) so that it can be combined with the mean face.
def reconstructNewFaces(u, mean_face, input_image='new_image.jpg'):
    eigen_face = np.array(u)
    # Read the input image and convert it to grayscale
    im = Image.open(input_image)
    InputImage = im.convert('L')
    # Convert to a NumPy array
    im_raw = np.asarray(InputImage)
    # Reshape the image into a vector
    InImage = np.reshape(im_raw.T, im_raw.shape[0] * im_raw.shape[1])
    # Normalize the vector
    temp = InImage
    me = np.mean(temp)
    st = np.std(temp)
    temp = (temp - me) * st / (st + me)
    NormImage = temp
    # Obtain the weights by projecting the normalized image onto the eigenfaces
    weights = np.matmul(eigen_face, NormImage.T)
    # To reconstruct the face, combine the eigenfaces using the weights and add the mean face
    ReshapedImage = mean_face + np.matmul(weights, eigen_face)
    # Convert back to the original image shape
    ReshapedImage = np.reshape(ReshapedImage, im_raw.shape)
    ReshapedImage = ReshapedImage.T
    return ReshapedImage
Show Reconstructed Image¶
ReshapedImage = reconstructNewFaces(EigenFaces, avg_face, 'new_image.jpg')
# Show the reconstructed image.
ReshapedImage_s = utils.convertImageToU8bit(ReshapedImage)
ReshapedImage_s = Image.fromarray(ReshapedImage_s)
ReshapedImage_s.show()
We have created eigenfaces from the dataset of images of the faculty of this program. The resulting reconstruction is not perfectly clear, but it is able to capture patterns in the images.
# Convert notebook to html
!jupyter nbconvert --to html "/content/drive/My Drive/Colab Notebooks/Copy of FDS_Project_LearnerNotebook_FullCode.ipynb"