In [1]:
%matplotlib inline
from IPython import display
import numpy as np
import matplotlib.pyplot as plt
import seaborn as sn
sn.set(style='whitegrid')

PCA to obtain Eigenfaces

In [2]:
from sklearn.datasets import fetch_lfw_people
faces = fetch_lfw_people(min_faces_per_person=60)
print(faces.target_names)
print(faces.images.shape)
['Ariel Sharon' 'Colin Powell' 'Donald Rumsfeld' 'George W Bush'
 'Gerhard Schroeder' 'Hugo Chavez' 'Junichiro Koizumi' 'Tony Blair']
(1348, 62, 47)
In [4]:
62*47  # number of pixels per image, i.e. the feature dimension M
Out[4]:
2914
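The relationship between `faces.images` (shape `(1348, 62, 47)`) and the flattened feature matrix `faces.data` (shape `(1348, 2914)`) is just a row-wise reshape. A minimal sketch, using a small random array as a stand-in for the LFW images so no download is needed:

```python
import numpy as np

# Stand-in for faces.images: 5 images of 62 x 47 pixels (random data,
# since the real LFW download is not assumed here).
images = np.random.rand(5, 62, 47)

# fetch_lfw_people exposes the same pixels flattened in .data;
# ravel() reproduces that layout for a single image.
data = images.reshape(5, 62 * 47)
print(data.shape)                                   # (5, 2914)
print(np.array_equal(data[0], images[0].ravel()))   # True
```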
In [5]:
# show a sample of the face images (every 100th image)
fig, ax = plt.subplots(figsize=(3, 3))
for n in range(0, faces.images.shape[0], 100):
    I = faces.images[n, :, :]   # already 62 x 47; no reshape needed
    ax.imshow(I, cmap='gray')    
    ax.axis('off')
    ax.set_title(faces.target_names[faces.target[n]])
    plt.draw()
    display.clear_output(wait=True)
    display.display(fig)
    plt.pause(0.1) 

There are faster methods for PCA, such as the randomized SVD solver (svd_solver='randomized') or IncrementalPCA
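For datasets too large to decompose in one pass, IncrementalPCA fits on mini-batches so the full matrix never has to sit in memory at once. A minimal sketch, using random data of the same width as `faces.data` as a stand-in:

```python
import numpy as np
from sklearn.decomposition import IncrementalPCA

# Synthetic stand-in for faces.data (the real array is 1348 x 2914).
X = np.random.rand(400, 2914)

# partial fits on batches of 100 rows instead of one full SVD
ipca = IncrementalPCA(n_components=50, batch_size=100)
ipca.fit(X)
print(ipca.components_.shape)  # (50, 2914)
```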

In [6]:
from sklearn.decomposition import PCA
pca = PCA(n_components=150, svd_solver='randomized')
# alternative: keep just enough components to explain 90% of the variance
# pca = PCA(n_components=0.9)
pca.fit(faces.data)
Out[6]:
PCA(n_components=150, svd_solver='randomized')
In [7]:
pca.components_.shape
Out[7]:
(150, 2914)
In [8]:
fig, ax = plt.subplots(1, 1, figsize=(3, 2))
ax.imshow(pca.mean_.reshape(62, 47), cmap='gray')
ax.axis('off')
ax.set_title('mean face', fontsize=16)
Out[8]:
Text(0.5, 1.0, 'mean face')

In this case, it can be interesting to visualize the images associated with the first several principal components (these components are technically known as "eigenvectors," so these types of images are often called "eigenfaces"). As you can see in this figure, they are as creepy as they sound:

In [9]:
fig, axes = plt.subplots(3, 8, figsize=(9, 4),
                         subplot_kw={'xticks':[], 'yticks':[]},
                         gridspec_kw=dict(hspace=0.1, wspace=0.1))
for i, ax in enumerate(axes.flat):
    ax.imshow(pca.components_[i].reshape(62, 47), cmap='gray')

The results are very interesting, and give us insight into how the images vary: for example, the first few eigenfaces (from the top left) seem to be associated with the angle of lighting on the face, and later principal vectors seem to be picking out certain features, such as eyes, noses, and lips. Let's take a look at the cumulative variance of these components to see how much of the data information the projection is preserving:

In [10]:
plt.plot(np.cumsum(pca.explained_variance_ratio_))
plt.xlabel('number of components')
plt.ylabel('cumulative explained variance');

We see that these 150 components account for just over 90% of the variance. That would lead us to believe that using these 150 components, we would recover most of the essential characteristics of the data. To make this more concrete, we can compare the input images with the images reconstructed from these 150 components:
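The cumulative-variance curve can also be read off numerically to find the smallest number of components reaching a given threshold; passing a float to `PCA(n_components=0.9)` does the same selection automatically. A minimal sketch on random stand-in data:

```python
import numpy as np
from sklearn.decomposition import PCA

# Synthetic stand-in for faces.data.
X = np.random.rand(300, 100)

pca = PCA().fit(X)
cumvar = np.cumsum(pca.explained_variance_ratio_)

# smallest k such that the first k components explain >= 90% of the variance
k = np.searchsorted(cumvar, 0.90) + 1
print(k, cumvar[k - 1] >= 0.90)
```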

In [11]:
# Compute the components and projected faces
components = pca.transform(faces.data)
projected = pca.inverse_transform(components)
In [12]:
# Plot the results
fig, ax = plt.subplots(2, 10, figsize=(10, 2.5),
                       subplot_kw={'xticks':[], 'yticks':[]},
                       gridspec_kw=dict(hspace=0.1, wspace=0.1))
for i in range(10):
    ax[0, i].imshow(faces.data[i].reshape(62, 47), cmap='binary_r')
    ax[1, i].imshow(projected[i].reshape(62, 47), cmap='binary_r')
    
ax[0, 0].set_ylabel('full-dim\ninput')
ax[1, 0].set_ylabel('150-dim\nreconstruction');

The top row here shows the input images, while the bottom row shows the reconstruction of the images from just 150 of the 2914 initial features/pixels. Although the dimensionality of the data is reduced from 2914 to 150, the projected images contain enough information that we can still, by eye, recognize the individuals in the images. The principal components are the new features, better than the raw pixels.
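Under the hood, `inverse_transform` is just the linear map back from component space: it multiplies the scores by the component matrix and adds the mean face. A minimal sketch verifying this identity on random stand-in data (with the default `whiten=False`):

```python
import numpy as np
from sklearn.decomposition import PCA

X = np.random.rand(200, 50)
pca = PCA(n_components=10).fit(X)

scores = pca.transform(X)              # (200, 10) coordinates in PC space
recon = pca.inverse_transform(scores)  # back to the original 50-dim space

# inverse_transform is equivalent to: mean + scores @ components
manual = pca.mean_ + scores @ pca.components_
print(np.allclose(recon, manual))      # True
```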

Use PCA to generate images

In [13]:
# use two components (indices 4 and 5)
w0 = pca.components_[4, :]
w1 = pca.components_[5, :]
lambda0 = pca.explained_variance_[4]   # variance along w0
lambda1 = pca.explained_variance_[5]   # variance along w1
meanface = pca.mean_
# generate some new face images
fig, ax = plt.subplots(figsize=(3, 3))
for n in range(0, 100):
    # sample each coefficient from N(0, lambda_i)
    I = meanface + np.random.randn()*np.sqrt(lambda0)*w0 + np.random.randn()*np.sqrt(lambda1)*w1
    I = I.reshape(62,47)  
    ax.imshow(I, cmap='gray')    
    ax.axis('off')
    ax.set_title('new face')
    plt.draw()
    display.clear_output(wait=True)
    display.display(fig)
    plt.pause(0.1) 
In [14]:
# use all of the 150 components
W = pca.components_ * np.sqrt(pca.explained_variance_.reshape(150, 1))  # scale each row by sqrt(lambda_i)
meanface = pca.mean_
# generate some new face images
fig, ax = plt.subplots(figsize=(3, 3))
for n in range(0, 100):
    y = np.random.randn(150, 1)   # one standard-normal coefficient per component
    temp = (W * y).sum(axis=0)    # weighted sum of the scaled components
    I = meanface + temp
    I = I.reshape(62,47)  
    ax.imshow(I, cmap='gray')    
    ax.axis('off')
    ax.set_title('new face')
    plt.draw()
    display.clear_output(wait=True)
    display.display(fig)
    plt.pause(0.2) 
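The generation loop above can also be vectorized: sampling all coefficients at once produces a whole batch of faces in a single matrix product. A minimal sketch, with random data standing in for `faces.data`:

```python
import numpy as np
from sklearn.decomposition import PCA

# Synthetic stand-in for faces.data (real shape: 1348 x 2914).
X = np.random.rand(300, 2914)
pca = PCA(n_components=150, svd_solver='randomized').fit(X)

# sample 10 faces at once: z ~ N(0, I), each component scaled by sqrt(lambda_i)
z = np.random.randn(10, 150)
new_faces = pca.mean_ + z @ (np.sqrt(pca.explained_variance_)[:, None] * pca.components_)
print(new_faces.shape)  # (10, 2914): each row reshapes to a 62 x 47 image
```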
In [ ]: