https://variationalform.github.io/
https://github.com/variationalform
Simon Shaw https://www.brunel.ac.uk/people/simon-shaw.
This work is licensed under CC BY-SA 4.0 (Attribution-ShareAlike 4.0 International). Visit http://creativecommons.org/licenses/by-sa/4.0/ to see the terms.
This document uses python, and also makes use of LaTeX in Markdown.
As usual our emphasis will be on doing rather than proving: just enough: progress at pace
For this worksheet you are recommended Chapters 4 and 10 of [MML], Chapter 10 of [MLFCES], and Chapter 5.3 of [IPDS].
These can be accessed legally and without cost.
There are also these useful references for coding:
python: https://docs.python.org/3/tutorial
numpy: https://numpy.org/doc/stable/user/quickstart.html
matplotlib: https://matplotlib.org

We have seen these before.
Let's review them...
Given a real square symmetric $n$-row by $n$-column matrix, $\boldsymbol{A}\in\mathbb{R}^{n\times n}$, the eigenvalue problem is that of finding scalar eigenvalues $\lambda$ and $n$-dimensional eigenvectors $\boldsymbol{v}$ such that
$$ \boldsymbol{A}\boldsymbol{v}=\lambda\boldsymbol{v} \quad\Longrightarrow\quad \boldsymbol{A}\boldsymbol{V}=\boldsymbol{V}\boldsymbol{D} \quad\Longrightarrow\quad \boldsymbol{A} = \sum_{k=1}^n \lambda_k\boldsymbol{v}_k\boldsymbol{v}_k^T. $$

The eigensystem is real. We have the Spectral Theorem - see [MML, Theorem 4.15].

Spectral Theorem (for matrices): If $\boldsymbol{A}$ is real and symmetric then its eigenvalues are all real and its eigenvector matrix $\boldsymbol{V}$ can be taken as orthogonal so that $\boldsymbol{V}^{-1}=\boldsymbol{V}^T$. Hence

$$ \boldsymbol{A}=\boldsymbol{V}\boldsymbol{D}\boldsymbol{V}^T. $$
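We can check this numerically. Here is a minimal sketch in numpy; the symmetric matrix A below is just an arbitrary example.

import numpy as np

# an arbitrary real symmetric matrix (chosen only for illustration)
A = np.array([[2.0, 1.0, 0.0],
              [1.0, 3.0, 1.0],
              [0.0, 1.0, 2.0]])

# eigh is designed for symmetric matrices: real eigenvalues, orthogonal V
lmda, V = np.linalg.eigh(A)
D = np.diag(lmda)

# check the spectral decomposition A = V D V^T and the orthogonality of V
print(np.allclose(A, V @ D @ V.T))      # True
print(np.allclose(V.T @ V, np.eye(3)))  # True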
Given a real $m$-row by $n$-column matrix, $\boldsymbol{B}\in\mathbb{R}^{m\times n}$, its singular value decomposition (SVD) is

$$ \boldsymbol{B} = \boldsymbol{U}\boldsymbol{\Sigma}\boldsymbol{V}^T =\sum_{j=1}^{p} \sigma_j \boldsymbol{u}_j\boldsymbol{v}_j^T $$

where: $\boldsymbol{U}\in\mathbb{R}^{m\times m}$ holds the left singular vectors; $\boldsymbol{\Sigma}\in\mathbb{R}^{m\times n}$ holds the singular values; and $\boldsymbol{V}\in\mathbb{R}^{n\times n}$ holds the right singular vectors. Here $p=\min\{m,n\}$.
Note that $\boldsymbol{\Sigma}$ is $\text{diag}(\sigma_1,\ldots,\sigma_p)$ padded with zeros to the $m\times n$ shape, and we can always arrange the ordering so that $\sigma_1\ge\cdots\ge\sigma_p\ge 0$.
As $\boldsymbol{B}$ is real, $\boldsymbol{U}$ and $\boldsymbol{V}$ are real and orthogonal.
If $\sigma_r\ne 0$ and $\sigma_k= 0$ for all $k>r$ then $r$ is the rank of $\boldsymbol{B}$.
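Here is a minimal numpy sketch of these facts; the rectangular matrix B below is just an illustrative example (its third column is the sum of the first two, so it has rank 2).

import numpy as np

# a 4x3 example matrix (illustrative only); third column = sum of first two
B = np.array([[1.0, 0.0, 1.0],
              [0.0, 1.0, 1.0],
              [1.0, 1.0, 2.0],
              [2.0, 0.0, 2.0]])

# full_matrices=True gives U (4x4) and V^T (3x3); Sig holds the p = min(m,n) singular values
U, Sig, VT = np.linalg.svd(B, full_matrices=True)
print('singular values:', Sig)

# rebuild Sigma as a 4x3 array of zeros with the singular values on the diagonal
Sigma = np.zeros(B.shape)
np.fill_diagonal(Sigma, Sig)
print(np.allclose(B, U @ Sigma @ VT))   # True

# the number of non-zero singular values is the rank
print('rank:', np.sum(Sig > 1e-12), '=', np.linalg.matrix_rank(B))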
On the face of it these two decompositions are very different: the first applies only to square symmetric matrices, while the second applies also to rectangular, and hence (why?) non-symmetric, matrices.
But... Look at this... Given the SVD $\boldsymbol{B} = \boldsymbol{U}\boldsymbol{\Sigma}\boldsymbol{V}^T$ we have,
$$ \boldsymbol{B}^T\boldsymbol{B} = \Big(\boldsymbol{U}\boldsymbol{\Sigma}\boldsymbol{V}^T\Big)^T \boldsymbol{U}\boldsymbol{\Sigma}\boldsymbol{V}^T $$and remembering that, in general, $(\boldsymbol{K}\boldsymbol{L})^T = \boldsymbol{L}^T\boldsymbol{K}^T$ (this could be called taking the transpose through), we can write,
$$ \boldsymbol{B}^T\boldsymbol{B} = \boldsymbol{V}\boldsymbol{\Sigma}^T\boldsymbol{U}^T \boldsymbol{U}\boldsymbol{\Sigma}\boldsymbol{V}^T = \boldsymbol{V}\boldsymbol{\Sigma}^T\boldsymbol{\Sigma}\boldsymbol{V}^T $$because $\boldsymbol{U}^T\boldsymbol{U}=\boldsymbol{I}$ (orthogonal).
Similarly, because also $\boldsymbol{V}^T\boldsymbol{V}=\boldsymbol{I}$ (orthogonal),
$$ \boldsymbol{B}\boldsymbol{B}^T = \boldsymbol{U}\boldsymbol{\Sigma}\boldsymbol{V}^T \Big(\boldsymbol{U}\boldsymbol{\Sigma}\boldsymbol{V}^T\Big)^T = \boldsymbol{U}\boldsymbol{\Sigma}\boldsymbol{V}^T \boldsymbol{V}\boldsymbol{\Sigma}^T\boldsymbol{U}^T = \boldsymbol{U}\boldsymbol{\Sigma} \boldsymbol{\Sigma}^T\boldsymbol{U}^T. $$Do you recognise these?
We have just shown that,
$$ \boldsymbol{B}^T\boldsymbol{B} = \boldsymbol{V}\boldsymbol{\Sigma}^T\boldsymbol{\Sigma}\boldsymbol{V}^T \qquad\text{ and }\qquad \boldsymbol{B}\boldsymbol{B}^T = \boldsymbol{U}\boldsymbol{\Sigma} \boldsymbol{\Sigma}^T\boldsymbol{U}^T. $$Familiar? Think about $\boldsymbol{A}=\boldsymbol{V}\boldsymbol{D}\boldsymbol{V}^T$.
The columns of $\boldsymbol{V}$, the right singular vectors in the SVD, are the eigenvectors of $\boldsymbol{B}^T\boldsymbol{B}$.
The columns of $\boldsymbol{U}$, the left singular vectors in the SVD, are the eigenvectors of $\boldsymbol{B}\boldsymbol{B}^T$.
In both cases $\boldsymbol{\Sigma}$ contains the singular values: the non-negative square roots of the eigenvalues of $\boldsymbol{B}^T\boldsymbol{B}$ and $\boldsymbol{B}\boldsymbol{B}^T$.
NOTE: $\boldsymbol{B}^T\boldsymbol{B}$ and $\boldsymbol{B}\boldsymbol{B}^T$ have the same non-zero eigenvalues (same rank).
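We can check this relationship numerically. A small sketch with an arbitrary 3-by-2 example matrix:

import numpy as np

B = np.array([[1.0, 2.0],
              [0.0, 1.0],
              [3.0, 1.0]])          # 3x2, so p = 2

U, Sig, VT = np.linalg.svd(B)

# eigenvalues of B^T B (2x2) and of B B^T (3x3), sorted in decreasing order
evals_BtB = np.sort(np.linalg.eigvalsh(B.T @ B))[::-1]
evals_BBt = np.sort(np.linalg.eigvalsh(B @ B.T))[::-1]

print('sigma^2    :', Sig**2)
print('eig(B^T B) :', evals_BtB)
print('eig(B B^T) :', evals_BBt)    # same non-zero values, plus a zero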
Our data, $\boldsymbol{X}$, is organized into rows of feature values with one observation per row and one feature per column. We write this as
$$ \boldsymbol{X} = \Big( \boldsymbol{X}_0, \boldsymbol{X}_1, \cdots, \boldsymbol{X}_D \Big) $$If $D=3$ (four features)...
... we recall that the covariance matrix takes this form:
$$ \boldsymbol{S} = \left(\begin{array}{llll} \mathrm{Var}(X_0) & \mathrm{Cov}(X_0,X_1) & \mathrm{Cov}(X_0,X_2) & \mathrm{Cov}(X_0,X_3) \\ \mathrm{Cov}(X_1,X_0) & \mathrm{Var}(X_1) & \mathrm{Cov}(X_1,X_2) & \mathrm{Cov}(X_1,X_3) \\ \mathrm{Cov}(X_2,X_0) & \mathrm{Cov}(X_2,X_1) & \mathrm{Var}(X_2) & \mathrm{Cov}(X_2,X_3) \\ \mathrm{Cov}(X_3,X_0) & \mathrm{Cov}(X_3,X_1) & \mathrm{Cov}(X_3,X_2) & \mathrm{Var}(X_3) \\ \end{array}\right) $$because $\mathrm{Cov}(X,X)=\mathrm{Var}(X)$. Since $\mathrm{Cov}(X,Y)=\mathrm{Cov}(Y,X)$, this matrix is symmetric and so has real eigenvalues.
We have seen that if the data are already centred then,
$$ (N-1)\boldsymbol{S} = \left(\begin{array}{llll} \boldsymbol{X}_0\cdot\boldsymbol{X}_0 & \boldsymbol{X}_0\cdot\boldsymbol{X}_1 & \boldsymbol{X}_0\cdot\boldsymbol{X}_2 & \boldsymbol{X}_0\cdot\boldsymbol{X}_3 \\ \boldsymbol{X}_1\cdot\boldsymbol{X}_0 & \boldsymbol{X}_1\cdot\boldsymbol{X}_1 & \boldsymbol{X}_1\cdot\boldsymbol{X}_2 & \boldsymbol{X}_1\cdot\boldsymbol{X}_3 \\ \boldsymbol{X}_2\cdot\boldsymbol{X}_0 & \boldsymbol{X}_2\cdot\boldsymbol{X}_1 & \boldsymbol{X}_2\cdot\boldsymbol{X}_2 & \boldsymbol{X}_2\cdot\boldsymbol{X}_3 \\ \boldsymbol{X}_3\cdot\boldsymbol{X}_0 & \boldsymbol{X}_3\cdot\boldsymbol{X}_1 & \boldsymbol{X}_3\cdot\boldsymbol{X}_2 & \boldsymbol{X}_3\cdot\boldsymbol{X}_3 \\ \end{array}\right) = \left(\begin{array}{l} \boldsymbol{X}_0^T \\ \boldsymbol{X}_1^T \\ \boldsymbol{X}_2^T \\ \boldsymbol{X}_3^T \\ \end{array}\right) \left(\begin{array}{llll} \boldsymbol{X}_0 & \boldsymbol{X}_1 & \boldsymbol{X}_2 & \boldsymbol{X}_3 \\ \end{array}\right) $$and, hence (in general), the (sample) covariance matrix for $N$ observations is
$$ \boldsymbol{S} = \frac{1}{(N-1)}\boldsymbol{X}^T\boldsymbol{X}. $$We just introduced the sample covariance matrix:
$$ \boldsymbol{S} = \frac{1}{(N-1)}\boldsymbol{X}^T\boldsymbol{X}. $$The $N-1$ in the denominator makes this an unbiased estimate of the population covariance. When $N$ is large we can just work with
$$ \boldsymbol{S} = \frac{1}{N}\boldsymbol{X}^T\boldsymbol{X} $$and call it the empirical covariance matrix.
This terminology is discussed in [MML, Section 6.4.2].
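As a sanity check, note that numpy's np.cov uses the unbiased $N-1$ denominator by default. A small sketch, using the centred toy data matrix that appears later in this worksheet:

import numpy as np

# a small centred data matrix: rows are observations, columns are features
X = np.array([[ 1.0,  2.0],
              [ 2.0,  1.0],
              [-2.0, -1.0],
              [-1.0, -2.0]])
N = X.shape[0]

S_sample    = X.T @ X / (N - 1)     # unbiased, sample covariance
S_empirical = X.T @ X / N           # empirical covariance

# np.cov expects variables in rows by default, so pass rowvar=False
print(np.allclose(S_sample, np.cov(X, rowvar=False)))   # True
print(S_empirical)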
We have now adopted a convention in which our data matrix $\boldsymbol{X}$ has one observation per row and one feature per column, so that:
$$ \boldsymbol{X} = \Big( \boldsymbol{X}_0, \boldsymbol{X}_1, \cdots, \boldsymbol{X}_D \Big) $$gives a data set with $D+1$ features. The common length of the column vectors $\boldsymbol{X}_0,\ \boldsymbol{X}_1,\ \ldots,\ \boldsymbol{X}_D$ (they must all be the same) tells us how many observations there are. We've been denoting this by $N$.
HOWEVER: in some sources this convention is transposed. Each feature occupies its own row of the matrix, with its observations recorded along that row (one observation per column).
This is the case in [MML]. It means that
$$ \boldsymbol{S} = \frac{1}{N}\boldsymbol{X}^T\boldsymbol{X} \qquad\text{for us, becomes}\qquad \boldsymbol{S} = \frac{1}{N}\boldsymbol{X}\boldsymbol{X}^T \qquad\text{for them} $$because our $\boldsymbol{X}$ is their $\boldsymbol{X}^T$.
BE CAREFUL: this transposed convention is not uncommon.
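A small sketch to illustrate that the two conventions describe the same covariance matrix; the data is just the toy example used later in this worksheet.

import numpy as np

# our convention: one observation per row, one feature per column
X_ours = np.array([[ 1.0,  2.0],
                   [ 2.0,  1.0],
                   [-2.0, -1.0],
                   [-1.0, -2.0]])
N = X_ours.shape[0]

# the transposed convention stores the same data with one feature per row
X_theirs = X_ours.T

S_ours   = X_ours.T @ X_ours / N        # our   S = X^T X / N
S_theirs = X_theirs @ X_theirs.T / N    # their S = X X^T / N

print(np.allclose(S_ours, S_theirs))    # True - the same covariance matrix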
Let's say there are $D+1$ features (columns) in our data set $\boldsymbol{X}$ and $N$ observations (rows).
An observation takes the form $\boldsymbol{x}_j = (x_{j0}, x_{j1}, \ldots, x_{jD})^T$, a column vector of the $D+1$ feature values, for $j=1,2,\ldots,N$.
Hence,
$$ \boldsymbol{X} = \Big( \boldsymbol{X}_0, \boldsymbol{X}_1, \cdots, \boldsymbol{X}_D \Big) = \Big( \boldsymbol{x}_1, \boldsymbol{x}_2, \cdots, \boldsymbol{x}_N \Big)^T $$Note: we are using upper case $\boldsymbol{X}_k$ for a column vector of observations of a feature (in the column indexed by $k$), and lower case, $\boldsymbol{x}_j$, for a feature vector arising from a single observation (in the row indexed by $j$).
We only use column vectors in these notes.
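In numpy terms, with the toy data matrix used later in this worksheet, that notation looks like this (a small illustrative sketch):

import numpy as np

X = np.array([[ 1,  2],
              [ 2,  1],
              [-2, -1],
              [-1, -2]])

# upper case X_k: all observations of feature k (a column of X)
X0 = X[:, [0]]          # shape (4, 1) - kept as a column vector
print('feature column X_0:\n', X0)

# lower case x_j: one observation as a (column) feature vector
x1 = X[[1], :].T        # shape (2, 1) - row 1 of X, transposed to a column
print('observation x_1:\n', x1)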
The main idea and motivation behind this is that high dimensional data often lives very close to a lower dimensional subspace.
A typical and often used example of this is that in Figure 10.1 of [MML, Chap. 10].
We can see that here: https://mml-book.github.io.
PCA will analyze a data set and determine the direction in which most variation occurs. If we are to approximate the data using a lower dimensional space then this is a good direction (subspace component) to start with.
Technically, PCA determines directions which maximize variance.
Let's go through this slowly - it can be quite confusing.
Take our $N$-row by $D$-column data set $\boldsymbol{X}$ (we now write $D$ for the number of features) and ensure that the column means are zero.
This is referred to as centering the data.
It means that $\mathbb{E}(\boldsymbol{X}_d)=0$ for columns $d=0,1,2,\ldots,D-1$.
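Centering is a one-line operation in numpy. A minimal sketch (the data here is arbitrary):

import numpy as np

X = np.array([[1.0, 4.0],
              [2.0, 6.0],
              [6.0, 2.0]])

# subtract each column's mean so that every column (feature) has zero mean
Xc = X - X.mean(axis=0)
print(Xc.mean(axis=0))   # [0. 0.] up to rounding error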
We want a $D$-row by $M$-column matrix $\boldsymbol{B}\in\mathbb{R}^{D\times M}$ with orthonormal columns (the low-dimensional coordinates $\boldsymbol{X}\boldsymbol{B}$ are called the code in [MML]), such that we can define $\boldsymbol{Z}$ as follows:
$$ \boldsymbol{Z} = \boldsymbol{X}\boldsymbol{B}\boldsymbol{B}^T. $$
If $M=D$ we insist that $\boldsymbol{Z}=\boldsymbol{X}$. Otherwise we have $M<D$ and $\boldsymbol{Z}$ is an approximation (a projection) of $\boldsymbol{X}$ in a lower dimensional subspace.
We determine $\boldsymbol{B}$ by minimizing the reconstruction error
$$ \frac{1}{N}\sum_{n=1}^{N}\left\| \boldsymbol{x}_n - \boldsymbol{z}_n \right\|^2, $$
where $\boldsymbol{x}_n$ is the $n$-th row of $\boldsymbol{X}$ and $\boldsymbol{z}_n$ is the $n$-th row of $\boldsymbol{Z}$.
THINK ABOUT: If $\boldsymbol{X} = \boldsymbol{X}\boldsymbol{B}\boldsymbol{B}^T$ when $M=D$ then $\boldsymbol{B}\boldsymbol{B}^T=\boldsymbol{I}_D$. Is $\boldsymbol{B}$ square?
THINK ABOUT: If $\boldsymbol{Z} = \boldsymbol{X}\boldsymbol{B}\boldsymbol{B}^T$ when $M<D$ then what shape is $\boldsymbol{Z}$? Is it the same shape as $\boldsymbol{X}$?
THINK ABOUT: If we set $\boldsymbol{Y} = \boldsymbol{X}\boldsymbol{B}$ then $\boldsymbol{Z} = \boldsymbol{Y}\boldsymbol{B}^T$. What shape is $\boldsymbol{Y}$?
THINK ABOUT: $\boldsymbol{Y}$ will be $N$-rows by $M$-columns. $\boldsymbol{Y}$ is smaller than $\boldsymbol{X}$ if $M<D$ and represents dimensionality reduction.
THINK ABOUT: the reduction $\boldsymbol{Y} = \boldsymbol{X}\boldsymbol{B}$, and the subsequent enlargement $\boldsymbol{Z} = \boldsymbol{Y}\boldsymbol{B}^T$ is the basis of an autoencoder. $\boldsymbol{Z}$ is a reconstruction of $\boldsymbol{X}$ resulting from a data compression step.
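Here is a minimal sketch of that compress-then-reconstruct step, taking for $\boldsymbol{B}$ the leading $M$ eigenvectors of the empirical covariance matrix (the eigenvector choice is exactly the result quoted just below):

import numpy as np

# centred data: N = 4 observations, D = 2 features
X = np.array([[ 1.0,  2.0],
              [ 2.0,  1.0],
              [-2.0, -1.0],
              [-1.0, -2.0]])
N, D = X.shape

# take B as the leading M eigenvectors of the empirical covariance matrix
S = X.T @ X / N
lmda, V = np.linalg.eigh(S)          # eigh returns eigenvalues in ascending order
V = V[:, ::-1]                       # reorder so the dominant eigenvector comes first

M = 1
B = V[:, :M]                         # D x M

Y = X @ B                            # N x M : the compressed representation
Z = Y @ B.T                          # N x D : the reconstruction
err = np.sum((X - Z)**2) / N         # the reconstruction error defined above
print('Y =\n', Y)
print('Z =\n', Z)
print('reconstruction error:', err)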
Carrying out the minimization referred to above is a long technical excursion in multivariable calculus. The important result is that we need to find the eigensystem of the empirical data covariance matrix,
$$ \boldsymbol{S} = \frac{1}{N}\boldsymbol{X}^T\boldsymbol{X}. $$This means we want to solve
$$ \boldsymbol{S}\boldsymbol{v} = \lambda\boldsymbol{v} $$for the eigenpairs $(\lambda_1, \boldsymbol{v}_1),\ (\lambda_2, \boldsymbol{v}_2),\ \ldots$
Then $\boldsymbol{B} = (\boldsymbol{v}_1, \boldsymbol{v}_2, \ldots, \boldsymbol{v}_M)$, with the eigenpairs ordered so that $\lambda_1\ge\lambda_2\ge\cdots$, and the eigenvalues tell us how much of the variance of the original data set is captured by the $M$-dimensional projection.
Let's see this in action...
Consider this set of data (already centered),
$$ \boldsymbol{X} = \left(\begin{array}{rr} 1 & 2 \\ 2 & 1 \\ -2 & -1 \\ -1 & -2 \end{array}\right) \quad\Longrightarrow\quad \boldsymbol{S} = \frac{1}{N}\boldsymbol{X}^T\boldsymbol{X} = \frac{1}{4}\left(\begin{array}{rr} 10 & 8 \\ 8 & 10 \end{array}\right) $$The eigensystem, with $\boldsymbol{S}\boldsymbol{V} = \boldsymbol{V}\boldsymbol{D}$, is
$$ \boldsymbol{V} = \frac{1}{\sqrt{2}} \left(\begin{array}{rr} 1 & -1 \\ 1 & 1 \end{array}\right) = \left(\begin{array}{rr} \boldsymbol{v}_0 & \boldsymbol{v}_1 \end{array}\right) \quad\text{ and }\quad \boldsymbol{D} = \frac{1}{2}\left(\begin{array}{rr} 9 & 0 \\ 0 & 1 \end{array}\right) = \left(\begin{array}{rr} \lambda_0 & 0 \\ 0 & \lambda_1 \end{array}\right). $$Let's see this in python...
import numpy as np
import matplotlib.pyplot as plt
# set up the feature matrix and check the column means are zero
D=2; N=4
X = np.array([[1, 2], [2, 1], [-2, -1], [-1, -2]])
print(f'Column means: col 1, {X[:,0].mean()} and col 2, {X[:,1].mean()}')
# and the empirical covariance matrix
S = 1/N*X.T @ X
print('S = \n',S)
# solve the eigenvalue problem
lmda, V = np.linalg.eig(S)
print('evals = ', lmda)
print('evecs = \n', V)
Column means: col 1, 0.0 and col 2, 0.0
S = 
 [[2.5 2. ]
 [2.  2.5]]
evals =  [4.5 0.5]
evecs = 
 [[ 0.70710678 -0.70710678]
 [ 0.70710678  0.70710678]]
# a picture will tell us much more...
plt.figure(figsize=(4,4)); plt.gca().set_aspect('equal')
# plot the data in blue
plt.plot(X[:,0], X[:,1], '.', color='b')
# plot the eigenvectors...
# the first in red from -v0 to +v0 with length 2*lambda_0
x0 = lmda[0]*V[0,[0]]; y0 = lmda[0]*V[1,[0]]
plt.plot([-x0,x0],[-y0,y0],'-', color='r')
# the second in green from -v1 to +v1 with length 2*lambda_1
x1 = lmda[1]*V[0,[1]]; y1 = lmda[1]*V[1,[1]]
plt.plot([-x1,x1],[-y1,y1],'-', color='g')
We see that the direction of maximum variance is given by the dominant eigenpair. The next eigenpair is orthogonal.
Now, we know that $\boldsymbol{V}$ is an orthogonal matrix, so that $\boldsymbol{V}\boldsymbol{V}^T = \boldsymbol{I}$.
It is therefore clear that $\boldsymbol{X}=\boldsymbol{X}\boldsymbol{V}\boldsymbol{V}^T$. Now, with $\boldsymbol{V}=(\boldsymbol{v}_0, \boldsymbol{v}_1)$, we observe that
$$ \boldsymbol{Z}_0 =\boldsymbol{X}\boldsymbol{v}_0\boldsymbol{v}_0^T = \frac{3}{2}\left(\begin{array}{rr} 1 & 1 \\ 1 & 1 \\ -1 & -1 \\ -1 & -1 \end{array}\right) \quad\text{and}\quad \boldsymbol{Z}_1 =\boldsymbol{X}\boldsymbol{v}_1\boldsymbol{v}_1^T = \frac{1}{2}\left(\begin{array}{rr} -1 & 1 \\ 1 & -1 \\ -1 & 1 \\ 1 & -1 \end{array}\right) $$The rows give us the projections of the original rows (observations) onto the lower dimensional subspaces.
Let's see it in code, and then in pictures (building on the picture above)...
print('X - X V V.T = \n', X - X @ V @ V.T )
v0 = V[:,[0]]; Z0 = X @ v0 @ v0.T
print('X @ v0 @ v0.T = \n', Z0)
v1 = V[:,[1]]; Z1 = X @ v1 @ v1.T
print('X @ v1 @ v1.T = \n', Z1)
X - X V V.T = 
 [[ 1.11022302e-16  2.22044605e-16]
 [ 4.44089210e-16  2.22044605e-16]
 [-4.44089210e-16 -2.22044605e-16]
 [-1.11022302e-16 -2.22044605e-16]]
X @ v0 @ v0.T = 
 [[ 1.5  1.5]
 [ 1.5  1.5]
 [-1.5 -1.5]
 [-1.5 -1.5]]
X @ v1 @ v1.T = 
 [[-0.5  0.5]
 [ 0.5 -0.5]
 [-0.5  0.5]
 [ 0.5 -0.5]]
plt.figure(figsize=(3,3)); plt.gca().set_aspect('equal')
plt.plot(X[:,0], X[:,1], '.', color='b')
plt.plot([-x0,x0],[-y0,y0],'-', color='r')
plt.plot([-x1,x1],[-y1,y1],'-', color='g')
# just the first row of Z0 for the moment
plt.plot([X[0,0], Z0[0,0]], [X[0,1], Z0[0,1]], ':', marker='o', color='r', markevery=[1])
In the first row of $\boldsymbol{Z}_0 =\boldsymbol{X}\boldsymbol{v}_0\boldsymbol{v}_0^T$, the original point at $(1,2)$ is projected to the new point $(1.5,1.5)$ on the dominant lower dimensional subspace. What about $\boldsymbol{Z}_1 =\boldsymbol{X}\boldsymbol{v}_1\boldsymbol{v}_1^T$?
plt.figure(figsize=(3,3)); plt.gca().set_aspect('equal')
plt.plot(X[:,0], X[:,1], '.', color='b')
plt.plot([-x0,x0],[-y0,y0],'-', color='r')
plt.plot([-x1,x1],[-y1,y1],'-', color='g')
# just the last row of Z1 for the moment
plt.plot([X[3,0], Z1[3,0]], [X[3,1], Z1[3,1]], ':', marker='o', color='g', markevery=[1])
Now in the last row of $\boldsymbol{Z}_1 =\boldsymbol{X}\boldsymbol{v}_1\boldsymbol{v}_1^T$, the original point at $(-1,-2)$ is projected to the new point $(0.5,-0.5)$ on the next-dominant lower dimensional subspace.
Let's see all the projections in one picture.
plt.figure(figsize=(3,3)); plt.gca().set_aspect('equal')
plt.plot(X[:,0], X[:,1], '.', color='b')
plt.plot([-x0,x0],[-y0,y0],'-', color='r')
plt.plot([-x1,x1],[-y1,y1],'-', color='g')
for k in range(4):
    plt.plot([X[k,0], Z0[k,0]], [X[k,1], Z0[k,1]], ':', marker='o', color='r', markevery=[1])
    plt.plot([X[k,0], Z1[k,0]], [X[k,1], Z1[k,1]], ':', marker='o', color='g', markevery=[1])
If we treat the eigenvectors as subspaces then the length along each eigenvector is the local coordinate in that subspace. How can we get these coordinates? Well, look at this:
$$ \boldsymbol{X} = \left(\begin{array}{rr} 1 & 2 \\ 2 & 1 \\ -2 & -1 \\ -1 & -2 \end{array}\right) \quad\Longrightarrow\quad \boldsymbol{X}\boldsymbol{v}_0 =\frac{1}{\sqrt{2}}\left(\begin{array}{r} 3 \\ 3 \\ -3 \\ -3 \end{array}\right) \quad\text{and}\quad \boldsymbol{X}\boldsymbol{v}_1 =\frac{1}{\sqrt{2}}\left(\begin{array}{r} 1 \\ -1 \\ 1 \\ -1 \end{array}\right). $$These tell us that the first two points (rows) in $\boldsymbol{X}$ project to coincident points a distance $\frac{3}{\sqrt{2}}$ along the dominant eigenvector, and that the last two points project to coincident points a (signed) distance $\frac{-3}{\sqrt{2}}$ along the dominant eigenvector.
On the other hand, the first and third points project to distances $\frac{1}{\sqrt{2}}$ along the second eigenvector, while the second and fourth project to distances $\frac{-1}{\sqrt{2}}$.
Here is some code to illustrate this...
Xv0 = X @ v0
Xv1 = X @ v1
# multiply by root 2 to tidy up the output
print('sqrt(2) X v0 = \n', np.sqrt(2) * Xv0)
print('sqrt(2) X v1 = \n', np.sqrt(2) * Xv1)
sqrt(2) X v0 = 
 [[ 3.]
 [ 3.]
 [-3.]
 [-3.]]
sqrt(2) X v1 = 
 [[ 1.]
 [-1.]
 [ 1.]
 [-1.]]
plt.figure(figsize=(4,4)); plt.gca().set_aspect('equal')
plt.plot(X[:,0], X[:,1], '.', color='b')
plt.plot([-x0,x0],[-y0,y0],'-', color='r')
plt.plot([-x1,x1],[-y1,y1],'-', color='g')
cos45 = sin45 = 1/np.sqrt(2)
# for data point 0 along v0
plt.plot([0, Xv0[0,0]*cos45], [0, Xv0[0,0]*sin45], ':', marker='o', color='k', markevery=[1])
# for data point 3 along v1
plt.plot([0, -Xv1[3,0]*cos45], [0, Xv1[3,0]*sin45], ':', marker='o', color='k', markevery=[1])
There is yet more to see... The column-wise variances in the original data set,
$$ \boldsymbol{X} = \left(\begin{array}{rr} 1 & 2 \\ 2 & 1 \\ -2 & -1 \\ -1 & -2 \end{array}\right) $$are
$$ \left\{\begin{array}{rlll} \mathrm{Var}(\boldsymbol{X}_0) & = \mathbb{E}(\boldsymbol{X}_0\cdot\boldsymbol{X}_0) & = \frac{1}{4}\big(1+2^2+(-2)^2+1\big) & = \frac{5}{2}, \\[4pt] \mathrm{Var}(\boldsymbol{X}_1) & = \mathbb{E}(\boldsymbol{X}_1\cdot\boldsymbol{X}_1) & = \frac{1}{4}\big(2^2+1+1+(-2)^2\big) & = \frac{5}{2}, \end{array}\right. $$and so the total variance in the data set is $\frac{5}{2}+\frac{5}{2}=5$. (Note: this isn't what you get by stacking the data into a single column and taking one variance, because the mean(s) may get altered.)
The sum of the individual feature variances is $\frac{5}{2}+\frac{5}{2}=5$.
In PCA, each eigenvalue gives the variance in the direction of its eigenvector.
Our eigenvalues were $\lambda_0 = \frac{9}{2}$ and $\lambda_1 = \frac{1}{2}$. The total variance is therefore $\frac{9}{2}+\frac{1}{2}=5$.
THINK ABOUT: the trace of a matrix is the sum of its eigenvalues. Relevance?
We talk about each eigenvalue explaining variance in the original data set.
Here the first eigenvalue explains $\frac{9}{2}\div 5 =90\%$ of the original variance. The remaining $10\%$ is in the orthogonal direction of the second eigenvector.
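We can confirm this bookkeeping in code, reusing S and lmda from the cells above (a small sketch):

# the trace of S equals the total variance and also the sum of the eigenvalues
print('trace(S)        =', np.trace(S))          # 5.0
print('sum of evals    =', lmda.sum())           # 5.0
# each eigenvalue's share of the total is its explained variance ratio
print('explained ratio =', lmda / lmda.sum())    # [0.9 0.1]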
We just performed PCA using an eigenvalue analysis of the empirical covariance matrix
$$ \boldsymbol{S} = \frac{1}{N}\boldsymbol{X}^T\boldsymbol{X} \quad\text{leading to}\quad \frac{1}{N}\boldsymbol{X}^T\boldsymbol{X}\boldsymbol{v} =\lambda\boldsymbol{v}. $$Earlier, given the SVD $\boldsymbol{B} = \boldsymbol{U}\boldsymbol{\Sigma}\boldsymbol{V}^T$, we saw that putting $\boldsymbol{A} = \boldsymbol{B}^T\boldsymbol{B}$ (symmetric) and $\boldsymbol{D} = \boldsymbol{\Sigma}^T\boldsymbol{\Sigma}$ led to
$$ \boldsymbol{B}^T\boldsymbol{B} = \boldsymbol{V}\boldsymbol{\Sigma}^T\boldsymbol{\Sigma}\boldsymbol{V}^T \qquad\text{becoming}\qquad \boldsymbol{A}=\boldsymbol{V}\boldsymbol{D}\boldsymbol{V}^T. $$Therefore, for PCA we could also obtain the SVD of $\boldsymbol{X}$ and use the right singular vectors. The eigenvalues will be the squares of the singular values divided by $N$.
Let's check this:
# re-solve the eigenvalue problem
lmda, V = np.linalg.eig(S)
print(f'evals = {lmda} and V = ')
print(V)
# take the SVD of X
U, Sig, VT = np.linalg.svd(X)
print(f'singular values Sigma = {Sig}')
print(f'Sigma^2/N = {Sig*Sig/N} and V = ')
print(VT.T)
evals = [4.5 0.5] and V = 
[[ 0.70710678 -0.70710678]
 [ 0.70710678  0.70710678]]
singular values Sigma = [4.24264069 1.41421356]
Sigma^2/N = [4.5 0.5] and V = 
[[-0.70710678 -0.70710678]
 [-0.70710678  0.70710678]]
Let's see how to do PCA with sklearn...
from sklearn.decomposition import PCA
pca = PCA(n_components=2)
pca.fit(X)
print('Here is the explained variance as ratios...')
print(f'XV ratio = {pca.explained_variance_ratio_}')
print(f'Here are the singular values = {pca.singular_values_}')
print('the eigenvalues are squares of the singular values divided by N')
print(f'eigenvalues = {pca.singular_values_**2/N}')
Here is the explained variance as ratios...
XV ratio = [0.9 0.1]
Here are the singular values = [4.24264069 1.41421356]
the eigenvalues are squares of the singular values divided by N
eigenvalues = [4.5 0.5]
The principal components can be compared with the eigenvectors from above.
Beware: they are given to us in rows.
# the principal components are stored as row vectors, so transpose
B = pca.components_.T
print('Principal Components (transposed) B = \n', B)
print('Compare with our earlier V = \n', V)
Principal Components (transposed) B = 
 [[ 0.70710678  0.70710678]
 [ 0.70710678 -0.70710678]]
Compare with our earlier V = 
 [[ 0.70710678 -0.70710678]
 [ 0.70710678  0.70710678]]
Do you remember that above we used $\boldsymbol{X}\boldsymbol{v}_0$ and $\boldsymbol{X}\boldsymbol{v}_1$ to get the positions (lengths) along the principal axes of the projected data points?
sklearn can do this for us:
# multiply by sqrt(2) to tidy the output.
Xf = pca.fit_transform(X)
print('np.sqrt(2)*Xf = \n', np.sqrt(2)*Xf)
np.sqrt(2)*Xf = 
 [[ 3. -1.]
 [ 3.  1.]
 [-3. -1.]
 [-3.  1.]]
Technically, the principal components give us a new basis for the data space, and the transformed array Xf gives us the coordinates of the data in that new basis. Let's see this in pictures...
Here are the original data points in the original feature basis. This is where each axis is labelled with the feature name.
plt.figure(figsize=(4,4)); plt.gca().set_aspect('equal')
plt.plot(X[:,0], X[:,1], '.', color='b')
Here are the data points in the PCA basis.
plt.figure(figsize=(4,4)); plt.gca().set_aspect('equal')
plt.plot(Xf[:,0], Xf[:,1], '.', color='b')
It is immediately apparent that, in this basis, the data is much closer to being one dimensional: most of the variation lies along the first principal axis.
An issue though is that the axes are no longer easily interpreted.
This is relevant to the explainability agenda in AI and Data Science.
That was a long journey - and we didn't even derive the results, we just quoted and illustrated them. This, again, is because we are doing just enough to make progress at pace.
We're now going to embark on a much more realistic (well, in 2D at least) example of how this works. We'll go faster because all the work has been done.
The following example is used a lot in accounts of PCA.
The idea is to generate and plot a lozenge of Gaussian distributed data. It will have unequal variances (otherwise it would be a circle).
# generate this number of sample points
Ns=50
# The Gaussian lozenge will be centered with non-unit covariance
mean = [0, 0]
cov = [[30, 15], [15, 15]]
# generate Ns random points (x,y)
x, y = np.random.multivariate_normal(mean, cov, Ns).T
# reshape them to columns and stack them next to each other
X = np.hstack((x.reshape(-1,1),y.reshape(-1,1)))
# We can see it if the data matrix is small - otherwise little point
if Ns < 8: print(X)
# let's look at the empirical column means - they won't be exactly zero
print(f'Column means 1, {X[:,0].mean()} and 2, {X[:,1].mean()}')
# so let's center this sample data
X[:,0] -= X[:,0].mean()
X[:,1] -= X[:,1].mean()
print(f'Centered column means 1, {X[:,0].mean()} and 2, {X[:,1].mean()}')
Column means 1, 0.06281921122641367 and 2, -0.22646875398542882
Centered column means 1, 1.6431300764452317e-16 and 2, -7.105427357601002e-17
# let's plot our data set
plt.figure(figsize=(4,4))
plt.xlim(-20,20)
plt.ylim(-20,20)
plt.gca().set_aspect('equal')
plt.plot(X[:,0], X[:,1], '.', color='b')
# perform the PCA
pca = PCA(n_components=2)
pca.fit(X)
print(f'XV ratio = {pca.explained_variance_ratio_}')
print(f'sing vals = {pca.singular_values_}')
# the components are stored as row vectors, so transpose
V = pca.components_.T
print('V = \n', V)
XV ratio = [0.88141429 0.11858571]
sing vals = [51.28172656 18.80999911]
V = 
 [[ 0.83781758 -0.54595028]
 [ 0.54595028  0.83781758]]
# project X onto each principal component
Z1 = X @ V[:,[0]] @ V[:,[0]].T
Z2 = X @ V[:,[1]] @ V[:,[1]].T
# re-plot, and include all the projected data
plt.figure(figsize=(4,4))
plt.gca().set_aspect('equal')
plt.plot(X[:,0], X[:,1], '.', color='b')
# plot the projections - these illustrate the directions
plt.plot(Z1[:,0], Z1[:,1], '.', color='r')
plt.plot(Z2[:,0], Z2[:,1], '.', color='g')
# Now loop over each point and dot-line the projection onto v0 and v1
for k in range(Ns):
    plt.plot([X[k,0], Z1[k,0]], [X[k,1],Z1[k,1]], ':', color='r')
    plt.plot([X[k,0], Z2[k,0]], [X[k,1],Z2[k,1]], ':', color='g')
# zoom in or out with this...
window=10; plt.xlim(-window,window); plt.ylim(-window,window); plt.show()
# Let's see what the data looks like in the new coordinate system
Xf = pca.fit_transform(X)
# here is the original...
plt.figure(figsize=(4,4))
plt.xlim(-20,20)
plt.ylim(-20,20)
plt.gca().set_aspect('equal')
plt.plot(X[:,0], X[:,1], '.', color='b')
# here is the transformed data
plt.figure(figsize=(4,4))
plt.xlim(-20,20)
plt.ylim(-20,20)
plt.gca().set_aspect('equal')
plt.plot(Xf[:,0], Xf[:,1], '.', color='b')
We covered just enough to make progress at pace. We looked at the eigendecomposition of symmetric matrices, the SVD, covariance matrices, and PCA, both by hand and with sklearn.
Now we can start putting all of this material to work.