1.24¶

Logistics¶

OH: M 14:00-16:00

Clustering¶

Input: $x_1,x_2,...,x_n\in R^p$

Goal: identify groups (clusters) of data points

In [ ]:
import numpy as np
u = np.array([1., 3., 5. ,7.])
print(u)
[1. 3. 5. 7.]
In [ ]:
from numpy import linalg as LA
LA.norm(u)
# check against the definition of the Euclidean norm
np.sqrt(np.sum(u ** 2))
Out[ ]:
9.16515138991168
In [ ]:
# creating a matrix by stacking vectors as rows with np.stack:
u = np.array([1., 3., 5., 7.])
v = np.array([2., 4., 6., 8.])
w = np.array([9., 8., 7., 6.])
X = np.stack((u,v,w))
print(X)
[[1. 3. 5. 7.]
 [2. 4. 6. 8.]
 [9. 8. 7. 6.]]
In [ ]:
import matplotlib.pyplot as plt
x = np.linspace(-2,2,100)
y = x ** 2
plt.plot(x,y)
plt.show()

Probability¶

$Var(X)=E[(X-E[X])^2]=E[X^2]-E[X]^2$
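A quick numerical check of this identity (my addition, not from the notes): on a large sample, the empirical versions of the two sides agree up to floating-point error.

In [ ]:
# sanity check: Var(X) = E[(X - E[X])^2] = E[X^2] - E[X]^2
import numpy as np

rng = np.random.default_rng(0)
x = rng.exponential(scale=2.0, size=100_000)  # Exp(scale=2): Var = 4

lhs = np.mean((x - x.mean()) ** 2)     # E[(X - E[X])^2]
rhs = np.mean(x ** 2) - x.mean() ** 2  # E[X^2] - E[X]^2
print(lhs, rhs)                        # identical, both near 4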

Markov's inequality¶

For a nonnegative random variable $X$: $P(X\ge a)\le \frac{E[X]}{a},\forall a>0$

Chebyshev's inequality¶

$P(|X-\mu|\ge a)\le \frac{Var(X)}{a^2}$, where $\mu=E[X]$
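To make both bounds concrete, here is a small simulation (my addition) for $X\sim Exp(1)$, where $E[X]=Var(X)=1$ and $\mu=1$:

In [ ]:
# empirical tail probabilities vs. the Markov and Chebyshev bounds
import numpy as np

rng = np.random.default_rng(1)
x = rng.exponential(size=1_000_000)  # Exp(1): E[X] = 1, Var(X) = 1

for a in [2.0, 3.0, 5.0]:
    markov = 1.0 / a                     # E[X]/a
    chebyshev = 1.0 / a ** 2             # Var(X)/a^2
    p_tail = np.mean(x >= a)             # P(X >= a)
    p_dev = np.mean(np.abs(x - 1) >= a)  # P(|X - mu| >= a)
    print(f"a={a}: {p_tail:.4f} <= {markov:.4f} (Markov), "
          f"{p_dev:.4f} <= {chebyshev:.4f} (Chebyshev)")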

1.26¶

$Var(aX+Y)=Var(aX)+Var(Y)=a^2Var(X)+Var(Y)$, where the first equality holds only if $X$ and $Y$ are independent

Weak law of large numbers¶

$X_1,X_2,...,X_n$ are i.i.d. RVs and $\frac{s_n}{n}=\frac{X_1+...+X_n}{n}$; then $\frac{s_n}{n}\rightarrow E[X]$ in probability, i.e. the sample mean converges to the population mean. That is, for every $\epsilon>0$:

$\lim_{n\rightarrow \infty}P(|\frac{s_n}{n}-E[X]|>\epsilon)=0$

Proof¶

$E[\frac{s_n}{n}]=E[\frac{X_1+...+X_n}{n}]=\frac{E[X_1]+...+E[X_n]}{n}=E[X_1]$

$Var(\frac{s_n}{n})=\frac{1}{n^2}Var(X_1+...+X_n)=\frac{1}{n^2}\cdot n\,Var(X_1)=\frac{Var(X_1)}{n}$ by independence. So, as $n\rightarrow \infty$, $Var(\frac{s_n}{n})\rightarrow 0$.

And by Chebyshev, $P(|\frac{s_n}{n}-E[X]|>\epsilon) \le \frac{Var(\frac{s_n}{n})}{\epsilon ^2} = \frac{Var(X_1)}{n \epsilon ^2}$, which tends to $0$ as $n\rightarrow\infty$.
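As an illustration (a sketch I am adding, not part of the lecture), plot the running sample mean of i.i.d. Uniform$[0,1]$ draws and watch it settle near $E[X]=0.5$:

In [ ]:
# weak law of large numbers: the running sample mean s_n/n of i.i.d.
# Uniform[0,1] draws concentrates around the population mean 0.5
import numpy as np
import matplotlib.pyplot as plt

rng = np.random.default_rng(2)
x = rng.uniform(size=10_000)
running_mean = np.cumsum(x) / np.arange(1, x.size + 1)  # s_n / n

plt.plot(running_mean, label=r"$s_n/n$")
plt.axhline(0.5, color="k", linestyle="--", label=r"$E[X]=0.5$")
plt.xlabel("n")
plt.legend()
plt.show()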

K-means Clustering¶

Objective¶

$\min_{C_1,...,C_k} \min_{\mu_1,...,\mu_k \in \mathbf{R}^d} \sum_{i=1}^k \sum_{j\in C_i} ||x_j-\mu_i||^2$

Lemma:¶

$\mu_i^*=\frac{1}{|C_i|}\sum_{j \in C_i}x_j$

K-means algorithm (Alternating minimization)¶

  • Optimal representatives: update each $\mu_i$ to the centroid of cluster $C_i$ (the mean of its members)
  • Optimal clustering: update $C_1,...,C_k$ by assigning each point to its nearest representative (see the sketch below)
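Below is a minimal numpy sketch of this alternating scheme (my own illustration; the two-blob data, k=2, and the random initialization are arbitrary choices, and empty clusters are not handled):

In [ ]:
# minimal k-means via alternating minimization (illustration only)
import numpy as np

def kmeans(X, k, n_iters=50, seed=0):
    rng = np.random.default_rng(seed)
    # initialize the representatives as k distinct random data points
    mu = X[rng.choice(len(X), size=k, replace=False)]
    for _ in range(n_iters):
        # optimal clustering: assign each point to its nearest representative
        dists = np.linalg.norm(X[:, None, :] - mu[None, :, :], axis=2)
        labels = dists.argmin(axis=1)
        # optimal representatives: centroid (mean) of each cluster's members
        mu = np.stack([X[labels == i].mean(axis=0) for i in range(k)])
    return labels, mu

rng = np.random.default_rng(3)
X = np.vstack([rng.normal(size=(50, 2)), rng.normal(size=(50, 2)) + 5])
labels, mu = kmeans(X, k=2)
print(mu)  # two centroids, near (0, 0) and (5, 5)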

K-means by matrix:¶

$Z$ is the cluster-membership (assignment) matrix. For example, if $C_1=\{1,4,6,8\}, C_2=\{2,3,7\}, C_3=\{5\}$, then $Z=\begin{bmatrix} 1&0&0\\ 0&1&0\\ 0&1&0\\ 1&0&0\\ 0&0&1\\ 1&0&0\\ 0&1&0\\ 1&0&0\\ \end{bmatrix}$
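As a side note (my addition), $Z$ can be built in numpy by one-hot encoding the cluster labels; $Z^TZ$ is then the diagonal matrix of cluster sizes $|C_i|$:

In [ ]:
# build the matrix Z from 0-indexed cluster labels by one-hot encoding
import numpy as np

labels = np.array([0, 1, 1, 0, 2, 0, 1, 0])  # C_1={1,4,6,8}, C_2={2,3,7}, C_3={5}
Z = np.eye(3)[labels]
print(Z)
print(Z.T @ Z)  # diagonal matrix with the cluster sizes 4, 3, 1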

1.31¶

K-means clustering in high dimensional data¶

K-means clustering performs poorly on high-dimensional data.

New phenomenon¶

Imagine a $d$-dimensional cube and a ball inscribed in it. If we pick a point uniformly at random in the cube, what is the probability that it falls inside the ball?

Let $B=\{x \in R^d:||x|| \leq \frac{1}{2}\}$ and $C=[-\frac{1}{2},\frac{1}{2}]^d$. Pick $\overrightarrow{X}\sim U(C)$, where $\overrightarrow{X}=(X_1,X_2,...,X_d)$. Then as $d \rightarrow + \infty$:

$P[\overrightarrow{X}\in B]\rightarrow 0$

Why? The PDF of each $X_i$ is $1$ on $[-\frac{1}{2},\frac{1}{2}]$, and by independence the joint density of $\overrightarrow{X}$ is the product of the marginals, so it equals $1$ on $C$. Hence:

$P[\overrightarrow{X} \in B]=\frac{Vol(B)}{Vol(C)}=Vol(B)=\frac{\pi^{d/2}}{2^d\,\Gamma(\frac{d}{2}+1)}$,

which goes to $0$ as $d \rightarrow \infty$.
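A quick Monte Carlo experiment (my addition) shows how fast this probability collapses as $d$ grows:

In [ ]:
# fraction of uniform points in the cube [-1/2, 1/2]^d that land
# inside the inscribed ball of radius 1/2
import numpy as np

rng = np.random.default_rng(4)
n_samples = 100_000
for d in [2, 5, 10, 20]:
    X = rng.uniform(-0.5, 0.5, size=(n_samples, d))
    inside = np.linalg.norm(X, axis=1) <= 0.5
    print(f"d={d}: P[X in B] ~ {inside.mean():.5f}")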

2.7¶

Linear algebra review¶

If $V\subseteq R^n$ is a subspace, then $\exists$ a basis $u_1,...,u_r\in V$ s.t.:

  1. $V \subseteq span(u_1,...,u_r)$

  2. $u_1,...,u_r$ are linearly independent ($r=dim(V)$)

Orthogonality¶

Let $u,v\in R^n$. We say $u$ and $v$ are orthogonal, written $u\perp v$, if $<u,v>=u^Tv=0$. Because $<u,v>=||u||\cdot ||v||\cdot cos\theta$, we have $<u,v>=0 \iff cos \theta =0 \iff \theta=\frac{\pi}{2}$.

Properties:¶

  1. Symmetry: $<u,v>=<v,u>$
  2. Linearity: $<au+v,w>=a<u,w>+<v,w>$
  3. Norm: $<u,u>=||u||\cdot ||u||\cdot cos(0)=||u||^2$

Lemma. (Pythagoras)

  • If $u,v\in R^n, u\perp v$, then $||u+v||^2=||u||^2+||v||^2$
  • Proof: $||u+v||^2=<u+v,u+v>=||u||^2+2<u,v>+||v||^2$ by linearity and symmetry, and $<u,v>=0$

Lemma. (Cauchy-Schwarz)

  • If $u,v\in R^n$, then $|<u,v>|\le||u||\cdot||v||$
  • Proof: decompose $v$ into components parallel and orthogonal to $u$, then apply linearity and Pythagoras

A list of vectors $[u_1,...,u_m]$ is orthonormal if $<u_i,u_j>=0$ for $i\neq j$ and $<u_i,u_i>=1$.

Lemma.

  1. If $[u_1,...,u_m]$ is orthonormal, then they are linearly independent
  2. $||\sum_{i=1}^m \alpha_i u_i||^2=\sum_{i=1}^m \alpha_i^2$

Thm. (Orthonormal expansion)

$\{q_1,...,q_m\}=$ orthonormal basis of $U\subseteq R^n$. For any $w\in U$, $w=\sum_{j=1}^m<w,q_j>\cdot q_j$

Thm. (Orthogonal projection)

The projection of $v$ onto $U$ is the point $p\in U$ closest to $v$; the residual $v-p$ forms a right angle with every vector in $U$.

Def.

$U \subseteq R^n, v\in R^n$. Then:

  1. $\exists$ a unique solution $p$ to $\min_{p\in U}||p-v||$; denote it $proj_{U}(v)$
  2. $p$ satisfies: $<v-p,u>=0, \forall u\in U$ (the residual $v-p$ is orthogonal to every $u\in U$)
  3. If $\{q_1,...,q_m\}$ is an orthonormal basis of $U$, then $p^*=proj_{U}(v)=\sum_{j=1}^m<v,q_j>q_j$
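A short numerical illustration of properties 2 and 3 (mine, not from the notes): build an orthonormal basis of a random 2-dimensional subspace of $R^4$ via QR, project, and check that the residual is orthogonal to the subspace.

In [ ]:
# orthogonal projection of v onto U = span of the columns of A
import numpy as np

rng = np.random.default_rng(5)
A = rng.normal(size=(4, 2))  # columns span U
Q, _ = np.linalg.qr(A)       # columns of Q: orthonormal basis q_1, q_2 of U
v = rng.normal(size=4)

p = Q @ (Q.T @ v)            # p = sum_j <v, q_j> q_j
print(Q.T @ (v - p))         # residual v - p is orthogonal to U (~ zero)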

Orthogonality in high dimension¶

2.28¶

PCA¶

Goal: dimension reduction (find $\phi$ s.t. the sample variance after projection is maximized)¶
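A minimal sketch of this goal (my addition; a real pipeline would use e.g. sklearn's PCA): center the data, take the top right singular vector as $\phi$, and compare the sample variance of the projections along $\phi$ with that along another direction.

In [ ]:
# PCA sketch: the top right singular vector of the centered data matrix
# is the direction phi that maximizes the sample variance of the projections
import numpy as np

rng = np.random.default_rng(6)
X = rng.normal(size=(200, 2)) @ np.array([[3.0, 1.0], [0.0, 0.5]])

Xc = X - X.mean(axis=0)  # center the data
U, S, Vt = np.linalg.svd(Xc, full_matrices=False)
phi = Vt[0]              # first principal direction

print((Xc @ phi).var())                   # largest achievable sample variance
print((Xc @ np.array([0.0, 1.0])).var())  # much smaller along e_2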

Condition Numbers¶

$Ax=b$: how sensitive is $x$ to changes in $b$?

$k(A)=||A||_2 ||A^{-1}||_2=\frac{\sigma_1}{\sigma_n}$, where $\sigma_1$ and $\sigma_n$ are the largest and smallest singular values of $A$

Thm.¶

$$\max_{d\neq0} \frac{\frac{||M(z+d)-Mz||}{||Mz||}}{\frac{||d||}{||z||}}\leq k_2(M)$$

Apply this with $M=A^{-1}$, $z=b$, $d=\delta b$. If $A(x+\delta x)=b+\delta b$, then:

$$x+\delta x=A^{-1}(b+\delta b)=A^{-1}b+A^{-1}\delta b$$

where $A^{-1}b=x$, so:

$$x+\delta x=x+A^{-1}\delta b \Rightarrow \delta x = A^{-1}\delta b$$

and the theorem gives:

$$\frac{||\delta x||}{||x||} \leq k_2(A) \frac{||\delta b||}{||b||}$$
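A small demo of this bound (my addition): for a nearly singular $A$, a tiny relative perturbation of $b$ produces a much larger relative change in $x$, but never more than the factor $k_2(A)$.

In [ ]:
# condition number demo: relative error amplification when solving Ax = b
import numpy as np

A = np.array([[1.0, 1.0],
              [1.0, 1.0001]])  # nearly singular, hence ill-conditioned
print("k_2(A) =", np.linalg.cond(A, 2))

b = np.array([2.0, 2.0001])
x = np.linalg.solve(A, b)

db = np.array([0.0, 1e-5])  # small perturbation of b
dx = np.linalg.solve(A, b + db) - x

lhs = np.linalg.norm(dx) / np.linalg.norm(x)
rhs = np.linalg.cond(A, 2) * np.linalg.norm(db) / np.linalg.norm(b)
print(lhs, "<=", rhs)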
In [ ]:
import numpy as np

a = np.array([1, 2, 3, 4])
b = np.array([5, 8, 9, 2])

# outer product: entry (i, j) equals a[i] * b[j]
np.outer(a, b)
Out[ ]:
array([[ 5,  8,  9,  2],
       [10, 16, 18,  4],
       [15, 24, 27,  6],
       [20, 32, 36,  8]])