QR Decompositions¶
QR decompositions are a powerful tool in linear algebra and data science for several reasons. They provide a way to decompose a matrix into an orthogonal matrix $Q$ and an upper triangular matrix $R$, which can simplify many computations and analyses.
Theorem. Let $A$ be an $m \times n$ matrix with linearly independent columns ($m \geq n$ in this case). Then $A$ can be decomposed as $A = QR$ where $Q$ is an $m \times n$ matrix whose columns form an orthonormal basis for Col($A$) and $R$ is an $n \times n$ upper-triangular invertible matrix with positive entries on the diagonal.
In the literature, the QR decomposition is sometimes phrased as follows: any $m \times n$ matrix $A$ can also be written as $A = QR$ where $Q$ is an $m \times m$ orthogonal matrix ($Q^T = Q^{-1}$), and $R$ is an $m \times n$ upper-triangular matrix. One follows from the other by playing around with some matrix equations. Indeed, suppose that $A = Q_1R_1$ is a decomposition as above (that is, $Q_1$ is $m \times n$ and $R_1$ is $n \times n$). One can use the Gram-Schmidt procedure to extend the columns of $Q_1$ to an orthonormal basis for all of $\mathbb{R}^m$, and put the remaining vectors in an $m \times (m - n)$ matrix $Q_2$. Then
$$ A = Q_1R_1 = \begin{bmatrix} Q_1 & Q_2 \end{bmatrix}\begin{bmatrix} R_1 \\ 0 \end{bmatrix}. $$
The left matrix is an $m \times m$ orthogonal matrix and the right matrix is $m \times n$ upper triangular. Moreover, the decomposition provides orthonormal bases for both the column space of $A$ and its perp: the columns of $Q_1$ form an orthonormal basis for the column space of $A$, and the columns of $Q_2$ form an orthonormal basis for the perp of the column space of $A$.
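In numpy, this full decomposition is available by passing `mode='complete'` to numpy.linalg.qr. A quick sketch, using the second example matrix from further below:

```python
import numpy as np

# A 4x3 matrix with linearly independent columns
A = np.array([[1., 0., 0.],
              [1., 1., 0.],
              [1., 1., 1.],
              [1., 1., 1.]])

# "Complete" QR: Q is 4x4 orthogonal, R is 4x3 upper triangular
# (the bottom row of R is zero)
Q, R = np.linalg.qr(A, mode='complete')

print(Q.shape, R.shape)                  # (4, 4) (4, 3)
print(np.allclose(Q @ R, A))             # True
print(np.allclose(Q.T @ Q, np.eye(4)))   # True
```

The first 3 columns of $Q$ play the role of $Q_1$ and the last column the role of $Q_2$.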
However, we will often want to use the decomposition when $Q$ is $m \times n$, $R$ is $n \times n$, and the columns of $Q$ form an orthonormal basis for the column space of $A$. For example, the Python function numpy.linalg.qr gives QR decompositions this way (again, assuming that the columns of $A$ are linearly independent, so $m \geq n$).
Key take-away. The QR decomposition provides an orthonormal basis for the column space of $A$: under our assumption that $A$ has linearly independent columns, the columns of $Q$ form an orthonormal basis for Col($A$).
For small matrices, one can find $Q$ and $R$ by hand, assuming that $A = [ a_1\ \cdots\ a_n ]$ has full column rank. Let $e_1,\dots,e_n$ be the unnormalized vectors we get when we apply Gram-Schmidt to $a_1,\dots,a_n$, and let $u_1,\dots,u_n$ be their normalizations. Let $$ r_j = \begin{bmatrix} \langle u_1,a_j \rangle \\ \vdots \\ \langle u_n, a_j \rangle \end{bmatrix}, $$ and note that $\langle u_i,a_j \rangle = 0$ whenever $i > j$, since $u_i$ is orthogonal to the span of $a_1,\dots,a_{i-1}$, which contains $a_j$. Thus $$ Q = \begin{bmatrix} u_1 & \cdots & u_n \end{bmatrix} \text{ and } R = \begin{bmatrix} r_1 & \cdots & r_n \end{bmatrix} $$ give a decomposition $A = QR$, where the columns of $Q$ form an orthonormal basis for $\text{Col}(A)$ and $R$ is upper-triangular. We can also compute $R$ directly from $Q$ and $A$. Indeed, note that $Q^TQ = I$, so $$ Q^TA = Q^T(QR) = IR = R. $$
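The procedure above can be sketched in a few lines of numpy. This is a classical Gram-Schmidt sketch under the full-column-rank assumption, for illustration only; it is not the numerically robust algorithm numpy uses internally:

```python
import numpy as np

def gram_schmidt_qr(A):
    """QR via classical Gram-Schmidt; assumes A has full column rank."""
    m, n = A.shape
    Q = np.zeros((m, n))
    for j in range(n):
        # Subtract the components of a_j along the previously computed columns
        v = A[:, j] - Q[:, :j] @ (Q[:, :j].T @ A[:, j])
        # Normalize to get u_j
        Q[:, j] = v / np.linalg.norm(v)
    # Since Q^T Q = I, we recover R as Q^T A
    R = Q.T @ A
    return Q, R

A = np.array([[1., 0., 0.],
              [1., 1., 0.],
              [1., 1., 1.],
              [1., 1., 1.]])
Q, R = gram_schmidt_qr(A)
print(np.allclose(Q @ R, A))  # True
```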
Example. Find a QR decomposition for the matrix $$ A = \begin{bmatrix} 1 & 1 & 1 \\ 0 & 1 & 1 \\ 0 & 0 & 1 \\ 0 & 0 & 0 \end{bmatrix}. $$ Note that one sees immediately (or by applying the Gram-Schmidt procedure) that $$ \begin{bmatrix} 1 \\ 0 \\ 0 \\ 0 \end{bmatrix}, \begin{bmatrix} 0 \\ 1 \\ 0 \\ 0 \end{bmatrix}, \begin{bmatrix} 0 \\ 0 \\ 1 \\ 0 \end{bmatrix} $$ forms an orthonormal basis for the column space of $A$. So with $$ Q = \begin{bmatrix} 1 & 0 & 0 \\ 0 & 1 & 0 \\ 0 & 0 & 1 \\ 0 & 0 & 0 \end{bmatrix} \text{ and }R = \begin{bmatrix} 1 & 1 & 1\\ 0 & 1 & 1 \\ 0 & 0 & 1 \end{bmatrix}, $$ we have $A = QR$.
Let's do a more involved example.
Example. Consider the matrix $$ A = \begin{bmatrix} 1 & 0 & 0 \\ 1 & 1 & 0 \\ 1 & 1 & 1 \\ 1 & 1 & 1 \end{bmatrix}. $$ One can apply the Gram-Schmidt procedure to the columns of $A$ to find that $$ \begin{bmatrix} 1 \\ 1 \\ 1 \\ 1 \end{bmatrix}, \begin{bmatrix} -3 \\ 1 \\ 1 \\ 1 \end{bmatrix}, \begin{bmatrix} 0 \\ -\frac{2}{3} \\ \frac{1}{3} \\ \frac{1}{3}\end{bmatrix} $$ forms an orthogonal basis for the column space of $A$. Normalizing, we get that $$ Q = \begin{bmatrix} \frac{1}{2} & -\frac{3}{\sqrt{12}} & 0 \\ \frac{1}{2} & \frac{1}{\sqrt{12}} & -\frac{2}{\sqrt{6}} \\ \frac{1}{2} & \frac{1}{\sqrt{12}} & \frac{1}{\sqrt{6}} \\ \frac{1}{2} & \frac{1}{\sqrt{12}} & \frac{1}{\sqrt{6}} \end{bmatrix} $$ is an appropriate $Q$. Thus $$ \begin{split} R = Q^TA &= \begin{bmatrix} \frac{1}{2} & \frac{1}{2} & \frac{1}{2} & \frac{1}{2} \\ -\frac{3}{\sqrt{12}} & \frac{1}{\sqrt{12}} & \frac{1}{\sqrt{12}} & \frac{1}{\sqrt{12}} \\ 0 & -\frac{2}{\sqrt{6}} & \frac{1}{\sqrt{6}} & \frac{1}{\sqrt{6}} \end{bmatrix}\begin{bmatrix} 1 & 0 & 0 \\ 1 & 1 & 0 \\ 1 & 1 & 1 \\ 1 & 1 & 1 \end{bmatrix} \\ &= \begin{bmatrix} 2 & \frac{3}{2} & 1 \\ 0 & \frac{3}{\sqrt{12}} & \frac{2}{\sqrt{12}} \\ 0 & 0 & \frac{2}{\sqrt{6}} \end{bmatrix}. \end{split} $$ So all together, $$A = \begin{bmatrix} \frac{1}{2} & -\frac{3}{\sqrt{12}} & 0 \\ \frac{1}{2} & \frac{1}{\sqrt{12}} & -\frac{2}{\sqrt{6}} \\ \frac{1}{2} & \frac{1}{\sqrt{12}} & \frac{1}{\sqrt{6}} \\ \frac{1}{2} & \frac{1}{\sqrt{12}} & \frac{1}{\sqrt{6}} \end{bmatrix}\begin{bmatrix} 2 & \frac{3}{2} & 1 \\ 0 & \frac{3}{\sqrt{12}} & \frac{2}{\sqrt{12}} \\ 0 & 0 & \frac{2}{\sqrt{6}} \end{bmatrix}. $$
To do this numerically, we can use numpy.linalg.qr.
import numpy as np
# Define our matrices
A = np.array([[1,1,1],[0,1,1],[0,0,1],[0,0,0]])
B = np.array([[1,0,0],[1,1,0],[1,1,1],[1,1,1]])
# Take QR decompositions
QA, RA = np.linalg.qr(A)
QB, RB = np.linalg.qr(B)
Our resulting matrices are:
print(f"QA = {QA}\n")
print(f"RA = {RA}\n")
print(f"QB = {QB}\n")
print(f"RB = {RB}")
QA = [[ 1.  0.  0.]
 [-0.  1.  0.]
 [-0. -0.  1.]
 [-0. -0. -0.]]

RA = [[1. 1. 1.]
 [0. 1. 1.]
 [0. 0. 1.]]

QB = [[-0.5         0.8660254   0.        ]
 [-0.5        -0.28867513  0.81649658]
 [-0.5        -0.28867513 -0.40824829]
 [-0.5        -0.28867513 -0.40824829]]

RB = [[-2.         -1.5        -1.        ]
 [ 0.         -0.8660254  -0.57735027]
 [ 0.          0.         -0.81649658]]
How to use QR decompositions¶
One of the primary uses of QR decompositions is to solve least squares problems, as introduced above. Assuming that $A$ has full column rank, we can write $A = QR$ as a QR decomposition, and then we can find a least-squares solution to $Ax = b$ by solving the upper-triangular system.
Theorem. Let $A$ be an $m \times n$ matrix with full column rank, and let $A = QR$ be a QR factorization of $A$. Then, for each $b \in \mathbb{R}^m$, the equation $Ax = b$ has a unique least-squares solution, arising from the system $$ Rx = Q^Tb. $$
Normal equations can be ill-conditioned, i.e., small errors in calculating $A^TA$ give large errors when trying to solve the least-squares problem. When $A$ has full column rank, a QR factorization will allow one to compute a solution to the least-squares problem more reliably.
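To see why the normal equations can be problematic, note that forming $A^TA$ roughly squares the condition number of the problem. A quick illustration with a hypothetical nearly-collinear matrix:

```python
import numpy as np

# A tall matrix whose columns are nearly parallel (an illustrative example)
eps = 1e-6
A = np.array([[1., 1.],
              [1., 1. + eps],
              [1., 1. - eps]])

# The condition number of A^T A is roughly the square of that of A,
# which is why forming the normal equations can lose precision
print(np.linalg.cond(A))        # large
print(np.linalg.cond(A.T @ A))  # much larger (roughly squared)
```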
Example. Let $$ A = \begin{bmatrix} 1 & 0 & 0 \\ 1 & 1 & 0 \\ 1 & 1 & 1 \\ 1 & 1 & 1 \end{bmatrix} \text{ and } b = \begin{bmatrix} 1 \\ 1 \\ 1 \\ 0 \end{bmatrix}. $$ We can find the least-squares solution to $Ax = b$ by using the QR decomposition. Let us use the QR decomposition from above, and solve the system $$ Rx = Q^Tb. $$ As $$ \begin{bmatrix} \frac{1}{2} & -\frac{3}{\sqrt{12}} & 0 \\ \frac{1}{2} & \frac{1}{\sqrt{12}} & -\frac{2}{\sqrt{6}} \\ \frac{1}{2} & \frac{1}{\sqrt{12}} & \frac{1}{\sqrt{6}} \\ \frac{1}{2} & \frac{1}{\sqrt{12}} & \frac{1}{\sqrt{6}} \end{bmatrix}^T\begin{bmatrix} 1 \\ 1 \\ 1 \\ 0 \end{bmatrix} = \begin{bmatrix} \frac{3}{2} \\ -\frac{1}{2\sqrt{3}} \\ -\frac{1}{\sqrt{6}} \end{bmatrix}, $$ we are looking at the system $$ \begin{bmatrix} 2 & \frac{3}{2} & 1 \\ 0 & \frac{3}{\sqrt{12}} & \frac{2}{\sqrt{12}} \\ 0 & 0 & \frac{2}{\sqrt{6}} \end{bmatrix}x =\begin{bmatrix} \frac{3}{2} \\ -\frac{1}{2\sqrt{3}} \\ -\frac{1}{\sqrt{6}} \end{bmatrix}. $$ Solving this system yields that $$ x_0 = \begin{bmatrix} 1 \\ 0 \\ -\frac{1}{2} \end{bmatrix} $$ is a least-squares solution to $Ax = b$.
Let us set this system up in python and use numpy.linalg.solve.
import numpy as np
# Define matrix and vector
A = np.array([[1,0,0],[1,1,0],[1,1,1],[1,1,1]])
b = np.array([[1],[1],[1],[0]])
# Take the QR decomposition of A
Q, R = np.linalg.qr(A)
# Solve the linear system Rx = Q.T b
beta = np.linalg.solve(R,Q.T @ b)
This yields
beta
array([[ 1.00000000e+00],
[ 6.40987562e-17],
[-5.00000000e-01]])
which (basically) agrees with our exact least-squares solution.
Note that numpy.linalg.lstsq still gives an ever so slightly different result.
np.linalg.lstsq(A,b)[0]
array([[ 1.00000000e+00],
[ 2.22044605e-16],
[-5.00000000e-01]])
Let's go back to the house example. While we're at it, let's get used to using pandas to make a dataframe.
import numpy as np
import pandas as pd
# First let us make a dictionary incorporating our data.
# Each entry corresponds to a column (feature of our data)
data = {
'Square ft': [1600, 2100, 1550, 1600, 2000],
'Bedrooms': [3, 4, 2, 3, 4],
'Price': [500, 650, 475, 490, 620]
}
# Create a pandas DataFrame
df = pd.DataFrame(data)
# Create our matrix X and our target y
X = df[["Square ft", "Bedrooms"]].to_numpy()
y = df[["Price"]].to_numpy()
# Augment X with a column of 1's (intercept)
X_aug = np.hstack((np.ones((X.shape[0], 1)), X))
# Perform QR decomposition
Q, R = np.linalg.qr(X_aug)
# Solve the upper triangular system Rx = Q^Ty
beta = np.linalg.solve(R, Q.T @ y)
Let's look at the output.
print(f"Q = {Q} \n\nR = {R} \n\nbeta = {beta}")
Q = [[-0.4472136   0.32838365  0.40496317]
 [-0.4472136  -0.63745061 -0.22042299]
 [-0.4472136   0.42496708 -0.7689174 ]
 [-0.4472136   0.32838365  0.40496317]
 [-0.4472136  -0.44428376  0.17941406]]

R = [[-2.23606798e+00 -3.95784032e+03 -7.15541753e+00]
 [ 0.00000000e+00 -5.17687164e+02 -1.50670145e+00]
 [ 0.00000000e+00  0.00000000e+00  7.27908474e-01]]

beta = [[-3.05053797e-13]
 [ 3.00000000e-01]
 [ 5.00000000e+00]]
As we can see, the least-squares solution agrees with what we got by hand and by other python methods (if we agree that the tiny first component is essentially zero).
The QR decomposition of a matrix is also useful for computing orthogonal projections.
Theorem. Let $A$ be an $m \times n$ matrix with full column rank. If $A = QR$ is a QR decomposition, then $QQ^T$ is the projection onto the column space of $A$, i.e., $QQ^Tb = \text{Proj}_{\text{Col}(A)}b$ for all $b \in \mathbb{R}^m$.
Let's see what the range projections are for the matrices above. Note that for the first example above, the orthogonal projection is just $$ \begin{bmatrix} 1 \\ & 1 \\ & & 1\\ & & & 0 \end{bmatrix}. $$ Let's look at the other matrix.
Example. Working with the matrix $$ A = \begin{bmatrix} 1 & 0 & 0 \\ 1 & 1 & 0 \\ 1 & 1 & 1 \\ 1 & 1 & 1 \end{bmatrix}, $$ the projection onto the column space is given by $$ QQ^T = \begin{bmatrix} 1 \\ & 1 \\ & & \frac{1}{2} & \frac{1}{2} \\ & & \frac{1}{2} & \frac{1}{2} \end{bmatrix}. $$ This is a well-understood projection: it is the direct sum of the identity on $\mathbb{R}^2$ and the projection onto the line $y = x$ in $\mathbb{R}^2$.
Now let's use python to implement the projection.
import numpy as np
# Create our matrix A
A = np.array([[1,0,0],[1,1,0],[1,1,1],[1,1,1]])
# Take the QR decomposition
Q, R = np.linalg.qr(A)
# Create the range projection
P = Q @ Q.T
P
array([[1.00000000e+00, 2.89687929e-17, 2.89687929e-17, 2.89687929e-17],
[2.89687929e-17, 1.00000000e+00, 7.07349921e-17, 7.07349921e-17],
[2.89687929e-17, 7.07349921e-17, 5.00000000e-01, 5.00000000e-01],
[2.89687929e-17, 7.07349921e-17, 5.00000000e-01, 5.00000000e-01]])
As we can see, the two off-diagonal blocks are tiny, so we treat them as zero. Note that if they were not actually zero, then $P$ would not actually be a projection (we would have $P^2 \neq P$). This can cause some problems.
Let's write a function to implement this, assuming that columns of A are linearly independent.
import numpy as np
def proj_onto_col_space(A):
    # Take the QR decomposition
    Q, R = np.linalg.qr(A)
    # The projection is just Q @ Q.T
    P = Q @ Q.T
    return P
We'll come back to this later. We should really incorporate some sort of error tolerance so that entries that are extremely tiny can simply be set to zero.
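As a minimal sketch of that fix: the function name `proj_onto_col_space_tol` and the absolute cutoff `1e-12` below are illustrative choices, not canonical ones.

```python
import numpy as np

def proj_onto_col_space_tol(A, tol=1e-12):
    """Projection onto Col(A), with tiny entries snapped to zero.

    Assumes the columns of A are linearly independent; the cutoff
    `tol` is an illustrative choice.
    """
    Q, _ = np.linalg.qr(A)
    P = Q @ Q.T
    # Zero out entries smaller than the tolerance in absolute value
    P[np.abs(P) < tol] = 0.0
    return P

A = np.array([[1., 0., 0.],
              [1., 1., 0.],
              [1., 1., 1.],
              [1., 1., 1.]])
print(proj_onto_col_space_tol(A))
```

Applied to the matrix above, the off-diagonal entries of order $10^{-17}$ are sent to exactly zero.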
Remark. Another way to get the projection onto the column space of an $n \times p$ matrix $A$ of full column rank is to take $$ P = A(A^TA)^{-1}A^T. $$ Indeed, let $b \in \mathbb{R}^n$ and let $x_0 \in \mathbb{R}^p$ be a solution to the normal equations $$ A^TAx_0 = A^Tb. $$ Then $x_0 = (A^TA)^{-1}A^Tb$ and so $Ax_0 = A(A^TA)^{-1}A^Tb$ is the (unique!) vector in the column space of $A$ which is closest to $b$, i.e., the projection of $b$ onto the column space of $A$. However, taking transposes, multiplying, and inverting is not what we would like to do numerically.
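For a small, well-conditioned example the two formulas agree; a quick check:

```python
import numpy as np

A = np.array([[1., 0., 0.],
              [1., 1., 0.],
              [1., 1., 1.],
              [1., 1., 1.]])

# Projection via the normal-equations formula (fine for small, well-conditioned A)
P_normal = A @ np.linalg.inv(A.T @ A) @ A.T

# Projection via the QR decomposition
Q, R = np.linalg.qr(A)
P_qr = Q @ Q.T

print(np.allclose(P_normal, P_qr))  # True
```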
Singular Value Decomposition¶
The SVD is a very important matrix decomposition in both data science and linear algebra.
Theorem. For any $n \times p$ matrix $X$, there exist an orthogonal $n \times n$ matrix $U$, an orthogonal $p \times p$ matrix $V$, and a diagonal $n \times p$ matrix $\Sigma$ with non-negative entries such that $$ X = U\Sigma V^T. $$
- The columns of $U$ are the left singular vectors.
- The columns of $V$ are the right singular vectors.
- $\Sigma$ has singular values $\sigma_1 \geq \sigma_2 \geq \cdots \geq \sigma_r > 0$ on its diagonal, where $r$ is the rank of $X$.
Remark. The SVD is clearly a generalization of matrix diagonalization, but it also generalizes the polar decomposition of a matrix. Recall that every $n \times n$ matrix $A$ can be written as $A = UP$ where $U$ is orthogonal (or unitary) and $P$ is a positive matrix. This is because if $$ A = U_0\Sigma V^T $$ is the SVD for $A$, then $\Sigma$ is an $n \times n$ diagonal matrix with non-negative entries, hence any orthogonal conjugate of it is positive, and so $$ A = (U_0V^T)(V\Sigma V^T). $$ Take $U = U_0V^T$ and $P = V\Sigma V^T$.
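The algebra in this remark is easy to check numerically. A sketch on a small, arbitrarily chosen matrix:

```python
import numpy as np

A = np.array([[1., 2.],
              [0., 1.]])

# SVD: A = U0 Sigma V^T
U0, S, Vh = np.linalg.svd(A)
V = Vh.T

# Polar decomposition: U = U0 V^T is orthogonal, P = V Sigma V^T is positive
U = U0 @ Vh
P = V @ np.diag(S) @ Vh

print(np.allclose(U @ P, A))            # True
print(np.allclose(U.T @ U, np.eye(2)))  # True
```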
By hand, the algorithm for computing an SVD is as follows.
- Both $AA^T$ and $A^TA$ are symmetric (they are positive, in fact), and so they can be orthogonally diagonalized: one can form an orthonormal basis of eigenvectors. Let $v_1,\dots,v_p$ be an orthonormal basis of eigenvectors for $\mathbb{R}^p$ corresponding to the eigenvalues $\lambda_1 \geq \cdots \geq \lambda_p \geq 0$ of $A^TA$ in decreasing order, and set $\sigma_i = \sqrt{\lambda_i}$. Suppose that $A^TA$ has $r$ non-zero eigenvalues. Let $V$ be the matrix whose columns are the $v_i$'s. This gives our right singular vectors and our singular values.
- Let $u_i = \frac{1}{\sigma_i}Av_i$ for $i = 1,\dots,r$, and extend this collection of vectors to an orthonormal basis for $\mathbb{R}^n$ if necessary. Let $U$ be the corresponding matrix.
- Let $\Sigma$ be the $n \times p$ matrix whose diagonal entries are $\sigma_1 \geq \sigma_2 \geq \cdots \geq \sigma_r$, and then zeroes if necessary.
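These three steps can be sketched directly in numpy using np.linalg.eigh to diagonalize the symmetric matrix $A^TA$. This is for illustration only (as noted below, in practice one avoids forming $A^TA$), and the sketch skips the "extend to an orthonormal basis" step, returning only the first $r$ columns of $U$; the relative cutoff `rtol` is an illustrative choice.

```python
import numpy as np

def svd_by_hand(A, rtol=1e-6):
    """Sketch of the textbook SVD algorithm via eigenvectors of A^T A.

    For illustration only -- not numerically robust.
    """
    n, p = A.shape
    # Step 1: orthogonally diagonalize A^T A; sort eigenvalues in decreasing order
    eigvals, V = np.linalg.eigh(A.T @ A)
    order = np.argsort(eigvals)[::-1]
    eigvals, V = eigvals[order], V[:, order]
    # The singular values are the square roots of the eigenvalues of A^T A
    sigma = np.sqrt(np.clip(eigvals, 0.0, None))
    # Treat singular values below a relative tolerance as zero
    r = int(np.sum(sigma > rtol * sigma[0]))
    # Step 2: u_i = (1/sigma_i) A v_i for i = 1, ..., r
    U_r = A @ V[:, :r] / sigma[:r]
    # Step 3: an n x p "diagonal" matrix holding the singular values
    Sigma = np.zeros((n, p))
    Sigma[:r, :r] = np.diag(sigma[:r])
    return U_r, Sigma, V

A = np.array([[3., 2., 2.],
              [2., 3., -2.]])
U_r, Sigma, V = svd_by_hand(A)
print(np.diag(Sigma))  # the singular values, 5 and 3
```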
Example. Let us compute the SVD of $$ A = \begin{bmatrix} 3 & 2 & 2 \\ 2 & 3 & -2 \end{bmatrix}. $$ First we note that $$ A^TA = \begin{bmatrix} 13 & 12 & 2 \\ 12 & 13 & -2 \\ 2 & -2 & 8 \end{bmatrix}, $$ which has eigenvalues $25,9,0$ with corresponding eigenvectors $$ \begin{bmatrix} 1 \\ 1 \\ 0 \end{bmatrix}, \begin{bmatrix} 1 \\ -1 \\ 4 \end{bmatrix}, \begin{bmatrix} -2 \\ 2 \\ 1 \end{bmatrix}. $$ Normalizing, we get $$ V = \begin{bmatrix} \frac{1}{\sqrt{2}} & \frac{1}{3\sqrt{2}} & -\frac{2}{3} \\ \frac{1}{\sqrt{2}} & -\frac{1}{3\sqrt{2}} & \frac{2}{3} \\ 0 & \frac{4}{3\sqrt{2}} & \frac{1}{3} \end{bmatrix}. $$ Now we set $u_1 = \frac{1}{5}Av_1$ and $u_2 = \frac{1}{3}Av_2$ to get $$ U = \begin{bmatrix} \frac{1}{\sqrt{2}} & \frac{1}{\sqrt{2}} \\ \frac{1}{\sqrt{2}} & -\frac{1}{\sqrt{2}} \end{bmatrix}. $$ So $$ A = \begin{bmatrix} \frac{1}{\sqrt{2}} & \frac{1}{\sqrt{2}} \\ \frac{1}{\sqrt{2}} & -\frac{1}{\sqrt{2}} \end{bmatrix} \begin{bmatrix} 5 & 0 & 0 \\ 0 & 3 & 0 \end{bmatrix} \begin{bmatrix} \frac{1}{\sqrt{2}} & \frac{1}{3\sqrt{2}} & -\frac{2}{3} \\ \frac{1}{\sqrt{2}} & -\frac{1}{3\sqrt{2}} & \frac{2}{3} \\ 0 & \frac{4}{3\sqrt{2}} & \frac{1}{3} \end{bmatrix}^T $$ is our SVD decomposition.
We note that in practice, we avoid the computation of $X^TX$ because if the entries of $X$ have errors, then these errors will be squared in $X^TX$. There are better computational tools to get singular values and singular vectors which are more accurate. This is what our python tools will use.
Let's use numpy.linalg.svd for the above matrix.
import numpy as np
#Define our matrix
A = np.array([[3,2,2],[2,3,-2]])
# Take the SVD
U, S, Vh = np.linalg.svd(A)
Our SVD matrices are
print(f"U = {U}\n\nS = {S}\n\nVh.T = {Vh.T}")
U = [[-0.70710678 -0.70710678]
 [-0.70710678  0.70710678]]

S = [5. 3.]

Vh.T = [[-7.07106781e-01 -2.35702260e-01 -6.66666667e-01]
 [-7.07106781e-01  2.35702260e-01  6.66666667e-01]
 [-6.47932334e-17 -9.42809042e-01  3.33333333e-01]]
Because the eigenvalues of the hermitian squares of $$ \begin{bmatrix} 1 & 1 & 1\\ 0 & 1 & 1 \\ 0 & 0 & 1 \\ 0 & 0 & 0 \end{bmatrix} \text{ and } \begin{bmatrix} 1 & 0 & 0 \\ 1 & 1 & 0 \\ 1 & 1 & 1 \\ 1 & 1 & 1 \end{bmatrix} $$ are quite atrocious, an exact SVD decomposition is difficult to compute by hand. However, we can of course use python.
import numpy as np
# Define our matrices
A = np.array([[1,1,1],[0,1,1],[0,0,1],[0,0,0]])
B = np.array([[1,0,0],[1,1,0],[1,1,1],[1,1,1]])
# SVD decomposition
U_A, S_A, Vh_A = np.linalg.svd(A)
U_B, S_B, Vh_B = np.linalg.svd(B)
The resulting matrices are
print(f"U_A = {U_A}\n\nS_A = {S_A}\n\nVh_A.T = {Vh_A.T}\n\nU_B = {U_B}\n\nS_B = {S_B}\n\nVh_B.T = {Vh_B.T}")
U_A = [[ 0.73697623  0.59100905  0.32798528  0.        ]
 [ 0.59100905 -0.32798528 -0.73697623  0.        ]
 [ 0.32798528 -0.73697623  0.59100905  0.        ]
 [ 0.          0.          0.          1.        ]]

S_A = [2.2469796  0.80193774 0.55495813]

Vh_A.T = [[ 0.32798528  0.73697623  0.59100905]
 [ 0.59100905  0.32798528 -0.73697623]
 [ 0.73697623 -0.59100905  0.32798528]]

U_B = [[-2.41816250e-01  7.12015746e-01 -6.59210496e-01  0.00000000e+00]
 [-4.52990541e-01  5.17957311e-01  7.25616837e-01  6.71536163e-17]
 [-6.06763739e-01 -3.35226641e-01 -1.39502200e-01 -7.07106781e-01]
 [-6.06763739e-01 -3.35226641e-01 -1.39502200e-01  7.07106781e-01]]

S_B = [2.8092118  0.88646771 0.56789441]

Vh_B.T = [[-0.67931306  0.63117897 -0.37436195]
 [-0.59323331 -0.17202654  0.7864357 ]
 [-0.43198148 -0.75632002 -0.49129626]]
A final note: the operator norm of a matrix $A$ agrees with its largest singular value.
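We can check this for the $2 \times 3$ matrix from the worked SVD example, whose largest singular value is 5:

```python
import numpy as np

A = np.array([[3., 2., 2.],
              [2., 3., -2.]])

# The operator (spectral) norm, ord=2, equals the largest singular value
print(np.linalg.norm(A, ord=2))               # 5.0
print(np.linalg.svd(A, compute_uv=False)[0])  # 5.0
```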
Pseudoinverses and using the SVD¶
The SVD can be used to determine a least-squares solution for a given system. Recall that if $v_1,\dots,v_p$ is an orthonormal basis for $\mathbb{R}^p$ consisting of eigenvectors of $A^TA$, arranged so that the corresponding singular values satisfy $\sigma_1 \geq \sigma_2 \geq \cdots \geq \sigma_r > 0$, then $\{Av_1,\dots,Av_r\}$ is an orthogonal basis for the column space of $A$. In essence, this means that when we have our left singular vectors $u_1,\dots,u_n$ (constructed by the algorithm above), the first $r$ vectors form an orthonormal basis for the column space of $A$, and the remaining $n - r$ vectors form an orthonormal basis for the perp of the column space of $A$ (which is also equal to the nullspace of $A^T$).
Definition. Let $A$ be an $n \times p$ matrix and suppose that the rank of $A$ is $r \leq \min\{n,p\}$. Suppose that $A = U\Sigma V^T$ is the SVD, where the singular values are decreasing. Partition $$ U = \begin{bmatrix} U_r & U_{n-r} \end{bmatrix} \text{ and } V = \begin{bmatrix} V_r & V_{p-r} \end{bmatrix} $$ into submatrices, where $U_r$ and $V_r$ are the matrices whose columns are the first $r$ columns of $U$ and $V$ respectively. So $U_r$ is $n \times r$ and $V_r$ is $p \times r$. Let $D$ be the diagonal $r \times r$ matrix whose diagonal entries are $\sigma_1,\dots, \sigma_r$, so that $$ \Sigma = \begin{bmatrix} D & 0 \\ 0 & 0 \end{bmatrix} $$ and note that $$ A = U_rDV_r^T. $$ We call this the reduced singular value decomposition of $A$. Note that $D$ is invertible, and its inverse is simply $$ D^{-1} = \begin{bmatrix} \sigma_1^{-1} \\ & \sigma_2^{-1} \\ & & \ddots \\ & & & \sigma_r^{-1} \end{bmatrix}. $$ The pseudoinverse (or Moore-Penrose inverse) of $A$ is the matrix $$ A^+ = V_rD^{-1}U_r^T. $$
We note that the pseudoinverse $A^+$ is a $p \times n$ matrix.
With the pseudoinverse, we can actually find least-squares solutions quite easily. Indeed, if we are looking for the least-squares solution to the system $Ax = b$, define $$ x_0 = A^+b. $$ Then $$ \begin{split} Ax_0 &= (U_rDV_r^T)(V_rD^{-1}U_r^Tb) \\ &= U_rDD^{-1}U_r^Tb \\ &= U_rU_r^Tb \end{split} $$ As mentioned before, the columns of $U_r$ form an orthonormal basis for the column space of $A$ and so $U_rU_r^T$ is the orthogonal projection onto the range of $A$. That is, $Ax_0$ is precisely the projection of $b$ onto the column space of $A$, meaning that this yields a least-squares solution. This gives the following.
Theorem. Let $A$ be an $n \times p$ matrix and $b \in \mathbb{R}^n$. Then $$ x_0 = A^+b$$ is a least-squares solution to $Ax = b$.
Taking pseudoinverses is quite involved. We'll do one example by hand, and then use python -- and we'll see something go wrong! There is a function numpy.linalg.pinv in numpy that will take a pseudoinverse. We can also just use numpy.linalg.svd and do the process above.
Example. We have the following SVD $A = U\Sigma V^T$. $$ \begin{bmatrix} 1 & 1 & 2\\ 0 & 1 & 1 \\ 1 & 0 & 1 \\ 0 & 0 & 0 \end{bmatrix} = \begin{bmatrix} \sqrt{\frac{2}{3}} & 0 & 0 & -\frac{1}{\sqrt{3}} \\ \frac{1}{\sqrt{6}} & \frac{1}{\sqrt{2}} & 0 & \frac{1}{\sqrt{3}} \\ \frac{1}{\sqrt{6}} & -\frac{1}{\sqrt{2}} & 0 & \frac{1}{\sqrt{3}} \\ 0 & 0 & 1 & 0 \end{bmatrix} \begin{bmatrix} 3 & 0 & 0 \\ 0 & 1 & 0 \\ 0 & 0 & 0 \\ 0 & 0 & 0 \end{bmatrix}\begin{bmatrix} \frac{1}{\sqrt{6}} & -\frac{1}{\sqrt{2}} & -\frac{1}{\sqrt{3}} \\ \frac{1}{\sqrt{6}} & \frac{1}{\sqrt{2}} & -\frac{1}{\sqrt{3}} \\ \sqrt{\frac{2}{3}} & 0 & \frac{1}{\sqrt{3}} \end{bmatrix}^T. $$ Can we find a least-squares solution to $Ax = b$, where $$ b = \begin{bmatrix} 1 \\ 1 \\ 1 \\ 1 \end{bmatrix}? $$ The pseudoinverse of $A$ is $$ \begin{split} A^+ &= \begin{bmatrix} \frac{1}{\sqrt{6}} & -\frac{1}{\sqrt{2}} \\ \frac{1}{\sqrt{6}} & \frac{1}{\sqrt{2}} \\ \sqrt{\frac{2}{3}} & 0 \end{bmatrix} \begin{bmatrix} \frac{1}{3} \\ & 1 \end{bmatrix} \begin{bmatrix} \sqrt{\frac{2}{3}} & 0 \\ \frac{1}{\sqrt{6}} & \frac{1}{\sqrt{2}} \\ \frac{1}{\sqrt{6}} & -\frac{1}{\sqrt{2}} \\ 0 & 0 \end{bmatrix}^T \\ &= \begin{bmatrix} \frac{1}{9} & -\frac{4}{9} & \frac{5}{9} & 0 \\ \frac{1}{9} & \frac{5}{9} & -\frac{4}{9} & 0 \\ \frac{2}{9} & \frac{1}{9} & \frac{1}{9} & 0\end{bmatrix}, \end{split} $$ and so a least-squares solution is given by $$ \begin{split} x_0 &= A^+b \\ &= \begin{bmatrix} \frac{1}{9} & -\frac{4}{9} & \frac{5}{9} & 0 \\ \frac{1}{9} & \frac{5}{9} & -\frac{4}{9} & 0 \\ \frac{2}{9} & \frac{1}{9} & \frac{1}{9} & 0\end{bmatrix}\begin{bmatrix} 1 \\ 1 \\ 1 \\ 1 \end{bmatrix} \\ &= \begin{bmatrix} \frac{2}{9} \\ \frac{2}{9} \\ \frac{4}{9} \end{bmatrix}. \end{split} $$
Now let's do this with python, and see an example of how things can go wrong. We'll try to take the pseudoinverse manually first.
import numpy as np
# Create our matrix A and our target b
A = np.array([[1,1,2],[0,1,1],[1,0,1],[0,0,0]])
b = np.array([[1],[1],[1],[1]])
# Take the SVD decomposition
U, S, Vh = np.linalg.svd(A)
# Prepare the pseudoinverse
# Recall that we invert the non-zero diagonal entries of the diagonal matrix.
# So we first build S_inv to be the appropriate size
S_inv = np.zeros((Vh.shape[0], U.shape[0]))
# We then fill in the appropriate values on the diagonal
S_inv[:len(S), :len(S)] = np.diag(1/S)
# Build the pseudoinverse
A_pinv = Vh.T @ S_inv @ U.T
# Compute the least-squares solution
beta = A_pinv @ b
What is the result?
beta
array([[ 2.74080345e+15],
[ 2.74080345e+15],
[-2.74080345e+15]])
This is WAY off the mark. So what happened? Well, when we look at our singular values, we have
S
array([3.00000000e+00, 1.00000000e+00, 1.21618839e-16])
As we computed this decomposition numerically, the last singular value comes out non-zero but tiny, even though we know that the rank of A is 2, so its true value is zero. When we invert the singular values and place them on the diagonal, we get 1/1.21618839e-16, which is an enormous value, and this value then corrupts the rest of the computation. So how do we fix this? One can set tolerances in numpy, but we'll get to that later. For now, just note that numpy.linalg.pinv already incorporates such a tolerance. Let's see what we get.
import numpy as np
# Create our matrix A and our target b
A = np.array([[1,1,2],[0,1,1],[1,0,1],[0,0,0]])
b = np.array([[1],[1],[1],[1]])
# Build the pseudoinverse
A_pinv = np.linalg.pinv(A)
# Compute the least-squares solution
beta = A_pinv @ b
print(f"A_pinv={A_pinv}\n\nbeta={beta}")
A_pinv=[[ 0.11111111 -0.44444444  0.55555556  0.        ]
 [ 0.11111111  0.55555556 -0.44444444  0.        ]
 [ 0.22222222  0.11111111  0.11111111  0.        ]]

beta=[[0.22222222]
 [0.22222222]
 [0.44444444]]
The Condition Number¶
Numerical calculations involving matrix equations are quite reliable if we use the SVD. This is because the orthogonal matrices $U$ and $V$ preserve lengths and angles, leaving the stability of the problem to be governed by the singular values of the matrix $X$. Recall that if $X = U\Sigma V^T$, then solving the least-squares problem involves dividing by the non-zero singular values $\sigma_i$ of $X$. If these values are very small, their inverses become very large, and this will amplify any numerical errors.
Definition. Let $X$ be an $n \times p$ matrix and let $\sigma_1 \geq \cdots \geq \sigma_r$ be the non-zero singular values of $X$. The condition number of $X$ is the quotient $$ \kappa(X) = \frac{\sigma_1}{\sigma_r} $$ of the largest and smallest non-zero singular values.
A condition number close to 1 indicates a well-conditioned problem, while a large condition number indicates that small perturbations in data may lead to large changes in computation. Geometrically, $\kappa(X)$ measures how much $X$ distorts space.
Example. Consider the matrices $$ A = \begin{bmatrix} 1 \\ & 1 \end{bmatrix} \text{ and } B = \begin{bmatrix} 1 \\ & \frac{1}{10^6} \end{bmatrix}. $$ The condition numbers are $$ \kappa(A) = 1 \text{ and } \kappa(B) = 10^6. $$ Inverting $B$ involves dividing by $\frac{1}{10^6}$, which will amplify errors by a factor of $10^6$.
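We can confirm these condition numbers with numpy.linalg.cond:

```python
import numpy as np

# The two diagonal matrices from the example
A = np.eye(2)
B = np.diag([1.0, 1e-6])

print(np.linalg.cond(A))  # 1.0
print(np.linalg.cond(B))  # ~1e6
```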
Let's look at our main example in python by using numpy.linalg.cond.
import numpy as np
import pandas as pd
# First let us make a dictionary incorporating our data.
# Each entry corresponds to a column (feature of our data)
data = {
'Square ft': [1600, 2100, 1550, 1600, 2000],
'Bedrooms': [3, 4, 2, 3, 4],
'Price': [500, 650, 475, 490, 620]
}
# Create a pandas DataFrame
df = pd.DataFrame(data)
# Create our matrix X
X = df[['Square ft', 'Bedrooms']].to_numpy()
# Check the condition number
cond_X = np.linalg.cond(X)
Let's see what we got.
cond_X
np.float64(4329.082589067693)
So this is quite a high condition number! This should be unsurprising, as the number of bedrooms is clearly correlated with the size of a house (especially so in our small toy example).