Numerical Linear Algebra: Householder a'la Golub and Van Loan

numerical linear algebra householder

Exploring properties of Householder transformations.

Dustin Lennon
April 2021
https://dlennon.org/20210427_householder

April 2021

Abstract

This is a document for exploring properties of Householder transformations.

import numpy as np
from pydlennon.contexts.seeded_rng import SeededRng

np.set_printoptions( precision=3, linewidth = 132, suppress = True )

m = 8
n = 6

I_m = np.identity(m)
I_n = np.identity(n)

with SeededRng(111) as s:
    data = s.negative_binomial(10, 0.25, size=m*n)    
    A = np.array(data, dtype=np.float64).reshape((m,n))
    
    data = s.negative_binomial(10, 0.25, size=n*n)
    B = np.array(data, dtype=np.float64).reshape((n,n))
    
    data = s.negative_binomial(10, 0.25, size=n*n)
    Z,_ = np.linalg.qr(
            np.array(data, dtype=np.float64).reshape((n,n))    
    )

def house(x):
    """
    Golub and Van Loan, 3rd Ed.  
    Algorithm 5.1.1
    """
    n = len(x)
    sigma = x[1:] @ x[1:]
    v = np.concatenate([[1], x[1:]])

    if sigma == 0:
        beta = 0
    else:
        mu = np.sqrt(x[0]**2 + sigma)
        if x[0] <= 0:
            v[0] = x[0] - mu
        else:
            v[0] = -sigma / (x[0] + mu)
        beta = 2 * v[0]**2 / (sigma + v[0]**2)
        v = v/v[0]
    
    return(v, beta)

x = A[:,0]

v,beta = house( x ) 
P = (I_m - beta * np.outer(v,v))

P @ x

array([102.113,   0.   ,  -0.   ,   0.   ,  -0.   ,  -0.   ,  -0.   ,   0.   ])

R = A.copy()

V = np.identity(m)
Beta = np.zeros(n)

for j in range(n):
    x = R[j:,j]
    v,beta = house( x ) 

    s = np.s_[j:,j:]
    
    # Atmp = P @ Atmp 
    w = beta * R[s].T @ v
    R[s] = R[s] - np.outer(v,w)
    
    # Factored form representation
    Beta[j] = beta
    V[j,j] = 1.0 
    V[j+1:,j] = v[1:]

# Reconstruct Q from factored form; backward accumulation
Q = I_m.copy()
for j in range(n)[::-1]:
    v = V[j:,j].copy()
    beta = Beta[j]

    s = np.s_[j:,j:]
    P = np.identity(m-j) - beta * np.outer(v,v)
    Q[s] = P @ Q[s]  # Q_1 ... Q_k ... Q_n

(Q.T @ A, Q @ R)

(array([[102.113,  75.671,  65.506,  74.163,  47.115,  94.631],
        [  0.   ,  65.642,  41.91 ,  42.107,  28.85 ,  30.943],
        [ -0.   ,  -0.   ,  54.419,   2.924,  12.635,   8.219],
        [ -0.   ,  -0.   ,  -0.   ,  28.023,  10.352,   8.562],
        [  0.   ,  -0.   ,   0.   ,  -0.   ,  14.215, -18.268],
        [ -0.   ,  -0.   ,  -0.   ,  -0.   ,   0.   ,  18.734],
        [  0.   ,   0.   ,  -0.   ,  -0.   ,  -0.   ,  -0.   ],
        [ -0.   ,  -0.   ,   0.   ,   0.   ,   0.   ,   0.   ]]),
 array([[26., 26., 26., 22., 17., 14.],
        [50., 21., 15., 23., 15., 46.],
        [11., 40., 32., 39., 21., 30.],
        [27., 60., 29., 26., 18., 40.],
        [42., 22., 63., 20., 25., 34.],
        [29., 41., 20., 44., 34., 25.],
        [60., 23.,  5., 35., 10., 47.],
        [14., 32., 43., 36., 19., 44.]]))

Hessenberg Reduction

B0 = Z.T @ B @ Z
# B0 = B
Btmp = B0.copy()
U = I_n.copy()

for k in range(n-2):
    v,beta = house(Btmp[k+1:n, k])
    vp = np.pad(v, (k+1,0))
    P = I_n - beta * np.outer(vp,vp)
    Btmp = P.T @ Btmp @ P
    U = U @ P
    
H = U.T @ B0 @ U    
(B0, H)

(array([[164.533,  37.299,  36.604, -17.722,  30.584, -27.13 ],
        [ 39.477,  16.303,   3.115, -10.634,   3.408, -10.418],
        [ 24.111,  29.105,  14.486,   9.866,   9.773,  12.609],
        [ -2.569,   4.244,   1.124,   8.255,  -5.707, -10.352],
        [ 12.692,  12.145,  -3.231,  -6.987,   2.092,  20.604],
        [-13.23 , -18.403,  11.126,  11.049, -16.502,  -0.67 ]]),
 array([[164.533,  63.174,   3.406, -20.94 ,  13.669,   9.417],
        [ 49.825,  32.936, -18.525,   6.785,   4.039,   1.218],
        [  0.   ,  17.621,  -0.586,   9.554,   2.336, -14.628],
        [ -0.   ,  -0.   ,  25.482,  -1.78 ,  -9.527,  -1.698],
        [ -0.   ,   0.   ,   0.   ,  24.062,  10.328,  -2.967],
        [ -0.   ,  -0.   ,   0.   ,  -0.   ,   9.138,  -0.432]]))

e1 = np.zeros(n)
e1[0] = 1
(Z @ e1, Z @ U @ e1, U @ e1)

(array([-0.548, -0.43 , -0.252, -0.548, -0.296, -0.252]),
 array([-0.548, -0.43 , -0.252, -0.548, -0.296, -0.252]),
 array([1., 0., 0., 0., 0., 0.]))

Dustin Lennon

Applied Scientist
dlennon.org

Abstract

Abstract

Hessenberg Reduction

Hessenberg Reduction

Dustin Lennon

Applied Scientist
dlennon.org

Dustin Lennon

Applied Scientist dlennon.org

Abstract

Abstract

Hessenberg Reduction

Hessenberg Reduction

Dustin Lennon

Applied Scientist dlennon.org

Applied Scientist
dlennon.org

Applied Scientist
dlennon.org