# Orthonormal basis for N = 2: the normalized "sum" and "difference" vectors.
basis = (1/sqrt(2) * array([1, 1]), 1/sqrt(2) * array([1, -1]))

# Print the outer product of every ordered pair of basis vectors.
# print(...) with a single argument behaves the same under Python 2 and 3,
# whereas the bare print statement is a SyntaxError on Python 3.
for i in [0, 1]:
    for j in [0, 1]:
        print("{}, {} :".format(i, j))
        print(outer(basis[i], basis[j]))
        print("")

0, 0 :
[[ 0.5  0.5]
 [ 0.5  0.5]]

0, 1 :
[[ 0.5 -0.5]
 [ 0.5 -0.5]]

1, 0 :
[[ 0.5  0.5]
 [-0.5 -0.5]]

1, 1 :
[[ 0.5 -0.5]
 [-0.5  0.5]]


# The 8 x 8 DCT matrix thus looks like this.
# Row u holds the u-th cosine basis vector sampled at the N half-integer
# points x + 0.5.
N = 8
dct = zeros((N, N))

# Row 0 is the constant vector; it takes an extra 1/sqrt(2) factor.
for x in range(N):
    dct[0, x] = sqrt(2.0/N) / sqrt(2.0)

# range() rather than the Python-2-only xrange(): same iteration, and the
# cell also runs on Python 3.
for u in range(1, N):
    for x in range(N):
        dct[u, x] = sqrt(2.0/N) * cos((pi/N) * u * (x + 0.5))

np.set_printoptions(precision=3)
dct

array([[ 0.354,  0.354,  0.354,  0.354,  0.354,  0.354,  0.354,  0.354],
       [ 0.49 ,  0.416,  0.278,  0.098, -0.098, -0.278, -0.416, -0.49 ],
       [ 0.462,  0.191, -0.191, -0.462, -0.462, -0.191,  0.191,  0.462],
       [ 0.416, -0.098, -0.49 , -0.278,  0.278,  0.49 ,  0.098, -0.416],
       [ 0.354, -0.354, -0.354,  0.354,  0.354, -0.354, -0.354,  0.354],
       [ 0.278, -0.49 ,  0.098,  0.416, -0.416, -0.098,  0.49 , -0.278],
       [ 0.191, -0.462,  0.462, -0.191, -0.191,  0.462, -0.462,  0.191],
       [ 0.098, -0.278,  0.416, -0.49 ,  0.49 , -0.416,  0.278, -0.098]])


# Here's what they look like.
# One subplot per row of the DCT matrix, arranged in a 4 x 2 grid; each row is
# drawn as a line with its sample points overlaid using the 'ro' format.
figure(figsize=(9,12))
for u in range(N):  # range() instead of the Python-2-only xrange()
    subplot(4, 2, u+1)
    ylim((-1, 1))
    title(str(u))
    plot(dct[u, :])
    plot(dct[u, :], 'ro')


def rowdot(i,j):
    """Return the dot product of rows i and j of the DCT matrix."""
    row_i = dct[i, :]
    row_j = dct[j, :]
    return dot(row_i, row_j)

# Two rows dotted with themselves, followed by three pairs of distinct rows.
rowdot(0,0), rowdot(3,3), rowdot(0,3), rowdot(1, 7), rowdot(1,5)

(0.99999999999999978,
 0.99999999999999989,
 5.5511151231257827e-17,
 1.9428902930940239e-16,
 -2.4980018054066022e-16)


# The transpose of the DCT matrix: rows and columns swapped.
dct_transpose = dct.T
dct_transpose

array([[ 0.354,  0.49 ,  0.462,  0.416,  0.354,  0.278,  0.191,  0.098],
       [ 0.354,  0.416,  0.191, -0.098, -0.354, -0.49 , -0.462, -0.278],
       [ 0.354,  0.278, -0.191, -0.49 , -0.354,  0.098,  0.462,  0.416],
       [ 0.354,  0.098, -0.462, -0.278,  0.354,  0.416, -0.191, -0.49 ],
       [ 0.354, -0.098, -0.462,  0.278,  0.354, -0.416, -0.191,  0.49 ],
       [ 0.354, -0.278, -0.191,  0.49 , -0.354, -0.098,  0.462, -0.416],
       [ 0.354, -0.416,  0.191,  0.098, -0.354,  0.49 , -0.462,  0.278],
       [ 0.354, -0.49 ,  0.462, -0.416,  0.354, -0.278,  0.191, -0.098]])


# Is the dot product of dct and its transpose the identity?
maybe_identity = dct.dot(dct_transpose)

# The numerical result contains many nearly-zero values such as 3.2334e-17,
# so the output looks much nicer if we round them all off to (say) 6 places.
roundoff = vectorize(lambda entry: round(entry, 6))
roundoff(maybe_identity)

array([[ 1.,  0., -0.,  0.,  0.,  0., -0., -0.],
       [ 0.,  1.,  0., -0.,  0., -0.,  0.,  0.],
       [-0.,  0.,  1.,  0., -0.,  0.,  0.,  0.],
       [ 0., -0.,  0.,  1.,  0.,  0., -0.,  0.],
       [ 0.,  0., -0.,  0.,  1.,  0., -0., -0.],
       [ 0., -0.,  0.,  0.,  0.,  1.,  0., -0.],
       [-0.,  0.,  0., -0., -0.,  0.,  1.,  0.],
       [-0.,  0.,  0.,  0., -0., -0.,  0.,  1.]])


# See http://matplotlib.org/users/image_tutorial.html for the image manipulation syntax.
# The image itself is a small piece from http://www.cordwainer-smith.com/virgil_finlay.htm.
from matplotlib import image as mpimg

# Read the JPEG into an array, then display it with array index [0, 0]
# placed at the lower-left corner of the axes (origin='lower').
img = mpimg.imread('stormplanet112.jpg')
p = plt.imshow(img, origin='lower')


# The image array has 3 dimensions: rows, columns, and colors.
img.shape

(112, 112, 3)


tiny = img[40:48, 40:48, 0]    # a tiny 8 x 8 block, in the color=0 (Red) channel

def show_image(img):
    """Display the array `img` with plt.imshow and add a colorbar to the plot.

    Note that the parameter shadows the module-level `img` inside this function.
    """
    plt.imshow(img)
    plt.colorbar()

show_image(tiny)


# And here are the numbers.
tiny

array([[ 24, 147, 212, 216, 209, 223, 156,  74],
       [ 47,  33, 179, 221, 201, 230, 164,  95],
       [ 20,  73, 201, 235, 215, 219, 175, 109],
       [140, 181, 215, 217, 197, 192, 142,  95],
       [204, 235, 206, 195, 204, 208, 192, 159],
       [208, 187, 217, 226, 222, 216, 209, 173],
       [203, 234, 225, 211, 204, 185, 232, 227],
       [155, 143, 150, 193, 204, 177, 178, 195]], dtype=uint8)


def doDCT(grid):
    """Return the 2-D DCT of grid, computed as dct . grid . dct_transpose."""
    left_applied = dot(dct, grid)
    return dot(left_applied, dct_transpose)

def undoDCT(grid):
    """Return dct_transpose . grid . dct, the matrix product that reverses doDCT."""
    left_applied = dot(dct_transpose, grid)
    return dot(left_applied, dct)

# test : do DCT, then undo DCT; should get back the same image.
# (The round trip goes through floating-point matrix products, so the result
# is a float array rather than the uint8 array we started with.)
tiny_do_undo = undoDCT(doDCT(tiny))

show_image(tiny_do_undo) # Yup, looks the same.


# And the numbers are the same.
tiny_do_undo

array([[  24.,  147.,  212.,  216.,  209.,  223.,  156.,   74.],
       [  47.,   33.,  179.,  221.,  201.,  230.,  164.,   95.],
       [  20.,   73.,  201.,  235.,  215.,  219.,  175.,  109.],
       [ 140.,  181.,  215.,  217.,  197.,  192.,  142.,   95.],
       [ 204.,  235.,  206.,  195.,  204.,  208.,  192.,  159.],
       [ 208.,  187.,  217.,  226.,  222.,  216.,  209.,  173.],
       [ 203.,  234.,  225.,  211.,  204.,  185.,  232.,  227.],
       [ 155.,  143.,  150.,  193.,  204.,  177.,  178.,  195.]])


# The DCT coefficients of the tiny block.
tinyDCT = doDCT(tiny)
show_image(tinyDCT)


# Widen the printed output (default line width is 75) so each row fits on one line.
set_printoptions(linewidth=100)

# Despite its name, round6 formats each entry as a string that is 6 characters
# wide with 1 digit after the decimal point.
round6 = vectorize(lambda coeff: format(coeff, '6.1f'))
round6(tinyDCT)

array([['1429.2', ' -55.9', '-241.7', '  -9.0', ' -54.7', '  31.9', '   9.7', '   0.1'],
       ['-152.3', ' -58.3', '-201.2', '  -4.0', ' -64.9', '  24.0', '  35.8', ' -10.9'],
       [' -54.2', ' -74.9', ' -27.0', ' -15.7', '   8.3', '  -0.2', '   0.1', '   0.3'],
       ['  92.6', '  59.6', '  48.2', '  12.2', ' -30.1', ' -17.3', ' -16.2', '   0.1'],
       [' -19.7', '  64.2', '  21.0', '  10.9', ' -14.3', ' -44.2', ' -21.1', ' -15.0'],
       ['  35.3', '  41.9', '   0.2', ' -39.1', ' -32.3', ' -21.0', ' -23.1', '   0.2'],
       [' -19.8', ' -26.2', ' -47.4', '  -0.7', '   0.4', '   0.3', '   0.5', '  -0.3'],
       ['  27.9', ' -18.2', '  19.1', ' -20.5', ' -22.5', ' -20.0', ' -21.1', '   0.7']], 
      dtype='|S8')


# First make a copy to work on.
tinyDCT_chopped = tinyDCT.copy()

# Then zero the pieces below the x + u = N line, i.e. every coefficient whose
# row and column indices sum to more than N.  The threshold is written as N
# rather than a literal 8 so that it follows the block size, and range()
# replaces the Python-2-only xrange().
for x in range(N):
    for u in range(N):
        if x + u > N:
            tinyDCT_chopped[x, u] = 0.0

show_image(tinyDCT_chopped)


round6(tinyDCT_chopped)
# Notice all the zeros at the bottom right - those are the chopped high frequencies.
# We've essentially done a "low pass filter" on the spatial frequencies.

array([['1429.2', ' -55.9', '-241.7', '  -9.0', ' -54.7', '  31.9', '   9.7', '   0.1'],
       ['-152.3', ' -58.3', '-201.2', '  -4.0', ' -64.9', '  24.0', '  35.8', ' -10.9'],
       [' -54.2', ' -74.9', ' -27.0', ' -15.7', '   8.3', '  -0.2', '   0.1', '   0.0'],
       ['  92.6', '  59.6', '  48.2', '  12.2', ' -30.1', ' -17.3', '   0.0', '   0.0'],
       [' -19.7', '  64.2', '  21.0', '  10.9', ' -14.3', '   0.0', '   0.0', '   0.0'],
       ['  35.3', '  41.9', '   0.2', ' -39.1', '   0.0', '   0.0', '   0.0', '   0.0'],
       [' -19.8', ' -26.2', ' -47.4', '   0.0', '   0.0', '   0.0', '   0.0', '   0.0'],
       ['  27.9', ' -18.2', '   0.0', '   0.0', '   0.0', '   0.0', '   0.0', '   0.0']], 
      dtype='|S8')


tiny_chopped_float = undoDCT(tinyDCT_chopped)

# Also convert the floats back to uint8, which was the original format.
# Dropping coefficients can push reconstructed values slightly outside 0..255,
# and a float -> uint8 cast of an out-of-range value is not well defined (it
# typically wraps around), so clamp to the valid range first.  astype()
# truncates the fractional part just as uint8(x) did, so in-range values
# convert exactly as before.
tiny_chopped = tiny_chopped_float.clip(0, 255).astype(uint8)

show_image(tiny_chopped)


tiny_chopped

array([[ 39, 119, 222, 223, 202, 226, 154,  73],
       [ 25,  71, 171, 206, 204, 226, 167,  96],
       [ 21,  72, 188, 241, 225, 221, 168, 107],
       [146, 173, 222, 219, 186, 181, 149, 100],
       [210, 217, 213, 197, 203, 217, 195, 147],
       [193, 212, 214, 213, 222, 214, 205, 181],
       [212, 220, 218, 220, 210, 188, 216, 232],
       [152, 145, 153, 190, 199, 173, 191, 188]], dtype=uint8)

The DCT (Discrete Cosine Transform)

The basic linear algebra with N = 2

quick quiz 1

the matrix math

quick quiz 2

two dimensions

quick quiz

N = 8

playing with a real image

conclusions