import math; import PIL; from PIL import Image; import numpy as np; import matplotlib.pyplot as plt


image = Image.open('habitat_67_small.jpg').convert("L")
img_mat = np.asarray(image)
fig = plt.imshow(img_mat, cmap='gray')
fig.axes.get_xaxis().set_visible(False) 
fig.axes.get_yaxis().set_visible(False)


U, s, V = np.linalg.svd(img_mat, full_matrices=True)
s = np.diag(s)

plt.figure(figsize=(15, 10), dpi=40)

plt.subplot(1,2,1)

k = 30
compressed_by_k = U[:, :k] @ s[0:k, :k] @ V[:k, :]

fig = plt.imshow(compressed_by_k, cmap='gray')
fig.axes.get_xaxis().set_visible(False) 
fig.axes.get_yaxis().set_visible(False)

plt.subplot(1,2,2)

k = 10
compressed_by_k = U[:, :k] @ s[0:k, :k] @ V[:k, :]

fig = plt.imshow(compressed_by_k, cmap='gray'); fig.axes.get_xaxis().set_visible(False); fig.axes.get_yaxis().set_visible(False); plt.show()


def print_image(array, colors):
    fig = plt.imshow(array); fig.set_cmap(colors); fig.axes.get_xaxis().set_visible(False); fig.axes.get_yaxis().set_visible(False); plt.show()

output=np.zeros((73,73), dtype=np.float16)
for u in range(0,8): 
    for v in range(0,8): 
        for i in range(0,8): 
            for j in range(0,8):
                output[(9*u)+i+1][(9*v)+j+1] = math.cos(math.pi*u*(2*i+1)*(1/16)) * math.cos(math.pi*v*(2*j+1)*(1/16)) * 127 + 127
print_image(output, 'Greys')


class DCT:

   # scale for inside the sum
   def C(self,i,j):
      if (i==0 and j==0):
         return 1/2 
      elif (i==0 or j==0):
         return 1/math.sqrt(2)
      else:
         return 1

   # Forward DCT (8x8)
   def DCT(self, image_pixels):
      basis_weights=np.zeros((8,8), dtype=np.int16)
      cos_sum=0

      for u in range(0,8):
         for v in range(0,8):
            for i in range(0,8):
               for j in range(0,8):
                  cos_sum += self.C(u,v) * math.cos(math.pi*u*(2*i+1)*(1/16)) * math.cos(math.pi*v*(2*j+1)*(1/16)) * image_pixels[i][j]
            basis_weights[u][v] = (1/4)*cos_sum
            cos_sum = 0

      return basis_weights

   # Inverse DCT
   def IDCT(self, basis_weights):
      image_pixels=np.zeros((8,8), dtype=np.int16)
      cos_sum=0

      for i in range(0,8):
         for j in range(0,8):
            for u in range(0,8):
               for v in range(0,8):
                  cos_sum += self.C(u,v) * math.cos(math.pi*u*(2*i+1)*(1/16)) * math.cos(math.pi*v*(2*j+1)*(1/16)) * basis_weights[u][v]
         
            image_pixels[i][j] = int(round((1/4)*cos_sum, 0))
            cos_sum = 0

      return image_pixels


dct = DCT()
image = np.array([[1+x,2+x,3+x,4+x,5+x,6+x,7+x,8+x] for x in range(0,8)])
coefficients = dct.DCT(image)
new_image = dct.IDCT(coefficients)

print("Original Image:")
print_image(image, 'Greys')
print("Basis weights:")
print(coefficients)

Original Image:

Basis weights:
[[ 64 -18   0  -1   0   0   0   0]
 [-18   0   0   0   0   0   0   0]
 [  0   0   0   0   0   0   0   0]
 [ -1   0   0   0   0   0   0   0]
 [  0   0   0   0   0   0   0   0]
 [  0   0   0   0   0   0   0   0]
 [  0   0   0   0   0   0   0   0]
 [  0   0   0   0   0   0   0   0]]


class Qunatization:
    def __init__(self):
        self.LUMINANCE_TABLE = np.array([[16, 11, 10, 16, 24, 40, 51, 61],[12, 12, 14, 19, 26, 58, 60, 55],[14, 13, 16, 24, 40, 57, 69, 56],[14, 17, 22, 29, 51, 87, 80, 62],[18, 22, 37, 56, 68, 109, 103, 77],[24, 35, 55, 64, 81, 104, 113, 92],[49, 64, 78, 87, 103, 121, 120, 101],[72, 92, 95, 98, 112, 100, 103, 99]])
        self.CHROMINANCE_TABLE = np.array([[17, 18, 24, 47, 99, 99, 99, 99], [18, 21, 26, 66, 99, 99, 99, 99], [24, 26, 56, 99, 99, 99, 99, 99], [47, 66, 99, 99, 99, 99, 99, 99], [99, 99, 99, 99, 99, 99, 99, 99],[99, 99, 99, 99, 99, 99, 99, 99],[99, 99, 99, 99, 99, 99, 99, 99],[99, 99, 99, 99, 99, 99, 99, 99]])
    
    def quantize(self, basis_weight, table):
        quantized_value = np.zeros((8,8), dtype=np.int16)
        for i in range(0,7):
            for j in range(0,7):
                quantized_value[i][j] = round(basis_weight[i][j]/table[i][j], 0)
        return quantized_value

    def unquantize(self, quantized_value, table):
        basis_weight = np.zeros((8,8), dtype=np.int16)
        for i in range(0,7):
            for j in range(0,7):
                basis_weight[i][j] = quantized_value[i][j] * table[i][j]
        return basis_weight


quantizer = Qunatization()
quantized_values = quantizer.quantize(coefficients, quantizer.LUMINANCE_TABLE)
restored_weights = quantizer.unquantize(quantized_values, quantizer.LUMINANCE_TABLE)
restored_image = dct.IDCT(restored_weights)
print("Original Image:")
print_image(image, "Greys")
print("Compressed Image:")
print_image(restored_image, "Greys")

Original Image:

Compressed Image:


class Encoder:
   def entropy_encode(self, mask):
      output = np.zeros(64, dtype=np.int16)
      output[0] = mask[0][0]; i=0; j=1; level=1; loc=1
      while True:
         # level is even, so we are iterating from left to right
         if (level%2==0):
            if (i<8 and j<8):
               output[loc] = mask[i][j]; loc+=1
            i-=1; j+=1
            # move to the next level
            if (i==-1):
               level+=1; i=0; j=level
         # level is odd, so we are iterating from right to left
         else:
            if (i<8 and j<8):
               output[loc] = mask[i][j]; loc+=1
            i+=1; j-=1
            # move to the next level
            if (j==-1):
               level+=1; j=0; i=level
         if (i==7 and j==7):
            output[loc] = mask[i][j]; return output

   def entropy_decode(self, array):
      output = np.zeros((8,8), dtype=np.int16)
      output[0][0] = array[0]; i=0; j=1; level=1; loc=1
      while True:
         # level is even, so we are iterating from left to right
         if (level%2==0):
            if (i<8 and j<8):
               output[i][j] = array[loc]; loc+=1
            i-=1; j+=1
            # move to the next level
            if (i==-1):
               level+=1; i=0; j=level
         # level is odd, so we are iterating from right to left
         else:
            if (i<8 and j<8):
               output[i][j] = array[loc]; loc+=1
            i+=1; j-=1
            if (j==-1):
               level+=1; j=0; i=level
         if (i==7 and j==7):
            output[i][j] = array[loc]; return output


encoder=Encoder()
encoded = encoder.entropy_encode(quantized_values)
print("Quantized values:"); print(quantized_values); print()
print("Encoded values in array:"); print(encoded)

Quantized values:
[[ 4 -2  0  0  0  0  0  0]
 [-2  0  0  0  0  0  0  0]
 [ 0  0  0  0  0  0  0  0]
 [ 0  0  0  0  0  0  0  0]
 [ 0  0  0  0  0  0  0  0]
 [ 0  0  0  0  0  0  0  0]
 [ 0  0  0  0  0  0  0  0]
 [ 0  0  0  0  0  0  0  0]]

Encoded values in array:
[ 4 -2 -2  0  0  0  0  0  0  0  0  0  0  0  0  0  0  0  0  0  0  0  0  0
  0  0  0  0  0  0  0  0  0  0  0  0  0  0  0  0  0  0  0  0  0  0  0  0
  0  0  0  0  0  0  0  0  0  0  0  0  0  0  0  0]


from dahuffman import HuffmanCodec
codec = HuffmanCodec.from_data(encoded)
codec.print_code_table()
bytes = codec.encode(encoded)
print("Number of bytes before Huffman Coding: " + str(len(encoded)))
print("Number of bytes after Huffman Coding: " + str(len(bytes)))
print("And in bytes, the final image looks like: " + str(bytes))

Bits Code Value Symbol
   3 000      0 _EOF
   3 001      1 4
   2 01       1 -2
   1 1        1 0
Number of bytes before Huffman Coding: 64
Number of bytes after Huffman Coding: 9
And in bytes, the final image looks like: b'+\xff\xff\xff\xff\xff\xff\xff\xf0'


image = Image.open('habitat_67_small.jpg')

fig = plt.imshow(image)
fig.axes.get_xaxis().set_visible(False) 
fig.axes.get_yaxis().set_visible(False)
plt.show()


h = 256
w = 256
N = 8 #8x8 chunks

dct = DCT()
quantizer = Qunatization()
encoder = Encoder()

def gen_quant_quality(Q, quality):
    if quality>50:
        Q = (Q * ((100-quality)/50)).astype('int')
        Q = np.where(Q>255,255,Q)
    elif quality<50:
        Q = (Q * (50/quality)).astype('int')
        Q = np.where(Q>255,255,Q)
    return Q

def compressChannel(channel, quality, color_channel):
    new_Q = gen_quant_quality(quantizer.CHROMINANCE_TABLE, quality) if color_channel else gen_quant_quality(quantizer.LUMINANCE_TABLE, quality) # selecting correct table
    
    out = np.zeros(shape=(h*w), dtype=np.int16)
    final_idx = 0;
    for i in range(0,h,N):
        print("Compressing: "+str(100*i/h)+"%      ", end = "\r")
        for j in range(0,w,N):
            entropy_encode = encoder.entropy_encode(quantizer.quantize(dct.DCT(channel[i:i+N, j:j+N]), new_Q))
            for batch_idx in range(0,64):
                out[final_idx] = entropy_encode[batch_idx]
                final_idx+=1
    print("Finished                 ", end = "\r"); return out

def uncompressChannel(compressed_channel, quality, color_channel):
    new_Q = gen_quant_quality(quantizer.CHROMINANCE_TABLE, quality) if color_channel else gen_quant_quality(quantizer.LUMINANCE_TABLE, quality) # selecting correct table
    out = np.zeros(shape=(h,w), dtype=np.int16)
    chunk_num=0
    
    for i in range(0,h,N):
        print("Uncompressing: "+str(100*i/h)+"%     ", end = "\r")
        for j in range(0,w,N):
            inv_dct = dct.IDCT(quantizer.unquantize(encoder.entropy_decode(compressed_channel[64*chunk_num:64+(64*chunk_num)]), new_Q)) # restoring from encoded array by chunk
            x_counter = 0 # Stitching image back together from chunks
            for x in range(i,i+N):
                y_counter = 0
                for y in range(j,j+N):
                    out[x][y] = inv_dct[x_counter][y_counter]
                    y_counter += 1
                x_counter += 1

            chunk_num+=1
    print("Finished               ", end = "\r")
    return out

plt.figure(figsize=(15, 10), dpi=40)
subplot_counter = 1
byteSize = []
for quality_val in [90, 50, 10, 5]:
    ycbcr = image.convert('YCbCr')
    (Y, Cb, Cr) = ycbcr.split()
    Y, Cb, Cr = np.array(Y).astype(np.int16), np.array(Cb).astype(np.int16), np.array(Cr).astype(np.int16)
    Y, Cb, Cr = Y - 128, Cb - 128, Cr - 128
    Y, Cb, Cr = compressChannel(Y,quality_val, False), compressChannel(Cb,quality_val, True), compressChannel(Cr,quality_val, True)
    
    encoded_vals = np.concatenate((Y, Cb, Cr)) # measuring the byte size of each image - factors in 512 bytes for worst case size of saved huffman tree
    codec = HuffmanCodec.from_data(encoded_vals)
    bytes = codec.encode(encoded_vals)
    byteSize.append(len(bytes)+255)
    
    Y, Cb, Cr = uncompressChannel(Y,quality_val, False), uncompressChannel(Cb,quality_val, True), uncompressChannel(Cr,quality_val, True)
    Y, Cb, Cr = Y + 128, Cb + 128, Cr + 128
    Y, Cb, Cr = Y.astype('uint8'), Cb.astype('uint8'), Cr.astype('uint8')

    stacked = np.dstack((Y,Cb,Cr))    # Converting from numpy matrix to image
    fromarray = Image.fromarray(stacked, mode="YCbCr")
    compressed = fromarray.convert('RGB')
    
    plt.subplot(1,4,subplot_counter)
    fig = plt.imshow(compressed)
    fig.axes.get_xaxis().set_visible(False); fig.axes.get_yaxis().set_visible(False); subplot_counter += 1
    
plt.show()
print("Size in Kilobytes of each compression")
print([size/1000 for size in byteSize])

Finished

Size in Kilobytes of each compression
[52.012, 34.489, 27.402, 25.967]

Image Compression¶

By Jack Wilcom and Ethan Coates for MATH401¶

SVD Image Compression¶

Implementation of JPEG Image Compression¶

Discrete Cosine Transform¶

Quantization¶

Encoding¶

Huffman Coding¶

Sources¶