Image processing basics

This notebook introduces basic notions and tools for image processing: color representations, image models, histogram manipulation, linear filtering via convolution and Fourier domain analysis, and some non-linear denoising.

Table of contents

Python libraries and code to illustrate this course; you can safely read this later if you are interested.

Images

Perception

Images aim at storing what our eyes see. We therefore need a better comprehension of what we see to understand how we can store it. Vision is the process through which our eyes collect the electromagnetic radiation circulating in our environment and interpret it to get a representation of our surroundings. What we call visible light is the set of electromagnetic radiations that our eyes can perceive.

To perceive light, our eyes are equipped with several types of photosensitive cells, mainly rod cells and cone cells. Rod cells are mostly responsible for low light vision, while cone cells allow us to perceive colors. Cone cells can be divided into three groups depending on the set of wavelengths they react to. S cells are activated by short wavelengths (around blue), M cells by medium wavelengths (around green) and L cells by long wavelengths (around red). The following image (courtesy of Wikipedia) details the reaction of these cells as a function of the wavelength.

cone cell reaction (courtesy of Wikipedia)

The distribution of these cells varies between individuals, but we are mostly equipped with M and L cells. Some common conditions affect this distribution, such as color blindness, which is usually due to one type of cone cell being missing.

The perceived color of an object corresponds to the light we receive from the object. Unless the object is itself a light source, this light usually comes from the reflection of the light emitted by other sources. The material of the object absorbs some parts of the spectrum and reflects others. Determining the color of an object therefore amounts to determining this absorption function. We however usually perceive the object under specific lighting conditions. Our brain is therefore responsible for estimating the lighting conditions and deducing the color of the object. This process varies between individuals, and when dealing with pictures taken with a camera and displayed on some other medium, people may interpret colors in different ways. A classical example is the following picture (source unknown, taken from the Times of India), which received a bit of fame on social media.

grey pink shoes (courtesy Times of India)

Depending on your brain's reaction, you can perceive this shoe as grey with green laces, or pink with white laces. If you look at it for a longer time, you might end up interpreting it in the right way, which is pink and white. The reason is that the picture was taken under a green ambient light. Looking at this picture out of context makes it harder to guess the ambient lighting conditions, and therefore the actual color of the shoe. In terms of the stored data, without interpretation, the color is grey.

Color reproduction and representation

Storing images is pointless without means to reproduce them. To reproduce an image, a device has to recreate an excitation of the eye cells in order to mimic the excitation perceived at the moment the image was taken. Two main families of methods exist for this purpose. Additive synthesis uses light emitters specifically designed to trigger the groups of cone cells individually. This type of synthesis is typically used in screens. Subtractive synthesis filters an input white light source with filters specifically designed to reduce the excitation of each family of cone cells. This is especially used in printing devices.

RGB colors

When dealing with additive synthesis, as seen on the excitation curves of the cone cells, we know the wavelengths triggering each family of cone cells. Roughly, the S family is excited by blue light, the M family by green light and the L family by red light. The display device therefore exhibits a distribution of tiny light emitters: red, green and blue ones. To drive such a device, one has to provide the intensity with which each of these emitters should operate. The naive RGB model therefore stores these three intensities as numbers, ending up with a three dimensional color space.

CMYK colors

A printed document is a subtractive synthesis device. Assuming the document is printed on white paper and lit with white light, the document is covered with layers of semi-transparent inks. The incoming light goes through the layers of ink and bounces off the white paper. The paper being white, it does not alter the spectrum of the light. The light then traverses the ink layers once again to finally reach our eyes. Three inks are used, one to tone down the wavelengths of each cone family. Cyan, magenta and yellow filter out their respective complementary colors: red, green and blue. To save color inks in printers, a fourth ink, black, is generally used to tone down all wavelengths simultaneously. Printing with this set of inks is called quadrichromy. The color is represented with four numbers corresponding to the amount of each ink required.

On the figure above, the three ink colors cyan, magenta and yellow can be seen on the corners of the cube opposite to the color they filter. Cyan is diagonally opposed to red, for instance.

Other color spaces

The two color spaces presented above are directly related to display devices. These devices are however not able to synthesize every visible color. The portion of the set of visible colors that a color model is able to represent is called its gamut. Many other color models exist, with various applications. Some are based on capture devices rather than display devices, and camera manufacturers have proprietary formats to store the light measured by their sensors. Pictures taken in RAW format store the sensor data without alteration. Other color models are meant to enhance user experience when manipulating colors. For instance the HSV color model allows an artist to define a color first by its hue, and then from this hue adjust the "saturation" and the "value" of the color. The LAB model aims at defining a color space where the Euclidean distance between two colors gives a correct estimation of the perceptual difference between these colors for an average human.

The take-home message here is that not all color models are equivalent, and depending on the use case some may be better suited than others. Conversion between them is usually not a bijection. For instance, designing a document in RGB requires a conversion to CMYK before printing, which may alter the resulting colors.

Storing images

Depending on the context, there exist many ways to store images. These data structures are usually split into two families. Raster images store images as a dense 2D array of color values. Vector images describe a process to construct the image using sets of primitive shapes.

Vector images

Vector images can be viewed as one of the earliest formats due to the emergence of display technologies. The first displays were based on cathode ray tubes: a beam of electrons was shot and steered through electric charges to hit a surface at a desired position. The surface was coated with a substance emitting light when hit by electrons. This technology was used in oscilloscopes or radar systems, for instance. Vector displays were designed based on this technology, and producing an image on such a display amounts to providing a path for the electron beam. An example of such a display system is the Vectrex console released in 1982 (image courtesy of Wikipedia). Note that at the time, raster displays already existed.

vector screen: Vectrex console

Basically, vector images can be viewed as a sequence of instructions for a program to draw the image. The image is described in terms of primitives: segments, paths, curves, polygons, glyphs (letters) and so on. A modern example of a standard file format is the SVG (Scalable Vector Graphics) format, but a plain text file also describes an image in terms of a sequence of glyphs. The PostScript format and its successor, the PDF (Portable Document Format), were designed to describe printable documents in a portable way, and many printers are driven using these formats. The HTML+CSS formats describe web page layouts for your web browser to render, which is also, in a way, a form of vector graphics.

The main interest of vector graphics is that there is no notion of resolution. The steps to draw the image can be reproduced at any size without some sort of staircase appearing (aliasing).

Raster images

When capturing a picture of the real world through a camera, guessing that some shape is actually a Bézier curve with some set of parameters is a difficult problem. Early cameras did not even store their images in terms of bits for a computer to process. Early photographs were taken by exposing plates with a photosensitive coating to light. The support of the photograph was therefore a 2D distribution of photosensitive elements. Modern cameras replace this process with a 2D array of sensors. Storing such images is therefore naturally done using a 2D array of color values. Each value is called a pixel (picture element). Raster images are therefore made of a 2D array of pixels. Each pixel is given a color in the desired color model. This color can be encoded using various levels of precision. For memory reasons, early images encoded color on 8 bit values, so only 256 colors were available. The number of bits per channel was correlated with our perception sensitivity: 3 bits for red, 3 for green and 2 for blue (we have fewer cones for wavelengths around blue). Nowadays, most images use 32 bits per pixel: 8 bits for each of the red, green and blue channels, and 8 more bits for transparency (alpha channel). This raw representation is then compressed using various methods.

The image below is an example of a raster image. It's a picture of the city of Reine in Norway.

Raster images are defined up to some resolution. When the resolution is insufficient with respect to the display medium, the pixels become individually visible. In addition, the resolution has to be sufficient with respect to the frequency of the captured phenomenon. This is the well-known Nyquist-Shannon sampling theorem. Basically, when uniformly sampling a high frequency signal with an insufficient resolution, the result may exhibit spurious frequencies.

We see above that the orange dots corresponding to a low frequency sampling of the high frequency signal give the impression of another frequency. Visually, such spurious frequencies are referred to as Moiré effects when they happen on images. The following image (courtesy of Wikipedia) exhibits an example on the garage door.

Moiré effect

In the remainder of this course, we focus on processing raster images. Most of the treatments below are useless in the case of vector images: separating objects from the background is trivial for vector images since the background is usually a separate primitive, and preserving edges is not a problem since different objects are described by different primitives. Converting a vector image to a raster image is called rasterization. Its complexity depends on the primitives used, but it is usually simple and fast.

Global filtering

Global filtering processes images based on global metrics on pixel values, colors and distribution. The operation is performed globally on the image, without trying to detect and preserve local structures.

Grayscale conversion

Grayscale conversion is a perceptual problem: converting from colors to luminance. A naive approach would be to use the mean of the RGB values as the luminance.

This approach however does not conform to the human perceptual system, and some areas are not properly rendered. For instance, on the island on the left, too much contrast is present between the shades of green, whereas in the sea the different shades are greatly diminished. Based on perceptual studies, coefficients have been derived to convert the RGB values into luminance. Basically, the perceived luminance is mostly due to the red and green channels, and blue has little effect on the result.

You can find below the comparison between the two approaches, and you can try to determine whether the perceptually based conversion suits you better.
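
As a minimal sketch of these two conversions (assuming the image is a numpy array of shape (height, width, 3) with channels in RGB order; the Rec. 601 coefficients 0.299/0.587/0.114 used here are one common choice of perceptual weights, the notebook may use slightly different values):

```python
import numpy as np

def to_gray_mean(rgb):
    """Naive conversion: plain average of the red, green and blue channels."""
    return rgb[..., :3].mean(axis=-1)

def to_gray_perceptual(rgb):
    """Weighted conversion using the classical Rec. 601 luma coefficients."""
    weights = np.array([0.299, 0.587, 0.114])
    return rgb[..., :3] @ weights
```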

Thresholding

Thresholding is a classical technique to try and extract elements from images. We show below how to try and separate the background from the objects in the picture. The idea is to define a value (the threshold) and filter the pixels depending on whether their value is above or below the threshold.

Finding the correct threshold is not trivial, since it depends on the lighting conditions when the picture was taken, and on the background and the objects themselves. A method to try and automatically determine a threshold is to study the histogram of the image. The histogram aggregates, for each possible value, the number of pixels containing that value.

We see here several groups of shades as bumps on the histogram. We can now try and separate these groups by choosing a threshold in a valley between peaks, for instance 155 here.
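
A hedged sketch of these two steps, assuming an 8 bit grayscale image stored as a numpy array; the value 155 is the valley mentioned above:

```python
import numpy as np

def histogram(gray):
    """Number of pixels having each of the 256 possible shades."""
    return np.bincount(gray.astype(np.uint8).ravel(), minlength=256)

def threshold(gray, t=155):
    """Binary mask: True where the pixel is brighter than the threshold."""
    return gray > t
```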

Even though some noise remains, we can hope to process this result further to extract the objects, for instance by computing connected components, filling holes in them and removing the smaller ones.

Normalization

Studying histograms can provide insight on how to improve and process images. Normalization aims at detecting portions of the spectrum that are not used, and rescales the shades to span the entire range. Taking the landscape picture above in grayscale, we get the following histogram:

We can see here that shades below 50 are not used. We can scale the shades to widen the histogram and make better use of the dynamic range at our disposal.
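
A minimal sketch of such a normalization, assuming an 8 bit grayscale image and simply stretching the observed minimum and maximum to 0 and 255:

```python
import numpy as np

def normalize(gray):
    """Stretch the used range of shades so that it spans the full [0, 255] interval."""
    lo, hi = float(gray.min()), float(gray.max())
    return (gray.astype(float) - lo) * 255.0 / (hi - lo)
```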

Equalization

Histogram equalization pushes the usage of the dynamic range of the shades even further. It moves the shades so that each available shade has approximately an equal contribution to the image. The target histogram would therefore be a flat line. To do so, we start by studying the cumulative sum of the histogram, which gives the number of pixels in the image having a shade below some threshold.

Now the desired histogram would be flat, and the corresponding desired cumulative sum would be a line:

Given an input shade, the original cumulative sum gives the number of pixels below this shade. Mapping this number of pixels onto the y axis of the desired cumulative sum, and using the line to read off a shade, we obtain the corresponding shade in the target image.
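
A minimal sketch of this remapping, assuming an 8 bit grayscale image; the normalized cumulative sum is used directly as a lookup table from original to equalized shade:

```python
import numpy as np

def equalize(gray):
    """Remap shades so that the cumulative histogram becomes (roughly) a straight line."""
    gray = gray.astype(np.uint8)
    hist = np.bincount(gray.ravel(), minlength=256)
    cdf = np.cumsum(hist).astype(float)
    cdf /= cdf[-1]                               # cumulative sum, normalized to [0, 1]
    lut = np.round(cdf * 255).astype(np.uint8)   # original shade -> equalized shade
    return lut[gray]
```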

Linear filtering

Many image processing techniques are based on linear filters and convolution. The idea is to compute the target image as the convolution between the input image and a kernel. Applying a linear filter can be done efficiently using the Fourier transform: both the image and the filter can be transformed into the frequency domain. In this domain the convolution becomes a multiplication, which can be easily performed, and the result is converted back into the spatial domain.

Convolution

Mathematically, the convolution of the function $f$ with the kernel $g$ is defined as:

$$ (f*g)(x,y) = \int_{-\infty}^{+\infty}\int_{-\infty}^{+\infty} f(x-s, y-t)g(s,t)\mathrm{d}s\mathrm{d}t $$

When using images, these integrals reduce to sums. Assuming the kernel is defined on the integer grid $[-m, m]^2$, we get the sum:

$$ (f*g)(i,j) = \sum_{s = -m}^m\sum_{t=-m}^m f(i-s, j-t)g(s,t) $$

The kernel can be seen here as the influence of a pixel on its neighboring pixels in the resulting image. For each pixel, the kernel is multiplied by the pixel value and splatted, centered at the pixel, into the resulting image. The result is the sum of those splats. Changing the order of summation, the result can also be computed as a sum of shifted versions of the image. For each coefficient in the kernel, the original image is multiplied by the coefficient and splatted into the result, shifted by an offset opposite to that of the coefficient with respect to the center of the kernel. Using an opposite offset flips the kernel, so that it corresponds to the influence of the neighboring pixels on a central pixel, rather than the influence of a central pixel on its neighboring pixels.

On the edges of the image, the nearest pixel value is usually taken when no pixel is available.
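
A minimal sketch of such a convolution, written as the sum of shifted images described above; the notebook's own apply_kernel routine (referenced later) presumably follows the same structure, but the name apply_kernel_naive and the nearest-pixel border handling here are assumptions:

```python
import numpy as np

def apply_kernel_naive(image, kernel):
    """Naive convolution: one pass over the kernel, accumulating shifted copies of the image."""
    m = kernel.shape[0] // 2                 # kernel defined on the grid [-m, m]^2
    padded = np.pad(image, m, mode="edge")   # replicate the nearest pixel on the borders
    result = np.zeros_like(image, dtype=float)
    for s in range(-m, m + 1):
        for t in range(-m, m + 1):
            shifted = padded[m - s : m - s + image.shape[0],
                             m - t : m - t + image.shape[1]]
            result += kernel[s + m, t + m] * shifted
    return result
```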

Blur

Average filter

This filter replaces the value at a pixel by the average color of the neighboring pixels. It smoothes the sharp features in the image. Each neighboring pixel in the surrounding window has the same influence. Using a 9x9 window for instance, each pixel has an influence of 1/81.

Zooming into the image, we can see that the shape of the window can create visual artifacts in the result. Here, the fact that the window is square creates visible horizontal and vertical halos around the sharp features of the image.

Using a circular window reduces these artifacts.
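
Hedged sketches of the two windows, built as kernels for the convolution routine above; the 9x9 square window corresponds to box_kernel(4), where each weight is 1/81:

```python
import numpy as np

def box_kernel(radius):
    """Square averaging window: every pixel in the (2r+1)x(2r+1) window has the same weight."""
    size = 2 * radius + 1
    return np.ones((size, size)) / size**2

def disk_kernel(radius):
    """Circular averaging window: only pixels within the given radius contribute."""
    y, x = np.mgrid[-radius:radius + 1, -radius:radius + 1]
    mask = (x**2 + y**2) <= radius**2
    return mask / mask.sum()
```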

Gaussian filter

The gaussian filter reduces the artifacts that can appear with the average filter, which are due to its sharp transition between pixels used and not used in the average. With a gaussian, the further a pixel is from the center of the kernel, the smaller its influence.

A 2D gaussian is defined as

$$ G: \mathbf{x} \mapsto \frac{1}{2\pi\sigma^2}e^{-\frac{\lVert \mathbf{x} - \mathbf{\mu} \rVert^2}{2\sigma^2}} $$

Where $\mathbf{x} \in \mathbb{R}^2$ is the evaluation point, $\mathbf{\mu} \in \mathbb{R}^2$ is the center of the gaussian (the mean of the corresponding distribution) and $\sigma$ its standard deviation (controlling how spread out the gaussian is). The $\tfrac{1}{2\pi\sigma^2}$ factor ensures that the integral of this gaussian over $\mathbb{R}^2$ is 1.

Gaussians have an infinite support, meaning that they are strictly positive everywhere. In terms of linear kernels this would mean that any pixel influences every other. In terms of efficiency, this can be problematic. However, gaussians decrease quickly towards zero, and approximations with a limited support exist, the most common using binomial coefficients.
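
Minimal sketches of a truncated gaussian kernel and of the binomial approximation mentioned above (the exact truncation radius and normalization are assumptions):

```python
import numpy as np
from math import comb

def gaussian_kernel(radius, sigma):
    """Gaussian kernel truncated to [-radius, radius]^2 and renormalized to sum to 1."""
    y, x = np.mgrid[-radius:radius + 1, -radius:radius + 1]
    g = np.exp(-(x**2 + y**2) / (2.0 * sigma**2))
    return g / g.sum()

def binomial_kernel(radius):
    """Finite-support approximation: outer product of a row of binomial coefficients."""
    row = np.array([comb(2 * radius, k) for k in range(2 * radius + 1)], dtype=float)
    kernel = np.outer(row, row)
    return kernel / kernel.sum()
```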

Fourier domain

Using the Fourier transform, the image can be represented in terms of frequencies.

The Fourier transform of a 2D function $f : \mathbb{R}^2 \rightarrow \mathbb{R}$ is a 2D function with complex values given by

$$ F(f)(\nu,\xi) = \int_{-\infty}^{+\infty} \int_{-\infty}^{+\infty} f(x,y)e^{-i 2 \pi (\nu x + \xi y)} \mathrm{d}x \mathrm{d}y $$

with $\nu$ and $\xi$ to be interpreted as frequencies. This decomposes $f$ on the Fourier basis, made of the functions $e^{i2\pi(\nu x + \xi y)}$, which are oscillating functions in the direction $(\nu, \xi)^t$ with wavelength $\frac{1}{\sqrt{\nu^2 + \xi^2}}$.

When the original function is made of pure frequencies, the Fourier transform is just made of peaks at the corresponding frequencies.

Note that to obtain the spectrum above, the fft is shifted to center it in the dft_show function. The shift moves parts of the spectrum around so that the low frequencies are in the center and the high frequencies towards the sides:

In the case of an image, the shifted transform shows the low frequencies in the center and the high frequencies towards the boundary.
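
A minimal sketch of what a spectrum display such as dft_show presumably computes (the log scaling is an assumption, commonly used to make the spectrum visible):

```python
import numpy as np

def spectrum(gray):
    """Log-magnitude of the 2D FFT, shifted so that low frequencies end up in the center."""
    fft = np.fft.fft2(gray)
    return np.log1p(np.abs(np.fft.fftshift(fft)))
```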

Low / High pass filtering

A low pass filter removes the high frequencies and keeps the low frequencies. It can be done naively by setting the frequency coefficients to zero outside of a centered window.
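
A hedged sketch of this naive low pass filter, assuming a grayscale numpy image; the frequencies are kept inside a centered square window of the shifted spectrum:

```python
import numpy as np

def low_pass_naive(gray, half_width):
    """Keep only the frequencies inside a centered square window, zero out the rest."""
    fft = np.fft.fftshift(np.fft.fft2(gray))
    mask = np.zeros(fft.shape)
    cy, cx = fft.shape[0] // 2, fft.shape[1] // 2
    mask[cy - half_width:cy + half_width + 1, cx - half_width:cx + half_width + 1] = 1.0
    return np.real(np.fft.ifft2(np.fft.ifftshift(fft * mask)))
```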

You can notice that this naive strategy produces ripples in the result, emitted from the sharp features in the image.

These ripples happen because sharp features in one domain provoke an oscillatory response in the other domain. Take for instance a circular window.

Looking at the corresponding frequencies, we obtain something of the order of a cardinal sine $\tfrac{\sin{x}}{x}$:

Considering this same window in the frequency domain and looking at its corresponding function in the spatial domain also yields oscillations. These oscillations are especially visible at the sharp features of the image, where they bleed onto parts of the image with a different content.

Note here that we shifted the result for centering: the fast Fourier transform assumes that the input signal is periodic, and that the origin is at the lower left of the image. When designing kernels for linear image filtering, the origin is set at the center of the image, not at the lower left. Since the result of the inverse Fourier transform is periodic, we can translate the origin by swapping parts of the domain.

To avoid these ripples, the common good practice is to avoid applying sharp windows to the signal. Gaussian windows are preferred:

The Fourier transform of a gaussian is actually a gaussian as well:

Multiplying by the gaussian window in the frequency domain therefore discards high frequencies. The gaussian kernel here is inverse shifted since the reine_fft frequency image was not shifted to feature the low frequencies at the center of the image.
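
A minimal sketch of such a gaussian low pass filter, assuming a grayscale numpy image; the window is built centered and then inverse shifted to match the unshifted fft2 output, as described above:

```python
import numpy as np

def gaussian_low_pass(gray, sigma):
    """Multiply the spectrum by a gaussian window centered on the low frequencies."""
    h, w = gray.shape
    y, x = np.mgrid[:h, :w]
    window = np.exp(-((x - w // 2)**2 + (y - h // 2)**2) / (2.0 * sigma**2))
    # ifftshift moves the window center to the (0, 0) origin used by the unshifted fft2 output
    return np.real(np.fft.ifft2(np.fft.fft2(gray) * np.fft.ifftshift(window)))
```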

Since the inverse Fourier transform of a gaussian is a gaussian, a low pass filter with a gaussian window is equivalent to a gaussian blur of the image. Note that on the boundaries of the image the pixels seem to wrap: you see a thin strip of pixels at the top similar to those at the bottom. When using Fourier transforms, the input signal (here the input image) is assumed to be a periodic function. For our images this means that the neighbors of pixels on the top side of the image are taken from the bottom side, and similarly for the other edges.

Using the complement of a gaussian window yields a high pass filter. The high frequencies in an image correspond to its details, where it varies quickly.

Sharpening

A gaussian filter smoothes the details in the image. Therefore, subtracting the gaussian blur of an image from the image itself yields the details of the image. The sharpen filter uses this idea to recover the details and then emphasize them.
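
A hedged sketch of this idea (unsharp masking), reusing the gaussian_kernel and apply_kernel_naive helpers sketched earlier; the amount parameter and the 3x3 kernel shown for reference are assumptions, the notebook's own sharpen kernel is discussed below:

```python
import numpy as np

def sharpen(gray, sigma=2.0, amount=1.0):
    """Unsharp masking: extract the details (image minus its gaussian blur) and add them back."""
    radius = int(3 * sigma)
    blurred = apply_kernel_naive(gray, gaussian_kernel(radius, sigma))
    details = gray - blurred
    return gray + amount * details

# A common small sharpen kernel (identity plus a discrete Laplacian); the 3x3 kernel
# mentioned later in this section is presumably of this kind.
SHARPEN_3x3 = np.array([[ 0, -1,  0],
                        [-1,  5, -1],
                        [ 0, -1,  0]])
```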

We see here the details that are extracted using the details filter.

Compared to the sharpened image, the original image now seems blurred.

A convolution in the spatial domain is equivalent to a multiplication in the frequency domain. Looking at the Fourier transform of the filter shows that it keeps the low frequencies, but gives more weight to the high frequencies.

We show here that the convolution of the image with the sharpen kernel is equivalent to the multiplication in the frequency domain by the Fourier transform of the filter.

The translation visible between the input and the output image is due to the 3x3 kernel being impossible to properly center before the Fourier transform without interpolation and approximation. Rolling the image back by one pixel (the half width of the kernel) removes the translation.

Advantages of linear filtering

The main advantage of linear filtering lies in the fact that, using the fast Fourier transform, a convolution in the spatial domain becomes a pixel by pixel multiplication in the frequency domain. The naive implementation of our apply_kernel method above involves a loop on each pixel of the kernel, which sweeps the whole image at each iteration. The resulting complexity is therefore the number of pixels in the kernel multiplied by the number of pixels in the input image. For big kernels this is costly.

The fast Fourier transform can be performed in $O(n\log{n})$ for an image made of $n$ pixels. Therefore, padding the kernel with zeros to match the resolution of the image, both can be transformed into the frequency domain in $O(n\log{n})$, then corresponding pixels can be multiplied in $n$ multiplications, and finally the result can be converted back into the spatial domain in $O(n\log{n})$. For big kernels, this is much more efficient.
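
A minimal sketch of this FFT based convolution, assuming a grayscale numpy image and a square kernel with an odd side; note that the border handling differs from the naive sketch, since the FFT treats the image as periodic:

```python
import numpy as np

def apply_kernel_fft(image, kernel):
    """Convolution via the FFT: pad the kernel to the image resolution and multiply the spectra."""
    h, w = image.shape
    m = kernel.shape[0] // 2
    padded = np.zeros((h, w))
    padded[:kernel.shape[0], :kernel.shape[1]] = kernel
    # roll the kernel so that its center sits at the (0, 0) origin assumed by fft2
    padded = np.roll(padded, (-m, -m), axis=(0, 1))
    return np.real(np.fft.ifft2(np.fft.fft2(image) * np.fft.fft2(padded)))
```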

Note that the time comparison is not entirely fair here, since numpy calls external compiled libraries to compute the fft while our naive implementation uses a slow Python loop. This however does not account for all of the time difference.

Non linear filtering

Even though these filters do not benefit from the efficient implementation above, non linear filters can be very useful in some cases. We show here two examples among many others.

Bilateral filter

The bilateral filter is a gaussian filter which dampens the influence of a pixel on a neighboring pixel whose value is very different. Another gaussian is thus added for this dampening. The implementation below is naive; more efficient approaches and approximations of this filter exist. The goal of this filter is to smooth regions where colors are similar, while keeping the sharp details of the image.
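
A hedged sketch of such a naive implementation, assuming a grayscale image with values in [0, 1]; the parameter names and default values are assumptions:

```python
import numpy as np

def bilateral_naive(gray, radius=5, sigma_space=3.0, sigma_value=0.1):
    """Naive bilateral filter: spatial gaussian weight times a gaussian weight on the value difference."""
    h, w = gray.shape
    y, x = np.mgrid[-radius:radius + 1, -radius:radius + 1]
    spatial = np.exp(-(x**2 + y**2) / (2.0 * sigma_space**2))
    padded = np.pad(gray, radius, mode="edge")
    result = np.zeros_like(gray, dtype=float)
    for i in range(h):
        for j in range(w):
            window = padded[i:i + 2 * radius + 1, j:j + 2 * radius + 1]
            value = np.exp(-(window - gray[i, j])**2 / (2.0 * sigma_value**2))
            weights = spatial * value
            result[i, j] = np.sum(weights * window) / np.sum(weights)
    return result
```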

As desired, we see that regions with similar colors are smoothed, while sharp features are preserved.

Median filter

The median filter is good at suppressing salt and pepper noise. This happens when some pixels have totally wrong values, introducing some kind of grain in the image. Such pixels are sometimes referred to as fireflies.

To cope with such noise, the median filter considers all pixel values in a window around each pixel and replaces it with the median value.
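
A minimal sketch of the median filter, assuming a grayscale numpy image; this naive double loop is slow but shows the idea:

```python
import numpy as np

def median_filter(gray, radius=1):
    """Replace each pixel by the median of the values in its (2r+1)x(2r+1) window."""
    h, w = gray.shape
    padded = np.pad(gray, radius, mode="edge")
    result = np.empty_like(gray, dtype=float)
    for i in range(h):
        for j in range(w):
            window = padded[i:i + 2 * radius + 1, j:j + 2 * radius + 1]
            result[i, j] = np.median(window)
    return result
```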

Noise in rendering

Removing noise can seem like a synthetic problem, where one invents some kind of perturbation of an image and finds a method to remove it. But noise actually happens in real applications. Related to this course, noise is often found in rendering. In this context, each pixel color is computed as the integral over the pixel area of the light intensity reaching the pixel. This integral is estimated using Monte Carlo techniques: the space of paths reaching the pixel is randomly sampled, and the integral is estimated as a discrete average of the light intensity carried by these paths. In some regions however, paths carrying lots of energy and others carrying only a little reach the same pixel. When insufficient samples are taken, the average yields a noisy approximation of the integral. Taking more samples reduces the problem, but requires lots of additional computation. Filtering the noise can therefore cheaply reduce the problem. Here is an example with a cube lit by a square emitter. Using four path samples per pixel yields lots of noise, whereas using 128 samples reduces the noise, but requires much more computation time.

In this case however, although it looks like salt and pepper noise, a simple median filter is not sufficient to improve the image. Noise remains and becomes more visible. Removing this kind of noise is therefore still one of the main research topics in rendering.

Mathematical morphology

A classical tool for image post-processing is mathematical morphology. It is often used to clean up binary images after thresholding: remove negligible areas, fill small holes and so on. For image processing, its basic operations are therefore initially defined on binary (black and white) images, but they can be extended to grayscale or multi channel images. These operations require a structuring element, which can be seen as a 2D shape.

Dilation expands the objects in the original binary image using the structuring element. A pixel $p_r$ in the resulting image is white if there exists a white pixel $p_o$ in the original image such that, when the structuring element is centered at $p_o$, it covers $p_r$. Considering the binary image and the structuring element as the sets of coordinates of their white pixels, dilation is the Minkowski sum of the two sets. Denoting $I$ the input image and $S$ the structuring element:

$$ I \oplus S = \left\{ i + s, i \in I, s \in S \right\} $$

Erosion shrinks the objects using the structuring element. A pixel $p_r$ in the resulting image is white if, when the structuring element is centered at $p_r$, all the white pixels of the structuring element fall on white pixels of the original image. With the set approach, this is the Minkowski difference of the input image and the structuring element:

$$ I \ominus S = \left\{ i \in \mathbb{R}^2, \forall s \in S, i + s \in I \right\} $$

Based on erosion and dilation, two other operations are defined. Opening aims at removing small or thin elements. It starts with an erosion, which removes small or thin parts, followed by a dilation to restore the remaining objects to their original shape.

Closing fills small holes in the image by performing a dilation first followed by an erosion.
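
Hedged sketches of the four operations, assuming the binary image and the structuring element are boolean numpy arrays (the element square with an odd side, and pixels outside the image treated as black):

```python
import numpy as np

def dilate(binary, element):
    """A result pixel is white if the element, centered at some white input pixel, covers it."""
    m = element.shape[0] // 2
    padded = np.pad(binary, m, mode="constant", constant_values=False)
    result = np.zeros_like(binary)
    h, w = binary.shape
    for s in range(-m, m + 1):
        for t in range(-m, m + 1):
            if element[s + m, t + m]:
                result |= padded[m - s:m - s + h, m - t:m - t + w]
    return result

def erode(binary, element):
    """A result pixel stays white only if the whole element fits inside the white region."""
    m = element.shape[0] // 2
    padded = np.pad(binary, m, mode="constant", constant_values=False)
    result = np.ones_like(binary)
    h, w = binary.shape
    for s in range(-m, m + 1):
        for t in range(-m, m + 1):
            if element[s + m, t + m]:
                result &= padded[m + s:m + s + h, m + t:m + t + w]
    return result

def opening(binary, element):
    """Erosion followed by dilation: removes small or thin white components."""
    return dilate(erode(binary, element), element)

def closing(binary, element):
    """Dilation followed by erosion: fills small holes in the white components."""
    return erode(dilate(binary, element), element)
```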

Using a combination of these tools can be useful in cleaning an original binary image for segmentation problems.

Final remarks

This course provided a rough overview of basic tools in image processing, and of some terminology shared by people working in the field. Modern image processing however makes intensive use of deep learning techniques. The design of neural networks uses the tools presented above to some extent (convolution layers for instance), and building training datasets may still require some of the treatments above. However, state of the art methods to extract information from images or convert between various representations are often based on deep learning. You can for instance have a look at the Pix2pix method, which covers a wide range of applications.