import os
import cv2
import numpy as np
import matplotlib.pyplot as plt
import matplotlib
from zipfile import ZipFile
from urllib.request import urlretrieve
from IPython.display import Image
%matplotlib inline
Brightness
Image Enhancement
Image Processing techniques take advantage of mathematical operations to achieve different results. Most often we arrive at an enhanced version of the image using some basic operations. We will take a look at some of the fundamental operations often used in computer vision pipelines. In this page we will cover:
- Arithmetic Operations like addition, multiplication
- Thresholding & Masking
- Bitwise Operations like OR, AND, XOR
Setup
- Almost identical to the other pages, let’s setup the jupyter notebook and import the assets
- Remember that I will be activating the venv since I will be using the venv kernel from within jupyter notebook. Steps for that are in all the pages prior to this one.
def download_and_unzip(url, save_path):
print(f"Downloading and extracting assests....", end="")
# Downloading zip file using urllib package.
urlretrieve(url, save_path)
try:
# Extracting zip file using the zipfile package.
with ZipFile(save_path) as z:
# Extract ZIP file contents in the same directory.
0])
z.extractall(os.path.split(save_path)[
print("Done")
except Exception as e:
print("\nInvalid file.", e)
= r"https://www.dropbox.com/s/0oe92zziik5mwhf/opencv_bootcamp_assets_NB4.zip?dl=1"
URL
= os.path.join(os.getcwd(), "opencv_bootcamp_assets_NB4.zip")
asset_zip_path
# Download if assest ZIP does not exists.
if not os.path.exists(asset_zip_path):
download_and_unzip(URL, asset_zip_path)
Add or Subtract Brightness
The first operation we discuss is simple addition to images. This results in increasing or decreasing the brightness of the image since we are eventually increasing or decreasing the intensity values of each pixel by the same amount. So, this will result in a global increase/decrease in brightness.
Read Image
= cv2.imread("New_Zealand_Coast.jpg", cv2.IMREAD_COLOR)
img_bgr = cv2.cvtColor(img_bgr, cv2.COLOR_BGR2RGB)
img_rgb
# Display 18x18 pixel image.
="New_Zealand_Coast.jpg") Image(filename
- Let’s increase/decrease the brightness by the same amount
- So, let’s multiply by 50 each value in the matrix
- Notice here we are using numpy.ones()
- Then we will add or subtract the multiplied values from the original image matrix
= np.ones(img_rgb.shape, dtype="uint8") * 50
matrix
= cv2.add(img_rgb, matrix)
img_rgb_brighter = cv2.subtract(img_rgb, matrix)
img_rgb_darker
# Show the images
=[18, 5])
plt.figure(figsize131); plt.imshow(img_rgb_darker); plt.title("Darker");
plt.subplot(132); plt.imshow(img_rgb); plt.title("Original");
plt.subplot(133); plt.imshow(img_rgb_brighter);plt.title("Brighter"); plt.subplot(
Contrast
Multiplication
Just like addition can result in brightness change, multiplication can be used to improve the contrast of the image.
Contrast is the difference in the intensity values of the pixels of an image. Multiplying the intensity values with a constant can make the difference larger or smaller ( if multiplying factor is < 1 ).
= np.ones(img_rgb.shape) * 0.8
matrix_low_contrast = np.ones(img_rgb.shape) * 1.2
matrix_high_contast
= np.uint8(cv2.multiply(np.float64(img_rgb), matrix_low_contrast))
img_rgb_darker = np.uint8(cv2.multiply(np.float64(img_rgb), matrix_high_contast))
img_rgb_brighter
# Show the images
=[18,5])
plt.figure(figsize131); plt.imshow(img_rgb_darker); plt.title("Lower Contrast");
plt.subplot(132); plt.imshow(img_rgb); plt.title("Original");
plt.subplot(133); plt.imshow(img_rgb_brighter);plt.title("Higher Contrast"); plt.subplot(
NOTE:
Can you see the weird colors in some areas of the image after multiplication? The issue is that after multiplying, the values which are already high, are becoming greater than 255. Thus, the overflow issue. How do we overcome this?
- So what we can do is set the max overflow value to default to a number instead of rolling over to a small number.
- So as you see below, any overflow values will be set to 255 or white and you can tell how the upper left corner is more white than the original because some values have been replaced with 255 after the multiplication
= np.ones(img_rgb.shape) * 0.8
matrix_low_contrast = np.ones(img_rgb.shape) * 1.2
matrix_high_contast
= np.uint8(cv2.multiply(np.float64(img_rgb), matrix_low_contrast))
img_rgb_lower = np.uint8(np.clip(cv2.multiply(np.float64(img_rgb), matrix_high_contast), 0, 255))
img_rgb_higher
# Show the images
=[18,5])
plt.figure(figsize131); plt.imshow(img_rgb_lower); plt.title("Lower Contrast");
plt.subplot(132); plt.imshow(img_rgb); plt.title("Original");
plt.subplot(133); plt.imshow(img_rgb_higher);plt.title("Higher Contrast"); plt.subplot(
Mask / Thresholding
Binary Images have a lot of use cases in Image Processing. One of the most common use cases is that of creating masks. Image Masks allow us to process on specific parts of an image keeping the other parts intact. Image Thresholding is used to create Binary Images from grayscale images. You can use different thresholds to create different binary images from the same original image.
Syntax
= cv2.threshold( src, thresh, maxval, type[, dst] ) retval, dst
dst
: The output array of the same size and type and the same number of channels as src
.
The function has 4 required arguments:
src
: input array (multiple-channel, 8-bit or 32-bit floating point).thresh
: threshold value.maxval
: maximum value to use with the THRESH_BINARY and THRESH_BINARY_INV thresholding types.type
: thresholding type (see ThresholdTypes).
Adaptive Threshold
Syntax
= cv.adaptiveThreshold( src, maxValue, adaptiveMethod, thresholdType, blockSize, C[, dst] ) dst
dst
Destination image of the same size and the same type as src.
The function has 6 required arguments:
src
: Source 8-bit single-channel image.maxValue
: Non-zero value assigned to the pixels for which the condition is satisfiedadaptiveMethod
: Adaptive thresholding algorithm to use, see AdaptiveThresholdTypes. The BORDER_REPLICATE | BORDER_ISOLATED is used to process boundaries.thresholdType:
Thresholding type that must be either THRESH_BINARY or THRESH_BINARY_INV, see ThresholdTypes.blockSize
: Size of a pixel neighborhood that is used to calculate a threshold value for the pixel: 3, 5, 7, and so on.C
: Constant subtracted from the mean or weighted mean (see the details below). Normally, it is positive but may be zero or negative as well.
= cv2.imread("building-windows.jpg", cv2.IMREAD_GRAYSCALE)
img_read = cv2.threshold(img_read, 100, 255, cv2.THRESH_BINARY)
retval, img_thresh
# Show the images
=[18, 5])
plt.figure(figsize
121);plt.imshow(img_read, cmap="gray"); plt.title("Original")
plt.subplot(122);plt.imshow(img_thresh, cmap="gray");plt.title("Thresholded")
plt.subplot(
print(img_thresh.shape)
Example/Sheet Music
Suppose you wanted to build an application that could read (decode) sheet music. This is similar to Optical Character Recognigition (OCR) for text documents where the goal is to recognize text characters. In either application, one of the first steps in the processing pipeline is to isolate the important information in the image of a document (separating it from the background). This task can be accomplished with thresholding techniques. Let’s take a look at an example.
# Read the original image
= cv2.imread("Piano_Sheet_Music.png", cv2.IMREAD_GRAYSCALE)
img_read
# Perform global thresholding
= cv2.threshold(img_read, 50, 255, cv2.THRESH_BINARY)
retval, img_thresh_gbl_1
# Perform global thresholding
= cv2.threshold(img_read, 130, 255, cv2.THRESH_BINARY)
retval, img_thresh_gbl_2
# Perform adaptive thresholding
= cv2.adaptiveThreshold(img_read, 255, cv2.ADAPTIVE_THRESH_MEAN_C, cv2.THRESH_BINARY, 11, 7)
img_thresh_adp
# Show the images
=[18,15])
plt.figure(figsize221); plt.imshow(img_read, cmap="gray"); plt.title("Original");
plt.subplot(222); plt.imshow(img_thresh_gbl_1,cmap="gray"); plt.title("Thresholded (global: 50)");
plt.subplot(223); plt.imshow(img_thresh_gbl_2,cmap="gray"); plt.title("Thresholded (global: 130)");
plt.subplot(224); plt.imshow(img_thresh_adp, cmap="gray"); plt.title("Thresholded (adaptive)"); plt.subplot(
Bitwise Operations
Syntax
Example API for cv2.bitwise_and()
. Others include: cv2.bitwise_or()
, cv2.bitwise_xor()
, cv2.bitwise_not()
= cv2.bitwise_and( src1, src2[, dst[, mask]] ) dst
dst
: Output array that has the same size and type as the input arrays.
The function has 2 required arguments:
src1
: first input array or a scalar.src2
: second input array or a scalar.
An important optional argument is:
mask
: optional operation mask, 8-bit single channel array, that specifies elements of the output array to be changed.
= cv2.imread("rectangle.jpg", cv2.IMREAD_GRAYSCALE)
img_rec
= cv2.imread("circle.jpg", cv2.IMREAD_GRAYSCALE)
img_cir
=[20, 5])
plt.figure(figsize121);plt.imshow(img_rec, cmap="gray")
plt.subplot(122);plt.imshow(img_cir, cmap="gray")
plt.subplot(print(img_rec.shape)
AND Operator
We find what is white in both AND
= cv2.bitwise_and(img_rec, img_cir, mask=None)
result ="gray") plt.imshow(result, cmap
OR Operator
= cv2.bitwise_or(img_rec, img_cir, mask=None)
result ="gray") plt.imshow(result, cmap
XOR Operator
One or the Other NOT both
= cv2.bitwise_xor(img_rec, img_cir, mask=None)
result ="gray") plt.imshow(result, cmap
Example: Logo
- Let’s fill in the white lettering of the logo with the checkered background
- Here is an image of the desired result
='Logo_Manipulation.png') Image(filename
Read Foreground Image
= cv2.imread("coca-cola-logo.png")
img_bgr = cv2.cvtColor(img_bgr, cv2.COLOR_BGR2RGB)
img_rgb
plt.imshow(img_rgb)
print(img_rgb.shape)
= img_rgb.shape[0]
logo_h = img_rgb.shape[1] logo_w
Read Background Image
# Read in image of color cheackerboad background
= cv2.imread("checkerboard_color.png")
img_background_bgr = cv2.cvtColor(img_background_bgr, cv2.COLOR_BGR2RGB)
img_background_rgb
# Resize background image to same size as logo image
= cv2.resize(img_background_rgb, (logo_w, logo_h), interpolation=cv2.INTER_AREA)
img_background_rgb
plt.imshow(img_background_rgb)print(img_background_rgb.shape)
Create Mask of Original
= cv2.cvtColor(img_rgb, cv2.COLOR_RGB2GRAY)
img_gray
# Apply global thresholding to creat a binary mask of the logo
= cv2.threshold(img_gray, 127, 255, cv2.THRESH_BINARY)
retval, img_mask
="gray")
plt.imshow(img_mask, cmapprint(img_mask.shape)
Invert Mask
# Create an inverse mask
= cv2.bitwise_not(img_mask)
img_mask_inv ="gray") plt.imshow(img_mask_inv, cmap
Apply Background to Mask
# Create colorful background "behind" the logo lettering
= cv2.bitwise_and(img_background_rgb, img_background_rgb, mask=img_mask)
img_background plt.imshow(img_background)
Isolate Foreground
# Isolate foreground (red from original image) using the inverse mask
= cv2.bitwise_and(img_rgb, img_rgb, mask=img_mask_inv)
img_foreground plt.imshow(img_foreground)
Merge F & Background
# Add the two previous results obtain the final result
= cv2.add(img_background, img_foreground)
result
plt.imshow(result)"logo_final.png", result[:, :, ::-1]) cv2.imwrite(