Simple Computer Vision with OpenCV + Python¶

What is OpenCV?¶

OpenCV (Open Source Computer Vision Library) is an open source computer vision and machine learning software library. OpenCV has several functionalities:

  • Image/video I/O, processing, display
  • Object/feature detection
  • Geometry-based monocular or stereo computer vision
  • Computational photography
  • Machine learning & clustering

We will just scratch the surface of what OpenCV can do, but you can find plenty of tutorials online if you want to learn more.

How are we going to use OpenCV?¶

OpenCV is a C++ library, but it has bindings for many languages, including Python. We will write our code in Python, while the underlying OpenCV routines run as compiled C++ (very fast).

We will acquire images and videos from the Raspberry Pi camera and process them with OpenCV on the Raspberry Pi itself. We can use this to track moving objects such as the laser spot of the Cavendish experiment or the falling spheres in the glycerine experiment.

How to install OpenCV?¶

Installing OpenCV in Python 3 is trivial. Just open a terminal and type:

pip3 install opencv-python
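
You can check that the installation worked by importing the module and printing its version (a quick sanity check; your version number will differ):

import cv2
print(cv2.__version__)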

Acquiring images and videos¶

Image acquisition¶

In [1]:
import cv2

Initialise the video capture from the default camera (device 0)

In [2]:
cap = cv2.VideoCapture(0)

Acquire a frame and release the capture stream

In [3]:
ret, frame = cap.read()
cap.release() # always remember to release the capture!
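
Note that cap.read() returns False as its first value when no frame could be grabbed (for example, if the camera is missing or in use by another program). A minimal defensive sketch:

cap = cv2.VideoCapture(0)
if not cap.isOpened():
    raise RuntimeError('Could not open camera 0')
ret, frame = cap.read()
cap.release()
if not ret:
    raise RuntimeError('Could not read a frame from the camera')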

Show the image using matplotlib

In [4]:
import matplotlib.pyplot as plt
plt.imshow(frame);

Let's fix the colour. OpenCV captures the image in BGR (Blue, Green, Red) format, but plt.imshow wants it in RGB format. We can use a function of cv2 to fix that.

In [5]:
frame_rgb = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)
plt.imshow(frame_rgb);

Let's define a simple function for that

In [6]:
def plotOpenCVImage(image):
    # convert from OpenCV's BGR ordering to the RGB ordering matplotlib expects
    image_rgb = cv2.cvtColor(image, cv2.COLOR_BGR2RGB)
    return plt.imshow(image_rgb)
In [7]:
plotOpenCVImage(frame);

The NumPy array representing the image has three dimensions: the first two are the height and width of the image, the third is the colour channel.

In our case, we have three BGR channels.

In [8]:
print(f'The shape of the image is {frame.shape}')
The shape of the image is (720, 1280, 3)

For an image in grayscale, we have only one channel.

In [9]:
frame_gray = cv2.cvtColor(frame, cv2.COLOR_BGR2GRAY) # convert to greyscale
print(f'The shape of the grayscale image is {frame_gray.shape}')
plt.imshow(frame_gray, cmap='gray');
The shape of the grayscale image is (720, 1280)

Note: the pixels are indexed as image[y, x, channel], not as image[x, y, channel]. Also, the y index starts from the top, not from the bottom.
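
For example, with the 720x1280 frame we captured above (a quick sketch of the indexing convention):

print(frame[0, 0])         # BGR values of the top-left pixel
print(frame[719, 1279])    # BGR values of the bottom-right pixel
print(frame[100, 200, 0])  # blue channel of the pixel at y=100, x=200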

In [10]:
plotOpenCVImage(frame);

Which corner of the image do I select with the following?

In [11]:
plotOpenCVImage(frame[0:100, 1000:1280]);

Image saving and loading¶

Save the image to disk using cv2.imwrite

In [12]:
# save the image to file
cv2.imwrite('test_image.png', frame)
Out[12]:
True

Load the image from disk using cv2.imread

In [13]:
# load the image from file
loaded_image = cv2.imread('test_image.png')
plotOpenCVImage(loaded_image);

Video acquisition¶

Acquiring a video is as simple as reading many frames from cv2.VideoCapture. However, writing the output to a file requires us to correctly initialise a cv2.VideoWriter object.

In [14]:
def RecordVideo(outfilename, record_duration_s = 3):
    cap = cv2.VideoCapture(0)
    
    # set resolution and framerate
    frame_width = int(cap.get(cv2.CAP_PROP_FRAME_WIDTH))
    frame_height = int(cap.get(cv2.CAP_PROP_FRAME_HEIGHT))
    fps = 30 # getting it from cap.get(cv2.CAP_PROP_FPS) does not work for my webcam
    
    # Define the codec and create VideoWriter object
    fourcc = cv2.VideoWriter_fourcc(*'XVID')
    out = cv2.VideoWriter(outfilename, fourcc, fps, (frame_width, frame_height))

    print(f'Recording video for {record_duration_s} seconds with resolution {frame_width}x{frame_height}')    
    for i in range(fps * record_duration_s):
        ret, frame = cap.read()
        if not ret:
            break  # stop early if the camera fails to deliver a frame
        out.write(frame)
    
    cap.release()
    out.release()
    print(f'Video written to {outfilename}')
In [18]:
RecordVideo('test_video.avi', record_duration_s=3)
Recording video for 3 seconds with resolution 1280x720
Video written to test_video.avi

You can check the output video file created by opening it with ffplay or vlc.
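
You can also play it back from Python with cv2.imshow (a minimal sketch; this opens a native window, so it will not work in a headless session):

cap = cv2.VideoCapture('test_video.avi')
while True:
    ret, frame = cap.read()
    if not ret:
        break  # end of the file
    cv2.imshow('playback', frame)
    if cv2.waitKey(33) & 0xFF == ord('q'):  # ~30 fps; press q to stop early
        break
cap.release()
cv2.destroyAllWindows()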

Read in a video file¶

Reading in a video file frame by frame is very similar to reading from a camera. We just need to initialise the cv2.VideoCapture object with the path to the video file instead of the camera number.

In [19]:
# Open the video capture from the AVI video file
cap = cv2.VideoCapture('test_video.avi')

# Get the number of frames in the video
n_frames = int(cap.get(cv2.CAP_PROP_FRAME_COUNT))
print(f'The video contains {n_frames} frames')

# Read frames one by one
for frame_index in range(n_frames):
    ret, frame = cap.read()
    # Do something with the frame before moving on to the next one...
    print(frame_index, frame[0, 0]) # print the BGR values of the first pixel of each frame
cap.release()
The video contains 90 frames
0 [3 8 8]
1 [25 32 38]
2 [36 46 50]
3 [40 50 54]
4 [42 52 56]
...
88 [75 88 96]
89 [75 88 96]

If you want to grab a specific frame you don't need to loop. You can use the cap.set method to set the frame number. Note that the frame number is 0-based, so the first frame is frame 0.

In [20]:
# get the 10th frame in the video
cap = cv2.VideoCapture('test_video.avi')
cap.set(cv2.CAP_PROP_POS_FRAMES, 9)
ret, frame = cap.read()
cap.release()

plotOpenCVImage(frame);
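
If you grab single frames often, it may be convenient to wrap this pattern in a small helper (a hypothetical convenience function, not part of OpenCV):

def getFrame(filename, frame_index):
    cap = cv2.VideoCapture(filename)
    cap.set(cv2.CAP_PROP_POS_FRAMES, frame_index)
    ret, frame = cap.read()
    cap.release()
    if not ret:
        raise RuntimeError(f'Could not read frame {frame_index} from {filename}')
    return frame

plotOpenCVImage(getFrame('test_video.avi', 9));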

Object detection¶

Let's use a simple picture of a plane with coloured dots to learn how to detect objects in an image.

In [21]:
image = cv2.imread('test_dots.png')
plotOpenCVImage(image);

Masking¶

Apply a mask to remove the parts of the picture that may confuse the dot-identification algorithm. The mask is simply a single-channel NumPy array whose pixels are 255 where the image should be kept and 0 where it should be discarded.

In [22]:
# first create mask as a null matrix with the same shape as the image
import numpy as np
mask = np.zeros(image.shape[:2], dtype=np.uint8)

# then fill the quadrilateral defined by these four corners with 255 (keep),
# leaving everything outside at 0 (discard)
mask_corners = np.array([[180, 70], [860, 30], [840, 620], [180, 500]])
cv2.drawContours(mask, [mask_corners], -1, 255, -1) # a thickness of -1 fills the contour
plt.imshow(mask, cmap='gray');

We can now apply the mask to our image with cv2.bitwise_and, which performs a bitwise AND of the pixels and therefore zeroes out every pixel that is black (0) in the mask.

In [23]:
masked_image = cv2.bitwise_and(image, image, mask=mask)
plotOpenCVImage(masked_image);
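
For a binary mask like ours, plain NumPy indexing gives the same result and makes explicit what bitwise_and is doing (an equivalent sketch):

masked_image_np = image.copy()
masked_image_np[mask == 0] = 0  # black out every pixel where the mask is 0
plotOpenCVImage(masked_image_np);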

Coloured dot identification¶

In order to identify coloured dots it helps to move to the HSV (Hue, Saturation, Value) colour space. The Hue is the colour, the Saturation is the intensity of the colour, and the Value is the brightness. The HSV colour space is more intuitive than the RGB/BGR colour space, and it is easier to identify colours in it.
In [24]:
hsv_image = cv2.cvtColor(masked_image, cv2.COLOR_BGR2HSV)
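
If you are not sure which hue a colour corresponds to, you can convert a single pixel and read the value off. For example, pure green maps to hue 60 on OpenCV's 0-179 hue scale (a quick sketch):

pure_green = np.uint8([[[0, 255, 0]]])  # a 1x1 'image' containing one BGR pixel
print(cv2.cvtColor(pure_green, cv2.COLOR_BGR2HSV))  # [[[ 60 255 255]]]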

Then we use cv2.inRange to select the pixels whose Hue lies between the minimum and maximum values we want to select. Here, green has a hue value around $80$. The range we allow is $\pm 10$, but it can be tweaked to be more or less inclusive.

In [25]:
lower_green = np.array([70, 40, 40])    # Lower bound for green hue (adjust as needed)
upper_green = np.array([90, 255, 255])  # Upper bound for green hue (adjust as needed)
green_regions = cv2.inRange(hsv_image, lower_green, upper_green)
plt.imshow(green_regions, cmap='gray');

We then use cv2.findContours to find the contours of the green objects in the image. We can then loop over the contours and find the centroid (mean pixel position) of each object by using cv2.moments.

In [26]:
plotOpenCVImage(masked_image);
contours, _ = cv2.findContours(green_regions, cv2.RETR_TREE, cv2.CHAIN_APPROX_SIMPLE)

green_dots_positions = []
for contour in contours:
    if cv2.contourArea(contour) > 50:  # Minimum contour area threshold
        M = cv2.moments(contour)
        center_x = M["m10"] / M["m00"]
        center_y = M["m01"] / M["m00"]
        print(f"Centroid of green dot: (x, y) = ({center_x:.1f}, {center_y:.1f})")
        plt.scatter(center_x, center_y, color='green', marker='o', facecolor='none', s=100);
        green_dots_positions.append([center_x, center_y])
Centroid of green dot: (x, y) = (570.6, 448.1)
Centroid of green dot: (x, y) = (575.2, 310.9)
Centroid of green dot: (x, y) = (576.6, 171.1)
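
The same recipe works for other colours, with one caveat: red hues wrap around the ends of OpenCV's 0-179 hue scale, so red needs two ranges combined with cv2.bitwise_or (a sketch; the bounds would need tuning for your image):

lower_red1, upper_red1 = np.array([0, 40, 40]), np.array([10, 255, 255])
lower_red2, upper_red2 = np.array([170, 40, 40]), np.array([179, 255, 255])
red_regions = cv2.bitwise_or(cv2.inRange(hsv_image, lower_red1, upper_red1),
                             cv2.inRange(hsv_image, lower_red2, upper_red2))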

Perspective transformation and calibration¶

We want to measure the position of the identified dots in a given plane, expressed in a chosen set of coordinates. To calibrate and correct for perspective we need 4 points in the image and their corresponding coordinates in the plane.

In [27]:
calibration_pixels = np.array([[199, 488], [200, 98], [812, 570], [834, 62]], dtype=np.float32)
for x, y in calibration_pixels:
    plt.scatter(x, y, color='black', marker='o', facecolor='none', s=100)

# the corresponding coordinates in the plane are:
calibration_coords = np.array([[0, 0], [0, 2], [3, 0], [3, 2]], dtype=np.float32)

plotOpenCVImage(masked_image);

We can then use OpenCV to map the pixel positions of the points in the image to their positions in the plane.

We use a perspective transformation because the camera sensor is not parallel to the plane.

In [28]:
transform_matrix = cv2.getPerspectiveTransform(calibration_pixels, calibration_coords)

def get_coordinates(x_pixel, y_pixel, transform_matrix=transform_matrix):
    # express the pixel position in homogeneous coordinates
    point_pixels = np.array([[x_pixel], [y_pixel], [1]], dtype=np.float32)
    point_coords = transform_matrix.dot(point_pixels)
    point_coords = point_coords / point_coords[2]  # normalise the homogeneous coordinates
    return point_coords[0][0], point_coords[1][0]

Now let's try our calibration on the green dots we identified before.

Can we get their coordinates in the plane correctly?

In [29]:
for x, y in green_dots_positions:
    x_coord, y_coord = get_coordinates(x, y)
    print(f"Green dot at (x, y) = ({x_coord:.1f}, {y_coord:.1f})")
plotOpenCVImage(masked_image);
Green dot at (x, y) = (2.0, 0.4)
Green dot at (x, y) = (2.0, 1.0)
Green dot at (x, y) = (2.0, 1.6)
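
For many points at once, cv2.perspectiveTransform applies the same mapping in a single call; it expects a float32 array of shape (N, 1, 2) (an equivalent sketch of the manual matrix multiplication above):

points = np.array(green_dots_positions, dtype=np.float32).reshape(-1, 1, 2)
coords = cv2.perspectiveTransform(points, transform_matrix)
print(coords.reshape(-1, 2))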

Summary¶

We have seen how to use OpenCV to:

  • Acquire images and videos
  • Save and load images and videos
  • Mask uninteresting parts of the image
  • Identify coloured dots in the image
  • Transform pixel positions into coordinates in a plane

How can you use this?¶

  • Use the Raspberry Pi camera to track objects and get their calibrated position
  • You can use these coordinates to analyse the motion of the objects
  • You can analyse the data in Python and get results in real time