import cv2
from matplotlib import pyplot as plt
import numpy as np

# Load the sample picture and display it with matplotlib. The array is run
# through a BGR -> RGB conversion first so the channels are in the order
# matplotlib draws them.
cat_path = "./sample/cat.jpg"
image = cv2.imread(cat_path)
rgb_image = cv2.cvtColor(image, cv2.COLOR_BGR2RGB)
plt.imshow(rgb_image)
plt.show()  # Why do we need cv2.cvtColor here?

# Display the array exactly as cv2.imread returned it, with no channel
# conversion, for comparison with the converted version.
cat_path = "./sample/cat.jpg"
image = cv2.imread(cat_path)
plt.imshow(image)
plt.show()

# Print the dimensions of the loaded array.
cat_path = "./sample/cat.jpg"
image = cv2.imread(cat_path)
image_shape = image.shape
print(image_shape)

(3888, 5184, 3)

# Convert the picture to a single-channel grayscale image and display it
# with matplotlib's gray colormap.
cat_path = "./sample/cat.jpg"
image = cv2.imread(cat_path)
gray_image = cv2.cvtColor(image, cv2.COLOR_BGR2GRAY)
plt.imshow(gray_image, cmap='gray')
plt.show()

# Rotate the picture a quarter turn counter-clockwise and display it.
cat_path = "./sample/cat.jpg"
image = cv2.imread(cat_path)
rotated_image = cv2.rotate(image, cv2.ROTATE_90_COUNTERCLOCKWISE)
rotated_rgb = cv2.cvtColor(rotated_image, cv2.COLOR_BGR2RGB)
plt.imshow(rotated_rgb)
plt.show()

# Rotate the picture by 45 degrees about its center with an affine warp.
# The output canvas keeps the original width and height.
image = cv2.imread("./sample/cat.jpg")
height, width = image.shape[:2]
output_size = (width, height)  # OpenCV sizes and points are (x, y) ordered
image_center = (width / 2, height / 2)
rotation_matrix = cv2.getRotationMatrix2D(image_center, 45, 1.0)
rotated_image = cv2.warpAffine(
    image,
    rotation_matrix,
    output_size,
    flags=cv2.INTER_LINEAR,
)
rotated_rgb = cv2.cvtColor(rotated_image, cv2.COLOR_BGR2RGB)
plt.imshow(rotated_rgb)
plt.show()

# Crop the picture with array slicing: rows 200..799 and columns 0..3999.
image = cv2.imread("./sample/cat.jpg")
row_range = slice(200, 800)
column_range = slice(None, 4000)
cropped_image = image[row_range, column_range]
cropped_rgb = cv2.cvtColor(cropped_image, cv2.COLOR_BGR2RGB)
plt.imshow(cropped_rgb)
plt.show()

# Paste the beluga picture onto the top-left corner of the cat picture.
image = cv2.imread("./sample/cat.jpg")
beluga = cv2.imread("./sample/beluga.jpg")
beluga_height, beluga_width, beluga_depth = beluga.shape
# Clip the pasted region to the area both pictures share, so an overlay that
# is larger than the background is cropped instead of raising a
# shape-mismatch error on assignment.
overlay_height = min(beluga_height, image.shape[0])
overlay_width = min(beluga_width, image.shape[1])
image[:overlay_height, :overlay_width, :beluga_depth] = (
    beluga[:overlay_height, :overlay_width]
)
plt.imshow(cv2.cvtColor(image, cv2.COLOR_BGR2RGB))
plt.show()

# Load the second sample picture and display it after a BGR -> RGB conversion.
leena_path = "./sample/leena.png"
image = cv2.imread(leena_path)
rgb_image = cv2.cvtColor(image, cv2.COLOR_BGR2RGB)
plt.imshow(rgb_image)
plt.show()

# Add Gaussian noise with the given mean and standard deviation to the picture.
image = cv2.imread("./sample/leena.png")
mean = 0
stddev = 50
# Draw the noise as signed floating-point values, one per pixel and channel.
# An unsigned 8-bit noise buffer cannot hold the negative half of the
# distribution, which would make the noise only ever brighten the picture.
noise = np.random.normal(mean, stddev, image.shape)
# Add in floating point, then round and clip back into the 0..255 range
# before converting to 8-bit so values saturate instead of wrapping around.
noisy_image = np.clip(np.rint(image + noise), 0, 255).astype(np.uint8)
plt.imshow(cv2.cvtColor(noisy_image, cv2.COLOR_BGR2RGB))
plt.show()

# Smooth the noisy picture produced earlier with a 9x9 Gaussian kernel
# (sigma 3) and display the result.
blur_kernel_size = (9, 9)
blur_sigma = 3
blurred_image = cv2.GaussianBlur(noisy_image, blur_kernel_size, blur_sigma)
blurred_rgb = cv2.cvtColor(blurred_image, cv2.COLOR_BGR2RGB)
plt.imshow(blurred_rgb)
plt.show()

# Raise the contrast by scaling every pixel value by 1.5 (no added offset).
image = cv2.imread("./sample/leena.png")
contrast_gain = 1.5
brightness_offset = 0
enhanced_image = cv2.convertScaleAbs(
    image, alpha=contrast_gain, beta=brightness_offset)
enhanced_rgb = cv2.cvtColor(enhanced_image, cv2.COLOR_BGR2RGB)
plt.imshow(enhanced_rgb)
plt.show()

# Sharpen the picture by filtering it with a 3x3 kernel whose weights sum
# to 1: the center pixel is boosted and its four direct neighbours subtracted.
image = cv2.imread("./sample/leena.png")
kernel = np.array([
    [0, -1, 0],
    [-1, 5, -1],
    [0, -1, 0],
])
same_depth_as_source = -1
sharpened_image = cv2.filter2D(image, same_depth_as_source, kernel)
sharpened_rgb = cv2.cvtColor(sharpened_image, cv2.COLOR_BGR2RGB)
plt.imshow(sharpened_rgb)
plt.show()

# Run Canny edge detection with thresholds 100 and 200 and display the
# resulting edge map in grayscale.
image = cv2.imread("./sample/leena.png")
th1, th2 = 100, 200
edges = cv2.Canny(image, threshold1=th1, threshold2=th2)
plt.imshow(edges, cmap="gray")
plt.show()

import torch
# Fetch a pretrained ResNet-18 through torch.hub, switch it to evaluation
# mode, and report how many parameters it has.
model_name = "resnet18"
hub_repo = 'pytorch/vision:v0.10.0'
model = torch.hub.load(hub_repo, model_name, pretrained=True)
model.eval()
params = 0
for parameter in model.parameters():
    params += parameter.numel()
print(f"{model_name} 共有 {params} 個參數")

Using cache found in /home/namwoam/.cache/torch/hub/pytorch_vision_v0.10.0

resnet18 共有 11689512 個參數

from torchvision import transforms
# Load the picture to classify and turn it into a model input batch.
image = cv2.imread("./sample/alligator.jpg")
rgb_image = cv2.cvtColor(image, cv2.COLOR_BGR2RGB)
# Preprocessing: convert the array to a tensor, then normalize each of the
# three channels with the given mean and standard deviation.
to_tensor = transforms.ToTensor()
normalize = transforms.Normalize(
    mean=[0.485, 0.456, 0.406],
    std=[0.229, 0.224, 0.225],
)
preprocess = transforms.Compose([to_tensor, normalize])
input_tensor = preprocess(rgb_image)
# Add a leading batch dimension so the model receives a batch of one image.
input_batch = input_tensor.unsqueeze(0)
plt.imshow(rgb_image)
plt.show()

# When a GPU is available, move both the model and the input onto it to
# speed up inference.
gpu_available = torch.cuda.is_available()
if gpu_available:
    model.to('cuda')
    input_batch = input_batch.to('cuda')

# Forward pass with gradient tracking disabled. The result is a 1 x 1000
# matrix holding the prediction score for each of the 1000 classes.
with torch.no_grad():
    output = model(input_batch)

# Turn the scores of the single image in the batch into probabilities.
class_scores = output[0]
probabilities = torch.nn.functional.softmax(class_scores, dim=0)
# Read the class names, one per line, from the label file.
with open("imagenet_classes.txt", "r") as f:
    categories = [line.strip() for line in f]
# Pick the five most likely classes and print each name with its probability.
top5_prob, top5_catid = torch.topk(probabilities, 5)
for probability, category_id in zip(top5_prob.tolist(), top5_catid.tolist()):
    print(categories[category_id], probability)

American alligator 0.2871130704879761
African crocodile 0.08221334964036942
hippopotamus 0.02637476660311222
Komodo dragon 0.02383621595799923
chimpanzee 0.016115523874759674

Python Computer Vision¶

Notes¶

Outline¶

Computer Vision Intro¶

What is Computer Vision ?¶

A Bit of History¶

A Bit of History Cont.¶

A Bit of History Cont.¶

A Bit of History Cont.¶

Image Processing¶

Before we start¶

Import Packages¶

Read Image¶

Image Size¶

Grayscale¶

Rotate¶

Custom Rotation¶

Crop¶

Overlay¶

Practice¶

Image Filter¶

Blur¶

Contrast¶

Algorithm¶

Sharpen¶

Edge Detection¶

Algorithm¶

Practice¶

Image Classification¶

Machine Learning¶

高中生也會的 Deep Learning¶

高中生也會的 Deep Learning Cont.¶

Convolutional Neural Network¶

AlexNet¶

呼叫深度學習模型！¶

Practice¶

Remarks¶

Source¶

Additional Information¶

The sky is the limit!!¶