Computer Vision basics
Computer Vision basics
@Tajamulkhann
Convert images to grayscale
Resize images
Normalize pixel values
Apply filters (Gaussian Blur, Edge Detection)
import cv2
import numpy as np
# Load image
image = cv2.imread("image.jpg")
# cv2.imread reports a missing or unreadable file by returning None instead of
# raising, so fail here with a clear error rather than later inside cvtColor.
if image is None:
    raise FileNotFoundError("image.jpg")
# Convert to grayscale (OpenCV loads colour images in BGR channel order)
gray = cv2.cvtColor(image, cv2.COLOR_BGR2GRAY)
# Resize image to 128x128 pixels
resized = cv2.resize(gray, (128, 128))
# Normalize pixel values by dividing by 255.0
normalized = resized / 255.0
@Tajamulkhann
Sobel & Canny Edge Detection
Blurring (Gaussian, Median, Bilateral)
@Tajamulkhann
Rotation, Flipping, Zooming, Shearing
Used to increase dataset diversity in deep learning
from tensorflow.keras.preprocessing.image import ImageDataGenerator

# Augmentation generator configured with rotation_range=30 and random
# horizontal flips.
datagen = ImageDataGenerator(rotation_range=30, horizontal_flip=True)
# Apply one random transformation to the loaded image.
augmented_image = datagen.random_transform(image)
@Tajamulkhann
Classifies images into categories
import tensorflow as tf
# Small CNN image classifier, assembled layer by layer:
# one convolution + pooling stage, then a dense head with 10 softmax outputs.
model = tf.keras.Sequential()
model.add(
    tf.keras.layers.Conv2D(
        32,
        (3, 3),
        activation='relu',
        input_shape=(128, 128, 3),
    )
)
model.add(tf.keras.layers.MaxPooling2D(2, 2))
model.add(tf.keras.layers.Flatten())
model.add(tf.keras.layers.Dense(128, activation='relu'))
model.add(tf.keras.layers.Dense(10, activation='softmax'))

# Configure training: Adam optimizer, categorical cross-entropy loss,
# accuracy reported as the metric.
model.compile(
    optimizer='adam',
    loss='categorical_crossentropy',
    metrics=['accuracy'],
)
@Tajamulkhann
SSD, Faster R-CNN
YOLO (You Only Look Once) – Real-time object detection
import cv2
# Load the YOLOv3 network from its weights and configuration files.
net = cv2.dnn.readNet("yolov3.weights", "yolov3.cfg")
layer_names = net.getLayerNames()
# Ask OpenCV for the output-layer names directly: the index array returned by
# getUnconnectedOutLayers() is 1-D or Nx1 depending on the OpenCV version, so
# indexing layer_names by hand fails on some releases.
output_layers = list(net.getUnconnectedOutLayersNames())
@Tajamulkhann
Haar Cascades – Pre-trained classifiers for detecting faces
# Load the pre-trained frontal-face Haar cascade from OpenCV's
# cv2.data.haarcascades directory.
face_cascade = cv2.CascadeClassifier(
    cv2.data.haarcascades + "haarcascade_frontalface_default.xml"
)
# Detect faces in the grayscale image (scaleFactor=1.1, minNeighbors=4).
faces = face_cascade.detectMultiScale(gray, 1.1, 4)
@Tajamulkhann
Divides an image into meaningful parts
import cv2
@Tajamulkhann
Extracts text from images
import pytesseract
# Run Tesseract OCR on the grayscale image and print the extracted text.
text = pytesseract.image_to_string(gray)
print(text)
@Tajamulkhann
(GANs, Autoencoders)
GANs (Generative Adversarial Networks) – Generate new images
# GAN generator: a stack of dense layers mapping a 100-dimensional input
# vector to 784 tanh-activated outputs.
# NOTE(review): 784 presumably corresponds to a flattened 28x28 image — confirm.
# Layers are referenced through tf.keras (as in the classifier snippet) because
# bare Sequential/Dense/LeakyReLU names are never imported in this file.
generator = tf.keras.Sequential([
    tf.keras.layers.Dense(256, input_dim=100),
    tf.keras.layers.LeakyReLU(alpha=0.2),
    tf.keras.layers.Dense(512, activation='relu'),
    tf.keras.layers.Dense(1024, activation='relu'),
    tf.keras.layers.Dense(784, activation='tanh'),
])
@Tajamulkhann
Follow for more!