scripts/utils.py

import os
import sys
import cv2
import json
import keras
import pickle
import numpy as np
import tensorflow as tf

from config import *
from typing import TypeVar
from keras.applications.xception import Xception
from keras.applications.mobilenet_v2 import MobileNetV2
from keras.applications.inception_v3 import InceptionV3
from keras.applications.inception_resnet_v2 import InceptionResNetV2


config = tf.ConfigProto()
config.gpu_options.allow_growth = True
sess = tf.Session(config=config)
T = TypeVar('T')
MODELS = {
	'xception': 'Xception',
	'mobilenetv2': 'MobileNetV2',
	'inceptionv3': 'InceptionV3',
	'inceptionresnetv2': 'InceptionResNetV2'
}


def read_json(path: str) -> dict:
	"""
	Reads a json file given by the path.
	
	Arguments:
		path {str} -- path of the json file to be read
	
	Returns:
		dict -- label, encoding pairs which describe the mapping
	"""
	with open(path, 'r') as f:
		return json.load(f)


def read_image(path: str) -> np.ndarray:
	"""
	Reads an image given by the path.
	
	Arguments:
		path {str} -- the path of the image to be read
	
	Returns:
		np.ndarray -- an array of image pixels
	"""
	img = cv2.imread(path, cv2.IMREAD_UNCHANGED)
	return np.asarray(img)


def save_image(img: np.ndarray, path: str) -> None:
	"""
	Saves an image to the given path.

	Arguments:
		img {np.ndarray} -- an array of image pixels
		path {str} -- the path of the image to be saved
	"""
	cv2.imwrite(path, img)


def show_image(img: np.ndarray) -> None:
	"""
	Display the image on the screen.
	
	Arguments:
		img {np.ndarray} -- an array of image pixels
	"""
	cv2.imshow('Image', img)
	cv2.waitKey()


def serialize(data: T, path: str) -> None:
	"""
	Serializes the given data and stores the binary in the given path.
	
	Arguments:
		data {T} -- object to serialize
		path {str} -- path to output serialized object
	"""
	with open(path, 'wb') as f:
		pickle.dump(data, f, protocol=pickle.HIGHEST_PROTOCOL)


def deserialize(path: str) -> T:
	"""
	Deserializes the binary in the given path.
	
	Arguments:
		path {str} -- path to serialized object
	
	Returns:
		T -- deserialized object
	"""
	with open(path, 'rb') as f:
		data = pickle.load(f)
	return data


def resize_image(img: np.ndarray) -> np.ndarray:
	"""
	Resizes an image to shape [SHAPE×SHAPE×CHANNELS] format with padding to keep the aspect ratio.
	
	Arguments:
		img {np.ndarray} -- an array of image pixels
	
	Returns:
		np.ndarray -- resized image of shape [SHAPE×SHAPE×CHANNELS]
	"""
	# convert grayscale to rgb
	if len(img.shape) == 2:
		img = cv2.cvtColor(img, cv2.COLOR_GRAY2RGB)
	elif len(image.shape) != 3:
		sys.exit(f'Expected image format to be of Grayscale or Color, found image with shape {img.shape} instead.')
	
	# resize the image
	old_shape = img.shape[1::-1]
	ratio = SHAPE / max(old_shape)
	new_shape = tuple([int(dim * ratio) for dim in old_shape])
	img = cv2.resize(img, new_shape)

	# pad the image
	color = [0, 0, 0]
	w, h = [SHAPE - dim for dim in new_shape]
	top, bottom = h // 2, h - h // 2
	left, right = w // 2, w - w // 2
	img = cv2.copyMakeBorder(img, top, bottom, left, right, cv2.BORDER_CONSTANT, value=color)

	return img


def shuffle_in_unison(a: np.ndarray, b: np.ndarray) -> None:
	"""
	Shuffles 2 numpy arrays together inplace.
	AssertionError if the lengths of a & b are not the same.
	
	Arguments:
		a {np.ndarray} -- a numpy array
		b {np.ndarray} -- a numpy array
	"""
	assert len(a) == len(b)
	rng_state = np.random.get_state()
	np.random.shuffle(a)
	np.random.set_state(rng_state)
	np.random.shuffle(b)


def last_count(path: str) -> int:
	"""
	Computes the last count of the data in the path having format '[label]_[count].png'.
	
	Arguments:
		path {str} -- path to a directory containing the data
	
	Returns:
		int -- last count in the path
	"""
	files = os.listdir(path)
	if not files:
		return 0
	files = [int(f.split('_')[-1].split('.')[0]) for f in files if f.endswith('.png')]
	return sorted(files)[-1]


def region_of_interest(img: np.ndarray) -> np.ndarray:
	"""
	Given an image, computes the region of interest.

	Arguments:
		img {np.ndarray} -- an array of image pixels

	Returns:
		np.ndarray -- region of interest (roi)
	"""
	offset = 125
	height = img.shape[0]
	
	# compute the coordinates of roi
	x1, x2 = 150 - offset, 150 + offset
	y1, y2 = height // 2 - offset, height // 2 + offset
	
	# draw a blue bounding box on the image
	cv2.rectangle(img, (x1, y1), (x2, y2), (255, 0, 0), 2)
	
	return img[y1:y2, x1:x2]


def load_learning_model(model: str) -> keras.Model:
	"""
	Loads the transfer learning model with input shape [SHAPE×SHAPE×CHANNELS].
	
	Arguments:
		model {str} -- One of the options available from MODELS.keys()
	
	Returns:
		keras.Model -- the transfer learning model
	"""
	model = globals()[f'{MODELS[model]}'](include_top=False, weights='imagenet', input_shape=(SHAPE, SHAPE, CHANNELS), classes=NUM_CLASSES)
	layer = model.layers[-1]
	return keras.Model(inputs=model.inputs, outputs=layer.output)