averdones/deeplab_demo_webcam_v2.py

## deeplab_demo_webcam_v2.py
### THIS FILE CAN BE RUN ANYWHERE IN A TERMINAL WRITING 'python deeplab_demo_webcam_v2.py' AS LONG
### AS THE HELPER FILE get_dataset_colormap.py IS IN THE SAME DIRECTORY AS deeplab_demo_webcam_v2.py

## Imports

import collections
import os
import io
import sys
import tarfile
import tempfile
import urllib

from matplotlib import gridspec
from matplotlib import pyplot as plt
import numpy as np
from PIL import Image
import cv2
# import skvideo.io

import tensorflow as tf

# Needed to show segmentation colormap labels
sys.path.append('utils')
import get_dataset_colormap


## Select and download models
_MODEL_URLS = {
    'xception_coco_voctrainaug': 'http://download.tensorflow.org/models/deeplabv3_pascal_train_aug_2018_01_04.tar.gz',
    'xception_coco_voctrainval': 'http://download.tensorflow.org/models/deeplabv3_pascal_trainval_2018_01_04.tar.gz',
}

_TARBALL_NAME = 'deeplab_model.tar.gz'
model_url = _MODEL_URLS['xception_coco_voctrainaug']

model_dir = tempfile.mkdtemp()
tf.io.gfile.makedirs(model_dir)

download_path = os.path.join(model_dir, _TARBALL_NAME)
print('downloading model to %s, this might take a while...' % download_path)
urllib.request.urlretrieve(model_url, download_path)
print('download completed!')

## Load model in TensorFlow
_FROZEN_GRAPH_NAME = 'frozen_inference_graph'

class DeepLabModel(object):
    """Class to load deeplab model and run inference."""

    INPUT_TENSOR_NAME = 'ImageTensor:0'
    OUTPUT_TENSOR_NAME = 'SemanticPredictions:0'
    INPUT_SIZE = 513

    def __init__(self, tarball_path):
        """Creates and loads pretrained deeplab model."""
        self.graph = tf.Graph()

        graph_def = None
        # Extract frozen graph from tar archive.
        tar_file = tarfile.open(tarball_path)
        for tar_info in tar_file.getmembers():
            if _FROZEN_GRAPH_NAME in os.path.basename(tar_info.name):
                file_handle = tar_file.extractfile(tar_info)
                graph_def = tf.compat.v1.GraphDef.FromString(file_handle.read())
                break

        tar_file.close()

        if graph_def is None:
            raise RuntimeError('Cannot find inference graph in tar archive.')

        with self.graph.as_default():
            tf.import_graph_def(graph_def, name='')

        self.sess = tf.compat.v1.Session(graph=self.graph)

    def run(self, image):
        """Runs inference on a single image.

        Args:
            image: A PIL.Image object, raw input image.

        Returns:
            resized_image: RGB image resized from original input image.
            seg_map: Segmentation map of `resized_image`.
        """
        width, height = image.size
        resize_ratio = 1.0 * self.INPUT_SIZE / max(width, height)
        target_size = (int(resize_ratio * width), int(resize_ratio * height))
        resized_image = image.convert('RGB').resize(target_size, Image.ANTIALIAS)
        batch_seg_map = self.sess.run(
            self.OUTPUT_TENSOR_NAME,
            feed_dict={self.INPUT_TENSOR_NAME: [np.asarray(resized_image)]})
        seg_map = batch_seg_map[0]
        return resized_image, seg_map

model = DeepLabModel(download_path)

## Webcam demo
cap = cv2.VideoCapture(0)

# Next line may need adjusting depending on webcam resolution
final = np.zeros((1, 384, 1026, 3))
while True:
    ret, frame = cap.read()

    # From cv2 to PIL
    cv2_im = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)
    pil_im = Image.fromarray(cv2_im)

    # Run model
    resized_im, seg_map = model.run(pil_im)

    # Adjust color of mask
    seg_image = get_dataset_colormap.label_to_color_image(
        seg_map, get_dataset_colormap.get_pascal_name()).astype(np.uint8)

    # Convert PIL image back to cv2 and resize
    frame = np.array(pil_im)
    r = seg_image.shape[1] / frame.shape[1]
    dim = (int(frame.shape[0] * r), seg_image.shape[1])[::-1]
    resized = cv2.resize(frame, dim, interpolation = cv2.INTER_AREA)
    resized = cv2.cvtColor(resized, cv2.COLOR_RGB2BGR)

    # Stack horizontally color frame and mask
    color_and_mask = np.hstack((resized, seg_image))

    cv2.imshow('frame', color_and_mask)
    if cv2.waitKey(25) & 0xFF == ord('q'):
        cap.release()
        cv2.destroyAllWindows()
        break


###  UNCOMMENT NEXT LINES TO SAVE THE VIDEO  ###
#    output = np.expand_dims(both, axis=0)
#    final = np.append(final, output, 0)
#skvideo.io.vwrite("outputvideo111.mp4", final)
	### THIS FILE CAN BE RUN ANYWHERE IN A TERMINAL WRITING 'python deeplab_demo_webcam_v2.py' AS LONG
	### AS THE HELPER FILE get_dataset_colormap.py IS IN THE SAME DIRECTORY AS deeplab_demo_webcam_v2.py

	## Imports

	import collections
	import os
	import io
	import sys
	import tarfile
	import tempfile
	import urllib

	from matplotlib import gridspec
	from matplotlib import pyplot as plt
	import numpy as np
	from PIL import Image
	import cv2
	# import skvideo.io

	import tensorflow as tf

	# Needed to show segmentation colormap labels
	sys.path.append('utils')
	import get_dataset_colormap


	## Select and download models
	_MODEL_URLS = {
	'xception_coco_voctrainaug': 'http://download.tensorflow.org/models/deeplabv3_pascal_train_aug_2018_01_04.tar.gz',
	'xception_coco_voctrainval': 'http://download.tensorflow.org/models/deeplabv3_pascal_trainval_2018_01_04.tar.gz',
	}

	_TARBALL_NAME = 'deeplab_model.tar.gz'
	model_url = _MODEL_URLS['xception_coco_voctrainaug']

	model_dir = tempfile.mkdtemp()
	tf.io.gfile.makedirs(model_dir)

	download_path = os.path.join(model_dir, _TARBALL_NAME)
	print('downloading model to %s, this might take a while...' % download_path)
	urllib.request.urlretrieve(model_url, download_path)
	print('download completed!')

	## Load model in TensorFlow
	_FROZEN_GRAPH_NAME = 'frozen_inference_graph'

	class DeepLabModel(object):
	"""Class to load deeplab model and run inference."""

	INPUT_TENSOR_NAME = 'ImageTensor:0'
	OUTPUT_TENSOR_NAME = 'SemanticPredictions:0'
	INPUT_SIZE = 513

	def __init__(self, tarball_path):
	"""Creates and loads pretrained deeplab model."""
	self.graph = tf.Graph()

	graph_def = None
	# Extract frozen graph from tar archive.
	tar_file = tarfile.open(tarball_path)
	for tar_info in tar_file.getmembers():
	if _FROZEN_GRAPH_NAME in os.path.basename(tar_info.name):
	file_handle = tar_file.extractfile(tar_info)
	graph_def = tf.compat.v1.GraphDef.FromString(file_handle.read())
	break

	tar_file.close()

	if graph_def is None:
	raise RuntimeError('Cannot find inference graph in tar archive.')

	with self.graph.as_default():
	tf.import_graph_def(graph_def, name='')

	self.sess = tf.compat.v1.Session(graph=self.graph)

	def run(self, image):
	"""Runs inference on a single image.

	Args:
	image: A PIL.Image object, raw input image.

	Returns:
	resized_image: RGB image resized from original input image.
	seg_map: Segmentation map of `resized_image`.
	"""
	width, height = image.size
	resize_ratio = 1.0 * self.INPUT_SIZE / max(width, height)
	target_size = (int(resize_ratio * width), int(resize_ratio * height))
	resized_image = image.convert('RGB').resize(target_size, Image.ANTIALIAS)
	batch_seg_map = self.sess.run(
	self.OUTPUT_TENSOR_NAME,
	feed_dict={self.INPUT_TENSOR_NAME: [np.asarray(resized_image)]})
	seg_map = batch_seg_map[0]
	return resized_image, seg_map

	model = DeepLabModel(download_path)

	## Webcam demo
	cap = cv2.VideoCapture(0)

	# Next line may need adjusting depending on webcam resolution
	final = np.zeros((1, 384, 1026, 3))
	while True:
	ret, frame = cap.read()

	# From cv2 to PIL
	cv2_im = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)
	pil_im = Image.fromarray(cv2_im)

	# Run model
	resized_im, seg_map = model.run(pil_im)

	# Adjust color of mask
	seg_image = get_dataset_colormap.label_to_color_image(
	seg_map, get_dataset_colormap.get_pascal_name()).astype(np.uint8)

	# Convert PIL image back to cv2 and resize
	frame = np.array(pil_im)
	r = seg_image.shape[1] / frame.shape[1]
	dim = (int(frame.shape[0] * r), seg_image.shape[1])[::-1]
	resized = cv2.resize(frame, dim, interpolation = cv2.INTER_AREA)
	resized = cv2.cvtColor(resized, cv2.COLOR_RGB2BGR)

	# Stack horizontally color frame and mask
	color_and_mask = np.hstack((resized, seg_image))

	cv2.imshow('frame', color_and_mask)
	if cv2.waitKey(25) & 0xFF == ord('q'):
	cap.release()
	cv2.destroyAllWindows()
	break


	### UNCOMMENT NEXT LINES TO SAVE THE VIDEO ###
	# output = np.expand_dims(both, axis=0)
	# final = np.append(final, output, 0)
	#skvideo.io.vwrite("outputvideo111.mp4", final)