Kartik-cl/block11.python Secret

## block11.python
"""
 Copyright (c) 2019 Intel Corporation
 Licensed under the Apache License, Version 2.0 (the "License");
 you may not use this file except in compliance with the License.
 You may obtain a copy of the License at
      http://www.apache.org/licenses/LICENSE-2.0
 Unless required by applicable law or agreed to in writing, software
 distributed under the License is distributed on an "AS IS" BASIS,
 WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 See the License for the specific language governing permissions and
 limitations under the License.
"""

import argparse
import logging
import sys
from pydoc import locate
import cherrypy
import json
from tqdm import tqdm
import base64
from PIL import Image
import io

from segmentoly.data.dataparallel import collate
from segmentoly.data.transforms import *
from segmentoly.datasets.factory import get_dataset
from segmentoly.datasets.images import ImagesDataset
from segmentoly.datasets.video import VideoDataset
from segmentoly.rcnn.openvino_net import MaskRCNNOpenVINO
from segmentoly.utils.logging import setup_logging
from segmentoly.utils.postprocess import postprocess
from segmentoly.utils.profile import Timer
from segmentoly.utils.stats import add_flops_counting_methods, flops_to_string, print_model_with_flops
from segmentoly.utils.tracker import StaticIOUTracker
from segmentoly.utils.visualizer import Visualizer
from segmentoly.utils.weights import load_checkpoint


class Inference:
    """Command-line driven Mask R-CNN demo that runs an OpenVINO network.

    Constructing an instance parses ``sys.argv``, builds the preprocessing
    pipeline, obtains the dataset named by ``--dataset`` through
    ``get_dataset`` (its ``classes`` attribute is used for labelling) and
    instantiates ``MaskRCNNOpenVINO``.

    NOTE(review): ``__init__`` reads ``openvino_model_path``, ``device``,
    ``plugin_dir``, ``cpu_extension`` and ``show_performance_counters``.
    Those options are only registered on the ``openvino`` sub-command, so
    running with the ``pytorch`` sub-command (or none) ends in an
    ``AttributeError``.
    """

    def __init__(self):
        """Parse CLI options, then build the transforms, dataset and network."""
        self.args = self.parse_args()
        self.transforms = Compose([
            Resize(max_size=self.args.fit_max_image_size,
                   window_size=self.args.fit_window_size,
                   size=self.args.size),
            ToTensor(),
            Normalize(mean=self.args.mean_pixel, std=[1., 1., 1.], rgb=self.args.rgb),
        ])
        self.dataset = get_dataset(self.args.dataset, False, False, self.transforms)
        self.batch_size = 1
        self.net = MaskRCNNOpenVINO(
            self.args.openvino_model_path,
            self.args.checkpoint_file_path,
            device=self.args.device,
            plugin_dir=self.args.plugin_dir,
            cpu_extension_lib_path=self.args.cpu_extension,
            collect_perf_counters=self.args.show_performance_counters,
        )

    def parse_args(self):
        """Build the argument parser and parse ``sys.argv``.

        Required on the command line: ``--ckpt``, exactly one of
        ``--fit_max`` / ``--fit_window`` / ``--size``, and exactly one of
        ``-v/--video`` / ``-i/--images``. Backend-specific options live on
        the ``openvino`` and ``pytorch`` sub-commands; the chosen sub-command
        name is stored in ``backend``.

        Returns:
            argparse.Namespace: The parsed options.
        """
        parser = argparse.ArgumentParser(description='Run instance segmentation live')
        subparsers = parser.add_subparsers(help='Backend', dest='backend')

        # --- Options shared by every backend -------------------------------
        parser.add_argument('--dataset', help='Training dataset')
        parser.add_argument('--ckpt', dest='checkpoint_file_path', required=True,
                            help='File with models weights')
        parser.add_argument('--mean_pixel', default=(0.0, 0.0, 0.0), type=float, nargs=3,
                            metavar='<num>',
                            help='Mean pixel value to subtract from image.')
        parser.add_argument('--rgb', action='store_true',
                            help='Use RGB instead of BGR.')

        # Exactly one resize strategy must be chosen.
        image_resize_group = parser.add_mutually_exclusive_group(required=True)
        image_resize_group.add_argument('--fit_max', dest='fit_max_image_size', default=None,
                                        type=int, nargs=2, metavar='<num>',
                                        help='Max processed image size in a format '
                                             '(max short side, max long side).')
        image_resize_group.add_argument('--fit_window', dest='fit_window_size', default=None,
                                        type=int, nargs=2, metavar='<num>',
                                        help='Max processed image size in a format (max height, max width).')
        image_resize_group.add_argument('--size', dest='size', default=None,
                                        type=int, nargs=2, metavar='<num>',
                                        help='Precise input size (height, width).')

        # Exactly one data source must be chosen.
        data_source_parser = parser.add_mutually_exclusive_group(required=True)
        data_source_parser.add_argument('-v', '--video', default=None, type=str,
                                        help='Path to a video file or numeric camera ID.')
        data_source_parser.add_argument('-i', '--images', default=None, type=str,
                                        help='Path to an image or a folder with images.')

        parser.add_argument('--show_scores', action='store_true',
                            help='Show detection scores.')
        parser.add_argument('--show_boxes', action='store_true',
                            help='Show bounding boxes.')
        parser.add_argument('--show_fps', action='store_true',
                            help='Show FPS.')
        parser.add_argument('-pt', '--prob_threshold', default=0.7, type=float,
                            help='Probability threshold for detections filtering.')
        parser.add_argument('--delay', default=0, type=int)

        # --- OpenVINO backend ----------------------------------------------
        openvino_parser = subparsers.add_parser('openvino')
        openvino_parser.add_argument('--model', dest='openvino_model_path', default=None, type=str,
                                     required=True,
                                     help='XML file with model description (OpenVINO format)')
        openvino_parser.add_argument('-d', '--device',
                                     help='Optional. Specify the target device to infer on: CPU, GPU, FPGA or MYRIAD. '
                                          'The demo will look for a suitable plugin for device specified '
                                          '(by default, it is CPU).',
                                     default='CPU', type=str, metavar='"<device>"')
        openvino_parser.add_argument('-l', '--cpu_extension',
                                     help='Required for CPU custom layers. '
                                          'Absolute path to a shared library with the kernels implementation.',
                                     default=None, type=str, metavar='"<absolute_path>"')
        openvino_parser.add_argument('-pp', '--plugin_dir',
                                     help='Optional. Path to a plugin folder.',
                                     default=None, type=str, metavar='"<absolute_path>"')
        openvino_parser.add_argument('--show_pc', '--show_performance_counters',
                                     dest='show_performance_counters',
                                     help='Show OpenVINO performance counters.',
                                     action='store_true')

        # --- PyTorch backend -----------------------------------------------
        pytorch_parser = subparsers.add_parser('pytorch')
        pytorch_parser.add_argument('--model', dest='pytorch_model_class', type=str, required=True,
                                    help='Path to module and class implementing Mask R-CNN instance segmentation model.')
        pytorch_parser.add_argument('--show_flops',
                                    help='Show FLOPs.',
                                    action='store_true')
        pytorch_parser.add_argument('--show_layers_flops',
                                    help='Show FLOPs for all modules.',
                                    action='store_true')

        return parser.parse_args()

    def output(self, img_path, show_boxes=True, out_path="out.png"):
        """Run the network on ``img_path`` and write the rendered result.

        Args:
            img_path: Handed to ``ImagesDataset``; the ``--images`` help text
                describes it as a path to an image or a folder with images.
            show_boxes: Whether bounding boxes are drawn. Defaults to
                ``True``, the value this method used to hard-code. As before,
                the value is also stored on ``self.args.show_boxes``.
            out_path: File the visualization is written to. Every processed
                image is written to this same path, so with several inputs
                only the last result remains on disk.
        """
        self.args.show_boxes = show_boxes

        viz = Visualizer(self.dataset.classes,
                         confidence_threshold=self.args.prob_threshold,
                         show_boxes=self.args.show_boxes,
                         show_scores=self.args.show_scores)

        inference_timer = Timer(cuda_sync=True, warmup=1)
        timer = Timer(cuda_sync=False, warmup=1)
        timer.tic()

        logging.info('Configuring data source...')
        demo_dataset = ImagesDataset(img_path, labels=self.dataset.classes, transforms=self.transforms)
        data_loader = torch.utils.data.DataLoader(
            demo_dataset,
            batch_size=self.batch_size,
            num_workers=1,
            shuffle=False,
            collate_fn=collate,
        )

        logging.info('Processing data...')
        frames_num = len(demo_dataset)
        for data_batch in tqdm(iter(data_loader), total=frames_num if frames_num != sys.maxsize else 0):
            im_data = data_batch['im_data']
            im_info = data_batch['im_info']
            if torch.cuda.is_available():
                im_data = [i.cuda() for i in im_data]
                im_info = [i.cuda() for i in im_info]

            # Keep only the forward pass inside the timed context. A resize of
            # the original image used to sit here, but its result was
            # overwritten before use and merely inflated the measurement.
            with torch.no_grad(), inference_timer:
                boxes, classes, scores, _, masks = self.net(im_data, im_info)

            meta = data_batch['meta'][0]
            original_size = meta['original_size']
            processed_size = meta['processed_size']
            scores, classes, boxes, masks = postprocess(
                scores, classes, boxes, masks,
                im_h=original_size[0],
                im_w=original_size[1],
                im_scale_y=processed_size[0] / original_size[0],
                im_scale_x=processed_size[1] / original_size[1],
                full_image_masks=True, encode_masks=False,
                confidence_threshold=self.args.prob_threshold)

            image = data_batch['original_image'][0]
            # No tracker is configured here, so no instance IDs are passed.
            visualization = viz(image, boxes, classes, scores, segms=masks, ids=None)

            elapsed = timer.toc()
            # Guard against a zero reading from a coarse clock.
            fps = 1 / elapsed if elapsed > 0 else float('inf')
            if self.args.show_fps:
                visualization = cv2.putText(visualization, 'FPS: {:>2.2f}'.format(fps),
                                            (30, 30), cv2.FONT_HERSHEY_SIMPLEX, 1, (0, 0, 255), 2)

            # cv2.imwrite reports failure through its return value.
            if not cv2.imwrite(out_path, visualization):
                logging.error('Failed to write visualization to %s', out_path)

            # Restart the wall-clock timer so the next toc() covers one frame
            # only. Assumes Timer.toc() measures from the latest tic() --
            # TODO confirm against segmentoly.utils.profile.Timer.
            timer.tic()

    def openVino(self):
        """Run :meth:`output` on the path supplied through ``-i/--images``.

        NOTE(review): ``--video`` and ``--images`` are mutually exclusive, so
        ``self.args.images`` is ``None`` when only ``--video`` was given.
        """
        self.output(self.args.images)

# Script entry point: constructing Inference parses sys.argv and builds the
# OpenVINO network, then openVino() processes the --images input.
# These statements are not wrapped in an `if __name__ == "__main__":` guard,
# so they also run whenever this module is imported.
obj = Inference()
obj.openVino()
	"""
	Copyright (c) 2019 Intel Corporation
	Licensed under the Apache License, Version 2.0 (the "License");
	you may not use this file except in compliance with the License.
	You may obtain a copy of the License at
	http://www.apache.org/licenses/LICENSE-2.0
	Unless required by applicable law or agreed to in writing, software
	distributed under the License is distributed on an "AS IS" BASIS,
	WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
	See the License for the specific language governing permissions and
	limitations under the License.
	"""

	import argparse
	import logging
	import sys
	from pydoc import locate
	import cherrypy
	import json
	from tqdm import tqdm
	import base64
	from PIL import Image
	import io

	from segmentoly.data.dataparallel import collate
	from segmentoly.data.transforms import *
	from segmentoly.datasets.factory import get_dataset
	from segmentoly.datasets.images import ImagesDataset
	from segmentoly.datasets.video import VideoDataset
	from segmentoly.rcnn.openvino_net import MaskRCNNOpenVINO
	from segmentoly.utils.logging import setup_logging
	from segmentoly.utils.postprocess import postprocess
	from segmentoly.utils.profile import Timer
	from segmentoly.utils.stats import add_flops_counting_methods, flops_to_string, print_model_with_flops
	from segmentoly.utils.tracker import StaticIOUTracker
	from segmentoly.utils.visualizer import Visualizer
	from segmentoly.utils.weights import load_checkpoint



	class Inference:
	    """Command-line driven Mask R-CNN demo that runs an OpenVINO network.

	    Constructing an instance parses ``sys.argv``, builds the preprocessing
	    pipeline, obtains the dataset named by ``--dataset`` through
	    ``get_dataset`` (its ``classes`` attribute is used for labelling) and
	    instantiates ``MaskRCNNOpenVINO``.

	    NOTE(review): ``__init__`` reads ``openvino_model_path``, ``device``,
	    ``plugin_dir``, ``cpu_extension`` and ``show_performance_counters``.
	    Those options are only registered on the ``openvino`` sub-command, so
	    running with the ``pytorch`` sub-command (or none) ends in an
	    ``AttributeError``.
	    """

	    def __init__(self):
	        """Parse CLI options, then build the transforms, dataset and network."""
	        self.args = self.parse_args()
	        self.transforms = Compose([
	            Resize(max_size=self.args.fit_max_image_size,
	                   window_size=self.args.fit_window_size,
	                   size=self.args.size),
	            ToTensor(),
	            Normalize(mean=self.args.mean_pixel, std=[1., 1., 1.], rgb=self.args.rgb),
	        ])
	        self.dataset = get_dataset(self.args.dataset, False, False, self.transforms)
	        self.batch_size = 1
	        self.net = MaskRCNNOpenVINO(
	            self.args.openvino_model_path,
	            self.args.checkpoint_file_path,
	            device=self.args.device,
	            plugin_dir=self.args.plugin_dir,
	            cpu_extension_lib_path=self.args.cpu_extension,
	            collect_perf_counters=self.args.show_performance_counters,
	        )

	    def parse_args(self):
	        """Build the argument parser and parse ``sys.argv``.

	        Required on the command line: ``--ckpt``, exactly one of
	        ``--fit_max`` / ``--fit_window`` / ``--size``, and exactly one of
	        ``-v/--video`` / ``-i/--images``. Backend-specific options live on
	        the ``openvino`` and ``pytorch`` sub-commands; the chosen sub-command
	        name is stored in ``backend``.

	        Returns:
	            argparse.Namespace: The parsed options.
	        """
	        parser = argparse.ArgumentParser(description='Run instance segmentation live')
	        subparsers = parser.add_subparsers(help='Backend', dest='backend')

	        # --- Options shared by every backend -------------------------------
	        parser.add_argument('--dataset', help='Training dataset')
	        parser.add_argument('--ckpt', dest='checkpoint_file_path', required=True,
	                            help='File with models weights')
	        parser.add_argument('--mean_pixel', default=(0.0, 0.0, 0.0), type=float, nargs=3,
	                            metavar='<num>',
	                            help='Mean pixel value to subtract from image.')
	        parser.add_argument('--rgb', action='store_true',
	                            help='Use RGB instead of BGR.')

	        # Exactly one resize strategy must be chosen.
	        image_resize_group = parser.add_mutually_exclusive_group(required=True)
	        image_resize_group.add_argument('--fit_max', dest='fit_max_image_size', default=None,
	                                        type=int, nargs=2, metavar='<num>',
	                                        help='Max processed image size in a format '
	                                             '(max short side, max long side).')
	        image_resize_group.add_argument('--fit_window', dest='fit_window_size', default=None,
	                                        type=int, nargs=2, metavar='<num>',
	                                        help='Max processed image size in a format (max height, max width).')
	        image_resize_group.add_argument('--size', dest='size', default=None,
	                                        type=int, nargs=2, metavar='<num>',
	                                        help='Precise input size (height, width).')

	        # Exactly one data source must be chosen.
	        data_source_parser = parser.add_mutually_exclusive_group(required=True)
	        data_source_parser.add_argument('-v', '--video', default=None, type=str,
	                                        help='Path to a video file or numeric camera ID.')
	        data_source_parser.add_argument('-i', '--images', default=None, type=str,
	                                        help='Path to an image or a folder with images.')

	        parser.add_argument('--show_scores', action='store_true',
	                            help='Show detection scores.')
	        parser.add_argument('--show_boxes', action='store_true',
	                            help='Show bounding boxes.')
	        parser.add_argument('--show_fps', action='store_true',
	                            help='Show FPS.')
	        parser.add_argument('-pt', '--prob_threshold', default=0.7, type=float,
	                            help='Probability threshold for detections filtering.')
	        parser.add_argument('--delay', default=0, type=int)

	        # --- OpenVINO backend ----------------------------------------------
	        openvino_parser = subparsers.add_parser('openvino')
	        openvino_parser.add_argument('--model', dest='openvino_model_path', default=None, type=str,
	                                     required=True,
	                                     help='XML file with model description (OpenVINO format)')
	        openvino_parser.add_argument('-d', '--device',
	                                     help='Optional. Specify the target device to infer on: CPU, GPU, FPGA or MYRIAD. '
	                                          'The demo will look for a suitable plugin for device specified '
	                                          '(by default, it is CPU).',
	                                     default='CPU', type=str, metavar='"<device>"')
	        openvino_parser.add_argument('-l', '--cpu_extension',
	                                     help='Required for CPU custom layers. '
	                                          'Absolute path to a shared library with the kernels implementation.',
	                                     default=None, type=str, metavar='"<absolute_path>"')
	        openvino_parser.add_argument('-pp', '--plugin_dir',
	                                     help='Optional. Path to a plugin folder.',
	                                     default=None, type=str, metavar='"<absolute_path>"')
	        openvino_parser.add_argument('--show_pc', '--show_performance_counters',
	                                     dest='show_performance_counters',
	                                     help='Show OpenVINO performance counters.',
	                                     action='store_true')

	        # --- PyTorch backend -----------------------------------------------
	        pytorch_parser = subparsers.add_parser('pytorch')
	        pytorch_parser.add_argument('--model', dest='pytorch_model_class', type=str, required=True,
	                                    help='Path to module and class implementing Mask R-CNN instance segmentation model.')
	        pytorch_parser.add_argument('--show_flops',
	                                    help='Show FLOPs.',
	                                    action='store_true')
	        pytorch_parser.add_argument('--show_layers_flops',
	                                    help='Show FLOPs for all modules.',
	                                    action='store_true')

	        return parser.parse_args()

	    def output(self, img_path, show_boxes=True, out_path="out.png"):
	        """Run the network on ``img_path`` and write the rendered result.

	        Args:
	            img_path: Handed to ``ImagesDataset``; the ``--images`` help text
	                describes it as a path to an image or a folder with images.
	            show_boxes: Whether bounding boxes are drawn. Defaults to
	                ``True``, the value this method used to hard-code. As before,
	                the value is also stored on ``self.args.show_boxes``.
	            out_path: File the visualization is written to. Every processed
	                image is written to this same path, so with several inputs
	                only the last result remains on disk.
	        """
	        self.args.show_boxes = show_boxes

	        viz = Visualizer(self.dataset.classes,
	                         confidence_threshold=self.args.prob_threshold,
	                         show_boxes=self.args.show_boxes,
	                         show_scores=self.args.show_scores)

	        inference_timer = Timer(cuda_sync=True, warmup=1)
	        timer = Timer(cuda_sync=False, warmup=1)
	        timer.tic()

	        logging.info('Configuring data source...')
	        demo_dataset = ImagesDataset(img_path, labels=self.dataset.classes, transforms=self.transforms)
	        data_loader = torch.utils.data.DataLoader(
	            demo_dataset,
	            batch_size=self.batch_size,
	            num_workers=1,
	            shuffle=False,
	            collate_fn=collate,
	        )

	        logging.info('Processing data...')
	        frames_num = len(demo_dataset)
	        for data_batch in tqdm(iter(data_loader), total=frames_num if frames_num != sys.maxsize else 0):
	            im_data = data_batch['im_data']
	            im_info = data_batch['im_info']
	            if torch.cuda.is_available():
	                im_data = [i.cuda() for i in im_data]
	                im_info = [i.cuda() for i in im_info]

	            # Keep only the forward pass inside the timed context. A resize of
	            # the original image used to sit here, but its result was
	            # overwritten before use and merely inflated the measurement.
	            with torch.no_grad(), inference_timer:
	                boxes, classes, scores, _, masks = self.net(im_data, im_info)

	            meta = data_batch['meta'][0]
	            original_size = meta['original_size']
	            processed_size = meta['processed_size']
	            scores, classes, boxes, masks = postprocess(
	                scores, classes, boxes, masks,
	                im_h=original_size[0],
	                im_w=original_size[1],
	                im_scale_y=processed_size[0] / original_size[0],
	                im_scale_x=processed_size[1] / original_size[1],
	                full_image_masks=True, encode_masks=False,
	                confidence_threshold=self.args.prob_threshold)

	            image = data_batch['original_image'][0]
	            # No tracker is configured here, so no instance IDs are passed.
	            visualization = viz(image, boxes, classes, scores, segms=masks, ids=None)

	            elapsed = timer.toc()
	            # Guard against a zero reading from a coarse clock.
	            fps = 1 / elapsed if elapsed > 0 else float('inf')
	            if self.args.show_fps:
	                visualization = cv2.putText(visualization, 'FPS: {:>2.2f}'.format(fps),
	                                            (30, 30), cv2.FONT_HERSHEY_SIMPLEX, 1, (0, 0, 255), 2)

	            # cv2.imwrite reports failure through its return value.
	            if not cv2.imwrite(out_path, visualization):
	                logging.error('Failed to write visualization to %s', out_path)

	            # Restart the wall-clock timer so the next toc() covers one frame
	            # only. Assumes Timer.toc() measures from the latest tic() --
	            # TODO confirm against segmentoly.utils.profile.Timer.
	            timer.tic()

	    def openVino(self):
	        """Run :meth:`output` on the path supplied through ``-i/--images``.

	        NOTE(review): ``--video`` and ``--images`` are mutually exclusive, so
	        ``self.args.images`` is ``None`` when only ``--video`` was given.
	        """
	        self.output(self.args.images)

	# Script entry point: constructing Inference parses sys.argv and builds the
	# OpenVINO network, then openVino() processes the --images input.
	# These statements are not wrapped in an `if __name__ == "__main__":` guard,
	# so they also run whenever this module is imported.
	obj = Inference()
	obj.openVino()