@jarodsmk
Created September 23, 2019 11:51
Correct text-image orientation with Python/Tesseract/OpenCV
import cv2
import pytesseract
import urllib.request
import numpy as np
import re

# Installs: https://www.learnopencv.com/deep-learning-based-text-recognition-ocr-using-tesseract-and-opencv/

if __name__ == '__main__':
    # Uncomment the line below to provide the path to tesseract manually
    # pytesseract.pytesseract.tesseract_cmd = '/usr/bin/tesseract'

    # Read image from URL
    # Taken from https://stackoverflow.com/questions/21061814/how-can-i-read-an-image-from-an-internet-url-in-python-cv2-scikit-image-and-mah
    # Sample images:
    # https://i.ibb.co/4mm9WvZ/book-rot.jpg
    # https://i.ibb.co/M7jwWR2/book.jpg
    # https://i.ibb.co/27bKNJ8/book-rot2.jpg
    resp = urllib.request.urlopen('https://i.ibb.co/27bKNJ8/book-rot2.jpg')
    image = np.asarray(bytearray(resp.read()), dtype="uint8")
    image = cv2.imdecode(image, cv2.IMREAD_COLOR)  # Initially decode as color

    # Taken from https://www.pyimagesearch.com/2017/02/20/text-skew-correction-opencv-python/
    # Convert the image to grayscale and flip the foreground and background
    # to ensure the foreground is "white" and the background is "black"
    gray = cv2.cvtColor(image, cv2.COLOR_BGR2GRAY)
    gray = cv2.bitwise_not(gray)

    # Ask Tesseract's orientation-and-script detection (OSD) for the rotation
    rot_data = pytesseract.image_to_osd(image)
    print("[OSD] " + rot_data)
    rot = re.search(r'(?<=Rotate: )\d+', rot_data).group(0)

    angle = float(rot)
    if angle > 0:
        angle = 360 - angle
    print("[ANGLE] " + str(angle))

    # Rotate the image to deskew it
    (h, w) = image.shape[:2]
    center = (w // 2, h // 2)
    M = cv2.getRotationMatrix2D(center, angle, 1.0)
    rotated = cv2.warpAffine(image, M, (w, h),
                             flags=cv2.INTER_CUBIC, borderMode=cv2.BORDER_REPLICATE)

    # TODO: Rotated image can be saved here
    print(pytesseract.image_to_osd(rotated))

    print("[TEXT]")
    # Run Tesseract OCR on the deskewed image
    text = pytesseract.image_to_string(rotated, lang='eng', config="--psm 1")
    # Print recognized text
    print(text.encode(encoding='UTF-8'))
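The `Rotate:` value is pulled out of Tesseract's plain-text OSD report with a lookbehind regex. A minimal sketch of that parsing step against a sample report (the report text and its values below are illustrative, not actual output for this image):

```python
import re

# Illustrative OSD report in the format Tesseract prints (values are made up)
osd_report = """Page number: 0
Orientation in degrees: 270
Rotate: 90
Orientation confidence: 12.34
Script: Latin
Script confidence: 5.67"""

# Same lookbehind regex as the gist, written as a raw string
rot = int(re.search(r'(?<=Rotate: )\d+', osd_report).group(0))

# Mirror the gist's angle adjustment for cv2's rotation convention
angle = 360 - rot if rot > 0 else 0
print(rot, angle)  # 90 270
```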
@kucukagan

Terrible. [Translated from Turkish: "berbat"]

@jarodsmk
Author

@kucukagan - Sorry that this wasn't what you were looking for. I made this a gist because it was a quick mock-up of what I actually did, not a proper repository.

Would you care to point out what you didn't like about this post that prompted your comment?

@Goutam-Kelam

The code is very helpful. However, I found one change that could really improve it.
Currently you find an angle, decide whether the image should be rotated clockwise or anticlockwise, and then use cv2 functions to build the rotation matrix and warp the image. The problem is that OpenCV does not automatically allocate enough space for the entire rotated image to fit in the output frame. As a result, if your image is rectangular and rotated +90 or -90 degrees, half of it will be cut off once the orientation is corrected.

To avoid that, you can rotate with bound awareness. I am using the imutils function from https://www.pyimagesearch.com/2021/01/20/opencv-rotate-image/

import cv2
import pytesseract
import urllib.request
import numpy as np
import re
import imutils  # added

resp = urllib.request.urlopen('https://i.ibb.co/27bKNJ8/book-rot2.jpg')
image = np.asarray(bytearray(resp.read()), dtype="uint8")
image = cv2.imdecode(image, cv2.IMREAD_COLOR)  # Initially decode as color
gray = cv2.cvtColor(image, cv2.COLOR_BGR2GRAY)
gray = cv2.bitwise_not(gray)

rot_data = pytesseract.image_to_osd(image)
print("[OSD] " + rot_data)
rot = re.search(r'(?<=Rotate: )\d+', rot_data).group(0)

angle = float(rot)

# Rotate the image to deskew it, expanding the canvas so nothing is clipped
rotated = imutils.rotate_bound(image, angle)  # added

# TODO: Rotated image can be saved here
print(pytesseract.image_to_osd(rotated))
print("[TEXT]")
# Run Tesseract OCR on the deskewed image
text = pytesseract.image_to_string(rotated, lang='eng', config="--psm 6")

# Print recognized text
print(text)
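rotate_bound avoids the clipping by computing the bounding box of the rotated image and enlarging the output canvas before warping. A minimal sketch of the dimension math involved (a pure-math illustration of the idea, not imutils' actual source):

```python
import math

def rotated_bounds(w, h, angle_degrees):
    """Size of the axis-aligned bounding box of a w x h image
    rotated by angle_degrees about its centre."""
    cos = abs(math.cos(math.radians(angle_degrees)))
    sin = abs(math.sin(math.radians(angle_degrees)))
    new_w = int(h * sin + w * cos)
    new_h = int(h * cos + w * sin)
    return new_w, new_h

# A 200x100 landscape image rotated 90 degrees needs a 100x200 canvas;
# warping into the original 200x100 frame would clip half of it.
print(rotated_bounds(200, 100, 90))  # (100, 200)
print(rotated_bounds(200, 100, 0))   # (200, 100)
```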
