devarshi16/gocr_image_annotation.py

## gocr_image_annotation.py
from google.cloud import vision
import io
import os
import os
os.environ["GOOGLE_APPLICATION_CREDENTIALS"]="/home/devarshi/gcloud.json"

def detect_text(path):
    """Detects text in the file."""
    client = vision.ImageAnnotatorClient()

    with io.open(path, 'rb') as image_file:
        content = image_file.read()

    image = vision.types.Image(content=content)

    response = client.text_detection(image=image)
    texts = response.text_annotations
    print(path,': Texts:')
    if len(texts) != 0:
        all_texts = []
        for text in texts:
            print('\n"{}"'.format(text.description))
            all_texts.append(text.description.strip())
        return all_texts[:int(len(all_texts)/2)] # For some unknown reason GOCR returns info about same text twice
    else:
        return None

with open('annotations.txt','w') as f:
    for img in os.listdir('cropped'):
        img_path = os.path.join('cropped',img)
        print(img_path)
        text = detect_text(img_path)
        if text!= None:
            f.write(img+' '+' '.join(text)+'\n')
	from google.cloud import vision
	import io
	import os
	import os
	os.environ["GOOGLE_APPLICATION_CREDENTIALS"]="/home/devarshi/gcloud.json"

	def detect_text(path):
	"""Detects text in the file."""
	client = vision.ImageAnnotatorClient()

	with io.open(path, 'rb') as image_file:
	content = image_file.read()

	image = vision.types.Image(content=content)

	response = client.text_detection(image=image)
	texts = response.text_annotations
	print(path,': Texts:')
	if len(texts) != 0:
	all_texts = []
	for text in texts:
	print('\n"{}"'.format(text.description))
	all_texts.append(text.description.strip())
	return all_texts[:int(len(all_texts)/2)] # For some unknown reason GOCR returns info about same text twice
	else:
	return None

	with open('annotations.txt','w') as f:
	for img in os.listdir('cropped'):
	img_path = os.path.join('cropped',img)
	print(img_path)
	text = detect_text(img_path)
	if text!= None:
	f.write(img+' '+' '.join(text)+'\n')