HaochenGong
create
f1554a2
import cv2
import os
import requests
import json
from base64 import b64encode
import time
def Google_OCR_makeImageData(imgpath):
with open(imgpath, 'rb') as f:
ctxt = b64encode(f.read()).decode()
img_req = {
'image': {
'content': ctxt
},
'features': [{
'type': 'DOCUMENT_TEXT_DETECTION',
# 'type': 'TEXT_DETECTION',
'maxResults': 1
}]
}
return json.dumps({"requests": img_req}).encode()
def ocr_detection_google(imgpath):
# start = time.clock()
url = 'https://vision.googleapis.com/v1/images:annotate'
api_key = os.environ.get('google_ocr')
imgdata = Google_OCR_makeImageData(imgpath)
response = requests.post(url,
data=imgdata,
params={'key': api_key},
headers={'Content_Type': 'application/json'})
# print('*** Text Detection Time Taken:%.3fs ***' % (time.clock() - start))
print("*** Please replace the Google OCR key at detect_text/ocr.py line 28 with your own (apply in https://cloud.google.com/vision) ***")
# print('response.json(): ', response.json())
if response.json()['responses'] == [{}]:
# No Text
return None
else:
return response.json()['responses'][0]['textAnnotations'][1:]