Spaces:

Jimmyzheng-10
/

ScreenCoder

Running

App Files Files Community

ScreenCoder / screencoder /UIED /detect_text /ocr.py

Jimmyzheng-10

Add app.py and the screencoder repo

a383d0e 23 days ago

raw

history blame contribute delete

2.17 kB

	import cv2
	import os
	import requests
	import json
	from base64 import b64encode
	import time


	def Google_OCR_makeImageData(imgpath):
	    """Build the JSON request body used to annotate one image.

	    The file at *imgpath* is read in binary mode, base64-encoded and embedded
	    in a request that asks for a single ``DOCUMENT_TEXT_DETECTION`` feature.

	    Args:
	        imgpath: Path of the image file to embed in the request.

	    Returns:
	        The JSON document ``{"requests": {...}}`` serialized with
	        ``json.dumps`` and encoded to ``bytes``.
	    """
	    with open(imgpath, 'rb') as image_file:
	        raw_bytes = image_file.read()
	    encoded_image = b64encode(raw_bytes).decode()

	    # 'TEXT_DETECTION' is the alternative feature type noted by the original
	    # author; 'DOCUMENT_TEXT_DETECTION' is the one actually requested.
	    feature = {
	        'type': 'DOCUMENT_TEXT_DETECTION',
	        'maxResults': 1,
	    }
	    payload = {
	        "requests": {
	            'image': {'content': encoded_image},
	            'features': [feature],
	        }
	    }
	    return json.dumps(payload).encode()


	def ocr_detection_google(imgpath):
	    """Run Google Cloud Vision text detection on the image at *imgpath*.

	    The request body built by ``Google_OCR_makeImageData`` is POSTed to the
	    ``images:annotate`` REST endpoint. The API key is taken from the
	    ``GOOGLE_VISION_API_KEY`` environment variable when it is set and
	    non-empty; otherwise the key bundled in this function is used and a
	    reminder to supply your own key is printed.

	    Args:
	        imgpath: Path of the image file to send for OCR.

	    Returns:
	        The ``textAnnotations`` list of the first response with its first
	        element dropped, or ``None`` when the first response carries no
	        ``textAnnotations`` (no text found) or ``responses`` is empty.

	    Raises:
	        Exception: If the reply contains a top-level or per-image ``error``
	            (with a dedicated message when billing is disabled), or if the
	            reply has no ``responses`` field.
	    """
	    url = 'https://vision.googleapis.com/v1/images:annotate'
	    # NOTE(security): this key is committed to the repository. It is kept only
	    # as a backward-compatible fallback; it should be rotated and the key
	    # supplied through the environment instead.
	    fallback_key = 'AIzaSyDUc4iOUASJQYkVwSomIArTKhE2C6bHK8U' # * Replace with your own Key *
	    api_key = os.environ.get('GOOGLE_VISION_API_KEY')
	    if not api_key:
	        api_key = fallback_key
	        print("* Please set the GOOGLE_VISION_API_KEY environment variable or replace the Google OCR key "
	              "in detect_text/ocr.py with your own (apply in https://cloud.google.com/vision) *")

	    imgdata = Google_OCR_makeImageData(imgpath)
	    response = requests.post(url,
	                             data=imgdata,
	                             params={'key': api_key},
	                             # The header name uses a hyphen; 'Content_Type' is not
	                             # the standard header and left the body type undeclared.
	                             headers={'Content-Type': 'application/json'},
	                             # Without a timeout a stalled connection blocks forever.
	                             timeout=60)

	    response_json = response.json()
	    if 'error' in response_json:
	        error_msg = response_json['error']
	        if 'BILLING_DISABLED' in str(error_msg):
	            raise Exception("Google Vision API requires billing to be enabled. Please:\n"
	                            "1. Visit https://console.developers.google.com/billing/enable?project=718250946490\n"
	                            "2. Enable billing for your project\n"
	                            "3. Wait a few minutes for changes to propagate\n"
	                            "4. Or use PaddleOCR instead by setting method='paddle'")
	        raise Exception(f"Google Vision API error: {error_msg}")

	    if 'responses' not in response_json:
	        raise Exception(response_json)

	    responses = response_json['responses']
	    if not responses:
	        # Nothing to index into; treat like "no text".
	        return None

	    first_response = responses[0]
	    if 'error' in first_response:
	        # Per-image failure reported inside an otherwise successful reply.
	        raise Exception(f"Google Vision API error: {first_response['error']}")

	    annotations = first_response.get('textAnnotations')
	    if annotations is None:
	        # No Text
	        return None
	    # Drop the first annotation (presumably the aggregate whole-image text --
	    # confirm against the Vision API docs) and keep the remaining entries.
	    return annotations[1:]