# Mirror of https://github.com/leigest519/ScreenCoder.git
# Synced 2026-02-13 10:12:46 +00:00
# 56 lines, 2.1 KiB, Python
import cv2
|
|
import os
|
|
import requests
|
|
import json
|
|
from base64 import b64encode
|
|
import time
|
|
|
|
|
|
def Google_OCR_makeImageData(imgpath):
    """Build the JSON body for a Google Cloud Vision ``images:annotate`` call.

    The file at ``imgpath`` is read as raw bytes, base64-encoded, and wrapped
    in a single annotate request asking for ``DOCUMENT_TEXT_DETECTION``.

    Args:
        imgpath: Path of the image file to send.

    Returns:
        UTF-8 encoded JSON ``bytes`` of the form ``{"requests": [<request>]}``.

    Raises:
        OSError: If ``imgpath`` cannot be opened or read.
    """
    with open(imgpath, 'rb') as f:
        ctxt = b64encode(f.read()).decode()

    img_req = {
        'image': {
            'content': ctxt,
        },
        'features': [{
            'type': 'DOCUMENT_TEXT_DETECTION',
            # 'type': 'TEXT_DETECTION',
            'maxResults': 1,
        }],
    }
    # The documented request schema defines "requests" as an array of
    # per-image requests, so the single request is wrapped in a list rather
    # than relying on the server tolerating a bare object.
    return json.dumps({"requests": [img_req]}).encode()
|
|
|
|
|
|
def ocr_detection_google(imgpath):
    """Run Google Cloud Vision text detection on one image file.

    The image is encoded with ``Google_OCR_makeImageData`` and POSTed to the
    ``images:annotate`` endpoint. The API key is taken from the
    ``GOOGLE_VISION_API_KEY`` environment variable when it is set; otherwise
    the key embedded below is used and a reminder is printed.

    Args:
        imgpath: Path of the image file to analyse.

    Returns:
        ``None`` when the service reports no text for the image; otherwise
        the ``textAnnotations`` list of the first response with its first
        element dropped (in the Vision API that first element describes the
        whole detected text rather than a single piece).

    Raises:
        Exception: If the service returns an error (with dedicated guidance
            for ``BILLING_DISABLED``), if the first per-image response
            carries an ``error``, or if the reply has no ``responses`` key.
        requests.exceptions.RequestException: On network failure or timeout.
    """
    url = 'https://vision.googleapis.com/v1/images:annotate'

    # Prefer a key supplied through the environment so that deployments do
    # not need to edit this file.
    api_key = os.environ.get('GOOGLE_VISION_API_KEY')
    if not api_key:
        # NOTE(review): this fallback key is committed to the repository and
        # should be treated as public; it is kept only so existing setups
        # keep working.
        api_key = 'AIzaSyDUc4iOUASJQYkVwSomIArTKhE2C6bHK8U'  # *** Replace with your own Key ***
        print("*** Please replace the Google OCR key at detect_text/ocr.py line 28 with your own (apply in https://cloud.google.com/vision) ***")

    imgdata = Google_OCR_makeImageData(imgpath)
    response = requests.post(url,
                             data=imgdata,
                             params={'key': api_key},
                             # HTTP header names use hyphens; the previous
                             # 'Content_Type' was not a Content-Type header.
                             headers={'Content-Type': 'application/json'},
                             # Without a timeout a stalled connection would
                             # block the caller indefinitely.
                             timeout=60)

    response_json = response.json()
    if 'error' in response_json:
        error_msg = response_json['error']
        if 'BILLING_DISABLED' in str(error_msg):
            raise Exception("Google Vision API requires billing to be enabled. Please:\n"
                            "1. Visit https://console.developers.google.com/billing/enable?project=718250946490\n"
                            "2. Enable billing for your project\n"
                            "3. Wait a few minutes for changes to propagate\n"
                            "4. Or use PaddleOCR instead by setting method='paddle'")
        raise Exception(f"Google Vision API error: {error_msg}")

    if 'responses' not in response_json:
        raise Exception(response_json)

    responses = response_json['responses']
    if not responses or responses == [{}]:
        # No Text
        return None

    first = responses[0]
    if 'error' in first:
        # Per-image failures are reported inside the response entry rather
        # than at the top level; surface them instead of a bare KeyError.
        raise Exception(f"Google Vision API error: {first['error']}")

    annotations = first.get('textAnnotations')
    if annotations is None:
        # The entry has content but no text annotations: treat as no text.
        return None
    return annotations[1:]
|