mirror of
https://github.com/leigest519/ScreenCoder.git
synced 2026-02-12 17:52:47 +00:00
182 lines
6.8 KiB
Python
182 lines
6.8 KiB
Python
import cv2
|
|
import numpy as np
|
|
|
|
|
|
class Text:
|
|
def __init__(self, id, content, location):
|
|
self.id = id
|
|
self.content = content
|
|
self.location = location
|
|
|
|
self.width = self.location['right'] - self.location['left']
|
|
self.height = self.location['bottom'] - self.location['top']
|
|
self.area = self.width * self.height
|
|
self.word_width = self.width / len(self.content)
|
|
|
|
'''
|
|
********************************
|
|
*** Relation with Other text ***
|
|
********************************
|
|
'''
|
|
def is_justified(self, ele_b, direction='h', max_bias_justify=4):
|
|
'''
|
|
Check if the element is justified
|
|
:param max_bias_justify: maximum bias if two elements to be justified
|
|
:param direction:
|
|
- 'v': vertical up-down connection
|
|
- 'h': horizontal left-right connection
|
|
'''
|
|
l_a = self.location
|
|
l_b = ele_b.location
|
|
# connected vertically - up and below
|
|
if direction == 'v':
|
|
# left and right should be justified
|
|
if abs(l_a['left'] - l_b['left']) < max_bias_justify and abs(l_a['right'] - l_b['right']) < max_bias_justify:
|
|
return True
|
|
return False
|
|
elif direction == 'h':
|
|
# top and bottom should be justified
|
|
if abs(l_a['top'] - l_b['top']) < max_bias_justify and abs(l_a['bottom'] - l_b['bottom']) < max_bias_justify:
|
|
return True
|
|
return False
|
|
|
|
def is_on_same_line(self, text_b, direction='h', bias_gap=4, bias_justify=4):
|
|
'''
|
|
Check if the element is on the same row(direction='h') or column(direction='v') with ele_b
|
|
:param direction:
|
|
- 'v': vertical up-down connection
|
|
- 'h': horizontal left-right connection
|
|
:return:
|
|
'''
|
|
l_a = self.location
|
|
l_b = text_b.location
|
|
# connected vertically - up and below
|
|
if direction == 'v':
|
|
# left and right should be justified
|
|
if self.is_justified(text_b, direction='v', max_bias_justify=bias_justify):
|
|
# top and bottom should be connected (small gap)
|
|
if abs(l_a['bottom'] - l_b['top']) < bias_gap or abs(l_a['top'] - l_b['bottom']) < bias_gap:
|
|
return True
|
|
return False
|
|
elif direction == 'h':
|
|
# top and bottom should be justified
|
|
if self.is_justified(text_b, direction='h', max_bias_justify=bias_justify):
|
|
# top and bottom should be connected (small gap)
|
|
if abs(l_a['right'] - l_b['left']) < bias_gap or abs(l_a['left'] - l_b['right']) < bias_gap:
|
|
return True
|
|
return False
|
|
|
|
def is_intersected(self, text_b, bias):
|
|
l_a = self.location
|
|
l_b = text_b.location
|
|
left_in = max(l_a['left'], l_b['left']) + bias
|
|
top_in = max(l_a['top'], l_b['top']) + bias
|
|
right_in = min(l_a['right'], l_b['right'])
|
|
bottom_in = min(l_a['bottom'], l_b['bottom'])
|
|
|
|
w_in = max(0, right_in - left_in)
|
|
h_in = max(0, bottom_in - top_in)
|
|
area_in = w_in * h_in
|
|
if area_in > 0:
|
|
return True
|
|
|
|
'''
|
|
***********************
|
|
*** Revise the Text ***
|
|
***********************
|
|
'''
|
|
def merge_text(self, text_b):
|
|
text_a = self
|
|
top = min(text_a.location['top'], text_b.location['top'])
|
|
left = min(text_a.location['left'], text_b.location['left'])
|
|
right = max(text_a.location['right'], text_b.location['right'])
|
|
bottom = max(text_a.location['bottom'], text_b.location['bottom'])
|
|
self.location = {'left': left, 'top': top, 'right': right, 'bottom': bottom}
|
|
self.width = self.location['right'] - self.location['left']
|
|
self.height = self.location['bottom'] - self.location['top']
|
|
self.area = self.width * self.height
|
|
|
|
left_element = text_a
|
|
right_element = text_b
|
|
if text_a.location['left'] > text_b.location['left']:
|
|
left_element = text_b
|
|
right_element = text_a
|
|
self.content = left_element.content + ' ' + right_element.content
|
|
self.word_width = self.width / len(self.content)
|
|
|
|
def shrink_bound(self, binary_map):
|
|
bin_clip = binary_map[self.location['top']:self.location['bottom'], self.location['left']:self.location['right']]
|
|
height, width = np.shape(bin_clip)
|
|
|
|
shrink_top = 0
|
|
shrink_bottom = 0
|
|
for i in range(height):
|
|
# top
|
|
if shrink_top == 0:
|
|
if sum(bin_clip[i]) == 0:
|
|
shrink_top = 1
|
|
else:
|
|
shrink_top = -1
|
|
elif shrink_top == 1:
|
|
if sum(bin_clip[i]) != 0:
|
|
self.location['top'] += i
|
|
shrink_top = -1
|
|
# bottom
|
|
if shrink_bottom == 0:
|
|
if sum(bin_clip[height-i-1]) == 0:
|
|
shrink_bottom = 1
|
|
else:
|
|
shrink_bottom = -1
|
|
elif shrink_bottom == 1:
|
|
if sum(bin_clip[height-i-1]) != 0:
|
|
self.location['bottom'] -= i
|
|
shrink_bottom = -1
|
|
|
|
if shrink_top == -1 and shrink_bottom == -1:
|
|
break
|
|
|
|
shrink_left = 0
|
|
shrink_right = 0
|
|
for j in range(width):
|
|
# left
|
|
if shrink_left == 0:
|
|
if sum(bin_clip[:, j]) == 0:
|
|
shrink_left = 1
|
|
else:
|
|
shrink_left = -1
|
|
elif shrink_left == 1:
|
|
if sum(bin_clip[:, j]) != 0:
|
|
self.location['left'] += j
|
|
shrink_left = -1
|
|
# right
|
|
if shrink_right == 0:
|
|
if sum(bin_clip[:, width-j-1]) == 0:
|
|
shrink_right = 1
|
|
else:
|
|
shrink_right = -1
|
|
elif shrink_right == 1:
|
|
if sum(bin_clip[:, width-j-1]) != 0:
|
|
self.location['right'] -= j
|
|
shrink_right = -1
|
|
|
|
if shrink_left == -1 and shrink_right == -1:
|
|
break
|
|
self.width = self.location['right'] - self.location['left']
|
|
self.height = self.location['bottom'] - self.location['top']
|
|
self.area = self.width * self.height
|
|
self.word_width = self.width / len(self.content)
|
|
|
|
'''
|
|
*********************
|
|
*** Visualization ***
|
|
*********************
|
|
'''
|
|
def visualize_element(self, img, color=(0, 0, 255), line=1, show=False):
|
|
loc = self.location
|
|
cv2.rectangle(img, (loc['left'], loc['top']), (loc['right'], loc['bottom']), color, line)
|
|
if show:
|
|
print(self.content)
|
|
cv2.imshow('text', img)
|
|
cv2.waitKey()
|
|
cv2.destroyWindow('text')
|