Initial commit

2026-02-13 18:22:50 +00:00 · 2025-07-28 18:43:47 +08:00
parent 0a6e4ab682
commit 06408ffa6a
702 changed files with 153932 additions and 0 deletions
--- a/UIED/detect_text/Text.py
+++ b/UIED/detect_text/Text.py
@@ -0,0 +1,181 @@
+import cv2
+import numpy as np
+
+
+class Text:
+    def __init__(self, id, content, location):
+        self.id = id
+        self.content = content
+        self.location = location
+
+        self.width = self.location['right'] - self.location['left']
+        self.height = self.location['bottom'] - self.location['top']
+        self.area = self.width * self.height
+        self.word_width = self.width / len(self.content)
+
+    '''
+    ********************************
+    *** Relation with Other text ***
+    ********************************
+    '''
+    def is_justified(self, ele_b, direction='h', max_bias_justify=4):
+        '''
+        Check if the element is justified
+        :param max_bias_justify: maximum bias if two elements to be justified
+        :param direction:
+             - 'v': vertical up-down connection
+             - 'h': horizontal left-right connection
+        '''
+        l_a = self.location
+        l_b = ele_b.location
+        # connected vertically - up and below
+        if direction == 'v':
+            # left and right should be justified
+            if abs(l_a['left'] - l_b['left']) < max_bias_justify and abs(l_a['right'] - l_b['right']) < max_bias_justify:
+                return True
+            return False
+        elif direction == 'h':
+            # top and bottom should be justified
+            if abs(l_a['top'] - l_b['top']) < max_bias_justify and abs(l_a['bottom'] - l_b['bottom']) < max_bias_justify:
+                return True
+            return False
+
+    def is_on_same_line(self, text_b, direction='h', bias_gap=4, bias_justify=4):
+        '''
+        Check if the element is on the same row(direction='h') or column(direction='v') with ele_b
+        :param direction:
+             - 'v': vertical up-down connection
+             - 'h': horizontal left-right connection
+        :return:
+        '''
+        l_a = self.location
+        l_b = text_b.location
+        # connected vertically - up and below
+        if direction == 'v':
+            # left and right should be justified
+            if self.is_justified(text_b, direction='v', max_bias_justify=bias_justify):
+                # top and bottom should be connected (small gap)
+                if abs(l_a['bottom'] - l_b['top']) < bias_gap or abs(l_a['top'] - l_b['bottom']) < bias_gap:
+                    return True
+            return False
+        elif direction == 'h':
+            # top and bottom should be justified
+            if self.is_justified(text_b, direction='h', max_bias_justify=bias_justify):
+                # top and bottom should be connected (small gap)
+                if abs(l_a['right'] - l_b['left']) < bias_gap or abs(l_a['left'] - l_b['right']) < bias_gap:
+                    return True
+            return False
+
+    def is_intersected(self, text_b, bias):
+        l_a = self.location
+        l_b = text_b.location
+        left_in = max(l_a['left'], l_b['left']) + bias
+        top_in = max(l_a['top'], l_b['top']) + bias
+        right_in = min(l_a['right'], l_b['right'])
+        bottom_in = min(l_a['bottom'], l_b['bottom'])
+
+        w_in = max(0, right_in - left_in)
+        h_in = max(0, bottom_in - top_in)
+        area_in = w_in * h_in
+        if area_in > 0:
+            return True
+
+    '''
+    ***********************
+    *** Revise the Text ***
+    ***********************
+    '''
+    def merge_text(self, text_b):
+        text_a = self
+        top = min(text_a.location['top'], text_b.location['top'])
+        left = min(text_a.location['left'], text_b.location['left'])
+        right = max(text_a.location['right'], text_b.location['right'])
+        bottom = max(text_a.location['bottom'], text_b.location['bottom'])
+        self.location = {'left': left, 'top': top, 'right': right, 'bottom': bottom}
+        self.width = self.location['right'] - self.location['left']
+        self.height = self.location['bottom'] - self.location['top']
+        self.area = self.width * self.height
+
+        left_element = text_a
+        right_element = text_b
+        if text_a.location['left'] > text_b.location['left']:
+            left_element = text_b
+            right_element = text_a
+        self.content = left_element.content + ' ' + right_element.content
+        self.word_width = self.width / len(self.content)
+
+    def shrink_bound(self, binary_map):
+        bin_clip = binary_map[self.location['top']:self.location['bottom'], self.location['left']:self.location['right']]
+        height, width = np.shape(bin_clip)
+
+        shrink_top = 0
+        shrink_bottom = 0
+        for i in range(height):
+            # top
+            if shrink_top == 0:
+                if sum(bin_clip[i]) == 0:
+                    shrink_top = 1
+                else:
+                    shrink_top = -1
+            elif shrink_top == 1:
+                if sum(bin_clip[i]) != 0:
+                    self.location['top'] += i
+                    shrink_top = -1
+            # bottom
+            if shrink_bottom == 0:
+                if sum(bin_clip[height-i-1]) == 0:
+                    shrink_bottom = 1
+                else:
+                    shrink_bottom = -1
+            elif shrink_bottom == 1:
+                if sum(bin_clip[height-i-1]) != 0:
+                    self.location['bottom'] -= i
+                    shrink_bottom = -1
+
+            if shrink_top == -1 and shrink_bottom == -1:
+                break
+
+        shrink_left = 0
+        shrink_right = 0
+        for j in range(width):
+            # left
+            if shrink_left == 0:
+                if sum(bin_clip[:, j]) == 0:
+                    shrink_left = 1
+                else:
+                    shrink_left = -1
+            elif shrink_left == 1:
+                if sum(bin_clip[:, j]) != 0:
+                    self.location['left'] += j
+                    shrink_left = -1
+            # right
+            if shrink_right == 0:
+                if sum(bin_clip[:, width-j-1]) == 0:
+                    shrink_right = 1
+                else:
+                    shrink_right = -1
+            elif shrink_right == 1:
+                if sum(bin_clip[:, width-j-1]) != 0:
+                    self.location['right'] -= j
+                    shrink_right = -1
+
+            if shrink_left == -1 and shrink_right == -1:
+                break
+        self.width = self.location['right'] - self.location['left']
+        self.height = self.location['bottom'] - self.location['top']
+        self.area = self.width * self.height
+        self.word_width = self.width / len(self.content)
+
+    '''
+    *********************
+    *** Visualization ***
+    *********************
+    '''
+    def visualize_element(self, img, color=(0, 0, 255), line=1, show=False):
+        loc = self.location
+        cv2.rectangle(img, (loc['left'], loc['top']), (loc['right'], loc['bottom']), color, line)
+        if show:
+            print(self.content)
+            cv2.imshow('text', img)
+            cv2.waitKey()
+            cv2.destroyWindow('text')