4 years ago · 1a27cfd39f
--- a/segment/sheet_resolve/analysis/anchor/marker_detection.py
+++ b/segment/sheet_resolve/analysis/anchor/marker_detection.py
@@ -4,8 +4,8 @@ import math
 
															 from .util import *
														
 
															 import ctypes
														
 
															 import time
														
 
															-import sys
														
 
															 import numpy as np
														
 
															+
														
 
															 try:
														
 
															     temp = ctypes.windll.LoadLibrary('opencv_ffmpeg410_64.dll')
														
 
															 except:
														
@@ -181,6 +181,7 @@ def detect_anchor_by_position(anchors, markers, image, method, debug=0):
 
															 def detect_anchor_public(image, method='connected', debug=0):
														
 
															     #   寻找第三方试卷最上方及最下方的定位点
														
 
															+    #   anchor:[xmin, ymin, xmax, ymax]
														
 
															     shift_threshold = 50  # 80
														
 
															     height, width = image.shape[:2]
														
 
															     h0, h1 = 0.1, 0.9
														
@@ -188,34 +189,45 @@ def detect_anchor_public(image, method='connected', debug=0):
 
															     pos_threshold = 0.1
														
 
															     area_threshold = 0.28  # 0.25   # 大定位点面积差阈值
														
 
															     anchors_len_threshold = 2
														
 
															-    shape_para = {'height': (80, 10), 'w2h': (3, 0.6), 'area': (6000, 500), 'area_ratio': 0.9}
														
 
															-    blur_size = 3
														
 
															-    sigma = 5
														
 
															+    shape_para = {'height': (80, 10), 'w2h': (3, 0.6), 'area': (8000, 500), 'area_ratio': 0.9}
														
 
															+    blur_size = 1
														
 
															+    sigma = 1
														
 
															+    ker_size1, ker_size2 = 2, 10
														
 
															+
														
 
															     shift_edge = 2  # 对定位点位置做微调偏移
														
 
															-    binary = pre_process_for_anchors(image, debug=0, blur_size=blur_size, sigma=sigma)
														
 
															-    binary = extract_feature(binary, method=4, debug=0)
														
 
															+    binary = pre_process_for_anchors(image, h_ratio=0, blur_size=blur_size, sigma=sigma, debug=0)
														
 
															+    binary = extract_feature(binary, ker_size1=ker_size1, ker_size2=ker_size2, method=4, debug=0)
														
 
															     boxes = find_boxes(binary, method=method, debug=0)
														
 
															     markers = find_marker_by_shape(boxes, shape_para=shape_para, debug=0)
														
 
															     marker_list = collect_markers_by_position(markers, method='h', shift_threshold=shift_threshold)
														
 
															+    anchor_list = []
														
 
															+    for m in marker_list:
														
 
															+        m = collect_markers_by_area(m)
														
 
															+        anchor_list.append(m)
														
 
															-    if len(marker_list) == 0:
														
 
															+    if len(anchor_list) == 0:
														
 
															         anchors = []
														
 
															-    elif len(marker_list) == 1:
														
 
															-        anchors = marker_list[0]
														
 
															+    elif len(anchor_list) == 1:
														
 
															+        anchors = anchor_list[0]
														
 
															     else:
														
 
															-        anchors = marker_list[0]
														
 
															-        anchors.extend(marker_list[-1])
														
 
															+        anchors = anchor_list[0]
														
 
															+        anchors.extend(anchor_list[-1])
														
 
															     anchors = [[a[0]-shift_edge, a[1]-shift_edge, a[2]-shift_edge-1, a[3]-shift_edge-1] for a in anchors]
														
 
															     if debug == 1:
														
 
															-        # print(anchors)
														
 
															+        #   显示偏移处理后的定位点信息
														
 
															+        print('Anchors after edge shifting:')
														
 
															+        print(anchors)
														
 
															         draw_box(image, anchors, (0, 255, 255), debug=1)
														
 
															         plt.figure(figsize=(15, 10))
														
 
															         plt.title(method)
														
 
															         plt.imshow(image, cmap='gray')
														
 
															         plt.show()
														
 
															     elif debug == 2:
														
 
															+        #   显示偏移处理前的定位点信息
														
 
															+        print('Achors before edge shifting:')
														
 
															+        print(markers)
														
 
															         markers.sort(reverse=True, key=lambda x: x[4][1])
														
 
															         draw_box(image, markers, debug=1)
														
 
															         plt.figure(figsize=(15, 10))
														
@@ -642,3 +654,47 @@ def find_anchor(image, method='connected'):
 
															         anchor_dict = {'class_name': 'anchor_point', 'bounding_box': bbox}
														
 
															         anchors_list.append(anchor_dict)
														
 
															     return anchors_list
														
 
															+
														
 
															+
														
 
															+if __name__ == "__main__":
														
 
															+    from pathlib import Path
														
 
															+
														
 
															+    # work_dir = sys.argv[1]
														
 
															+    # if os.path.exists(work_dir):
														
 
															+    #     img_list = glob.glob(os.path.join(work_dir, '*.jpg'))
														
 
															+    #     for img_file in img_list:
														
 
															+    #         print(img_file)
														
 
															+    #         anchors, problem_markers = main(img_file, debug=1)
														
 
															+    #
														
 
															+    # else:
														
 
															+    #     print('Directory not found!')
														
 
															+
														
 
															+    work_dir = Path(r'E:\data\location-point\8_5-lin\biology')
														
 
															+    img_list = work_dir.rglob('*.jpg')
														
 
															+    # img_list = glob.glob(os.path.join(work_dir, '*.jpg'))
														
 
															+
														
 
															+    tick = time.clock()
														
 
															+    for img_file in img_list:
														
 
															+        print(img_file)
														
 
															+        image = read_single_img(img_file)
														
 
															+        # rot_image, flag = rotate_by_anchor(image, method='connected', debug=0)
														
 
															+        anchors = detect_anchor_public(image, debug=1)
														
 
															+        # anchors, problem_markers = main(img_file, debug=1)
														
 
															+    toc = time.clock()
														
 
															+    print('time cost:', toc - tick)
														
 
															+    #
														
 
															+    # index = 14
														
 
															+    # img_file = img_list[index]
														
 
															+    # # img_file = r'E:\data\location_point\1.jpg'
														
 
															+    # print(img_file)
														
 
															+    # markers, image = detect_marker(img_file, debug=1)
														
 
															+    # # for index in (0, 2, -20, -19, -15, -16, -1, 13, 16, 18, -34, -21, -30, 7, 14, -42):
														
 
															+    # #     img_file = img_list[index]
														
 
															+    # #     print(img_file)
														
 
															+    # #     markers, image = main(img_file, debug=1)
														
 
															+
														
 
															+
														
 
															+
														
 
															+
														
 
															+
														
 
															+
														
--- a/segment/sheet_resolve/analysis/anchor/util.py
+++ b/segment/sheet_resolve/analysis/anchor/util.py
@@ -19,6 +19,8 @@ def pre_process(image, blank_top=20, blank_bottom=-20, blur_size=5, sigma=5, deb
 
															         gray = cv2.cvtColor(image, cv2.COLOR_RGB2GRAY)
														
 
															     elif image.ndim == 2:
														
 
															         gray = image
														
 
															+    else:
														
 
															+        raise Exception('The dimension of the image should be 2 or 3!')
														
 
															     #   裁边
														
 
															     gray[0:blank_top, :] = 255
														
 
															     gray[blank_bottom:, :] = 255
														
@@ -29,6 +31,7 @@ def pre_process(image, blank_top=20, blank_bottom=-20, blur_size=5, sigma=5, deb
 
															     binary = cv2.threshold(pre, 0, 255, cv2.THRESH_BINARY+cv2.THRESH_OTSU)[1]
														
 
															     if debug == 1:
														
 
															+        #   显示灰度图和二值图
														
 
															         plt.figure(figsize=(15, 10))
														
 
															         plt.subplot(211)
														
 
															         plt.title('gray')
														
@@ -41,31 +44,35 @@ def pre_process(image, blank_top=20, blank_bottom=-20, blur_size=5, sigma=5, deb
 
															     return binary
														
 
															-def pre_process_for_anchors(image, blank_top=20, blank_bottom=-20, blur_size=5, sigma=10, blank_size=20, debug=0):
														
 
															+def pre_process_for_anchors(image, blank_top=20, blank_bottom=-20, h_ratio=(0.1, 0.9),
														
 
															+                            blur_size=3, sigma=5, blank_size=20, debug=0):
														
 
															     #   去掉中间内容，返回上下定位点的二值逆图
														
 
															+    #   h_ration=0 则不裁去中间部分
														
 
															-    h_ratio = (0.1, 0.9)
														
 
															-    h0 = int(image.shape[0] * h_ratio[0])
														
 
															-    h1 = int(image.shape[0] * h_ratio[1])
														
 
															-
														
 
															+    # assert(image.ndim == 2 or image.ndim == 3)
														
 
															     if image.ndim == 3:
														
 
															         gray = cv2.cvtColor(image, cv2.COLOR_RGB2GRAY)
														
 
															     elif image.ndim == 2:
														
 
															         gray = image.copy()
														
 
															-
														
 
															+    else:
														
 
															+        raise Exception('The dimension of the image should be 2 or 3!')
														
 
															     #   裁边
														
 
															     gray[0:blank_top, :] = 255
														
 
															     gray[blank_bottom:, :] = 255
														
 
															     gray[:, 0:blank_size] = 255
														
 
															     gray[:, -blank_size:] = 255
														
 
															     #   去掉中间内容
														
 
															-    gray[h0:h1, :] = 255
														
 
															+    if h_ratio != 0:
														
 
															+        h0 = int(image.shape[0] * h_ratio[0])
														
 
															+        h1 = int(image.shape[0] * h_ratio[1])
														
 
															+        gray[h0:h1, :] = 255
														
 
															     pre = 255 - gray
														
 
															     pre = cv2.GaussianBlur(pre, (blur_size, blur_size), sigma)
														
 
															     binary = cv2.threshold(pre, 0, 255, cv2.THRESH_BINARY+cv2.THRESH_OTSU)[1]
														
 
															     if debug == 1:
														
 
															+        #   显示灰度图和二值图
														
 
															         plt.figure(figsize=(15, 10))
														
 
															         plt.subplot(211)
														
 
															         plt.title('gray')
														
@@ -106,6 +113,7 @@ def extract_feature(binary, method=4, ker_size1=2, ker_size2=10, debug=0):
 
															     else:
														
 
															         ret = binary
														
 
															     if debug == 1:
														
 
															+        #   显示特征提取其后的图像
														
 
															         plt.figure(figsize=(15, 10))
														
 
															         plt.subplot(211)
														
 
															         plt.title('before feature extraction')
														
@@ -155,8 +163,13 @@ def find_boxes(binary, method='connected', debug=0):
 
															         boxes = draw_contour(binary)
														
 
															     elif method == 'connected':
														
 
															         boxes = draw_connected_component(binary)
														
 
															+    else:
														
 
															+        raise Exception('Wrong method for finding boxes!')
														
 
															+
														
 
															     if debug == 1:
														
 
															+        #   显示boxes信息
														
 
															         boxes.sort(key=lambda x: x[4][1])
														
 
															+        print('The features of the boxes after feature extractions:')
														
 
															         for box in boxes:
														
 
															             width = box[2] - box[0]
														
 
															             height = box[3] - box[1]
														
@@ -191,7 +204,9 @@ def find_marker_by_shape(boxes,
 
															             markers.append(box)
														
 
															     if debug == 1:
														
 
															+        #   显示通过形状参数找到的定位点信息
														
 
															         markers.sort(reverse=True, key=lambda x: x[-1])
														
 
															+        print('The features of the markers picking up by shapes:')
														
 
															         for box in markers:
														
 
															             width = box[2] - box[0]
														
 
															             height = box[3] - box[1]
														
@@ -202,6 +217,8 @@ def find_marker_by_shape(boxes,
 
															             print('width:{}, height:{}, centroid:{}, w_to_h:{}, area:{}, area ratio:{}'.
														
 
															                   format(width, height, centroid, w_to_h, area, area_ratio))
														
 
															     elif debug == 2:
														
 
															+        #   显示所有定位点信息
														
 
															+        print('The features of the markers without picking up by shapes:')
														
 
															         for box in boxes:
														
 
															             markers.append(box)
														
 
															         for box in markers:
														
@@ -324,6 +341,15 @@ def collect_markers_by_position(boxes, method='h', shift_threshold=30, slope_thr
 
															     return box_list
														
 
															+def collect_markers_by_area(boxes, area_threshold=2):
														
 
															+    #   去除面积相差过大的定位点
														
 
															+    boxes.sort(reverse=True, key=lambda x: x[-1])
														
 
															+    # print(boxes[0])
														
 
															+    min_area = boxes[0][-1] / area_threshold
														
 
															+    boxes = [b for b in boxes if b[-1] > min_area]
														
 
															+    return boxes
														
 
															+
														
 
															+
														
 
															 def check_with_anchor(problem_markers, top_anchors, page_width, column_num):
														
 
															     #    根据top_anchors位置去除异常markers
														
 
															     min_shift = 100
														
@@ -483,14 +509,16 @@ def draw_box(image, boxes, color=(0, 255, 0), debug=0):
 
															             cv2.rectangle(image, (box[0], box[1]), (box[2], box[3]), color, 5)
														
 
															     if debug == 1:
														
 
															+        #   显示定位点信息
														
 
															         for box in boxes:
														
 
															             if len(box) == 4:
														
 
															                 width = box[2] - box[0]
														
 
															                 height = box[3] - box[1]
														
 
															                 w_to_h = width / height
														
 
															+                area = width * height
														
 
															                 # centroid = (box[0]+box[1])/2, (box[1]+box[3])/2
														
 
															-                print('width:{}, height:{}, w_to_h:{}, top_left:{}, bottom_right:{},'.
														
 
															-                      format(width, height, w_to_h, box[0:2], box[2:4]))
														
 
															+                print('width:{}, height:{}, w_to_h:{}, area:{}, top_left:{}, bottom_right:{},'.
														
 
															+                      format(width, height, w_to_h, area, box[0:2], box[2:4]))
														
 
															             elif len(box) > 4:
														
 
															                 width = box[2] - box[0]
														
 
															                 height = box[3] - box[1]
														
@@ -622,3 +650,5 @@ def find_column(anchors, width, column_num=2, debug=0):
 
															         print('page width:', page_width, 'column number:', column_num, 'column position:', column_pos)
														
 
															     return page_width, column_num, column_pos
														
 
															+
														
 
															+
														
--- a/segment/sheet_resolve/analysis/choice/choice_line_box.py
+++ b/segment/sheet_resolve/analysis/choice/choice_line_box.py
@@ -291,6 +291,9 @@ def choice_m_row_col0(left, top, image, choice_bbox_list, xml_path, img, choice_
 
															     choice_m_dict_list = []
														
 
															     for index0, box in enumerate(choice_bbox_list['regions']):  # rcnn识别的框匹配题号
														
 
															         box = box['bounding_box']
														
 
															+        box['ymin'] = box['ymin'] - 3  # lf_7_2 1change
														
 
															+        box['xmax'] = box['xmax'] + 3
														
 
															+        box['ymax'] = box['ymax'] + 3
														
 
															         m_left, m_top = box['xmin']+left, box['ymin']+top,
														
 
															         box_coordiante = (m_left, m_top, box['xmax']+left, box['ymax']+top)
														
 
															         tree = utils.create_xml('choice_m', tree,
														
@@ -376,13 +379,25 @@ def choice_bbox_vague(choice_m_list0, x_y_interval_ave, singe_box_width_height_a
 
															             x_diff = x_y_interval_ave[0]
														
 
															             s_width = singe_box_width_height_ave[0]
														
 
															             choice_bbox = (np.hstack((np.array([min(xmin0) - x_diff - 3 * s_width, min(ymin0)]), np.array([max(xmax0), max(ymax0)])))).tolist()
														
 
															-            choice_bbox_with_index_list = (choice_bbox, choice_m_list1[1])
														
 
															+            choice_box = []
														
 
															+            for element in choice_bbox:
														
 
															+                if element < 0:
														
 
															+                    choice_box.append(0)
														
 
															+                else:
														
 
															+                    choice_box.append(element)
														
 
															+            choice_bbox_with_index_list = (choice_box, choice_m_list1[1])
														
 
															             choice_bbox_all.append(choice_bbox_with_index_list)
														
 
															         elif direction == 90:
														
 
															             y_diff = x_y_interval_ave[1]
														
 
															             s_height = singe_box_width_height_ave[1]
														
 
															             choice_bbox = (np.hstack((np.array([min(xmin0), min(ymin0) - y_diff - 3 * s_height]), np.array([max(xmax0), max(ymax0)])))).tolist()
														
 
															-            choice_bbox_with_index_list = (choice_bbox, choice_m_list1[1])
														
 
															+            choice_box = []
														
 
															+            for element in choice_bbox:
														
 
															+                if element < 0:
														
 
															+                    choice_box.append(0)
														
 
															+                else:
														
 
															+                    choice_box.append(element)
														
 
															+            choice_bbox_with_index_list = (choice_box, choice_m_list1[1])
														
 
															             choice_bbox_all.append(choice_bbox_with_index_list)
														
 
															     return choice_bbox_all
														
@@ -418,6 +433,9 @@ def choice_m_adjust(image, choice_m_bbox_list):
 
															     a_z = 'ABCDEFGHIJKLMNOPQRSTUVWXYZ'
														
 
															     for index0, choice_m in enumerate(choice_m_bbox_list):  # rcnn识别的框匹配题号
														
 
															         box = choice_m['bounding_box']
														
 
															+        box['ymin'] = choice_m['ymin'] - 3  # lf_7_2 1change
														
 
															+        box['xmax'] = choice_m['xmax'] + 3
														
 
															+        box['ymax'] = choice_m['ymax'] + 3
														
 
															         m_left, m_top = box['xmin'], box['ymin'],
														
 
															         # box_coordiante = (m_left, m_top, box['xmax'], box['ymax'])
														
 
															         single_choice_m = utils.crop_region(image, box)
														
@@ -434,7 +452,7 @@ def choice_m_adjust(image, choice_m_bbox_list):
 
															     return choice_m_bbox_list
														
 
															-def choice_m_row_col(image, choice_m_bbox_list, direction, xml_path):
														
 
															+def choice_m_row_col(image, choice_m_bbox_list, direction, subject, xml_path):
														
 
															     a_z = 'ABCDEFGHIJKLMNOPQRSTUVWXYZ'
														
 
															     choice_m_dict_list = []
														
@@ -444,14 +462,16 @@ def choice_m_row_col(image, choice_m_bbox_list, direction, xml_path):
 
															         choice_m_for_dircetion = utils.crop_region(image, choice_m_bbox_list[random_one]['bounding_box'])
														
 
															         res_dict = get_ocr_text_and_coordinate(choice_m_for_dircetion, ocr_accuracy='accurate', language_type='ENG')
														
 
															         direction = get_direction(res_dict)
														
 
															-
														
 
															     for index0, box in enumerate(choice_m_bbox_list):  # rcnn识别的框匹配题号
														
 
															         box = box['bounding_box']
														
 
															+        box['ymin'] = box['ymin'] - 3   # lf_7_2 1change
														
 
															+        box['xmax'] = box['xmax'] + 3
														
 
															+        box['ymax'] = box['ymax'] + 3
														
 
															         m_left, m_top = box['xmin'], box['ymin'],
														
 
															         # box_coordiante = (m_left, m_top, box['xmax'], box['ymax'])
														
 
															         single_choice_m = utils.crop_region(image, box)
														
 
															         try:
														
 
															-            row_col_dict = get_choice_m_row_and_col(m_left, m_top, single_choice_m)     # 所有的小框，行列等
														
 
															+            row_col_dict = get_choice_m_row_and_col(m_left, m_top, single_choice_m)     # 所有的小框，行列
														
 
															             if len(row_col_dict) > 0:
														
 
															                 if direction == 90:
														
@@ -472,6 +492,8 @@ def choice_m_row_col(image, choice_m_bbox_list, direction, xml_path):
 
															                 row_col_dict.update({'direction': direction, 'option': choice_option,
														
 
															                                      'number': title_number, 'default_points': default_points})
														
 
															                 choice_m_dict_list.append(row_col_dict)
														
 
															+            # else:
														
 
															+            #     del choice_m_bbox_list[index0]
														
 
															         except Exception:
														
 
															             pass
														
@@ -496,7 +518,8 @@ def choice_m_row_col(image, choice_m_bbox_list, direction, xml_path):
 
															         else:
														
 
															             for index, s_box in enumerate(choice_m_box_dict):
														
 
															                 all_small_coordinate_dict = s_box['all_small_coordinate']
														
 
															-                all_small_coordinate_list = [[ele['xmin'], ele['ymin'], ele['xmax'], ele['ymax']] for ele in all_small_coordinate_dict]
														
 
															+                all_small_coordinate_list = [[ele['xmin'], ele['ymin'], ele['xmax'], ele['ymax']] for ele in
														
 
															+                                             all_small_coordinate_dict]
														
 
															                 col = s_box['cols']
														
 
															                 rows = s_box['rows']
														
 
															                 if rows == 1:
														
@@ -511,11 +534,35 @@ def choice_m_row_col(image, choice_m_bbox_list, direction, xml_path):
 
															                         int(np.mean(s_box_array[:, 2])) - int(np.mean(s_box_array[:, 0])),
														
 
															                         int(np.mean(s_box_array[:, 3])) - int(np.mean(s_box_array[:, 1])))
														
 
															                     s_box_w_h.append(s_box_wid_hei)
														
 
															-        x_y_interval_arr = np.array(x_y_interval_all)
														
 
															-        if len(x_y_interval_arr) == 1:
														
 
															+        whether_nan = [ele for index, ele in enumerate(x_y_interval_all) if 'nan' in ele]
														
 
															+        if len(whether_nan) == 0:
														
 
															+            x_y_interval_all0 = x_y_interval_all
														
 
															+        else:
														
 
															+            if len(x_y_interval_all) == 1:
														
 
															+                x_y_interval_all0 = s_box_w_h
														
 
															+            else:
														
 
															+                x_y_interval_all1 = []
														
 
															+                for element in x_y_interval_all:
														
 
															+                    if element not in whether_nan:
														
 
															+                        x_y_interval_all1.append(element)
														
 
															+                x_y_interval_all2 = [x_y_interval_all1[0] for i in range(len(whether_nan))]
														
 
															+                x_y_interval_all0 = x_y_interval_all1 + x_y_interval_all2
														
 
															+
														
 
															+        x_y_interval_arr = np.array(x_y_interval_all0)
														
 
															+        if len(x_y_interval_arr) == 1 and len(rows_list) != 0:
														
 
															             x_y_interval_all_arr = np.array(x_y_interval_all)
														
 
															-            x_ = int(np.mean(x_y_interval_all_arr[:, 0]))
														
 
															-            y_ = int(np.mean(x_y_interval_all_arr[:, 1]))
														
 
															+            x_ = int(np.mean(x_y_interval_all_arr[:, 0][0][0]))
														
 
															+            y_ = int(np.mean(x_y_interval_all_arr[:, 0][0][1]))
														
 
															+            x_y_interval_ave = (x_, y_)
														
 
															+
														
 
															+            singe_box_width_height_ave = s_box_w_h[0]
														
 
															+
														
 
															+            image_height, image_width, _ = image.shape
														
 
															+            image_size = (image_width, image_height)
														
 
															+        elif len(x_y_interval_arr) == 1 and len(rows_list) == 0:
														
 
															+            x_y_interval_all_arr = np.array(x_y_interval_all)
														
 
															+            x_ = int(np.mean(x_y_interval_all_arr[0][0]))
														
 
															+            y_ = int(np.mean(x_y_interval_all_arr[0][1]))
														
 
															             x_y_interval_ave = (x_, y_)
														
 
															             singe_box_width_height_ave = s_box_w_h[0]
														
@@ -530,15 +577,25 @@ def choice_m_row_col(image, choice_m_bbox_list, direction, xml_path):
 
															             image_height, image_width, _ = image.shape
														
 
															             image_size = (image_width, image_height)
														
 
															-        choice_bbox = choice_bbox_vague(choice_m_list, x_y_interval_ave, singe_box_width_height_ave, direction, image_size)
														
 
															+
														
 
															+        choice_bbox = choice_bbox_vague(choice_m_list, x_y_interval_ave, singe_box_width_height_ave, direction,
														
 
															+                                        image_size)
														
 
															         choice_m_dict_list_all_tmp = []
														
 
															         for index, choice_box_ele in enumerate(choice_bbox):
														
 
															-            choice_region = utils.crop_region_direct(image, choice_box_ele[0])
														
 
															-            # choice_path = xml_path[: xml_path.rfind('\\')]
														
 
															-            # cv2.imwrite(os.path.join(choice_path, 'choice_region_' + str(index) + '.jpg'), choice_region)
														
 
															+            choice_bbox_ele = []
														
 
															+            if direction == 180:
														
 
															+                choice_bbox_ele0 = choice_box_ele[0]
														
 
															+                choice_bbox_ele = [choice_bbox_ele0[0], choice_bbox_ele0[1] - 2,
														
 
															+                                   choice_bbox_ele0[2], choice_bbox_ele0[3] + 5]
														
 
															+            elif direction == 90:
														
 
															+                choice_bbox_ele = choice_box_ele[0]
														
 
															+            choice_region = utils.crop_region_direct(image, choice_bbox_ele)
														
 
															+            choice_path = xml_path[: xml_path.rfind('/')]
														
 
															+            cv2.imwrite(os.path.join(choice_path, 'choice_region_' + str(index) + '.jpg'), choice_region)
														
 
															             choice_m_box_dict_new = [choice_m_box_dict[i] for i in choice_box_ele[1]]
														
 
															-            choice_m_dict_list_part = get_title_number_by_choice_m.get_title_number(choice_box_ele[0], choice_region,
														
 
															-                                                                                     choice_m_box_dict_new, direction)
														
 
															+            choice_m_dict_list_part = get_title_number_by_choice_m.get_title_number(choice_bbox_ele, choice_region,
														
 
															+                                                                                    image, choice_m_box_dict_new,
														
 
															+                                                                                    x_y_interval_ave, subject, direction)
														
 
															             choice_m_dict_list_all_tmp.append(choice_m_dict_list_part)
														
 
															         if len(choice_m_dict_list_all_tmp) == 1:
														
 
															             choice_m_dict_list_all = choice_m_dict_list_all_tmp[0]
														
--- a/segment/sheet_resolve/analysis/choice/get_title_number_by_choice_m.py
+++ b/segment/sheet_resolve/analysis/choice/get_title_number_by_choice_m.py
@@ -4,6 +4,7 @@ import numpy as np
 
															 import re, os
														
 
															 import xml.etree.cElementTree as ET
														
 
															 import cv2
														
 
															+from concurrent.futures import ThreadPoolExecutor
														
 
															 def combine_char(all_digital_list):
														
@@ -42,6 +43,82 @@ def combine_char(all_digital_list):
 
															     return new_all_digital_list
														
 
															+def modify_coordinate(words_result_choice):
														
 
															+    # single character height 22  width  17
														
 
															+    # two character height 21  width 30
														
 
															+    digital_list = []
														
 
															+    for ele in words_result_choice:
														
 
															+        pattern1 = re.compile('\d+')
														
 
															+        if pattern1.findall(ele['char']):
														
 
															+            digital_list.append(ele)
														
 
															+            # if re.search('[ABCD]', ele['char']) == None:
														
 
															+            #     digital_list.append(ele)
														
 
															+
														
 
															+    s_l = []
														
 
															+    t_l = []
														
 
															+
														
 
															+    for ele in digital_list:
														
 
															+        char = ele['char']
														
 
															+        char1 = re.findall('\d+', char)[0]
														
 
															+        pattern1 = re.compile('\d+')
														
 
															+        pattern2 = re.compile(r'[A|B|C|D]|[(（]|[)）]')  # ABCD ..
														
 
															+        pattern3 = re.compile('[\u4e00-\u9fa5]')  # chinese char
														
 
															+        if pattern1.findall(ele['char']):
														
 
															+            if not pattern3.findall(ele['char']) and not pattern2.findall(ele['char']):
														
 
															+                if len(char1) == 1:
														
 
															+                    s_l.append(ele)
														
 
															+                else:
														
 
															+                    t_l.append(ele)
														
 
															+
														
 
															+    if s_l != []:
														
 
															+        s_h_list = [ele['location']['height'] for ele in s_l]
														
 
															+        s_w_list = [ele['location']['width'] for ele in s_l]
														
 
															+
														
 
															+        s_h_mean = int(np.mean(np.array(s_h_list)))  # single  height
														
 
															+        s_w_mean = int(np.mean(np.array(s_w_list)))  # single  width
														
 
															+    else:
														
 
															+        s_h_list = [ele['location']['height'] for ele in words_result_choice]
														
 
															+        s_h_mean = int(np.mean(np.array(s_h_list)))  # single  height
														
 
															+        s_w_mean = 18
														
 
															+
														
 
															+    if t_l != []:
														
 
															+        t_h_list = [ele['location']['height'] for ele in t_l]
														
 
															+        t_w_list = [ele['location']['width'] for ele in t_l]
														
 
															+
														
 
															+        t_h_mean = int(np.mean(np.array(t_h_list)))  # single  height
														
 
															+        t_w_mean = int(np.mean(np.array(t_w_list)))  # single  width
														
 
															+    else:
														
 
															+        t_h_list = [ele['location']['height'] for ele in words_result_choice]
														
 
															+        t_h_mean = int(np.mean(np.array(t_h_list)))  # single  height
														
 
															+        t_w_mean = 31
														
 
															+
														
 
															+    digital_list_all = []
														
 
															+    for ele in words_result_choice:
														
 
															+        pattern1 = re.compile('\d+')
														
 
															+        if pattern1.findall(ele['char']):
														
 
															+            if re.search('[A|B|C|D]', ele['char']) != None:
														
 
															+                char1 = len(pattern1.findall(ele['char'])[0])
														
 
															+                if char1 == 1:
														
 
															+                    location = {}
														
 
															+                    location['left'] = ele['location']['left']
														
 
															+                    location['top'] = ele['location']['top']
														
 
															+                    location['width'] = s_w_mean
														
 
															+                    location['height'] = s_h_mean
														
 
															+                    ele.update({'location': location})
														
 
															+                    digital_list_all.append(ele)
														
 
															+                elif char1 == 2:
														
 
															+                    location = {}
														
 
															+                    location['left'] = ele['location']['left']
														
 
															+                    location['top'] = ele['location']['top']
														
 
															+                    location['width'] = t_w_mean
														
 
															+                    location['height'] = t_h_mean
														
 
															+                    ele.update({'location': location})
														
 
															+                    digital_list_all.append(ele)
														
 
															+            else:
														
 
															+                digital_list_all.append(ele)
														
 
															+    return digital_list_all
														
 
															+
														
 
															+
														
 
															 def get_x_diff_and_y_diff0(single_choice_m_coordinates):
														
 
															     single_choice_m_matrix = np.array(single_choice_m_coordinates)
														
 
															     x_diff = single_choice_m_matrix[1:, 0] - single_choice_m_matrix[:-1, 2]
														
@@ -303,26 +380,203 @@ def analysis_s_box(choice_m_bbox_list):
 
															     return choice_m_box_dict
														
 
															-def get_title_number(choice_bbox, choice_region, choice_m_box_dict, direction):
														
 
															-    words_result_choice = get_ocr_text_and_coordinate0(choice_region, ocr_accuracy='accurate', language_type='CHN_ENG')
														
 
															+def decide_box_left(one_line_box, digital_list):
														
 
															+    one_line_box = sorted(one_line_box, key=lambda k: k[0])
														
 
															+
														
 
															+    min_w = one_line_box[0][0]
														
 
															+    max_w = one_line_box[-1][2]
														
 
															+    width = max_w - min_w
														
 
															+
														
 
															+    s_box_width = 27
														
 
															+    s_box_height = 20
														
 
															+
														
 
															+    # compare two box
														
 
															+    s_box = one_line_box[0]
														
 
															+
														
 
															+    s_box_xmin = s_box[0]
														
 
															+    s_box_ymin = s_box[1]
														
 
															+    s_box_xmax = s_box[2]
														
 
															+    s_box_ymax = s_box[3]
														
 
															+
														
 
															+    mid_x1 = int(s_box_xmin + (s_box_xmax - s_box_xmin) // 2)
														
 
															+    mid_y1 = int(s_box_ymin + (s_box_ymax - s_box_ymin) // 2)
														
 
															+
														
 
															+    digital_box = digital_list[0]
														
 
															+
														
 
															+    xmin_d = digital_box['location']['left']
														
 
															+    ymin_d = digital_box['location']['top']
														
 
															+    xmax_d = digital_box['location']['left'] + digital_box['location']['width']
														
 
															+    ymax_d = digital_box['location']['top'] + digital_box['location']['height']
														
 
															+
														
 
															+    if xmin_d < s_box_xmin and mid_x1 <= 2 * width and ymin_d <= mid_y1 <= ymax_d:
														
 
															+        return True
														
 
															+    else:
														
 
															+        return False
														
 
															+
														
 
															+
														
 
															+def analyse_words_result(words_result):
														
 
															+    char_list = []
														
 
															+    for ele in words_result:
														
 
															+        digital_list = []
														
 
															+        un_digital_list = []
														
 
															+        for ele0 in ele['chars']:
														
 
															+            digital = re.findall('\d+', ele0['char'])
														
 
															+            if len(digital) == 0:
														
 
															+                un_digital_list.append(ele0)
														
 
															+            else:
														
 
															+                digital_list.append(ele0)
														
 
															+        digital_list1 = combine_char(digital_list)
														
 
															+        words_dict = {}
														
 
															+        words_dict['words'] = ele['words']
														
 
															+        char_list_all = digital_list1 + un_digital_list + [words_dict]
														
 
															+        char_list.append(char_list_all)
														
 
															+    return char_list
														
 
															+
														
 
															+
														
 
															+def get_chinese_choice_number(choice_m_box_dict, image):
														
 
															+    for index, ele in enumerate(choice_m_box_dict):
														
 
															+        choice_m_box = [ele['bounding_box']['xmin'], ele['bounding_box']['ymin'],
														
 
															+                        ele['bounding_box']['xmax'], ele['bounding_box']['ymax']]
														
 
															+
														
 
															+        all_small_coordinate_dict = ele['all_small_coordinate']
														
 
															+        all_small_coordinate_list = [[ele['xmin'], ele['ymin'], ele['xmax'], ele['ymax']] for ele in
														
 
															+                                     all_small_coordinate_dict]
														
 
															+        res_list = get_one_line_box(all_small_coordinate_list, ele['single_height'])
														
 
															+
														
 
															+        c_w = choice_m_box[2] - choice_m_box[0]
														
 
															+        c_h = choice_m_box[3] - choice_m_box[1]
														
 
															+
														
 
															+        choice_m_box_forward = [choice_m_box[0] - int(1.5 * c_w), ele['bounding_box']['ymin'] - 5,
														
 
															+                                    ele['bounding_box']['xmax'], ele['bounding_box']['ymax']]
														
 
															+
														
 
															+        all_small_coordinate_list_new = []
														
 
															+        for s_box_line in res_list:
														
 
															+            line_box = []
														
 
															+            for s_box in s_box_line:
														
 
															+                ss_box = utils.get_img_region_box1(s_box, choice_m_box_forward)
														
 
															+                line_box.append(ss_box)
														
 
															+            line_box_array = np.array(line_box)
														
 
															+            width_s = int(np.mean(line_box_array[:, 2] - line_box_array[:, 0]))
														
 
															+            width_h = int(np.mean(line_box_array[:, 3] - line_box_array[:, 1]))
														
 
															+            s_box_dict = {}
														
 
															+            s_box_dict['bbox'] = line_box
														
 
															+            s_box_dict['width_s'] = width_s
														
 
															+            s_box_dict['width_h'] = width_h
														
 
															+            all_small_coordinate_list_new.append(s_box_dict)
														
 
															+        # print(all_small_coordinate_list_new)
														
 
															+
														
 
															+        region = utils.crop_region_direct(image, choice_m_box_forward)
														
 
															+        words_result = get_ocr_text_and_coordinate0(region)
														
 
															+        char_list = analyse_words_result(words_result)
														
 
															+
														
 
															+        number0 = []
														
 
															+        value0 = []
														
 
															+        for one_line in all_small_coordinate_list_new:
														
 
															+            one_line_box = one_line['bbox']
														
 
															+
														
 
															+            number_list = []
														
 
															+            for ele_line in char_list:
														
 
															+                ele_line_copy = ele_line.copy()
														
 
															+                ele_line_copy = [ele for ele in ele_line_copy if 'char' in ele]
														
 
															+
														
 
															+                digital_list_line = sorted(ele_line_copy, key=lambda k: k['location']['left'])
														
 
															+                # TODO  decide left
														
 
															+
														
 
															+                if decide_box_left(one_line_box, digital_list_line) == True:
														
 
															+                    number_list.append(ele_line)
														
 
															+                else:
														
 
															+                    continue
														
 
															+            # print(number_list)
														
 
															+
														
 
															+            for s_bbox0 in number_list:
														
 
															+                for s_bbox in s_bbox0:
														
 
															+                    if 'words' in s_bbox:
														
 
															+                        words = s_bbox['words']
														
 
															+
														
 
															+                        pattern1 = re.compile(
														
 
															+                            '^\d+[,、.]?[\u4e00-\u9fa5]?[(（]?\d+分+[)）]?[(（]?\d+[)）]?|^\d+[,、.]?[\u4e00-\u9fa5]?[(（]?\d+分+[)）]?')
														
 
															+                        result1 = re.findall(pattern1, words)
														
 
															+
														
 
															+                        pattern11 = re.compile('^\d+[,、.]?[\u4e00-\u9fa5]?[(（]?\d+[)）]?')
														
 
															+                        result11 = re.findall(pattern11, words)
														
 
															+
														
 
															+                        pattern2 = re.compile('[(（]?\d+[)）]?')
														
 
															+                        result2 = re.findall(pattern2, words)
														
 
															+
														
 
															+                        pattern3 = re.compile('[(（]?\d?分+[)）]?')
														
 
															+                        result3 = re.findall(pattern3, words)
														
 
															+
														
 
															+                        if result2 and result3:
														
 
															+                            number = int(result2[0])
														
 
															+                            value_str = re.findall('\d+', result2[1])
														
 
															+                            value = int(value_str[0])
														
 
															+                            number0.append(number)
														
 
															+                            value0.append(value)
														
 
															+
														
 
															+                        elif result2 and not result3:
														
 
															+                            number = int(result2[0])
														
 
															+                            value = -1
														
 
															+                            number0.append(number)
														
 
															+                            value0.append(value)
														
 
															+
														
 
															+        ele.update({'number': number0, 'default_points': value0})
														
 
															+    return choice_m_box_dict
														
 
															+
														
 
															+
														
 
															+def get_title_number(choice_bbox, choice_region, image, choice_m_box_dict, x_y_interval_ave0, subject, direction):
														
 
															+    # c_h, c_w, _ = choice_region.shape
														
 
															+    # if c_h * c_w > 1000 * 1000:
														
 
															+    #     # baidu ocr format
														
 
															+    #     words_result_choice_raw = get_ocr_text_and_coordinate0(choice_region, ocr_accuracy='accurate', language_type='CHN_ENG')
														
 
															+    #     words_result_choice1 = [ele1 for ele in words_result_choice_raw for ele1 in ele['chars']]
														
 
															+    #     words_result_choice1 = combine_char(words_result_choice1)    # baidu need
														
 
															+
														
 
															+    # else:
														
 
															+    # tr ocr
														
 
															+    words_result_choice1 = ''
														
 
															+    if direction == 90:
														
 
															+        words_result_choice_raw = get_ocr_text_and_coordinate0(choice_region, ocr_accuracy='accurate', language_type='CHN_ENG')
														
 
															+        char_list = [ele1 for ele in words_result_choice_raw for ele1 in ele['chars']]
														
 
															+        words_result_choice1 = combine_char(char_list)
														
 
															+
														
 
															+    elif direction == 180:
														
 
															+        choice_gray = cv2.cvtColor(choice_region, cv2.COLOR_BGR2GRAY)
														
 
															+        with ThreadPoolExecutor() as executor:
														
 
															+            future = executor.submit(tr.run, choice_gray)
														
 
															+            words_result_choice0 = future.result()
														
 
															+            words_result_choice_tmp = utils.change_baidu_to_tr_format(words_result_choice0)
														
 
															+            # tr  I  -- > 1
														
 
															+            words_result_choice1 = []
														
 
															+            for ele in words_result_choice_tmp:
														
 
															+                if 'I' in ele['char']:
														
 
															+                    element = re.sub('I', '1', ele['char'])
														
 
															+                    ele.update({'char': element})
														
 
															+                    words_result_choice1.append(ele)
														
 
															+                else:
														
 
															+                    words_result_choice1.append(ele)
														
 
															+    words_result_choice = modify_coordinate(words_result_choice1)
														
 
															+
														
 
															     all_digital_list0 = []
														
 
															-    pattern = re.compile(r'\d')
														
 
															-    for i, chars_dict in enumerate(words_result_choice):
														
 
															-        chars_list = chars_dict['chars']
														
 
															-        for ele in chars_list:
														
 
															-            if pattern.search(ele['char']):
														
 
															-                all_digital_list0.append(ele)
														
 
															+    pattern = re.compile(r'\d+')
														
 
															+    for i, ele in enumerate(words_result_choice):
														
 
															+        if pattern.findall(ele['char']):
														
 
															+            all_digital_list0.append(ele)
														
 
															+
														
 
															+    for i, ele in enumerate(all_digital_list0):
														
 
															+        if pattern.findall(ele['char']):
														
 
															+            new_char = pattern.findall(ele['char'])[0]
														
 
															+            ele.update({'char': new_char})
														
 
															+    # # tree = ET.parse(r'C:\Users\admin\Desktop\exam_segment_django113\segment\exam_info\000000-template.xml')  # xml tree
														
 
															+    # # for index, bbox in enumerate(all_digital_list0):
														
 
															+    # #     # bbox0 = region_info['bbox']
														
 
															+    # #     location = bbox['location']
														
 
															+    # #     xmin = location['left']
														
 
															+    # #     ymin = location['top']
														
 
															+    # #     xmax = location['left'] + location['width']
														
 
															+    # #     ymax = location['top'] + location['height']
														
 
															+    # #     tree = utils.create_xml(bbox['char'], tree, xmin, ymin, xmax, ymax)
														
 
															+    # # tree.write(r'C:\Users\admin\Desktop\exam_segment_django113\segment\exam_image\sheet\arts_comprehensive\2020-02-05\choice_region_00.xml')
														
 
															-    # tree = ET.parse(r'C:\Users\admin\Desktop\exam_segment_django113\segment\exam_info\000000-template.xml')  # xml tree
														
 
															-    # for index, bbox in enumerate(all_digital_list0):
														
 
															-    #     # bbox0 = region_info['bbox']
														
 
															-    #     location = bbox['location']
														
 
															-    #     xmin = location['left']
														
 
															-    #     ymin = location['top']
														
 
															-    #     xmax = location['left'] + location['width']
														
 
															-    #     ymax = location['top'] + location['height']
														
 
															-    #     tree = utils.create_xml(bbox['char'], tree, xmin, ymin, xmax, ymax)
														
 
															-    # tree.write(r'C:\Users\admin\Desktop\exam_segment_django113\segment\exam_image\sheet\arts_comprehensive\2020-02-05\choice_region_00.xml')
														
 
															     delete_list = []
														
 
															     for ele_digtal in all_digital_list0:
														
@@ -333,12 +587,20 @@ def get_title_number(choice_bbox, choice_region, choice_m_box_dict, direction):
 
															             ymax_d = ele_digtal['location']['top'] + ele_digtal['location']['height']
														
 
															             ele_digtal_bbox = [xmin_d, ymin_d, xmax_d, ymax_d]
														
 
															+            ele_digtal_bbox_tmp = [xmin_d + 4, ymin_d - 3, xmax_d - 6, ymax_d - 3]
														
 
															+
														
 
															             ele_choice_m_bbox = [ele_choice_m['bounding_box']['xmin'], ele_choice_m['bounding_box']['ymin'],
														
 
															                                  ele_choice_m['bounding_box']['xmax'], ele_choice_m['bounding_box']['ymax']]
														
 
															             choice_m_new_box = utils.get_img_region_box1(ele_choice_m_bbox, choice_bbox)
														
 
															-            if utils.decide_coordinate_full_contains2(choice_m_new_box, ele_digtal_bbox) == True:
														
 
															+            ele_digtal_bbox_tmp_array = np.array(ele_digtal_bbox_tmp)
														
 
															+            neg_ele = np.where(ele_digtal_bbox_tmp_array < 0)[0]
														
 
															+
														
 
															+            if len(neg_ele) != 0:
														
 
															+                delete_list.append(ele_digtal)
														
 
															+                break
														
 
															+            elif utils.decide_coordinate_full_contains2(choice_m_new_box, ele_digtal_bbox_tmp) == True:
														
 
															                 delete_list.append(ele_digtal)
														
 
															     all_digital_list = []
														
@@ -348,6 +610,7 @@ def get_title_number(choice_bbox, choice_region, choice_m_box_dict, direction):
 
															             continue
														
 
															         else:
														
 
															             all_digital_list.append(ele)
														
 
															+    # print(all_digital_list)
														
 
															     # new_all_digital_list = combine_char(all_digital_list)
														
 
															     #
														
@@ -407,8 +670,11 @@ def get_title_number(choice_bbox, choice_region, choice_m_box_dict, direction):
 
															                 choice_m_box_dict_new.append(s_choice_m_box)
														
 
															             else:
														
 
															                 x_y_interval = utils.get_x_diff_and_y_diff1(all_small_coordinate_new, col)
														
 
															-                x_y_interval_all.append(x_y_interval)
														
 
															-
														
 
															+                if 'nan' in x_y_interval:
														
 
															+                    x_y_interval = x_y_interval_ave0
														
 
															+                    x_y_interval_all.append(x_y_interval)
														
 
															+                else:
														
 
															+                    x_y_interval_all.append(x_y_interval)
														
 
															                 all_small_coordinate_list = sorted(all_small_coordinate_new, key=lambda k: k[1])
														
 
															                 s_box_array = np.array(all_small_coordinate_list)
														
 
															                 s_box_wid_hei = (int(np.mean(s_box_array[:, 2])) - int(np.mean(s_box_array[:, 0])),
														
@@ -427,14 +693,14 @@ def get_title_number(choice_bbox, choice_region, choice_m_box_dict, direction):
 
															     s_box_w_h_arr = np.array(s_box_w_h)
														
 
															     singe_box_width_height_ave = (int(np.mean(s_box_w_h_arr[:, 0])), int(np.mean(s_box_w_h_arr[:, 1])))
														
 
															-    digital_list_by_choice_m = get_digital_near_choice_m_box(all_digital_list0, choice_m_box_dict_new, x_y_interval_ave, singe_box_width_height_ave, direction)
														
 
															+    digital_list_by_choice_m = get_digital_near_choice_m_box(all_digital_list, choice_m_box_dict_new, x_y_interval_ave, singe_box_width_height_ave, direction)
														
 
															     for number in digital_list_by_choice_m:
														
 
															         title_number_list = number['title_number']
														
 
															         all_digital_list = sorted(title_number_list, key=lambda k: k.get('location')['top'])
														
 
															-        new_title_number_list = combine_char(all_digital_list)
														
 
															-        number.update({'title_number': new_title_number_list})
														
 
															+        # new_title_number_list = combine_char(all_digital_list)
														
 
															+        number.update({'title_number': all_digital_list})
														
 
															     # tree = ET.parse(r'C:\Users\admin\Desktop\exam_segment_django113\segment\exam_info\000000-template.xml')  # xml tree
														
 
															     # for index, bbox0 in enumerate(digital_list_by_choice_m):
														
@@ -485,23 +751,50 @@ def get_title_number(choice_bbox, choice_region, choice_m_box_dict, direction):
 
															                         title_number_bbox = [ele1['location']['left'], ele1['location']['top'],
														
 
															                                              ele1['location']['left'] + ele1['location']['width'],
														
 
															                                              ele1['location']['top'] + ele1['location']['height']]
														
 
															-                        row_box = {}
														
 
															-                        if title_number_bbox[1] - single_bbox_width_height[1] < ele0[0][1] < title_number_bbox[1] + \
														
 
															-                                single_bbox_width_height[1] \
														
 
															-                                and title_number_bbox[3] - single_bbox_width_height[1] < ele0[0][3] < \
														
 
															-                                title_number_bbox[3] + single_bbox_width_height[1]:
														
 
															-                            row_box['title_number'] = ele1
														
 
															-                            row_box['row_box'] = ele0
														
 
															-                            row_box_.append(row_box)
														
 
															-                            index_list.append(index0)
														
 
															-                        elif title_number_bbox[0] - single_bbox_width_height[0] < ele0[0][0] < title_number_bbox[0] + \
														
 
															-                                single_bbox_width_height[0] \
														
 
															-                                and title_number_bbox[2] - single_bbox_width_height[0] < ele0[0][2] < \
														
 
															-                                title_number_bbox[2] + single_bbox_width_height[0]:
														
 
															-                            row_box['title_number'] = ele1
														
 
															-                            row_box['row_box'] = ele0
														
 
															-                            row_box_.append(row_box)
														
 
															-                            index_list.append(index0)
														
 
															+                        if choice_m_s['direction'] == 180:
														
 
															+                            # x axis
														
 
															+                            pattern1 = int(3 / 5 * (title_number_bbox[0] - single_bbox_width_height[0])) < \
														
 
															+                                       int(9/10 * ele0[0][0]) < \
														
 
															+                                       title_number_bbox[0] + int(1.6 * single_bbox_width_height[0]) \
														
 
															+                                       and int(3 / 5 * (title_number_bbox[2] - single_bbox_width_height[0])) < \
														
 
															+                                       int(ele0[0][2] * 9/10) < \
														
 
															+                                       title_number_bbox[2] + int(1.6 * single_bbox_width_height[0])
														
 
															+                            # y axis
														
 
															+                            pattern2 = title_number_bbox[1] - single_bbox_width_height[1] < ele0[0][1] < \
														
 
															+                                       title_number_bbox[1] + int(1.6 * single_bbox_width_height[1]) \
														
 
															+                                       and int(3 / 5 * (title_number_bbox[3] - single_bbox_width_height[1])) < \
														
 
															+                                       int(ele0[0][3] * 9 /10) < \
														
 
															+                                       title_number_bbox[3] + int(1.6 * single_bbox_width_height[1])
														
 
															+
														
 
															+                            row_box = {}
														
 
															+                            if pattern1 and pattern2:
														
 
															+                                row_box['title_number'] = ele1
														
 
															+                                row_box['row_box'] = ele0
														
 
															+                                row_box_.append(row_box)
														
 
															+                                index_list.append(index0)
														
 
															+
														
 
															+                        elif choice_m_s['direction'] == 90:
														
 
															+                            # x axis
														
 
															+                            pattern1 = title_number_bbox[0] - single_bbox_width_height[0] <= ele0[0][0] <= \
														
 
															+                                       title_number_bbox[0] + int(1.6 * single_bbox_width_height[0]) \
														
 
															+                                       and int(3 / 5 * (title_number_bbox[2] - single_bbox_width_height[0])) <= \
														
 
															+                                       int(ele0[0][2] * 0.9) \
														
 
															+                                       <= title_number_bbox[2] + int(1.6 * single_bbox_width_height[0])
														
 
															+
														
 
															+                            # y axis
														
 
															+                            pattern2 = title_number_bbox[1] - single_bbox_width_height[1] <= \
														
 
															+                                       ele0[0][1] \
														
 
															+                                       <= title_number_bbox[1] + int(3 * single_bbox_width_height[1]) \
														
 
															+                                       and int(3 / 5 * (title_number_bbox[3] - single_bbox_width_height[1])) <= \
														
 
															+                                       int(ele0[0][3] * 0.9) \
														
 
															+                                       <= title_number_bbox[3] + int(3 * single_bbox_width_height[1])
														
 
															+                            row_box = {}
														
 
															+                            if pattern1 and pattern2:
														
 
															+                                row_box['title_number'] = ele1
														
 
															+                                row_box['row_box'] = ele0
														
 
															+                                row_box_.append(row_box)
														
 
															+                                index_list.append(index0)
														
 
															+                # print(index_list)
														
 
															                 index_list = sorted(list(set(index_list)))
														
 
															                 index0 = list(set([i for i in range(0, row_and_col[0])]) - set(index_list))  # lack index
														
 
															                 number0 = choice_m_s['number']
														
@@ -512,7 +805,11 @@ def get_title_number(choice_bbox, choice_region, choice_m_box_dict, direction):
 
															                 choice_m_s.update({'title_number': new_number_list})
														
 
															                 all_list_new.append(choice_m_s)
														
 
															             except Exception as e:
														
 
															+                number0 = choice_m_s['number']
														
 
															+                new_number_list = utils.infer_number(number0)
														
 
															+                choice_m_s.update({'title_number': new_number_list})
														
 
															                 all_list_new.append(choice_m_s)
														
 
															+
														
 
															     # print(all_list_new)
														
 
															     title_number_by_choice_m_list = []     # sort change coordinate
														
 
															     for index, single_choice_m in enumerate(all_list_new):
														
@@ -536,4 +833,23 @@ def get_title_number(choice_bbox, choice_region, choice_m_box_dict, direction):
 
															         single_choice_m.pop('s_box_w_h')
														
 
															         single_choice_m.pop('title_number')
														
 
															         title_number_by_choice_m_list.append(single_choice_m)
														
 
															-    return title_number_by_choice_m_list
														
 
															+    # print(title_number_by_choice_m_list)
														
 
															+
														
 
															+    # Chinese number and value    11 (3 fen)
														
 
															+    if subject == 'chinese' or subject == 'chinese_blank':
														
 
															+        title_number_by_choice_m_list_tmp = title_number_by_choice_m_list.copy()
														
 
															+        number_list_all = [ele['number'] for ele in title_number_by_choice_m_list_tmp if ele['number']]
														
 
															+        number_list_all_ = [ele1 for ele in number_list_all for ele1 in ele]
														
 
															+        number_tmp = list(set(number_list_all_))
														
 
															+        if len(number_tmp) == 1 and number_tmp[0] == -1:
														
 
															+            try:
														
 
															+                number_by_choice_m_list = get_chinese_choice_number(title_number_by_choice_m_list_tmp, image)
														
 
															+                return number_by_choice_m_list
														
 
															+            except Exception as e:
														
 
															+                print('Chinses number and value error, please check')
														
 
															+                return title_number_by_choice_m_list
														
 
															+        else:
														
 
															+            return title_number_by_choice_m_list
														
 
															+
														
 
															+    else:
														
 
															+        return title_number_by_choice_m_list
														
--- a/segment/sheet_resolve/analysis/correct/register_once_mbq_recursive_by_page.py
+++ b/segment/sheet_resolve/analysis/correct/register_once_mbq_recursive_by_page.py
@@ -0,0 +1,637 @@
 
															+# @Author  : lightXu
														
 
															+# @File    : register_once_mbq_recursive_by_page.py
														
 
															+# @Time    : 2019/8/8 0008 上午 10:25
														
 
															+import argparse
														
 
															+import time
														
 
															+from os import path as os_path, makedirs
														
 
															+import math
														
 
															+import cv2  # VERSION <=3.3
														
 
															+import numpy as np
														
 
															+from PIL import Image
														
 
															+from pywt import wavedec2, waverec2
														
 
															+
														
 
															+REGISTER_RIGHT_HIGH = 0.85
														
 
															+REGISTER_RIGHT_LOW = 0.5
														
 
															+RECURSIVE_EPSILON = 0.02
														
 
															+STD_DIFF = 5.0
														
 
															+FIXED_MAX_LENGTH = 800
														
 
															+CLIP_RATIO = 0.25
														
 
															+WEIGHT_GLOBAL = 0.1
														
 
															+WEIGHT_CORNER = 0.9
														
 
															+SINGLE_GLOBAL = SINGLE_CORNER = 0.92
														
 
															+NEED_FLIP = True
														
 
															+MATCH_PIX = 10
														
 
															+L_W_RATIO = 0.2
														
 
															+RATIO = 0.7
														
 
															+RECURSIVE_RATIO = 1.0
														
 
															+
														
 
															+
														
 
															+def _binary_array_to_hex(arr):
														
 
															+    """
														
 
															+    internal function to make a hex string out of a binary array.
														
 
															+    """
														
 
															+    bit_string = ''.join(str(b) for b in 1 * arr.flatten())
														
 
															+    width = int(np.ceil(len(bit_string) / 4))
														
 
															+    return '{:0>{width}x}'.format(int(bit_string, 2), width=width)
														
 
															+
														
 
															+
														
 
															+class ImageHash(object):
														
 
															+    """
														
 
															+    Hash encapsulation. Can be used for dictionary keys and comparisons.
														
 
															+    """
														
 
															+
														
 
															+    def __init__(self, binary_array):
														
 
															+        self.hash = binary_array
														
 
															+
														
 
															+    def __str__(self):
														
 
															+        return _binary_array_to_hex(self.hash.flatten())
														
 
															+
														
 
															+    def __repr__(self):
														
 
															+        return repr(self.hash)
														
 
															+
														
 
															+    def __sub__(self, other):
														
 
															+        if other is None:
														
 
															+            raise TypeError('Other hash must not be None.')
														
 
															+        if self.hash.size != other.hash.size:
														
 
															+            raise TypeError('ImageHashes must be of the same shape.', self.hash.shape, other.hash.shape)
														
 
															+        return np.count_nonzero(self.hash.flatten() != other.hash.flatten())
														
 
															+
														
 
															+    def __eq__(self, other):
														
 
															+        if other is None:
														
 
															+            return False
														
 
															+        return np.array_equal(self.hash.flatten(), other.hash.flatten())
														
 
															+
														
 
															+    def __ne__(self, other):
														
 
															+        if other is None:
														
 
															+            return False
														
 
															+        return not np.array_equal(self.hash.flatten(), other.hash.flatten())
														
 
															+
														
 
															+    def __hash__(self):
														
 
															+        # this returns a 8 bit integer, intentionally shortening the information
														
 
															+        return sum([2 ** (i % 8) for i, v in enumerate(self.hash.flatten()) if v])
														
 
															+
														
 
															+
														
 
															+def whash(image, hash_size=8, image_scale=None, mode='haar', remove_max_haar_ll=True):
														
 
															+    if image_scale is not None:
														
 
															+        assert image_scale & (image_scale - 1) == 0, "image_scale is not power of 2"
														
 
															+    else:
														
 
															+        image_natural_scale = 2 ** int(np.log2(min(image.size)))
														
 
															+        image_scale = max(image_natural_scale, hash_size)
														
 
															+
														
 
															+    ll_max_level = int(np.log2(image_scale))
														
 
															+
														
 
															+    level = int(np.log2(hash_size))
														
 
															+    assert hash_size & (hash_size - 1) == 0, "hash_size is not power of 2"
														
 
															+    assert level <= ll_max_level, "hash_size in a wrong range"
														
 
															+    dwt_level = ll_max_level - level
														
 
															+
														
 
															+    image = image.resize((image_scale, image_scale), Image.ANTIALIAS)
														
 
															+    pixels = np.asarray(image) / 255
														
 
															+
														
 
															+    # Remove low level frequency LL(max_ll) if @remove_max_haar_ll using haar filter
														
 
															+    if remove_max_haar_ll:
														
 
															+        coeffs = wavedec2(pixels, 'haar', level=ll_max_level)
														
 
															+        coeffs = list(coeffs)
														
 
															+        coeffs[0] *= 0
														
 
															+        pixels = waverec2(coeffs, 'haar')
														
 
															+
														
 
															+    # Use LL(K) as freq, where K is log2(@hash_size)
														
 
															+    coeffs = wavedec2(pixels, mode, level=dwt_level)
														
 
															+    dwt_low = coeffs[0]
														
 
															+
														
 
															+    # Substract median and compute hash
														
 
															+    med = np.median(dwt_low)
														
 
															+    diff = dwt_low > med
														
 
															+    return ImageHash(diff)
														
 
															+
														
 
															+
														
 
															+def phash(image, hash_size=8, highfreq_factor=4):
														
 
															+    if hash_size < 2:
														
 
															+        raise ValueError("Hash size must be greater than or equal to 2")
														
 
															+
														
 
															+    img_size = hash_size * highfreq_factor
														
 
															+    image = image.resize((img_size, img_size), Image.ANTIALIAS)
														
 
															+    pixels = np.asarray(image)
														
 
															+    dct = cv2.dct(pixels.astype(np.float))
														
 
															+    dctlowfreq = dct[:hash_size, :hash_size]
														
 
															+    med = np.median(dctlowfreq)
														
 
															+    diff = dctlowfreq > med
														
 
															+    return ImageHash(diff)
														
 
															+
														
 
															+
														
 
															+def dhash(image, hash_size=8):
														
 
															+    # resize(w, h), but numpy.array((h, w))
														
 
															+    if hash_size < 2:
														
 
															+        raise ValueError("Hash size must be greater than or equal to 2")
														
 
															+
														
 
															+    image = image.resize((hash_size + 1, hash_size), Image.ANTIALIAS)
														
 
															+    pixels = np.asarray(image)
														
 
															+    # compute differences between columns
														
 
															+    diff = pixels[:, 1:] > pixels[:, :-1]
														
 
															+    return ImageHash(diff)
														
 
															+
														
 
															+
														
 
															+def average_hash(image, hash_size=8):
														
 
															+    if hash_size < 2:
														
 
															+        raise ValueError("Hash size must be greater than or equal to 2")
														
 
															+
														
 
															+    # reduce size and complexity, then covert to grayscale
														
 
															+    image = image.resize((hash_size, hash_size), Image.ANTIALIAS)
														
 
															+
														
 
															+    # find average pixel value; 'pixels' is an array of the pixel values, ranging from 0 (black) to 255 (white)
														
 
															+    pixels = np.asarray(image)
														
 
															+    avg = pixels.mean()
														
 
															+
														
 
															+    # create string of bits
														
 
															+    diff = pixels > avg
														
 
															+    # make a hash
														
 
															+    return ImageHash(diff)
														
 
															+
														
 
															+
														
 
															+def image_hash(image):
														
 
															+    image = Image.fromarray(image)
														
 
															+    hash_size = 10
														
 
															+    dhash_code = dhash(image, hash_size=hash_size)
														
 
															+    # ahash_code = average_hash(image, hash_size=hash_size)
														
 
															+    phash_code = phash(image, hash_size=hash_size, highfreq_factor=4)
														
 
															+    hash_code = whash(image, image_scale=64, hash_size=8, mode='db4')
														
 
															+    return hash_code, dhash_code, phash_code
														
 
															+
														
 
															+
														
 
															+def hash_similarity(hash_as_t, hash_to_regi):
														
 
															+    similarity = 1 - (hash_as_t - hash_to_regi) / len(hash_as_t.hash) ** 2  # 相似性
														
 
															+    return similarity
														
 
															+
														
 
															+
														
 
															+def hash_detection(t_image, image_to_regi):
														
 
															+    # t_hash = image_hash(t_image)
														
 
															+    # r_hash = image_hash(image_to_regi)
														
 
															+
														
 
															+    [t_hash, tdh, tph] = image_hash(t_image)
														
 
															+    [r_hash, rdh, rph] = image_hash(image_to_regi)
														
 
															+    simi = hash_similarity(tdh, rdh)
														
 
															+    # simi = hash_similarity(t_hash, r_hash)
														
 
															+
														
 
															+    evidence = [hash_similarity(t_hash, r_hash),
														
 
															+                hash_similarity(tdh, rdh),
														
 
															+                hash_similarity(tph, rph)]
														
 
															+    return simi, evidence
														
 
															+
														
 
															+
														
 
															+def read_single_img(img_path):
														
 
															+    try:
														
 
															+        im = cv2.imdecode(np.fromfile(img_path, dtype=np.uint8), -1)
														
 
															+        # im = np.asarray(Image.open(img_path).convert('L'))
														
 
															+        # im = np.asarray(Image.open(img_path))
														
 
															+        # im = cv2.cvtColor(im, cv2.COLOR_BGR2GRAY)
														
 
															+        # im = im[:, :, 0]
														
 
															+        if len(im.shape) == 3:
														
 
															+            im = cv2.cvtColor(im, cv2.COLOR_BGR2GRAY)
														
 
															+    except FileNotFoundError as e:
														
 
															+        raise e
														
 
															+    return im
														
 
															+
														
 
															+
														
 
															+def write_single_img(dst, save_path):
														
 
															+    try:
														
 
															+        # cv2.imencode('.jpg', dst)[1].tofile(save_path)
														
 
															+        save_img = Image.fromarray(dst)
														
 
															+        save_img.save(save_path)
														
 
															+    except FileNotFoundError as e:
														
 
															+        raise e
														
 
															+
														
 
															+
														
 
															+def resize_by_percent(im, percent):
														
 
															+    height = im.shape[0]
														
 
															+    width = im.shape[1]
														
 
															+    new_x = int(width * percent)
														
 
															+    new_y = int(height * percent)
														
 
															+    res = cv2.resize(im, (new_x, new_y), interpolation=cv2.INTER_AREA)
														
 
															+    return res
														
 
															+
														
 
															+
														
 
															+def resize_by_fixed_size(im, new_x, new_y):
														
 
															+    res = cv2.resize(im, (new_x, new_y), interpolation=cv2.INTER_AREA)
														
 
															+    return res
														
 
															+
														
 
															+
														
 
															+def image_flip(image, angle='90'):
														
 
															+    rotate_code = {"90": Image.ROTATE_90, "180": Image.ROTATE_180, "270": Image.ROTATE_270, }  # 逆时针
														
 
															+    if str(angle) != "0":
														
 
															+        img = ''
														
 
															+        if 'PIL' not in str(type(image)):
														
 
															+            img = Image.fromarray(image)
														
 
															+        rotate_img = img.transpose(rotate_code[str(angle)])  # 翻转
														
 
															+        cv2_img_tmp = np.asarray(rotate_img)
														
 
															+        if len(cv2_img_tmp.shape) > 2:
														
 
															+            cv2_img = cv2.cvtColor(cv2_img_tmp, cv2.COLOR_RGB2BGR)
														
 
															+        else:
														
 
															+            cv2_img = cv2_img_tmp
														
 
															+    else:
														
 
															+        cv2_img = image
														
 
															+
														
 
															+    return cv2_img
														
 
															+
														
 
															+
														
 
															+def get_corners_of_image(image, clip_ratio=0.25):
														
 
															+    t_x, t_y = image.shape[1], image.shape[0]
														
 
															+    clip_x = int(t_x * clip_ratio)
														
 
															+    clip_y = int(t_y * clip_ratio)
														
 
															+    y_del_list = [ele for ele in range(clip_y, t_y - clip_y)]
														
 
															+    x_del_list = [ele for ele in range(clip_x, t_x - clip_x)]
														
 
															+
														
 
															+    t_corner_array = np.delete(image, y_del_list, axis=0)
														
 
															+    t_corner_array = np.delete(t_corner_array, x_del_list, axis=1)
														
 
															+
														
 
															+    return t_corner_array
														
 
															+
														
 
															+
														
 
															+# def sift_kp(image):
														
 
															+#     sift = cv2.xfeatures2d.SIFT_create()
														
 
															+#     # sift = cv2.xfeatures2d.SURF_create()
														
 
															+#     kp, des = sift.detectAndCompute(image, None)
														
 
															+#     return kp, des
														
 
															+
														
 
															+
														
 
															+def sift_kp(image):
														
 
															+    fast = cv2.FastFeatureDetector_create(threshold=35)
														
 
															+    kp = fast.detect(image, None)
														
 
															+    dsp = cv2.xfeatures2d.BriefDescriptorExtractor_create()
														
 
															+    kp, des = dsp.compute(image, kp)
														
 
															+    return kp, des
														
 
															+
														
 
															+
														
 
															+def get_good_match(des1, des2):
														
 
															+    bf = cv2.BFMatcher()
														
 
															+    matches = bf.knnMatch(des1, des2, k=2)  # des1为模板图，des2为匹配图
														
 
															+    for ele in matches:
														
 
															+        if ele[1].distance == 0:
														
 
															+            ele[1].distance = 0.001
														
 
															+    matches = sorted(matches, key=lambda x: x[0].distance / x[1].distance)
														
 
															+    good = []
														
 
															+    for m, n in matches:
														
 
															+        if m.distance < 0.75 * n.distance:
														
 
															+            good.append(m)
														
 
															+    return good
														
 
															+
														
 
															+
														
 
															+def transform_mtx_from_points(template_points, regi_points):
														
 
															+    points1 = np.float64(np.matrix([[point[0], point[1]] for point in template_points]))
														
 
															+    points2 = np.float64(np.matrix([[point[0], point[1]] for point in regi_points]))
														
 
															+
														
 
															+    c1 = np.mean(points1, axis=0)
														
 
															+    c2 = np.mean(points2, axis=0)
														
 
															+    points1 -= c1
														
 
															+    points2 -= c2
														
 
															+    s1 = np.std(points1)
														
 
															+    s2 = np.std(points2)
														
 
															+    points1 /= s1
														
 
															+    points2 /= s2
														
 
															+    U, S, Vt = np.linalg.svd(points1.T * points2)
														
 
															+    R = (U * Vt).T
														
 
															+    return np.vstack([np.hstack(((s2 / s1) * R, c2.T - (s2 / s1) * R * c1.T)), np.array([0., 0., 1.])])
														
 
															+
														
 
															+
														
 
															+def sift_transform_mtx_by_match(good_match, t_kp, r_kp, ratio=1):
														
 
															+    # x_ratio != y_ratio may cause bias
														
 
															+    x_ratio = y_ratio = 1 / ratio
														
 
															+    transform_mtx = np.ones((3, 3))
														
 
															+    if len(good_match) > 4:
														
 
															+        ratio_array = np.array([x_ratio, y_ratio])
														
 
															+        t_pts = np.float32([t_kp[m.queryIdx].pt for m in good_match])
														
 
															+        r_pts = np.float32([r_kp[m.trainIdx].pt for m in good_match])
														
 
															+
														
 
															+        t_pts = (t_pts * ratio_array)
														
 
															+        r_pts = (r_pts * ratio_array)
														
 
															+        pts_t_pers = (t_pts * ratio_array).reshape(-1, 1, 2)
														
 
															+        pts_r_pers = (r_pts * ratio_array).reshape(-1, 1, 2)
														
 
															+        _, status_array = cv2.findHomography(pts_t_pers, pts_r_pers, cv2.RANSAC, ransacReprojThreshold=4)
														
 
															+
														
 
															+        status_arr = status_array.reshape(-1)
														
 
															+        idx = np.where(status_arr >= 1)
														
 
															+
														
 
															+        t_points = np.float32(t_pts[idx])
														
 
															+        r_points = np.float32(r_pts[idx])
														
 
															+        transform_mtx = transform_mtx_from_points(t_points, r_points)
														
 
															+    return transform_mtx
														
 
															+
														
 
															+
														
 
															+def perspective(regi_img, mtx):
														
 
															+    width, height = regi_img.shape[1], regi_img.shape[0]
														
 
															+    # img_out = cv2.warpPerspective(raw_img_r, mtx, (width, height),
														
 
															+    #                               flags=cv2.INTER_AREA + cv2.WARP_INVERSE_MAP, borderValue=(255, 255, 255))
														
 
															+
														
 
															+    img_out = cv2.warpAffine(regi_img, mtx[:2], (width, height), flags=cv2.INTER_AREA + cv2.WARP_INVERSE_MAP,
														
 
															+                             borderValue=(255, 255, 255))
														
 
															+    return img_out
														
 
															+
														
 
															+
														
 
															+def pre_process(t_image_path_list, r_img_path):
														
 
															+    flip_degree = 0
														
 
															+    t_image_tmp = read_single_img(t_image_path_list[0])
														
 
															+    t_y, t_x = t_image_tmp.shape[0], t_image_tmp.shape[1]
														
 
															+    regi_image = read_single_img(r_img_path)
														
 
															+    r_y, r_x = regi_image.shape[0], regi_image.shape[1]
														
 
															+
														
 
															+    if (r_y - r_x) * (t_y - t_x) < 0:
														
 
															+        regi_image = image_flip(regi_image, "90")
														
 
															+        r_y, r_x = r_x, r_y
														
 
															+        flip_degree = 90
														
 
															+
														
 
															+    n_x, n_y = t_x, t_y
														
 
															+    if (r_y / r_x) != (t_y / t_x):
														
 
															+        # if abs(int(r_y * t_x / t_y - r_x)) > MATCH_PIX:
														
 
															+        #     raise ValueError("source image_shape(height/width) is not identical to register image_shape with 10+ "
														
 
															+        #                      "pixels.")
														
 
															+
														
 
															+        if abs(max(r_y, r_x) / min(r_y, r_x) - max(t_y, t_x) / min(t_y, t_x)) > L_W_RATIO:
														
 
															+            raise ValueError("template image shape is not identical to register image shape.")
														
 
															+        else:
														
 
															+            if r_y > t_y:  # resize regi_image
														
 
															+                regi_image = resize_by_fixed_size(regi_image, t_x, t_y)
														
 
															+                n_x, n_y = t_x, t_y
														
 
															+
														
 
															+            if r_y < t_y:
														
 
															+                # t_norm_ratio = r_y / t_y
														
 
															+                t_image_tmp = resize_by_fixed_size(t_image_tmp, r_x, r_y)
														
 
															+                n_x, n_y = r_x, r_y
														
 
															+
														
 
															+    return (n_y, n_x), regi_image, t_image_tmp, flip_degree
														
 
															+
														
 
															+
														
 
															+# def pre_process(t_image_path_list, r_img_path):
														
 
															+#     flip_degree = 0
														
 
															+#     t_image_tmp = read_single_img(t_image_path_list[0])
														
 
															+#     t_y, t_x = t_image_tmp.shape[0], t_image_tmp.shape[1]
														
 
															+#     regi_image = read_single_img(r_img_path)
														
 
															+#     r_y, r_x = regi_image.shape[0], regi_image.shape[1]
														
 
															+#
														
 
															+#     if abs(max(r_y, r_x) / min(r_y, r_x) - max(t_y, t_x) / min(t_y, t_x)) > L_W_RATIO:
														
 
															+#         raise ValueError("template image shape is not identical to register image shape.")
														
 
															+#
														
 
															+#     if (r_y - r_x) * (t_y - t_x) < 0:
														
 
															+#         regi_image = image_flip(regi_image, "90")
														
 
															+#         r_y, r_x = r_x, r_y
														
 
															+#         flip_degree = 90
														
 
															+#
														
 
															+#     n_x, n_y = t_x, t_y
														
 
															+#
														
 
															+#     if t_y*t_x == r_y*r_x:
														
 
															+#         if (t_y, t_x) != (r_y, r_x):
														
 
															+#             regi_image = resize_by_fixed_size(regi_image, t_x, t_y)
														
 
															+#     else:
														
 
															+#         regi_image = resize_by_fixed_size(regi_image, t_x, t_y)
														
 
															+#
														
 
															+#     return (n_y, n_x), regi_image, t_image_tmp, flip_degree
														
 
															+
														
 
															+
														
 
															+def ds_evidence(evid_list):
														
 
															+    evid_array = np.array(evid_list)
														
 
															+    evid_normed = evid_array / evid_array.sum(axis=0)
														
 
															+
														
 
															+    k = 0
														
 
															+    p = []
														
 
															+    for single in evid_normed:
														
 
															+        product_tmp = 1
														
 
															+        for ele in single:
														
 
															+            product_tmp = product_tmp * ele
														
 
															+        p.append(product_tmp)
														
 
															+        k = k + product_tmp
														
 
															+
														
 
															+    p = [ele / k for ele in p]
														
 
															+
														
 
															+    return p
														
 
															+
														
 
															+
														
 
															+def recursive_regi(save, template_list, r_image_path, max_length, old_similarity,
														
 
															+                   norm_row, norm_col, regi_image, t_image_0, flip_degree):
														
 
															+    degree_dict = {0: 0, 90: 1, 180: 2, 270: 3}
														
 
															+    raw_name = r_image_path.replace('/', '\\').split('\\')[-1]
														
 
															+
														
 
															+    resize_ratio = min(round(max_length / max(norm_row, norm_col), 2), 1)
														
 
															+    print('resize_ratio', resize_ratio)
														
 
															+    max_simi_index, similarity_dict, std, registered_image, r_flip_degree = run(template_list, raw_name,
														
 
															+                                                                                norm_row, norm_col, resize_ratio,
														
 
															+                                                                                regi_image, t_image_0, flip_degree,
														
 
															+                                                                                need_flip=NEED_FLIP)
														
 
															+
														
 
															+    similarity = round(similarity_dict['weight'], 2)
														
 
															+    g_simi = round(similarity_dict['global'], 2)
														
 
															+    c_simi = round(similarity_dict['corner'], 2)
														
 
															+
														
 
															+    cond1 = similarity >= REGISTER_RIGHT_HIGH  # 权重相似图上阈值， 超过就达标
														
 
															+    cond2 = g_simi >= SINGLE_GLOBAL  # 全局相似度上阈值， 超过就达标
														
 
															+    cond3 = c_simi >= SINGLE_CORNER  # 局部相似度上阈值，超过就达标
														
 
															+    cond4 = abs(old_similarity - similarity) <= RECURSIVE_EPSILON  # 两次校准相似度偏差，是否小于RECURSIVE_EPSILON
														
 
															+    cond5 = similarity > REGISTER_RIGHT_LOW  # 权重相似度是否大于相似度下限
														
 
															+    cond6 = abs(std) < STD_DIFF  # 方差阈值， 小于达标
														
 
															+    cond7 = similarity <= REGISTER_RIGHT_LOW  # 权重相似度下限，小于下限不达标
														
 
															+
														
 
															+    regi_flag = (cond6 and (cond1 or cond2 or cond3)) or (cond4 and cond5)
														
 
															+
														
 
															+    if resize_ratio >= RECURSIVE_RATIO:
														
 
															+        if regi_flag:
														
 
															+            degree_flag = degree_dict[r_flip_degree]
														
 
															+            save_path = os_path.join(save, raw_name.replace('.jpg',
														
 
															+                                                            '_index_{:02d}_{}.jpg'
														
 
															+                                                            .format(max_simi_index, degree_flag)))
														
 
															+            save_img = Image.fromarray(registered_image)
														
 
															+            save_img.save(save_path)
														
 
															+            write_single_img(registered_image, save_path)
														
 
															+            print('{} >>> {}'.format(r_image_path, save_path))
														
 
															+            return max_simi_index, save_path
														
 
															+        else:
														
 
															+            print('recursion and failed')
														
 
															+            return -1, ''
														
 
															+    else:
														
 
															+        if regi_flag:
														
 
															+            degree_flag = degree_dict[r_flip_degree]
														
 
															+            save_path = os_path.join(save, raw_name.replace('.jpg',
														
 
															+                                                            '_index_{:02d}_{}.jpg'
														
 
															+                                                            .format(max_simi_index, degree_flag)))
														
 
															+            write_single_img(registered_image, save_path)
														
 
															+            print('{} >>> {}'.format(r_image_path, save_path))
														
 
															+            return max_simi_index, save_path
														
 
															+        else:
														
 
															+            if cond7:
														
 
															+                print('not register')
														
 
															+                return -1, ''
														
 
															+            print('recursion')
														
 
															+            max_length = max_length + int(max_length * 0.5)
														
 
															+            return recursive_regi(save, template_list, r_image_path, max_length, similarity,
														
 
															+                                  norm_row, norm_col, regi_image, t_image_0, flip_degree)
														
 
															+
														
 
															+
														
 
															+def run(t_image_path_list, raw_name, norm_row, norm_col, resize_ratio, regi_image, t_img_0, flip_degree, need_flip):
														
 
															+    opencv_r_img_resize = resize_by_percent(regi_image, resize_ratio)
														
 
															+
														
 
															+    match_len = []
														
 
															+    evid_list = []
														
 
															+
														
 
															+    t_length = len(t_image_path_list)
														
 
															+    opencv_t_img_resize_0 = resize_by_percent(t_img_0, resize_ratio)
														
 
															+
														
 
															+    t_h, t_w = opencv_t_img_resize_0.shape[0], opencv_t_img_resize_0.shape[1]
														
 
															+
														
 
															+    array_dim = t_length
														
 
															+    if need_flip:
														
 
															+        t_image_array = np.zeros((t_h, t_w, 1 + t_length * 2), dtype=np.uint8)
														
 
															+        array_dim = t_length * 2
														
 
															+    else:
														
 
															+        t_image_array = np.zeros((t_h, t_w, 1 + t_length), dtype=np.uint8)
														
 
															+
														
 
															+    for index, ele in enumerate(t_image_path_list):
														
 
															+        if index == 0:
														
 
															+            opencv_t_img_resize = opencv_t_img_resize_0
														
 
															+        else:
														
 
															+            norm_t_img = resize_by_fixed_size(read_single_img(ele), norm_col, norm_row)
														
 
															+            opencv_t_img_resize = resize_by_percent(norm_t_img, resize_ratio)
														
 
															+
														
 
															+        t_image_array[:, :, index] = opencv_t_img_resize
														
 
															+        if need_flip:
														
 
															+            flip_image = np.flipud(np.fliplr(opencv_t_img_resize))
														
 
															+            t_image_array[:, :, index + t_length] = flip_image
														
 
															+
														
 
															+    t_image_array[:, :, -1] = opencv_r_img_resize
														
 
															+    t_corner_array = get_corners_of_image(t_image_array, CLIP_RATIO)
														
 
															+    r_corners = t_corner_array[:, :, -1]
														
 
															+
														
 
															+    for index in range(0, array_dim):
														
 
															+        similarity_corner, evidence_c = hash_detection(t_corner_array[:, :, index], r_corners)
														
 
															+        similarity_global, evidence_g = hash_detection(t_image_array[:, :, index], opencv_r_img_resize)
														
 
															+        evid_list.append(evidence_c + evidence_g)
														
 
															+
														
 
															+        print('  t-{}, corner:  whash: {:.4f}, dhash: {:.4f},  phash: {:.4f}'
														
 
															+              .format(index,
														
 
															+                      evidence_c[0],
														
 
															+                      evidence_c[1],
														
 
															+                      evidence_c[2],
														
 
															+                      ))
														
 
															+        print('       global:  whash: {:.4f}, dhash: {:.4f},  phash: {:.4f}'
														
 
															+              .format(evidence_g[0],
														
 
															+                      evidence_g[1],
														
 
															+                      evidence_g[2],
														
 
															+                      ))
														
 
															+
														
 
															+    p_list = ds_evidence(evid_list)
														
 
															+
														
 
															+    p_list_str = ', '.join(['page_{}: {:.4f}'.format(index, p) for index, p in enumerate(p_list)])
														
 
															+    print(p_list_str)
														
 
															+
														
 
															+    if need_flip:
														
 
															+        max_index = p_list.index(max(p_list))
														
 
															+        half_len = t_length
														
 
															+        if max_index >= half_len != 0:
														
 
															+            max_index = max_index - half_len
														
 
															+            opencv_r_img_resize = image_flip(opencv_r_img_resize, '180')
														
 
															+            regi_image = image_flip(regi_image, '180')
														
 
															+            r_kp, r_des = sift_kp(opencv_r_img_resize)
														
 
															+            flip_degree = flip_degree + 180
														
 
															+        else:
														
 
															+            r_kp, r_des = sift_kp(opencv_r_img_resize)
														
 
															+    else:
														
 
															+        max_index = p_list.index(max(p_list))
														
 
															+        r_kp, r_des = sift_kp(opencv_r_img_resize)
														
 
															+
														
 
															+    print('max_index: ', max_index)
														
 
															+
														
 
															+    t_kp, t_des = sift_kp(t_image_array[:, :, max_index])
														
 
															+    match_points = get_good_match(t_des, r_des)
														
 
															+    match_len.append(len(match_points))
														
 
															+    try:
														
 
															+        transform_mtx = sift_transform_mtx_by_match(match_points, t_kp, r_kp, resize_ratio)
														
 
															+    except Exception as e:
														
 
															+        print(e)
														
 
															+        transform_mtx = None
														
 
															+    # print(transform_mtx)
														
 
															+    if transform_mtx is not None:
														
 
															+        registered_image = perspective(regi_image, transform_mtx)
														
 
															+
														
 
															+        r_corners = get_corners_of_image(registered_image, CLIP_RATIO)
														
 
															+        raw_corners = get_corners_of_image(regi_image, CLIP_RATIO)
														
 
															+        simi_corner = hash_similarity(dhash(Image.fromarray(r_corners), hash_size=10),
														
 
															+                                      dhash(Image.fromarray(raw_corners), hash_size=10))
														
 
															+        simi_global = hash_similarity(dhash(Image.fromarray(registered_image), hash_size=10),
														
 
															+                                      dhash(Image.fromarray(regi_image), hash_size=10))
														
 
															+
														
 
															+        std0 = np.std(resize_by_percent(regi_image, resize_ratio))
														
 
															+        std1 = np.std(resize_by_percent(registered_image, resize_ratio))
														
 
															+        std_dif = abs(std0 - std1)
														
 
															+        print('std0: {:.4f}, std1: {:.4f}, diff: {:.4f}'.format(std0, std1, std_dif))
														
 
															+        # std_dif = 0
														
 
															+
														
 
															+        similarity = WEIGHT_GLOBAL * simi_global + WEIGHT_CORNER * simi_corner  # 校准图与原图比较
														
 
															+        print('simi_global: {:.4f}, simi_corner: {:.4f}'.format(simi_global, simi_corner))
														
 
															+        print('weight_similarity: {:.4f}\n'.format(similarity))
														
 
															+
														
 
															+        simi_dict = {'global': simi_global, 'corner': simi_corner, 'weight': similarity}
														
 
															+        return max_index, simi_dict, std_dif, registered_image, flip_degree
														
 
															+
														
 
															+    else:
														
 
															+        raise ValueError('{} failed to find transform matrix'.format(raw_name))
														
 
															+
														
 
															+
														
 
															+if __name__ == '__main__':
														
 
															+    t1 = time.time()
														
 
															+    parser = argparse.ArgumentParser(description="your script description")  # --help
														
 
															+    parser.add_argument('--image_path', '-i', help='register image_path')
														
 
															+    parser.add_argument('--save_path', '-s', help='register save_path')
														
 
															+    parser.add_argument('--template_path', '-t', help='template_path')
														
 
															+    # description参数可以用于插入描述脚本用途的信息，可以为空
														
 
															+
														
 
															+    args = parser.parse_args()  # 将变量以标签-值的字典形式存入args字典
														
 
															+
														
 
															+    # regi_image_path = args.image_path
														
 
															+    # save_dir = args.save_path
														
 
															+    # template_path_list = args.template_path.split(',')
														
 
															+    # template_path_list = [ele.strip() for ele in template_path_list]
														
 
															+
														
 
															+    regi_image_path = r'C:\Users\Administrator\Desktop\error_imgs\201909061745_0001.jpg'
														
 
															+    save_dir = r'C:\Users\Administrator\Desktop\error_imgs\save'
														
 
															+    template_path_list = [r'C:\Users\Administrator\Desktop\error_imgs\10000000.jpg',
														
 
															+                          r'C:\Users\Administrator\Desktop\error_imgs\10000001.jpg',
														
 
															+                          # r'C:\Users\Administrator\Desktop\register_img_2\t\2.jpg',
														
 
															+                          # r'C:\Users\Administrator\Desktop\register_img_2\t\4.jpg'
														
 
															+                          ]
														
 
															+    #
														
 
															+    # # regi_image_path = r'C:\Users\Administrator\Desktop\error_imgs\Page0001.jpg'
														
 
															+    # # save_dir = r'C:\Users\Administrator\Desktop\error_imgs\save'
														
 
															+    # # template_path_list = [r'C:\Users\Administrator\Desktop\error_imgs\201910230723_0001.jpg',
														
 
															+    # #                       # r'C:\Users\Administrator\Desktop\AnalysisRes\t\005983-1.jpg',
														
 
															+    # #                       # r'C:\Users\Administrator\Desktop\AnalysisRes\t\010401.jpg',
														
 
															+    # #                       # r'C:\Users\Administrator\Desktop\AnalysisRes\t\010401-1.jpg'
														
 
															+    # #                       ]
														
 
															+
														
 
															+    template_path_list = [ele.strip() for ele in template_path_list]
														
 
															+
														
 
															+    if not os_path.exists(save_dir):
														
 
															+        makedirs(save_dir)
														
 
															+
														
 
															+    fixed_max_length = FIXED_MAX_LENGTH
														
 
															+
														
 
															+    check = []
														
 
															+    check_file_list = template_path_list
														
 
															+    for ele in check_file_list:
														
 
															+        if os_path.exists(ele):
														
 
															+            check.append(True)
														
 
															+        else:
														
 
															+            check.append(False)
														
 
															+
														
 
															+    if False in check:
														
 
															+        raise ValueError('templates not found, please check the path')
														
 
															+    if not os_path.exists(regi_image_path):
														
 
															+        raise ValueError('{} not found, please check the path'.format(regi_image_path))
														
 
															+
														
 
															+    else:
														
 
															+        try:
														
 
															+            ((norm_y, norm_x),
														
 
															+             raw_regi_image, t_image_index_0, degree) = pre_process(template_path_list, regi_image_path)
														
 
															+
														
 
															+            init_similarity = 0.0
														
 
															+            recursive_regi(save_dir, check_file_list, regi_image_path, fixed_max_length, init_similarity,
														
 
															+                           norm_y, norm_x, raw_regi_image, t_image_index_0, degree)
														
 
															+        except Exception as e:
														
 
															+            print('{} registered failed: {}'.format(regi_image_path, e))
														
 
															+
														
 
															+    t2 = time.time()
														
 
															+    print('time consume: {:.4f}'.format(t2 - t1))
														
--- a/segment/sheet_resolve/analysis/resolve.py
+++ b/segment/sheet_resolve/analysis/resolve.py
@@ -26,6 +26,7 @@ from segment.sheet_resolve.analysis.sheet.sheet_infer import exam_number_adjust_
 
															 from segment.sheet_resolve.tools import utils
														
 
															 from segment.sheet_resolve.tools.tf_settings import xml_template_path, model_dict
														
 
															 from segment.sheet_resolve.tools.utils import create_xml
														
 
															+from segment.sheet_resolve.analysis.sheet.ocr_sheet import ocr2sheet
														
 
															 logger = logging.getLogger(settings.LOGGING_TYPE)
														
@@ -33,6 +34,7 @@ sheet_infer_dict = dict(bar_code=True,
 
															                         choice_m=True,
														
 
															                         exam_number=True,
														
 
															                         common_sheet=False,
														
 
															+                        cloze=True,
														
 
															                         solve=True)
														
 
															 infer_choice_m_flag = False
														
@@ -50,6 +52,7 @@ def sheet(series_number, image_path, image, conf_thresh, mns_thresh, subject, sh
 
															     h, w = image.shape[0], image.shape[1]
														
 
															     regions = sheets_dict['regions']
														
 
															     fetched_class = [ele['class_name'] for ele in regions]
														
 
															+    infer_box_list = []
														
 
															     try:
														
 
															         regions = adjust_item_edge_by_gray_image(image, regions)
														
@@ -87,7 +90,8 @@ def sheet(series_number, image_path, image, conf_thresh, mns_thresh, subject, sh
 
															             if not cond1 and not cond4 and cond2 and ocr:
														
 
															                 exam_number_list = infer_exam_number(image, ocr, regions)
														
 
															-                regions.extend(exam_number_list)
														
 
															+                if len(exam_number_list) > 0:
														
 
															+                    regions.extend(exam_number_list)
														
 
															             image, regions = exam_number_adjust_infer(image, regions)
														
 
															         except Exception as e:
														
@@ -95,12 +99,12 @@ def sheet(series_number, image_path, image, conf_thresh, mns_thresh, subject, sh
 
															             logger.info('试卷：{} 考号推断失败: {}'.format(image_path, e))
														
 
															     if sheet_infer_dict['choice_m']:
														
 
															-
														
 
															         try:
														
 
															             col_split = col_split_x.copy()
														
 
															             if not col_split:
														
 
															                 col_split = [w - 1]
														
 
															-            choice_m_list = infer_choice_m(image, regions, col_split, ocr)
														
 
															+            infer_box_list = ocr2sheet(image, col_split_x, ocr)
														
 
															+            choice_m_list = infer_choice_m(image, regions, infer_box_list, col_split)
														
 
															             if len(choice_m_list) > 0:
														
 
															                 choice_m_old_list = [ele for ele in regions if 'choice_m' == ele['class_name']]
														
 
															                 for infer_box in choice_m_list.copy():
														
@@ -117,7 +121,7 @@ def sheet(series_number, image_path, image, conf_thresh, mns_thresh, subject, sh
 
															                             #     choice_m_list.remove(infer_box)
														
 
															                             regions.remove(tf_box)
														
 
															                             # break
														
 
															-                        elif iou[0] > 0:
														
 
															+                        elif iou[0] > 0.05:
														
 
															                             choice_m_list.remove(infer_box)
														
 
															                             break
														
@@ -132,6 +136,27 @@ def sheet(series_number, image_path, image, conf_thresh, mns_thresh, subject, sh
 
															             traceback.print_exc()
														
 
															             logger.info('试卷：{} 选择题推断失败: {}'.format(image_path, e))
														
 
															+    if sheet_infer_dict['cloze']:
														
 
															+
														
 
															+        cloze_list = []
														
 
															+        for infer_box in infer_box_list:
														
 
															+            # {'loc': [240, 786, 1569, 1368]}
														
 
															+            loc = infer_box['loc']
														
 
															+            xmin, ymin, xmax, ymax = loc[0], loc[1], loc[2], loc[3]
														
 
															+
														
 
															+            for ele in regions:
														
 
															+                if ele['class_name'] in ['cloze_s', 'cloze']:
														
 
															+                    tf_loc = ele['bounding_box']
														
 
															+                    tf_loc_l = tf_loc['xmin']
														
 
															+                    tf_loc_t = tf_loc['ymin']
														
 
															+                    if xmin < tf_loc_l < xmax and ymin < tf_loc_t < ymax:
														
 
															+                        cloze_box = {'class_name': 'cloze',
														
 
															+                                     'bounding_box': {'xmin': xmin, 'ymin': ymin, 'xmax': xmax, 'ymax': ymax}}
														
 
															+                        cloze_list.append(cloze_box)
														
 
															+                        break
														
 
															+
														
 
															+        regions.extend(cloze_list)
														
 
															+
														
 
															     if sheet_infer_dict['solve']:
														
 
															         try:
														
 
															             include_class = ['info_title',
														
@@ -146,7 +171,8 @@ def sheet(series_number, image_path, image, conf_thresh, mns_thresh, subject, sh
 
															                              'composition0',
														
 
															                              'correction',
														
 
															                              'alarm_info',
														
 
															-                             'page'
														
 
															+                             'page',
														
 
															+                             'mark'
														
 
															                              ]
														
 
															             if 'math' not in subject:
														
 
															                 include_class.remove('cloze_s')
														
@@ -285,11 +311,11 @@ def choice_row_col(image, regions, xml_path, conf_thresh, mns_thresh, choice_ses
 
															     return choice_list
														
 
															-def choice_m_row_col(image, regions, xml_path):
														
 
															+def choice_m_row_col(image, regions, subject, xml_path):
														
 
															     choice_m_dict_tf = []
														
 
															     direction_list = []
														
 
															-    for ele in regions:
														
 
															+    for ele in regions:
														
 
															         if ele['class_name'] == 'choice_m':
														
 
															             choice_m_dict_tf.append(ele)
														
 
															         if ele['class_name'] == 'choice_n':
														
@@ -327,7 +353,8 @@ def choice_m_row_col(image, regions, xml_path):
 
															         # else:
														
 
															         #     choice_list = choice_line_box.choice_m_row_col(image, choice_m_dict_tf, xml_path)  # 找选择题行列、分数
														
 
															-        choice_list = choice_line_box.choice_m_row_col(image, choice_m_dict_tf, direction, xml_path)  # 找选择题行列、分数
														
 
															+        choice_list = choice_line_box.choice_m_row_col(image, choice_m_dict_tf, direction, subject,
														
 
															+                                                       xml_path)  # 找选择题行列、分数
														
 
															         tree = ET.parse(xml_path)  # xml tree
														
 
															         for index_num, box in enumerate(choice_list):
														
 
															             if len(box['bounding_box']) > 0:
														
--- a/segment/sheet_resolve/analysis/sheet/analysis_sheet.py
+++ b/segment/sheet_resolve/analysis/sheet/analysis_sheet.py
@@ -14,7 +14,6 @@ from segment.sheet_resolve.lib.utils.timer import Timer
 
															 from segment.sheet_resolve.tools import utils
														
 
															 from segment.sheet_resolve.analysis.solve.optional_solve import resolve_optional_choice
														
 
															-
														
 
															 logger = logging.getLogger(settings.LOGGING_TYPE)
														
@@ -113,6 +112,7 @@ def get_single_image_sheet_regions(analysis_type, img_path, img, classes,
 
															                                            img, conf_thresh, mns_thresh,
														
 
															                                            coordinate_bias_dict)
														
 
															+    analysis_type.replace('_blank', '')
														
 
															     img_dict = {"img_name": img_path,
														
 
															                 # 'qr_code': qr_code_info,
														
 
															                 'subject': analysis_type,
														
@@ -126,6 +126,13 @@ def get_single_image_sheet_regions(analysis_type, img_path, img, classes,
 
															 def question_number_format(init_number, crt_numbers, regions):
														
 
															+    """
														
 
															+    将重复或者是-1的题号改为501
														
 
															+    :param init_number: 初始替换的题号
														
 
															+    :param crt_numbers: 目前已经有的题号
														
 
															+    :param regions: 答题卡各区域
														
 
															+    :return:
														
 
															+    """
														
 
															     logger.info('regions： {}'.format(regions))
														
 
															     for region in regions:
														
 
															         logger.info('region： {}'.format(region))
														
@@ -156,6 +163,34 @@ def question_number_format(init_number, crt_numbers, regions):
 
															     return regions, init_number, crt_numbers
														
 
															+def resolve_select_s(image, bbox):
														
 
															+    box_region = utils.crop_region(image, bbox)
														
 
															+    left = bbox['xmin']
														
 
															+    top = bbox['ymin']
														
 
															+    right = bbox['xmax']
														
 
															+    bottom = bbox['ymax']
														
 
															+
														
 
															+    if (right - left) >= (bottom - top):
														
 
															+        direction = 180
														
 
															+    else:
														
 
															+        direction = 90
														
 
															+
														
 
															+    try:
														
 
															+        res = resolve_optional_choice(left, top, direction, box_region)
														
 
															+    except Exception as e:
														
 
															+        res = {'class_name': 'optional_choice',
														
 
															+               'rows': 1, 'cols': 2,
														
 
															+               'number': [501, 502],
														
 
															+               'single_width': right - left,
														
 
															+               'single_height': bottom - top,
														
 
															+               'bounding_box': {'xmin': left,
														
 
															+                                'ymin': top,
														
 
															+                                'xmax': right,
														
 
															+                                'ymax': bottom}}
														
 
															+
														
 
															+    return res
														
 
															+
														
 
															+
														
 
															 def box_region_format(sheet_dict, image, subject, shrink=True):
														
 
															     include_class = ['anchor_point',
														
 
															                      'bar_code',
														
@@ -172,14 +207,15 @@ def box_region_format(sheet_dict, image, subject, shrink=True):
 
															                      # 'correction'
														
 
															                      ]
														
 
															-    sheet_regions = sheet_dict['regions']
														
 
															-    optional_choice_tmp = []
														
 
															     default_points_dict = {'choice_m': 5, "cloze": 5, 'solve': 12, 'optional_solve': 10, 'cloze_s': 5,
														
 
															                            "composition": 60}
														
 
															-    if subject == "english":
														
 
															-        default_points_dict = {'choice_m': 2, "cloze": 2, 'solve': 2, 'optional_solve': 10, 'cloze_s': 2,
														
 
															+
														
 
															+    if subject in ["english", 'physics', 'chemistry', 'biology', 'science_comprehensive']:
														
 
															+        default_points_dict = {'choice_m': 2, "cloze": 2, 'solve': 10, 'optional_solve': 10, 'cloze_s': 2,
														
 
															                                "composition": 25}
														
 
															+    sheet_regions = sheet_dict['regions']
														
 
															+    select_s_list = []
														
 
															     for i in range(len(sheet_regions) - 1, -1, -1):
														
 
															         if subject == "math":
														
 
															             if sheet_regions[i]['class_name'] == 'cloze':
														
@@ -187,140 +223,174 @@ def box_region_format(sheet_dict, image, subject, shrink=True):
 
															             if sheet_regions[i]['class_name'] == 'cloze_s':
														
 
															                 sheet_regions[i]['class_name'] = 'cloze'  # math exclude cloze big
														
 
															         if subject == "english":
														
 
															-            if sheet_regions[i]['class_name'] == 'solve':
														
 
															-                sheet_regions[i]['class_name'] = 'cloze'
														
 
															+            if sheet_regions[i]['class_name'] == 'cloze':
														
 
															+                sheet_regions[i]['class_name'] = 'solve'
														
 
															             if sheet_regions[i]['class_name'] == 'correction':
														
 
															                 sheet_regions[i]['class_name'] = 'solve'
														
 
															-    for i in range(len(sheet_regions) - 1, -1, -1):
														
 
															         if sheet_regions[i]['class_name'] in ['solve0']:
														
 
															             sheet_regions[i]['class_name'] = 'solve'
														
 
															         if sheet_regions[i]['class_name'] in ['composition0']:
														
 
															             sheet_regions[i]['class_name'] = 'composition'
														
 
															         if sheet_regions[i]['class_name'] == 'select_s':
														
 
															-            # sheet_regions[i]['class_name'] = 'optional_choice'
														
 
															-            # optional_solve_tmp.append(sheet_regions[i])
														
 
															-
														
 
															-            bbox = sheet_regions[i]['bounding_box']
														
 
															-            box_region = utils.crop_region(image, bbox)
														
 
															-            left = bbox['xmin']
														
 
															-            top = bbox['ymin']
														
 
															-            right = bbox['xmax']
														
 
															-            bottom = bbox['ymax']
														
 
															-
														
 
															-            if (right - left) >= (bottom - top):
														
 
															-                direction = 180
														
 
															-            else:
														
 
															-                direction = 90
														
 
															-
														
 
															-            try:
														
 
															-                res = resolve_optional_choice(left, top, direction, box_region)
														
 
															-            except Exception as e:
														
 
															-                res = {'class_name': 'optional_choice',
														
 
															-                       'rows': 1, 'cols': 1,
														
 
															-                       'number': [501],
														
 
															-                       'single_width': right - left,
														
 
															-                       'single_height': bottom - top,
														
 
															-                       'bounding_box': {'xmin': left,
														
 
															-                                        'ymin': top,
														
 
															-                                        'xmax': right,
														
 
															-                                        'ymax': bottom}}
														
 
															-
														
 
															-            optional_choice_tmp.append(res)
														
 
															-
														
 
															-            sheet_regions.pop(i)
														
 
															+            select_s_list.append(sheet_regions[i])
														
 
															         if shrink:
														
 
															             if sheet_regions[i]['class_name'] not in include_class:
														
 
															                 sheet_regions.pop(i)
														
 
															-    for ele in sheet_regions:
														
 
															-        if ele['class_name'] == 'solve':
														
 
															-            solve_box = (ele['bounding_box']['xmin'], ele['bounding_box']['ymin'],
														
 
															-                         ele['bounding_box']['xmax'], ele['bounding_box']['ymax'])
														
 
															-            for optional_choice in optional_choice_tmp:
														
 
															-                optional_choice_box = (optional_choice['bounding_box']['xmin'], optional_choice['bounding_box']['ymin'],
														
 
															-                                       optional_choice['bounding_box']['xmax'], optional_choice['bounding_box']['ymax'])
														
 
															-                if utils.decide_coordinate_contains(optional_choice_box, solve_box):
														
 
															-                    ele['class_name'] = 'optional_solve'
														
 
															-                    choice_numbers = optional_choice['number']
														
 
															-                    solve_points = ele['number']
														
 
															-                    if choice_numbers[0] < 500:
														
 
															-                        ele['number'] = choice_numbers
														
 
															-                        ele['default_points'] = [ele['default_points']] * len(choice_numbers)
														
 
															+    # 去重
														
 
															+    sheet_tmp = sheet_regions.copy()
														
 
															+    remove_index = []
														
 
															+    for i, region in enumerate(sheet_tmp):
														
 
															+        if i not in remove_index:
														
 
															+            box = region['bounding_box']
														
 
															+            name = region['class_name']
														
 
															+            for j, region_in in enumerate(sheet_tmp):
														
 
															+                box_in = region_in['bounding_box']
														
 
															+                name_in = region_in['class_name']
														
 
															+                iou = utils.cal_iou(box, box_in)
														
 
															+
														
 
															+                if name == name_in and (iou[0] > 0.75 or iou[1] > 0.85 or iou[2] > 0.85) and i != j:
														
 
															+                    box_area = (box['xmax'] - box['xmin']) * (box['ymax'] - box['ymin'])
														
 
															+                    box_in_area = (box_in['xmax'] - box_in['xmin']) * (box_in['ymax'] - box_in['ymin'])
														
 
															+
														
 
															+                    if box_area >= box_in_area:
														
 
															+                        sheet_regions.remove(region_in)
														
 
															+                        remove_index.append(j)
														
 
															                     else:
														
 
															-                        ele['number'] = [solve_points] * len(choice_numbers)
														
 
															-                        optional_choice['numbers'] = [solve_points] * len(choice_numbers)
														
 
															-                        ele['default_points'] = [ele['default_points']] * len(choice_numbers)
														
 
															+                        sheet_regions.remove(region)
														
 
															+                        remove_index.append(i)
														
 
															                     break
														
 
															-                else:
														
 
															-                    continue
														
 
															-
														
 
															-        # 设置默认分数
														
 
															-        # if ele['class_name'] == "composition":
														
 
															-        #     if isinstance(ele['default_points'], list):
														
 
															-        #         for i, dp in enumerate(ele['default_points']):
														
 
															-        #             if dp != default_points_dict[ele['class_name']]:
														
 
															-        #                 ele['default_points'][i] = default_points_dict[ele['class_name']]
														
 
															-        #
														
 
															-        #     if isinstance(ele['default_points'], int):
														
 
															-        #         if ele['default_points'] != default_points_dict[ele['class_name']]:
														
 
															-        #             ele['default_points'] = default_points_dict[ele['class_name']]
														
 
															+
														
 
															+    # 合并select_s
														
 
															+    optional_choice_tmp = []
														
 
															+    select_s_list_copy = select_s_list.copy()
														
 
															+    if len(select_s_list) > 0:
														
 
															+        for ele in sheet_regions:
														
 
															+            if ele['class_name'] == 'solve':
														
 
															+                solve_box = (ele['bounding_box']['xmin'], ele['bounding_box']['ymin'],
														
 
															+                             ele['bounding_box']['xmax'], ele['bounding_box']['ymax'])
														
 
															+
														
 
															+                xn, yn, xm, ym = 9999, 9999, 0, 0
														
 
															+                merge = False
														
 
															+                for select_s in select_s_list:
														
 
															+                    select_s_box = (select_s['bounding_box']['xmin'], select_s['bounding_box']['ymin'],
														
 
															+                                    select_s['bounding_box']['xmax'], select_s['bounding_box']['ymax'])
														
 
															+                    if utils.decide_coordinate_contains(select_s_box, solve_box):
														
 
															+                        merge = True
														
 
															+                        xn = min(xn, select_s_box[0])
														
 
															+                        yn = min(yn, select_s_box[1])
														
 
															+                        xm = max(xm, select_s_box[2])
														
 
															+                        ym = max(ym, select_s_box[3])
														
 
															+                        select_s_list_copy.remove(select_s)
														
 
															+
														
 
															+                if merge:
														
 
															+                    new_box = {'xmin': xn, 'ymin': yn, 'xmax': xm, 'ymax': ym}
														
 
															+                    optional_choice_info = resolve_select_s(image, new_box)
														
 
															+                    optional_choice_tmp.append(optional_choice_info)
														
 
															+
														
 
															+    for ele in select_s_list_copy:
														
 
															+        box = ele['bounding_box']
														
 
															+        optional_choice_info = resolve_select_s(image, box)
														
 
															+        optional_choice_tmp.append(optional_choice_info)
														
 
															+
														
 
															+    optional_choice_tmp_ = optional_choice_tmp.copy()
														
 
															+    for ele in sheet_regions:
														
 
															+        if len(optional_choice_tmp) > 0:
														
 
															+            if ele['class_name'] == 'solve':
														
 
															+                solve_box = (ele['bounding_box']['xmin'], ele['bounding_box']['ymin'],
														
 
															+                             ele['bounding_box']['xmax'], ele['bounding_box']['ymax'])
														
 
															+                for optional_choice in optional_choice_tmp_:
														
 
															+                    optional_choice_box = (optional_choice['bounding_box']['xmin'], optional_choice['bounding_box']['ymin'],
														
 
															+                                           optional_choice['bounding_box']['xmax'], optional_choice['bounding_box']['ymax'])
														
 
															+                    if utils.decide_coordinate_contains(optional_choice_box, solve_box):
														
 
															+                        optional_choice_tmp.remove(optional_choice)
														
 
															+                        ele['class_name'] = 'optional_solve'
														
 
															+
														
 
															+                        choice_numbers = optional_choice['number']
														
 
															+                        solve_numbers = ele['number']
														
 
															+                        if choice_numbers[0] < 500:
														
 
															+                            ele['number'] = choice_numbers
														
 
															+                            ele['default_points'] = [ele['default_points']] * len(choice_numbers)
														
 
															+                        else:
														
 
															+                            tmp = [solve_numbers] * len(choice_numbers)
														
 
															+                            for i, num in enumerate(tmp):
														
 
															+                                tmp[i] = num + i
														
 
															+                            ele['number'] = tmp
														
 
															+                            optional_choice['number'] = tmp
														
 
															+                            ele['default_points'] = [ele['default_points']] * len(choice_numbers)
														
 
															+                        break
														
 
															+                    else:
														
 
															+                        continue
														
 
															         if ele['class_name'] in ["choice_m", "cloze", "cloze_s", "solve", "optional_solve", "composition"]:
														
 
															             if isinstance(ele['default_points'], list):
														
 
															                 for i, dp in enumerate(ele['default_points']):
														
 
															-                    if dp <= -1:
														
 
															+                    if dp < 1:  # 小于一分
														
 
															                         ele['default_points'][i] = default_points_dict[ele['class_name']]
														
 
															             if isinstance(ele['default_points'], int) or isinstance(ele['default_points'], float):
														
 
															-                if ele['default_points'] <= -1:
														
 
															+                if ele['default_points'] < 1:  # 小于一分
														
 
															                     ele['default_points'] = default_points_dict[ele['class_name']]
														
 
															-    sheet_regions.extend(optional_choice_tmp)
														
 
															-    # for ele in optional_choice_tmp:  # 选做题
														
 
															-    #     bbox = ele['bounding_box']
														
 
															-    #     box_region = utils.crop_region(image, bbox)
														
 
															-    #     left = bbox['xmin']
														
 
															-    #     top = bbox['ymin']
														
 
															-    #     right = bbox['xmax']
														
 
															-    #     bottom = bbox['ymax']
														
 
															-    #
														
 
															-    #     if (right - left) >= (bottom - top):
														
 
															-    #         direction = 180
														
 
															-    #     else:
														
 
															-    #         direction = 90
														
 
															-    #
														
 
															-    #     # res = find_contours(left, top, box_region)
														
 
															-    #     try:
														
 
															-    #         res = resolve_optional_choice(left, top, direction, box_region)
														
 
															-    #     except Exception as e:
														
 
															-    #         res = {'class_name': 'optional_choice',
														
 
															-    #                'rows': 1, 'cols': 1,
														
 
															-    #                'numbers': [501],
														
 
															-    #                'single_width': right - left,
														
 
															-    #                'single_height': bottom - top,
														
 
															-    #                'bounding_box': {'xmin': left,
														
 
															-    #                                 'ymin': top,
														
 
															-    #                                 'xmax': right,
														
 
															-    #                                 'ymax': bottom}}
														
 
															-    #
														
 
															-    #     sheet_regions.append(res)
														
 
															-
														
 
															-    # iou
														
 
															+    # select_s 在解答区域外侧
														
 
															+    if len(optional_choice_tmp) > 0:
														
 
															+        for oc in optional_choice_tmp:
														
 
															+            optional_choice_box = (oc['bounding_box']['xmin'], oc['bounding_box']['ymin'],
														
 
															+                                   oc['bounding_box']['xmax'], oc['bounding_box']['ymax'],
														
 
															+                                   oc['bounding_box']['xmin']
														
 
															+                                   + (oc['bounding_box']['xmax'] - oc['bounding_box']['xmin']) // 2)
														
 
															+            for sr in sheet_regions:
														
 
															+                if sr['class_name'] == 'solve':
														
 
															+                    solve_box = (sr['bounding_box']['xmin'], sr['bounding_box']['ymin'],
														
 
															+                                 sr['bounding_box']['xmax'], sr['bounding_box']['ymax'])
														
 
															+                    if (optional_choice_box[1] <= solve_box[1] and
														
 
															+                            solve_box[0] < optional_choice_box[4] < solve_box[2] and
														
 
															+                            abs(optional_choice_box[1] - solve_box[1]) < solve_box[3] - solve_box[1]):
														
 
															+                        sr['class_name'] = 'optional_solve'
														
 
															+                        choice_numbers = oc['number']
														
 
															+                        solve_numbers = sr['number']
														
 
															+                        if choice_numbers[0] < 500:
														
 
															+                            sr['number'] = choice_numbers
														
 
															+                            sr['default_points'] = [sr['default_points']] * len(choice_numbers)
														
 
															+                        else:
														
 
															+                            tmp = [solve_numbers] * len(choice_numbers)
														
 
															+                            for i, num in enumerate(tmp):
														
 
															+                                tmp[i] = num + i
														
 
															+
														
 
															+                            sr['number'] = tmp
														
 
															+                            oc['number'] = tmp
														
 
															+                            sr['default_points'] = [sr['default_points']] * len(choice_numbers)
														
 
															+
														
 
															+                        break
														
 
															+
														
 
															+    if len(optional_choice_tmp_):
														
 
															+        sheet_regions.extend(optional_choice_tmp_)
														
 
															+
														
 
															+    # 去重
														
 
															     sheet_tmp = sheet_regions.copy()
														
 
															     remove_index = []
														
 
															     for i, region in enumerate(sheet_tmp):
														
 
															         if i not in remove_index:
														
 
															             box = region['bounding_box']
														
 
															+            name = region['class_name']
														
 
															             for j, region_in in enumerate(sheet_tmp):
														
 
															                 box_in = region_in['bounding_box']
														
 
															-                # TODO 根据大小
														
 
															+                name_in = region_in['class_name']
														
 
															                 iou = utils.cal_iou(box, box_in)
														
 
															-                if iou[0] > 0.75 and i != j:
														
 
															-                    sheet_regions.remove(region)
														
 
															-                    remove_index.append(j)
														
 
															+
														
 
															+                if name == name_in and (iou[0] > 0.75 or iou[1] > 0.85 or iou[2] > 0.85) and i != j:
														
 
															+                    box_area = (box['xmax'] - box['xmin']) * (box['ymax'] - box['ymin'])
														
 
															+                    box_in_area = (box_in['xmax'] - box_in['xmin']) * (box_in['ymax'] - box_in['ymin'])
														
 
															+
														
 
															+                    if box_area >= box_in_area:
														
 
															+                        sheet_regions.remove(region_in)
														
 
															+                        remove_index.append(j)
														
 
															+                    else:
														
 
															+                        sheet_regions.remove(region)
														
 
															+                        remove_index.append(i)
														
 
															                     break
														
 
															     sheet_dict.update({'regions': sheet_regions})
														
@@ -335,8 +405,8 @@ def merge_span_boxes(col_sheets):
 
															         next_col = col_sheets[i + 1]
														
 
															         if not cur_col or not next_col:
														
 
															             continue
														
 
															-        current_bottom_box = cur_col[-1]
														
 
															-        next_col_top_box = next_col[0]
														
 
															+        current_bottom_box = cur_col[-1]   # 当前栏的最后一个，bottom
														
 
															+        next_col_top_box = next_col[0]  # 下一栏的第一个，top
														
 
															         b_name = current_bottom_box['class_name']
														
 
															         t_name = next_col_top_box['class_name']
														
--- a/segment/sheet_resolve/analysis/sheet/choice_infer.py
+++ b/segment/sheet_resolve/analysis/sheet/choice_infer.py
@@ -299,6 +299,7 @@ def cluster_and_anti_abnormal(image, xml_path, choice_n_list, digital_list, char
 
															             digital_list_to_cluster.append(digital_list[i])
														
 
															             digital_loc_arr.append(point)
														
 
															+    # 得到所有题号区域， 作为后续划分choice_m的依据
														
 
															     choice_m_numbers_list = []
														
 
															     for ele in choice_n_list:
														
 
															         loc = ele['bounding_box']
														
@@ -418,295 +419,438 @@ def cluster_and_anti_abnormal(image, xml_path, choice_n_list, digital_list, char
 
															     #             # cond1 = cond2 = true, 因为infer选择题时已横向排序， 默认这种情况不会出现
														
 
															     #             pass
														
 
															+    direction180, direction90 = 0, 0
														
 
															     for ele in choice_m_numbers_list:
														
 
															         loc = ele["loc"]
														
 
															-        if loc[3] - loc[1] >= loc[2] - loc[0]:
														
 
															+        if loc[3] - loc[1] >= 2 * (loc[2] - loc[0]):
														
 
															             direction = 180
														
 
															+            direction180 += 1
														
 
															         else:
														
 
															             direction = 90
														
 
															+            direction90 += 1
														
 
															         ele.update({'direction': direction})
														
 
															-    # tree = ET.parse(xml_path)
														
 
															-    # for index, choice_m in enumerate(choice_m_numbers_list):
														
 
															-    #     name = str(choice_m["numbers"])
														
 
															-    #     xmin, ymin, xmax, ymax, _, _ = choice_m["loc"]
														
 
															-    #     tree = create_xml(name, tree, str(xmin + limit_left), str(ymin + limit_top), str(xmax + limit_left), str(ymax + limit_top))
														
 
															-    #
														
 
															-    # tree.write(xml_path)
														
 
															-    choice_m_numbers_list = sorted(choice_m_numbers_list, key=lambda x: x['loc'][3] - x['loc'][1], reverse=True)
														
 
															-    choice_m_numbers_right_limit = max([ele['loc'][2] for ele in choice_m_numbers_list])
														
 
															-    remain_len = len(choice_m_numbers_list)
														
 
															-    choice_m_list = list()
														
 
															-    need_revised_choice_m_list = list()
														
 
															-    while remain_len > 0:
														
 
															-        # 先确定属于同行的数据，然后找字母划分block
														
 
															-        # random_index = random.randint(0, len(choice_m_numbers_list)-1)
														
 
															-        random_index = 0
														
 
															-        # print(random_index)
														
 
															-        ymax_limit = choice_m_numbers_list[random_index]["loc"][3]
														
 
															-        ymin_limit = choice_m_numbers_list[random_index]["loc"][1]
														
 
															-        # choice_m_numbers_list.pop(random_index)
														
 
															-
														
 
															-        # 当前行的choice_m
														
 
															-        current_row_choice_m_d = [ele for ele in choice_m_numbers_list if ymin_limit < ele["loc"][5] < ymax_limit]
														
 
															-        current_row_choice_m_d = sorted(current_row_choice_m_d, key=lambda x: x["loc"][0])
														
 
															-        # current_row_choice_m_d.append(choice_m_numbers_list[random_index])
														
 
															-        split_pix = sorted([ele["loc"][0] for ele in current_row_choice_m_d])  # xmin排序
														
 
															-        split_index = get_split_index(split_pix, dif=choice_s_width * 0.8)
														
 
															-        split_pix = [split_pix[ele] for ele in split_index[:-1]]
														
 
															-
														
 
															-        block_list = []
														
 
															-        for i in range(len(split_index) - 1):
														
 
															-            block = current_row_choice_m_d[split_index[i]: split_index[i + 1]]
														
 
															-            if len(block) > 1:
														
 
															-                remain_len = remain_len - (len(block) - 1)
														
 
															-                numbers_new = []
														
 
															-                loc_new = [[], [], [], []]
														
 
															-                for blk in block:
														
 
															-                    loc_old = blk["loc"]
														
 
															-                    numbers_new.extend(blk["numbers"])
														
 
															-                    for ii in range(4):
														
 
															-                        loc_new[ii].append(loc_old[ii])
														
 
															-
														
 
															-                loc_new[0] = min(loc_new[0])
														
 
															-                loc_new[1] = min(loc_new[1])
														
 
															-                loc_new[2] = max(loc_new[2])
														
 
															-                loc_new[3] = max(loc_new[3])
														
 
															-
														
 
															-                loc_new.append(loc_new[0] + (loc_new[2] - loc_new[0]) // 2)
														
 
															-                loc_new.append(loc_new[1] + (loc_new[3] - loc_new[1]) // 2)
														
 
															-
														
 
															-                block = [{"numbers": sorted(numbers_new), "loc": loc_new, "direction": block[0]["direction"]}]
														
 
															-
														
 
															-            block_list.extend(block)
														
 
															-
														
 
															-        current_row_choice_m_d = block_list
														
 
															-        current_row_chars = [ele for ele in chars_list
														
 
															-                             if ymin_limit < (ele["location"]["top"] + ele["location"]["height"] // 2) < ymax_limit]
														
 
															-
														
 
															-        # split_index.append(row_chars_xmax)  # 边界
														
 
															-        split_pix.append(round(split_pix[-1] + choice_s_width * 1.75))
														
 
															-        for i in range(0, len(split_pix) - 1):
														
 
															-            left_limit = split_pix[i]
														
 
															-            right_limit = split_pix[i + 1]
														
 
															-            block_chars = [ele for ele in current_row_chars
														
 
															-                           if left_limit < (ele["location"]["left"] + ele["location"]["width"] // 2) < right_limit]
														
 
															-
														
 
															-            a_z = '_ABCD_FGHT'
														
 
															-            letter_index = [a_z.index(ele['char'].upper()) for ele in block_chars if ele['char'].upper() in a_z]
														
 
															-
														
 
															-            letter_index_times = {ele: 0 for ele in set(letter_index)}
														
 
															-            for l_index in letter_index:
														
 
															-                letter_index_times[l_index] += 1
														
 
															-
														
 
															-            if (a_z.index("T") in letter_index) and (a_z.index("F") in letter_index):
														
 
															-                choice_option = "T, F"
														
 
															-                cols = 2
														
 
															-            else:
														
 
															-                if len(letter_index) < 1:
														
 
															-                    tmp = 4
														
 
															-                    choice_option = 'A,B,C,D'
														
 
															-                else:
														
 
															-                    tmp = max(set(letter_index))
														
 
															-
														
 
															-                    choice_option = ",".join(a_z[min(letter_index):tmp + 1])
														
 
															-                cols = tmp
														
 
															-            bias = 3  # pix
														
 
															-            current_loc = current_row_choice_m_d[i]["loc"]
														
 
															-            location = dict(xmin=(current_loc[2] + bias),  # 当前数字xmax右边
														
 
															-                            # xmin=max(current_loc[2] + bias, chars_xmin) + limit_left,
														
 
															-                            ymin=current_loc[1],
														
 
															-
														
 
															-                            xmax=(right_limit - bias),
														
 
															-                            # xmax=min(chars_xmax, right_limit - bias) + limit_left,
														
 
															-                            ymax=current_loc[3])
														
 
															-
														
 
															-            try:
														
 
															-                choice_m_img = utils.crop_region(image, location)
														
 
															-                if 0 in choice_m_img.shape[:2]:
														
 
															-                    continue
														
 
															-                right_loc, bottom_loc = adjust_choice_m(choice_m_img, mean_height, mean_width * 2)
														
 
															-                if right_loc > 0:
														
 
															-                    location.update(dict(xmax=right_loc + location['xmin']))
														
 
															-                if bottom_loc > 0:
														
 
															-                    location.update(dict(ymax=bottom_loc + location['ymin']))
														
 
															-            except Exception as e:
														
 
															-                print(e)
														
 
															-                traceback.print_exc()
														
 
															+    # 判断大多数choice_m的方向
														
 
															+    if direction180 >= direction90:   # 横排
														
 
															+
														
 
															+        choice_m_numbers_list = sorted(choice_m_numbers_list, key=lambda x: x['loc'][3] - x['loc'][1], reverse=True)
														
 
															+        choice_m_numbers_right_limit = max([ele['loc'][2] for ele in choice_m_numbers_list])
														
 
															+        remain_len = len(choice_m_numbers_list)
														
 
															+        choice_m_list = list()
														
 
															+        need_revised_choice_m_list = list()
														
 
															+        while remain_len > 0:
														
 
															+            # 先确定属于同行的数据，然后找字母划分block
														
 
															+
														
 
															+            random_index = 0
														
 
															+            # print(random_index)
														
 
															+            ymax_limit = choice_m_numbers_list[random_index]["loc"][3]
														
 
															+            ymin_limit = choice_m_numbers_list[random_index]["loc"][1]
														
 
															+
														
 
															+            # 当前行的choice_m
														
 
															+            current_row_choice_m_d = [ele for ele in choice_m_numbers_list if ymin_limit < ele["loc"][5] < ymax_limit]
														
 
															+            current_row_choice_m_d = sorted(current_row_choice_m_d, key=lambda x: x["loc"][0])
														
 
															+            # current_row_choice_m_d.append(choice_m_numbers_list[random_index])
														
 
															+
														
 
															+            # 对同行的题号区域排序， 得到分割间隔， 两个题号中间的区域为choice_m
														
 
															+            split_pix = sorted([ele["loc"][0] for ele in current_row_choice_m_d])  # xmin排序
														
 
															+            split_index = get_split_index(split_pix, dif=choice_s_width * 0.8)
														
 
															+            split_pix = [split_pix[ele] for ele in split_index[:-1]]
														
 
															+
														
 
															+            block_list = []
														
 
															+            for i in range(len(split_index) - 1):
														
 
															+                block = current_row_choice_m_d[split_index[i]: split_index[i + 1]]
														
 
															+                if len(block) > 1:
														
 
															+                    remain_len = remain_len - (len(block) - 1)
														
 
															+                    numbers_new = []
														
 
															+                    loc_new = [[], [], [], []]
														
 
															+                    for blk in block:
														
 
															+                        loc_old = blk["loc"]
														
 
															+                        numbers_new.extend(blk["numbers"])
														
 
															+                        for ii in range(4):
														
 
															+                            loc_new[ii].append(loc_old[ii])
														
 
															+
														
 
															+                    loc_new[0] = min(loc_new[0])
														
 
															+                    loc_new[1] = min(loc_new[1])
														
 
															+                    loc_new[2] = max(loc_new[2])
														
 
															+                    loc_new[3] = max(loc_new[3])
														
 
															+
														
 
															+                    loc_new.append(loc_new[0] + (loc_new[2] - loc_new[0]) // 2)
														
 
															+                    loc_new.append(loc_new[1] + (loc_new[3] - loc_new[1]) // 2)
														
 
															+
														
 
															+                    block = [{"numbers": sorted(numbers_new), "loc": loc_new, "direction": block[0]["direction"]}]
														
 
															+
														
 
															+                block_list.extend(block)
														
 
															+
														
 
															+            current_row_choice_m_d = block_list
														
 
															+            current_row_chars = [ele for ele in chars_list
														
 
															+                                 if ymin_limit < (ele["location"]["top"] + ele["location"]["height"] // 2) < ymax_limit]
														
 
															+
														
 
															+            # split_index.append(row_chars_xmax)  # 边界
														
 
															+            split_pix.append(limit_right)
														
 
															+            for i in range(0, len(split_pix) - 1):
														
 
															+                left_limit = split_pix[i]
														
 
															+                right_limit = split_pix[i + 1]
														
 
															+                block_chars = [ele for ele in current_row_chars
														
 
															+                               if left_limit < (ele["location"]["left"] + ele["location"]["width"] // 2) < right_limit]
														
 
															+
														
 
															+                a_z = '_ABCD_FGHT'
														
 
															+                letter_index = [a_z.index(ele['char'].upper()) for ele in block_chars if ele['char'].upper() in a_z]
														
 
															+
														
 
															+                letter_index_times = {ele: 0 for ele in set(letter_index)}
														
 
															+                for l_index in letter_index:
														
 
															+                    letter_index_times[l_index] += 1
														
 
															+
														
 
															+                if (a_z.index("T") in letter_index) and (a_z.index("F") in letter_index):
														
 
															+                    choice_option = "T, F"
														
 
															+                    cols = 2
														
 
															+                else:
														
 
															+                    if len(letter_index) < 1:
														
 
															+                        tmp = 4
														
 
															+                        choice_option = 'A,B,C,D'
														
 
															+                    else:
														
 
															+                        tmp = max(set(letter_index))
														
 
															+
														
 
															+                        choice_option = ",".join(a_z[min(letter_index):tmp + 1])
														
 
															+                    cols = tmp
														
 
															+
														
 
															+                bias = 3  # pix
														
 
															+                current_loc = current_row_choice_m_d[i]["loc"]
														
 
															+                location = dict(xmin=(current_loc[2] + bias),  # 当前数字xmax右边
														
 
															+                                # xmin=max(current_loc[2] + bias, chars_xmin) + limit_left,
														
 
															+                                ymin=current_loc[1],
														
 
															+
														
 
															+                                xmax=(right_limit - bias),
														
 
															+                                # xmax=min(chars_xmax, right_limit - bias) + limit_left,
														
 
															+                                ymax=current_loc[3])
														
 
															+
														
 
															+                try:
														
 
															+                    # 调整choice-m区域， 避免推断出来的区域过大
														
 
															+                    choice_m_img = utils.crop_region(image, location)
														
 
															+                    if 0 in choice_m_img.shape[:2]:
														
 
															+                        continue
														
 
															+                    right_loc, bottom_loc = adjust_choice_m(choice_m_img, mean_height, mean_width * 2)
														
 
															+                    if right_loc > 0:
														
 
															+                        location.update(dict(xmax=right_loc + location['xmin']))
														
 
															+                    if bottom_loc > 0:
														
 
															+                        location.update(dict(ymax=bottom_loc + location['ymin']))
														
 
															+                except Exception as e:
														
 
															+                    print(e)
														
 
															+                    traceback.print_exc()
														
 
															+
														
 
															+                tmp_w, tmp_h = location['xmax'] - location['xmin'], location['ymax'] - location['ymin'],
														
 
															+                numbers = current_row_choice_m_d[i]["numbers"]
														
 
															+
														
 
															+                direction = current_row_choice_m_d[i]["direction"]
														
 
															+                if direction == 180:
														
 
															+                    choice_m = dict(class_name='choice_m',
														
 
															+                                    number=numbers,
														
 
															+                                    bounding_box=location,
														
 
															+                                    choice_option=choice_option,
														
 
															+                                    default_points=[5] * len(numbers),
														
 
															+                                    direction=direction,
														
 
															+                                    cols=cols,
														
 
															+                                    rows=len(numbers))
														
 
															+                else:
														
 
															+                    choice_m = dict(class_name='choice_m',
														
 
															+                                    number=numbers,
														
 
															+                                    bounding_box=location,
														
 
															+                                    choice_option=choice_option,
														
 
															+                                    default_points=[5] * len(numbers),
														
 
															+                                    direction=direction,
														
 
															+                                    cols=len(numbers),
														
 
															+                                    rows=cols)
														
 
															+
														
 
															+                if tmp_w > 2 * choice_s_width:
														
 
															+                    need_revised_choice_m_list.append(choice_m)
														
 
															+                else:
														
 
															+                    choice_m_list.append(choice_m)
														
 
															+
														
 
															+            remain_len = remain_len - len(current_row_choice_m_d)
														
 
															+            for ele in choice_m_numbers_list.copy():
														
 
															+                if ele in current_row_choice_m_d:
														
 
															+                    choice_m_numbers_list.remove(ele)
														
 
															+
														
 
															+            for ele in choice_m_numbers_list.copy():
														
 
															+                if ele in current_row_chars:
														
 
															+                    choice_m_numbers_list.remove(ele)
														
 
															+
														
 
															+            # 解决单行问题
														
 
															+            if len(choice_m_list) > 0:
														
 
															+                crt_right_max = max([int(ele['bounding_box']['xmax']) for ele in choice_m_list])
														
 
															+                if limit_right - crt_right_max > choice_s_width:
														
 
															+                    # 存在区域
														
 
															+                    region_loc = {'xmin': crt_right_max + 10,
														
 
															+                                  'ymin': choice_m_list[0]['bounding_box']['ymin'],
														
 
															+                                  'xmax': limit_right,
														
 
															+                                  'ymax': choice_m_list[0]['bounding_box']['ymax']}
														
 
															+
														
 
															+                    contain_dig = []
														
 
															+                    for i, ele in enumerate(digital_loc_arr):
														
 
															+                        if region_loc['xmin'] < ele[0] < region_loc['xmax'] and region_loc['ymin'] < ele[1] < region_loc['ymax']:
														
 
															+                            contain_dig.append(digital_list[i])
														
 
															+
														
 
															+                    contain_chars = [ele for ele in chars_list
														
 
															+                                     if region_loc['xmin'] < (ele["location"]["left"] + ele["location"]["width"] // 2) < region_loc['xmax']
														
 
															+                                     and
														
 
															+                                     region_loc['xmin'] < (ele["location"]["top"] + ele["location"]["height"] // 2) < region_loc['ymax']]
														
 
															+                    numbers = [-1]
														
 
															+                    if contain_dig or contain_chars:
														
 
															+                        d_ymin, d_ymax, d_xmin, d_xmax = 9999, 0, 9999, 0
														
 
															+                        if contain_dig:
														
 
															+                            numbers = [ele["digital"] for ele in contain_dig]
														
 
															+                            d_ymin = min([ele['loc'][1] for ele in contain_dig])
														
 
															+                            d_ymax = max([ele['loc'][3] for ele in contain_dig])
														
 
															+                            d_xmin = min([ele['loc'][0] for ele in contain_dig])
														
 
															+                            d_xmax = max([ele['loc'][2] for ele in contain_dig])
														
 
															+
														
 
															+                        c_ymin, c_ymax, c_xmin, c_xmax = 9999, 0, 9999, 0
														
 
															+                        if contain_chars:
														
 
															+                            c_ymin = min([ele["location"]["top"] for ele in contain_chars])
														
 
															+                            c_ymax = max([ele["location"]["top"] + ele["location"]["height"] for ele in contain_chars])
														
 
															+                            c_xmin = min([ele["location"]["left"] for ele in contain_chars])
														
 
															+                            c_xmax = max([ele["location"]["left"] + ele["location"]["width"] for ele in contain_chars])
														
 
															+
														
 
															+                        r_ymin, r_ymax = min(d_ymin, c_ymin), max(d_ymax, c_ymax)
														
 
															+                        r_xmin, r_xmax = min(d_xmin, c_xmin), max(d_xmax, c_xmax)
														
 
															+
														
 
															+                        region_loc['ymin'] = r_ymin - 10
														
 
															+                        region_loc['ymax'] = r_ymax + 10
														
 
															+                        if d_xmin == r_xmin:
														
 
															+                            region_loc['xmin'] = d_xmax + 5
														
 
															+                            region_loc['xmax'] = d_xmax + 5 + int(1.2 * choice_s_width)
														
 
															+                        else:
														
 
															+                            if 1.2 * (r_xmax - r_xmin) > choice_s_width:
														
 
															+                                region_loc['xmin'] = r_xmin - 10
														
 
															+                                region_loc['xmax'] = r_xmax + 10
														
 
															+                            else:
														
 
															+                                region_loc['xmin'] = max((r_xmax - r_xmin) // 2 + r_xmin - choice_s_width,
														
 
															+                                                         crt_right_max + 10)
														
 
															+                                region_loc['xmax'] = min((r_xmax - r_xmin) // 2 + r_xmin + choice_s_width ,
														
 
															+                                                         limit_right)
														
 
															-            tmp_w, tmp_h = location['xmax'] - location['xmin'], location['ymax'] - location['ymin'],
														
 
															-            numbers = current_row_choice_m_d[i]["numbers"]
														
 
															-
														
 
															-            direction = current_row_choice_m_d[i]["direction"]
														
 
															-            if direction == 180:
														
 
															-                choice_m = dict(class_name='choice_m',
														
 
															-                                number=numbers,
														
 
															-                                bounding_box=location,
														
 
															-                                choice_option=choice_option,
														
 
															-                                default_points=[5] * len(numbers),
														
 
															-                                direction=direction,
														
 
															-                                cols=cols,
														
 
															-                                rows=len(numbers))
														
 
															-            else:
														
 
															-                choice_m = dict(class_name='choice_m',
														
 
															-                                number=numbers,
														
 
															-                                bounding_box=location,
														
 
															-                                choice_option=choice_option,
														
 
															-                                default_points=[5] * len(numbers),
														
 
															-                                direction=direction,
														
 
															-                                cols=len(numbers),
														
 
															-                                rows=cols)
														
 
															-
														
 
															-            if tmp_w > 2 * choice_s_width:
														
 
															-                need_revised_choice_m_list.append(choice_m)
														
 
															-            else:
														
 
															-                choice_m_list.append(choice_m)
														
 
															-
														
 
															-        remain_len = remain_len - len(current_row_choice_m_d)
														
 
															-        for ele in choice_m_numbers_list.copy():
														
 
															-            if ele in current_row_choice_m_d:
														
 
															-                choice_m_numbers_list.remove(ele)
														
 
															-
														
 
															-        for ele in choice_m_numbers_list.copy():
														
 
															-            if ele in current_row_chars:
														
 
															-                choice_m_numbers_list.remove(ele)
														
 
															-
														
 
															-        # 解决单行问题
														
 
															-        crt_right_max = max([int(ele['bounding_box']['xmax']) for ele in choice_m_list])
														
 
															-        if limit_right - crt_right_max > choice_s_width:
														
 
															-            # 存在区域
														
 
															-            region_loc = {'xmin': crt_right_max + 10,
														
 
															-                          'ymin': choice_m_list[0]['bounding_box']['ymin'],
														
 
															-                          'xmax': limit_right,
														
 
															-                          'ymax': choice_m_list[0]['bounding_box']['ymax']}
														
 
															-
														
 
															-            contain_dig = []
														
 
															-            for i, ele in enumerate(digital_loc_arr):
														
 
															-                if region_loc['xmin'] < ele[0] < region_loc['xmax'] and region_loc['ymin'] < ele[1] < region_loc['ymax']:
														
 
															-                    contain_dig.append(digital_list[i])
														
 
															-
														
 
															-            contain_chars = [ele for ele in chars_list
														
 
															-                             if region_loc['xmin'] < (ele["location"]["left"] + ele["location"]["width"] // 2) < region_loc['xmax']
														
 
															-                             and
														
 
															-                             region_loc['xmin'] < (ele["location"]["top"] + ele["location"]["height"] // 2) < region_loc['ymax']]
														
 
															-            numbers = [-1]
														
 
															-            if contain_dig or contain_chars:
														
 
															-                d_ymin, d_ymax, d_xmin, d_xmax = 9999, 0, 9999, 0
														
 
															-                if contain_dig:
														
 
															-                    numbers = [ele["digital"] for ele in contain_dig]
														
 
															-                    d_ymin = min([ele['loc'][1] for ele in contain_dig])
														
 
															-                    d_ymax = max([ele['loc'][3] for ele in contain_dig])
														
 
															-                    d_xmin = min([ele['loc'][0] for ele in contain_dig])
														
 
															-                    d_xmax = max([ele['loc'][2] for ele in contain_dig])
														
 
															-
														
 
															-                c_ymin, c_ymax, c_xmin, c_xmax = 9999, 0, 9999, 0
														
 
															-                if contain_chars:
														
 
															-                    c_ymin = min([ele["location"]["top"] for ele in contain_chars])
														
 
															-                    c_ymax = max([ele["location"]["top"] + ele["location"]["height"] for ele in contain_chars])
														
 
															-                    c_xmin = min([ele["location"]["left"] for ele in contain_chars])
														
 
															-                    c_xmax = max([ele["location"]["left"] + ele["location"]["width"] for ele in contain_chars])
														
 
															-
														
 
															-                r_ymin, r_ymax = min(d_ymin, c_ymin), max(d_ymax, c_ymax)
														
 
															-                r_xmin, r_xmax = min(d_xmin, c_xmin), max(d_xmax, c_xmax)
														
 
															-
														
 
															-                region_loc['ymin'] = r_ymin - 10
														
 
															-                region_loc['ymax'] = r_ymax + 10
														
 
															-                if d_xmin == r_xmin:
														
 
															-                    region_loc['xmin'] = d_xmax + 5
														
 
															-                    region_loc['xmax'] = d_xmax + 5 + int(1.2 * choice_s_width)
														
 
															+                    else:
														
 
															+                        # 默认这种情况只有1行或2行
														
 
															+                        numbers = [-1]
														
 
															+                        region_xmin = crt_right_max + 5
														
 
															+                        region_xmax = int(region_xmin + 1.2 * choice_s_width)
														
 
															+                        region_ymin = min([int(ele['bounding_box']['ymin']) for ele in choice_m_list])
														
 
															+                        region_ymax = max([int(ele['bounding_box']['ymax']) for ele in choice_m_list])
														
 
															+                        region_ymax = region_ymin + (region_ymax - region_ymin) // 2  # 默认这种情况只有1行或2行
														
 
															+                        region_loc = {'xmin': region_xmin, 'ymin': region_ymin, 'xmax': region_xmax, 'ymax': region_ymax}
														
 
															+
														
 
															+                    try:
														
 
															+                        choice_m_img = utils.crop_region(image, region_loc)
														
 
															+                        if 0 in choice_m_img.shape[:2]:
														
 
															+                            continue
														
 
															+                        right_loc, bottom_loc = adjust_choice_m(choice_m_img, mean_height, mean_width * 2)
														
 
															+                        if right_loc > 0:
														
 
															+                            region_loc.update(dict(xmax=right_loc + region_loc['xmin']))
														
 
															+                        if bottom_loc > 0:
														
 
															+                            region_loc.update(dict(ymax=bottom_loc + region_loc['ymin']))
														
 
															+                    except Exception as e:
														
 
															+                        print(e)
														
 
															+                        traceback.print_exc()
														
 
															+
														
 
															+                    choice_m = dict(class_name='choice_m',
														
 
															+                                    number=numbers,
														
 
															+                                    bounding_box=region_loc,
														
 
															+                                    choice_option='A,B,C,D',
														
 
															+                                    default_points=[5],
														
 
															+                                    direction=180,
														
 
															+                                    cols=4,
														
 
															+                                    rows=1,
														
 
															+                                    single_width=(region_loc['xmax'] - region_loc['xmin']) // 4,
														
 
															+                                    )
														
 
															+                    choice_m_list.append(choice_m)
														
 
															+
														
 
															+        # 单独一行不聚类(理论上不会再到这一步了, 上个block解决)
														
 
															+        for i, revised_choice_m in enumerate(need_revised_choice_m_list):
														
 
															+            loc = revised_choice_m['bounding_box']
														
 
															+            left_part_loc = loc.copy()
														
 
															+            left_part_loc.update({'xmax': loc['xmin'] + choice_s_width})
														
 
															+            choice_m_img = utils.crop_region(image, left_part_loc)
														
 
															+            right_loc, bottom_loc = adjust_choice_m(choice_m_img, mean_height, mean_width * 2)
														
 
															+            if right_loc > 0:
														
 
															+                left_part_loc.update(dict(xmax=right_loc + left_part_loc['xmin']))
														
 
															+            if bottom_loc > 0:
														
 
															+                left_part_loc.update(dict(ymax=bottom_loc + left_part_loc['ymin']))
														
 
															+
														
 
															+            left_tmp_height = left_part_loc['ymax'] - left_part_loc['ymin']
														
 
															+
														
 
															+            right_part_loc = loc.copy()
														
 
															+            # right_part_loc.update({'xmin': loc['xmax']-choice_s_width})
														
 
															+            right_part_loc.update({'xmin': left_part_loc['xmax'] + 5})
														
 
															+            choice_m_img = utils.crop_region(image, right_part_loc)
														
 
															+            right_loc, bottom_loc = adjust_choice_m(choice_m_img, mean_height, mean_width * 2)
														
 
															+            if right_loc > 0:
														
 
															+                right_part_loc.update(dict(xmax=right_loc + right_part_loc['xmin']))
														
 
															+            if bottom_loc > 0:
														
 
															+                right_part_loc.update(dict(ymax=bottom_loc + right_part_loc['ymin']))
														
 
															+
														
 
															+            right_tmp_height = right_part_loc['ymax'] - right_part_loc['ymin']
														
 
															+
														
 
															+            number_len = max(1, int(revised_choice_m['rows'] // (left_tmp_height // right_tmp_height)))
														
 
															+            number = [ele + revised_choice_m['number'][-1] + 1 for ele in range(number_len)]
														
 
															+            rows = len(number)
														
 
															+
														
 
															+            revised_choice_m.update({'bounding_box': left_part_loc})
														
 
															+            choice_m_list.append(revised_choice_m)
														
 
															+
														
 
															+            tmp = revised_choice_m.copy()
														
 
															+            tmp.update({'bounding_box': right_part_loc, 'number': number, 'rows': rows})
														
 
															+            choice_m_list.append(tmp)
														
 
															+
														
 
															+        choice_m_list_copy = choice_m_list.copy()
														
 
															+        for ele in choice_m_list_copy:
														
 
															+            loc = ele["bounding_box"]
														
 
															+            w, h = loc['xmax'] - loc['xmin'], loc['ymax'] - loc['ymin']
														
 
															+            if 2 * w * h < choice_s_width * choice_s_height:
														
 
															+                choice_m_list.remove(ele)
														
 
															+        return choice_m_list
														
 
															+
														
 
															+    else:   # 竖排
														
 
															+        # 横向最大
														
 
															+        choice_m_numbers_list = sorted(choice_m_numbers_list, key=lambda x: x['loc'][2] - x['loc'][0], reverse=True)
														
 
															+        remain_len = len(choice_m_numbers_list)
														
 
															+        choice_m_list = list()
														
 
															+        need_revised_choice_m_list = list()
														
 
															+        while remain_len > 0:
														
 
															+            # 先确定属于同列的数据，然后找字母划分block
														
 
															+            random_index = 0
														
 
															+            xmax_limit = choice_m_numbers_list[random_index]["loc"][2]
														
 
															+            xmin_limit = choice_m_numbers_list[random_index]["loc"][0]
														
 
															+            # choice_m_numbers_list.pop(random_index)
														
 
															+
														
 
															+            # 当前行的choice_m
														
 
															+            current_row_choice_m_d = [ele for ele in choice_m_numbers_list if xmin_limit < ele["loc"][4] < xmax_limit]
														
 
															+            current_row_choice_m_d = sorted(current_row_choice_m_d, key=lambda x: x["loc"][1])
														
 
															+            # current_row_choice_m_d.append(choice_m_numbers_list[random_index])
														
 
															+            split_pix = sorted([ele["loc"][1] for ele in current_row_choice_m_d])  # ymin排序
														
 
															+            split_index = get_split_index(split_pix, dif=choice_s_height * 0.8)
														
 
															+            split_pix = [split_pix[ele] for ele in split_index[:-1]]
														
 
															+
														
 
															+            block_list = []
														
 
															+            for i in range(len(split_index) - 1):
														
 
															+                block = current_row_choice_m_d[split_index[i]: split_index[i + 1]]
														
 
															+                if len(block) > 1:
														
 
															+                    remain_len = remain_len - (len(block) - 1)
														
 
															+                    numbers_new = []
														
 
															+                    loc_new = [[], [], [], []]
														
 
															+                    for blk in block:
														
 
															+                        loc_old = blk["loc"]
														
 
															+                        numbers_new.extend(blk["numbers"])
														
 
															+                        for ii in range(4):
														
 
															+                            loc_new[ii].append(loc_old[ii])
														
 
															+
														
 
															+                    loc_new[0] = min(loc_new[0])
														
 
															+                    loc_new[1] = min(loc_new[1])
														
 
															+                    loc_new[2] = max(loc_new[2])
														
 
															+                    loc_new[3] = max(loc_new[3])
														
 
															+
														
 
															+                    loc_new.append(loc_new[0] + (loc_new[2] - loc_new[0]) // 2)
														
 
															+                    loc_new.append(loc_new[1] + (loc_new[3] - loc_new[1]) // 2)
														
 
															+
														
 
															+                    block = [{"numbers": sorted(numbers_new), "loc": loc_new, "direction": block[0]["direction"]}]
														
 
															+
														
 
															+                block_list.extend(block)
														
 
															+
														
 
															+            current_row_choice_m_d = block_list
														
 
															+            current_row_chars = [ele for ele in chars_list
														
 
															+                                 if xmin_limit < (ele["location"]["top"] + ele["location"]["height"] // 2) < xmax_limit]
														
 
															+
														
 
															+            split_pix.append(limit_bottom)
														
 
															+            for i in range(0, len(split_pix) - 1):
														
 
															+                top_limit = split_pix[i]
														
 
															+                bottom_limit = split_pix[i + 1]
														
 
															+                block_chars = [ele for ele in current_row_chars
														
 
															+                               if top_limit < (ele["location"]["left"] + ele["location"]["width"] // 2) < bottom_limit]
														
 
															+
														
 
															+                a_z = '_ABCD_FGHT'
														
 
															+                letter_text = set([ele['char'].upper() for ele in block_chars if ele['char'].upper() in a_z])
														
 
															+                letter_index = [a_z.index(ele['char'].upper()) for ele in block_chars if ele['char'].upper() in a_z]
														
 
															+
														
 
															+                letter_index_times = {ele: 0 for ele in set(letter_index)}
														
 
															+                for l_index in letter_index:
														
 
															+                    letter_index_times[l_index] += 1
														
 
															+
														
 
															+                if (a_z.index("T") in letter_index) and (a_z.index("F") in letter_index):
														
 
															+                    choice_option = "T, F"
														
 
															+                    cols = 2
														
 
															                 else:
														
 
															-                    if 1.2 * (r_xmax - r_xmin) > choice_s_width:
														
 
															-                        region_loc['xmin'] = r_xmin - 10
														
 
															-                        region_loc['xmax'] = r_xmax + 10
														
 
															+                    if len(letter_index) < 1:
														
 
															+                        tmp = 4
														
 
															+                        choice_option = 'A,B,C,D'
														
 
															                     else:
														
 
															-                        region_loc['xmin'] = max((r_xmax - r_xmin) // 2 + r_xmin - choice_s_width,
														
 
															-                                                 crt_right_max + 10)
														
 
															-                        region_loc['xmax'] = min((r_xmax - r_xmin) // 2 + r_xmin + choice_s_width ,
														
 
															-                                                 limit_right)
														
 
															+                        tmp = max(set(letter_index))
														
 
															+                        choice_option = ",".join(a_z[min(letter_index):tmp + 1])
														
 
															+                    cols = tmp
														
 
															+
														
 
															+                bias = 3  # pix
														
 
															+                current_loc = current_row_choice_m_d[i]["loc"]
														
 
															+                location = dict(xmin=current_loc[0],
														
 
															+                                ymin=current_loc[3] + bias,
														
 
															+                                xmax=current_loc[1],
														
 
															+                                ymax=bottom_limit - bias)
														
 
															+
														
 
															+                try:
														
 
															+                    choice_m_img = utils.crop_region(image, location)
														
 
															+                    right_loc, bottom_loc = adjust_choice_m(choice_m_img, mean_height, mean_width * 2)
														
 
															+                    if right_loc > 0:
														
 
															+                        location.update(dict(xmax=right_loc + location['xmin']))
														
 
															+                    if bottom_loc > 0:
														
 
															+                        location.update(dict(ymax=bottom_loc + location['ymin']))
														
 
															+                except Exception as e:
														
 
															+                    print(e)
														
 
															+                    traceback.print_exc()
														
 
															+
														
 
															+                tmp_w, tmp_h = location['xmax'] - location['xmin'], location['ymax'] - location['ymin'],
														
 
															+                numbers = current_row_choice_m_d[i]["numbers"]
														
 
															+                direction = current_row_choice_m_d[i]["direction"]
														
 
															+                if direction == 180:
														
 
															+                    choice_m = dict(class_name='choice_m',
														
 
															+                                    number=numbers,
														
 
															+                                    bounding_box=location,
														
 
															+                                    choice_option=choice_option,
														
 
															+                                    default_points=[5] * len(numbers),
														
 
															+                                    direction=direction,
														
 
															+                                    cols=cols,
														
 
															+                                    rows=len(numbers))
														
 
															+                else:
														
 
															+                    choice_m = dict(class_name='choice_m',
														
 
															+                                    number=numbers,
														
 
															+                                    bounding_box=location,
														
 
															+                                    choice_option=choice_option,
														
 
															+                                    default_points=[5] * len(numbers),
														
 
															+                                    direction=direction,
														
 
															+                                    cols=len(numbers),
														
 
															+                                    rows=cols)
														
 
															+
														
 
															+                if tmp_h > 2 * choice_s_height:
														
 
															+                    need_revised_choice_m_list.append(choice_m)
														
 
															+                else:
														
 
															+                    choice_m_list.append(choice_m)
														
 
															-            else:
														
 
															-                # 默认这种情况只有1行或2行
														
 
															-                numbers = [-1]
														
 
															-                region_xmin = crt_right_max + 5
														
 
															-                region_xmax = int(region_xmin + 1.2 * choice_s_width)
														
 
															-                region_ymin = min([int(ele['bounding_box']['ymin']) for ele in choice_m_list])
														
 
															-                region_ymax = max([int(ele['bounding_box']['ymax']) for ele in choice_m_list])
														
 
															-                region_ymax = region_ymin + (region_ymax - region_ymin) // 2  # 默认这种情况只有1行或2行
														
 
															-                region_loc = {'xmin': region_xmin, 'ymin': region_ymin, 'xmax': region_xmax, 'ymax': region_ymax}
														
 
															+            remain_len = remain_len - len(current_row_choice_m_d)
														
 
															+            for ele in choice_m_numbers_list.copy():
														
 
															+                if ele in current_row_choice_m_d:
														
 
															+                    choice_m_numbers_list.remove(ele)
														
 
															-            try:
														
 
															-                choice_m_img = utils.crop_region(image, region_loc)
														
 
															-                if 0 in choice_m_img.shape[:2]:
														
 
															-                    continue
														
 
															-                right_loc, bottom_loc = adjust_choice_m(choice_m_img, mean_height, mean_width * 2)
														
 
															-                if right_loc > 0:
														
 
															-                    region_loc.update(dict(xmax=right_loc + region_loc['xmin']))
														
 
															-                if bottom_loc > 0:
														
 
															-                    region_loc.update(dict(ymax=bottom_loc + region_loc['ymin']))
														
 
															-            except Exception as e:
														
 
															-                print(e)
														
 
															-                traceback.print_exc()
														
 
															+            for ele in choice_m_numbers_list.copy():
														
 
															+                if ele in current_row_chars:
														
 
															+                    choice_m_numbers_list.remove(ele)
														
 
															-            choice_m = dict(class_name='choice_m',
														
 
															-                            number=numbers,
														
 
															-                            bounding_box=region_loc,
														
 
															-                            choice_option='A,B,C,D',
														
 
															-                            default_points=[5],
														
 
															-                            direction=180,
														
 
															-                            cols=4,
														
 
															-                            rows=1,
														
 
															-                            single_width=(region_loc['xmax'] - region_loc['xmin']) // 4,
														
 
															-                            )
														
 
															-            choice_m_list.append(choice_m)
														
 
															-
														
 
															-    # 单独一行不聚类(理论上不会再到这一步了, 上个block解决)
														
 
															-    for i, revised_choice_m in enumerate(need_revised_choice_m_list):
														
 
															-        loc = revised_choice_m['bounding_box']
														
 
															-        left_part_loc = loc.copy()
														
 
															-        left_part_loc.update({'xmax': loc['xmin'] + choice_s_width})
														
 
															-        choice_m_img = utils.crop_region(image, left_part_loc)
														
 
															-        right_loc, bottom_loc = adjust_choice_m(choice_m_img, mean_height, mean_width * 2)
														
 
															-        if right_loc > 0:
														
 
															-            left_part_loc.update(dict(xmax=right_loc + left_part_loc['xmin']))
														
 
															-        if bottom_loc > 0:
														
 
															-            left_part_loc.update(dict(ymax=bottom_loc + left_part_loc['ymin']))
														
 
															-
														
 
															-        left_tmp_height = left_part_loc['ymax'] - left_part_loc['ymin']
														
 
															-
														
 
															-        right_part_loc = loc.copy()
														
 
															-        # right_part_loc.update({'xmin': loc['xmax']-choice_s_width})
														
 
															-        right_part_loc.update({'xmin': left_part_loc['xmax'] + 5})
														
 
															-        choice_m_img = utils.crop_region(image, right_part_loc)
														
 
															-        right_loc, bottom_loc = adjust_choice_m(choice_m_img, mean_height, mean_width * 2)
														
 
															-        if right_loc > 0:
														
 
															-            right_part_loc.update(dict(xmax=right_loc + right_part_loc['xmin']))
														
 
															-        if bottom_loc > 0:
														
 
															-            right_part_loc.update(dict(ymax=bottom_loc + right_part_loc['ymin']))
														
 
															-
														
 
															-        right_tmp_height = right_part_loc['ymax'] - right_part_loc['ymin']
														
 
															-
														
 
															-        number_len = max(1, int(revised_choice_m['rows'] // (left_tmp_height // right_tmp_height)))
														
 
															-        number = [ele + revised_choice_m['number'][-1] + 1 for ele in range(number_len)]
														
 
															-        rows = len(number)
														
 
															-
														
 
															-        revised_choice_m.update({'bounding_box': left_part_loc})
														
 
															-        choice_m_list.append(revised_choice_m)
														
 
															-
														
 
															-        tmp = revised_choice_m.copy()
														
 
															-        tmp.update({'bounding_box': right_part_loc, 'number': number, 'rows': rows})
														
 
															-        choice_m_list.append(tmp)
														
 
															-
														
 
															-    choice_m_list_copy = choice_m_list.copy()
														
 
															-    for ele in choice_m_list_copy:
														
 
															-        loc = ele["bounding_box"]
														
 
															-        w, h = loc['xmax'] - loc['xmin'], loc['ymax'] - loc['ymin']
														
 
															-        if 2 * w * h < choice_s_width * choice_s_height:
														
 
															-            choice_m_list.remove(ele)
														
 
															-    return choice_m_list
														
 
															+        choice_m_list_copy = choice_m_list.copy()
														
 
															+        for ele in choice_m_list_copy:
														
 
															+            loc = ele["bounding_box"]
														
 
															+            w, h = loc['xmax'] - loc['xmin'], loc['ymax'] - loc['ymin']
														
 
															+            if 2 * w * h < choice_s_width * choice_s_height:
														
 
															+                choice_m_list.remove(ele)
														
 
															+
														
 
															+        return choice_m_list
														
 
															-def infer_choice_m(image, tf_sheet, col_split_x, ocr, xml=None):
														
 
															-    infer_box_list = ocr2sheet(image, col_split_x, ocr, xml)
														
 
															+def infer_choice_m(image, tf_sheet, infer_box_list, col_split_x, xml=None):
														
 
															+    # infer_box_list = ocr2sheet(image, col_split_x, ocr, xml)
														
 
															     if not infer_box_list:
														
 
															         for ele in tf_sheet:
														
 
															             if ele['class_name'] == 'choice':
														
--- a/segment/sheet_resolve/analysis/sheet/ocr_sheet.py
+++ b/segment/sheet_resolve/analysis/sheet/ocr_sheet.py
@@ -161,10 +161,12 @@ def ocr2sheet(image, col_split_list, raw_ocr, xml_path=None):
 
															         # print(raw_chn_index)
														
 
															-        left_limit = min([ele['location']['left'] for ele in ocr_res
														
 
															-                          if ele['location']['width'] >= ele['location']['height']]) - 10
														
 
															-        right_limit = max([ele['location']['right'] for ele in ocr_res
														
 
															-                           if ele['location']['width'] >= ele['location']['height']]) + 10
														
 
															+        left_limit, right_limit = col_split_list[ii], col_split_list[ii+1]
														
 
															+        if len(ocr_res) > 0:
														
 
															+            left_limit = min([ele['location']['left'] for ele in ocr_res
														
 
															+                              if ele['location']['width'] >= ele['location']['height']]) - 10
														
 
															+            right_limit = max([ele['location']['right'] for ele in ocr_res
														
 
															+                               if ele['location']['width'] >= ele['location']['height']]) + 10
														
 
															         # 文字识别结果可能连横跨栏，并导致文字分栏错误
														
 
															         left_limit = max(left_limit, col_split_list[ii])
														
@@ -237,8 +239,17 @@ def sheet_sorted(regions, split_x):
 
															     region_contain_set.extend(region_contain_set_)
														
 
															     # split_x = tell_columns(image, regions)
														
 
															-    regions = sorted(regions, key=lambda x: x['bounding_box']['xmin'])
														
 
															-    x_min_list = [ele['bounding_box']['xmin'] for ele in regions]
														
 
															+    for rg in regions:
														
 
															+        xi = rg['bounding_box']['xmin']
														
 
															+        xm = rg['bounding_box']['xmax']
														
 
															+        yi = rg['bounding_box']['ymin']
														
 
															+        ym = rg['bounding_box']['ymax']
														
 
															+        xmid = (xm - xi)//2 + xi
														
 
															+        ymid = (ym - yi)//2 + yi
														
 
															+        rg['bounding_box'].update({'xmid': xmid, 'ymid': ymid})
														
 
															+    regions = sorted(regions, key=lambda x: x['bounding_box']['xmid'])
														
 
															+
														
 
															+    x_min_list = [ele['bounding_box']['xmid'] for ele in regions]
														
 
															     # 分栏
														
 
															     col_list = []
														
--- a/segment/sheet_resolve/analysis/sheet/sheet_adjust.py
+++ b/segment/sheet_resolve/analysis/sheet/sheet_adjust.py
@@ -11,6 +11,8 @@ import numpy as np
 
															 ''' 根据CV检测矩形框 调整模型输出框'''
														
 
															 ''' LSD直线检测 暂时改用 霍夫曼检测'''
														
 
															+ADJUST_CLASS = ['solve', 'solve0', 'composition', 'composition0', 'choice', 'cloze', 'correction']
														
 
															+
														
 
															 # 用户自己计算阈值
														
 
															 def custom_threshold(gray, type_inv=cv2.THRESH_BINARY):
														
@@ -53,7 +55,7 @@ def dilation_img(image, kernel_size):
 
															 # 图像padding
														
 
															 def image_padding(image, padding_w, padding_h):
														
 
															     h, w = image.shape[:2]
														
 
															-    if (3 == len(image.shape)):
														
 
															+    if 3 == len(image.shape):
														
 
															         image_new = np.zeros((h + padding_h, w + padding_w, 3), np.uint8)
														
 
															     else:
														
 
															         image_new = np.zeros((h + padding_h, w + padding_w), np.uint8)
														
@@ -62,7 +64,7 @@ def image_padding(image, padding_w, padding_h):
 
															 def horizontal_projection(img_bin, mut=0):
														
 
															-    '''水平方向投影'''
														
 
															+    """水平方向投影"""
														
 
															     h, w = img_bin.shape[:2]
														
 
															     hist = [0 for i in range(w)]
														
 
															     for x in range(w):
														
@@ -90,33 +92,33 @@ def vertical_projection(img_bin, mut=0):
 
															 def get_white_blok_pos(arry, blok_w=0):
														
 
															-    '''获取投影结果中的白色块'''
														
 
															+    """获取投影结果中的白色块"""
														
 
															     pos = []
														
 
															     start = 1
														
 
															     x0 = 0
														
 
															     x1 = 0
														
 
															     for idx, val in enumerate(arry):
														
 
															-        if (start):
														
 
															+        if start:
														
 
															             if val:
														
 
															                 x0 = idx
														
 
															                 start = 0
														
 
															         else:
														
 
															-            if (0 == val):
														
 
															+            if 0 == val:
														
 
															                 x1 = idx
														
 
															                 start = 1
														
 
															-                if (x1 - x0 > blok_w):
														
 
															+                if x1 - x0 > blok_w:
														
 
															                     pos.append((x0, x1))
														
 
															-    if (0 == start):
														
 
															+    if 0 == start:
														
 
															         x1 = len(arry) - 1
														
 
															-        if (x1 - x0 > blok_w):
														
 
															+        if x1 - x0 > blok_w:
														
 
															             pos.append((x0, x1))
														
 
															     return pos
														
 
															 def get_decide_boberLpa(itemRe, itemGT):
														
 
															-    '''
														
 
															+    """
														
 
															     IOU 计算
														
 
															-    '''
														
 
															+    """
														
 
															     x1 = int(itemRe[0])
														
 
															     y1 = int(itemRe[1])
														
 
															     x1_ = int(itemRe[2])
														
@@ -153,6 +155,7 @@ def get_decide_boberLpa(itemRe, itemGT):
 
															 # 查找连通区域 微调专用 不通用
														
 
															+
														
 
															 def get_contours(image):
														
 
															     # image = cv2.imread(img_path,0)
														
 
															     # if debug: plt_imshow(image)
														
@@ -172,29 +175,29 @@ def get_contours(image):
 
															         w = int(box[2])
														
 
															         h = int(box[3])
														
 
															         area = int(box[4])
														
 
															-        if (w < img_w / 5 or w > img_w - 10 or h < 50 or h > img_h - 10):  # 常见框大小限定
														
 
															+        if w < img_w / 5 or w > img_w - 10 or h < 50 or h > img_h - 10:  # 常见框大小限定
														
 
															             continue
														
 
															-        if (img_w > img_h):  # 多栏答题卡 w大于宽度的一般肯定是错误的框
														
 
															-            if (w > img_w / 2):
														
 
															+        if img_w > img_h:  # 多栏答题卡 w大于宽度的一般肯定是错误的框
														
 
															+            if w > img_w / 2:
														
 
															                 continue
														
 
															-        if (area < w * h / 3):  # 大框套小框 中空白色区域形成的面积 排除
														
 
															+        if area < w * h / 3:  # 大框套小框 中空白色区域形成的面积 排除
														
 
															             continue
														
 
															         rects.append((x0, y0, x0 + w, y0 + h))
														
 
															     return rects
														
 
															 def adjust_alarm_info(image, box):
														
 
															-    '''
														
 
															+    """
														
 
															     调整上下坐标 排除内部含有了边框线情况
														
 
															     左右调整只有100%确认的 从边界开始遇到的第一个非0列就终止 误伤情况太多
														
 
															     LSD算法转不过来  霍夫曼检测不靠谱 连通区域测试后排除误伤情况太多  改用投影
														
 
															     image: 灰度 非 二值图
														
 
															     box  : 坐标信息
														
 
															-    '''
														
 
															+    """
														
 
															     # debug
														
 
															     # debug = 0
														
 
															-    if (image is None):
														
 
															+    if image is None:
														
 
															         print("error image")
														
 
															         return box
														
 
															     img_box = image[box[1]:box[3], box[0]:box[2]]
														
@@ -259,15 +262,15 @@ def adjust_alarm_info(image, box):
 
															     new_right = w_len - 1
														
 
															     b_flag = [0, 0]
														
 
															     for idx, val in enumerate(hist_proj):
														
 
															-        if (0 == b_flag[0]):
														
 
															-            if (val != 0):
														
 
															+        if 0 == b_flag[0]:
														
 
															+            if val != 0:
														
 
															                 new_left = idx
														
 
															                 b_flag[0] = 1
														
 
															-        if (0 == b_flag[1]):
														
 
															-            if (hist_proj[w_len - 1 - idx] != 0):
														
 
															+        if 0 == b_flag[1]:
														
 
															+            if hist_proj[w_len - 1 - idx] != 0:
														
 
															                 new_right = w_len - idx - 1
														
 
															                 b_flag[1] = 1
														
 
															-        if (b_flag[0] and b_flag[1]):
														
 
															+        if b_flag[0] and b_flag[1]:
														
 
															             break
														
 
															     new_top = box[1] + y_pos[max_id][0]
														
@@ -283,12 +286,12 @@ def adjust_alarm_info(image, box):
 
															 def adjust_zg_info(image, box, cv_boxes):
														
 
															-    '''
														
 
															+    """
														
 
															     调整大区域的box
														
 
															     1、cvbox要与box纵坐标有交叉
														
 
															     2、IOU值大于0。8时 默认相等拷贝区域坐标
														
 
															-    '''
														
 
															-    if (image is None):
														
 
															+    """
														
 
															+    if image is None:
														
 
															         return box
														
 
															     min_rotio = 0.5
														
@@ -299,9 +302,9 @@ def adjust_zg_info(image, box, cv_boxes):
 
															     tmp_rotio = 0
														
 
															     rc_mz = box
														
 
															     for idx, cv_box in enumerate(cv_boxes):
														
 
															-        if ((box[1] - 10) > (cv_box[3])):  # 首先要保证纵坐标有交叉
														
 
															+        if (box[1] - 10) > (cv_box[3]):  # 首先要保证纵坐标有交叉
														
 
															             continue
														
 
															-        if ((box[3] + 10) < cv_box[1]):
														
 
															+        if (box[3] + 10) < cv_box[1]:
														
 
															             continue
														
 
															         jc_x = max(box[0], cv_box[0])
														
@@ -310,14 +313,14 @@ def adjust_zg_info(image, box, cv_boxes):
 
															         bj_y = max(box[2], cv_box[2])
														
 
															         rt = abs(jc_y - jc_x) * 1.0 / abs(bj_y - bj_x) * 1.0
														
 
															-        if (rt < min_rotio):
														
 
															+        if rt < min_rotio:
														
 
															             continue
														
 
															         jc_boxes.append(cv_box)
														
 
															-        if (rt > tmp_rotio):
														
 
															+        if rt > tmp_rotio:
														
 
															             rc_mz = cv_box
														
 
															             tmp_rotio = rt
														
 
															     # 判断 调整
														
 
															-    if (len(jc_boxes) != 0):
														
 
															+    if len(jc_boxes) != 0:
														
 
															         box[0] = rc_mz[0]
														
 
															         box[2] = rc_mz[2]
														
 
															         b_find = 0
														
@@ -325,29 +328,29 @@ def adjust_zg_info(image, box, cv_boxes):
 
															         rc_biggst = rc_mz
														
 
															         for mz_box in jc_boxes:
														
 
															             iou = get_decide_boberLpa(mz_box, box)
														
 
															-            if (iou > 0.8):
														
 
															+            if iou > 0.8:
														
 
															                 b_find = 1
														
 
															                 frotio = iou
														
 
															                 rc_biggst = mz_box
														
 
															-        if (b_find):
														
 
															+        if b_find:
														
 
															             box[1] = rc_biggst[1]
														
 
															             box[3] = rc_biggst[3]
														
 
															     return box
														
 
															 def adjust_item_edge(img_path, reback_json):
														
 
															-    '''
														
 
															+    """
														
 
															     根据图像的CV分析结果和 模型直接输出结果 对模型输出的边框做微调
														
 
															     1、外接矩形查找
														
 
															     2、LSD直线检测 替换方法 霍夫曼直线检测
														
 
															     3、只处理有把握的情况 任何含有不确定因素的一律不作任何处理
														
 
															     img_path: 待处理图像绝对路径
														
 
															     re_json : 模型输出结果
														
 
															-    '''
														
 
															+    """
														
 
															     debug = 1
														
 
															     # 存放新的结果
														
 
															     re_json = copy.deepcopy(reback_json)
														
 
															-    if (not os.path.exists(img_path) or 0 == len(re_json)):
														
 
															+    if not os.path.exists(img_path) or 0 == len(re_json):
														
 
															         return
														
 
															     image = cv2.imread(img_path, 0)
														
 
															     # 获取CV连通区域结果
														
@@ -365,7 +368,7 @@ def adjust_item_edge(img_path, reback_json):
 
															         box = [item["bounding_box"]["xmin"], item["bounding_box"]["ymin"], item["bounding_box"]["xmax"],
														
 
															                item["bounding_box"]["ymax"]]
														
 
															         # print(name ,box)
														
 
															-        if (name == "alarm_info" or name == "page" or name == "type_score"):
														
 
															+        if name == "alarm_info" or name == "page" or name == "type_score":
														
 
															             if debug:
														
 
															                 cv2.rectangle(image_draw, (box[0], box[1]), (box[2], box[3]), (0, 255, 0), 2)
														
 
															             new_box = adjust_alarm_info(image, box)
														
@@ -423,7 +426,7 @@ def adjust_item_edge_by_gray_image(image, reback_json):
 
															         box = [item["bounding_box"]["xmin"], item["bounding_box"]["ymin"], item["bounding_box"]["xmax"],
														
 
															                item["bounding_box"]["ymax"]]
														
 
															         # print(name ,box)
														
 
															-        if (name == "alarm_info" or name == "page" or name == "type_score"):
														
 
															+        if name == "alarm_info" or name == "page" or name == "type_score":
														
 
															             if debug:
														
 
															                 cv2.rectangle(image_draw, (box[0], box[1]), (box[2], box[3]), (0, 255, 0), 2)
														
 
															             new_box = adjust_alarm_info(image, box)
														
@@ -433,9 +436,7 @@ def adjust_item_edge_by_gray_image(image, reback_json):
 
															             item["bounding_box"]["xmax"] = box[2]
														
 
															             item["bounding_box"]["ymin"] = box[1]
														
 
															             item["bounding_box"]["ymax"] = box[3]
														
 
															-        elif (name == "solve" or name == "solve0"
														
 
															-              or name == "cloze" or name == "choice"
														
 
															-              or name == "composition" or name == "composition0"):
														
 
															+        elif name in ADJUST_CLASS:
														
 
															             if debug:
														
 
															                 cv2.rectangle(image_draw, (box[0], box[1]), (box[2], box[3]), (0, 255, 0), 2)
														
 
															             new_box = adjust_zg_info(image, box, cv_boxes)
														
--- a/segment/sheet_resolve/analysis/sheet/sheet_infer.py
+++ b/segment/sheet_resolve/analysis/sheet/sheet_infer.py
@@ -117,10 +117,11 @@ def infer_bar_code(image, ocr_dict_list, attention_region):
 
															                     xmax = right_board_location['left'] + right_board_location['width']
														
 
															                     ymax = down_board_location['top'] + down_board_location['height']
														
 
															-                    xmin = max(1, int(xmin)-5)
														
 
															-                    ymin = max(1, int(ymin)-5)
														
 
															-                    xmax = min(int(xmax), img_rows - 1)
														
 
															-                    ymax = min(int(ymax), img_cols - 1 )
														
 
															+                    bias = 5
														
 
															+                    xmin = max(1, int(xmin)-bias)
														
 
															+                    ymin = max(1, int(ymin)-bias)
														
 
															+                    xmax = min(int(xmax)+bias, img_rows - 1)
														
 
															+                    ymax = min(int(ymax)+bias, img_cols - 1)
														
 
															                     bar_code_dict = {'class_name': 'bar_code',
														
 
															                                      'bounding_box': {'xmin': xmin, 'ymin': ymin, 'xmax': xmax, 'ymax': ymax}}
														
 
															                     bar_code_dict_list.append(bar_code_dict)
														
@@ -214,7 +215,7 @@ def infer_exam_number(image, ocr_dict_list, existed_regions, times_threshold=5):
 
															                 if 9 in key_digital:
														
 
															                     break
														
 
															-    if 0 in key_digital and 9 in key_digital:
														
 
															+    if 0 in key_digital and 9 in key_digital and len(key_digital) > 4:
														
 
															         mean_height = sum(all_height)//10
														
 
															         exam_number_dict = {'class_name': 'exam_number',
														
 
															                             'bounding_box': {'xmin': xmin, 'ymin': ymin, 'xmax': xmax, 'ymax': ymax+mean_height},
														
@@ -257,29 +258,30 @@ def infer_exam_number(image, ocr_dict_list, existed_regions, times_threshold=5):
 
															         iou_cond = True
														
 
															         exam_number_dict_list_check = []
														
 
															-        for exam_number_dict in exam_number_dict_list:
														
 
															-            exam_number_polygon = Polygon([(exam_number_dict["xmin"], exam_number_dict["ymin"]),
														
 
															-                                           (exam_number_dict["xmax"], exam_number_dict["ymin"]),
														
 
															-                                           (exam_number_dict["xmax"], exam_number_dict["ymax"]),
														
 
															-                                           (exam_number_dict["xmin"], exam_number_dict["ymax"])])
														
 
															-            for region in existed_regions:
														
 
															-                class_name = region["class_name"]
														
 
															-
														
 
															-                if class_name in ["attention", "solve", "choice", "choice_m", 'choice_s', "cloze", 'cloze_s',
														
 
															-                                  'bar_code', 'qr_code', 'composition', 'solve0']:
														
 
															-                    coordinates = region['bounding_box']
														
 
															-                    xmin = coordinates['xmin']
														
 
															-                    ymin = coordinates['ymin']
														
 
															-                    xmax = coordinates['xmax']
														
 
															-                    ymax = coordinates['ymax']
														
 
															-                    existed_polygon = Polygon([(xmin, ymin), (xmax, ymin), (xmax, ymax), (xmin, ymax)])
														
 
															-                    overlab_area = existed_polygon.intersection(exam_number_polygon).area
														
 
															-                    iou = overlab_area / (exam_number_polygon.area + existed_polygon.area - overlab_area)
														
 
															-                    if iou > 0:
														
 
															-                        iou_cond = False
														
 
															-                        break
														
 
															-            if iou_cond:
														
 
															-                exam_number_dict_list_check.append(exam_number_polygon)
														
 
															+        if len(exam_number_dict_list) > 0:
														
 
															+            for exam_number_dict in exam_number_dict_list:
														
 
															+                exam_number_polygon = Polygon([(exam_number_dict["xmin"], exam_number_dict["ymin"]),
														
 
															+                                               (exam_number_dict["xmax"], exam_number_dict["ymin"]),
														
 
															+                                               (exam_number_dict["xmax"], exam_number_dict["ymax"]),
														
 
															+                                               (exam_number_dict["xmin"], exam_number_dict["ymax"])])
														
 
															+                for region in existed_regions:
														
 
															+                    class_name = region["class_name"]
														
 
															+
														
 
															+                    if class_name in ["attention", "solve", "choice", "choice_m", 'choice_s', "cloze", 'cloze_s',
														
 
															+                                      'bar_code', 'qr_code', 'composition', 'solve0']:
														
 
															+                        coordinates = region['bounding_box']
														
 
															+                        xmin = coordinates['xmin']
														
 
															+                        ymin = coordinates['ymin']
														
 
															+                        xmax = coordinates['xmax']
														
 
															+                        ymax = coordinates['ymax']
														
 
															+                        existed_polygon = Polygon([(xmin, ymin), (xmax, ymin), (xmax, ymax), (xmin, ymax)])
														
 
															+                        overlab_area = existed_polygon.intersection(exam_number_polygon).area
														
 
															+                        iou = overlab_area / (exam_number_polygon.area + existed_polygon.area - overlab_area)
														
 
															+                        if iou > 0:
														
 
															+                            iou_cond = False
														
 
															+                            break
														
 
															+                if iou_cond:
														
 
															+                    exam_number_dict_list_check.append(exam_number_polygon)
														
 
															         return exam_number_dict_list_check
														
@@ -393,7 +395,8 @@ def exam_number_adjust_infer(image, regions):
 
															         region = regions[i]
														
 
															         if region['class_name'] == 'exam_number_s':
														
 
															             loc = region['bounding_box']
														
 
															-            box.append([loc['xmin'], loc['ymin'], loc['xmax'], loc['ymax']])
														
 
															+            if loc['ymax'] - loc['ymin'] > loc['xmax'] - loc['xmin']:
														
 
															+                box.append([loc['xmin'], loc['ymin'], loc['xmax'], loc['ymax']])
														
 
															         if region['class_name'] == 'exam_number':
														
 
															             loc = region['bounding_box']
														
@@ -403,7 +406,8 @@ def exam_number_adjust_infer(image, regions):
 
															         if region['class_name'] == 'exam_number_w':
														
 
															             loc = region['bounding_box']
														
 
															-            box1.append([loc['xmin'], loc['ymax'], loc['xmax'], loc['ymax']])
														
 
															+            if loc['xmax'] - loc['xmin'] > loc['ymax'] - loc['ymin']:
														
 
															+                box1.append([loc['xmin'], loc['ymax'], loc['xmax'], loc['ymax']])  # exam_number_w 只取下界
														
 
															     if not box:
														
 
															         return image, regions
														
--- a/segment/sheet_resolve/analysis/solve/optional_solve.py
+++ b/segment/sheet_resolve/analysis/solve/optional_solve.py
@@ -48,10 +48,10 @@ def resolve_optional_choice(l_, t_, direction, image):
 
															     ocr_res = get_ocr_text_and_coordinate(image)
														
 
															     digital_list, chars_list, d_mean_height, d_mean_width = find_digital(ocr_res, 0, 0,)
														
 
															     if not digital_list:
														
 
															-        numbers = [501]
														
 
															+        numbers = [501, 502]
														
 
															         h, w = image.shape
														
 
															         optional_choice_dict = {'class_name': 'optional_choice',
														
 
															-                                'rows': 1, 'cols': 1,
														
 
															+                                'rows': 1, 'cols': 2,
														
 
															                                 'single_width': w,
														
 
															                                 'single_height': h,
														
 
															                                 'direction': direction,
														
@@ -63,7 +63,7 @@ def resolve_optional_choice(l_, t_, direction, image):
 
															     else:
														
 
															         numbers = sorted([ele['digital'] for ele in digital_list])
														
 
															-        contours = find_contours(l_, t_, image, d_mean_width//2, d_mean_height//2)
														
 
															+        contours = find_contours(l_, t_, image, d_mean_width*2, d_mean_height)
														
 
															         res_region = []
														
 
															         for contour in contours:
														
@@ -91,9 +91,13 @@ def resolve_optional_choice(l_, t_, direction, image):
 
															         mean_w, mean_h = sum_w//len(numbers), sum_h//len(numbers)
														
 
															         if direction == 180:
														
 
															-            rows, cols = 1, len(numbers)
														
 
															+            rows, cols = 1, max(2, len(numbers))
														
 
															+            if len(numbers) < 2:
														
 
															+                numbers.append(501)
														
 
															         else:
														
 
															-            rows, cols = len(numbers), 1
														
 
															+            rows, cols = max(2, len(numbers)), 1
														
 
															+            if len(numbers) < 2:
														
 
															+                numbers.append(501)
														
 
															         optional_choice_dict = {'class_name': 'optional_choice',
														
 
															                                 'rows': rows, 'cols': cols,
														
--- a/segment/sheet_resolve/tools/tf_sess.py
+++ b/segment/sheet_resolve/tools/tf_sess.py
@@ -7,6 +7,8 @@ from segment.sheet_resolve.lib.model.config import cfg
 
															 from segment.sheet_resolve.lib.nets.resnet_v1 import resnetv1
														
 
															 from segment.sheet_resolve.tools.tf_settings import model_dict
														
 
															+# os.environ['CUDA_VISIBLE_DEVICES'] = '0,1'
														
 
															+
														
 
															 class TfSess:
														
--- a/segment/sheet_resolve/tools/tf_settings.py
+++ b/segment/sheet_resolve/tools/tf_settings.py
@@ -9,7 +9,7 @@ subject_list = ['math', 'math_zxhx', 'english', 'chinese',
 
															                 'geography', 'science_comprehensive', 'arts_comprehensive', 'cloze', 'choice']
														
 
															 BASE_DIR = os.path.dirname(os.path.dirname(os.path.abspath(__file__)))
														
 
															-decide_blank_model = model_dir_path = os.path.join(BASE_DIR, 'model', 'decide_blank', 'model.npy')
														
 
															+decide_blank_model = os.path.join(BASE_DIR, 'model', 'decide_blank', 'model.npy')
														
 
															 xml_template_path = os.path.join(BASE_DIR, 'labels', '000000-template.xml')
														
 
															 images_dir_path = os.path.join(BASE_DIR, 'images')
														
--- a/segment/sheet_resolve/tools/utils.py
+++ b/segment/sheet_resolve/tools/utils.py
@@ -155,8 +155,8 @@ def img_resize(analysis_type, im):
 
															 def resize_faster_rcnn(analysis_type, im_orig):
														
 
															-    min_size = 375
														
 
															-    max_size = 500
														
 
															+    min_size = 1500
														
 
															+    max_size = 2000
														
 
															     if analysis_type == 'math_blank':
														
 
															         min_size = 1500
														
 
															         max_size = 2000
														
@@ -172,7 +172,7 @@ def resize_faster_rcnn(analysis_type, im_orig):
 
															     im = cv2.resize(im_orig, None, None, fx=im_scale, fy=im_scale,
														
 
															                     interpolation=cv2.INTER_LINEAR)
														
 
															-    return im, (im_scale, im_scale)
														
 
															+    return im, (1/im_scale, 1/im_scale)
														
 
															 def resize_by_percent(im, percent):
														
--- a/segment/sheet_server.py
+++ b/segment/sheet_server.py
@@ -248,6 +248,7 @@ def sheet_row_col_resolve(raw_img, sheet_dict, choice_sess, cloze_sess, xml_save
 
															     mns_thresh_0 = 0.3
														
 
															     regions = sheet_dict['regions']
														
 
															     classes_name = str([ele['class_name'] for ele in regions])
														
 
															+    subject = sheet_dict['subject']
														
 
															     region_tmp = regions.copy()
														
 
															     # json.dumps(sheet_dict, ensure_ascii=False)
														
@@ -263,7 +264,7 @@ def sheet_row_col_resolve(raw_img, sheet_dict, choice_sess, cloze_sess, xml_save
 
															     if 'choice_m' in classes_name:
														
 
															         try:
														
 
															-            choice_dict_list = choice_m_row_col(raw_img, regions, xml_save_path)
														
 
															+            choice_dict_list = choice_m_row_col(raw_img, regions, subject, xml_save_path)
														
 
															             if len(choice_dict_list) > 0:
														
 
															                 region_tmp.extend(choice_dict_list)
														
 
															         except Exception as e:
														
@@ -296,12 +297,13 @@ def sheet_row_col_resolve(raw_img, sheet_dict, choice_sess, cloze_sess, xml_save
 
															 def sheet_detail_resolve(raw_img, sheet_dict, xml_save_path, shrink=True):
														
 
															     regions = sheet_dict['regions']
														
 
															     classes_names_list = set([ele['class_name'] for ele in regions])
														
 
															+    subject = sheet_dict['subject']
														
 
															     region_tmp = regions.copy()
														
 
															     # json.dumps(sheet_dict, ensure_ascii=False)
														
 
															     if 'choice_m' in classes_names_list:
														
 
															         try:
														
 
															-            choice_dict_list = choice_m_row_col(raw_img, regions, xml_save_path)
														
 
															+            choice_dict_list = choice_m_row_col(raw_img, regions, subject, xml_save_path)
														
 
															             if shrink:
														
 
															                 for ele in choice_dict_list:
														
 
															                     if 'all_small_coordinate' in ele.keys():
														
@@ -361,6 +363,7 @@ def sheet_points(sheet_dict_list, image_list, ocr_list, if_ocr=False):
 
															     try:
														
 
															         res = get_sheet_points(sheet_list)
														
 
															         sheet_dict_list = [ele['sheet_dict'] for ele in res]
														
 
															+        image_list = [ele['raw_image'] for ele in res]
														
 
															     except Exception as e:
														
 
															         traceback.print_exc()
														
 
															         sheet_dict_list = [ele['sheet_dict'] for ele in sheet_list]
														
@@ -384,7 +387,7 @@ def sheet_points(sheet_dict_list, image_list, ocr_list, if_ocr=False):
 
															     if if_ocr:
														
 
															         for index, ele in enumerate(sheet_total_list):
														
 
															             ele.update({'sheet_ocr': ocr_list[index]})
														
 
															-    return sheet_total_list
														
 
															+    return sheet_total_list, image_list
														
 
															 def sheet_format_output(init_number, crt_numbers, sheet_dict, image, subject, shrink):
														
@@ -397,6 +400,7 @@ def sheet_format_output(init_number, crt_numbers, sheet_dict, image, subject, sh
 
															     for col_regions in col_regions_list:
														
 
															         _, init_number, crt_numbers = question_number_format(init_number, crt_numbers, col_regions)
														
 
															+    # 合并跨栏主观题
														
 
															     merge_span_boxes(col_regions_list)
														
 
															     regions = list(itertools.chain(*col_regions_list))
														
--- a/segment/sheet_views.py
+++ b/segment/sheet_views.py
@@ -438,7 +438,7 @@ def analysis_box_once_with_multiple_img(request):
 
															                     detail_xml.append(small_box_xml_path)
														
 
															                     shutil.copy(raw_xml_path, small_box_xml_path)
														
 
															                     try:
														
 
															-                        # 找题号
														
 
															+                        # 找选择题行列题号， 考号行列
														
 
															                         small_box_sheet_dict = sheet_detail_resolve(image, sheet_dict, small_box_xml_path, shrink=True)
														
 
															                     except Exception as e:
														
 
															                         traceback.print_exc()
														
@@ -460,7 +460,7 @@ def analysis_box_once_with_multiple_img(request):
 
															                     error_info = error_info + 'box resolve error;'
														
 
															             try:
														
 
															-                res_info_list = sheet_points(res_info_list, image_list, ocr_list, if_ocr=False)
														
 
															+                res_info_list, image_list = sheet_points(res_info_list, image_list, ocr_list, if_ocr=False)
														
 
															             except Exception as e:
														
 
															                 print(e)
														
 
															                 traceback.print_exc()