Spaces:

bachpc
/

table-structure-recognition

Build error

App Files Community

bachpc committed on Apr 21, 2023

Commit

c59b7a8

•

1 Parent(s): 3479c98

Update postprocess.py

Browse files

Files changed (2) hide show

app.py +1 -1
postprocess.py +25 -23

app.py CHANGED Viewed

@@ -141,7 +141,7 @@ def crop_image(pil_img, detection_result):
         fontScale = lw / 3
         thickness = max(lw - 1, 1)
         w_label, h_label = cv2.getTextSize(label, 0, fontScale=fontScale, thickness=thickness)[0]
-        cv2.rectangle(image, (x1, y1), (x1 + w_label, y1 - h_label - 3), (255, 0, 0), -1, cv2.LINE_AA)
         cv2.putText(image, label, (x1, y1 - 2), cv2.FONT_HERSHEY_SIMPLEX, fontScale, (255, 255, 255), thickness=thickness, lineType=cv2.LINE_AA)
     return crop_images, cv_to_PIL(image)

         fontScale = lw / 3
         thickness = max(lw - 1, 1)
         w_label, h_label = cv2.getTextSize(label, 0, fontScale=fontScale, thickness=thickness)[0]
+        cv2.rectangle(image, (x1, y1), (x1 + w_label, y1 - h_label - 3), (0, 0, 255), -1, cv2.LINE_AA)
         cv2.putText(image, label, (x1, y1 - 2), cv2.FONT_HERSHEY_SIMPLEX, fontScale, (255, 255, 255), thickness=thickness, lineType=cv2.LINE_AA)
     return crop_images, cv_to_PIL(image)

postprocess.py CHANGED Viewed

@@ -16,7 +16,7 @@ def apply_threshold(objects, threshold):
 def apply_class_thresholds(bboxes, labels, scores, class_names, class_thresholds):
     """
     Filter out bounding boxes whose confidence is below the confidence threshold for
-    its associated class label.
     """
     # Apply class-specific thresholds
     indices_above_threshold = [idx for idx, (score, label) in enumerate(zip(scores, labels))
@@ -37,11 +37,11 @@ def iou(bbox1, bbox2):
     """
     intersection = Rect(bbox1).intersect(bbox2)
     union = Rect(bbox1).include_rect(bbox2)
     union_area = union.get_area()
     if union_area > 0:
         return intersection.get_area() / union.get_area()
     return 0
@@ -50,11 +50,11 @@ def iob(bbox1, bbox2):
     Compute the intersection area over box area, for bbox1.
     """
     intersection = Rect(bbox1).intersect(bbox2)
     bbox1_area = Rect(bbox1).get_area()
     if bbox1_area > 0:
         return intersection.get_area() / bbox1_area
     return 0
@@ -123,7 +123,7 @@ def objects_to_table_structures(table_object, objects_in_table, tokens_in_table,
     row_rect = Rect()
     for obj in rows:
         row_rect.include_rect(obj['bbox'])
-    column_rect = Rect()
     for obj in columns:
         column_rect.include_rect(obj['bbox'])
     table_object['row_column_bbox'] = [column_rect[0], row_rect[1], column_rect[2], row_rect[3]]
@@ -189,7 +189,7 @@ def nms_by_containment(container_objects, package_objects, overlap_threshold=0.5
     suppression = [False for obj in container_objects]
     packages_by_container, _, _ = slot_into_containers(container_objects, package_objects, overlap_threshold=overlap_threshold,
-                                                 unique_assignment=True, forced_assignment=False)
     for object2_num in range(1, num_objects):
         object2_packages = set(packages_by_container[object2_num])
@@ -198,7 +198,9 @@ def nms_by_containment(container_objects, package_objects, overlap_threshold=0.5
         for object1_num in range(object2_num):
             if not suppression[object1_num]:
                 object1_packages = set(packages_by_container[object1_num])
-                if len(object2_packages.intersection(object1_packages)) > 0:
                     suppression[object2_num] = True
     final_objects = [obj for idx, obj in enumerate(container_objects) if not suppression[idx]]
@@ -222,7 +224,7 @@ def slot_into_containers(container_objects, package_objects, overlap_threshold=0
     for package_num, package in enumerate(package_objects):
         match_scores = []
         package_rect = Rect(package['bbox'])
-        package_area = package_rect.get_area()
         for container_num, container in enumerate(container_objects):
             container_rect = Rect(container['bbox'])
             intersect_area = container_rect.intersect(package['bbox']).get_area()
@@ -244,7 +246,7 @@ def slot_into_containers(container_objects, package_objects, overlap_threshold=0
                     package_assignments[package_num].append(match_score['container_num'])
                 else:
                     break
     return container_assignments, package_assignments, best_match_scores
@@ -268,8 +270,8 @@ def remove_objects_without_content(page_spans, objects):
         object_text, _ = extract_text_inside_bbox(page_spans, obj['bbox'])
         if len(object_text.strip()) == 0:
             objects.remove(obj)
 def extract_text_inside_bbox(spans, bbox):
     """
     Extract the text inside a bounding box.
@@ -314,7 +316,7 @@ def extract_text_from_spans(spans, join_with_space=True, remove_integer_superscr
     else:
         join_char = ""
     spans_copy = spans[:]
     if remove_integer_superscripts:
         for span in spans:
             if not 'flags' in span:
@@ -328,11 +330,11 @@ def extract_text_from_spans(spans, join_with_space=True, remove_integer_superscr
     if len(spans_copy) == 0:
         return ""
     spans_copy.sort(key=lambda span: span['span_num'])
     spans_copy.sort(key=lambda span: span['line_num'])
     spans_copy.sort(key=lambda span: span['block_num'])
     # Force the span at the end of every line within a block to have exactly one space
     # unless the line ends with a space or ends with a non-space followed by a hyphen
     line_texts = []
@@ -351,7 +353,7 @@ def extract_text_from_spans(spans, join_with_space=True, remove_integer_superscr
             line_span_texts.append(span2['text'])
     line_text = join_char.join(line_span_texts)
     line_texts.append(line_text)
     return join_char.join(line_texts).strip()
@@ -443,7 +445,7 @@ def refine_table_structures(table_bbox, table_structures, page_spans, class_thre
 def nms(objects, match_criteria="object2_overlap", match_threshold=0.05, keep_higher=True):
     """
     A customizable version of non-maxima suppression (NMS).
     Default behavior: If a lower-confidence object overlaps more than 5% of its area
     with a higher-confidence object, remove the lower-confidence object.
@@ -493,7 +495,7 @@ def align_headers(headers, rows):
     For now, we are not supporting tables with multiple headers, so we need to
     eliminate anything besides the top-most header.
     """
     aligned_headers = []
     for row in rows:
@@ -672,7 +674,7 @@ def header_supercell_tree(supercells):
     """
     header_supercells = [supercell for supercell in supercells if 'header' in supercell and supercell['header']]
     header_supercells = sort_objects_by_score(header_supercells)
     for header_supercell in header_supercells[:]:
         ancestors_by_row = defaultdict(int)
         min_row = min(header_supercell['row_numbers'])
@@ -687,8 +689,8 @@ def header_supercell_tree(supercells):
             if not ancestors_by_row[row] == 1:
                 supercells.remove(header_supercell)
                 break
 def table_structure_to_cells(table_structures, table_spans, table_bbox):
     """
     Assuming the row, column, supercell, and header bounding boxes have
@@ -787,10 +789,10 @@ def table_structure_to_cells(table_structures, table_spans, table_bbox):
     for cell, cell_span_nums in zip(cells, span_nums_by_cell):
         cell_spans = [table_spans[num] for num in cell_span_nums]
         # TODO: Refine how text is extracted; should be character-based, not span-based;
-        # but need to associate
         # cell['cell_text'] = extract_text_from_spans(cell_spans, remove_integer_superscripts=False)  # TODO
         cell['spans'] = cell_spans
     # Adjust the row, column, and cell bounding boxes to reflect the extracted text
     num_rows = len(rows)
     rows = sort_objects_top_to_bottom(rows)

 def apply_class_thresholds(bboxes, labels, scores, class_names, class_thresholds):
     """
     Filter out bounding boxes whose confidence is below the confidence threshold for
+    its associated class label.
     """
     # Apply class-specific thresholds
     indices_above_threshold = [idx for idx, (score, label) in enumerate(zip(scores, labels))
     """
     intersection = Rect(bbox1).intersect(bbox2)
     union = Rect(bbox1).include_rect(bbox2)
     union_area = union.get_area()
     if union_area > 0:
         return intersection.get_area() / union.get_area()
     return 0
     Compute the intersection area over box area, for bbox1.
     """
     intersection = Rect(bbox1).intersect(bbox2)
     bbox1_area = Rect(bbox1).get_area()
     if bbox1_area > 0:
         return intersection.get_area() / bbox1_area
     return 0
     row_rect = Rect()
     for obj in rows:
         row_rect.include_rect(obj['bbox'])
+    column_rect = Rect()
     for obj in columns:
         column_rect.include_rect(obj['bbox'])
     table_object['row_column_bbox'] = [column_rect[0], row_rect[1], column_rect[2], row_rect[3]]
     suppression = [False for obj in container_objects]
     packages_by_container, _, _ = slot_into_containers(container_objects, package_objects, overlap_threshold=overlap_threshold,
+                                                 unique_assignment=False, forced_assignment=False)
     for object2_num in range(1, num_objects):
         object2_packages = set(packages_by_container[object2_num])
         for object1_num in range(object2_num):
             if not suppression[object1_num]:
                 object1_packages = set(packages_by_container[object1_num])
+                if len(object2_packages.intersection(object1_packages)) > 0 \
+                    and (iob(container_objects[object2_num]['bbox'], container_objects[object1_num]['bbox']) > 0.5 \
+                         or iob(container_objects[object1_num]['bbox'], container_objects[object2_num]['bbox']) > 0.5):
                     suppression[object2_num] = True
     final_objects = [obj for idx, obj in enumerate(container_objects) if not suppression[idx]]
     for package_num, package in enumerate(package_objects):
         match_scores = []
         package_rect = Rect(package['bbox'])
+        package_area = package_rect.get_area()
         for container_num, container in enumerate(container_objects):
             container_rect = Rect(container['bbox'])
             intersect_area = container_rect.intersect(package['bbox']).get_area()
                     package_assignments[package_num].append(match_score['container_num'])
                 else:
                     break
     return container_assignments, package_assignments, best_match_scores
         object_text, _ = extract_text_inside_bbox(page_spans, obj['bbox'])
         if len(object_text.strip()) == 0:
             objects.remove(obj)
 def extract_text_inside_bbox(spans, bbox):
     """
     Extract the text inside a bounding box.
     else:
         join_char = ""
     spans_copy = spans[:]
     if remove_integer_superscripts:
         for span in spans:
             if not 'flags' in span:
     if len(spans_copy) == 0:
         return ""
     spans_copy.sort(key=lambda span: span['span_num'])
     spans_copy.sort(key=lambda span: span['line_num'])
     spans_copy.sort(key=lambda span: span['block_num'])
     # Force the span at the end of every line within a block to have exactly one space
     # unless the line ends with a space or ends with a non-space followed by a hyphen
     line_texts = []
             line_span_texts.append(span2['text'])
     line_text = join_char.join(line_span_texts)
     line_texts.append(line_text)
     return join_char.join(line_texts).strip()
 def nms(objects, match_criteria="object2_overlap", match_threshold=0.05, keep_higher=True):
     """
     A customizable version of non-maxima suppression (NMS).
     Default behavior: If a lower-confidence object overlaps more than 5% of its area
     with a higher-confidence object, remove the lower-confidence object.
     For now, we are not supporting tables with multiple headers, so we need to
     eliminate anything besides the top-most header.
     """
     aligned_headers = []
     for row in rows:
     """
     header_supercells = [supercell for supercell in supercells if 'header' in supercell and supercell['header']]
     header_supercells = sort_objects_by_score(header_supercells)
     for header_supercell in header_supercells[:]:
         ancestors_by_row = defaultdict(int)
         min_row = min(header_supercell['row_numbers'])
             if not ancestors_by_row[row] == 1:
                 supercells.remove(header_supercell)
                 break
 def table_structure_to_cells(table_structures, table_spans, table_bbox):
     """
     Assuming the row, column, supercell, and header bounding boxes have
     for cell, cell_span_nums in zip(cells, span_nums_by_cell):
         cell_spans = [table_spans[num] for num in cell_span_nums]
         # TODO: Refine how text is extracted; should be character-based, not span-based;
+        # but need to associate
         # cell['cell_text'] = extract_text_from_spans(cell_spans, remove_integer_superscripts=False)  # TODO
         cell['spans'] = cell_spans
     # Adjust the row, column, and cell bounding boxes to reflect the extracted text
     num_rows = len(rows)
     rows = sort_objects_top_to_bottom(rows)