add minor edits

This commit is contained in:
Isaac Riley 2022-03-02 07:43:02 +01:00
parent 4c06206445
commit ff84734ee8
4 changed files with 8 additions and 7 deletions

View File

@ -22,7 +22,7 @@ dvc pull
### As an API
The module provided functions for the individual tasks that all return some kid of collection of points, depending on
The module provided functions for the individual tasks that all return some kind of collection of points, depending on
the specific task.
#### Redaction Detection

View File

@ -29,7 +29,7 @@ if __name__ == "__main__":
show_mpl(page)
# page_ = deskew_linebased(page, verbose=True)
# show_mpl(page_)
page_corr = deskew_histbased(page, verbose=True)
page_corr, _ = deskew_histbased(page, verbose=True)
show_mpl(page_corr)
if args.save_path:
page_ = Image.fromarray(page).convert("RGB")

View File

@ -145,7 +145,7 @@ def annotate_tables_in_pdf(pdf_path, page_index=0, deskew=False):
page = pdf2image.convert_from_path(pdf_path, first_page=page_index + 1, last_page=page_index + 1)[0]
page = np.array(page)
if deskew:
page = deskew_histbased(page)
page, _ = deskew_histbased(page)
stats = parse_table(page)
page = draw_rectangles(page, stats, annotate=True)

View File

@ -52,9 +52,10 @@ def deskew_linebased(image: np.array, verbose=False) -> np.array:
return image
def deskew_histbased(page: np.array, max_abs_angle=1.5, delta=0.15, mode="nearest", verbose=False):
page = cv2.cvtColor(page, cv2.COLOR_BGR2GRAY)
page = cv2.fastNlMeansDenoising(page, h=3)
def deskew_histbased(page: np.array, preprocess=True, max_abs_angle=1.5, delta=0.15, mode="nearest", verbose=False):
if preprocess:
page = cv2.cvtColor(page, cv2.COLOR_BGR2GRAY)
page = cv2.fastNlMeansDenoising(page, h=3)
w, h = page.shape
def find_score(arr, angle):
@ -73,4 +74,4 @@ def deskew_histbased(page: np.array, max_abs_angle=1.5, delta=0.15, mode="neares
print("Skew angle from pixel histogram: {}".format(best_angle))
rotated = rotate(page, best_angle, reshape=False, order=0, mode=mode)
return rotated
return rotated, best_angle