Merge in RR/table_parsing from layout_detetciton_happy_little_accident to master
Squashed commit of the following:
commit eb4452c9a488df16085a16eba08b7a182274d331
Author: Julius Unverfehrt <Julius.Unverfehrt@iqser.com>
Date: Fri Feb 4 16:08:12 2022 +0100
Empty line added
commit d2fedf9a2f982af2157a408077654d388ca6cc6d
Author: Julius Unverfehrt <Julius.Unverfehrt@iqser.com>
Date: Fri Feb 4 16:07:20 2022 +0100
Empty line added
commit 638d14a4b6c7b4d34222fd3b4cbb8ce79bb32ef0
Author: Julius Unverfehrt <Julius.Unverfehrt@iqser.com>
Date: Fri Feb 4 16:05:43 2022 +0100
Quickfix typo
commit 0271d2ba2e51227aa53e128bf857394e5b5b2d48
Author: Julius Unverfehrt <Julius.Unverfehrt@iqser.com>
Date: Fri Feb 4 15:57:06 2022 +0100
black
commit c95c4ad3f3d01857e7dd1dde0802ed7f2a5837c1
Author: Julius Unverfehrt <Julius.Unverfehrt@iqser.com>
Date: Fri Feb 4 15:53:42 2022 +0100
Refactored layout_detection prototype
commit 766bd0b916b532885e44a13581f100ffaa39bb55
Author: Julius Unverfehrt <Julius.Unverfehrt@iqser.com>
Date: Fri Feb 4 13:16:36 2022 +0100
reset table_parsing to table parsing functionality, moved layout detection accident to layout_detection
commit 7c8955f56dfae2aef814caf4cbc6e903406994ba
Merge: 9a065a0 af5c6d0
Author: Julius Unverfehrt <Julius.Unverfehrt@iqser.com>
Date: Fri Feb 4 13:11:28 2022 +0100
Merge branch 'master' of ssh://git.iqser.com:2222/rr/table_parsing into layout_detetciton_happy_little_accident
commit 9a065a0e7f62823a3b18e301d12c80b1a74f0b3e
Author: Julius Unverfehrt <Julius.Unverfehrt@iqser.com>
Date: Thu Feb 3 16:45:09 2022 +0100
Made Bob proud
28 lines
862 B
Python
28 lines
862 B
Python
import argparse
|
|
|
|
from table_parsing.table_parsig import annotate_tables_in_pdf
|
|
from box_detection.box_detection import annotate_boxes_in_pdf
|
|
from layout_detection.layout_detection import annotate_layout_in_pdf
|
|
|
|
|
|
def parse_args(argv=None) -> argparse.Namespace:
    """Parse the command-line arguments of the annotation script.

    Args:
        argv: Optional list of argument strings to parse. When ``None``
            (the default) argparse reads the process command line, which
            is what a call without arguments has always done.

    Returns:
        The parsed namespace with three attributes: ``pdf_path`` (str),
        ``page_index`` (int) and ``object`` (one of ``"table"``, ``"box"``
        or ``"layout"``; defaults to ``"table"``).

    Raises:
        SystemExit: Raised by argparse when the arguments are missing or
            invalid (for example a non-integer ``page_index`` or an
            unknown ``--object`` value).
    """
    parser = argparse.ArgumentParser()
    parser.add_argument("pdf_path", help="path of the PDF file to annotate")
    parser.add_argument("page_index", type=int, help="index of the page to annotate")
    parser.add_argument(
        "--object",
        choices=["table", "box", "layout"],
        default="table",
        help="kind of object to annotate (default: table)",
    )
    return parser.parse_args(argv)
|
|
|
|
|
|
if __name__ == "__main__":
    # Script entry point: annotate one page of the given PDF with the kind
    # of object selected through --object.
    args = parse_args()

    # One annotator per --object choice. The parser restricts --object to
    # exactly these three keys, so the lookup below cannot miss.
    annotators = {
        "table": annotate_tables_in_pdf,
        "box": annotate_boxes_in_pdf,
        "layout": annotate_layout_in_pdf,
    }
    annotators[args.object](args.pdf_path, page_index=args.page_index)
|
|
|