diff --git a/.gitignore b/.gitignore index e399835..a369ba5 100644 --- a/.gitignore +++ b/.gitignore @@ -1,5 +1,6 @@ /results/before/morph_operator_open.png /env/ +/.idea/ /home/lillian/table_parsing/.idea/ /.idea/.gitignore /.idea/misc.xml @@ -8,3 +9,4 @@ /.idea/vcs.xml /pdfs/ /results/ +/.idea/modules.xml diff --git a/table_parsing/table_parsig.py b/table_parsing/table_parsig.py index e90b8b9..d00eafd 100644 --- a/table_parsing/table_parsig.py +++ b/table_parsing/table_parsig.py @@ -41,6 +41,7 @@ def annotate_image(image, stats): return image + def parse_tables_in_pdf(pages): return zip(map(parse, pages), count()) @@ -58,9 +59,3 @@ def annotate_tables_in_pdf(pdf_path, page_index=1): plt.show() -#annotate_tables_in_pdf("/home/lillian/table_parsing/pdfs/pdfs_syngenta/026c917f04660aaea4bb57d180f9598b.pdf", 4) -#annotate_tables_in_pdf("/home/lillian/table_parsing/pdfs/pdfs_syngenta/8dc4a4bf9c439eb402adfa2c53ce5c0c.pdf", 8) -#annotate_tables_in_pdf("/home/lillian/table_parsing/pdfs/pdfs_efsa/Quartz sand_RAR_13_Volume_3CP_Repentol6PA_B2_2021_03_24.pdf", 6) -# annotate_tables_in_pdf("/home/lillian/table_parsing/pdfs/pdfs_efsa/Sulphur_RAR_18_Volume_3CP_SULFUR 80_ WG_B-8_2021-04-09.pdf", 24) -# annotate_tables_in_pdf("/home/lillian/table_parsing/pdfs/pdfs_efsa/Sulphur_RAR_18_Volume_3CP_SULFUR 80_ WG_B-8_2021-04-09.pdf", 5) -annotate_tables_in_pdf("/home/lillian/table_parsing/pdfs/Dokument6.pdf", 0) \ No newline at end of file