From 4b15d2c2ca58598563cad9f22706b3c05aeec808 Mon Sep 17 00:00:00 2001 From: Julius Unverfehrt Date: Wed, 18 Dec 2024 11:27:33 +0100 Subject: [PATCH] fix: RED-10686: set minimum permissible value for logos Reference the Jira ticket for more information. This change can introduce unwanted behavior. --- config/settings.toml | 5 ++++- scripts/run_pipeline.py | 2 ++ 2 files changed, 6 insertions(+), 1 deletion(-) diff --git a/config/settings.toml b/config/settings.toml index 40d76a2..a094cc5 100644 --- a/config/settings.toml +++ b/config/settings.toml @@ -4,7 +4,7 @@ level = "INFO" [service] # Print document processing progress to stdout verbose = false -batch_size = 16 +batch_size = 6 image_stiching_tolerance = 1 # in pixels mlflow_run_id = "fabfb1f192c745369b88cab34471aba7" @@ -36,4 +36,7 @@ max = 10 [filters.overrides.signature.image_to_page_quotient] max = 0.4 +[filters.overrides.logo.image_to_page_quotient] +min = 0.06 + diff --git a/scripts/run_pipeline.py b/scripts/run_pipeline.py index 613b49f..cade47b 100644 --- a/scripts/run_pipeline.py +++ b/scripts/run_pipeline.py @@ -10,6 +10,8 @@ from image_prediction.utils.pdf_annotation import annotate_pdf logger = get_logger() +logger.setLevel("DEBUG") + def parse_args(): parser = argparse.ArgumentParser()