chore: formatting and linting

This commit is contained in:
iriley 2024-04-29 12:09:44 +02:00
parent 9e04693ee1
commit 5d13d8b3d0
37 changed files with 260 additions and 254 deletions

View File

@ -1,4 +1,5 @@
# cv-analysis — Visual (CV-Based) Document Parsing
# cv-analysis - Visual (CV-Based) Document Parsing
parse_pdf()
This repository implements computer vision based approaches for detecting and parsing visual features such as tables or
previous redactions in documents.

145
poetry.lock generated
View File

@ -305,19 +305,17 @@ tests = ["mypy (>=0.800)", "pytest", "pytest-asyncio"]
[[package]]
name = "astroid"
version = "2.15.8"
version = "3.1.0"
description = "An abstract syntax tree for Python with inference support."
optional = false
python-versions = ">=3.7.2"
python-versions = ">=3.8.0"
files = [
{file = "astroid-2.15.8-py3-none-any.whl", hash = "sha256:1aa149fc5c6589e3d0ece885b4491acd80af4f087baafa3fb5203b113e68cd3c"},
{file = "astroid-2.15.8.tar.gz", hash = "sha256:6c107453dffee9055899705de3c9ead36e74119cee151e5a9aaf7f0b0e020a6a"},
{file = "astroid-3.1.0-py3-none-any.whl", hash = "sha256:951798f922990137ac090c53af473db7ab4e70c770e6d7fae0cec59f74411819"},
{file = "astroid-3.1.0.tar.gz", hash = "sha256:ac248253bfa4bd924a0de213707e7ebeeb3138abeb48d798784ead1e56d419d4"},
]
[package.dependencies]
lazy-object-proxy = ">=1.4.0"
typing-extensions = {version = ">=4.0.0", markers = "python_version < \"3.11\""}
wrapt = {version = ">=1.11,<2", markers = "python_version < \"3.11\""}
[[package]]
name = "asttokens"
@ -539,13 +537,13 @@ files = [
[[package]]
name = "blinker"
version = "1.7.0"
version = "1.8.1"
description = "Fast, simple object-to-object and broadcast signaling"
optional = false
python-versions = ">=3.8"
files = [
{file = "blinker-1.7.0-py3-none-any.whl", hash = "sha256:c3f865d4d54db7abc53758a01601cf343fe55b84c1de4e3fa910e420b438d5b9"},
{file = "blinker-1.7.0.tar.gz", hash = "sha256:e6820ff6fa4e4d1d8e2747c2283749c3f547e4fee112b98555cdcdae32996182"},
{file = "blinker-1.8.1-py3-none-any.whl", hash = "sha256:5f1cdeff423b77c31b89de0565cd03e5275a03028f44b2b15f912632a58cced6"},
{file = "blinker-1.8.1.tar.gz", hash = "sha256:da44ec748222dcd0105ef975eed946da197d5bdf8bafb6aa92f5bc89da63fa25"},
]
[[package]]
@ -2407,52 +2405,6 @@ sqs = ["boto3 (>=1.26.143)", "pycurl (>=7.43.0.5)", "urllib3 (>=1.26.16)"]
yaml = ["PyYAML (>=3.10)"]
zookeeper = ["kazoo (>=2.8.0)"]
[[package]]
name = "lazy-object-proxy"
version = "1.10.0"
description = "A fast and thorough lazy object proxy."
optional = false
python-versions = ">=3.8"
files = [
{file = "lazy-object-proxy-1.10.0.tar.gz", hash = "sha256:78247b6d45f43a52ef35c25b5581459e85117225408a4128a3daf8bf9648ac69"},
{file = "lazy_object_proxy-1.10.0-cp310-cp310-macosx_10_9_x86_64.whl", hash = "sha256:855e068b0358ab916454464a884779c7ffa312b8925c6f7401e952dcf3b89977"},
{file = "lazy_object_proxy-1.10.0-cp310-cp310-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:7ab7004cf2e59f7c2e4345604a3e6ea0d92ac44e1c2375527d56492014e690c3"},
{file = "lazy_object_proxy-1.10.0-cp310-cp310-manylinux_2_5_x86_64.manylinux1_x86_64.manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:dc0d2fc424e54c70c4bc06787e4072c4f3b1aa2f897dfdc34ce1013cf3ceef05"},
{file = "lazy_object_proxy-1.10.0-cp310-cp310-musllinux_1_1_aarch64.whl", hash = "sha256:e2adb09778797da09d2b5ebdbceebf7dd32e2c96f79da9052b2e87b6ea495895"},
{file = "lazy_object_proxy-1.10.0-cp310-cp310-musllinux_1_1_x86_64.whl", hash = "sha256:b1f711e2c6dcd4edd372cf5dec5c5a30d23bba06ee012093267b3376c079ec83"},
{file = "lazy_object_proxy-1.10.0-cp310-cp310-win32.whl", hash = "sha256:76a095cfe6045c7d0ca77db9934e8f7b71b14645f0094ffcd842349ada5c5fb9"},
{file = "lazy_object_proxy-1.10.0-cp310-cp310-win_amd64.whl", hash = "sha256:b4f87d4ed9064b2628da63830986c3d2dca7501e6018347798313fcf028e2fd4"},
{file = "lazy_object_proxy-1.10.0-cp311-cp311-macosx_10_9_x86_64.whl", hash = "sha256:fec03caabbc6b59ea4a638bee5fce7117be8e99a4103d9d5ad77f15d6f81020c"},
{file = "lazy_object_proxy-1.10.0-cp311-cp311-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:02c83f957782cbbe8136bee26416686a6ae998c7b6191711a04da776dc9e47d4"},
{file = "lazy_object_proxy-1.10.0-cp311-cp311-manylinux_2_5_x86_64.manylinux1_x86_64.manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:009e6bb1f1935a62889ddc8541514b6a9e1fcf302667dcb049a0be5c8f613e56"},
{file = "lazy_object_proxy-1.10.0-cp311-cp311-musllinux_1_1_aarch64.whl", hash = "sha256:75fc59fc450050b1b3c203c35020bc41bd2695ed692a392924c6ce180c6f1dc9"},
{file = "lazy_object_proxy-1.10.0-cp311-cp311-musllinux_1_1_x86_64.whl", hash = "sha256:782e2c9b2aab1708ffb07d4bf377d12901d7a1d99e5e410d648d892f8967ab1f"},
{file = "lazy_object_proxy-1.10.0-cp311-cp311-win32.whl", hash = "sha256:edb45bb8278574710e68a6b021599a10ce730d156e5b254941754a9cc0b17d03"},
{file = "lazy_object_proxy-1.10.0-cp311-cp311-win_amd64.whl", hash = "sha256:e271058822765ad5e3bca7f05f2ace0de58a3f4e62045a8c90a0dfd2f8ad8cc6"},
{file = "lazy_object_proxy-1.10.0-cp312-cp312-macosx_10_9_x86_64.whl", hash = "sha256:e98c8af98d5707dcdecc9ab0863c0ea6e88545d42ca7c3feffb6b4d1e370c7ba"},
{file = "lazy_object_proxy-1.10.0-cp312-cp312-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:952c81d415b9b80ea261d2372d2a4a2332a3890c2b83e0535f263ddfe43f0d43"},
{file = "lazy_object_proxy-1.10.0-cp312-cp312-manylinux_2_5_x86_64.manylinux1_x86_64.manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:80b39d3a151309efc8cc48675918891b865bdf742a8616a337cb0090791a0de9"},
{file = "lazy_object_proxy-1.10.0-cp312-cp312-musllinux_1_1_aarch64.whl", hash = "sha256:e221060b701e2aa2ea991542900dd13907a5c90fa80e199dbf5a03359019e7a3"},
{file = "lazy_object_proxy-1.10.0-cp312-cp312-musllinux_1_1_x86_64.whl", hash = "sha256:92f09ff65ecff3108e56526f9e2481b8116c0b9e1425325e13245abfd79bdb1b"},
{file = "lazy_object_proxy-1.10.0-cp312-cp312-win32.whl", hash = "sha256:3ad54b9ddbe20ae9f7c1b29e52f123120772b06dbb18ec6be9101369d63a4074"},
{file = "lazy_object_proxy-1.10.0-cp312-cp312-win_amd64.whl", hash = "sha256:127a789c75151db6af398b8972178afe6bda7d6f68730c057fbbc2e96b08d282"},
{file = "lazy_object_proxy-1.10.0-cp38-cp38-macosx_10_9_x86_64.whl", hash = "sha256:9e4ed0518a14dd26092614412936920ad081a424bdcb54cc13349a8e2c6d106a"},
{file = "lazy_object_proxy-1.10.0-cp38-cp38-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:5ad9e6ed739285919aa9661a5bbed0aaf410aa60231373c5579c6b4801bd883c"},
{file = "lazy_object_proxy-1.10.0-cp38-cp38-manylinux_2_5_x86_64.manylinux1_x86_64.manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:2fc0a92c02fa1ca1e84fc60fa258458e5bf89d90a1ddaeb8ed9cc3147f417255"},
{file = "lazy_object_proxy-1.10.0-cp38-cp38-musllinux_1_1_aarch64.whl", hash = "sha256:0aefc7591920bbd360d57ea03c995cebc204b424524a5bd78406f6e1b8b2a5d8"},
{file = "lazy_object_proxy-1.10.0-cp38-cp38-musllinux_1_1_x86_64.whl", hash = "sha256:5faf03a7d8942bb4476e3b62fd0f4cf94eaf4618e304a19865abf89a35c0bbee"},
{file = "lazy_object_proxy-1.10.0-cp38-cp38-win32.whl", hash = "sha256:e333e2324307a7b5d86adfa835bb500ee70bfcd1447384a822e96495796b0ca4"},
{file = "lazy_object_proxy-1.10.0-cp38-cp38-win_amd64.whl", hash = "sha256:cb73507defd385b7705c599a94474b1d5222a508e502553ef94114a143ec6696"},
{file = "lazy_object_proxy-1.10.0-cp39-cp39-macosx_10_9_x86_64.whl", hash = "sha256:366c32fe5355ef5fc8a232c5436f4cc66e9d3e8967c01fb2e6302fd6627e3d94"},
{file = "lazy_object_proxy-1.10.0-cp39-cp39-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:2297f08f08a2bb0d32a4265e98a006643cd7233fb7983032bd61ac7a02956b3b"},
{file = "lazy_object_proxy-1.10.0-cp39-cp39-manylinux_2_5_x86_64.manylinux1_x86_64.manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:18dd842b49456aaa9a7cf535b04ca4571a302ff72ed8740d06b5adcd41fe0757"},
{file = "lazy_object_proxy-1.10.0-cp39-cp39-musllinux_1_1_aarch64.whl", hash = "sha256:217138197c170a2a74ca0e05bddcd5f1796c735c37d0eee33e43259b192aa424"},
{file = "lazy_object_proxy-1.10.0-cp39-cp39-musllinux_1_1_x86_64.whl", hash = "sha256:9a3a87cf1e133e5b1994144c12ca4aa3d9698517fe1e2ca82977781b16955658"},
{file = "lazy_object_proxy-1.10.0-cp39-cp39-win32.whl", hash = "sha256:30b339b2a743c5288405aa79a69e706a06e02958eab31859f7f3c04980853b70"},
{file = "lazy_object_proxy-1.10.0-cp39-cp39-win_amd64.whl", hash = "sha256:a899b10e17743683b293a729d3a11f2f399e8a90c73b089e29f5d0fe3509f0dd"},
{file = "lazy_object_proxy-1.10.0-pp310.pp311.pp312.pp38.pp39-none-any.whl", hash = "sha256:80fa48bd89c8f2f456fc0765c11c23bf5af827febacd2f523ca5bc1893fcc09d"},
]
[[package]]
name = "loguru"
version = "0.7.2"
@ -2817,6 +2769,64 @@ files = [
{file = "multidict-6.0.5.tar.gz", hash = "sha256:f7e301075edaf50500f0b341543c41194d8df3ae5caf4702f2095f3ca73dd8da"},
]
[[package]]
name = "mypy"
version = "1.10.0"
description = "Optional static typing for Python"
optional = false
python-versions = ">=3.8"
files = [
{file = "mypy-1.10.0-cp310-cp310-macosx_10_9_x86_64.whl", hash = "sha256:da1cbf08fb3b851ab3b9523a884c232774008267b1f83371ace57f412fe308c2"},
{file = "mypy-1.10.0-cp310-cp310-macosx_11_0_arm64.whl", hash = "sha256:12b6bfc1b1a66095ab413160a6e520e1dc076a28f3e22f7fb25ba3b000b4ef99"},
{file = "mypy-1.10.0-cp310-cp310-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:9e36fb078cce9904c7989b9693e41cb9711e0600139ce3970c6ef814b6ebc2b2"},
{file = "mypy-1.10.0-cp310-cp310-musllinux_1_1_x86_64.whl", hash = "sha256:2b0695d605ddcd3eb2f736cd8b4e388288c21e7de85001e9f85df9187f2b50f9"},
{file = "mypy-1.10.0-cp310-cp310-win_amd64.whl", hash = "sha256:cd777b780312ddb135bceb9bc8722a73ec95e042f911cc279e2ec3c667076051"},
{file = "mypy-1.10.0-cp311-cp311-macosx_10_9_x86_64.whl", hash = "sha256:3be66771aa5c97602f382230165b856c231d1277c511c9a8dd058be4784472e1"},
{file = "mypy-1.10.0-cp311-cp311-macosx_11_0_arm64.whl", hash = "sha256:8b2cbaca148d0754a54d44121b5825ae71868c7592a53b7292eeb0f3fdae95ee"},
{file = "mypy-1.10.0-cp311-cp311-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:1ec404a7cbe9fc0e92cb0e67f55ce0c025014e26d33e54d9e506a0f2d07fe5de"},
{file = "mypy-1.10.0-cp311-cp311-musllinux_1_1_x86_64.whl", hash = "sha256:e22e1527dc3d4aa94311d246b59e47f6455b8729f4968765ac1eacf9a4760bc7"},
{file = "mypy-1.10.0-cp311-cp311-win_amd64.whl", hash = "sha256:a87dbfa85971e8d59c9cc1fcf534efe664d8949e4c0b6b44e8ca548e746a8d53"},
{file = "mypy-1.10.0-cp312-cp312-macosx_10_9_x86_64.whl", hash = "sha256:a781f6ad4bab20eef8b65174a57e5203f4be627b46291f4589879bf4e257b97b"},
{file = "mypy-1.10.0-cp312-cp312-macosx_11_0_arm64.whl", hash = "sha256:b808e12113505b97d9023b0b5e0c0705a90571c6feefc6f215c1df9381256e30"},
{file = "mypy-1.10.0-cp312-cp312-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:8f55583b12156c399dce2df7d16f8a5095291354f1e839c252ec6c0611e86e2e"},
{file = "mypy-1.10.0-cp312-cp312-musllinux_1_1_x86_64.whl", hash = "sha256:4cf18f9d0efa1b16478c4c129eabec36148032575391095f73cae2e722fcf9d5"},
{file = "mypy-1.10.0-cp312-cp312-win_amd64.whl", hash = "sha256:bc6ac273b23c6b82da3bb25f4136c4fd42665f17f2cd850771cb600bdd2ebeda"},
{file = "mypy-1.10.0-cp38-cp38-macosx_10_9_x86_64.whl", hash = "sha256:9fd50226364cd2737351c79807775136b0abe084433b55b2e29181a4c3c878c0"},
{file = "mypy-1.10.0-cp38-cp38-macosx_11_0_arm64.whl", hash = "sha256:f90cff89eea89273727d8783fef5d4a934be2fdca11b47def50cf5d311aff727"},
{file = "mypy-1.10.0-cp38-cp38-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:fcfc70599efde5c67862a07a1aaf50e55bce629ace26bb19dc17cece5dd31ca4"},
{file = "mypy-1.10.0-cp38-cp38-musllinux_1_1_x86_64.whl", hash = "sha256:075cbf81f3e134eadaf247de187bd604748171d6b79736fa9b6c9685b4083061"},
{file = "mypy-1.10.0-cp38-cp38-win_amd64.whl", hash = "sha256:3f298531bca95ff615b6e9f2fc0333aae27fa48052903a0ac90215021cdcfa4f"},
{file = "mypy-1.10.0-cp39-cp39-macosx_10_9_x86_64.whl", hash = "sha256:fa7ef5244615a2523b56c034becde4e9e3f9b034854c93639adb667ec9ec2976"},
{file = "mypy-1.10.0-cp39-cp39-macosx_11_0_arm64.whl", hash = "sha256:3236a4c8f535a0631f85f5fcdffba71c7feeef76a6002fcba7c1a8e57c8be1ec"},
{file = "mypy-1.10.0-cp39-cp39-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:4a2b5cdbb5dd35aa08ea9114436e0d79aceb2f38e32c21684dcf8e24e1e92821"},
{file = "mypy-1.10.0-cp39-cp39-musllinux_1_1_x86_64.whl", hash = "sha256:92f93b21c0fe73dc00abf91022234c79d793318b8a96faac147cd579c1671746"},
{file = "mypy-1.10.0-cp39-cp39-win_amd64.whl", hash = "sha256:28d0e038361b45f099cc086d9dd99c15ff14d0188f44ac883010e172ce86c38a"},
{file = "mypy-1.10.0-py3-none-any.whl", hash = "sha256:f8c083976eb530019175aabadb60921e73b4f45736760826aa1689dda8208aee"},
{file = "mypy-1.10.0.tar.gz", hash = "sha256:3d087fcbec056c4ee34974da493a826ce316947485cef3901f511848e687c131"},
]
[package.dependencies]
mypy-extensions = ">=1.0.0"
tomli = {version = ">=1.1.0", markers = "python_version < \"3.11\""}
typing-extensions = ">=4.1.0"
[package.extras]
dmypy = ["psutil (>=4.0)"]
install-types = ["pip"]
mypyc = ["setuptools (>=50)"]
reports = ["lxml"]
[[package]]
name = "mypy-extensions"
version = "1.0.0"
description = "Type system extensions for programs checked with the mypy type checker."
optional = false
python-versions = ">=3.5"
files = [
{file = "mypy_extensions-1.0.0-py3-none-any.whl", hash = "sha256:4392f6c0eb8a5668a69e23d168ffa70f0be9ccfd32b5cc2d26a34ae5b844552d"},
{file = "mypy_extensions-1.0.0.tar.gz", hash = "sha256:75dbf8955dc00442a438fc4d0666508a9a97b6bd41aa2f0ffe9d2f2725af0782"},
]
[[package]]
name = "nanotime"
version = "0.5.2"
@ -3924,20 +3934,20 @@ tests = ["coverage[toml] (==5.0.4)", "pytest (>=6.0.0,<7.0.0)"]
[[package]]
name = "pylint"
version = "2.17.7"
version = "3.1.0"
description = "python code static checker"
optional = false
python-versions = ">=3.7.2"
python-versions = ">=3.8.0"
files = [
{file = "pylint-2.17.7-py3-none-any.whl", hash = "sha256:27a8d4c7ddc8c2f8c18aa0050148f89ffc09838142193fdbe98f172781a3ff87"},
{file = "pylint-2.17.7.tar.gz", hash = "sha256:f4fcac7ae74cfe36bc8451e931d8438e4a476c20314b1101c458ad0f05191fad"},
{file = "pylint-3.1.0-py3-none-any.whl", hash = "sha256:507a5b60953874766d8a366e8e8c7af63e058b26345cfcb5f91f89d987fd6b74"},
{file = "pylint-3.1.0.tar.gz", hash = "sha256:6a69beb4a6f63debebaab0a3477ecd0f559aa726af4954fc948c51f7a2549e23"},
]
[package.dependencies]
astroid = ">=2.15.8,<=2.17.0-dev0"
astroid = ">=3.1.0,<=3.2.0-dev0"
colorama = {version = ">=0.4.5", markers = "sys_platform == \"win32\""}
dill = {version = ">=0.2", markers = "python_version < \"3.11\""}
isort = ">=4.2.5,<6"
isort = ">=4.2.5,<5.13.0 || >5.13.0,<6"
mccabe = ">=0.6,<0.8"
platformdirs = ">=2.2.0"
tomli = {version = ">=1.1.0", markers = "python_version < \"3.11\""}
@ -4579,6 +4589,17 @@ files = [
docs = ["myst-parser", "pydata-sphinx-theme", "sphinx"]
test = ["argcomplete (>=3.0.3)", "mypy (>=1.7.0)", "pre-commit", "pytest (>=7.0,<8.2)", "pytest-mock", "pytest-mypy-testing"]
[[package]]
name = "types-pillow"
version = "10.2.0.20240423"
description = "Typing stubs for Pillow"
optional = false
python-versions = ">=3.8"
files = [
{file = "types-Pillow-10.2.0.20240423.tar.gz", hash = "sha256:696e68b9b6a58548fc307a8669830469237c5b11809ddf978ac77fafa79251cd"},
{file = "types_Pillow-10.2.0.20240423-py3-none-any.whl", hash = "sha256:bd12923093b96c91d523efcdb66967a307f1a843bcfaf2d5a529146c10a9ced3"},
]
[[package]]
name = "typing-extensions"
version = "4.11.0"
@ -4933,4 +4954,4 @@ testing = ["big-O", "jaraco.functools", "jaraco.itertools", "more-itertools", "p
[metadata]
lock-version = "2.0"
python-versions = ">=3.10,<3.11"
content-hash = "67faa0bb4b0477691c9cbb10f5a9e4a5d30c1bba99802f1059e7be63fe94db7d"
content-hash = "06b9635bd0acdb0cd78ee9ab0e6a8c75ef91648c36bbc1f78ac44a5c0671990b"

View File

@ -30,14 +30,17 @@ kn-utils = { version = "0.2.7", source = "gitlab-research" }
pdf2img = { version = "0.7.0", source = "gitlab-red" }
dvc-azure = "^2.21.2"
pymupdf = "^1.24.1"
types-pillow = "^10.2.0.20240423"
[tool.poetry.group.test.dependencies]
pytest = "^7.0.1"
pylint = "^2.17.4"
pylint = "^3.1"
[tool.poetry.group.dev.dependencies]
ipython = "^8.21.0"
mypy = "^1.10.0"
pylint = "^3.1.0"
[tool.pytest.ini_options]
testpaths = ["test"]
@ -57,6 +60,12 @@ name = "gitlab-red"
url = "https://gitlab.knecon.com/api/v4/groups/12/-/packages/pypi/simple"
priority = "explicit"
[tool.pylint]
max-line-length = 120
docstring-min-length=4
extension-pkg-whitelist = ["cv2"]
extension-pkg-allow-list = ["cv2"]
[build-system]
requires = ["poetry-core"]
build-backend = "poetry.core.masonry.api"

View File

@ -45,6 +45,7 @@ if __name__ == "__main__":
elif args.type == "layout":
from cv_analysis.layout_parsing import parse_layout as analyze
elif args.type == "figure":
from cv_analysis.figure_detection.figure_detection import detect_figures
from cv_analysis.figure_detection.figure_detection import \
detect_figures
analyze = detect_figures
annotate_page(page, analyze, draw, name=name, show=args.show)

View File

@ -1,14 +1,16 @@
import argparse
import timeit
from itertools import starmap
from pathlib import Path
from funcy import lmap
from pdf2img.conversion import convert_pages_to_images
from PIL import Image
from cv_analysis.figure_detection.figure_detection import detect_figures
from cv_analysis.layout_parsing import parse_layout
from cv_analysis.table_parsing import parse_tables
from cv_analysis.utils.draw import draw_rectangles
from funcy import lmap
from itertools import starmap
from pathlib import Path
from pdf2img.conversion import convert_pages_to_images
def parse_args():

View File

@ -1,15 +1,15 @@
import argparse
from dataclasses import dataclass, asdict, field
from dataclasses import asdict, dataclass, field
from operator import truth
from typing import List
import cv2
import numpy as np
from funcy import lfilter, lmap, lflatten
from funcy import lfilter, lflatten, lmap
from pdf2img.conversion import convert_pages_to_images
from cv_analysis.table_parsing import parse_tables
from cv_analysis.utils.display import show_image_mpl
from pdf2img.conversion import convert_pages_to_images
def parse_args():

View File

@ -1,5 +1,5 @@
from pyinfra.k8s_probes import startup
from loguru import logger
from pyinfra.k8s_probes import startup
if __name__ == "__main__":
logger.debug("running health check")

View File

@ -4,10 +4,9 @@ import json
import os
from pathlib import Path
from tqdm import tqdm
from pyinfra.config import get_config
from pyinfra.storage.storage import get_s3_storage
from tqdm import tqdm
CONFIG = get_config()

View File

@ -8,7 +8,7 @@ import numpy as np
from funcy import lmap
from matplotlib import pyplot as plt
from cv_analysis.server.pipeline import make_analysis_pipeline, get_analysis_fn
from cv_analysis.server.pipeline import get_analysis_fn, make_analysis_pipeline
def parse_args():

View File

@ -2,7 +2,6 @@ import argparse
import json
import pika
from pyinfra.config import get_config
from pyinfra.storage.storage import get_s3_storage

View File

@ -1,6 +1,6 @@
from pathlib import Path
from pyinfra.config.loader import load_settings
from pyinfra.config.loader import load_settings # type: ignore
def get_config():

View File

@ -5,11 +5,7 @@ import numpy as np
from cv_analysis.figure_detection.figures import detect_large_coherent_structures
from cv_analysis.figure_detection.text import remove_primary_text_regions
from cv_analysis.utils.filters import (
is_large_enough,
has_acceptable_format,
is_not_too_large,
)
from cv_analysis.utils.filters import has_acceptable_format, is_large_enough, is_not_too_large
from cv_analysis.utils.postprocessing import remove_included
from cv_analysis.utils.structures import Rectangle

View File

@ -1,21 +1,16 @@
import itertools
from itertools import compress
from itertools import starmap
from itertools import compress, starmap
from operator import __and__
import cv2
import numpy as np
from cv_analysis.utils.connect_rects import connect_related_rects2
from cv_analysis.utils.postprocessing import has_no_parent, remove_included, remove_overlapping
from cv_analysis.utils.structures import Rectangle
from cv_analysis.utils.postprocessing import (
remove_overlapping,
remove_included,
has_no_parent,
)
from cv_analysis.utils.visual_logging import vizlogger
# could be a dynamic parameter if the scan is noisy
def is_likely_segment(rect, min_area=100):
return cv2.contourArea(rect, False) > min_area
@ -49,7 +44,6 @@ def fill_in_component_area(image, rect):
return ~image
def parse_layout(image: np.array):
image = image.copy()
image_ = image.copy()

View File

@ -2,9 +2,9 @@ from functools import partial
import cv2
import numpy as np
from iteration_utilities import starfilter, first
from iteration_utilities import first, starfilter
from cv_analysis.utils.filters import is_large_enough, is_filled, is_boxy
from cv_analysis.utils.filters import is_boxy, is_filled, is_large_enough
from cv_analysis.utils.visual_logging import vizlogger

View File

@ -1,6 +1,6 @@
from dataclasses import asdict
from operator import itemgetter, truth
from typing import Generator, Callable
from typing import Callable, Generator
from funcy import flatten, lmap
from pdf2img.conversion import convert_pages_to_images
@ -48,6 +48,7 @@ def make_image_analysis_pipeline(
images, info, page_info = extract_images_from_pdf(pdf_bytes, vlp_output)
# rel_bboxes = map()
img_results = lmap(analysis_fn, images)
def make_offsets():
...

View File

@ -2,12 +2,12 @@ from operator import itemgetter
from pathlib import Path
from typing import Callable, Optional, Tuple
import cv2
import matplotlib.pyplot as plt
import numpy as np
from kn_utils.logging import logger
from cv2 import cv2
from kn_utils.logging import logger # type: ignore
from numpy import ndarray as Array
from scipy.stats import norm
from scipy.stats import norm # type: ignore
def show_multiple(arrs: Tuple[Array], title: str = ""):
@ -70,9 +70,7 @@ def make_gaussian_nonpositive_kernel(kernel_size: int, sd: float) -> Array:
def make_quadratic_kernel(kernel_size: int, ratio: float) -> Array:
kernel_size += int(not kernel_size % 2)
wing_size = int((kernel_size - 1) / 2)
kernel = np.array(
list(map(lambda x: float(-(x**2)), range(-wing_size, wing_size + 1)))
)
kernel = np.array(list(map(lambda x: float(-(x**2)), range(-wing_size, wing_size + 1))))
maxval, minval = np.max(kernel), np.min(kernel)
diff = maxval - minval
kernel += diff / (1 - ratio)
@ -80,17 +78,16 @@ def make_quadratic_kernel(kernel_size: int, ratio: float) -> Array:
return kernel
def min_avg_for_interval(filtered: Array, interval: int) -> float:
def min_avg_for_interval(filtered: Array, interval: int) -> tuple[float, int]:
n = len(filtered)
avgs = [np.mean(filtered[range(start, n, interval)]) for start in range(interval)]
best = min(avgs)
avgs: list[float] = [np.mean(filtered[range(start, n, interval)]) for start in range(interval)]
best: float = min(avgs)
return best, avgs.index(best)
def search_intervals(filtered: Array, min_interval: int, max_interval: int):
performance = [
(interval, *min_avg_for_interval(filtered, interval))
for interval in range(min_interval, max_interval + 1)
(interval, *min_avg_for_interval(filtered, interval)) for interval in range(min_interval, max_interval + 1)
]
best = min(performance, key=lambda x: x[1])
return best[0], best[2]
@ -98,7 +95,7 @@ def search_intervals(filtered: Array, min_interval: int, max_interval: int):
def filter_array(
array: Array,
sum_filter: Array,
sum_filter: Array | None,
padding: Optional[Array] = None,
pad_value_function: Callable[[Array], float] = lambda x: 255.0, # np.mean,
) -> Array:
@ -123,7 +120,7 @@ COL_FILTER2_WIDTH = 70
COL_FILTER2_SD = 12
COL_FILTER3_WIDTH = 200
COL_FILTER3_SD = 20
FILTERS = {
FILTERS: dict[str, dict[int, np.ndarray | None]] = {
"row": {
1: make_gaussian_kernel(ROW_FILTER1_WIDTH, ROW_FILTER1_SD),
2: make_gaussian_kernel(ROW_FILTER2_WIDTH, ROW_FILTER2_SD),
@ -140,20 +137,13 @@ FILTERS = {
def filter_fp_col_lines(line_list: list[int], filt_sums: Array) -> list[int]:
if not line_list:
return []
centers = list(
np.where(
(filt_sums[1:-1] < filt_sums[:-2]) * (filt_sums[1:-1] < filt_sums[2:])
)[0]
+ 1
)
centers = list(np.where((filt_sums[1:-1] < filt_sums[:-2]) * (filt_sums[1:-1] < filt_sums[2:]))[0] + 1)
if line_list[0] > centers[0]:
centers = centers[1:] + [len(filt_sums) - 1]
mindiff = np.std(filt_sums)
line_list = [
maxidx
for maxidx, minidx in zip(line_list, centers)
if (filt_sums[maxidx] - filt_sums[minidx]) > mindiff
maxidx for maxidx, minidx in zip(line_list, centers) if (filt_sums[maxidx] - filt_sums[minidx]) > mindiff
]
return line_list
@ -161,7 +151,6 @@ def filter_fp_col_lines(line_list: list[int], filt_sums: Array) -> list[int]:
def get_lines_either(table_array: Array, horizontal=True) -> Array:
key = "row" if horizontal else "col"
filters = FILTERS
sums = np.mean(table_array, axis=int(horizontal))
threshold = 0.3 * 255 # np.mean(sums) - (1 + 2 * horizontal) * np.std(sums)
predicate = 1000.0 * (sums < threshold)
@ -174,11 +163,7 @@ def get_lines_either(table_array: Array, horizontal=True) -> Array:
filtered_sums = filter_array(filtered_sums, FILTERS[key][3])
lines = list(
np.where(
(filtered_sums[1:-1] > filtered_sums[:-2])
* (filtered_sums[1:-1] > filtered_sums[2:])
)[0]
+ 1
np.where((filtered_sums[1:-1] > filtered_sums[:-2]) * (filtered_sums[1:-1] > filtered_sums[2:]))[0] + 1
)
if not horizontal:
lines = filter_fp_col_lines(lines, filtered_sums)
@ -191,7 +176,7 @@ def img_bytes_to_array(img_bytes: bytes) -> Array:
return img_np
def infer_lines(img: Array) -> dict[str, list[dict[str, int]]]:
def infer_lines(img: Array) -> dict[str, list[dict[str, int]] | list[dict[str, int]]]:
cv2.imwrite("/tmp/table.png", img)
_, img = cv2.threshold(img, 220, 255, cv2.THRESH_BINARY)
cv2.imwrite("/tmp/table_bin.png", img)

View File

@ -1,19 +1,15 @@
import cv2
import numpy as np
from funcy import lfilter, lmap
from cv2 import cv2
from funcy import lfilter, lmap # type: ignore
from cv_analysis.layout_parsing import parse_layout
from cv_analysis.utils.postprocessing import (
remove_isolated,
) # xywh_to_vecs, xywh_to_vec_rect, adjacent1d
from cv_analysis.utils.postprocessing import remove_isolated # xywh_to_vecs, xywh_to_vec_rect, adjacent1d
from cv_analysis.utils.structures import Rectangle
from cv_analysis.utils.visual_logging import vizlogger
def add_external_contours(image, image_h_w_lines_only):
contours, _ = cv2.findContours(
image_h_w_lines_only, cv2.RETR_EXTERNAL, cv2.CHAIN_APPROX_NONE
)
def add_external_contours(image: np.ndarray, image_h_w_lines_only):
contours, _ = cv2.findContours(image_h_w_lines_only, cv2.RETR_EXTERNAL, cv2.CHAIN_APPROX_NONE)
for cnt in contours:
x, y, w, h = cv2.boundingRect(cnt)
cv2.rectangle(image, (x, y), (x + w, y + h), 255, 1)
@ -21,7 +17,7 @@ def add_external_contours(image, image_h_w_lines_only):
return image
def apply_motion_blur(image: np.array, angle, size=80):
def apply_motion_blur(image: np.ndarray, angle, size=80):
"""Solidifies and slightly extends detected lines.
Args:
@ -33,19 +29,19 @@ def apply_motion_blur(image: np.array, angle, size=80):
np.array
"""
k = np.zeros((size, size), dtype=np.float32)
vizlogger.debug(k, "tables08_blur_kernel1.png")
k[(size - 1) // 2, :] = np.ones(size, dtype=np.float32)
vizlogger.debug(k, "tables09_blur_kernel2.png")
k = cv2.warpAffine(
k,
kernel = np.zeros((size, size), dtype=np.float32)
vizlogger.debug(kernel, "tables08_blur_kernel1.png")
kernel[(size - 1) // 2, :] = np.ones(size, dtype=np.float32)
vizlogger.debug(kernel, "tables09_blur_kernel2.png")
new_kernel: np.ndarray = cv2.warpAffine(
kernel,
cv2.getRotationMatrix2D((size / 2 - 0.5, size / 2 - 0.5), angle, 1.0),
(size, size),
)
vizlogger.debug(k, "tables10_blur_kernel3.png")
k = k * (1.0 / np.sum(k))
vizlogger.debug(k, "tables11_blur_kernel4.png")
blurred = cv2.filter2D(image, -1, k)
vizlogger.debug(new_kernel, "tables10_blur_kernel3.png")
new_kernel = new_kernel * (1.0 / np.sum(new_kernel))
vizlogger.debug(new_kernel, "tables11_blur_kernel4.png")
blurred = cv2.filter2D(image, -1, new_kernel)
return blurred
@ -57,7 +53,7 @@ def isolate_vertical_and_horizontal_components(img_bin):
bounding_rects (list): list of layout boxes of the form (x, y, w, h), potentially containing tables
Returns:
np.array
np.ndarray
"""
line_min_width = 48
kernel_h = np.ones((1, line_min_width), np.uint8)
@ -78,16 +74,14 @@ def isolate_vertical_and_horizontal_components(img_bin):
img_bin_extended = img_bin_h | img_bin_v
_, img_bin_extended = cv2.threshold(img_bin_extended, 120, 255, cv2.THRESH_BINARY)
img_bin_final = cv2.dilate(
img_bin_extended, np.ones((1, 1), np.uint8), iterations=1
)
img_bin_final = cv2.dilate(img_bin_extended, np.ones((1, 1), np.uint8), iterations=1)
# add contours before lines are extended by blurring
img_bin_final = add_external_contours(img_bin_final, img_lines_raw)
return img_bin_final
def find_table_layout_boxes(image: np.array):
def find_table_layout_boxes(image: np.ndarray):
def is_large_enough(box):
(_, _, w, h) = box
if w * h >= 100000:
@ -98,29 +92,27 @@ def find_table_layout_boxes(image: np.array):
return lmap(is_large_enough, layout_boxes)
def preprocess(image: np.array):
def preprocess(image: np.ndarray):
image = cv2.cvtColor(image, cv2.COLOR_BGR2GRAY) if len(image.shape) > 2 else image
_, image = cv2.threshold(image, 195, 255, cv2.THRESH_BINARY)
return ~image
def turn_connected_components_into_rects(image: np.array):
def turn_connected_components_into_rects(image: np.ndarray):
def is_large_enough(stat):
x1, y1, w, h, area = stat
return area > 2000 and w > 35 and h > 25
_, _, stats, _ = cv2.connectedComponentsWithStats(
~image, connectivity=8, ltype=cv2.CV_32S
)
_, _, stats_list, _ = cv2.connectedComponentsWithStats(~image, connectivity=8, ltype=cv2.CV_32S)
stats = lfilter(is_large_enough, stats)
if stats:
stats = np.vstack(stats)
rects_list: list[np.ndarray] = lfilter(is_large_enough, stats_list)
if rects_list:
stats: np.ndarray = np.vstack(rects_list)
return stats[:, :-1][2:]
return []
def parse_tables(image: np.array, show=False):
def parse_tables(image: np.ndarray, show=False):
"""Runs the full table parsing process.
Args:
@ -142,7 +134,7 @@ def parse_tables(image: np.array, show=False):
# def make_lines(image: np.array, horizontal=True, kernel_length=40)
def detect_horizontal_lines(image_bin: np.array, kernel_length=40):
def detect_horizontal_lines(image_bin: np.ndarray, kernel_length=40):
line_min_width = 48
kernel_h = np.ones((1, line_min_width), np.uint8)
img_bin_h = cv2.morphologyEx(image_bin, cv2.MORPH_OPEN, kernel_h)
@ -154,7 +146,7 @@ def detect_horizontal_lines(image_bin: np.array, kernel_length=40):
return img_bin_h
def detect_vertical_lines(image_bin: np.array, kernel_length=40):
def detect_vertical_lines(image_bin: np.ndarray, kernel_length=40):
line_min_width = 48
kernel_v = np.ones((line_min_width, 1), np.uint8)
img_bin_v = cv2.morphologyEx(image_bin, cv2.MORPH_OPEN, kernel_v)
@ -166,12 +158,8 @@ def detect_vertical_lines(image_bin: np.array, kernel_length=40):
return img_bin_v
def detect_endpoints(
image: np.array, is_horizontal: bool
) -> list[tuple[int, int, int, int]]:
def are_collinear(
quad1: tuple[int, int, int, int], quad2: tuple[int, int, int, int], index: int
) -> bool:
def detect_endpoints(image: np.ndarray, is_horizontal: bool) -> list[tuple[int, int, int, int]]:
def are_collinear(quad1: tuple[int, int, int, int], quad2: tuple[int, int, int, int], index: int) -> bool:
dist_a = abs(quad1[index] - quad2[index])
dist_b = abs(quad1[index + 2] - quad2[index + 2])
overlap = True if index else (quad1[1] >= quad2[3] or quad1[3] >= quad2[1])
@ -218,7 +206,7 @@ def detect_endpoints(
return corrected
def parse_lines(image: np.array, show=False) -> list[dict[str, list[int]]]:
def parse_lines(image: np.ndarray, show=False) -> list[dict[str, list[int]]]:
image = preprocess(image)
# kernel = cv2.getStructuringElement(cv2.MORPH_ELLIPSE, (2, 2))
# image = cv2.dilate(image, kernel, iterations=4)
@ -228,9 +216,7 @@ def parse_lines(image: np.array, show=False) -> list[dict[str, list[int]]]:
horizontal_endpoints = detect_endpoints(horizontal_line_img, is_horizontal=True)
vertical_endpoints = detect_endpoints(vertical_line_img, is_horizontal=False)
def format_quad(
quad: tuple[int, int, int, int], max_x: int, max_y: int
) -> tuple[int, int, int, int]:
def format_quad(quad: tuple[int, int, int, int], max_x: int, max_y: int) -> tuple[int, int, int, int]:
x1, y1, x2, y2 = quad
if x1 > (x2 + 5):
x1, y1, x2, y2 = x2, y2, x1, y1

View File

@ -8,7 +8,9 @@ from kn_utils.logging import logger
def annotate_pdf(
pdf: Union[str, bytes, Path], annotations, output_path: Union[str, Path] = None
pdf: Union[str, bytes, Path],
annotations,
output_path: Union[str, Path, None] = None,
):
pdf_bytes = provide_byte_stream(pdf)
with fitz.open(stream=pdf_bytes) as pdf_handle:

View File

@ -1,4 +1,4 @@
from itertools import combinations, starmap, product
from itertools import combinations, product, starmap
from typing import Iterable
@ -6,10 +6,14 @@ def is_near_enough(rect_pair, max_gap=14):
x1, y1, w1, h1 = rect_pair[0]
x2, y2, w2, h2 = rect_pair[1]
return any([abs(x1 - (x2 + w2)) <= max_gap,
return any(
[
abs(x1 - (x2 + w2)) <= max_gap,
abs(x2 - (x1 + w1)) <= max_gap,
abs(y2 - (y1 + h1)) <= max_gap,
abs(y1 - (y2 + h2)) <= max_gap])
abs(y1 - (y2 + h2)) <= max_gap,
]
)
def is_overlapping(rect_pair):
@ -23,28 +27,41 @@ def is_overlapping(rect_pair):
def is_on_same_line(rect_pair):
x1, y1, w1, h1 = rect_pair[0]
x2, y2, w2, h2 = rect_pair[1]
return any([any([abs(y1 - y2) <= 10,
abs(y1 + h1 - (y2 + h2)) <= 10]),
any([y2 <= y1 and y1 + h1 <= y2 + h2,
y1 <= y2 and y2 + h2 <= y1 + h1])])
return any(
[
any([abs(y1 - y2) <= 10, abs(y1 + h1 - (y2 + h2)) <= 10]),
any([y2 <= y1 and y1 + h1 <= y2 + h2, y1 <= y2 and y2 + h2 <= y1 + h1]),
]
)
def has_correct_position1(rect_pair):
x1, y1, w1, h1 = rect_pair[0]
x2, y2, w2, h2 = rect_pair[1]
return any([any([abs(x1 - x2) <= 10,
return any(
[
any(
[
abs(x1 - x2) <= 10,
abs(y1 - y2) <= 10,
abs(x1 + w1 - (x2 + w2)) <= 10,
abs(y1 + h1 - (y2 + h2)) <= 10]),
any([y2 <= y1 and y1 + h1 <= y2 + h2,
abs(y1 + h1 - (y2 + h2)) <= 10,
]
),
any(
[
y2 <= y1 and y1 + h1 <= y2 + h2,
y1 <= y2 and y2 + h2 <= y1 + h1,
x2 <= x1 and x1 + w1 <= x2 + w2,
x1 <= x2 and x2 + w2 <= x1 + w1])])
x1 <= x2 and x2 + w2 <= x1 + w1,
]
),
]
)
def is_related(rect_pair):
return (is_near_enough(rect_pair) and has_correct_position1(rect_pair)) or is_overlapping(
rect_pair)
return (is_near_enough(rect_pair) and has_correct_position1(rect_pair)) or is_overlapping(rect_pair)
def fuse_rects(rect1, rect2):

View File

@ -1,10 +1,12 @@
import os
import cv2
from matplotlib import pyplot as plt
if os.environ["USER"] == "isaac":
import matplotlib
matplotlib.use('module://matplotlib-backend-wezterm')
matplotlib.use("module://matplotlib-backend-wezterm")
def show_image_cv2(image, maxdim=700):

View File

@ -4,7 +4,6 @@ from cv_analysis.utils import copy_and_normalize_channels
def draw_contours(image, contours, color=None, annotate=False):
image = copy_and_normalize_channels(image)
for cont in contours:

View File

@ -29,9 +29,7 @@ def transform_image_coordinates_to_pdf_coordinates(
transformation_matrix: fitz.Matrix,
dpi: int = None,
) -> Tuple:
x1, y1, x2, y2 = (
map(lambda x: (x / dpi) * 72, bbox) if dpi else bbox
) # Convert to points, can be done before
x1, y1, x2, y2 = map(lambda x: (x / dpi) * 72, bbox) if dpi else bbox # Convert to points, can be done before
rect = fitz.Rect(x1, y1, x2, y2)
rect = rect * rotation_matrix * transformation_matrix
@ -45,18 +43,12 @@ def rescale_to_pdf(bbox: Iterable[int | float], page_info: PageInfo) -> Iterable
pix_h, pix_w = page_info.image_height, page_info.image_width
ratio_h, ratio_w = pdf_h / pix_h, pdf_w / pix_w
round3 = lambda x: tuple(map(lambda y: round(y, 3), x))
ratio_w, ratio_h, pdf_w, pdf_h, pix_w, pix_h = round3(
(ratio_w, ratio_h, pdf_w, pdf_h, pix_w, pix_h)
)
new_bbox = round3(
(bbox[0] * ratio_w, bbox[1] * ratio_h, bbox[2] * ratio_w, bbox[3] * ratio_h)
)
ratio_w, ratio_h, pdf_w, pdf_h, pix_w, pix_h = round3((ratio_w, ratio_h, pdf_w, pdf_h, pix_w, pix_h))
new_bbox = round3((bbox[0] * ratio_w, bbox[1] * ratio_h, bbox[2] * ratio_w, bbox[3] * ratio_h))
return new_bbox
def transform_table_lines_by_page_info(
bboxes: dict, offsets: tuple, page_info: PageInfo
) -> dict:
def transform_table_lines_by_page_info(bboxes: dict, offsets: tuple, page_info: PageInfo) -> dict:
transform = partial(rescale_to_pdf, page_info=page_info)
logger.debug(f"{offsets=}")
@ -74,9 +66,7 @@ def transform_table_lines_by_page_info(
table_lines = bboxes.get("tableLines", [])
transformed_lines = list(map(convert, table_lines))
bboxes[
"tableLines"
] = transformed_lines # lfilter(lambda b: b['y1']==b['y2'], transformed_lines)
bboxes["tableLines"] = transformed_lines # lfilter(lambda b: b['y1']==b['y2'], transformed_lines)
import json
for i in range(len(table_lines)):
@ -126,11 +116,7 @@ def extract_images_from_pdf(
# current_page_info object to include the derotation_matrix.
rect = rect * page.transformation_matrix * page.rotation_matrix
pixmap = page.get_pixmap(clip=rect, dpi=dpi, colorspace=fitz.csGRAY)
shape = (
(pixmap.h, pixmap.w, pixmap.n)
if pixmap.n > 1
else (pixmap.h, pixmap.w)
)
shape = (pixmap.h, pixmap.w, pixmap.n) if pixmap.n > 1 else (pixmap.h, pixmap.w)
image = np.frombuffer(pixmap.samples, dtype=np.uint8).reshape(*shape)
table_images.append(image)

View File

@ -13,17 +13,11 @@ def open_pdf(pdf, first_page=0, last_page=None):
if pdf.lower().endswith((".png", ".jpg", ".jpeg")):
pages = [Image.open(pdf)]
elif pdf.lower().endswith(".pdf"):
pages = pdf2image.convert_from_path(
pdf, first_page=first_page, last_page=last_page
)
pages = pdf2image.convert_from_path(pdf, first_page=first_page, last_page=last_page)
else:
raise IOError(
"Invalid file extension. Accepted filetypes:\n\t.png\n\t.jpg\n\t.jpeg\n\t.pdf"
)
raise IOError("Invalid file extension. Accepted filetypes:\n\t.png\n\t.jpg\n\t.jpeg\n\t.pdf")
elif type(pdf) == bytes:
pages = pdf2image.convert_from_bytes(
pdf, first_page=first_page, last_page=last_page
)
pages = pdf2image.convert_from_bytes(pdf, first_page=first_page, last_page=last_page)
elif type(pdf) in {list, ndarray}:
return pdf

View File

@ -1,7 +1,8 @@
from collections import namedtuple
from functools import partial
from itertools import starmap, compress
from itertools import compress, starmap
from typing import Iterable, List
from cv_analysis.utils.structures import Rectangle

View File

@ -1,5 +1,5 @@
from numpy import frombuffer, ndarray
import cv2
from numpy import frombuffer, ndarray
def preprocess_page_array(page):
@ -10,7 +10,6 @@ def preprocess_page_array(page):
def page2image(page):
if type(page) == bytes:
page = frombuffer(page)
elif type(page) == ndarray:

View File

@ -1,12 +1,23 @@
from json import dumps
from typing import Iterable
import numpy as np
from funcy import identity
class Rectangle:
def __init__(self, x1=None, y1=None, w=None, h=None, x2=None, y2=None, indent=4, format="xywh", discrete=True):
def __init__(
self,
x1=None,
y1=None,
w=None,
h=None,
x2=None,
y2=None,
indent=4,
format="xywh",
discrete=True,
):
make_discrete = int if discrete else identity
try:
@ -111,7 +122,13 @@ class Rectangle:
@classmethod
def from_dict_xywh(cls, xywh_dict, discrete=True):
return cls(x1=xywh_dict["x"], y1=xywh_dict["y"], w=xywh_dict["width"], h=xywh_dict["height"], discrete=discrete)
return cls(
x1=xywh_dict["x"],
y1=xywh_dict["y"],
w=xywh_dict["width"],
h=xywh_dict["height"],
discrete=discrete,
)
def __str__(self):
return dumps(self.json(), indent=self.indent)

View File

@ -1,5 +1,7 @@
from typing import Iterable
import numpy as np
from cv_analysis.utils.structures import Rectangle
@ -26,7 +28,6 @@ def compute_page_iou(results_boxes: Iterable[Rectangle], ground_truth_boxes: Ite
def compute_document_score(results_dict, annotation_dict):
page_weights = np.array([len(page["cells"]) for page in annotation_dict["pages"]])
page_weights = page_weights / sum(page_weights)

View File

@ -1,9 +1,8 @@
from numpy import generic
import cv2
from numpy import generic
def copy_and_normalize_channels(image):
image = image.copy()
try:
image = cv2.cvtColor(image, cv2.COLOR_GRAY2BGR)

View File

@ -1,4 +1,5 @@
import os
from pyinfra.config.loader import load_settings
from cv_analysis.config import get_config

View File

@ -1,9 +1,9 @@
from sys import stdout
from typing import Union
from kn_utils.logging import logger
from pyinfra.examples import start_standard_queue_consumer
from pyinfra.queue.callback import make_download_process_upload_callback
from kn_utils.logging import logger # type: ignore
from pyinfra.examples import start_standard_queue_consumer # type: ignore
from pyinfra.queue.callback import make_download_process_upload_callback # type: ignore
from cv_analysis.config import get_config
from cv_analysis.server.pipeline import get_analysis_pipeline

View File

@ -5,9 +5,7 @@ import numpy as np
import pytest
from lorem_text import lorem
from cv_analysis.figure_detection.figure_detection import (
detect_figures,
)
from cv_analysis.figure_detection.figure_detection import detect_figures
@pytest.fixture

View File

@ -1,8 +1,8 @@
import gzip
import io
import numpy as np
import cv2
import numpy as np
import pytest
from funcy import first

View File

@ -1,5 +1,6 @@
import json
from os.path import join
from test.fixtures.figure_detection import paste_text
import cv2
import pytest
@ -11,7 +12,6 @@ from cv_analysis.config import get_config
from cv_analysis.locations import REPO_ROOT_PATH, TEST_DATA_DVC
from cv_analysis.utils.draw import draw_rectangles
from cv_analysis.utils.open_pdf import open_pdf
from test.fixtures.figure_detection import paste_text
settings = get_config()

View File

@ -1,10 +1,9 @@
from math import prod
from test.utils.utils import powerset
import cv2
import pytest
from test.utils.utils import powerset
@pytest.mark.parametrize("background_color", [255, 220])
class TestFindPrimaryTextRegions:

View File

@ -1,12 +1,11 @@
from test.utils.utils import powerset
import cv2
import numpy as np
import pytest
from cv_analysis.figure_detection.text import (
remove_primary_text_regions,
apply_threshold_to_image,
)
from test.utils.utils import powerset
from cv_analysis.figure_detection.text import (apply_threshold_to_image,
remove_primary_text_regions)
@pytest.mark.parametrize("error_tolerance", [0.07])

View File

@ -2,11 +2,9 @@ import fitz
import numpy as np
import pytest
from cv_analysis.server.pipeline import (
figure_detection_formatter,
from cv_analysis.server.pipeline import (figure_detection_formatter,
make_analysis_pipeline,
table_parsing_formatter,
)
table_parsing_formatter)
from cv_analysis.utils.structures import Rectangle