2022-02-03 13:32:22 +01:00

56 lines
1.3 KiB
Python

import argparse
import json
from operator import itemgetter
from pathlib import Path

import pdf2image
import requests
from PIL import ImageDraw
def draw_coco_box(draw: "ImageDraw.ImageDraw", bbox, klass):
    """Draw one labelled bounding box on a drawing context.

    Args:
        draw: Drawing context, e.g. the object returned by
            ``ImageDraw.Draw(image)``.
        bbox: Mapping with the keys ``"x1"``, ``"y1"``, ``"x2"`` and ``"y2"``.
            ``(x1, y1)`` and ``(x2, y2)`` are handed to ``draw.rectangle`` as
            the two corners of the box.
        klass: Label written at ``(x1, y1)``. It is converted with ``str`` so
            that non-string labels (for example integer class ids) can be
            rendered as well.

    Raises:
        KeyError: If ``bbox`` lacks one of the four coordinate keys.
    """
    x1, y1, x2, y2 = itemgetter("x1", "y1", "x2", "y2")(bbox)
    draw.rectangle(((x1, y1), (x2, y2)), outline="red")
    # The text call needs a string; coerce so numeric labels do not fail.
    draw.text((x1, y1), text=str(klass), fill=(0, 0, 0, 100))
def draw_coco_boxes(image, bboxes, classes):
    """Draw every (bbox, class) pair onto ``image`` and return that image.

    ``bboxes`` and ``classes`` are walked in lockstep with ``zip``, so pairing
    stops at the end of the shorter of the two. The drawing happens in place
    on ``image``; the same object is returned for convenience.
    """
    canvas = ImageDraw.Draw(image)
    for box_and_label in zip(bboxes, classes):
        draw_coco_box(canvas, *box_and_label)
    return image
def annotate(pdf_path, predictions, output_dir="/tmp/serv_out"):
    """Render a PDF's pages, draw the predicted boxes and save them as PNGs.

    Args:
        pdf_path: Path of the PDF, passed to ``pdf2image.convert_from_path``.
        predictions: Iterable of mappings, each providing ``"page_idx"``
            (index into the rendered pages), ``"bboxes"`` and ``"classes"``.
        output_dir: Directory that receives one ``<page_idx>.png`` per
            prediction entry. It is created (including parents) when it does
            not exist yet. Defaults to ``/tmp/serv_out``.

    Raises:
        KeyError: If a prediction entry lacks one of the three keys.
        IndexError: If ``page_idx`` is outside the range of rendered pages.
    """
    pages = pdf2image.convert_from_path(pdf_path)

    # Saving into a missing directory fails, so make sure it exists first.
    target_dir = Path(output_dir)
    target_dir.mkdir(parents=True, exist_ok=True)

    for prd in predictions:
        page_idx, boxes, classes = itemgetter("page_idx", "bboxes", "classes")(prd)
        page = pages[page_idx]
        image = draw_coco_boxes(page, boxes, classes)
        image.save(target_dir / f"{page_idx}.png")
def parse_args():
    """Parse the command line and return the resulting namespace.

    The only option is the mandatory ``--pdf_path``; its value is available
    as ``pdf_path`` on the returned namespace.
    """
    cli = argparse.ArgumentParser()
    cli.add_argument("--pdf_path", required=True)
    return cli.parse_args()
def main(args):
    """Send the PDF to the local service, print its answer and annotate.

    The file at ``args.pdf_path`` is posted as the request body to
    ``http://127.0.0.1:5000``. The JSON response is pretty-printed to stdout
    and then passed to ``annotate`` together with the same PDF path.

    Args:
        args: Object exposing a ``pdf_path`` attribute (e.g. the namespace
            returned by ``parse_args``).

    Raises:
        requests.HTTPError: If the service answers with an error status.
    """
    # Use a context manager so the file handle is closed once the upload is done.
    with open(args.pdf_path, "rb") as pdf_file:
        response = requests.post("http://127.0.0.1:5000", data=pdf_file)
    response.raise_for_status()
    predictions = response.json()
    print(json.dumps(predictions, indent=2))
    annotate(args.pdf_path, predictions)
if __name__ == "__main__":
    # Script entry point: parse the command line and run the pipeline.
    main(parse_args())