From 4078b3e4ecdbf5cba7c41c78f6e6a4b9531bde6f Mon Sep 17 00:00:00 2001 From: Matthias Bisping Date: Tue, 26 Apr 2022 14:37:12 +0200 Subject: [PATCH] signatures for services --- doc/signatures.txt | 44 ++++++++++++++++++++++++++++++++++++++++++++ 1 file changed, 44 insertions(+) create mode 100644 doc/signatures.txt diff --git a/doc/signatures.txt b/doc/signatures.txt new file mode 100644 index 0000000..3825ddb --- /dev/null +++ b/doc/signatures.txt @@ -0,0 +1,44 @@ +Processing service interface + +image classification now : JSON (Mdat PDF) -> (Data PDF -> JSON [Mdat ImObj]) +image classification future: JSON [Mdat FunkIm] | Mdat PDF -> (Data [FunkIm] -> JSON [Mdat FunkIm]) +object detection : JSON [Mdat PagIm] | Mdat PDF -> (Data [PagIm] -> JSON [[Mdat SemIm]]) +NER : JSON [Mdat Dict] -> (Data [Dict] -> JSON [Mdat]) +table parsing : JSON [Mdat FunkIm] | Mdat PDF -> (Data [PagIm] -> JSON [[Mdat FunkIm]]) +pdf2image : Mdat (fn, [Int], PDF) -> (JSON ([Int], Data PDF) -> [(FunkIm, Mdat)]) + + +image classification now : Mdat (fn, [Int], file) -> (Data PDF -> JSON [Mdat ImObj]) +image classification future: Mdat (fn, [Int], dir) -> (Data [FunkIm] -> JSON [Mdat FunkIm]) +object detection : Mdat (fn, [Int], dir) -> (Data [PagIm] -> JSON [[Mdat SemIm]]) +table parsing : Mdat (fn, [Int], dir) -> (Data [PagIm] -> JSON [[Mdat FunkIm]]) +NER : Mdat (fn, [Int], file) -> (Data [Dict] -> JSON [Mdat]) +pdf2image : Mdat (fn, [Int], file) -> (JSON ([Int], Data PDF) -> [(FunkIm, Mdat)]) + + +from funcy import identity + +access(mdat): + if mdat.path is file: + request = {"data": load(mdat.path), "metadata": mdat} + elif mdat.path is dir: + get_indexed = identity if not mdat.idx else itemgetter(*mdat.idx) + request = {"data": get_indexed(get_files(mdat.path)), "metadata": mdat} + else: + raise BadRequest + + +storage: + +fileId: { + pages: [PagIm] + images: [FunkIm] + sections: gz +} + + + + + + +