[WIP] Make texture show through page content

2023-01-31 13:53:52 +01:00 · 2023-01-31 13:53:52 +01:00 · 186b4530f0
commit 186b4530f0
parent a1ccda4ea9
2 changed files with 171 additions and 22 deletions
--- a/cv_analysis/utils/conversion.py
+++ b/cv_analysis/utils/conversion.py
@ -40,10 +40,8 @@ class RectangleJSONEncoder(json.JSONEncoder):


 def normalize_image_format_to_array(image: Image_t):
-    return np.array(image) if isinstance(image, Image.Image) else image
+    return np.array(image).astype(np.uint8) if isinstance(image, Image.Image) else image


 def normalize_image_format_to_pil(image: Image_t):
-    if isinstance(image, np.ndarray):
-        return Image.fromarray(image)
-    return image
+    return Image.fromarray(image.astype(np.uint8)) if isinstance(image, np.ndarray) else image
--- a/test/fixtures/page_generation/page.py
+++ b/test/fixtures/page_generation/page.py
@ -3,7 +3,10 @@ import io
 import itertools
 import random
 import string
+import sys
 import textwrap
+from collections import Counter
+from copy import deepcopy
 from enum import Enum
 from functools import lru_cache, partial
 from math import sqrt
@ -31,6 +34,9 @@ from cv_analysis.utils.merging import merge_related_rectangles
 from cv_analysis.utils.postprocessing import remove_overlapping, remove_included
 from cv_analysis.utils.spacial import area

+logger.remove()
+logger.add(sys.stderr, level="INFO")
+
 random_seed = random.randint(0, 2**32 - 1)
 # random_seed = 3896311122
 # random_seed = 1986343479
@ -38,7 +44,7 @@ random_seed = random.randint(0, 2**32 - 1)
 # random_seed = 273244862  # empty large table
 # random_seed = 3717442900
 # random_seed = 2508340737
-random_seed = 2212357755
+# random_seed = 2212357755
 rnd = random.Random(random_seed)
 logger.info(f"Random seed: {random_seed}")

@ -180,6 +186,7 @@ Color = Tuple[int, int, int]
 def base_texture(request, size):
    texture = Image.open(TEST_PAGE_TEXTURES_DIR / (request.param + ".jpg"))
    texture = texture.resize(size)
+    texture.putalpha(255)
    return texture


@ -298,16 +305,22 @@ def overlay(images, mode=np.sum):


@pytest.fixture
-def texture(blank_page, base_texture):
-    texture = superimpose_texture_with_transparency(base_texture, blank_page)
+def texture(tinted_blank_page, base_texture):
+    texture = superimpose_texture_with_transparency(base_texture, tinted_blank_page)
    return texture


+@pytest.fixture
+def tinted_blank_page(size, color, color_intensity):
+    tinted_page = Image.new("RGBA", size, color)
+    tinted_page.putalpha(color_intensity)
+    return tinted_page
+
+
@pytest.fixture
 def blank_page(size, color, color_intensity):
-    color_image = Image.new("RGBA", size, color)
-    color_image.putalpha(color_intensity)
-    return color_image
+    page = Image.new("RGBA", size, color=(255, 255, 255, 0))
+    return page


 def tint_image(src, color="#FFFFFF"):
@ -350,15 +363,40 @@ def size(dpi, orientation):
    return size


-def superimpose_texture_with_transparency(page: Image, texture: Image, autocrop=True) -> Image:
-    """Superimposes a noise image with transparency onto a page image."""
+def superimpose_texture_with_transparency(
+    page: Image,
+    texture: Image,
+    crop_to_content=True,
+    pad=True,
+) -> Image:
+    """Superimposes a noise image with transparency onto a page image.

-    if autocrop:
+    TODO: Rename page and texture to something more generic.
+
+    Args:
+        page: The page image.
+        texture: The texture image.
+        crop_to_content: If True, the texture will be cropped to content (i.e. the bounding box of all non-transparent
+            parts of the texture image).
+        pad: If True, the texture will be padded to the size of the page.
+
+    Returns:
+        Image where the texture is superimposed onto the page.
+    """
+    page = normalize_image_format_to_pil(page)
+    texture = normalize_image_format_to_pil(texture)
+
+    if crop_to_content:
        texture = texture.crop(texture.getbbox())

    if page.size != texture.size:
-        logger.trace(f"Padding image before pasting to fit size {page.size}")
-        texture = pad_image_to_size(texture, page.size)
+        logger.trace(f"Size of page and texture do not match: {page.size} != {texture.size}")
+        if pad:
+            logger.trace(f"Padding texture before pasting to fit size {page.size}")
+            texture = pad_image_to_size(texture, page.size)
+        else:
+            logger.trace(f"Resizing texture before pasting to fit size {page.size}")
+            texture = texture.resize(page.size)

    assert page.size == texture.size
    assert texture.mode == "RGBA"
@ -375,7 +413,11 @@ def pad_image_to_size(image: Image, size: Tuple[int, int]) -> Image:
    if image.size[0] > size[0] or image.size[1] > size[1]:
        raise ValueError(f"Image size {image.size} is larger than target size {size}.")

+    # get average alpha value from image
+    # alpha = int(np.mean(np.array(image.split()[-1]))) or 255
+    # padded = Image.new(image.mode, size, color=(255, 255, 255, alpha))
    padded = Image.new(image.mode, size, color=255)
+
    pasting_coords = compute_pasting_coordinates(image, padded)
    assert image.mode == "RGBA"
    padded.paste(image, pasting_coords)
@ -388,31 +430,134 @@ def compute_pasting_coordinates(smaller: Image, larger: Image.Image):


@pytest.fixture
-def page_with_content(texture, texture_fn) -> np.ndarray:
+def page_with_content(blank_page, tinted_blank_page, texture, texture_fn) -> np.ndarray:
    """Creates a page with content"""
-    page = random_flip(texture)
-    page = texture_fn(page)
    page_partitioner = rnd.choice(
        [
            TwoColumnPagePartitioner(),
            # RandomPagePartitioner(),
        ]
    )
-    boxes = page_partitioner(page)
+
+    ###############################
+    # texture = random_flip(texture)
+    # texture = texture_fn(texture)
+    #
+    # boxes = page_partitioner(texture)
+    # content_generator = ContentGenerator()
+    # boxes = content_generator(boxes)
+    # page = paste_contents(texture, boxes)
+    ###############################
+
+    ################################
+    boxes = page_partitioner(blank_page)
    content_generator = ContentGenerator()
    boxes = content_generator(boxes)
-    page = paste_contents(page, boxes)
+    page_content = paste_contents(blank_page, boxes)
+
+    texture = random_flip(texture)
+    texture = texture_fn(texture)
+
+    page_content = multiply_alpha_where_alpha_channel_is_nonzero(page_content, factor=0.6)
+    page = superimpose_texture_with_transparency(texture, page_content, crop_to_content=False)
+    ################################
+
    draw_boxes(page, boxes)

-    page = np.array(page)
    return page


-def blend(a, b):
+def provide_image_format(required_format):
+    def inner(fn):
+        def inner(image, *args, **kwargs):
+
+            ret = fn(converter(image), *args, **kwargs)
+
+            if get_image_format(image) != required_format:
+                ret = back_converter(ret)
+
+            return ret
+
+        converter = {
+            "array": normalize_image_format_to_array,
+            "pil": normalize_image_format_to_pil,
+        }[required_format]
+
+        back_converter = {
+            "array": normalize_image_format_to_pil,
+            "pil": normalize_image_format_to_array,
+        }[required_format]
+
+        return inner
+
+    return inner
+
+
+@provide_image_format("array")
+def set_alpha_where_color_channels_are_nonzero(image: np.ndarray, alpha: int) -> np.ndarray:
+    """Sets the alpha channel of an image to a given value where the color channels are nonzero."""
+
+    assert image.ndim == 3
+    assert image.shape[-1] == 4
+    assert 0 <= alpha <= 255
+
+    image = image.copy()
+    image[..., -1] = np.where(np.logical_or.reduce(image[..., :-1] > 0, axis=-1), alpha, image[..., -1])
+    return image
+
+
+@provide_image_format("array")
+def multiply_alpha_where_alpha_channel_is_nonzero(image: np.ndarray, factor: float) -> np.ndarray:
+    """Increases the alpha channel of an image where the alpha channel is nonzero."""
+
+    assert image.ndim == 3
+    assert image.shape[-1] == 4
+
+    image = image.copy().astype(np.float32)
+    image[..., -1] = np.where(image[..., -1] > 0, image[..., -1] * factor, image[..., -1])
+    image[..., -1] = np.clip(image[..., -1], 0, 255)
+
+    assert image.max() <= 255
+    assert image.min() >= 0
+    return image
+
+
+@provide_image_format("array")
+def set_alpha_where_alpha_channel_is_nonzero(image: np.ndarray, alpha: int) -> np.ndarray:
+    """Sets the alpha channel of an image to a given value where the alpha channel is nonzero."""
+
+    assert image.ndim == 3
+    assert image.shape[-1] == 4
+    assert 0 <= alpha <= 255
+
+    image = image.copy()
+    image[..., -1] = np.where(image[..., -1] > 0, alpha, image[..., -1])
+    return image
+
+
+def get_image_format(image):
+    if isinstance(image, np.ndarray):
+        return "array"
+    elif isinstance(image, Image.Image):
+        return "pil"
+    else:
+        raise ValueError(f"Unknown image format: {type(image)}")
+
+
+def blend(a: np.ndarray, b: np.ndarray):
    """Reference: https://stackoverflow.com/a/52143032"""
+
+    assert a.max() <= 255
+    assert a.min() >= 0
+
+    assert b.max() <= 255
+    assert b.min() >= 0
+
    a = a.astype(float) / 255
    b = b.astype(float) / 255  # make float on range 0-1

+    print(a.shape, b.shape)
+
    mask = a >= 0.5  # generate boolean mask of everywhere a > 0.5
    ab = np.zeros_like(a)  # generate an output container for the blended image

@ -420,6 +565,11 @@ def blend(a, b):
    ab[~mask] = (2 * a * b)[~mask]  # 2ab everywhere a<0.5
    ab[mask] = (1 - 2 * (1 - a) * (1 - b))[mask]  # else this

+    assert ab.max() <= 1
+    assert ab.min() >= 0
+
+    return (ab * 255).astype(np.uint8)
+

 class ContentRectangle(Rectangle):
    def __init__(self, x1, y1, x2, y2, content=None):
@ -1425,6 +1575,7 @@ def paste_content(page, content_box: ContentRectangle):


 def paste_contents(page, contents: Iterable[ContentRectangle]):
+    page = deepcopy(page)
    for content in contents:
        paste_content(page, content)
    return page