add DOCUMENTATION???

What is this? Documentation in Python code? Clearly I am neither a Python programmer nor a signal processing graduate student.
bunnie · Dec 27, 2023 · d27669d · d27669d
1 parent e788bdd
commit d27669d
Show file tree

Hide file tree

Showing 2 changed files with 212 additions and 0 deletions.
diff --git a/stitch.py b/stitch.py
@@ -203,26 +203,41 @@ def load_schema(self, blend=False):
             y -= Schema.Y_RES / 2
 
             if blend:
+                # the mask is 255 where pixels should be copied into the final mosaic canvas. In this case, we
+                # want to overlay the full image every time, so the mask is easy.
                 mask = np.full((img.shape[0], img.shape[1]), 255, dtype=np.uint8)
                 masks += [mask]
+                # The image needs to be RGB 8-bit per channel for the cv2 blending algorithm
                 images += [cv2.cvtColor(img, cv2.COLOR_GRAY2RGB)]
+                # the corner is the top left corner of where the image should go after alignment
                 corners += [(int(x), int(y))]
             else:
                 canvas, mask = safe_image_broadcast(img, canvas, x, y, mask)
 
         if blend:
+            # this computes the full size of the resulting canvas
             dst_sz = cv2.detail.resultRoi(corners=corners, images=images)
+            # set up the blender algorithm. This case uses the Burt & Adelson 1983 multiresolution
+            # spline algorithm (gaussian/laplacian pyramids) with some modern refinements that
+            # haven't been explicitly documented by opencv.
             blender = cv2.detail_MultiBandBlender(try_gpu=1) # GPU is wicked fast - the computation is much faster than reading in the data
+            # I *think* this sets how far the blending seam should go from the edge.
             blend_strength = 5 # default from example program
             blend_width = np.sqrt(dst_sz[2] * dst_sz[3]) * blend_strength / 100
+            # I read "bands" as basically how deep you want the pyramids to go
             blender.setNumBands((np.log(blend_width) / np.log(2.) - 1.).astype(np.int32))
+            # Allocates memory for the final image
             blender.prepare(dst_sz)
 
+            # Feed the images into the blender itself
             logging.info("Blending...")
             for (img, mask, corner) in zip(images, masks, corners):
                 blender.feed(img, mask, corner)
 
+            # Actual computational step
             canvas_rgb, _canvas_mask = blender.blend(None, None)
+            # The result is a signed 16-bit (int16) RGB image: some magic happens to prevent precision loss. This is good.
+            # Re-normalize and convert to gray scale.
             canvas = cv2.normalize(canvas_rgb, None, alpha=0, beta=255, norm_type=cv2.NORM_MINMAX, dtype=cv2.CV_8U)
             # cv2.imshow('blended', canvas)
             canvas = cv2.cvtColor(canvas, cv2.COLOR_RGB2GRAY)

diff --git a/stitch_test.py b/stitch_test.py
@@ -0,0 +1,197 @@
+#! /usr/bin/env python3
+
+import argparse
+from pathlib import Path
+import logging
+import numpy as np
+import math
+import re
+import cv2
+import sys
+
+from math import log2, ceil
+
+def make_gaussian_pyramid(base, levels):
+    """
+    Build a Gaussian pyramid by repeatedly downsampling a copy of `base`.
+
+    :param base: source image; it is copied, so the caller's array is not modified
+    :param levels: number of cv2.pyrDown steps to apply
+    :return: list of `levels + 1` images, full resolution first
+    """
+    layers = [base.copy()]
+    for _ in range(levels):
+        # every new level is derived from the most recently produced one
+        layers.append(cv2.pyrDown(layers[-1]))
+    return layers
+
+def make_laplacian_from_gaussian(gaussian):
+    """
+    Derive a Laplacian pyramid from a Gaussian pyramid.
+
+    :param gaussian: list of images ordered from full resolution to coarsest
+    :return: list ordered coarsest first: the coarsest Gaussian level itself, followed by
+             the difference images (finer level minus upsampled coarser level) of
+             increasing resolution
+    """
+    laplacian = [gaussian[-1]]
+    for level in range(len(gaussian) - 1, 0, -1):
+        finer = gaussian[level - 1]
+        # pyrUp defaults to exactly twice the input size, but pyrDown rounds odd dimensions
+        # up, so an odd-sized level would come back one pixel too large and cv2.subtract
+        # would reject the mismatched shapes. Ask explicitly for the finer level's size.
+        height, width = finer.shape[:2]
+        expanded = cv2.pyrUp(gaussian[level], dstsize=(width, height))
+        # NOTE: cv2.subtract saturates, so with unsigned inputs negative differences clip to 0
+        laplacian.append(cv2.subtract(finer, expanded))
+    return laplacian
+
+def square_image(img, pad=0):
+    """
+    Center an image on a square canvas whose side is the next power of 2.
+
+    :param img: image of shape (H, W) or (H, W, C)
+    :param pad: fill value for the canvas area not covered by the image
+    :return: tuple of (uint8 square canvas, (x_offset, y_offset) of the pasted image's top left corner)
+    :raises ValueError: if the image has no pixels
+    """
+    height, width = img.shape[:2]
+    longest = max(height, width)
+    if longest == 0:
+        # log2(0) would fail with an opaque "math domain error"
+        raise ValueError("cannot square an empty image")
+    # square up to the nearest power of 2 that fits the longer side
+    side = 2**ceil(log2(longest))
+    # keep any trailing channel axis so color images fit as well as grayscale ones
+    sq_canvas = np.full((side, side) + tuple(img.shape[2:]), pad, dtype=np.uint8)
+
+    # position that puts the image in the center of the square canvas
+    x_offset = (side - width) // 2
+    y_offset = (side - height) // 2
+    sq_canvas[y_offset:y_offset + height, x_offset:x_offset + width] = img
+    return sq_canvas, (x_offset, y_offset)
+
+def composite_gaussian_pyramid(pyramid):
+    """
+    Lay out a Gaussian pyramid as one image for display.
+
+    Level 0 goes on the left; the remaining levels are stacked top to bottom in a
+    column immediately to its right.
+
+    :param pyramid: list of 2-D images, full resolution first (needs at least two levels)
+    :return: uint8 composite image, zero wherever no level is drawn
+    """
+    base = pyramid[0]
+    smaller = pyramid[1:]
+    base_h, base_w = base.shape
+
+    # tall enough for the base or the stacked column, whichever is taller;
+    # wide enough for the base plus the widest stacked level (the first one)
+    total_h = max(base_h, sum(level.shape[0] for level in smaller))
+    total_w = base_w + pyramid[1].shape[1]
+    sheet = np.zeros((total_h, total_w), dtype=np.uint8)
+
+    sheet[:base_h, :base_w] = base
+
+    top = 0
+    for level in smaller:
+        level_h, level_w = level.shape[:2]
+        sheet[top:top + level_h, base_w:base_w + level_w] = level
+        top += level_h
+
+    return sheet
+
+def composite_laplacian_pyramid(pyramid):
+    """
+    Lay out a Laplacian pyramid as one image for display.
+
+    The last (full resolution) entry goes on the left; the other entries are stacked
+    in a column to its right, walking the list backwards.
+
+    :param pyramid: list of 2-D images, coarsest first (needs at least two levels)
+    :return: uint8 composite image, zero wherever no level is drawn
+    """
+    full = pyramid[-1]
+    rest = pyramid[:-1]
+    full_h, full_w = full.shape
+
+    column_h = sum(layer.shape[0] for layer in rest)
+    out_shape = (max(full_h, column_h), full_w + pyramid[-2].shape[1])
+    out = np.zeros(out_shape, dtype=np.uint8)
+
+    # full resolution level on the left
+    out[:full_h, :full_w] = full
+
+    # remaining levels, largest first, down the right-hand column
+    row = 0
+    for layer in rest[::-1]:
+        layer_h, layer_w = layer.shape[:2]
+        out[row:row + layer_h, full_w:full_w + layer_w] = layer
+        row += layer_h
+
+    return out
+
+
+# https://stackoverflow.com/questions/43391205/add-padding-to-images-to-get-them-into-the-same-shape
+def pad_images_to_same_size(images):
+    """
+    Pad every image with a zero-valued border so that all of them share one size.
+
+    :param images: sequence of images
+    :return: list of images padded to the largest height and the largest width found;
+             each image is centered, with any odd extra pixel going to the bottom/right
+    """
+    sizes = [img.shape[:2] for img in images]
+    height_max = max((h for h, _ in sizes), default=0)
+    width_max = max((w for _, w in sizes), default=0)
+
+    images_padded = []
+    for img, (h, w) in zip(images, sizes):
+        top = (height_max - h) // 2
+        bottom = height_max - h - top
+        left = (width_max - w) // 2
+        right = width_max - w - left
+        padded = cv2.copyMakeBorder(img, top, bottom, left, right, cv2.BORDER_CONSTANT, value=0)
+        assert padded.shape[:2] == (height_max, width_max)
+        images_padded.append(padded)
+
+    return images_padded
+
+
+def main():
+    """
+    Blend a set of pre-aligned test tiles and show the result on screen.
+
+    Tiles are PNG files in the current directory named `<name>_<x>_<y>_<index>.png`,
+    where (x, y) is the top left corner of the tile in the mosaic. Files that match the
+    glob but not this pattern, or that cannot be decoded, are skipped with a warning.
+    """
+    parser = argparse.ArgumentParser(description="IRIS Stitching Scripts")
+    parser.add_argument(
+        "--loglevel", required=False, help="set logging level (INFO/DEBUG/WARNING/ERROR)", type=str, default="INFO",
+    )
+    parser.add_argument(
+        "--name", required=False, help="base name", default='test'
+    )
+    parser.add_argument(
+        '--blend_strength', action='store', default=5,
+        help="Blending strength from [0,100] range. The default is 5",
+        type=int, dest='blend_strength'
+    )
+    args = parser.parse_args()
+    numeric_level = getattr(logging, args.loglevel.upper(), None)
+    if not isinstance(numeric_level, int):
+        raise ValueError('Invalid log level: %s' % args.loglevel)
+    logging.basicConfig(level=numeric_level)
+
+    test_path = Path("./")
+
+    db = []
+    # sorted so the tiles are fed in a reproducible order; glob order is arbitrary
+    for file in sorted(test_path.glob(f'{args.name}*.png')):
+        if not file.is_file():
+            continue
+        try:
+            # split from the right so the base name itself may contain underscores
+            (_root, x, y, index) = file.stem.rsplit('_', 3)
+            x, y, index = int(x), int(y), int(index)
+        except ValueError:
+            logging.warning("Skipping %s: name is not of the form <name>_<x>_<y>_<index>.png", file)
+            continue
+        img = cv2.imread(str(file), cv2.IMREAD_GRAYSCALE)
+        if img is None:
+            # imread signals failure by returning None rather than raising
+            logging.warning("Skipping %s: could not be read as an image", file)
+            continue
+        # The image needs to be RGB 8-bit per channel for the cv2 blending algorithm
+        db += [(cv2.cvtColor(img, cv2.COLOR_GRAY2RGB), x, y, index)]
+
+    if not db:
+        logging.error("No usable tiles found matching %s*.png", args.name)
+        return
+
+    SCALE = 0.5
+
+    corners = []
+    images = []
+    masks = []
+    for (img, x, y, _index) in db:
+        # the corner is the top left corner of where the image should go after alignment
+        corners += [(x, y)]
+        images += [img]
+        # the mask is 255 where pixels should be copied into the final mosaic canvas
+        masks += [np.full((img.shape[0], img.shape[1]), 255, dtype=np.uint8)]
+
+    # this computes the full size of the resulting canvas
+    dst_sz = cv2.detail.resultRoi(corners=corners, images=images)
+
+    # I *think* this sets how far the blending seam should go from the edge.
+    blend_width = np.sqrt(dst_sz[2] * dst_sz[3]) * args.blend_strength / 100
+    if blend_width < 1:
+        # log2 of a width below 1 is negative (-inf for strength 0), which gives no usable
+        # band count; do what the OpenCV stitching sample does and skip blending entirely.
+        blender = cv2.detail.Blender_createDefault(cv2.detail.Blender_NO)
+    else:
+        # set up the blender algorithm. This case uses the Burt & Adelson 1983 multiresolution
+        # spline algorithm (gaussian/laplacian pyramids) with some modern refinements that
+        # haven't been explicitly documented by opencv.
+        blender = cv2.detail_MultiBandBlender(try_gpu=1)
+        # I read "bands" as basically how deep you want the pyramids to go
+        blender.setNumBands(int(np.log(blend_width) / np.log(2.) - 1.))
+    # Allocates memory for the final image
+    blender.prepare(dst_sz)
+
+    # Feed the images into the blender itself
+    for (img, mask, corner) in zip(images, masks, corners):
+        logging.info("Feeding tile at %s", corner)
+        blender.feed(img, mask, corner)
+
+    # The actual computational step.
+    result, result_mask = blender.blend(None, None)
+
+    # Show results; the blended output is re-normalized to 8 bits for display
+    preview = cv2.normalize(result, None, alpha=0, beta=255, norm_type=cv2.NORM_MINMAX, dtype=cv2.CV_8U)
+    cv2.imshow("blend", cv2.resize(preview, None, None, SCALE, SCALE))
+    cv2.imshow("mask", cv2.resize(result_mask, None, None, SCALE, SCALE))
+    cv2.waitKey()
+
+# Run the blending demo only when executed as a script, not when imported.
+if __name__ == "__main__":
+    main()