Skip to content


Browse files Browse the repository at this point in the history
what is this. documentation in python code?

clearly I am neither a python programmer nor a signal processing
graduate student.
  • Loading branch information
bunnie committed Dec 27, 2023
1 parent e788bdd commit d27669d
Show file tree
Hide file tree
Showing 2 changed files with 212 additions and 0 deletions.
15 changes: 15 additions & 0 deletions
Original file line number Diff line number Diff line change
Expand Up @@ -203,26 +203,41 @@ def load_schema(self, blend=False):
y -= Schema.Y_RES / 2

if blend:
# the mask is 255 where pixels should be copied into the final mosaic canvas. In this case, we
# want to overlay the full image every time, so the mask is easy.
mask = np.full((img.shape[0], img.shape[1]), 255, dtype=np.uint8)
masks += [mask]
# The image needs to be RGB 8-bit per channel for the cv2 blending algorithm
images += [cv2.cvtColor(img, cv2.COLOR_GRAY2RGB)]
# the corner is the top left corner of where the image should go after alignment
corners += [(int(x), int(y))]
canvas, mask = safe_image_broadcast(img, canvas, x, y, mask)

if blend:
# this computes the full size of the resulting canvas
dst_sz = cv2.detail.resultRoi(corners=corners, images=images)
# set up the blender algorithm. This case uses the Burt & Adelson 1983 multiresolution
# spline algorithm (gaussian/laplacian pyramids) with some modern refinements that
# haven't been explicitly documented by opencv.
blender = cv2.detail_MultiBandBlender(try_gpu=1) # GPU is wicked fast - the computation is much faster than reading in the data
# I *think* this sets how far the blending seam should go from the edge.
blend_strength = 5 # default from example program
blend_width = np.sqrt(dst_sz[2] * dst_sz[3]) * blend_strength / 100
# I read "bands" as basically how deep you want the pyramids to go
blender.setNumBands((np.log(blend_width) / np.log(2.) - 1.).astype(np.int32))
# Allocates memory for the final image

# Feed the images into the blender itself"Blending...")
for (img, mask, corner) in zip(images, masks, corners):
blender.feed(img, mask, corner)

# Actual computational step
canvas_rgb, _canvas_mask = blender.blend(None, None)
# The result is a uint16 RGB image: some magic happens to prevent precision loss. This is good.
# Re-normalize and convert to gray scale.
canvas = cv2.normalize(canvas_rgb, None, alpha=0, beta=255, norm_type=cv2.NORM_MINMAX, dtype=cv2.CV_8U)
# cv2.imshow('blended', canvas)
canvas = cv2.cvtColor(canvas, cv2.COLOR_RGB2GRAY)
Expand Down
197 changes: 197 additions & 0 deletions
Original file line number Diff line number Diff line change
@@ -0,0 +1,197 @@
#! /usr/bin/env python3

import argparse
from pathlib import Path
import logging
import numpy as np
import math
import re
import cv2
import sys

from math import log2, ceil

def make_gaussian_pyramid(base, levels):
    """Build a Gaussian pyramid starting from ``base``.

    The returned list has ``levels + 1`` entries: a copy of ``base`` followed
    by the result of applying ``cv2.pyrDown`` repeatedly, each time to the
    previous entry.
    """
    current = base.copy()
    stack = [current]
    for _ in range(levels):
        current = cv2.pyrDown(current)
        stack.append(current)
    return stack

def make_laplacian_from_gaussian(gaussian):
    """Derive a Laplacian pyramid from a Gaussian pyramid.

    The output starts with the last entry of ``gaussian`` unchanged (the
    coarsest level when the input comes from ``make_gaussian_pyramid``).
    Walking from the end of ``gaussian`` toward its start, each further
    entry is ``gaussian[i - 1]`` minus the ``cv2.pyrUp`` of ``gaussian[i]``.
    """
    laplacian = [gaussian[-1]]
    for level in reversed(range(1, len(gaussian))):
        upsampled = cv2.pyrUp(gaussian[level])
        detail = cv2.subtract(gaussian[level - 1], upsampled)
        laplacian.append(detail)
    return laplacian

def square_image(img, pad=0):
    """Center ``img`` on a square canvas whose side is a power of two.

    The side length is the smallest power of two that is greater than or
    equal to the larger of the image's height and width (i.e. the size is
    rounded *up*, never down).

    :param img: array of shape ``(H, W)`` or ``(H, W, C)``; any axes after
        the first two (e.g. colour channels) are carried over unchanged
    :param pad: fill value for the canvas area not covered by ``img``
    :return: ``(canvas, (x_offset, y_offset))`` where ``canvas`` is a
        ``uint8`` array and the offsets are the column / row at which the
        top-left corner of ``img`` was pasted
    :raises ValueError: if ``img`` has neither rows nor columns
    """
    height, width = img.shape[:2]
    longest = max(height, width)
    if longest < 1:
        raise ValueError("cannot square an empty image")

    # Integer-only "next power of two": exact for every size, no float log.
    side = 1 << (longest - 1).bit_length()

    # Append any trailing axes so multi-channel images can be pasted too.
    canvas_shape = (side, side) + tuple(img.shape[2:])
    sq_canvas = np.full(canvas_shape, pad, dtype=np.uint8)

    # Position that centers the image on the square canvas.
    x_offset = (side - width) // 2
    y_offset = (side - height) // 2

    sq_canvas[y_offset:y_offset + height, x_offset:x_offset + width] = img
    return sq_canvas, (x_offset, y_offset)

def composite_gaussian_pyramid(pyramid):
    """Tile a Gaussian pyramid into a single image for viewing.

    ``pyramid[0]`` is placed at the top-left; every remaining level is
    stacked top to bottom in one column immediately to its right. Areas not
    covered by any level are zero.

    :param pyramid: non-empty list of 2-D arrays; expected largest level
        first (the order ``make_gaussian_pyramid`` produces)
    :return: 2-D composite array
    """
    base = pyramid[0]
    rows, cols = base.shape
    smaller_levels = pyramid[1:]

    # Tall enough for the base image or the stacked column, whichever wins.
    composite_rows = max(rows, sum(p.shape[0] for p in smaller_levels))
    # The side column is as wide as its widest level (zero if there is none,
    # so a single-level pyramid no longer raises IndexError).
    composite_cols = cols + max((p.shape[1] for p in smaller_levels), default=0)
    # NOTE(review): the dtype argument of this call was cut off in the
    # reviewed source; the base level's dtype is used here - confirm.
    composite_image = np.zeros((composite_rows, composite_cols), dtype=base.dtype)

    # store the original to the left
    composite_image[:rows, :cols] = base

    # stack all downsampled images in a column to the right of the original
    i_row = 0
    for p in smaller_levels:
        n_rows, n_cols = p.shape[:2]
        composite_image[i_row:i_row + n_rows, cols:cols + n_cols] = p
        i_row += n_rows

    return composite_image

def composite_laplacian_pyramid(pyramid):
    """Tile a Laplacian pyramid into a single image for viewing.

    ``pyramid[-1]`` is placed at the top-left; the remaining levels are
    visited from the end of the list toward its start and stacked top to
    bottom in one column immediately to the right. Areas not covered by any
    level are zero.

    :param pyramid: non-empty list of 2-D arrays; expected smallest level
        first (the order ``make_laplacian_from_gaussian`` produces)
    :return: 2-D composite array
    """
    base = pyramid[-1]
    rows, cols = base.shape
    smaller_levels = pyramid[:-1]

    # Tall enough for the base image or the stacked column, whichever wins.
    composite_rows = max(rows, sum(p.shape[0] for p in smaller_levels))
    # The side column is as wide as its widest level (zero if there is none,
    # so a single-level pyramid no longer raises IndexError).
    composite_cols = cols + max((p.shape[1] for p in smaller_levels), default=0)
    # NOTE(review): the dtype argument of this call was cut off in the
    # reviewed source; the base level's dtype is used here - confirm.
    composite_image = np.zeros((composite_rows, composite_cols), dtype=base.dtype)

    # store the original to the left
    composite_image[:rows, :cols] = base

    # stack the remaining levels in a column to the right of the original
    i_row = 0
    for p in reversed(smaller_levels):
        n_rows, n_cols = p.shape[:2]
        composite_image[i_row:i_row + n_rows, cols:cols + n_cols] = p
        i_row += n_rows

    return composite_image

def pad_images_to_same_size(images):
    """
    Pad every image with a zero-valued border so they all share one size.

    The target size is the maximum height and the maximum width found among
    ``images``. Padding is split between the two sides of each axis; when
    the amount is odd the extra row/column goes to the bottom/right.

    :param images: sequence of images
    :return: list of images padded so that all images have same width and height (max width and height are used)
    """
    # Materialize once so the input can safely be traversed twice.
    images = list(images)

    width_max = 0
    height_max = 0
    for img in images:
        h, w = img.shape[:2]
        width_max = max(width_max, w)
        height_max = max(height_max, h)

    images_padded = []
    for img in images:
        h, w = img.shape[:2]
        diff_vert = height_max - h
        pad_top = diff_vert // 2
        pad_bottom = diff_vert - pad_top
        diff_hori = width_max - w
        pad_left = diff_hori // 2
        pad_right = diff_hori - pad_left
        img_padded = cv2.copyMakeBorder(
            img, pad_top, pad_bottom, pad_left, pad_right, cv2.BORDER_CONSTANT, value=0
        )
        # Internal sanity check on the padding arithmetic above.
        assert img_padded.shape[:2] == (height_max, width_max)
        # Collect the result; without this the function returned an empty list.
        images_padded.append(img_padded)

    return images_padded

def main():
    """Blend a set of pre-aligned tiles with OpenCV's multi-band blender.

    Tiles are PNG files in the current directory whose stem has the form
    ``<name>_<x>_<y>_<index>``; ``x`` and ``y`` are the integer top-left
    corner at which the tile belongs after alignment. Every tile is fed to
    ``cv2.detail_MultiBandBlender`` with an all-255 mask, and the blended
    image and its mask are shown in windows at half scale.

    Command-line options: ``--loglevel``, ``--name`` (file-name prefix to
    load) and ``--blend_strength``.

    :raises ValueError: if ``--loglevel`` is not a valid logging level name
    """
    parser = argparse.ArgumentParser(description="IRIS Stitching Scripts")
    parser.add_argument(
        "--loglevel", required=False, help="set logging level (INFO/DEBUG/WARNING/ERROR)", type=str, default="INFO",
    )
    parser.add_argument(
        "--name", required=False, help="base name", default='test'
    )
    parser.add_argument(
        '--blend_strength', action='store', default=5,
        help="Blending strength from [0,100] range. The default is 5",
        type=np.int32, dest='blend_strength'
    )
    args = parser.parse_args()
    numeric_level = getattr(logging, args.loglevel.upper(), None)
    if not isinstance(numeric_level, int):
        raise ValueError('Invalid log level: %s' % args.loglevel)
    # NOTE(review): the validated level was never applied in the reviewed
    # source; applying it via basicConfig is a reconstruction - confirm.
    logging.basicConfig(level=numeric_level)

    test_path = Path("./")
    # NOTE(review): the f-string expression was empty in the reviewed source;
    # the --name prefix is assumed to be what selects the tiles - confirm.
    files = [file for file in test_path.glob(f'{args.name}*.png') if file.is_file()]

    db = []
    for file in files:
        # rsplit keeps working when the base name itself contains underscores.
        (_root, x, y, index) = file.stem.rsplit('_', 3)
        # glob() results already include test_path, so use them directly.
        img = cv2.imread(str(file), cv2.IMREAD_GRAYSCALE)
        if img is None:
            # imread signals failure by returning None instead of raising.
            logging.warning("could not read image %s, skipping", file)
            continue
        # The blender needs 8-bit, 3-channel input.
        img = cv2.cvtColor(img, cv2.COLOR_GRAY2RGB)
        db += [(img, int(x), int(y), int(index))]

    if not db:
        logging.error("no tiles matching '%s*.png' found in %s", args.name, test_path.resolve())
        return

    SCALE = 0.5

    corners = []
    images = []
    masks = []
    for (img, x, y, _index) in db:
        # the corner is the top left corner of where the image should go after alignment
        corners += [(x, y)]
        images += [img]
        # the mask is 255 where pixels should be copied into the final mosaic canvas
        masks += [np.full((img.shape[0], img.shape[1]), 255, dtype=np.uint8)]

    # this computes the full size of the resulting canvas
    dst_sz = cv2.detail.resultRoi(corners=corners, images=images)

    # set up the blender algorithm. This case uses the Burt & Adelson 1983 multiresolution
    # spline algorithm (gaussian/laplacian pyramids) with some modern refinements that
    # haven't been explicitly documented by opencv.
    blender = cv2.detail_MultiBandBlender(try_gpu=1)
    # I *think* this sets how far the blending seam should go from the edge.
    blend_width = np.sqrt(dst_sz[2] * dst_sz[3]) * args.blend_strength / 100
    # I read "bands" as basically how deep you want the pyramids to go.
    # A width below 1 would make the log negative or -inf; use 0 bands then.
    if blend_width >= 1:
        num_bands = int((np.log(blend_width) / np.log(2.) - 1.).astype(np.int32))
    else:
        num_bands = 0
    blender.setNumBands(num_bands)
    # Allocates memory for the final image
    # NOTE(review): this call was missing under the comment above in the
    # reviewed source; restored per the OpenCV blender API - confirm.
    blender.prepare(dst_sz)

    # Feed the images into the blender itself
    for (img, mask, corner) in zip(images, masks, corners):
        blender.feed(img, mask, corner)

    # The actual computational step.
    result, result_mask = blender.blend(None, None)

    # Show results
    # NOTE(review): only the resize expressions survived in the reviewed
    # source; the imshow/waitKey calls and window titles are reconstructed.
    result_8u = cv2.normalize(result, None, alpha=0, beta=255, norm_type=cv2.NORM_MINMAX, dtype=cv2.CV_8U)
    cv2.imshow('blended', cv2.resize(result_8u, None, None, SCALE, SCALE))
    cv2.imshow('mask', cv2.resize(result_mask, None, None, SCALE, SCALE))
    cv2.waitKey(0)

# Run the blending demo only when executed as a script, not on import.
if __name__ == "__main__":
    main()

0 comments on commit d27669d

Please sign in to comment.