pano360/blend.py at master · Banus/pano360 · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
"""Warps and blend images."""
import os
import heapq

import numpy as np
import scipy.sparse as ssp

try:
    # ~6x faster than scipy
    from pypardiso import spsolve  # type: ignore (pylance bug)
except ImportError:
    from scipy.sparse.linalg import spsolve

import cv2

from stitcher import SphProj
from bundle_adj import intrinsics


# from: https://gist.github.com/royshil/0b21e8e7c6c1f46a16db66c384742b2b
def warp(img, kint, hom=np.eye(3), projector=SphProj.proj2hom):
    """Warp the image in cylindrical/spherical coordinates."""
    hh_, ww_ = img.shape[:2]
    y_i, x_i = np.indices((hh_, ww_))  # pixel coordinates

    # homogeneous coordinates
    xx_ = np.stack([x_i, y_i, np.ones_like(x_i)], axis=-1).reshape(-1, 3)
    xx_ = hom.dot(xx_.T).T
    xx_ = np.linalg.inv(kint).dot(xx_.T).T  # normalize coordinate

    x_n = projector(xx_)

    # project back to image-pixels and pixel coordinates
    x_pr = kint.dot(x_n.reshape(-1, 3).T).T
    x_pr = x_pr[:, :-1] / x_pr[:, [-1]]
    # make sure warp coords only within image bounds
    x_pr[(x_pr[:, 0] < 0) | (x_pr[:, 0] >= ww_) |
         (x_pr[:, 1] < 0) | (x_pr[:, 1] >= hh_)] = -1
    x_pr = x_pr.reshape(hh_, ww_, -1)

    img_rgba = cv2.cvtColor(img, cv2.COLOR_BGR2BGRA)
    # warp the image to cylindrical coords and transparent background
    return cv2.remap(img_rgba, x_pr[:, :, 0].astype(np.float32),
                     x_pr[:, :, 1].astype(np.float32), cv2.INTER_AREA,
                     borderMode=cv2.BORDER_TRANSPARENT)


def alpha_blend(img1, img2, mask=None):
    """Blend using an alpha ramp."""
    if mask is None:
        delta = img1.shape[1]
        mask = np.linspace(1, 0, delta).reshape((1, delta, 1))
    return (img1*mask + img2*(1-mask)).astype("uint8")


def graph_cut(img1, img2, shrink=5):
    # pylint: disable=too-many-locals
    """Blend two images using graph cuts with optional downsampling."""
    dd_ = [[0, 1], [0, -1], [1, 0], [-1, 0]]

    diff = np.max(np.abs(img1 - img2), axis=2)
    if img1.shape[2] == 4:  # borders are low priority
        diff[img1[:, :, 3] == 0], diff[img2[:, :, 3] == 0] = -1, -1
    if shrink > 1:
        # when subsampling, the weakest difference matters
        hh_, ww_ = diff.shape
        hh_, ww_ = hh_ // shrink, ww_ // shrink
        diff = diff[:shrink*hh_, :shrink*ww_]
        diff = np.min(diff.reshape(hh_, shrink, ww_, shrink), axis=(1, 3))

    mask = np.zeros(diff.shape, dtype=np.int32)
    rows, cols = mask.shape[:2]

    qq_, border = [], int(13/shrink) + 1
    mask[:, :border] = -1
    mask[:, -border+1:] = 1

    for yy_ in range(rows):
        qq_ += [(-1e3, -1, border, yy_), (-1e3, 1, cols-border, yy_)]
    heapq.heapify(qq_)

    while True:
        try:
            _, clr, xx_, yy_ = heapq.heappop(qq_)
        except IndexError:
            break

        if mask[yy_, xx_] != 0:
            continue
        mask[yy_, xx_] = clr

        for dx_, dy_ in dd_:
            nx_, ny_ = xx_ + dx_, yy_ + dy_
            if not(0 <= nx_ < cols and 0 <= ny_ < rows):
                continue
            if mask[ny_, nx_] == 0:
                heapq.heappush(qq_, (-diff[ny_, nx_], clr, nx_, ny_))

    mask = cv2.resize((mask == -1).astype("float32"), img1.shape[:2][::-1])
    return (mask[..., None]*255).astype("uint8")


# adapted from: https://docs.opencv.org/3.0-beta/doc/py_tutorials/py_imgproc/
#   py_pyramids/py_pyramids.html
def laplacian_blending(img1, img2, mask=None, n_levels=6):
    """Use a Laplacian pyramid on the images for blending."""
    if mask is None:
        hh_, ww_, cc_ = img1.shape
        mask = np.linspace(1, -1, ww_).reshape((1, ww_, 1))
        mask = 1.0 / (1 + np.exp(-100 * mask))  # sigmoid
        mask = np.tile(mask, (hh_, 1, cc_))

    if mask.shape[2] == 1:
        mask = np.repeat(mask, img1.shape[2], axis=2)

    def _gassian_pyr(img):
        pyr = [img]
        for _ in range(n_levels):
            img = cv2.pyrDown(img)
            pyr.append(img)
        return pyr

    def _laplacian_pyr(img):
        pyr = _gassian_pyr(img)
        lap = [pyr[-1]]
        for idx in range(n_levels, 0, -1):
            im_ = pyr[idx-1]
            lap.append(im_ - cv2.pyrUp(pyr[idx])[:im_.shape[0], :im_.shape[1]])
        return lap

    pyr1 = _laplacian_pyr(img1.astype("float32"))
    pyr2 = _laplacian_pyr(img2.astype("float32"))
    pyrm = _gassian_pyr(mask)[::-1]

    pyrs = [la * gm + lb * (1.0 - gm) for la, lb, gm in zip(pyr1, pyr2, pyrm)]
    blended = pyrs[0]
    for ls_ in pyrs[1:]:
        blended = ls_ + cv2.pyrUp(blended)[:ls_.shape[0], :ls_.shape[1]]

    return np.clip(blended, 0, 255).astype("uint8")


def poisson_matrix(x_max, y_max, positions=None):
    """Create a Poisson matrix with mask positions."""
    n_pix = x_max * y_max
    zeros = np.arange(1, y_max+1) * x_max - 1

    if positions is None:
        diagonals = [np.full(n_pix, 4)] + [-np.ones(n_pix)] * 4
        diagonals[1][zeros] = 0
        diagonals[2][zeros] = 0
        return ssp.spdiags(diagonals, [0, -1, 1, -x_max, x_max], n_pix, n_pix,
                           'csr').tocsc()

    main_diagonal = np.ones(n_pix)
    main_diagonal[positions] = 4
    diagonals = [main_diagonal]
    diagonals_positions = [0]

    # creating the diagonals of the coefficient matrix
    for diagonal_pos in [-1, 1, -x_max, x_max]:
        in_bounds_positions = positions[((positions + diagonal_pos) >= 0) &
                                        ((positions + diagonal_pos) < n_pix)]

        diagonal = np.zeros(n_pix)
        diagonal[in_bounds_positions + diagonal_pos] = -1
        if diagonal_pos in (-1, 1):
            diagonal[zeros] = 0
        diagonals.append(diagonal)
        diagonals_positions.append(diagonal_pos)

    return ssp.spdiags(diagonals, diagonals_positions, n_pix, n_pix, 'csr')


# from: https://github.com/fbessho/PyPoi/blob/master/pypoi/poissonblending.py
def poisson_blend(img_source, img_target, img_mask):
    """Combine images using Poisson editing."""
    x_max, y_max = img_source.shape[1], img_source.shape[0]
    img_mask = img_mask != 0

    # determines the diagonals on the coefficient matrix - flattened
    positions = np.where(img_mask)
    positions = (positions[0] * x_max) + positions[1]

    mat_a = poisson_matrix(x_max, y_max, positions)
    pois = poisson_matrix(x_max, y_max)

    # get positions in mask that should be taken from the target
    positions_from_target = np.where((~img_mask).flatten())[0]

    # for each layer (ex. RGB)
    for num_layer in range(img_target.shape[2]):
        tgt = img_target[..., num_layer].flatten()
        src = img_source[..., num_layer].flatten()

        mat_b = pois * src
        mat_b[positions_from_target] = tgt[positions_from_target]
        sol = spsolve(mat_a, mat_b)

        sol = np.clip(sol.reshape((y_max, x_max)), 0, 255)
        img_target[..., num_layer] = np.array(sol, img_target.dtype)

    return img_target


def main():
    """Script entry point."""
    base_path = "../data/ppwwyyxx/CMU2"
    img1 = cv2.imread(os.path.join(base_path, "medium01.JPG"))
    img2 = cv2.imread(os.path.join(base_path, "medium00.JPG"))

    foc, delta = 3e3, 976

    # intrinsics
    height, width = img1.shape[:2]
    intr = intrinsics(foc, [width/2, height/2])
    img1, img2 = warp(img1, intr), warp(img2, intr)

    mask = graph_cut(img1[:, -delta:], img2[:, :delta])

    overlap = poisson_blend(img1[:, -delta:], img2[:, :delta], mask > 127)
    # overlap = laplacian_blending(
    #     img1[:, -delta:], img2[:, :delta], mask / 255.0)

    blended = np.concatenate(
        [img1[:, :-delta], overlap.astype("uint8"), img2[:, delta:]], axis=1)

    cv2.imshow('blend', blended)

    if cv2.waitKey(0) & 0xff == 27:
        cv2.destroyAllWindows()


if __name__ == '__main__':
    main()