-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathstitcher.py
executable file
·336 lines (258 loc) · 13.9 KB
/
stitcher.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
# © 2024 Regents of the University of Minnesota. All rights reserved.
# This program is shared under the terms and conditions of the GNU General Public License 3.0, License. Further details about the GNU GPL 3.0 license are available in the license.txt file
from __future__ import print_function
import numpy as np
import cv2
import os
import platform
import pyopencl as cl
import ctypes
import ctypes.util
# if (ctypes.util.find_library('libvips-42') or ctypes.util.find_library('libvips')):
import pyvips
CONFIG={}
CONFIG['max_features'] = 500
CONFIG['scale_factor'] = 0.25
CONFIG['flann_checks'] = 12
class Stitcher:
maxOffset = 0;
overlap = 0.35;
def __init__(self, overlapValue):
self.overlap = overlapValue
def calculate_offset(self,img1, img2, enableMask):
# Calculate rough overlap in pixels
overlap_px = img2.shape[1] * self.overlap
# Convert images to grayscale and reduce size to scale_factor
i1 = cv2.cvtColor(cv2.resize(img1[:, -int(overlap_px):, :], (0, 0), fx=CONFIG['scale_factor'], fy=CONFIG['scale_factor']), cv2.COLOR_BGR2GRAY)
i2 = cv2.cvtColor(cv2.resize(img2[:, :int(overlap_px), :], (0, 0), fx=CONFIG['scale_factor'], fy=CONFIG['scale_factor']), cv2.COLOR_BGR2GRAY)
if(enableMask):
height, width = i1.shape[:2]
mask = np.zeros(i1.shape[:2], np.uint8)
rounded = round(height/4);
mask[rounded:height-rounded, 0:width] = 255
else:
mask = None;
# Find SIFT keypoints and descriptors
sift = cv2.SIFT_create(nfeatures=CONFIG['max_features'])
self.logMessage('\t- Finding keypoints and descriptors for image 1')
kp1, des1 = sift.detectAndCompute(i1, mask)
self.logMessage('\t- Finding keypoints and descriptors for image 2')
kp2, des2 = sift.detectAndCompute(i2, mask)
# Use FLANN to determine matches
self.logMessage('\t- Finding matches')
# As of 10/11/2016, Flann is broken on binary builds of opencv for windows. Fall back to BF in those cases.
# if(platform.system() != 'Windows'):
flann = cv2.FlannBasedMatcher({'algorithm': 0, 'trees': 5}, {'checks': CONFIG['flann_checks']})
matches = flann.knnMatch(des1, des2, k=2)
# else:
# bfMatch = cv2.BFMatcher(cv2.NORM_L2)
# matches = bfMatch.knnMatch(des1, des2, k=2)
# Limit to reasonable matches
good_matches = [m for m, n in matches if m.distance < 0.7 * n.distance]
src_pts = np.float32([kp1[match.queryIdx].pt for match in good_matches]).reshape(-1, 1, 2)
dst_pts = np.float32([kp2[match.trainIdx].pt for match in good_matches]).reshape(-1, 1, 2)
# We're not doing any robust analyses of outliers, so let's just take the median and see how it works
x_offset = int(np.median([elem[0][0] for elem in np.subtract(src_pts, dst_pts)]))
y_offset = int(np.median([elem[0][1] for elem in np.subtract(src_pts, dst_pts)]))
# Rescale offset for original size and return
self.logMessage('\t- X Offset found: {} px'.format(x_offset * (1/CONFIG['scale_factor'])))
self.logMessage('\t- Y Offset found: {} px'.format(y_offset * (1/CONFIG['scale_factor'])))
return (x_offset * (1/CONFIG['scale_factor']),y_offset * (1/CONFIG['scale_factor']))
def stitch_images(self,img1, img2, enableMask):
# Find the offset between the images and calcuate where the seam lies
x_offset, y_offset = self.calculate_offset(img1, img2, enableMask)
# we want to seam the images such that we crop the left and right equally. So use roughly have the overlap betwen them.
x_seam = int(img1.shape[1] - (img2.shape[1] * self.overlap*.5) + x_offset)
# how much of the new image should we crop out?
partialImage = int(img2.shape[1] * self.overlap*.5);
self.maxOffset = max(self.maxOffset, y_offset);
# Create the composite image and return
width = x_seam + (img2.shape[1]-partialImage)
height = img2.shape[0] + abs(int(self.maxOffset))
if(y_offset < 0.0):
comp_img = np.zeros((height+int(abs(y_offset)), width, 3), np.uint8)
self.maxOffset += int(abs(y_offset))
comp_img[int(abs(y_offset)):img1.shape[0]+int(abs(y_offset)), 0:x_seam] = img1[0:img1.shape[0], 0:x_seam]
comp_img[0:img2.shape[0], x_seam:(x_seam+img2.shape[1]-partialImage)] = img2[0:img2.shape[0], partialImage:img2.shape[1]]
else:
comp_img = np.zeros((height, width, 3), np.uint8)
comp_img[0:img1.shape[0], 0:x_seam] = img1[0:img1.shape[0], 0:x_seam]
comp_img[int(y_offset):img2.shape[0]+int(y_offset), x_seam:(x_seam+img2.shape[1]-partialImage)] = img2[0:img2.shape[0], partialImage:img2.shape[1]]
return comp_img
def logMessage(self, message):
self.logFile.write(message + "\n")
print(message)
def removeVignette(self, img, vignetteMagicNumber):
gray = cv2.cvtColor(img, cv2.COLOR_BGR2GRAY)
# apply the vignette correction algorithm using OpenCL
rows, cols = gray.shape
center = (cols//2, rows//2)
mask = np.zeros(gray.shape, dtype=np.float32)
# define an OpenCL kernel that computes the mask for a given row
mask_kernel = f'''
__kernel void compute_mask(__global float *mask, int rows, int cols, int center_x, int center_y)
\u007b
int row = get_global_id(1);
int col = get_global_id(0);
if (row < rows && col < cols)
mask[row * cols + col] = 1 + {vignetteMagicNumber}*(pow((float)(row - center_y), 2) + pow((float)(col - center_x), 2))/(rows*rows + cols*cols);
\u007d
'''
# create an OpenCL context and queue
platform = cl.get_platforms()
my_gpu_devices = platform[0].get_devices(device_type=cl.device_type.GPU)
ctx = cl.Context(devices=my_gpu_devices)
queue = cl.CommandQueue(ctx)
# create an OpenCL buffer for the mask
mask_buf = cl.Buffer(ctx, cl.mem_flags.WRITE_ONLY, mask.nbytes)
# compile and run the OpenCL kernel
prg = cl.Program(ctx, mask_kernel).build()
prg.compute_mask(queue, (cols, rows), None, mask_buf, np.int32(rows), np.int32(cols), np.int32(center[0]), np.int32(center[1]))
# copy the result from the OpenCL buffer to the NumPy array
cl.enqueue_copy(queue, mask, mask_buf)
corrected = np.clip(img * mask[:,:,np.newaxis], 0, 255)
return np.rint(corrected).astype(np.uint8)
def rotateAndCrop(self, image):
scale_percent = 2.5 # percent of original size
width = int(image.shape[1] * scale_percent / 100)
height = int(image.shape[0] * scale_percent / 100)
dim = (width, height)
# resize image
resized = cv2.resize(image, dim, interpolation = cv2.INTER_AREA)
# write the scaled image to disk
cv2.imwrite('scaled_image.jpg', resized)
# Convert the image to grayscale
gray = cv2.cvtColor(resized, cv2.COLOR_BGR2GRAY)
(thresh, blackAndWhiteImage) = cv2.threshold(gray, 127, 255, cv2.THRESH_BINARY)
# blur the image with a guassian blur
blurred = cv2.GaussianBlur(blackAndWhiteImage, (5, 5), 0)
# Find contours
contours, _ = cv2.findContours(blurred, cv2.RETR_TREE, cv2.CHAIN_APPROX_SIMPLE)
# Find largest contour
max_area = 0
largest_contour = None
for contour in contours:
area = cv2.contourArea(contour)
if area > max_area:
max_area = area
largest_contour = contour
if largest_contour is not None:
# Get moments of the largest contour
M = cv2.moments(largest_contour)
# Get center of mass of the largest contour
cx = int(M["m10"] / M["m00"])
cy = int(M["m01"] / M["m00"])
# Get angle of the largest contour
(x, y), (MA, ma), angle = cv2.fitEllipse(largest_contour)
x = pyvips.Image.new_from_array(image[...,::-1])
x = x.rotate((90-angle), interpolate=pyvips.Interpolate.new("bicubic"))
print(angle)
# get the height of the area that we want to crop by using the inverse sign of the rotation angle and the width of the image
height = int(image.shape[1] * np.abs(np.sin(np.radians(90-angle))))
# crop the height of the image to 2x height center crop
x = x.crop(0, height, x.width, x.height - (height * 2))
# mask = (x.median(3) - [0.0, 0.0, 0.0]).abs() > 10
# columns, rows = mask.project()
# left = columns.profile()[1].min()
# right = columns.width - columns.flip("horizontal").profile()[1].min()
# top = rows.profile()[0].min()
# bottom = rows.height - rows.flip("vertical").profile()[0].min()
# x = x.crop(left, top, right - left, bottom - top)
# find the rectangle which crops all of the black area from the image
result = x.numpy()
return result[...,::-1]
def stitchFileList(self,images, outputPath,scaledPreviewFile, logFile, callback, enableMask, scaleImage, verticalCore, removeVignette, vignetteMagicNumber=1.1, rotateImage = False, cropImage = False):
composite = None;
# Starting from the left, stitch the next image in the sequence to the intermediate file.
self.logFile = open(logFile, 'w');
self.logMessage("Beginning batch processing for: " + outputPath);
self.logMessage("Masking is: " + str(enableMask));
if(scaleImage):
self.logMessage("Scale File Is: " + scaleImage);
firstImage = True;
for i in range(0, len(images) - 1):
if i == 0:
img1 = cv2.imread(images[i])
img2 = cv2.imread(images[i + 1])
if(removeVignette):
img1 = self.removeVignette(img1, vignetteMagicNumber)
img2 = self.removeVignette(img2, vignetteMagicNumber)
if(verticalCore):
img1 = cv2.rotate(img1, cv2.ROTATE_90_COUNTERCLOCKWISE)
img2 = cv2.rotate(img2, cv2.ROTATE_90_COUNTERCLOCKWISE)
else:
img1 = composite
img2 = cv2.imread(images[i + 1])
if(removeVignette):
img2 = self.removeVignette(img2, vignetteMagicNumber)
if(verticalCore):
img2 = cv2.rotate(img2, cv2.ROTATE_90_COUNTERCLOCKWISE)
try:
self.logMessage("Stitching Image {} and {}".format(images[i], images[i + 1]))
composite = self.stitch_images(img1, img2, enableMask)
if(firstImage):
firstImage = False;
if(scaleImage):
img1 = cv2.imread(scaleImage);
h1, w1 = img1.shape[:2]
h2, w2 = composite.shape[:2]
vis = np.zeros((max(h1, h2), w1+w2, 3), np.uint8)
vis[:h1, :w1] = img1
vis[:h2, w1:w1+w2] = composite
composite = vis
self.logMessage("Size of Composite: " + str(composite.shape))
if(callback):
callback(1, round(i / len(images) * 100));
except Exception as e:
print(e)
self.logMessage("Error stitching {} and {}".format(images[i], images[i + 1]))
if(cropImage and not rotateImage):
self.logMessage("Cropping Image")
composite = composite[int(self.maxOffset):(composite.shape[0]-int(self.maxOffset)), 0:composite.shape[1]]
if(rotateImage):
self.logMessage("Rotating Image")
composite = self.rotateAndCrop(composite)
# crop image based on max offset
# scale_percent = 5 # percent of original size
# width = int(composite.shape[1] * scale_percent / 100)
# height = int(composite.shape[0] * scale_percent / 100)
# dim = (width, height)
# # resize image
# resized = cv2.resize(composite, dim, interpolation = cv2.INTER_AREA)
# # Convert the image to grayscale
# gray = cv2.cvtColor(resized, cv2.COLOR_BGR2GRAY)
# (thresh, blackAndWhiteImage) = cv2.threshold(gray, 127, 255, cv2.THRESH_BINARY)
# # Find contours
# contours, _ = cv2.findContours(blackAndWhiteImage, cv2.RETR_TREE, cv2.CHAIN_APPROX_SIMPLE)
# # Find largest contour
# max_area = 0
# largest_contour = None
# for contour in contours:
# area = cv2.contourArea(contour)
# if area > max_area:
# max_area = area
# largest_contour = contour
# #draw the largest contour to screen
# cv2.drawContours(resized, [largest_contour], 0, (0, 255, 0), 3)
# # display on screen
# cv2.imshow('Largest Contour', resized)
self.logMessage("Size of Composite: " + str(composite.shape))
if(composite is not None):
cv2.imwrite(outputPath, composite)
# resize the image to a max 1000pixel wide by 1000pixel high
if composite.shape[0] > 1000 or composite.shape[1] > 1000:
self.logMessage("Writing preview image")
if composite.shape[0] > composite.shape[1]:
scale_percent = 1000 / composite.shape[0] * 100
else:
scale_percent = 1000 / composite.shape[1] * 100
width = int(composite.shape[1] * scale_percent / 100)
height = int(composite.shape[0] * scale_percent / 100)
dim = (width, height)
# resize image
resized = cv2.resize(composite, dim, interpolation = cv2.INTER_AREA)
cv2.imwrite(scaledPreviewFile, resized)
self.logMessage("Finished")
if(callback):
callback(1, 100);
self.logFile.close();