-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathfilter_to_motion.py
executable file
·285 lines (212 loc) · 8.33 KB
/
filter_to_motion.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
#!python3
# gen-unique-video from video with lots of changeless frames
# My use case - I want to look at my ring videos, but skip the parts where nothing changes.
# When ring creates a motion video, it starts 30s before motion, and often ends with 30s
# no motion. E.g <same-20s>-<motion-20s>-<same-20s>
# So, my goal is trim the video down to <same-2s>-<motion-20s><same-2s>
# Random Libraries
# pose-detectin: https://github.com/CMU-Perceptual-Computing-Lab/openpose
# easier open CV: https://github.com/jrosebr1/imutils
# Sci-Kit Image: https://scikit-image.org/
# Python Motion Detecor: https://www.geeksforgeeks.org/webcam-motion-detector-python/
#######
# Higher level primitive being used - Background substituion
############
# - https://docs.opencv.org/3.4/d1/dc5/tutorial_background_subtraction.html
# TODOs
# There are a few inter frame artifacts to clean up, consider 2 pass
# 1 pass build the masks
# 2 clean up things we can detect inter frame
# E.g. 10s motion -> 2s no_motion -> 10s motion, should assume motion in between
import cv_helper
from icecream import ic
import cv2
import numpy as np
from dataclasses import dataclass
import typer
import os.path
app = typer.Typer()
backSub = cv2.createBackgroundSubtractorMOG2(history=120)
# backSub = cv2.createBackgroundSubtractorKNN()
# Some globals
color_black = 0
color_white = 255
color_grey = 127
fill_rectangle_thickness = -1
@dataclass
class FrameState:
idx: any
last_fg_mask: any
# Input is 20FPS, analyze every 1/2 second
# TBD compute this.
analysis_key_frame_rate = 10
def obsolete_handled_by_bg_remover_remove_ring_timestamp(frame):
max_y, max_x = frame.shape[0], frame.shape[1]
start_point = (0 + int(max_x * 0.7), max_y - 100)
bottom_right = max_x, max_y
end_point = bottom_right
color = (0, 0, 0)
thickness = fill_rectangle_thickness
return cv2.rectangle(frame, start_point, end_point, color, thickness)
def to_black_and_white(frame):
color_threshold = 127
convert_to_color = color_white
# QQ: Is this doing anything if I've already bg subtracted - not so sure!
# I guess I can histogram to find out?
ret, threshed = cv2.threshold(
frame,
color_threshold,
convert_to_color,
cv2.THRESH_BINARY_INV | cv2.THRESH_OTSU,
)
frame = threshed
# findContours needs image to contour to be white, so invert threshold
# Should be able to do in cv2.threshold, but feeling lazy.
return cv2.bitwise_not(frame)
def square_kernel(side):
return np.ones((side, side), np.uint8)
def to_contours(frame):
frame = to_black_and_white(frame)
# Remove artifact noise, 10x10 seems like plenty
frame = cv2.erode(frame, square_kernel(10))
# Without noise, can dialate (fill in) with a decent kernel size.
frame = cv2.dilate(frame, square_kernel(40))
contouring_method = cv2.RETR_EXTERNAL # Only outer edges
# contouring_method = cv2.RETR_CCOMP # 2 level outer, then inner
# contouring_method = cv2.RETR_FLOODFILL # Fill it in
contours, hierachy = cv2.findContours(
frame, contouring_method, cv2.CHAIN_APPROX_NONE
)
# Draw in the found contours
draw_all_counters = -1
contour_color = color_grey # Black
contour_thickness_fill = -1
good_contours = [c for c in contours if cv2.contourArea(c) > 100]
frame = cv2.drawContours(
frame, good_contours, draw_all_counters, contour_color, contour_thickness_fill
)
# Dialate again to try and fill holes
dialate_kernel = square_kernel(200)
frame = cv2.dilate(frame, dialate_kernel)
return frame
def to_motion_mask(frame):
motion_mask = backSub.apply(frame)
motion_mask = to_contours(motion_mask)
return motion_mask
def create_analyze_debug_frame(frame, motion_mask):
masked_input = cv2.bitwise_and(frame, frame, mask=motion_mask)
mask_3c = cv2.cvtColor(motion_mask, cv2.COLOR_GRAY2BGR)
top_row = np.concatenate((frame, mask_3c), axis=1)
bottom_row = np.concatenate((mask_3c, masked_input), axis=1)
merge_image = np.concatenate((top_row, bottom_row), axis=0)
return merge_image
# Gray Scale Frame
def to_grayscale(f):
return cv2.cvtColor(f, cv2.COLOR_BGR2GRAY)
def to_blur(f):
return cv2.blur(f, (20, 20))
def to_motion_mask_fast(state: FrameState, frame):
# Function is fast because analysis is sampled
is_first_frame = state.idx < 2
is_analysis_frame = state.idx % analysis_key_frame_rate == 0
is_do_analyze = is_analysis_frame or is_first_frame
if not is_do_analyze:
return state.last_fg_mask
fast_transforms = [to_grayscale]
for t in fast_transforms:
frame = t(frame)
state.last_fg_mask = to_motion_mask(frame)
return state.last_fg_mask
def shrink_image_half(src):
if not isinstance(src, np.ndarray):
return src
# calculate the 50 percent of original dimensions
scale_percent = 50
width = int(src.shape[1] * scale_percent / 100)
height = int(src.shape[0] * scale_percent / 100)
dsize = (width, height)
return cv2.resize(src, dsize)
def burn_in_debug_info(frame, idx, in_fps):
cv2.rectangle(frame, (0, 0), (650, 70), color_black, fill_rectangle_thickness)
cv2.putText(
frame,
f"{int(idx/in_fps)}:{idx}",
(10, 50),
cv2.FONT_HERSHEY_SIMPLEX,
2,
(255, 255, 255),
2,
)
def is_frame_black(frame):
# Even mostly black images have some noise, set a threshold
percent_image_non_zero_still_black = 0.1
total_pixels = frame.shape[0] * frame.shape[1]
non_zero_pixels_in_black_image = int(
0.01 * percent_image_non_zero_still_black * total_pixels
)
count_non_zero = np.count_nonzero(frame)
return count_non_zero < non_zero_pixels_in_black_image
class remove_background:
def __init__(self, base_filename):
self.base_filename = base_filename
pass
def create(self, input_video):
self.video = input_video
self.state = FrameState(0, 0)
self.in_fps = input_video.get(cv2.CAP_PROP_FPS)
self.debug_window_refresh_rate = int(
self.in_fps / 2
) # every 0.5 seconds; TODO Compute
self.unique_filename = f"{self.base_filename}_unique.mp4"
self.output_unique = cv_helper.LazyVideoWriter(
self.unique_filename, self.in_fps
)
self.mask_filename = f"{self.base_filename}_mask.mp4"
self.output_unique_mask = cv_helper.LazyVideoWriter(
self.mask_filename, self.in_fps
)
self.output_video_files = [self.output_unique, self.output_unique_mask]
def destroy(self):
cv2.destroyAllWindows()
for f in self.output_video_files:
f.release()
def frame(self, idx, original_frame):
self.state.idx = idx
# PERF: Processing at 1/4 size boosts FPS by TK%
in_frame = shrink_image_half(original_frame)
# PERF: Motion Mask sampled frames
motion_mask = to_motion_mask_fast(self.state, in_frame)
# skip frames with no motion
if is_frame_black(motion_mask):
return
# PERF - show_debug_window at on sampled frames
if idx % self.debug_window_refresh_rate == 0:
debug_frame = create_analyze_debug_frame(in_frame, motion_mask)
burn_in_debug_info(debug_frame, idx, self.in_fps)
# cv2.imshow(f"{self.base_filename} Input", shrink_image_half(debug_frame))
# cv2.waitKey(1)
self.output_unique.write(original_frame)
masked_input = cv2.bitwise_and(in_frame, in_frame, mask=motion_mask)
self.output_unique_mask.write(masked_input)
@app.command()
def RemoveBackground(
video_input_file: str = typer.Argument("in.mp4"), force: bool = typer.Option(False)
) -> None:
"""
Remove background from Ring Video
"""
ic(f"Removing Video Background {video_input_file}")
base_filename = video_input_file.split(".")[0]
unique_filename = f"{base_filename}_unique.mp4"
if not force and os.path.exists(unique_filename):
print(f"{unique_filename} exists, skipping")
return
input_video = cv2.VideoCapture(video_input_file)
if not input_video.isOpened():
print(f"Unable to Open {video_input_file}")
return
ic(f"Processing File {video_input_file}")
rb = remove_background(base_filename)
return cv_helper.process_video(input_video, rb)
if __name__ == "__main__":
app()