forked from BananaNosh/OpenposeTools
-
Notifications
You must be signed in to change notification settings - Fork 2
/
Visualizer.py
executable file
·330 lines (291 loc) · 15.7 KB
/
Visualizer.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
import cv2
import zipfile
import json
from types import SimpleNamespace as Namespace
import numpy as np
import os
import re
import argparse
import tempfile
import atexit
import sys
from skvideo import io
from moviepy.editor import VideoFileClip, concatenate_videoclips
import enum
import time
import subprocess
class OpenposeOutputFormat(enum.Enum):
COCO = "coco",
BODY_25 = "body_25"
HD_THRESHOLD = 1300
# line thickness for different body parts for Non-HD and HD
ALL_THICKNESS = [[2, 1, 2, 2], [8, 4, 6, 6]]
# PoseConnection and colors can be found here
# https://github.com/CMU-Perceptual-Computing-Lab/openpose/blob/master/include/openpose/pose/poseParametersRender.hpp
# but they have to be corrected at least for B25
# Pose sequence (the connected keypoints) in COCO
POSE_SEQ_COCO = [(1, 2), (1, 5), (2, 3), (3, 4), (5, 6), (6, 7), (1, 8), (8, 9), (9, 10),
(1, 11), (11, 12), (12, 13), (1, 0), (0, 14), (14, 16), (0, 15), (15, 17)]
# Pose colors for COCO
POSE_COLORS_COCO = [[255, 0, 85], [255, 0, 0], [255, 85, 0], [255, 170, 0],
[255, 255, 0], [170, 255, 0], [85, 255, 0], [0, 255, 0],
[0, 255, 85], [0, 255, 170], [0, 255, 255], [0, 170, 255],
[0, 85, 255], [0, 0, 255], [255, 0, 170], [170, 0, 255], [255, 0, 255]]
# Pose sequence (the connected keypoints) in BODY_25
POSE_SEQ_B25 = [(1, 8), (1, 2), (1, 5), (2, 3),
(3, 4), (5, 6), (6, 7), (8, 9),
(9, 10), (10, 11), (8, 12), (12, 13),
(13, 14), (1, 0), (0, 15), (15, 17),
(0, 16), (16, 18), (14, 19), (19, 20),
(14, 21), (11, 22), (22, 23), (11, 24)]
# Pose colors for BODY_25
POSE_COLORS_B25 = [[255, 0, 85], [255, 0, 0], [255, 85, 0], [255, 170, 0],
[255, 255, 0], [170, 255, 0], [85, 255, 0], [0, 255, 0],
[255, 0, 0], [0, 255, 85], [0, 255, 170], [0, 255, 255],
[0, 170, 255], [0, 85, 255], [0, 0, 255], [255, 0, 170],
[170, 0, 255], [255, 0, 255], [85, 0, 255], [0, 0, 255],
[0, 0, 255], [0, 0, 255], [0, 255, 255], [0, 255, 255], [0, 255, 255]]
# Face sequences (the connected keypoints) for the old and the new format
FACE_SEQ = list(zip(range(16), range(1, 17))) + list(zip(range(17, 21), range(18, 22))) \
+ list(zip(range(22, 26), range(23, 27))) + list(zip(range(27, 30), range(28, 31))) \
+ list(zip(range(31, 35), range(32, 36))) + list(zip(range(36, 41), range(37, 42))) \
+ [(41, 36)] + list(zip(range(42, 47), range(43, 48))) + [(47, 42)] \
+ list(zip(range(48, 59), range(49, 60))) + [(59, 48)] \
+ list(zip(range(60, 67), range(61, 68))) + [(67, 60)]
FACE_COLORS = [[255, 255, 255]] * 68
HAND_SEQ = list(zip(range(4), range(1, 5))) + [(0, 5)] + list(zip(range(5, 8), range(6, 9))) + [(0, 9)] \
+ list(zip(range(9, 12), range(10, 13))) + [(0, 13)] + list(zip(range(13, 16), range(14, 17))) \
+ [(0, 17)] + list(zip(range(17, 20), range(18, 21)))
HAND_COLORS = [[100, 100, 100], [100, 0, 0], [150, 0, 0], [200, 0, 0], [255, 0, 0], [100, 100, 0]] \
+ [[150, 150, 0], [200, 200, 0], [255, 255, 0], [0, 100, 50], [0, 150, 75], [0, 200, 100]] \
+ [[0, 255, 125], [0, 50, 100], [0, 75, 150], [0, 100, 200], [0, 125, 255], [100, 0, 100]] \
+ [[150, 0, 150], [200, 0, 200], [255, 0, 255]]
# the combination of all seqs for COCO and BODY_25 format
ALL_SEQS = [[POSE_SEQ_COCO, FACE_SEQ, HAND_SEQ, HAND_SEQ],
[POSE_SEQ_B25, FACE_SEQ, HAND_SEQ, HAND_SEQ]]
ALL_COLORS = [[POSE_COLORS_COCO, FACE_COLORS, HAND_COLORS, HAND_COLORS],
[POSE_COLORS_B25, FACE_COLORS, HAND_COLORS, HAND_COLORS]]
##################################################################################################################
def main():
parser = argparse.ArgumentParser(description='Draw the lines given with the json data on to the given video.')
parser.add_argument("videofile", type=argparse.FileType(mode="r"), help="the video file to write on")
parser.add_argument("json", help="the folder of json files with the data for each frame (might be zipped)")
parser.add_argument("--outfile", help='the output video file (.mp4-format). If not specified, it will only display the video')
parser.add_argument("-oi --out_images", dest="out_images", help='the output folder for the images')
parser.add_argument("-coco", dest="coco_format",
help='add if the COCO openpose format is used instead of body_25', action='store_true')
parser.add_argument("-t --temp", metavar='tempfolder', dest="temp", help="folder for saving the temp files")
parser.add_argument("--maxframes", metavar="maxframes", type=int, default=100,
help="maximal number of frames before splitting the video sequence - default to 100")
parser.add_argument('--noBG', help='Include to show skeleton only.', action='store_true')
parser.add_argument('--noFPS', help='Include to not show the FPS.', action='store_true')
args = parser.parse_args()
video, json_folder, out_video_path, out_images_path, use_coco_format, temp \
= args.videofile.name, args.json, args.outfile, args.out_images, args.coco_format, args.temp
no_bg, no_fps = args.noBG, args.noFPS
if not os.path.exists(json_folder):
print("Json folder not found!")
exit(-1)
if out_video_path:
_, out_extension = os.path.splitext(out_video_path)
if out_extension != ".mp4":
print("So far only .mp4 extension allowed for outfile!")
exit(-1)
out_folder, _ = os.path.split(out_video_path)
os.makedirs(out_folder, exist_ok=True)
if out_images_path is not None:
os.makedirs(out_images_path, exist_ok=True)
if not temp:
temp = tempfile.mkdtemp()
used_format = OpenposeOutputFormat.COCO if use_coco_format else OpenposeOutputFormat.BODY_25
color_video(json_folder, video, out_video_path, temp_folder=temp, out_images=out_images_path,
max_frames=args.maxframes, openpose_format=used_format, no_bg=no_bg, no_fps=no_fps)
import matplotlib.pyplot as plt
import matplotlib.colors as mplcolors
def imshow(img, title='', hsv=False):
if hsv: img = mplcolors.hsv_to_rgb(img)
plt.imshow(img, cmap='Greys_r')
if title or title==0: plt.title(title)
plt.show()
def color_video(frames_json_folder, vid_file, out_file, temp_folder, out_images=None, max_frames=None,
frame_range=None, openpose_format=OpenposeOutputFormat.BODY_25, no_bg=False, no_fps=False):
"""
Create a video from the vid_file with the poses given in the frames_json_folder colored on it
Args:
frames_json_folder(str): path to folder of json files (might me a zip folder)
vid_file(str): path to the video file
out_file(str): filename of the output video
temp_folder(str): path to the temp folder to store videos in in intermediate steps
out_images(str|None): path to folder to store rendered images
max_frames(int): the maximum number of frames before the video is splitted during the process
frame_range(Range): the range of frames which should be used to write the new video
openpose_format(OpenposeOutputFormat): the used output format of openpose
"""
video_capture = cv2.VideoCapture(vid_file)
if out_file:
output_without_ext, output_type = os.path.splitext(out_file)
else:
output_without_ext = os.path.splitext(vid_file)[0]
frame_count = int(video_capture.get(cv2.CAP_PROP_FRAME_COUNT))
fps_string = subprocess.Popen('ffprobe -v 0 -of csv=p=0 -select_streams v:0 -show_entries stream=r_frame_rate'.split(' ')+[vid_file], stdout=subprocess.PIPE, stderr=subprocess.STDOUT).communicate()[0].decode('UTF-8')[:-1]
if fps_string != '0/0':
fps = eval(fps_string)
else:
fps = video_capture.get(cv2.CAP_PROP_FPS)
all_colored_frames = []
colored_frames = []
json_files = get_json_files_from_folder(frames_json_folder)
json_count = len(json_files)
frame_count = min(frame_count, json_count)
splitted = max_frames and max_frames < frame_count
if splitted:
temp_folder = generate_temp_folder(temp_folder)
temp_name = os.path.join(temp_folder, os.path.basename(output_without_ext))
json_files = json_files[:frame_count]
frame_range = frame_range or range(frame_count)
enumerating = zip(frame_range, json_files[frame_range.start:frame_range.stop:frame_range.step])
if frame_range.start > 0:
video_capture.set(cv2.CAP_PROP_POS_FRAMES, frame_range.start)
video_number = None
fps_time = 0
for i, file_name in enumerating:
if i % 10 + 1 == 0:
print("{}/{} frames ready ".format(i, frame_count), end='\r')
sys.stdout.flush()
video_number = (i + 1) // max_frames if max_frames else None
canvas = None
for j in range(frame_range.step):
_, canvas = video_capture.read()
if no_bg:
canvas = np.zeros(canvas.shape, dtype=np.uint8)
elif canvas is None:
print("")
print("No canvas for file: ", file_name)
break
written_canvas = canvas_for_frame(canvas, file_name, frames_json_folder, openpose_format=openpose_format)
canvas = cv2.addWeighted(canvas, 0.1, written_canvas, 0.9, 0)
if (not out_file) and (out_images is None):
time.sleep(max(0, 1/(fps*1.02) - (time.time()-fps_time))) #without the *1.02 it's too slow
if not no_fps:
cv2.putText(canvas, "FPS: %f" % (1.0 / (time.time() - fps_time)), (10, 10), cv2.FONT_HERSHEY_SIMPLEX, 0.5, (0, 255, 0), 2)
# print(f'Pause: {(time.time() - fps_time)*1000}, FPS: {(1.0 / (time.time() - fps_time))}, wished FPS: {fps}')
cv2.imshow('tf-pose-estimation result', canvas)
fps_time = time.time()
if cv2.waitKey(1) == 27:
break
else:
all_colored_frames.append((file_name, canvas))
#imshow(cv2.cvtColor(canvas, cv2.COLOR_BGR2RGB))
colored_frames.append(canvas[:, :, [2, 1, 0]])
if max_frames and (i + 1) % max_frames == 0 and max_frames != frame_count:
colored_frames = np.array(colored_frames)
write_file(colored_frames, fps, output_type, temp_name, video_number)
colored_frames = []
if out_file:
if len(colored_frames) > 0:
colored_frames = np.array(colored_frames)
video_number = video_number + 1 if splitted else None
write_file(colored_frames, fps, output_type, temp_name if splitted else output_without_ext, video_number)
if splitted:
combine_videos(out_file, temp_folder, True)
if out_images is not None:
write_out_images(out_images, all_colored_frames)
else:
cv2.destroyAllWindows()
def write_out_images(out_images_path, all_colored_frames):
for json_name, frame in all_colored_frames:
name, _ = os.path.splitext(json_name)
_, name = os.path.split(name)
name = name if not name.endswith("_keypoints") else name[:-10]
name += "_rendered.png"
path = os.path.join(out_images_path, name)
cv2.imwrite(path, frame)
def get_json_files_from_folder(frames_json_folder):
json_ext = ".json"
_, ext = os.path.splitext(frames_json_folder)
if ext == ".zip":
with zipfile.ZipFile(frames_json_folder) as zip_file:
json_files = [file for file in zip_file.namelist() if file.endswith(json_ext)]
else:
json_files = [file for file in os.listdir(frames_json_folder) if file.endswith(json_ext)]
json_files.sort()
return json_files
def canvas_for_frame(current_canvas, frame_json, frames_json_folder, openpose_format=OpenposeOutputFormat.BODY_25):
def load_json_from_file(json_string):
return json.loads(json_string, object_hook=lambda d: Namespace(**d))
hd = current_canvas.shape[1] > HD_THRESHOLD
_, ext = os.path.splitext(frames_json_folder)
if ext == ".zip":
zip_file = zipfile.ZipFile(frames_json_folder)
with zip_file.open(frame_json, "r") as json_file:
json_obj = load_json_from_file(json_file.read().decode("utf-8"))
else:
with open(os.path.join(frames_json_folder, frame_json), "r", encoding="utf-8") as json_file:
json_obj = load_json_from_file(json_file.read())
canvas_copy = current_canvas.copy()
people = json_obj.people
for person in people:
pose_key_points = np.array(person.pose_keypoints_2d).reshape(-1, 3)
face_key_points = np.array(person.face_keypoints_2d).reshape(-1, 3)
hand_left_key_points = np.array(person.hand_left_keypoints_2d).reshape(-1, 3)
hand_right_key_points = np.array(person.hand_right_keypoints_2d).reshape(-1, 3)
all_key_points = [pose_key_points, face_key_points, hand_left_key_points, hand_right_key_points]
thick = ALL_THICKNESS[0] if not hd else ALL_THICKNESS[1]
format_index = int(openpose_format == OpenposeOutputFormat.BODY_25)
for key_points, seq, colors, thickness in zip(all_key_points,
ALL_SEQS[format_index],
ALL_COLORS[format_index],
thick):
for joints, color in zip(seq, colors):
points = key_points[joints, :]
x = points[:, 0]
y = points[:, 1]
c = points[:, 2]
if any(c < 0.05):
continue
color = [color[2], color[1], color[0]]
cv2.line(canvas_copy, (int(x[0]), int(y[0])), (int(x[1]), int(y[1])), color=color, thickness=thickness)
point_size = thickness + (3 if not hd else 12)
cv2.line(canvas_copy, (int(x[0]), int(y[0])), (int(x[0]), int(y[0])), color=color, thickness=point_size)
current_canvas = cv2.addWeighted(current_canvas, 0.1, canvas_copy, 0.9, 0)
return current_canvas
def generate_temp_folder(temp_folder):
if not os.path.isdir(temp_folder):
os.mkdir(temp_folder)
elif len(os.listdir(temp_folder)) > 0:
temp_folder = tempfile.mkdtemp(dir=temp_folder)
def delete_temp():
if os.path.exists(temp_folder):
remove_all_files_in_folder(temp_folder)
os.rmdir(temp_folder)
atexit.register(delete_temp)
return temp_folder
def remove_all_files_in_folder(folder):
for the_file in os.listdir(folder):
file_path = os.path.join(folder, the_file)
try:
if os.path.isfile(file_path):
os.unlink(file_path)
except Exception as e:
print(e)
def write_file(colored_frames, fps, output_type, output_wihout_ext, video_number):
name = "{}_{}{}".format(output_wihout_ext, video_number, output_type) \
if video_number else "{}{}".format(output_wihout_ext, output_type)
fps_string = "{:.2f}".format(fps)
io.vwrite(name, colored_frames, inputdict={"-framerate": fps_string},
outputdict={"-r": fps_string}) # WRITE VIDEO
print("\nwritten to {}".format(name))
def combine_videos(outfile, temp_path, delete=False):
file_names = os.listdir(temp_path)
file_names.sort(key=lambda _file: [int(s) if s.isdigit() else s for s in re.split(r'(\d+)', _file)])
if len(file_names) == 0:
return
total_file_names = [os.path.join(temp_path, video_name) for video_name in file_names]
video_clips = [VideoFileClip(video_name) for video_name in total_file_names]
final_clip = concatenate_videoclips(video_clips)
final_clip.write_videofile(outfile)
if delete:
remove_all_files_in_folder(temp_path)
os.rmdir(temp_path)
if __name__ == '__main__':
main()