-
Notifications
You must be signed in to change notification settings - Fork 8
/
Copy pathconcat.py
143 lines (115 loc) · 4.46 KB
/
concat.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
# Copyright (c) 2024, Patricio Gonzalez Vivo
#
# Licensed under the Creative Commons Attribution-NonCommercial-ShareAlike 4.0 International Public License (the "License").
# You may not use this file except in compliance with the License. You may obtain a copy of the License at https://creativecommons.org/licenses/by-nc-sa/4.0/legalcode
#
import os
import cv2
import argparse
import numpy as np
import decord
import math
from tqdm import tqdm
from bands.common.meta import load_metadata, is_video
from bands.common.io import VideoWriter, get_video_data
# Default grid layout, used when -top / -bottom are not given on the command line.
# Each entry is a band name looked up in the metadata's "bands" table.
top = ["depth_patchfusion"]
bottom = ["rgba"]

# Metadata for the input folder; assigned by the script entry point before
# concat_image() / concat_video() are called.
data = None
def _load_image_row(args, bands):
    """Load every band image in ``bands`` and join them side by side.

    Args:
        args: Parsed CLI arguments; ``args.input`` is the folder the band
            URLs are resolved against.
        bands: Band names, each a key of ``data["bands"]``.

    Returns:
        The horizontally concatenated row, or ``None`` when ``bands`` is empty.

    Raises:
        IOError: If ``cv2.imread`` cannot read one of the band images.
    """
    images = []
    for band in bands:
        path = os.path.join(args.input, data["bands"][band]["url"])
        img = cv2.imread(path)
        # cv2.imread signals failure by returning None instead of raising;
        # without this check a missing band would silently vanish from the
        # output (first band) or crash inside cv2.hconcat (later bands).
        if img is None:
            raise IOError("ERROR: Could not read image {}".format(path))
        images.append(img)

    if not images:
        return None
    if len(images) == 1:
        return images[0]
    # cv2.hconcat requires all images to share the same height.
    return cv2.hconcat(images)


def concat_image(args, top, bottom):
    """Build a two-row image grid from band images and write it to ``args.output``.

    The bands in ``top`` are placed left to right in the first row and the
    bands in ``bottom`` left to right in the second row; the two rows are then
    stacked vertically. If one of the rows is empty, the other row alone is
    written.

    Args:
        args: Parsed CLI arguments; uses ``args.input`` (source folder) and
            ``args.output`` (destination image path).
        top: Band names for the upper row.
        bottom: Band names for the lower row.

    Raises:
        IOError: If a band image cannot be read.
        ValueError: If both ``top`` and ``bottom`` are empty.
    """
    # horizontally concatenate the bands of each row
    top_row = _load_image_row(args, top)
    bottom_row = _load_image_row(args, bottom)

    # vertically stack the top and bottom rows
    if top_row is None and bottom_row is None:
        raise ValueError("ERROR: No bands to concatenate")
    if top_row is None:
        conc = bottom_row
    elif bottom_row is None:
        conc = top_row
    else:
        # cv2.vconcat requires both rows to share the same width.
        conc = cv2.vconcat([top_row, bottom_row])

    cv2.imwrite(args.output, conc)
def _open_video_row(args, bands, label):
    """Open a decord reader for every band of one row and measure the row.

    Args:
        args: Parsed CLI arguments; ``args.input`` is the folder the band
            URLs are resolved against.
        bands: Band names, each a key of ``data["bands"]``.
        label: Row name used in the progress message ("top" or "bottom").

    Returns:
        Tuple ``(readers, row_width, row_height)`` where ``row_width`` is the
        sum of the band widths and ``row_height`` the tallest band height, as
        reported by ``get_video_data``.
    """
    readers = []
    row_width = 0
    row_height = 0
    for band in bands:
        band_path = os.path.join(args.input, data["bands"][band]["url"])
        band_width, band_height, _, _ = get_video_data(band_path)
        print("Loading {} band {} with shape {}".format(label, band_path, (band_width, band_height)))
        readers.append(decord.VideoReader(band_path))
        row_width += band_width
        row_height = max(row_height, band_height)
    return readers, row_width, row_height


def _blit_video_row(canvas, images, y):
    """Copy ``images`` left to right into ``canvas`` starting at row ``y``."""
    x = 0
    for img in images:
        # Clip to the canvas so a frame that is larger than its probed size
        # cannot cause a shape mismatch on assignment.
        h = min(img.shape[0], canvas.shape[0] - y)
        w = min(img.shape[1], canvas.shape[1] - x)
        if h > 0 and w > 0:
            canvas[y:y + h, x:x + w] = img[:h, :w]
        x += img.shape[1]


def concat_video(args, top, bottom):
    """Build a two-row video grid from band videos and encode it to ``args.output``.

    For every frame index the bands in ``top`` are placed left to right in the
    first row and the bands in ``bottom`` left to right below it. The output
    is ``max(row widths)`` wide and ``sum(row heights)`` tall; each frame is
    composited onto a black canvas of exactly that size, so bands of differing
    sizes are padded instead of making the concatenation fail, and every frame
    handed to the writer matches the size the writer was created with.

    Frame rate and frame count are read from ``data["fps"]`` and
    ``data["frames"]``.

    Args:
        args: Parsed CLI arguments; uses ``args.input`` (source folder) and
            ``args.output`` (destination video path).
        top: Band names for the upper row.
        bottom: Band names for the lower row.
    """
    # load videos
    top_readers, width_top, height_top = _open_video_row(args, top, "top")
    bottom_readers, width_bottom, height_bottom = _open_video_row(args, bottom, "bottom")

    width = max(width_top, width_bottom)
    height = height_top + height_bottom

    video_out = VideoWriter(width=width, height=height, frame_rate=data["fps"], filename=args.output)
    try:
        frames = data["frames"]
        for i in tqdm(range(frames)):
            # NOTE(review): assumes decoded frames are (H, W, 3) uint8 arrays,
            # matching the canvas layout - confirm against decord/VideoWriter.
            frame_out = np.zeros((height, width, 3), dtype=np.uint8)

            # top row starts at the canvas origin
            _blit_video_row(frame_out, (reader[i].asnumpy() for reader in top_readers), 0)
            # bottom row starts right below the tallest top band
            _blit_video_row(frame_out, (reader[i].asnumpy() for reader in bottom_readers), height_top)

            video_out.write(frame_out)
    finally:
        # Always finalize the output file, even if decoding fails midway.
        video_out.close()
if __name__ == '__main__':
    # Script entry point: parse the CLI, load the folder metadata, then build
    # either an image grid or a video grid from the requested bands.
    import sys

    parser = argparse.ArgumentParser()
    parser.add_argument('-input', '-i', help="Input folder. Ex: `data/000`", type=str, required=True)
    parser.add_argument('-output', '-o', help="Output file. Ex: `000.png`", type=str, required=True)
    parser.add_argument('-top', '-t', help="Top row of images", type=str, nargs='+')
    parser.add_argument('-bottom', '-b', help="Bottom row of images", type=str, nargs='+')
    args = parser.parse_args()

    # Stored in the module-level `data`, which concat_image/concat_video read.
    data = load_metadata(args.input)
    if data is None:
        print("ERROR: No metadata found in {}".format(args.input), file=sys.stderr)
        # Exit with a non-zero status so callers and shell scripts see the failure.
        sys.exit(1)

    # Command-line rows override the module-level defaults.
    if args.top:
        top = args.top
    if args.bottom:
        bottom = args.bottom

    # The "rgba" band decides between video and image mode; when the metadata
    # has no such band, fall back to the first requested band instead of
    # failing with a KeyError.
    probe_band = "rgba" if "rgba" in data["bands"] else (top + bottom)[0]

    if is_video(data["bands"][probe_band]["url"]):
        concat_video(args, top, bottom)
    else:
        concat_image(args, top, bottom)