a b/tools/data/build_videos.py
1
# Copyright (c) OpenMMLab. All rights reserved.
2
import argparse
3
import glob
4
import os
5
import os.path as osp
6
import sys
7
from multiprocessing import Pool
8
9
10
def encode_video(frame_dir_item):
11
    """Encode frames to video using ffmpeg.
12
13
    Args:
14
        frame_dir_item (list): Rawframe item containing raw frame directory
15
            full path, rawframe directory (short) path, rawframe directory id.
16
17
    Returns:
18
        bool: Whether synthesize video successfully.
19
    """
20
    full_path, frame_dir_path, frame_dir_id = frame_dir_item
21
    out_full_path = args.out_dir
22
23
    img_name_tmpl = args.filename_tmpl + '.' + args.in_format
24
    img_path = osp.join(full_path, img_name_tmpl)
25
26
    out_vid_name = frame_dir_path + '.' + args.ext
27
    out_vid_path = osp.join(out_full_path, out_vid_name)
28
29
    cmd = osp.join(
30
        f"ffmpeg -start_number {args.start_idx} -r {args.fps} -i '{img_path}' "
31
        f"-vcodec {args.vcodec} '{out_vid_path}'")
32
    os.system(cmd)
33
34
    print(f'{frame_dir_id} {frame_dir_path} done')
35
    sys.stdout.flush()
36
    return True
37
38
39
def parse_args():
40
    parser = argparse.ArgumentParser(description='synthesize videos')
41
    parser.add_argument('src_dir', type=str, help='source rawframe directory')
42
    parser.add_argument('out_dir', type=str, help='output video directory')
43
    parser.add_argument(
44
        '--fps', type=int, default=30, help='fps of videos to be synthesized')
45
    parser.add_argument(
46
        '--level',
47
        type=int,
48
        choices=[1, 2],
49
        default=2,
50
        help='directory level of data')
51
    parser.add_argument(
52
        '--num-worker',
53
        type=int,
54
        default=8,
55
        help='number of workers to build videos')
56
    parser.add_argument(
57
        '--in-format',
58
        type=str,
59
        default='jpg',
60
        choices=['jpg', 'png'],
61
        help='input format')
62
    parser.add_argument(
63
        '--start-idx', type=int, default=0, help='starting index of rawframes')
64
    parser.add_argument(
65
        '--filename-tmpl',
66
        type=str,
67
        default='img_%05d',
68
        help='filename template of rawframes')
69
    parser.add_argument(
70
        '--vcodec', type=str, default='mpeg4', help='coding method of videos')
71
    parser.add_argument(
72
        '--ext',
73
        type=str,
74
        default='mp4',
75
        choices=['mp4', 'avi'],
76
        help='video file extensions')
77
    parser.add_argument('--num-gpu', type=int, default=8, help='number of GPU')
78
    parser.add_argument(
79
        '--resume',
80
        action='store_true',
81
        default=False,
82
        help='resume optical flow extraction instead of overwriting')
83
    args = parser.parse_args()
84
85
    return args
86
87
88
if __name__ == '__main__':
89
    args = parse_args()
90
91
    if not osp.isdir(args.out_dir):
92
        print(f'Creating folder: {args.out_dir}')
93
        os.makedirs(args.out_dir)
94
95
    if args.level == 2:
96
        classes = os.listdir(args.src_dir)
97
        for classname in classes:
98
            new_dir = osp.join(args.out_dir, classname)
99
            if not osp.isdir(new_dir):
100
                print(f'Creating folder: {new_dir}')
101
                os.makedirs(new_dir)
102
103
    print('Reading rgb frames from folder: ', args.src_dir)
104
    print('Input format of rgb frames: ', args.in_format)
105
    fullpath_list = glob.glob(args.src_dir + '/*' * args.level)
106
    done_fullpath_list = glob.glob(args.src_dir + '/*' * args.level + '.' +
107
                                   args.ext)
108
    print('Total number of rgb frame folders found: ', len(fullpath_list))
109
110
    if args.resume:
111
        fullpath_list = set(fullpath_list).difference(set(done_fullpath_list))
112
        fullpath_list = list(fullpath_list)
113
        print('Resuming. number of videos to be synthesized: ',
114
              len(fullpath_list))
115
116
    if args.level == 2:
117
        frame_dir_list = list(
118
            map(
119
                lambda p: osp.join(
120
                    osp.basename(osp.dirname(p)), osp.basename(p)),
121
                fullpath_list))
122
    elif args.level == 1:
123
        frame_dir_list = list(map(osp.basename, fullpath_list))
124
125
    pool = Pool(args.num_worker)
126
    pool.map(encode_video,
127
             zip(fullpath_list, frame_dir_list, range(len(frame_dir_list))))