diff --git a/tools/datasets/filter_panda10m.py b/tools/datasets/filter_panda10m.py index d4397c2..c6c3ef3 100644 --- a/tools/datasets/filter_panda10m.py +++ b/tools/datasets/filter_panda10m.py @@ -245,32 +245,6 @@ def filter_panda10m_timestamp(meta_path): print(f"New meta (shape={meta.shape}) saved to '{out_path}'.") -def append_timestamp(meta_path): - - def process_single_row(row): - path = row['path'] - wo_ext, ext = os.path.splitext(path) - json_path = f'{wo_ext}.json' - try: - with open(json_path, 'r') as f: - data = json.load(f) - timestamp = data['clips'][2:-2] - a, b = timestamp.split(', ') - timestamp = f"('{a}', '{b}')" - except Exception as e: - timestamp = '' - return timestamp - - meta = pd.read_csv(meta_path) - ret = apply(meta, process_single_row, axis=1) - meta['timestamp'] = ret - - wo_ext, ext = os.path.splitext(meta_path) - out_path = f"{wo_ext}_timestamp{ext}" - meta.to_csv(out_path, index=False) - print(f"New meta (shape={meta.shape}) saved to '{out_path}'.") - - def parse_args(): parser = argparse.ArgumentParser() parser.add_argument('--meta_path', type=str, nargs='+') @@ -282,7 +256,6 @@ def parse_args(): if __name__ == '__main__': args = parse_args() - # append_timestamp(args.meta_path) text_set = get_10m_set() for x in args.meta_path: diff --git a/tools/scene_cut/README.md b/tools/scene_cut/README.md index 0f1ac7d..bb8c254 100644 --- a/tools/scene_cut/README.md +++ b/tools/scene_cut/README.md @@ -1,9 +1,15 @@ # Scene Detection and Video Splitting + +- [Scene Detection and Video Splitting](#scene-detection-and-video-splitting) + - [Prepare Meta Files](#prepare-meta-files) + - [Scene Detection](#scene-detection) + - [Video Splitting](#video-splitting) + In many cases, raw videos contain several scenes and are too long for training. Thus, it is essential to split them into shorter clips based on scenes. Here, we provide code for scene detection and video splitting. -## Prepare a meta file -At this step, you should have a raw video dataset prepared. We need a meta file for the dataset. To create a meta file from a folder, run: +## Prepare Meta Files +At this step, you should have a raw video dataset prepared. A meta file of the dataset information is needed for data processing. To create a meta file from a folder, run: ```bash python -m tools.datasets.convert video /path/to/video/folder --output /path/to/save/meta.csv