| 12345678910111213141516171819202122232425262728293031323334353637 |
- import os
- import time
- from argparse import ArgumentDefaultsHelpFormatter, ArgumentParser
- from subprocess import call
- from data_preprocessing.convert2tfrec import Converter
- from data_preprocessing.preprocessor import Preprocessor
- from utils.utils import get_task_code
- parser = ArgumentParser(formatter_class=ArgumentDefaultsHelpFormatter)
- parser.add_argument("--data", type=str, default="/data", help="Path to data directory")
- parser.add_argument("--results", type=str, default="/data", help="Path for saving results directory")
- parser.add_argument(
- "--exec_mode",
- type=str,
- default="training",
- choices=["training", "test"],
- help="Mode for data preprocessing",
- )
- parser.add_argument("--task", type=str, help="Number of task to be run. MSD uses numbers 01-10")
- parser.add_argument("--dim", type=int, default=3, choices=[2, 3], help="Data dimension to prepare")
- parser.add_argument("--n_jobs", type=int, default=-1, help="Number of parallel jobs for data preprocessing")
- parser.add_argument("--vpf", type=int, default=1, help="Volumes per tfrecord")
- if __name__ == "__main__":
- args = parser.parse_args()
- start = time.time()
- Preprocessor(args).run()
- Converter(args).run()
- task_code = get_task_code(args)
- path = os.path.join(args.data, task_code)
- if args.exec_mode == "test":
- path = os.path.join(path, "test")
- call(f'find {path} -name "*.npy" -print0 | xargs -0 rm', shell=True)
- end = time.time()
- print(f"Preprocessing time: {(end - start):.2f}")
|