DeepLearningExamples/PyTorch/Detection/SSD/qa/benchmark_performance.py

import argparse
import subprocess

from qa.qa_utils import compare_benchmarks, load_json, save_json, OKBLUE, ENDC, FAIL


# parsing
def parse_testscript_args():
    parser = argparse.ArgumentParser(description='PyTorch Benchmark Tests')
    parser.add_argument('--bs', default=[1], type=int, nargs='+')
    parser.add_argument('--ngpus', default=[1], type=int, nargs='+')
    parser.add_argument('--benchmark-mode', default='training', choices=['training', 'inference'],
                        help='benchmark training or inference', required=True)
    parser.add_argument('--bench-iterations', type=int, default=20, metavar='N',
                        help='Run N iterations while benchmarking (ignored when training and validation)')
    parser.add_argument('--bench-warmup', type=int, default=10, metavar='N',
                        help='Number of warmup iterations for benchmarking')
    parser.add_argument('--fp16', action='store_true', help='Run model in mixed precision.')
    parser.add_argument('-j', '--workers', default=4, type=int, metavar='N',
                        help='number of data loading workers')
    parser.add_argument('--data', type=str, metavar='<PATH>', required=True,
                        help='path to the dataset')
    parser.add_argument('--results-file', default='experiment_raport.json', type=str,
                        help='file in which to store JSON experiment raport')
    parser.add_argument('--benchmark-file', type=str, metavar='FILE', required=True,
                        help='path to the file with baselines')
    return parser.parse_args()


# job command
command_template = 'python3 {launcher} qa/qa_perf_main.py --bs {bs} --ebs {bs} ' \
                   '--benchmark-mode {mode} --benchmark-warmup {bw} --benchmark-iterations {bi} {fp16} ' \
                   '--backbone resnet50 --seed 1 --data {data} --results-file {results_file} --benchmark-file {benchmark_file}'

if __name__ == '__main__':
    args = parse_testscript_args()

    fp16 = '--fp16' if args.fp16 else ''

    # create results json file
    # todo: maybe some template json file?
    results = {'ngpus': args.ngpus,
               'bs': args.bs,
               'metric_keys': ['images_per_second'],
               'metrics': {}}

    for gpu in args.ngpus:
        results['metrics'][str(gpu)] = {}
        for bs in args.bs:
            results['metrics'][str(gpu)][str(bs)] = {'images_per_second': None}

    save_json(args.results_file, results)

    # run qa_perf_main.py tests one by one
    for gpu in args.ngpus:
        launcher = '' if gpu == 1 else '-m torch.distributed.launch --nproc_per_node={}'.format(gpu)
        for bs in args.bs:
            print('#' * 80)
            command = command_template.format(launcher=launcher, bs=bs, workers=args.workers, mode=args.benchmark_mode,
                                              bw=args.bench_warmup, bi=args.bench_iterations, fp16=fp16,
                                              data=args.data, results_file=args.results_file,
                                              benchmark_file=args.benchmark_file)

            print('Running "{}"'.format(command))

            process = subprocess.Popen(command, shell=True)
            output, error = process.communicate()

            if error is not None:
                print(FAIL + 'Program exited with status {}. Data has not been collected'.format(error) + ENDC)
            # elif results['metrics'][str(gpu)][str(bs)]['images_per_second'] is None:
            #     print(WARNING + 'Program did not end sucessfully. Data has not been collected.' + ENDC)
            else:
                print(OKBLUE + 'Program ended sucessfully. Data has been collected.' + ENDC)

    results_data = load_json(args.results_file)
    benchmark_data = load_json(args.benchmark_file)
    exit_code = compare_benchmarks(results_data, benchmark_data, args, 0.16 if args.benchmark_mode == 'inference' else 0.1)
    print(exit_code)
    exit(exit_code)
Adding 9 new models: ResNet50/TF, SSD/TF, BERT/TF, NCF/TF, UNet/TF, GNMT/TF, SSD/PyT, MaskRCNN/PyT, Tacotron2+Waveglow/PyT 2019-03-18 19:45:05 +01:00			`import argparse`
			`import subprocess`

			`from qa.qa_utils import compare_benchmarks, load_json, save_json, OKBLUE, ENDC, FAIL`



			`# parsing`
			`def parse_testscript_args():`
			`parser = argparse.ArgumentParser(description='PyTorch Benchmark Tests')`
			`parser.add_argument('--bs', default=[1], type=int, nargs='+')`
			`parser.add_argument('--ngpus', default=[1], type=int, nargs='+')`
			`parser.add_argument('--benchmark-mode', default='training', choices=['training', 'inference'],`
			`help='benchmark training or inference', required=True)`
			`parser.add_argument('--bench-iterations', type=int, default=20, metavar='N',`
			`help='Run N iterations while benchmarking (ignored when training and validation)')`
			`parser.add_argument('--bench-warmup', type=int, default=10, metavar='N',`
			`help='Number of warmup iterations for benchmarking')`
			`parser.add_argument('--fp16', action='store_true', help='Run model in mixed precision.')`
			`parser.add_argument('-j', '--workers', default=4, type=int, metavar='N',`
			`help='number of data loading workers')`
			`parser.add_argument('--data', type=str, metavar='<PATH>', required=True,`
			`help='path to the dataset')`
			`parser.add_argument('--results-file', default='experiment_raport.json', type=str,`
			`help='file in which to store JSON experiment raport')`
			`parser.add_argument('--benchmark-file', type=str, metavar='FILE', required=True,`
			`help='path to the file with baselines')`
			`return parser.parse_args()`


			`# job command`
			`command_template = 'python3 {launcher} qa/qa_perf_main.py --bs {bs} --ebs {bs} ' \`
			`'--benchmark-mode {mode} --benchmark-warmup {bw} --benchmark-iterations {bi} {fp16} ' \`
			`'--backbone resnet50 --seed 1 --data {data} --results-file {results_file} --benchmark-file {benchmark_file}'`

			`if __name__ == '__main__':`
			`args = parse_testscript_args()`

			`fp16 = '--fp16' if args.fp16 else ''`

			`# create results json file`
			`# todo: maybe some template json file?`
			`results = {'ngpus': args.ngpus,`
			`'bs': args.bs,`
			`'metric_keys': ['images_per_second'],`
			`'metrics': {}}`

			`for gpu in args.ngpus:`
			`results['metrics'][str(gpu)] = {}`
			`for bs in args.bs:`
			`results['metrics'][str(gpu)][str(bs)] = {'images_per_second': None}`

			`save_json(args.results_file, results)`

			`# run qa_perf_main.py tests one by one`
			`for gpu in args.ngpus:`
			`launcher = '' if gpu == 1 else '-m torch.distributed.launch --nproc_per_node={}'.format(gpu)`
			`for bs in args.bs:`
			`print('#' * 80)`
			`command = command_template.format(launcher=launcher, bs=bs, workers=args.workers, mode=args.benchmark_mode,`
			`bw=args.bench_warmup, bi=args.bench_iterations, fp16=fp16,`
			`data=args.data, results_file=args.results_file,`
			`benchmark_file=args.benchmark_file)`

			`print('Running "{}"'.format(command))`

			`process = subprocess.Popen(command, shell=True)`
			`output, error = process.communicate()`

			`if error is not None:`
			`print(FAIL + 'Program exited with status {}. Data has not been collected'.format(error) + ENDC)`
			`# elif results['metrics'][str(gpu)][str(bs)]['images_per_second'] is None:`
			`# print(WARNING + 'Program did not end sucessfully. Data has not been collected.' + ENDC)`
			`else:`
			`print(OKBLUE + 'Program ended sucessfully. Data has been collected.' + ENDC)`

			`results_data = load_json(args.results_file)`
			`benchmark_data = load_json(args.benchmark_file)`
			`exit_code = compare_benchmarks(results_data, benchmark_data, args, 0.16 if args.benchmark_mode == 'inference' else 0.1)`
			`print(exit_code)`
			`exit(exit_code)`