45 строки
1.6 KiB
Python
45 строки
1.6 KiB
Python
# Copyright (c) Microsoft Corporation.
|
|
# Licensed under the MIT license.
|
|
|
|
"""Model benchmark example for CNN models.
|
|
|
|
Commands to run:
|
|
python3 examples/benchmarks/pytorch_cnn.py (Single GPU)
|
|
python3 -m torch.distributed.launch --use_env --nproc_per_node=8 examples/benchmarks/pytorch_cnn.py \
|
|
--distributed (Distributed)
|
|
"""
|
|
|
|
import argparse
|
|
|
|
from superbench.benchmarks import Platform, Framework, BenchmarkRegistry
|
|
from superbench.common.utils import logger
|
|
|
|
if __name__ == '__main__':
    # Command-line interface: one opt-in flag that switches the run to distributed training.
    parser = argparse.ArgumentParser()
    parser.add_argument(
        '--distributed', action='store_true', default=False, help='Whether to enable distributed training.'
    )
    args = parser.parse_args()

    # Specify the model name and benchmark parameters.
    # For example, resnet50, resnet101, resnet152, densenet169, densenet201, vgg11, vgg13, vgg16, vgg19.
    model_name = 'resnet101'
    # Adjacent literals are joined at compile time, so source indentation can never leak into the
    # parameter string (a backslash continuation inside the quotes would embed it).
    parameters = (
        '--batch_size 192 --precision float32 float16 --num_warmup 64 --num_steps 512 '
        '--sample_count 8192 --pin_memory'
    )
    if args.distributed:
        # Extra options appended only when --distributed was passed on the command line.
        parameters += ' --distributed_impl ddp --distributed_backend nccl'

    # Create the benchmark context for the selected model on CUDA with PyTorch.
    # The step count is whatever --num_steps is set to in `parameters` above.
    context = BenchmarkRegistry.create_benchmark_context(
        model_name, platform=Platform.CUDA, parameters=parameters, framework=Framework.PYTORCH
    )

    benchmark = BenchmarkRegistry.launch_benchmark(context)
    # Report only when launch_benchmark returned a truthy benchmark object.
    if benchmark:
        logger.info(
            'benchmark: {}, return code: {}, result: {}'.format(
                benchmark.name, benchmark.return_code, benchmark.result
            )
        )
|