Skip to content

Instantly share code, notes, and snippets.

@FindHao
Created July 22, 2022 16:47
Show Gist options
  • Star 0 You must be signed in to star a gist
  • Fork 0 You must be signed in to fork a gist
  • Save FindHao/ef5732a6ec558d24c4df694b39b66886 to your computer and use it in GitHub Desktop.
Save FindHao/ef5732a6ec558d24c4df694b39b66886 to your computer and use it in GitHub Desktop.
from torch import profiler
import torch
import torch.nn.functional as F
import argparse
def run_conv2d(input_shape, weight_shape, other_args, profile_folder,
               *, device='cuda', warmup_iters=11, iters=1000):
    """Repeatedly run ``F.conv2d`` on all-ones float32 tensors.

    Args:
        input_shape: Shape of the all-ones input tensor.
        weight_shape: Shape of the all-ones weight tensor.
        other_args: Sequence whose first five items are forwarded to
            ``F.conv2d`` as ``(bias, stride, padding, dilation, groups)``.
        profile_folder: Unused here; accepted so the signature matches
            ``profile`` and the two can be swapped at the call site.
        device: Device the tensors are created on. Defaults to ``'cuda'``.
        warmup_iters: Number of warm-up calls issued first.
        iters: Number of calls issued after the warm-up.

    Returns:
        The output of the last ``F.conv2d`` call, or ``None`` when both
        ``warmup_iters`` and ``iters`` are zero.
    """
    data = torch.ones(input_shape, dtype=torch.float32, device=device)
    kernel = torch.ones(weight_shape, dtype=torch.float32, device=device)
    bias, stride, padding, dilation, groups = other_args[:5]

    out = None
    # warmup
    for _ in range(warmup_iters):
        out = F.conv2d(data, kernel, bias, stride, padding, dilation, groups)
    # measured iterations
    for _ in range(iters):
        out = F.conv2d(data, kernel, bias, stride, padding, dilation, groups)

    # CUDA kernels are launched asynchronously; wait for the queued work so
    # that it has actually finished before control returns to the caller.
    if data.is_cuda:
        torch.cuda.synchronize(data.device)
    return out
def profile(input_shape, weight_shape, other_args, profile_folder):
    """Run one ``F.conv2d`` call on all-ones CUDA tensors under torch.profiler.

    Args:
        input_shape: Shape of the all-ones float32 input tensor.
        weight_shape: Shape of the all-ones float32 weight tensor.
        other_args: Indexable whose items 0..4 are passed to ``F.conv2d`` as
            bias, stride, padding, dilation and groups respectively.
        profile_folder: Directory given to
            ``profiler.tensorboard_trace_handler``, which is registered as
            the profiler's ``on_trace_ready`` callback.

    Returns:
        The tensor produced by the profiled ``F.conv2d`` call.
    """
    data = torch.ones(input_shape, dtype=torch.float32, device='cuda')
    kernel = torch.ones(weight_shape, dtype=torch.float32, device='cuda')
    conv_kwargs = {
        'bias': other_args[0],
        'stride': other_args[1],
        'padding': other_args[2],
        'dilation': other_args[3],
        'groups': other_args[4],
    }

    # One switch turns on every optional detail the profiler can record.
    detailed = True
    tracer = profiler.profile(
        schedule=profiler.schedule(wait=0, warmup=0, active=1),
        activities=[
            profiler.ProfilerActivity.CUDA,
            profiler.ProfilerActivity.CPU,
        ],
        record_shapes=detailed,
        profile_memory=detailed,
        with_stack=detailed,
        with_flops=detailed,
        on_trace_ready=profiler.tensorboard_trace_handler(profile_folder),
    )
    with tracer:
        result = F.conv2d(data, kernel, **conv_kwargs)
    return result
if __name__ == "__main__":
    # ArgumentParser's first positional parameter is ``prog``, so the module
    # docstring must be passed by keyword to be shown as the description.
    parser = argparse.ArgumentParser(description=__doc__)
    SUPPORT_BATCHSIZE_LIST = ['32', '64']
    parser.add_argument("--bs", choices=SUPPORT_BATCHSIZE_LIST, required=True,
                        help="Specify batch size to the test.")
    parser.add_argument("--profile-folder", default="./logs",
                        help="Save profiling model traces to this directory.")
    # parse_known_args tolerates unrecognised flags; they are ignored here.
    args, extra_args = parser.parse_known_args()

    # Optional toggle: let cuDNN autotune the convolution algorithm.
    # torch.backends.cudnn.benchmark = True

    # Each batch size selects an input shape together with the
    # (bias, stride, padding, dilation, groups) tuple handed to F.conv2d.
    if args.bs == '64':
        input_shape = (64, 224, 112, 112)
        other_args = [None, (2, 2), (1, 1), (1, 1), 2]
    else:
        input_shape = (32, 224, 56, 56)
        other_args = [None, (1, 1), (1, 1), (1, 1), 2]
    weight_shape = (224, 112, 3, 3)

    # Swap the two calls below to capture a profiler trace instead of
    # running the plain repeated-convolution loop.
    # profile(input_shape, weight_shape, other_args, args.profile_folder)
    run_conv2d(input_shape, weight_shape, other_args, args.profile_folder)
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment