blob: ccfa62cc364e3a735850c501c618c8058f6623c8 [file] [log] [blame]
import operator_benchmark as op_bench
"""
Configs shared by multiple benchmarks
"""
def remove_cuda(config_list):
cuda_config = {"device": "cuda"}
return [config for config in config_list if cuda_config not in config]
# Configs for conv-1d ops
conv_1d_configs_short = op_bench.config_list(
attr_names=["IC", "OC", "kernel", "stride", "N", "L"],
attrs=[
[128, 256, 3, 1, 1, 64],
[256, 256, 3, 2, 4, 64],
],
cross_product_configs={
"device": ["cpu", "cuda"],
},
tags=["short"],
)
conv_1d_configs_long = op_bench.cross_product_configs(
IC=[128, 512],
OC=[128, 512],
kernel=[3],
stride=[1, 2],
N=[8],
L=[128],
device=["cpu", "cuda"],
tags=["long"],
)
convtranspose_1d_configs_short = op_bench.config_list(
attr_names=["IC", "OC", "kernel", "stride", "N", "L"],
attrs=[
[2016, 1026, 1024, 256, 1, 224],
],
cross_product_configs={
"device": ["cpu", "cuda"],
},
tags=["short"],
)
# Configs for Conv2d and ConvTranspose1d
conv_2d_configs_short = op_bench.config_list(
attr_names=[
"IC",
"OC",
"kernel",
"stride",
"N",
"H",
"W",
"G",
"pad",
],
attrs=[
[256, 256, 3, 1, 1, 16, 16, 1, 0],
],
cross_product_configs={
"device": ["cpu", "cuda"],
},
tags=["short"],
)
conv_2d_configs_long = op_bench.cross_product_configs(
IC=[128, 256],
OC=[128, 256],
kernel=[3],
stride=[1, 2],
N=[4],
H=[32],
W=[32],
G=[1],
pad=[0],
device=["cpu", "cuda"],
tags=["long"],
)
# Configs for Conv2dPointwise
conv_2d_pw_configs_short = op_bench.config_list(
attr_names=[
"IC",
"OC",
"stride",
"N",
"H",
"W",
"G",
"pad",
],
attrs=[
[256, 256, 1, 1, 16, 16, 1, 0],
],
cross_product_configs={
"device": ["cpu", "cuda"],
},
tags=["short"],
)
conv_2d_pw_configs_long = op_bench.cross_product_configs(
IC=[128, 256],
OC=[128, 256],
stride=[1, 2],
N=[4],
H=[32],
W=[32],
G=[1],
pad=[0],
device=["cpu", "cuda"],
tags=["long"],
)
# Configs for Conv3d and ConvTranspose3d
conv_3d_configs_short = op_bench.config_list(
attr_names=["IC", "OC", "kernel", "stride", "N", "D", "H", "W"],
attrs=[
[64, 64, 3, 1, 8, 4, 16, 16],
],
cross_product_configs={
"device": ["cpu", "cuda"],
},
tags=["short"],
)
linear_configs_short = op_bench.config_list(
attr_names=["N", "IN", "OUT"],
attrs=[
[1, 1, 1],
[4, 256, 128],
[16, 512, 256],
],
cross_product_configs={
"device": ["cpu", "cuda"],
},
tags=["short"],
)
linear_configs_long = op_bench.cross_product_configs(
N=[32, 64], IN=[128, 512], OUT=[64, 128], device=["cpu", "cuda"], tags=["long"]
)
embeddingbag_short_configs = op_bench.cross_product_configs(
embeddingbags=[10, 120, 1000, 2300],
dim=[64],
mode=["sum"],
input_size=[8, 16, 64],
offset=[0],
sparse=[True, False],
include_last_offset=[True, False],
device=["cpu"],
tags=["short"],
)
embedding_short_configs = op_bench.cross_product_configs(
num_embeddings=[10, 120, 1000, 2300],
embedding_dim=[64],
input_size=[8, 16, 64],
device=["cpu"],
tags=["short"],
)