| import operator_benchmark as op_bench |
| |
| """ |
| Configs shared by multiple benchmarks |
| """ |
| |
| |
| def remove_cuda(config_list): |
| cuda_config = {"device": "cuda"} |
| return [config for config in config_list if cuda_config not in config] |
| |
| |
| # Configs for conv-1d ops |
| conv_1d_configs_short = op_bench.config_list( |
| attr_names=["IC", "OC", "kernel", "stride", "N", "L"], |
| attrs=[ |
| [128, 256, 3, 1, 1, 64], |
| [256, 256, 3, 2, 4, 64], |
| ], |
| cross_product_configs={ |
| "device": ["cpu", "cuda"], |
| }, |
| tags=["short"], |
| ) |
| |
| conv_1d_configs_long = op_bench.cross_product_configs( |
| IC=[128, 512], |
| OC=[128, 512], |
| kernel=[3], |
| stride=[1, 2], |
| N=[8], |
| L=[128], |
| device=["cpu", "cuda"], |
| tags=["long"], |
| ) |
| |
| convtranspose_1d_configs_short = op_bench.config_list( |
| attr_names=["IC", "OC", "kernel", "stride", "N", "L"], |
| attrs=[ |
| [2016, 1026, 1024, 256, 1, 224], |
| ], |
| cross_product_configs={ |
| "device": ["cpu", "cuda"], |
| }, |
| tags=["short"], |
| ) |
| |
| # Configs for Conv2d and ConvTranspose1d |
| conv_2d_configs_short = op_bench.config_list( |
| attr_names=[ |
| "IC", |
| "OC", |
| "kernel", |
| "stride", |
| "N", |
| "H", |
| "W", |
| "G", |
| "pad", |
| ], |
| attrs=[ |
| [256, 256, 3, 1, 1, 16, 16, 1, 0], |
| ], |
| cross_product_configs={ |
| "device": ["cpu", "cuda"], |
| }, |
| tags=["short"], |
| ) |
| |
| conv_2d_configs_long = op_bench.cross_product_configs( |
| IC=[128, 256], |
| OC=[128, 256], |
| kernel=[3], |
| stride=[1, 2], |
| N=[4], |
| H=[32], |
| W=[32], |
| G=[1], |
| pad=[0], |
| device=["cpu", "cuda"], |
| tags=["long"], |
| ) |
| |
| # Configs for Conv2dPointwise |
| conv_2d_pw_configs_short = op_bench.config_list( |
| attr_names=[ |
| "IC", |
| "OC", |
| "stride", |
| "N", |
| "H", |
| "W", |
| "G", |
| "pad", |
| ], |
| attrs=[ |
| [256, 256, 1, 1, 16, 16, 1, 0], |
| ], |
| cross_product_configs={ |
| "device": ["cpu", "cuda"], |
| }, |
| tags=["short"], |
| ) |
| |
| conv_2d_pw_configs_long = op_bench.cross_product_configs( |
| IC=[128, 256], |
| OC=[128, 256], |
| stride=[1, 2], |
| N=[4], |
| H=[32], |
| W=[32], |
| G=[1], |
| pad=[0], |
| device=["cpu", "cuda"], |
| tags=["long"], |
| ) |
| |
| # Configs for Conv3d and ConvTranspose3d |
| conv_3d_configs_short = op_bench.config_list( |
| attr_names=["IC", "OC", "kernel", "stride", "N", "D", "H", "W"], |
| attrs=[ |
| [64, 64, 3, 1, 8, 4, 16, 16], |
| ], |
| cross_product_configs={ |
| "device": ["cpu", "cuda"], |
| }, |
| tags=["short"], |
| ) |
| |
| linear_configs_short = op_bench.config_list( |
| attr_names=["N", "IN", "OUT"], |
| attrs=[ |
| [1, 1, 1], |
| [4, 256, 128], |
| [16, 512, 256], |
| ], |
| cross_product_configs={ |
| "device": ["cpu", "cuda"], |
| }, |
| tags=["short"], |
| ) |
| |
| |
| linear_configs_long = op_bench.cross_product_configs( |
| N=[32, 64], IN=[128, 512], OUT=[64, 128], device=["cpu", "cuda"], tags=["long"] |
| ) |
| |
| embeddingbag_short_configs = op_bench.cross_product_configs( |
| embeddingbags=[10, 120, 1000, 2300], |
| dim=[64], |
| mode=["sum"], |
| input_size=[8, 16, 64], |
| offset=[0], |
| sparse=[True, False], |
| include_last_offset=[True, False], |
| device=["cpu"], |
| tags=["short"], |
| ) |
| |
| embedding_short_configs = op_bench.cross_product_configs( |
| num_embeddings=[10, 120, 1000, 2300], |
| embedding_dim=[64], |
| input_size=[8, 16, 64], |
| device=["cpu"], |
| tags=["short"], |
| ) |