import operator_benchmark as op_bench


# NOTE: this string follows the import, so it is a plain expression statement
# and not the module's ``__doc__``.
"""
Configs shared by multiple benchmarks
"""


def remove_cuda(config_list):
    """Return the configs in ``config_list`` that lack the CUDA device entry.

    A config is dropped when ``{"device": "cuda"} in config`` is true; every
    other config is kept, in its original order, in a new list.
    """
    cuda_entry = {"device": "cuda"}
    kept = []
    for candidate in config_list:
        if cuda_entry in candidate:
            continue
        kept.append(candidate)
    return kept


# ---------------------------------------------------------------------------
# Configs for conv-1d ops
# ---------------------------------------------------------------------------
conv_1d_configs_short = op_bench.config_list(
    attr_names=["IC", "OC", "kernel", "stride", "N", "L"],
    attrs=[
        [128, 256, 3, 1, 1, 64],
        [256, 256, 3, 2, 4, 64],
    ],
    cross_product_configs={"device": ["cpu", "cuda"]},
    tags=["short"],
)

conv_1d_configs_long = op_bench.cross_product_configs(
    IC=[128, 512],
    OC=[128, 512],
    kernel=[3],
    stride=[1, 2],
    N=[8],
    L=[128],
    device=["cpu", "cuda"],
    tags=["long"],
)

# Short config for the transposed conv-1d case (same attribute names as the
# conv-1d short configs above).
convtranspose_1d_configs_short = op_bench.config_list(
    attr_names=["IC", "OC", "kernel", "stride", "N", "L"],
    attrs=[
        [2016, 1026, 1024, 256, 1, 224],
    ],
    cross_product_configs={"device": ["cpu", "cuda"]},
    tags=["short"],
)

# ---------------------------------------------------------------------------
# Configs for Conv2d and ConvTranspose1d
# NOTE(review): "ConvTranspose1d" is presumably a typo for "ConvTranspose2d"
# (the 1d transpose configs are defined separately above) -- confirm against
# the benchmark that consumes these configs.
# ---------------------------------------------------------------------------
conv_2d_configs_short = op_bench.config_list(
    attr_names=["IC", "OC", "kernel", "stride", "N", "H", "W", "G", "pad"],
    attrs=[
        [256, 256, 3, 1, 1, 16, 16, 1, 0],
    ],
    cross_product_configs={"device": ["cpu", "cuda"]},
    tags=["short"],
)

conv_2d_configs_long = op_bench.cross_product_configs(
    IC=[128, 256],
    OC=[128, 256],
    kernel=[3],
    stride=[1, 2],
    N=[4],
    H=[32],
    W=[32],
    G=[1],
    pad=[0],
    device=["cpu", "cuda"],
    tags=["long"],
)

# ---------------------------------------------------------------------------
# Configs for Conv2dPointwise (no "kernel" attribute in these configs)
# ---------------------------------------------------------------------------
conv_2d_pw_configs_short = op_bench.config_list(
    attr_names=["IC", "OC", "stride", "N", "H", "W", "G", "pad"],
    attrs=[
        [256, 256, 1, 1, 16, 16, 1, 0],
    ],
    cross_product_configs={"device": ["cpu", "cuda"]},
    tags=["short"],
)

conv_2d_pw_configs_long = op_bench.cross_product_configs(
    IC=[128, 256],
    OC=[128, 256],
    stride=[1, 2],
    N=[4],
    H=[32],
    W=[32],
    G=[1],
    pad=[0],
    device=["cpu", "cuda"],
    tags=["long"],
)

# ---------------------------------------------------------------------------
# Configs for Conv3d and ConvTranspose3d
# ---------------------------------------------------------------------------
conv_3d_configs_short = op_bench.config_list(
    attr_names=["IC", "OC", "kernel", "stride", "N", "D", "H", "W"],
    attrs=[
        [64, 64, 3, 1, 8, 4, 16, 16],
    ],
    cross_product_configs={"device": ["cpu", "cuda"]},
    tags=["short"],
)

# ---------------------------------------------------------------------------
# Linear configs
# ---------------------------------------------------------------------------
linear_configs_short = op_bench.config_list(
    attr_names=["N", "IN", "OUT"],
    attrs=[
        [1, 1, 1],
        [4, 256, 128],
        [16, 512, 256],
    ],
    cross_product_configs={"device": ["cpu", "cuda"]},
    tags=["short"],
)

linear_configs_long = op_bench.cross_product_configs(
    N=[32, 64],
    IN=[128, 512],
    OUT=[64, 128],
    device=["cpu", "cuda"],
    tags=["long"],
)

# ---------------------------------------------------------------------------
# Embedding-bag and embedding configs (CPU only, "short" tag only)
# ---------------------------------------------------------------------------
embeddingbag_short_configs = op_bench.cross_product_configs(
    embeddingbags=[10, 120, 1000, 2300],
    dim=[64],
    mode=["sum"],
    input_size=[8, 16, 64],
    offset=[0],
    sparse=[True, False],
    include_last_offset=[True, False],
    device=["cpu"],
    tags=["short"],
)

embedding_short_configs = op_bench.cross_product_configs(
    num_embeddings=[10, 120, 1000, 2300],
    embedding_dim=[64],
    input_size=[8, 16, 64],
    device=["cpu"],
    tags=["short"],
)