diff --git a/.github/workflows/operator_benchmark.yml b/.github/workflows/operator_benchmark.yml index 09f14b545cdb..40fb3b8d0c85 100644 --- a/.github/workflows/operator_benchmark.yml +++ b/.github/workflows/operator_benchmark.yml @@ -52,3 +52,27 @@ jobs: docker-image: ${{ needs.x86-opbenchmark-build.outputs.docker-image }} test-matrix: ${{ needs.x86-opbenchmark-build.outputs.test-matrix }} secrets: inherit + + aarch64-opbenchmark-build: + if: github.repository_owner == 'pytorch' + name: aarch64-opbenchmark-build + uses: ./.github/workflows/_linux-build.yml + with: + build-environment: linux-jammy-aarch64-py3.10 + runner: linux.arm64.m7g.4xlarge + docker-image-name: ci-image:pytorch-linux-jammy-aarch64-py3.10-gcc11 + test-matrix: | + { include: [ + { config: "cpu_operator_benchmark_short", shard: 1, num_shards: 1, runner: "linux.arm64.m8g.4xlarge" }, + ]} + secrets: inherit + + aarch64-opbenchmark-test: + name: aarch64-opbenchmark-test + uses: ./.github/workflows/_linux-test.yml + needs: aarch64-opbenchmark-build + with: + build-environment: linux-jammy-aarch64-py3.10 + docker-image: ${{ needs.aarch64-opbenchmark-build.outputs.docker-image }} + test-matrix: ${{ needs.aarch64-opbenchmark-build.outputs.test-matrix }} + secrets: inherit diff --git a/benchmarks/operator_benchmark/aarch64_expected_ci_operator_benchmark_eager_float32_cpu.csv b/benchmarks/operator_benchmark/aarch64_expected_ci_operator_benchmark_eager_float32_cpu.csv new file mode 100644 index 000000000000..dfc72e4665dd --- /dev/null +++ b/benchmarks/operator_benchmark/aarch64_expected_ci_operator_benchmark_eager_float32_cpu.csv @@ -0,0 +1,1319 @@ +Benchmarking Framework,Benchmarking Module Name,Case Name,tag,run_backward,Execution Time,Peak Memory (KB) +PyTorch,add,add_M1_N1_K1_cpu,short,False,4.244240,0.000000 +PyTorch,add,add_M64_N64_K64_cpu,short,False,56.719577,0.000000 +PyTorch,add,add_M64_N64_K128_cpu,short,False,56.826275,0.000000 
+PyTorch,add,add_M1_N1_K1_cpu_bwdall_BACKWARD,short,True,47.834313,0.000000 +PyTorch,add,add_M1_N1_K1_cpu_bwd1_BACKWARD,short,True,47.872547,0.000000 +PyTorch,add,add_M1_N1_K1_cpu_bwd2_BACKWARD,short,True,47.790496,0.000000 +PyTorch,add,add_M64_N64_K64_cpu_bwdall_BACKWARD,short,True,216.173346,0.000000 +PyTorch,add,add_M64_N64_K64_cpu_bwd1_BACKWARD,short,True,217.600432,0.000000 +PyTorch,add,add_M64_N64_K64_cpu_bwd2_BACKWARD,short,True,216.916940,0.000000 +PyTorch,add,add_M64_N64_K128_cpu_bwdall_BACKWARD,short,True,250.406573,0.000000 +PyTorch,add,add_M64_N64_K128_cpu_bwd1_BACKWARD,short,True,250.049463,0.000000 +PyTorch,add,add_M64_N64_K128_cpu_bwd2_BACKWARD,short,True,250.817280,0.000000 +PyTorch,arange,arange_start0_end1000_step2.5_cpu_dtypetorch.float32,short,False,7.851754,0.000000 +PyTorch,arange,arange_start-1024_end2048_step1_cpu_dtypetorch.float32,short,False,8.597164,0.000000 +PyTorch,as_strided,"as_strided_M8_N8_size(2,2)_stride(1,1)_storage_offset0_cpu",short,False,3.503591,0.000000 +PyTorch,as_strided,"as_strided_M256_N256_size(32,32)_stride(1,1)_storage_offset0_cpu",short,False,3.584804,0.000000 +PyTorch,as_strided,"as_strided_M512_N512_size(64,64)_stride(2,2)_storage_offset1_cpu",short,False,3.723034,0.000000 +PyTorch,batchnorm,batchnorm_M1_N256_K3136_cpu_trainingTrue_cudnnFalse,short,False,343.685714,0.000000 +PyTorch,batchnorm,batchnorm_M1_N256_K3136_cpu_trainingFalse_cudnnFalse,short,False,96.169117,0.000000 +PyTorch,batchnorm,batchnorm_M1_N256_K3136_cpu_trainingTrue_cudnnFalse_bwdall_BACKWARD,short,True,335.407438,0.000000 +PyTorch,batchnorm,batchnorm_M1_N256_K3136_cpu_trainingTrue_cudnnFalse_bwd1_BACKWARD,short,True,337.885862,0.000000 +PyTorch,batchnorm,batchnorm_M1_N256_K3136_cpu_trainingFalse_cudnnFalse_bwdall_BACKWARD,short,True,326.908147,0.000000 +PyTorch,batchnorm,batchnorm_M1_N256_K3136_cpu_trainingFalse_cudnnFalse_bwd1_BACKWARD,short,True,329.085216,0.000000 
+PyTorch,batchnorm,batchnorm_N3136_C256_cpu_trainingTrue_cudnnFalse,short,False,363.524665,0.000000 +PyTorch,batchnorm,batchnorm_N3136_C256_cpu_trainingFalse_cudnnFalse,short,False,129.891489,0.000000 +PyTorch,batchnorm,batchnorm_N3136_C256_cpu_trainingTrue_cudnnFalse_bwdall_BACKWARD,short,True,484.415291,0.000000 +PyTorch,batchnorm,batchnorm_N3136_C256_cpu_trainingTrue_cudnnFalse_bwd1_BACKWARD,short,True,486.083544,0.000000 +PyTorch,batchnorm,batchnorm_N3136_C256_cpu_trainingFalse_cudnnFalse_bwdall_BACKWARD,short,True,439.912925,0.000000 +PyTorch,batchnorm,batchnorm_N3136_C256_cpu_trainingFalse_cudnnFalse_bwd1_BACKWARD,short,True,439.728483,0.000000 +PyTorch,add_,add__M1_N1_K1_cpu_dtype_onetorch.int32_dtype_twotorch.int32,short,False,3.355920,0.000000 +PyTorch,add_,add__M64_N64_K64_cpu_dtype_onetorch.int32_dtype_twotorch.int32,short,False,54.177022,0.000000 +PyTorch,add_,add__M64_N64_K128_cpu_dtype_onetorch.int32_dtype_twotorch.int32,short,False,55.350490,0.000000 +PyTorch,sub_,sub__M1_N1_K1_cpu_dtype_onetorch.int32_dtype_twotorch.int32,short,False,1.466720,0.000000 +PyTorch,sub_,sub__M64_N64_K64_cpu_dtype_onetorch.int32_dtype_twotorch.int32,short,False,53.482515,0.000000 +PyTorch,sub_,sub__M64_N64_K128_cpu_dtype_onetorch.int32_dtype_twotorch.int32,short,False,55.382850,0.000000 +PyTorch,mul_,mul__M1_N1_K1_cpu_dtype_onetorch.int32_dtype_twotorch.int32,short,False,3.065535,0.000000 +PyTorch,mul_,mul__M64_N64_K64_cpu_dtype_onetorch.int32_dtype_twotorch.int32,short,False,51.635021,0.000000 +PyTorch,mul_,mul__M64_N64_K128_cpu_dtype_onetorch.int32_dtype_twotorch.int32,short,False,54.669222,0.000000 +PyTorch,copy_,copy__M1_N1_K1_cpu_dtype_onetorch.int32_dtype_twotorch.int32,short,False,1.412698,0.000000 +PyTorch,copy_,copy__M64_N64_K64_cpu_dtype_onetorch.int32_dtype_twotorch.int32,short,False,50.044207,0.000000 +PyTorch,copy_,copy__M64_N64_K128_cpu_dtype_onetorch.int32_dtype_twotorch.int32,short,False,49.480417,0.000000 
+PyTorch,div_,div__M1_N1_K1_cpu_dtype_onetorch.float32_dtype_twotorch.float32,short,False,3.127072,0.000000 +PyTorch,div_,div__M64_N64_K64_cpu_dtype_onetorch.float32_dtype_twotorch.float32,short,False,59.241161,0.000000 +PyTorch,div_,div__M64_N64_K128_cpu_dtype_onetorch.float32_dtype_twotorch.float32,short,False,59.852816,0.000000 +PyTorch,add,"add_in_one[64,1,64]_in_two[1,64,1]_cpu_dtypetorch.float32",short,False,57.006677,0.000000 +PyTorch,sub,"sub_in_one[64,1,64]_in_two[1,64,1]_cpu_dtypetorch.float32",short,False,55.606088,0.000000 +PyTorch,div,"div_in_one[64,1,64]_in_two[1,64,1]_cpu_dtypetorch.float32",short,False,58.529255,0.000000 +PyTorch,mul,"mul_in_one[64,1,64]_in_two[1,64,1]_cpu_dtypetorch.float32",short,False,54.645077,0.000000 +PyTorch,add,add_M1_N1_K1_cpu_dtype_onetorch.int32_dtype_twotorch.int32,short,False,4.397014,0.000000 +PyTorch,add,add_M64_N64_K64_cpu_dtype_onetorch.int32_dtype_twotorch.int32,short,False,59.243500,0.000000 +PyTorch,add,add_M64_N64_K128_cpu_dtype_onetorch.int32_dtype_twotorch.int32,short,False,57.947691,0.000000 +PyTorch,sub,sub_M1_N1_K1_cpu_dtype_onetorch.int32_dtype_twotorch.int32,short,False,1.925851,0.000000 +PyTorch,sub,sub_M64_N64_K64_cpu_dtype_onetorch.int32_dtype_twotorch.int32,short,False,57.308320,0.000000 +PyTorch,sub,sub_M64_N64_K128_cpu_dtype_onetorch.int32_dtype_twotorch.int32,short,False,57.787743,0.000000 +PyTorch,div,div_M1_N1_K1_cpu_dtype_onetorch.int32_dtype_twotorch.int32,short,False,7.978539,0.000000 +PyTorch,div,div_M64_N64_K64_cpu_dtype_onetorch.int32_dtype_twotorch.int32,short,False,159.754860,0.000000 +PyTorch,div,div_M64_N64_K128_cpu_dtype_onetorch.int32_dtype_twotorch.int32,short,False,165.360235,0.000000 +PyTorch,mul,mul_M1_N1_K1_cpu_dtype_onetorch.int32_dtype_twotorch.int32,short,False,3.928136,0.000000 +PyTorch,mul,mul_M64_N64_K64_cpu_dtype_onetorch.int32_dtype_twotorch.int32,short,False,56.413499,0.000000 
+PyTorch,mul,mul_M64_N64_K128_cpu_dtype_onetorch.int32_dtype_twotorch.int32,short,False,55.925090,0.000000 +PyTorch,logical_and,"logical_and_in_one[64,1,64]_in_two[1,64,1]_cpu_dtypetorch.bool",short,False,78.404254,0.000000 +PyTorch,logical_and,logical_and_M1_N1_K1_cpu_dtype_onetorch.bool_dtype_twotorch.bool,short,False,5.354032,0.000000 +PyTorch,logical_and,logical_and_M64_N64_K64_cpu_dtype_onetorch.bool_dtype_twotorch.bool,short,False,54.072783,0.000000 +PyTorch,logical_and,logical_and_M64_N64_K128_cpu_dtype_onetorch.bool_dtype_twotorch.bool,short,False,53.680283,0.000000 +PyTorch,bmm,bmm_B2_M1_N8_K2_cpu_dtypetorch.float32,short,False,4.407892,0.000000 +PyTorch,bmm,bmm_B2_M1_N8_K2_cpu_dtypetorch.bfloat16,short,False,4.213927,0.000000 +PyTorch,bmm,bmm_B128_M64_N32_K64_cpu_dtypetorch.float32,short,False,200.303424,0.000000 +PyTorch,bmm,bmm_B128_M64_N32_K64_cpu_dtypetorch.bfloat16,short,False,229.912606,0.000000 +PyTorch,baddbmm,baddbmm_B2_M1_N8_K2_cpu_dtypetorch.float32,short,False,6.631313,0.000000 +PyTorch,baddbmm,baddbmm_B2_M1_N8_K2_cpu_dtypetorch.bfloat16,short,False,6.476986,0.000000 +PyTorch,baddbmm,baddbmm_B128_M64_N32_K64_cpu_dtypetorch.float32,short,False,266.065131,0.000000 +PyTorch,baddbmm,baddbmm_B128_M64_N32_K64_cpu_dtypetorch.bfloat16,short,False,295.503063,0.000000 +PyTorch,cat,"cat_sizes(1,1,1)_N2_dim0_cpu",short,False,4.301950,0.000000 +PyTorch,cat,"cat_sizes(512,512,2)_N2_dim1_cpu",short,False,99.093415,0.000000 +PyTorch,cat,"cat_sizes(128,1024,2)_N2_dim1_cpu",short,False,96.771578,0.000000 +PyTorch,channel_shuffle,channel_shuffle_batch_size2_channels_per_group16_height16_width16_groups2_channel_lastTrue,short,False,52.475549,0.000000 +PyTorch,channel_shuffle,channel_shuffle_batch_size2_channels_per_group16_height16_width16_groups2_channel_lastFalse,short,False,46.483135,0.000000 +PyTorch,channel_shuffle,channel_shuffle_batch_size2_channels_per_group32_height32_width32_groups2_channel_lastTrue,short,False,57.179441,0.000000 
+PyTorch,channel_shuffle,channel_shuffle_batch_size2_channels_per_group32_height32_width32_groups2_channel_lastFalse,short,False,51.114112,0.000000 +PyTorch,channel_shuffle,channel_shuffle_batch_size4_channels_per_group32_height32_width32_groups4_channel_lastTrue,short,False,77.045573,0.000000 +PyTorch,channel_shuffle,channel_shuffle_batch_size4_channels_per_group32_height32_width32_groups4_channel_lastFalse,short,False,57.527440,0.000000 +PyTorch,channel_shuffle,channel_shuffle_batch_size4_channels_per_group64_height64_width64_groups4_channel_lastTrue,short,False,299.237060,0.000000 +PyTorch,channel_shuffle,channel_shuffle_batch_size4_channels_per_group64_height64_width64_groups4_channel_lastFalse,short,False,165.268507,0.000000 +PyTorch,channel_shuffle,channel_shuffle_batch_size8_channels_per_group64_height64_width64_groups8_channel_lastTrue,short,False,1034.480289,0.000000 +PyTorch,channel_shuffle,channel_shuffle_batch_size8_channels_per_group64_height64_width64_groups8_channel_lastFalse,short,False,627.552450,0.000000 +PyTorch,channel_shuffle,channel_shuffle_batch_size16_channels_per_group64_height64_width64_groups16_channel_lastTrue,short,False,4709.313910,0.000000 +PyTorch,channel_shuffle,channel_shuffle_batch_size16_channels_per_group64_height64_width64_groups16_channel_lastFalse,short,False,2470.991690,0.000000 +PyTorch,chunk,chunk_M8_N8_chunks2_cpu,short,False,6.881959,0.000000 +PyTorch,chunk,chunk_M256_N512_chunks2_cpu,short,False,7.016489,0.000000 +PyTorch,chunk,chunk_M512_N512_chunks2_cpu,short,False,6.829479,0.000000 +PyTorch,Conv1d,Conv1d_IC128_OC256_kernel3_stride1_N1_L64_cpu,short,False,161.526501,0.000000 +PyTorch,Conv1d,Conv1d_IC256_OC256_kernel3_stride2_N4_L64_cpu,short,False,389.396360,0.000000 +PyTorch,Conv2d,Conv2d_IC256_OC256_kernel3_stride1_N1_H16_W16_G1_pad0_cpu,short,False,837.232033,0.000000 +PyTorch,ConvTranspose2d,ConvTranspose2d_IC256_OC256_kernel3_stride1_N1_H16_W16_G1_pad0_cpu,short,False,1259.104354,0.000000 
+PyTorch,Conv2dPointwise,Conv2dPointwise_IC256_OC256_stride1_N1_H16_W16_G1_pad0_cpu,short,False,423.592581,0.000000 +PyTorch,Conv3d,Conv3d_IC64_OC64_kernel3_stride1_N8_D4_H16_W16_cpu,short,False,4713.401237,0.000000 +PyTorch,ConvTranspose3d,ConvTranspose3d_IC64_OC64_kernel3_stride1_N8_D4_H16_W16_cpu,short,False,9798.085490,0.000000 +PyTorch,diag,diag_dim1_M64_N64_diagonal0_outTrue_cpu,short,False,9.983573,0.000000 +PyTorch,diag,diag_dim2_M128_N128_diagonal-10_outFalse_cpu,short,False,7.817579,0.000000 +PyTorch,diag,diag_dim1_M256_N256_diagonal20_outTrue_cpu,short,False,102.008750,0.000000 +PyTorch,embeddingbag,embeddingbag_embeddingbags10_dim64_modesum_input_size8_offset0_sparseTrue_include_last_offsetTrue_cpu,short,False,25.932070,0.000000 +PyTorch,embeddingbag,embeddingbag_embeddingbags10_dim64_modesum_input_size8_offset0_sparseTrue_include_last_offsetFalse_cpu,short,False,79.094040,0.000000 +PyTorch,embeddingbag,embeddingbag_embeddingbags10_dim64_modesum_input_size8_offset0_sparseFalse_include_last_offsetTrue_cpu,short,False,25.618948,0.000000 +PyTorch,embeddingbag,embeddingbag_embeddingbags10_dim64_modesum_input_size8_offset0_sparseFalse_include_last_offsetFalse_cpu,short,False,71.670897,0.000000 +PyTorch,embeddingbag,embeddingbag_embeddingbags10_dim64_modesum_input_size16_offset0_sparseTrue_include_last_offsetTrue_cpu,short,False,25.800482,0.000000 +PyTorch,embeddingbag,embeddingbag_embeddingbags10_dim64_modesum_input_size16_offset0_sparseTrue_include_last_offsetFalse_cpu,short,False,63.936052,0.000000 +PyTorch,embeddingbag,embeddingbag_embeddingbags10_dim64_modesum_input_size16_offset0_sparseFalse_include_last_offsetTrue_cpu,short,False,25.779446,0.000000 +PyTorch,embeddingbag,embeddingbag_embeddingbags10_dim64_modesum_input_size16_offset0_sparseFalse_include_last_offsetFalse_cpu,short,False,70.597326,0.000000 
+PyTorch,embeddingbag,embeddingbag_embeddingbags10_dim64_modesum_input_size64_offset0_sparseTrue_include_last_offsetTrue_cpu,short,False,26.118981,0.000000 +PyTorch,embeddingbag,embeddingbag_embeddingbags10_dim64_modesum_input_size64_offset0_sparseTrue_include_last_offsetFalse_cpu,short,False,62.572553,0.000000 +PyTorch,embeddingbag,embeddingbag_embeddingbags10_dim64_modesum_input_size64_offset0_sparseFalse_include_last_offsetTrue_cpu,short,False,26.209740,0.000000 +PyTorch,embeddingbag,embeddingbag_embeddingbags10_dim64_modesum_input_size64_offset0_sparseFalse_include_last_offsetFalse_cpu,short,False,62.822163,0.000000 +PyTorch,embeddingbag,embeddingbag_embeddingbags120_dim64_modesum_input_size8_offset0_sparseTrue_include_last_offsetTrue_cpu,short,False,25.702759,0.000000 +PyTorch,embeddingbag,embeddingbag_embeddingbags120_dim64_modesum_input_size8_offset0_sparseTrue_include_last_offsetFalse_cpu,short,False,66.037250,0.000000 +PyTorch,embeddingbag,embeddingbag_embeddingbags120_dim64_modesum_input_size8_offset0_sparseFalse_include_last_offsetTrue_cpu,short,False,25.827319,0.000000 +PyTorch,embeddingbag,embeddingbag_embeddingbags120_dim64_modesum_input_size8_offset0_sparseFalse_include_last_offsetFalse_cpu,short,False,71.249488,0.000000 +PyTorch,embeddingbag,embeddingbag_embeddingbags120_dim64_modesum_input_size16_offset0_sparseTrue_include_last_offsetTrue_cpu,short,False,25.775656,0.000000 +PyTorch,embeddingbag,embeddingbag_embeddingbags120_dim64_modesum_input_size16_offset0_sparseTrue_include_last_offsetFalse_cpu,short,False,62.907740,0.000000 +PyTorch,embeddingbag,embeddingbag_embeddingbags120_dim64_modesum_input_size16_offset0_sparseFalse_include_last_offsetTrue_cpu,short,False,25.834111,0.000000 +PyTorch,embeddingbag,embeddingbag_embeddingbags120_dim64_modesum_input_size16_offset0_sparseFalse_include_last_offsetFalse_cpu,short,False,75.054840,0.000000 
+PyTorch,embeddingbag,embeddingbag_embeddingbags120_dim64_modesum_input_size64_offset0_sparseTrue_include_last_offsetTrue_cpu,short,False,26.253773,0.000000 +PyTorch,embeddingbag,embeddingbag_embeddingbags120_dim64_modesum_input_size64_offset0_sparseTrue_include_last_offsetFalse_cpu,short,False,61.943780,0.000000 +PyTorch,embeddingbag,embeddingbag_embeddingbags120_dim64_modesum_input_size64_offset0_sparseFalse_include_last_offsetTrue_cpu,short,False,26.276609,0.000000 +PyTorch,embeddingbag,embeddingbag_embeddingbags120_dim64_modesum_input_size64_offset0_sparseFalse_include_last_offsetFalse_cpu,short,False,61.851260,0.000000 +PyTorch,embeddingbag,embeddingbag_embeddingbags1000_dim64_modesum_input_size8_offset0_sparseTrue_include_last_offsetTrue_cpu,short,False,25.689124,0.000000 +PyTorch,embeddingbag,embeddingbag_embeddingbags1000_dim64_modesum_input_size8_offset0_sparseTrue_include_last_offsetFalse_cpu,short,False,69.262678,0.000000 +PyTorch,embeddingbag,embeddingbag_embeddingbags1000_dim64_modesum_input_size8_offset0_sparseFalse_include_last_offsetTrue_cpu,short,False,25.672505,0.000000 +PyTorch,embeddingbag,embeddingbag_embeddingbags1000_dim64_modesum_input_size8_offset0_sparseFalse_include_last_offsetFalse_cpu,short,False,73.133838,0.000000 +PyTorch,embeddingbag,embeddingbag_embeddingbags1000_dim64_modesum_input_size16_offset0_sparseTrue_include_last_offsetTrue_cpu,short,False,25.631939,0.000000 +PyTorch,embeddingbag,embeddingbag_embeddingbags1000_dim64_modesum_input_size16_offset0_sparseTrue_include_last_offsetFalse_cpu,short,False,66.750426,0.000000 +PyTorch,embeddingbag,embeddingbag_embeddingbags1000_dim64_modesum_input_size16_offset0_sparseFalse_include_last_offsetTrue_cpu,short,False,25.913212,0.000000 +PyTorch,embeddingbag,embeddingbag_embeddingbags1000_dim64_modesum_input_size16_offset0_sparseFalse_include_last_offsetFalse_cpu,short,False,64.675854,0.000000 
+PyTorch,embeddingbag,embeddingbag_embeddingbags1000_dim64_modesum_input_size64_offset0_sparseTrue_include_last_offsetTrue_cpu,short,False,26.447855,0.000000 +PyTorch,embeddingbag,embeddingbag_embeddingbags1000_dim64_modesum_input_size64_offset0_sparseTrue_include_last_offsetFalse_cpu,short,False,61.601586,0.000000 +PyTorch,embeddingbag,embeddingbag_embeddingbags1000_dim64_modesum_input_size64_offset0_sparseFalse_include_last_offsetTrue_cpu,short,False,26.252401,0.000000 +PyTorch,embeddingbag,embeddingbag_embeddingbags1000_dim64_modesum_input_size64_offset0_sparseFalse_include_last_offsetFalse_cpu,short,False,61.955597,0.000000 +PyTorch,embeddingbag,embeddingbag_embeddingbags2300_dim64_modesum_input_size8_offset0_sparseTrue_include_last_offsetTrue_cpu,short,False,25.703098,0.000000 +PyTorch,embeddingbag,embeddingbag_embeddingbags2300_dim64_modesum_input_size8_offset0_sparseTrue_include_last_offsetFalse_cpu,short,False,68.315884,0.000000 +PyTorch,embeddingbag,embeddingbag_embeddingbags2300_dim64_modesum_input_size8_offset0_sparseFalse_include_last_offsetTrue_cpu,short,False,25.807940,0.000000 +PyTorch,embeddingbag,embeddingbag_embeddingbags2300_dim64_modesum_input_size8_offset0_sparseFalse_include_last_offsetFalse_cpu,short,False,75.701812,0.000000 +PyTorch,embeddingbag,embeddingbag_embeddingbags2300_dim64_modesum_input_size16_offset0_sparseTrue_include_last_offsetTrue_cpu,short,False,25.857585,0.000000 +PyTorch,embeddingbag,embeddingbag_embeddingbags2300_dim64_modesum_input_size16_offset0_sparseTrue_include_last_offsetFalse_cpu,short,False,62.865699,0.000000 +PyTorch,embeddingbag,embeddingbag_embeddingbags2300_dim64_modesum_input_size16_offset0_sparseFalse_include_last_offsetTrue_cpu,short,False,25.785043,0.000000 +PyTorch,embeddingbag,embeddingbag_embeddingbags2300_dim64_modesum_input_size16_offset0_sparseFalse_include_last_offsetFalse_cpu,short,False,63.303901,0.000000 
+PyTorch,embeddingbag,embeddingbag_embeddingbags2300_dim64_modesum_input_size64_offset0_sparseTrue_include_last_offsetTrue_cpu,short,False,26.329548,0.000000 +PyTorch,embeddingbag,embeddingbag_embeddingbags2300_dim64_modesum_input_size64_offset0_sparseTrue_include_last_offsetFalse_cpu,short,False,61.085350,0.000000 +PyTorch,embeddingbag,embeddingbag_embeddingbags2300_dim64_modesum_input_size64_offset0_sparseFalse_include_last_offsetTrue_cpu,short,False,26.401250,0.000000 +PyTorch,embeddingbag,embeddingbag_embeddingbags2300_dim64_modesum_input_size64_offset0_sparseFalse_include_last_offsetFalse_cpu,short,False,61.327850,0.000000 +PyTorch,embeddingbag,embeddingbag_embeddingbags10_dim64_modesum_input_size8_offset0_sparseTrue_include_last_offsetTrue_cpu_BACKWARD,short,True,76.646453,0.000000 +PyTorch,embeddingbag,embeddingbag_embeddingbags10_dim64_modesum_input_size8_offset0_sparseTrue_include_last_offsetFalse_cpu_BACKWARD,short,True,76.408263,0.000000 +PyTorch,embeddingbag,embeddingbag_embeddingbags10_dim64_modesum_input_size8_offset0_sparseFalse_include_last_offsetTrue_cpu_BACKWARD,short,True,66.143049,0.000000 +PyTorch,embeddingbag,embeddingbag_embeddingbags10_dim64_modesum_input_size8_offset0_sparseFalse_include_last_offsetFalse_cpu_BACKWARD,short,True,66.626689,0.000000 +PyTorch,embeddingbag,embeddingbag_embeddingbags10_dim64_modesum_input_size16_offset0_sparseTrue_include_last_offsetTrue_cpu_BACKWARD,short,True,78.586541,0.000000 +PyTorch,embeddingbag,embeddingbag_embeddingbags10_dim64_modesum_input_size16_offset0_sparseTrue_include_last_offsetFalse_cpu_BACKWARD,short,True,78.437226,0.000000 +PyTorch,embeddingbag,embeddingbag_embeddingbags10_dim64_modesum_input_size16_offset0_sparseFalse_include_last_offsetTrue_cpu_BACKWARD,short,True,67.294776,0.000000 +PyTorch,embeddingbag,embeddingbag_embeddingbags10_dim64_modesum_input_size16_offset0_sparseFalse_include_last_offsetFalse_cpu_BACKWARD,short,True,67.519295,0.000000 
+PyTorch,embeddingbag,embeddingbag_embeddingbags10_dim64_modesum_input_size64_offset0_sparseTrue_include_last_offsetTrue_cpu_BACKWARD,short,True,83.240654,0.000000 +PyTorch,embeddingbag,embeddingbag_embeddingbags10_dim64_modesum_input_size64_offset0_sparseTrue_include_last_offsetFalse_cpu_BACKWARD,short,True,82.798171,0.000000 +PyTorch,embeddingbag,embeddingbag_embeddingbags10_dim64_modesum_input_size64_offset0_sparseFalse_include_last_offsetTrue_cpu_BACKWARD,short,True,70.350631,0.000000 +PyTorch,embeddingbag,embeddingbag_embeddingbags10_dim64_modesum_input_size64_offset0_sparseFalse_include_last_offsetFalse_cpu_BACKWARD,short,True,71.047552,0.000000 +PyTorch,embeddingbag,embeddingbag_embeddingbags120_dim64_modesum_input_size8_offset0_sparseTrue_include_last_offsetTrue_cpu_BACKWARD,short,True,76.947381,0.000000 +PyTorch,embeddingbag,embeddingbag_embeddingbags120_dim64_modesum_input_size8_offset0_sparseTrue_include_last_offsetFalse_cpu_BACKWARD,short,True,76.043851,0.000000 +PyTorch,embeddingbag,embeddingbag_embeddingbags120_dim64_modesum_input_size8_offset0_sparseFalse_include_last_offsetTrue_cpu_BACKWARD,short,True,68.641934,0.000000 +PyTorch,embeddingbag,embeddingbag_embeddingbags120_dim64_modesum_input_size8_offset0_sparseFalse_include_last_offsetFalse_cpu_BACKWARD,short,True,68.768893,0.000000 +PyTorch,embeddingbag,embeddingbag_embeddingbags120_dim64_modesum_input_size16_offset0_sparseTrue_include_last_offsetTrue_cpu_BACKWARD,short,True,78.648941,0.000000 +PyTorch,embeddingbag,embeddingbag_embeddingbags120_dim64_modesum_input_size16_offset0_sparseTrue_include_last_offsetFalse_cpu_BACKWARD,short,True,77.599791,0.000000 +PyTorch,embeddingbag,embeddingbag_embeddingbags120_dim64_modesum_input_size16_offset0_sparseFalse_include_last_offsetTrue_cpu_BACKWARD,short,True,69.483032,0.000000 +PyTorch,embeddingbag,embeddingbag_embeddingbags120_dim64_modesum_input_size16_offset0_sparseFalse_include_last_offsetFalse_cpu_BACKWARD,short,True,69.184328,0.000000 
+PyTorch,embeddingbag,embeddingbag_embeddingbags120_dim64_modesum_input_size64_offset0_sparseTrue_include_last_offsetTrue_cpu_BACKWARD,short,True,83.075783,0.000000 +PyTorch,embeddingbag,embeddingbag_embeddingbags120_dim64_modesum_input_size64_offset0_sparseTrue_include_last_offsetFalse_cpu_BACKWARD,short,True,83.171316,0.000000 +PyTorch,embeddingbag,embeddingbag_embeddingbags120_dim64_modesum_input_size64_offset0_sparseFalse_include_last_offsetTrue_cpu_BACKWARD,short,True,72.100870,0.000000 +PyTorch,embeddingbag,embeddingbag_embeddingbags120_dim64_modesum_input_size64_offset0_sparseFalse_include_last_offsetFalse_cpu_BACKWARD,short,True,72.667771,0.000000 +PyTorch,embeddingbag,embeddingbag_embeddingbags1000_dim64_modesum_input_size8_offset0_sparseTrue_include_last_offsetTrue_cpu_BACKWARD,short,True,77.178308,0.000000 +PyTorch,embeddingbag,embeddingbag_embeddingbags1000_dim64_modesum_input_size8_offset0_sparseTrue_include_last_offsetFalse_cpu_BACKWARD,short,True,76.987765,0.000000 +PyTorch,embeddingbag,embeddingbag_embeddingbags1000_dim64_modesum_input_size8_offset0_sparseFalse_include_last_offsetTrue_cpu_BACKWARD,short,True,173.891298,0.000000 +PyTorch,embeddingbag,embeddingbag_embeddingbags1000_dim64_modesum_input_size8_offset0_sparseFalse_include_last_offsetFalse_cpu_BACKWARD,short,True,174.383305,0.000000 +PyTorch,embeddingbag,embeddingbag_embeddingbags1000_dim64_modesum_input_size16_offset0_sparseTrue_include_last_offsetTrue_cpu_BACKWARD,short,True,78.001683,0.000000 +PyTorch,embeddingbag,embeddingbag_embeddingbags1000_dim64_modesum_input_size16_offset0_sparseTrue_include_last_offsetFalse_cpu_BACKWARD,short,True,78.145431,0.000000 +PyTorch,embeddingbag,embeddingbag_embeddingbags1000_dim64_modesum_input_size16_offset0_sparseFalse_include_last_offsetTrue_cpu_BACKWARD,short,True,174.426247,0.000000 +PyTorch,embeddingbag,embeddingbag_embeddingbags1000_dim64_modesum_input_size16_offset0_sparseFalse_include_last_offsetFalse_cpu_BACKWARD,short,True,173.456537,0.000000 
+PyTorch,embeddingbag,embeddingbag_embeddingbags1000_dim64_modesum_input_size64_offset0_sparseTrue_include_last_offsetTrue_cpu_BACKWARD,short,True,83.578019,0.000000 +PyTorch,embeddingbag,embeddingbag_embeddingbags1000_dim64_modesum_input_size64_offset0_sparseTrue_include_last_offsetFalse_cpu_BACKWARD,short,True,83.350259,0.000000 +PyTorch,embeddingbag,embeddingbag_embeddingbags1000_dim64_modesum_input_size64_offset0_sparseFalse_include_last_offsetTrue_cpu_BACKWARD,short,True,179.564871,0.000000 +PyTorch,embeddingbag,embeddingbag_embeddingbags1000_dim64_modesum_input_size64_offset0_sparseFalse_include_last_offsetFalse_cpu_BACKWARD,short,True,181.208623,0.000000 +PyTorch,embeddingbag,embeddingbag_embeddingbags2300_dim64_modesum_input_size8_offset0_sparseTrue_include_last_offsetTrue_cpu_BACKWARD,short,True,76.724585,0.000000 +PyTorch,embeddingbag,embeddingbag_embeddingbags2300_dim64_modesum_input_size8_offset0_sparseTrue_include_last_offsetFalse_cpu_BACKWARD,short,True,77.335260,0.000000 +PyTorch,embeddingbag,embeddingbag_embeddingbags2300_dim64_modesum_input_size8_offset0_sparseFalse_include_last_offsetTrue_cpu_BACKWARD,short,True,172.416292,0.000000 +PyTorch,embeddingbag,embeddingbag_embeddingbags2300_dim64_modesum_input_size8_offset0_sparseFalse_include_last_offsetFalse_cpu_BACKWARD,short,True,170.913750,0.000000 +PyTorch,embeddingbag,embeddingbag_embeddingbags2300_dim64_modesum_input_size16_offset0_sparseTrue_include_last_offsetTrue_cpu_BACKWARD,short,True,77.864377,0.000000 +PyTorch,embeddingbag,embeddingbag_embeddingbags2300_dim64_modesum_input_size16_offset0_sparseTrue_include_last_offsetFalse_cpu_BACKWARD,short,True,77.955812,0.000000 +PyTorch,embeddingbag,embeddingbag_embeddingbags2300_dim64_modesum_input_size16_offset0_sparseFalse_include_last_offsetTrue_cpu_BACKWARD,short,True,173.070785,0.000000 
+PyTorch,embeddingbag,embeddingbag_embeddingbags2300_dim64_modesum_input_size16_offset0_sparseFalse_include_last_offsetFalse_cpu_BACKWARD,short,True,173.094255,0.000000 +PyTorch,embeddingbag,embeddingbag_embeddingbags2300_dim64_modesum_input_size64_offset0_sparseTrue_include_last_offsetTrue_cpu_BACKWARD,short,True,82.591598,0.000000 +PyTorch,embeddingbag,embeddingbag_embeddingbags2300_dim64_modesum_input_size64_offset0_sparseTrue_include_last_offsetFalse_cpu_BACKWARD,short,True,82.869897,0.000000 +PyTorch,embeddingbag,embeddingbag_embeddingbags2300_dim64_modesum_input_size64_offset0_sparseFalse_include_last_offsetTrue_cpu_BACKWARD,short,True,181.269854,0.000000 +PyTorch,embeddingbag,embeddingbag_embeddingbags2300_dim64_modesum_input_size64_offset0_sparseFalse_include_last_offsetFalse_cpu_BACKWARD,short,True,181.079995,0.000000 +PyTorch,embedding,embedding_num_embeddings10_embedding_dim64_input_size8_cpu,short,False,13.257645,0.000000 +PyTorch,embedding,embedding_num_embeddings10_embedding_dim64_input_size16_cpu,short,False,13.274894,0.000000 +PyTorch,embedding,embedding_num_embeddings10_embedding_dim64_input_size64_cpu,short,False,13.594135,0.000000 +PyTorch,embedding,embedding_num_embeddings120_embedding_dim64_input_size8_cpu,short,False,13.210569,0.000000 +PyTorch,embedding,embedding_num_embeddings120_embedding_dim64_input_size16_cpu,short,False,13.358302,0.000000 +PyTorch,embedding,embedding_num_embeddings120_embedding_dim64_input_size64_cpu,short,False,13.676537,0.000000 +PyTorch,embedding,embedding_num_embeddings1000_embedding_dim64_input_size8_cpu,short,False,13.230114,0.000000 +PyTorch,embedding,embedding_num_embeddings1000_embedding_dim64_input_size16_cpu,short,False,13.316872,0.000000 +PyTorch,embedding,embedding_num_embeddings1000_embedding_dim64_input_size64_cpu,short,False,13.728165,0.000000 +PyTorch,embedding,embedding_num_embeddings2300_embedding_dim64_input_size8_cpu,short,False,13.240829,0.000000 
+PyTorch,embedding,embedding_num_embeddings2300_embedding_dim64_input_size16_cpu,short,False,13.322630,0.000000 +PyTorch,embedding,embedding_num_embeddings2300_embedding_dim64_input_size64_cpu,short,False,13.678991,0.000000 +PyTorch,embedding,embedding_num_embeddings10_embedding_dim64_input_size8_cpu_BACKWARD,short,True,52.434260,0.000000 +PyTorch,embedding,embedding_num_embeddings10_embedding_dim64_input_size16_cpu_BACKWARD,short,True,54.270657,0.000000 +PyTorch,embedding,embedding_num_embeddings10_embedding_dim64_input_size64_cpu_BACKWARD,short,True,60.054990,0.000000 +PyTorch,embedding,embedding_num_embeddings120_embedding_dim64_input_size8_cpu_BACKWARD,short,True,55.491721,0.000000 +PyTorch,embedding,embedding_num_embeddings120_embedding_dim64_input_size16_cpu_BACKWARD,short,True,56.325304,0.000000 +PyTorch,embedding,embedding_num_embeddings120_embedding_dim64_input_size64_cpu_BACKWARD,short,True,61.959455,0.000000 +PyTorch,embedding,embedding_num_embeddings1000_embedding_dim64_input_size8_cpu_BACKWARD,short,True,158.577292,0.000000 +PyTorch,embedding,embedding_num_embeddings1000_embedding_dim64_input_size16_cpu_BACKWARD,short,True,157.616690,0.000000 +PyTorch,embedding,embedding_num_embeddings1000_embedding_dim64_input_size64_cpu_BACKWARD,short,True,164.962560,0.000000 +PyTorch,embedding,embedding_num_embeddings2300_embedding_dim64_input_size8_cpu_BACKWARD,short,True,191.301190,0.000000 +PyTorch,embedding,embedding_num_embeddings2300_embedding_dim64_input_size16_cpu_BACKWARD,short,True,196.503447,0.000000 +PyTorch,embedding,embedding_num_embeddings2300_embedding_dim64_input_size64_cpu_BACKWARD,short,True,201.295830,0.000000 +PyTorch,fill_,fill__N1_cpu_dtypetorch.int32,short,False,1.126186,0.000000 +PyTorch,fill_,fill__N1024_cpu_dtypetorch.int32,short,False,2.565226,0.000000 +PyTorch,fill_,fill__N2048_cpu_dtypetorch.int32,short,False,2.978169,0.000000 +PyTorch,gather,gather_M256_N512_dim0_cpu,short,False,113.958748,0.000000 
+PyTorch,gather,gather_M512_N512_dim1_cpu,short,False,72.347757,0.000000 +PyTorch,GroupNormBenchmark,"GroupNormBenchmark_dims(32,8,16)_num_groups2",short,False,60.884617,0.000000 +PyTorch,GroupNormBenchmark,"GroupNormBenchmark_dims(32,8,16)_num_groups4",short,False,53.373645,0.000000 +PyTorch,GroupNormBenchmark,"GroupNormBenchmark_dims(32,8,56,56)_num_groups2",short,False,113.483659,0.000000 +PyTorch,GroupNormBenchmark,"GroupNormBenchmark_dims(32,8,56,56)_num_groups4",short,False,114.206127,0.000000 +PyTorch,Hardsigmoid,Hardsigmoid_N1_C3_H256_W256_cpu,short,False,66.121431,0.000000 +PyTorch,Hardsigmoid,Hardsigmoid_N4_C3_H256_W256_cpu,short,False,74.423833,0.000000 +PyTorch,Hardswish,Hardswish_N1_C3_H256_W256_cpu,short,False,67.379220,0.000000 +PyTorch,Hardswish,Hardswish_N4_C3_H256_W256_cpu,short,False,82.693655,0.000000 +PyTorch,index_add_,index_add__M8_N32_K1_dim0_cpu_dtypetorch.float32,short,False,7.053411,0.000000 +PyTorch,index_add_,index_add__M256_N512_K1_dim1_cpu_dtypetorch.float32,short,False,13.263054,0.000000 +PyTorch,index_add_,index_add__M512_N512_K1_dim2_cpu_dtypetorch.float32,short,False,108.319590,0.000000 +PyTorch,index_select,index_select_M8_N8_K1_dim1_cpu,short,False,4.514675,0.000000 +PyTorch,index_select,index_select_M256_N512_K1_dim1_cpu,short,False,54.654160,0.000000 +PyTorch,index_select,index_select_M512_N512_K1_dim1_cpu,short,False,103.358516,0.000000 +PyTorch,index_select,index_select_M8_N8_K2_dim1_cpu,short,False,4.561579,0.000000 +PyTorch,index_select,index_select_M256_N512_K2_dim1_cpu,short,False,212.789483,0.000000 +PyTorch,index_select,index_select_M512_N512_K2_dim1_cpu,short,False,430.552168,0.000000 +PyTorch,InstanceNormBenchmark,"InstanceNormBenchmark_dims(32,8,16)",short,False,169.785802,0.000000 +PyTorch,InstanceNormBenchmark,"InstanceNormBenchmark_dims(32,8,56,56)",short,False,359.232437,0.000000 
+PyTorch,interpolate,"interpolate_input_size(1,3,60,40)_output_size(24,24)_channels_lastTrue_modenearest",short,False,10.529644,0.000000 +PyTorch,interpolate,"interpolate_input_size(1,3,60,40)_output_size(24,24)_channels_lastTrue_modelinear",short,False,12.189028,0.000000 +PyTorch,interpolate,"interpolate_input_size(1,3,60,40)_output_size(24,24)_channels_lastTrue_modebicubic",short,False,46.246996,0.000000 +PyTorch,interpolate,"interpolate_input_size(1,3,60,40)_output_size(24,24)_channels_lastFalse_modenearest",short,False,22.743285,0.000000 +PyTorch,interpolate,"interpolate_input_size(1,3,60,40)_output_size(24,24)_channels_lastFalse_modelinear",short,False,24.601899,0.000000 +PyTorch,interpolate,"interpolate_input_size(1,3,60,40)_output_size(24,24)_channels_lastFalse_modebicubic",short,False,34.769822,0.000000 +PyTorch,interpolate,"interpolate_input_size(1,3,600,400)_output_size(240,240)_channels_lastTrue_modenearest",short,False,128.987081,0.000000 +PyTorch,interpolate,"interpolate_input_size(1,3,600,400)_output_size(240,240)_channels_lastTrue_modelinear",short,False,193.039880,0.000000 +PyTorch,interpolate,"interpolate_input_size(1,3,600,400)_output_size(240,240)_channels_lastTrue_modebicubic",short,False,487.996140,0.000000 +PyTorch,interpolate,"interpolate_input_size(1,3,600,400)_output_size(240,240)_channels_lastFalse_modenearest",short,False,80.409450,0.000000 +PyTorch,interpolate,"interpolate_input_size(1,3,600,400)_output_size(240,240)_channels_lastFalse_modelinear",short,False,112.757609,0.000000 +PyTorch,interpolate,"interpolate_input_size(1,3,600,400)_output_size(240,240)_channels_lastFalse_modebicubic",short,False,291.153090,0.000000 +PyTorch,interpolate,"interpolate_input_size(1,3,320,320)_output_size(256,256)_channels_lastTrue_modenearest",short,False,136.694490,0.000000 +PyTorch,interpolate,"interpolate_input_size(1,3,320,320)_output_size(256,256)_channels_lastTrue_modelinear",short,False,207.920459,0.000000 
+PyTorch,interpolate,"interpolate_input_size(1,3,320,320)_output_size(256,256)_channels_lastTrue_modebicubic",short,False,547.632725,0.000000 +PyTorch,interpolate,"interpolate_input_size(1,3,320,320)_output_size(256,256)_channels_lastFalse_modenearest",short,False,81.090366,0.000000 +PyTorch,interpolate,"interpolate_input_size(1,3,320,320)_output_size(256,256)_channels_lastFalse_modelinear",short,False,117.256844,0.000000 +PyTorch,interpolate,"interpolate_input_size(1,3,320,320)_output_size(256,256)_channels_lastFalse_modebicubic",short,False,319.923544,0.000000 +PyTorch,interpolate,"interpolate_input_size(1,1,60,40)_output_size(24,24)_channels_lastTrue_modenearest",short,False,10.135673,0.000000 +PyTorch,interpolate,"interpolate_input_size(1,1,60,40)_output_size(24,24)_channels_lastTrue_modelinear",short,False,11.241479,0.000000 +PyTorch,interpolate,"interpolate_input_size(1,1,60,40)_output_size(24,24)_channels_lastTrue_modebicubic",short,False,25.862923,0.000000 +PyTorch,interpolate,"interpolate_input_size(1,1,60,40)_output_size(24,24)_channels_lastFalse_modenearest",short,False,9.880939,0.000000 +PyTorch,interpolate,"interpolate_input_size(1,1,60,40)_output_size(24,24)_channels_lastFalse_modelinear",short,False,11.446106,0.000000 +PyTorch,interpolate,"interpolate_input_size(1,1,60,40)_output_size(24,24)_channels_lastFalse_modebicubic",short,False,25.877143,0.000000 +PyTorch,interpolate,"interpolate_input_size(1,1,600,400)_output_size(240,240)_channels_lastTrue_modenearest",short,False,80.987965,0.000000 +PyTorch,interpolate,"interpolate_input_size(1,1,600,400)_output_size(240,240)_channels_lastTrue_modelinear",short,False,112.928955,0.000000 +PyTorch,interpolate,"interpolate_input_size(1,1,600,400)_output_size(240,240)_channels_lastTrue_modebicubic",short,False,293.535760,0.000000 +PyTorch,interpolate,"interpolate_input_size(1,1,600,400)_output_size(240,240)_channels_lastFalse_modenearest",short,False,80.649728,0.000000 
+PyTorch,interpolate,"interpolate_input_size(1,1,600,400)_output_size(240,240)_channels_lastFalse_modelinear",short,False,112.735063,0.000000 +PyTorch,interpolate,"interpolate_input_size(1,1,600,400)_output_size(240,240)_channels_lastFalse_modebicubic",short,False,292.594442,0.000000 +PyTorch,interpolate,"interpolate_input_size(1,1,320,320)_output_size(256,256)_channels_lastTrue_modenearest",short,False,81.071167,0.000000 +PyTorch,interpolate,"interpolate_input_size(1,1,320,320)_output_size(256,256)_channels_lastTrue_modelinear",short,False,119.073692,0.000000 +PyTorch,interpolate,"interpolate_input_size(1,1,320,320)_output_size(256,256)_channels_lastTrue_modebicubic",short,False,325.062960,0.000000 +PyTorch,interpolate,"interpolate_input_size(1,1,320,320)_output_size(256,256)_channels_lastFalse_modenearest",short,False,80.776966,0.000000 +PyTorch,interpolate,"interpolate_input_size(1,1,320,320)_output_size(256,256)_channels_lastFalse_modelinear",short,False,118.075726,0.000000 +PyTorch,interpolate,"interpolate_input_size(1,1,320,320)_output_size(256,256)_channels_lastFalse_modebicubic",short,False,325.422923,0.000000 +PyTorch,interpolate,"interpolate_input_size(1,3,60,40)_output_size(24,24)_channels_lastTrue_modenearest_dtypetorch.uint8",short,False,10.408200,0.000000 +PyTorch,interpolate,"interpolate_input_size(1,3,60,40)_output_size(24,24)_channels_lastFalse_modenearest_dtypetorch.uint8",short,False,23.989929,0.000000 +PyTorch,interpolate,"interpolate_input_size(1,3,600,400)_output_size(240,240)_channels_lastTrue_modenearest_dtypetorch.uint8",short,False,142.707918,0.000000 +PyTorch,interpolate,"interpolate_input_size(1,3,600,400)_output_size(240,240)_channels_lastFalse_modenearest_dtypetorch.uint8",short,False,100.752786,0.000000 +PyTorch,interpolate,"interpolate_input_size(1,3,320,320)_output_size(256,256)_channels_lastTrue_modenearest_dtypetorch.uint8",short,False,153.185516,0.000000 
+PyTorch,interpolate,"interpolate_input_size(1,3,320,320)_output_size(256,256)_channels_lastFalse_modenearest_dtypetorch.uint8",short,False,104.761840,0.000000 +PyTorch,interpolate,"interpolate_input_size(1,1,60,40)_output_size(24,24)_channels_lastTrue_modenearest_dtypetorch.uint8",short,False,9.870818,0.000000 +PyTorch,interpolate,"interpolate_input_size(1,1,60,40)_output_size(24,24)_channels_lastFalse_modenearest_dtypetorch.uint8",short,False,9.931431,0.000000 +PyTorch,interpolate,"interpolate_input_size(1,1,600,400)_output_size(240,240)_channels_lastTrue_modenearest_dtypetorch.uint8",short,False,99.600515,0.000000 +PyTorch,interpolate,"interpolate_input_size(1,1,600,400)_output_size(240,240)_channels_lastFalse_modenearest_dtypetorch.uint8",short,False,99.164257,0.000000 +PyTorch,interpolate,"interpolate_input_size(1,1,320,320)_output_size(256,256)_channels_lastTrue_modenearest_dtypetorch.uint8",short,False,103.419602,0.000000 +PyTorch,interpolate,"interpolate_input_size(1,1,320,320)_output_size(256,256)_channels_lastFalse_modenearest_dtypetorch.uint8",short,False,103.148608,0.000000 +PyTorch,LayerNormBenchmark,"LayerNormBenchmark_dims(1,8,16)",short,False,9.418410,0.000000 +PyTorch,LayerNormBenchmark,"LayerNormBenchmark_dims(8,8,16)",short,False,57.969351,0.000000 +PyTorch,LayerNormBenchmark,"LayerNormBenchmark_dims(32,8,16)",short,False,59.316279,0.000000 +PyTorch,LayerNormBenchmark,"LayerNormBenchmark_dims(64,128,56,56)",short,False,2573.762285,0.000000 +PyTorch,linear,linear_N1_IN1_OUT1_cpu,short,False,17.240207,0.000000 +PyTorch,linear,linear_N4_IN256_OUT128_cpu,short,False,70.636017,0.000000 +PyTorch,linear,linear_N16_IN512_OUT256_cpu,short,False,155.853732,0.000000 +PyTorch,matmul,matmul_M1_N1_K1_trans_aTrue_trans_bFalse_cpu,short,False,5.217676,0.000000 +PyTorch,matmul,matmul_M128_N128_K128_trans_aTrue_trans_bFalse_cpu,short,False,130.986713,0.000000 +PyTorch,matmul,matmul_M256_N256_K256_trans_aFalse_trans_bTrue_cpu,short,False,4967.684160,0.000000 
+PyTorch,mm,mm_M1_N1_K1_cpu_dtypetorch.float32,short,False,4.969217,0.000000 +PyTorch,mm,mm_M64_N64_K64_cpu_dtypetorch.float32,short,False,56.936066,0.000000 +PyTorch,mm,mm_M64_N64_K128_cpu_dtypetorch.float32,short,False,59.284410,0.000000 +PyTorch,nan_to_num,nan_to_num_M16_N64_dtypetorch.float32_replace_infTrue,short,False,6.358168,0.000000 +PyTorch,nan_to_num,nan_to_num_M16_N64_dtypetorch.float32_replace_infFalse,short,False,6.798741,0.000000 +PyTorch,nan_to_num,nan_to_num_M16_N64_dtypetorch.float64_replace_infTrue,short,False,8.008753,0.000000 +PyTorch,nan_to_num,nan_to_num_M16_N64_dtypetorch.float64_replace_infFalse,short,False,8.567021,0.000000 +PyTorch,nan_to_num,nan_to_num_M16_N64_dtypetorch.float32_replace_infTrue,short,False,6.319673,0.000000 +PyTorch,nan_to_num,nan_to_num_M16_N64_dtypetorch.float32_replace_infFalse,short,False,6.744320,0.000000 +PyTorch,nan_to_num,nan_to_num_M16_N64_dtypetorch.float64_replace_infTrue,short,False,8.063743,0.000000 +PyTorch,nan_to_num,nan_to_num_M16_N64_dtypetorch.float64_replace_infFalse,short,False,8.583122,0.000000 +PyTorch,nan_to_num,nan_to_num_M64_N64_dtypetorch.float32_replace_infTrue,short,False,7.557407,0.000000 +PyTorch,nan_to_num,nan_to_num_M64_N64_dtypetorch.float32_replace_infFalse,short,False,8.056106,0.000000 +PyTorch,nan_to_num,nan_to_num_M64_N64_dtypetorch.float64_replace_infTrue,short,False,13.849453,0.000000 +PyTorch,nan_to_num,nan_to_num_M64_N64_dtypetorch.float64_replace_infFalse,short,False,14.596365,0.000000 +PyTorch,nan_to_num,nan_to_num_M64_N64_dtypetorch.float32_replace_infTrue,short,False,7.504524,0.000000 +PyTorch,nan_to_num,nan_to_num_M64_N64_dtypetorch.float32_replace_infFalse,short,False,8.090356,0.000000 +PyTorch,nan_to_num,nan_to_num_M64_N64_dtypetorch.float64_replace_infTrue,short,False,14.077416,0.000000 +PyTorch,nan_to_num,nan_to_num_M64_N64_dtypetorch.float64_replace_infFalse,short,False,14.615643,0.000000 
+PyTorch,nan_to_num_,nan_to_num__M16_N64_dtypetorch.float32_replace_infTrue,short,False,4.053200,0.000000 +PyTorch,nan_to_num_,nan_to_num__M16_N64_dtypetorch.float32_replace_infFalse,short,False,4.485825,0.000000 +PyTorch,nan_to_num_,nan_to_num__M16_N64_dtypetorch.float64_replace_infTrue,short,False,5.800954,0.000000 +PyTorch,nan_to_num_,nan_to_num__M16_N64_dtypetorch.float64_replace_infFalse,short,False,6.403105,0.000000 +PyTorch,nan_to_num_,nan_to_num__M16_N64_dtypetorch.float32_replace_infTrue,short,False,4.020517,0.000000 +PyTorch,nan_to_num_,nan_to_num__M16_N64_dtypetorch.float32_replace_infFalse,short,False,4.438027,0.000000 +PyTorch,nan_to_num_,nan_to_num__M16_N64_dtypetorch.float64_replace_infTrue,short,False,5.689130,0.000000 +PyTorch,nan_to_num_,nan_to_num__M16_N64_dtypetorch.float64_replace_infFalse,short,False,6.420881,0.000000 +PyTorch,nan_to_num_,nan_to_num__M64_N64_dtypetorch.float32_replace_infTrue,short,False,4.984703,0.000000 +PyTorch,nan_to_num_,nan_to_num__M64_N64_dtypetorch.float32_replace_infFalse,short,False,5.660661,0.000000 +PyTorch,nan_to_num_,nan_to_num__M64_N64_dtypetorch.float64_replace_infTrue,short,False,11.735412,0.000000 +PyTorch,nan_to_num_,nan_to_num__M64_N64_dtypetorch.float64_replace_infFalse,short,False,12.347645,0.000000 +PyTorch,nan_to_num_,nan_to_num__M64_N64_dtypetorch.float32_replace_infTrue,short,False,5.176911,0.000000 +PyTorch,nan_to_num_,nan_to_num__M64_N64_dtypetorch.float32_replace_infFalse,short,False,5.569892,0.000000 +PyTorch,nan_to_num_,nan_to_num__M64_N64_dtypetorch.float64_replace_infTrue,short,False,11.676570,0.000000 +PyTorch,nan_to_num_,nan_to_num__M64_N64_dtypetorch.float64_replace_infFalse,short,False,12.506719,0.000000 +PyTorch,MaxPool1d,MaxPool1d_kernel3_stride1_N8_C256_L256_cpu,short,False,121.343571,0.000000 +PyTorch,AvgPool1d,AvgPool1d_kernel3_stride1_N8_C256_L256_cpu,short,False,315.454573,0.000000 
+PyTorch,MaxPool2d,"MaxPool2d_kernel[3,1]_stride[2,1]_N1_C16_H32_W32_cpu",short,False,58.314310,0.000000 +PyTorch,AvgPool2d,"AvgPool2d_kernel[3,1]_stride[2,1]_N1_C16_H32_W32_cpu",short,False,55.510125,0.000000 +PyTorch,AdaptiveMaxPool2d,"AdaptiveMaxPool2d_kernel[3,1]_stride[2,1]_N1_C16_H32_W32_cpu",short,False,63.309880,0.000000 +PyTorch,FractionalMaxPool2d,"FractionalMaxPool2d_kernel[3,1]_stride[2,1]_N1_C16_H32_W32_cpu",short,False,66.127681,0.000000 +PyTorch,MaxPool3d,"MaxPool3d_kernel[3,1,3]_stride[2,1,2]_N1_C16_D16_H32_W32_cpu",short,False,236.593780,0.000000 +PyTorch,AvgPool3d,"AvgPool3d_kernel[3,1,3]_stride[2,1,2]_N1_C16_D16_H32_W32_cpu",short,False,100.692771,0.000000 +PyTorch,AdaptiveMaxPool3d,"AdaptiveMaxPool3d_kernel[3,1,3]_stride[2,1,2]_N1_C16_D16_H32_W32_cpu",short,False,192.562352,0.000000 +PyTorch,FractionalMaxPool3d,"FractionalMaxPool3d_kernel[3,1,3]_stride[2,1,2]_N1_C16_D16_H32_W32_cpu",short,False,66.164532,0.000000 +PyTorch,fmod,fmod_M1_N1_K1_cpu_dtypetorch.int32,short,False,3.635065,0.000000 +PyTorch,fmod,fmod_M1_N1_K1_cpu_dtypetorch.float32,short,False,3.901028,0.000000 +PyTorch,fmod,fmod_M1_N1_K1_cpu_dtypetorch.float64,short,False,4.041925,0.000000 +PyTorch,fmod,fmod_M64_N64_K64_cpu_dtypetorch.int32,short,False,129.514345,0.000000 +PyTorch,fmod,fmod_M64_N64_K64_cpu_dtypetorch.float32,short,False,151.149918,0.000000 +PyTorch,fmod,fmod_M64_N64_K64_cpu_dtypetorch.float64,short,False,746.067340,0.000000 +PyTorch,fmod,fmod_M64_N64_K128_cpu_dtypetorch.int32,short,False,210.913781,0.000000 +PyTorch,fmod,fmod_M64_N64_K128_cpu_dtypetorch.float32,short,False,252.686828,0.000000 +PyTorch,fmod,fmod_M64_N64_K128_cpu_dtypetorch.float64,short,False,1484.044931,0.000000 +PyTorch,remainder,remainder_M1_N1_K1_cpu_dtypetorch.int32,short,False,3.976802,0.000000 +PyTorch,remainder,remainder_M1_N1_K1_cpu_dtypetorch.float32,short,False,4.075495,0.000000 +PyTorch,remainder,remainder_M1_N1_K1_cpu_dtypetorch.float64,short,False,3.834691,0.000000 
+PyTorch,remainder,remainder_M64_N64_K64_cpu_dtypetorch.int32,short,False,146.646648,0.000000 +PyTorch,remainder,remainder_M64_N64_K64_cpu_dtypetorch.float32,short,False,170.557022,0.000000 +PyTorch,remainder,remainder_M64_N64_K64_cpu_dtypetorch.float64,short,False,867.868537,0.000000 +PyTorch,remainder,remainder_M64_N64_K128_cpu_dtypetorch.int32,short,False,243.740380,0.000000 +PyTorch,remainder,remainder_M64_N64_K128_cpu_dtypetorch.float32,short,False,292.164866,0.000000 +PyTorch,remainder,remainder_M64_N64_K128_cpu_dtypetorch.float64,short,False,1730.402555,0.000000 +PyTorch,Softmax,Softmax_N1_C3_H256_W256_cpu,short,False,122.847048,0.000000 +PyTorch,Softmax,Softmax_N4_C3_H256_W256_cpu,short,False,317.788112,0.000000 +PyTorch,Softmax2d,Softmax2d_N1_C3_H256_W256_cpu,short,False,120.565735,0.000000 +PyTorch,Softmax2d,Softmax2d_N4_C3_H256_W256_cpu,short,False,316.982444,0.000000 +PyTorch,LogSoftmax,LogSoftmax_N1_C3_H256_W256_cpu,short,False,162.530153,0.000000 +PyTorch,LogSoftmax,LogSoftmax_N4_C3_H256_W256_cpu,short,False,266.478752,0.000000 +PyTorch,split,split_M8_N8_parts2_cpu,short,False,6.753952,0.000000 +PyTorch,split,split_M256_N512_parts2_cpu,short,False,6.873656,0.000000 +PyTorch,split,split_M512_N512_parts2_cpu,short,False,6.848019,0.000000 +PyTorch,stack,"stack_sizes(1,1,1)_N2_cpu_dim0",short,False,5.736891,0.000000 +PyTorch,stack,"stack_sizes(1,1,1)_N2_cpu_dim1",short,False,6.185757,0.000000 +PyTorch,stack,"stack_sizes(1,1,1)_N2_cpu_dim2",short,False,6.094516,0.000000 +PyTorch,stack,"stack_sizes(1,1,1)_N2_cpu_dim3",short,False,6.894034,0.000000 +PyTorch,stack,"stack_sizes(512,512,2)_N2_cpu_dim0",short,False,98.350665,0.000000 +PyTorch,stack,"stack_sizes(512,512,2)_N2_cpu_dim1",short,False,100.461322,0.000000 +PyTorch,stack,"stack_sizes(512,512,2)_N2_cpu_dim2",short,False,218.911485,0.000000 +PyTorch,stack,"stack_sizes(512,512,2)_N2_cpu_dim3",short,False,166.567879,0.000000 
+PyTorch,stack,"stack_sizes(128,1024,2)_N2_cpu_dim0",short,False,99.504077,0.000000 +PyTorch,stack,"stack_sizes(128,1024,2)_N2_cpu_dim1",short,False,98.383429,0.000000 +PyTorch,stack,"stack_sizes(128,1024,2)_N2_cpu_dim2",short,False,153.173778,0.000000 +PyTorch,stack,"stack_sizes(128,1024,2)_N2_cpu_dim3",short,False,123.909933,0.000000 +PyTorch,sum,sum_R64_V32_dim0_contiguousTrue_cpu,short,False,6.692267,0.000000 +PyTorch,sum,sum_R64_V32_dim0_contiguousFalse_cpu,short,False,8.023065,0.000000 +PyTorch,sum,sum_R64_V32_dim1_contiguousTrue_cpu,short,False,6.881371,0.000000 +PyTorch,sum,sum_R64_V32_dim1_contiguousFalse_cpu,short,False,7.601940,0.000000 +PyTorch,sum,sum_R64_V512_dim0_contiguousTrue_cpu,short,False,44.774431,0.000000 +PyTorch,sum,sum_R64_V512_dim0_contiguousFalse_cpu,short,False,49.214148,0.000000 +PyTorch,sum,sum_R64_V512_dim1_contiguousTrue_cpu,short,False,45.532505,0.000000 +PyTorch,sum,sum_R64_V512_dim1_contiguousFalse_cpu,short,False,51.539750,0.000000 +PyTorch,sum,sum_R256_V32_dim0_contiguousTrue_cpu,short,False,7.732977,0.000000 +PyTorch,sum,sum_R256_V32_dim0_contiguousFalse_cpu,short,False,9.670269,0.000000 +PyTorch,sum,sum_R256_V32_dim1_contiguousTrue_cpu,short,False,7.691115,0.000000 +PyTorch,sum,sum_R256_V32_dim1_contiguousFalse_cpu,short,False,9.625176,0.000000 +PyTorch,sum,sum_R256_V512_dim0_contiguousTrue_cpu,short,False,50.954394,0.000000 +PyTorch,sum,sum_R256_V512_dim0_contiguousFalse_cpu,short,False,57.957757,0.000000 +PyTorch,sum,sum_R256_V512_dim1_contiguousTrue_cpu,short,False,53.592068,0.000000 +PyTorch,sum,sum_R256_V512_dim1_contiguousFalse_cpu,short,False,51.339726,0.000000 +PyTorch,FloatToHalfTensorConversionBenchmark,FloatToHalfTensorConversionBenchmark_M8_N16_cpu,short,False,7.040985,0.000000 +PyTorch,FloatToHalfTensorConversionBenchmark,FloatToHalfTensorConversionBenchmark_M8_N64_cpu,short,False,7.168604,0.000000 
+PyTorch,FloatToHalfTensorConversionBenchmark,FloatToHalfTensorConversionBenchmark_M8_N128_cpu,short,False,7.434442,0.000000 +PyTorch,FloatToHalfTensorConversionBenchmark,FloatToHalfTensorConversionBenchmark_M16_N16_cpu,short,False,7.078318,0.000000 +PyTorch,FloatToHalfTensorConversionBenchmark,FloatToHalfTensorConversionBenchmark_M16_N64_cpu,short,False,7.426670,0.000000 +PyTorch,FloatToHalfTensorConversionBenchmark,FloatToHalfTensorConversionBenchmark_M16_N128_cpu,short,False,7.679027,0.000000 +PyTorch,FloatToHalfTensorConversionBenchmark,FloatToHalfTensorConversionBenchmark_M32_N16_cpu,short,False,7.281365,0.000000 +PyTorch,FloatToHalfTensorConversionBenchmark,FloatToHalfTensorConversionBenchmark_M32_N64_cpu,short,False,7.682783,0.000000 +PyTorch,FloatToHalfTensorConversionBenchmark,FloatToHalfTensorConversionBenchmark_M32_N128_cpu,short,False,8.381938,0.000000 +PyTorch,HalfToFloatTensorConversionBenchmark,HalfToFloatTensorConversionBenchmark_M8_N16_cpu,short,False,7.039854,0.000000 +PyTorch,HalfToFloatTensorConversionBenchmark,HalfToFloatTensorConversionBenchmark_M8_N64_cpu,short,False,7.399855,0.000000 +PyTorch,HalfToFloatTensorConversionBenchmark,HalfToFloatTensorConversionBenchmark_M8_N128_cpu,short,False,7.715193,0.000000 +PyTorch,HalfToFloatTensorConversionBenchmark,HalfToFloatTensorConversionBenchmark_M16_N16_cpu,short,False,7.255140,0.000000 +PyTorch,HalfToFloatTensorConversionBenchmark,HalfToFloatTensorConversionBenchmark_M16_N64_cpu,short,False,7.753522,0.000000 +PyTorch,HalfToFloatTensorConversionBenchmark,HalfToFloatTensorConversionBenchmark_M16_N128_cpu,short,False,8.364281,0.000000 +PyTorch,HalfToFloatTensorConversionBenchmark,HalfToFloatTensorConversionBenchmark_M32_N16_cpu,short,False,7.476377,0.000000 +PyTorch,HalfToFloatTensorConversionBenchmark,HalfToFloatTensorConversionBenchmark_M32_N64_cpu,short,False,8.458564,0.000000 
+PyTorch,HalfToFloatTensorConversionBenchmark,HalfToFloatTensorConversionBenchmark_M32_N128_cpu,short,False,9.391939,0.000000 +PyTorch,addcmul,addcmul_M1_N2_cpu_dtypetorch.float32,short,False,4.461410,0.000000 +PyTorch,addcmul,addcmul_M1_N2_cpu_dtypetorch.bfloat16,short,False,4.560082,0.000000 +PyTorch,addcmul,addcmul_M32_N64_cpu_dtypetorch.float32,short,False,5.141248,0.000000 +PyTorch,addcmul,addcmul_M32_N64_cpu_dtypetorch.bfloat16,short,False,5.819053,0.000000 +PyTorch,addcdiv,addcdiv_M1_N2_cpu_dtypetorch.float32,short,False,4.922033,0.000000 +PyTorch,addcdiv,addcdiv_M1_N2_cpu_dtypetorch.bfloat16,short,False,4.861055,0.000000 +PyTorch,addcdiv,addcdiv_M32_N64_cpu_dtypetorch.float32,short,False,5.560473,0.000000 +PyTorch,addcdiv,addcdiv_M32_N64_cpu_dtypetorch.bfloat16,short,False,6.113489,0.000000 +PyTorch,topk,"topk_shape(16,4)_k4_dim1_cpu_dtypetorch.float32",short,False,6.656324,0.000000 +PyTorch,topk,"topk_shape(1048576,)_k16_dim0_cpu_dtypetorch.float32",short,False,2137.073922,0.000000 +PyTorch,where,"where_cond_shape(8,16,1)_input_shape(1,)_other_shape(1,)_cpu_dtypetorch.float32",short,False,6.551560,0.000000 +PyTorch,where,"where_cond_shape(8,16,1)_input_shape(16,1)_other_shape(8,16,1)_cpu_dtypetorch.float32",short,False,6.548704,0.000000 +PyTorch,where,"where_cond_shape(8,16,1)_input_shape(8,1,1)_other_shape(1,)_cpu_dtypetorch.float32",short,False,6.417945,0.000000 +PyTorch,relu,"relu_dims(3,4,5)_contigFalse_inplaceFalse_dtypetorch.quint8",short,False,9.394759,0.000000 +PyTorch,relu,"relu_dims(3,4,5)_contigFalse_inplaceFalse_dtypetorch.qint8",short,False,9.308802,0.000000 +PyTorch,relu,"relu_dims(3,4,5)_contigFalse_inplaceFalse_dtypetorch.qint32",short,False,9.267544,0.000000 +PyTorch,relu,"relu_dims(2,3,4,5)_contigFalse_inplaceFalse_dtypetorch.quint8",short,False,9.685650,0.000000 +PyTorch,relu,"relu_dims(2,3,4,5)_contigFalse_inplaceFalse_dtypetorch.qint8",short,False,9.606769,0.000000 
+PyTorch,relu,"relu_dims(2,3,4,5)_contigFalse_inplaceFalse_dtypetorch.qint32",short,False,9.553571,0.000000 +PyTorch,relu,"relu_dims(512,512)_contigFalse_inplaceFalse_dtypetorch.quint8",short,False,80.796781,0.000000 +PyTorch,relu,"relu_dims(512,512)_contigFalse_inplaceFalse_dtypetorch.qint8",short,False,91.592676,0.000000 +PyTorch,relu,"relu_dims(512,512)_contigFalse_inplaceFalse_dtypetorch.qint32",short,False,83.363830,0.000000 +PyTorch,relu,"relu_dims(256,1024)_contigFalse_inplaceFalse_dtypetorch.quint8",short,False,82.888682,0.000000 +PyTorch,relu,"relu_dims(256,1024)_contigFalse_inplaceFalse_dtypetorch.qint8",short,False,97.166943,0.000000 +PyTorch,relu,"relu_dims(256,1024)_contigFalse_inplaceFalse_dtypetorch.qint32",short,False,104.243662,0.000000 +PyTorch,relu6,"relu6_dims(3,4,5)_contigFalse_inplaceFalse_dtypetorch.quint8",short,False,8.418549,0.000000 +PyTorch,relu6,"relu6_dims(3,4,5)_contigFalse_inplaceFalse_dtypetorch.qint8",short,False,8.500449,0.000000 +PyTorch,relu6,"relu6_dims(3,4,5)_contigFalse_inplaceFalse_dtypetorch.qint32",short,False,8.443481,0.000000 +PyTorch,relu6,"relu6_dims(2,3,4,5)_contigFalse_inplaceFalse_dtypetorch.quint8",short,False,8.960919,0.000000 +PyTorch,relu6,"relu6_dims(2,3,4,5)_contigFalse_inplaceFalse_dtypetorch.qint8",short,False,8.986856,0.000000 +PyTorch,relu6,"relu6_dims(2,3,4,5)_contigFalse_inplaceFalse_dtypetorch.qint32",short,False,8.814634,0.000000 +PyTorch,relu6,"relu6_dims(512,512)_contigFalse_inplaceFalse_dtypetorch.quint8",short,False,80.921564,0.000000 +PyTorch,relu6,"relu6_dims(512,512)_contigFalse_inplaceFalse_dtypetorch.qint8",short,False,81.595518,0.000000 +PyTorch,relu6,"relu6_dims(512,512)_contigFalse_inplaceFalse_dtypetorch.qint32",short,False,85.112929,0.000000 +PyTorch,relu6,"relu6_dims(256,1024)_contigFalse_inplaceFalse_dtypetorch.quint8",short,False,84.740682,0.000000 +PyTorch,relu6,"relu6_dims(256,1024)_contigFalse_inplaceFalse_dtypetorch.qint8",short,False,85.530059,0.000000 
+PyTorch,relu6,"relu6_dims(256,1024)_contigFalse_inplaceFalse_dtypetorch.qint32",short,False,106.365863,0.000000 +PyTorch,functional.hardtanh,"functional.hardtanh_dims(3,4,5)_contigFalse_inplaceFalse_dtypetorch.quint8",short,False,8.055478,0.000000 +PyTorch,functional.hardtanh,"functional.hardtanh_dims(3,4,5)_contigFalse_inplaceFalse_dtypetorch.qint8",short,False,8.238628,0.000000 +PyTorch,functional.hardtanh,"functional.hardtanh_dims(3,4,5)_contigFalse_inplaceFalse_dtypetorch.qint32",short,False,8.119306,0.000000 +PyTorch,functional.hardtanh,"functional.hardtanh_dims(2,3,4,5)_contigFalse_inplaceFalse_dtypetorch.quint8",short,False,8.683609,0.000000 +PyTorch,functional.hardtanh,"functional.hardtanh_dims(2,3,4,5)_contigFalse_inplaceFalse_dtypetorch.qint8",short,False,8.759866,0.000000 +PyTorch,functional.hardtanh,"functional.hardtanh_dims(2,3,4,5)_contigFalse_inplaceFalse_dtypetorch.qint32",short,False,8.594149,0.000000 +PyTorch,functional.hardtanh,"functional.hardtanh_dims(512,512)_contigFalse_inplaceFalse_dtypetorch.quint8",short,False,77.579946,0.000000 +PyTorch,functional.hardtanh,"functional.hardtanh_dims(512,512)_contigFalse_inplaceFalse_dtypetorch.qint8",short,False,83.634438,0.000000 +PyTorch,functional.hardtanh,"functional.hardtanh_dims(512,512)_contigFalse_inplaceFalse_dtypetorch.qint32",short,False,84.316144,0.000000 +PyTorch,functional.hardtanh,"functional.hardtanh_dims(256,1024)_contigFalse_inplaceFalse_dtypetorch.quint8",short,False,84.438504,0.000000 +PyTorch,functional.hardtanh,"functional.hardtanh_dims(256,1024)_contigFalse_inplaceFalse_dtypetorch.qint8",short,False,84.312683,0.000000 +PyTorch,functional.hardtanh,"functional.hardtanh_dims(256,1024)_contigFalse_inplaceFalse_dtypetorch.qint32",short,False,105.458681,0.000000 +PyTorch,functional.hardsigmoid,"functional.hardsigmoid_dims(3,4,5)_contigFalse_inplaceFalse_dtypetorch.quint8",short,False,6.480224,0.000000 
+PyTorch,functional.hardsigmoid,"functional.hardsigmoid_dims(3,4,5)_contigFalse_inplaceFalse_dtypetorch.qint8",short,False,6.658893,0.000000 +PyTorch,functional.hardsigmoid,"functional.hardsigmoid_dims(3,4,5)_contigFalse_inplaceFalse_dtypetorch.qint32",short,False,6.502791,0.000000 +PyTorch,functional.hardsigmoid,"functional.hardsigmoid_dims(2,3,4,5)_contigFalse_inplaceFalse_dtypetorch.quint8",short,False,7.091508,0.000000 +PyTorch,functional.hardsigmoid,"functional.hardsigmoid_dims(2,3,4,5)_contigFalse_inplaceFalse_dtypetorch.qint8",short,False,7.071250,0.000000 +PyTorch,functional.hardsigmoid,"functional.hardsigmoid_dims(2,3,4,5)_contigFalse_inplaceFalse_dtypetorch.qint32",short,False,7.143394,0.000000 +PyTorch,functional.hardsigmoid,"functional.hardsigmoid_dims(512,512)_contigFalse_inplaceFalse_dtypetorch.quint8",short,False,344.615549,0.000000 +PyTorch,functional.hardsigmoid,"functional.hardsigmoid_dims(512,512)_contigFalse_inplaceFalse_dtypetorch.qint8",short,False,360.922264,0.000000 +PyTorch,functional.hardsigmoid,"functional.hardsigmoid_dims(512,512)_contigFalse_inplaceFalse_dtypetorch.qint32",short,False,360.622480,0.000000 +PyTorch,functional.hardsigmoid,"functional.hardsigmoid_dims(256,1024)_contigFalse_inplaceFalse_dtypetorch.quint8",short,False,344.514761,0.000000 +PyTorch,functional.hardsigmoid,"functional.hardsigmoid_dims(256,1024)_contigFalse_inplaceFalse_dtypetorch.qint8",short,False,361.637229,0.000000 +PyTorch,functional.hardsigmoid,"functional.hardsigmoid_dims(256,1024)_contigFalse_inplaceFalse_dtypetorch.qint32",short,False,360.860964,0.000000 +PyTorch,functional.leaky_relu,"functional.leaky_relu_dims(3,4,5)_contigFalse_inplaceFalse_dtypetorch.quint8",short,False,12.176948,0.000000 +PyTorch,functional.leaky_relu,"functional.leaky_relu_dims(3,4,5)_contigFalse_inplaceFalse_dtypetorch.qint8",short,False,11.734075,0.000000 
+PyTorch,functional.leaky_relu,"functional.leaky_relu_dims(3,4,5)_contigFalse_inplaceFalse_dtypetorch.qint32",short,False,11.181202,0.000000 +PyTorch,functional.leaky_relu,"functional.leaky_relu_dims(2,3,4,5)_contigFalse_inplaceFalse_dtypetorch.quint8",short,False,13.658838,0.000000 +PyTorch,functional.leaky_relu,"functional.leaky_relu_dims(2,3,4,5)_contigFalse_inplaceFalse_dtypetorch.qint8",short,False,13.976081,0.000000 +PyTorch,functional.leaky_relu,"functional.leaky_relu_dims(2,3,4,5)_contigFalse_inplaceFalse_dtypetorch.qint32",short,False,12.947895,0.000000 +PyTorch,functional.leaky_relu,"functional.leaky_relu_dims(512,512)_contigFalse_inplaceFalse_dtypetorch.quint8",short,False,437.285316,0.000000 +PyTorch,functional.leaky_relu,"functional.leaky_relu_dims(512,512)_contigFalse_inplaceFalse_dtypetorch.qint8",short,False,445.478465,0.000000 +PyTorch,functional.leaky_relu,"functional.leaky_relu_dims(512,512)_contigFalse_inplaceFalse_dtypetorch.qint32",short,False,523.076388,0.000000 +PyTorch,functional.leaky_relu,"functional.leaky_relu_dims(256,1024)_contigFalse_inplaceFalse_dtypetorch.quint8",short,False,442.810632,0.000000 +PyTorch,functional.leaky_relu,"functional.leaky_relu_dims(256,1024)_contigFalse_inplaceFalse_dtypetorch.qint8",short,False,449.038734,0.000000 +PyTorch,functional.leaky_relu,"functional.leaky_relu_dims(256,1024)_contigFalse_inplaceFalse_dtypetorch.qint32",short,False,541.625834,0.000000 +PyTorch,functional.sigmoid,"functional.sigmoid_dims(3,4,5)_contigFalse_inplaceFalse_dtypetorch.quint8",short,False,6.427155,0.000000 +PyTorch,functional.sigmoid,"functional.sigmoid_dims(3,4,5)_contigFalse_inplaceFalse_dtypetorch.qint8",short,False,6.355635,0.000000 +PyTorch,functional.sigmoid,"functional.sigmoid_dims(3,4,5)_contigFalse_inplaceFalse_dtypetorch.qint32",short,False,6.445739,0.000000 +PyTorch,functional.sigmoid,"functional.sigmoid_dims(2,3,4,5)_contigFalse_inplaceFalse_dtypetorch.quint8",short,False,7.175534,0.000000 
+PyTorch,functional.sigmoid,"functional.sigmoid_dims(2,3,4,5)_contigFalse_inplaceFalse_dtypetorch.qint8",short,False,7.055749,0.000000 +PyTorch,functional.sigmoid,"functional.sigmoid_dims(2,3,4,5)_contigFalse_inplaceFalse_dtypetorch.qint32",short,False,7.111532,0.000000 +PyTorch,functional.sigmoid,"functional.sigmoid_dims(512,512)_contigFalse_inplaceFalse_dtypetorch.quint8",short,False,321.942471,0.000000 +PyTorch,functional.sigmoid,"functional.sigmoid_dims(512,512)_contigFalse_inplaceFalse_dtypetorch.qint8",short,False,412.526749,0.000000 +PyTorch,functional.sigmoid,"functional.sigmoid_dims(512,512)_contigFalse_inplaceFalse_dtypetorch.qint32",short,False,413.297580,0.000000 +PyTorch,functional.sigmoid,"functional.sigmoid_dims(256,1024)_contigFalse_inplaceFalse_dtypetorch.quint8",short,False,322.569442,0.000000 +PyTorch,functional.sigmoid,"functional.sigmoid_dims(256,1024)_contigFalse_inplaceFalse_dtypetorch.qint8",short,False,413.410907,0.000000 +PyTorch,functional.sigmoid,"functional.sigmoid_dims(256,1024)_contigFalse_inplaceFalse_dtypetorch.qint32",short,False,414.466411,0.000000 +PyTorch,functional.tanh,"functional.tanh_dims(3,4,5)_contigFalse_inplaceFalse_dtypetorch.quint8",short,False,6.392274,0.000000 +PyTorch,functional.tanh,"functional.tanh_dims(3,4,5)_contigFalse_inplaceFalse_dtypetorch.qint8",short,False,6.349999,0.000000 +PyTorch,functional.tanh,"functional.tanh_dims(3,4,5)_contigFalse_inplaceFalse_dtypetorch.qint32",short,False,6.554333,0.000000 +PyTorch,functional.tanh,"functional.tanh_dims(2,3,4,5)_contigFalse_inplaceFalse_dtypetorch.quint8",short,False,7.061919,0.000000 +PyTorch,functional.tanh,"functional.tanh_dims(2,3,4,5)_contigFalse_inplaceFalse_dtypetorch.qint8",short,False,7.149233,0.000000 +PyTorch,functional.tanh,"functional.tanh_dims(2,3,4,5)_contigFalse_inplaceFalse_dtypetorch.qint32",short,False,7.086558,0.000000 
+PyTorch,functional.tanh,"functional.tanh_dims(512,512)_contigFalse_inplaceFalse_dtypetorch.quint8",short,False,406.644221,0.000000 +PyTorch,functional.tanh,"functional.tanh_dims(512,512)_contigFalse_inplaceFalse_dtypetorch.qint8",short,False,373.447059,0.000000 +PyTorch,functional.tanh,"functional.tanh_dims(512,512)_contigFalse_inplaceFalse_dtypetorch.qint32",short,False,371.772997,0.000000 +PyTorch,functional.tanh,"functional.tanh_dims(256,1024)_contigFalse_inplaceFalse_dtypetorch.quint8",short,False,409.167217,0.000000 +PyTorch,functional.tanh,"functional.tanh_dims(256,1024)_contigFalse_inplaceFalse_dtypetorch.qint8",short,False,373.676758,0.000000 +PyTorch,functional.tanh,"functional.tanh_dims(256,1024)_contigFalse_inplaceFalse_dtypetorch.qint32",short,False,374.537943,0.000000 +PyTorch,functional.hardswish,"functional.hardswish_dims(3,4,5)_contigFalse_inplaceFalse_dtypetorch.quint8",short,False,9.930822,0.000000 +PyTorch,functional.hardswish,"functional.hardswish_dims(3,4,5)_contigFalse_inplaceFalse_dtypetorch.qint8",short,False,10.116378,0.000000 +PyTorch,functional.hardswish,"functional.hardswish_dims(3,4,5)_contigFalse_inplaceFalse_dtypetorch.qint32",short,False,10.149234,0.000000 +PyTorch,functional.hardswish,"functional.hardswish_dims(2,3,4,5)_contigFalse_inplaceFalse_dtypetorch.quint8",short,False,11.481823,0.000000 +PyTorch,functional.hardswish,"functional.hardswish_dims(2,3,4,5)_contigFalse_inplaceFalse_dtypetorch.qint8",short,False,11.614461,0.000000 +PyTorch,functional.hardswish,"functional.hardswish_dims(2,3,4,5)_contigFalse_inplaceFalse_dtypetorch.qint32",short,False,11.762893,0.000000 +PyTorch,functional.hardswish,"functional.hardswish_dims(512,512)_contigFalse_inplaceFalse_dtypetorch.quint8",short,False,335.415021,0.000000 +PyTorch,functional.hardswish,"functional.hardswish_dims(512,512)_contigFalse_inplaceFalse_dtypetorch.qint8",short,False,350.660354,0.000000 
+PyTorch,functional.hardswish,"functional.hardswish_dims(512,512)_contigFalse_inplaceFalse_dtypetorch.qint32",short,False,351.735603,0.000000 +PyTorch,functional.hardswish,"functional.hardswish_dims(256,1024)_contigFalse_inplaceFalse_dtypetorch.quint8",short,False,336.152532,0.000000 +PyTorch,functional.hardswish,"functional.hardswish_dims(256,1024)_contigFalse_inplaceFalse_dtypetorch.qint8",short,False,350.996697,0.000000 +PyTorch,functional.hardswish,"functional.hardswish_dims(256,1024)_contigFalse_inplaceFalse_dtypetorch.qint32",short,False,353.547824,0.000000 +PyTorch,functional.elu,"functional.elu_dims(3,4,5)_contigFalse_inplaceFalse_dtypetorch.quint8",short,False,10.267545,0.000000 +PyTorch,functional.elu,"functional.elu_dims(3,4,5)_contigFalse_inplaceFalse_dtypetorch.qint8",short,False,10.379921,0.000000 +PyTorch,functional.elu,"functional.elu_dims(3,4,5)_contigFalse_inplaceFalse_dtypetorch.qint32",short,False,10.477865,0.000000 +PyTorch,functional.elu,"functional.elu_dims(2,3,4,5)_contigFalse_inplaceFalse_dtypetorch.quint8",short,False,11.684307,0.000000 +PyTorch,functional.elu,"functional.elu_dims(2,3,4,5)_contigFalse_inplaceFalse_dtypetorch.qint8",short,False,12.064549,0.000000 +PyTorch,functional.elu,"functional.elu_dims(2,3,4,5)_contigFalse_inplaceFalse_dtypetorch.qint32",short,False,12.134612,0.000000 +PyTorch,functional.elu,"functional.elu_dims(512,512)_contigFalse_inplaceFalse_dtypetorch.quint8",short,False,154.252406,0.000000 +PyTorch,functional.elu,"functional.elu_dims(512,512)_contigFalse_inplaceFalse_dtypetorch.qint8",short,False,450.243138,0.000000 +PyTorch,functional.elu,"functional.elu_dims(512,512)_contigFalse_inplaceFalse_dtypetorch.qint32",short,False,449.014350,0.000000 +PyTorch,functional.elu,"functional.elu_dims(256,1024)_contigFalse_inplaceFalse_dtypetorch.quint8",short,False,153.808653,0.000000 +PyTorch,functional.elu,"functional.elu_dims(256,1024)_contigFalse_inplaceFalse_dtypetorch.qint8",short,False,445.457985,0.000000 
+PyTorch,functional.elu,"functional.elu_dims(256,1024)_contigFalse_inplaceFalse_dtypetorch.qint32",short,False,453.355262,0.000000 +PyTorch,functional.celu,"functional.celu_dims(3,4,5)_contigFalse_inplaceFalse_dtypetorch.quint8",short,False,9.940230,0.000000 +PyTorch,functional.celu,"functional.celu_dims(3,4,5)_contigFalse_inplaceFalse_dtypetorch.qint8",short,False,10.151808,0.000000 +PyTorch,functional.celu,"functional.celu_dims(3,4,5)_contigFalse_inplaceFalse_dtypetorch.qint32",short,False,10.292930,0.000000 +PyTorch,functional.celu,"functional.celu_dims(2,3,4,5)_contigFalse_inplaceFalse_dtypetorch.quint8",short,False,11.492981,0.000000 +PyTorch,functional.celu,"functional.celu_dims(2,3,4,5)_contigFalse_inplaceFalse_dtypetorch.qint8",short,False,11.703474,0.000000 +PyTorch,functional.celu,"functional.celu_dims(2,3,4,5)_contigFalse_inplaceFalse_dtypetorch.qint32",short,False,11.779910,0.000000 +PyTorch,functional.celu,"functional.celu_dims(512,512)_contigFalse_inplaceFalse_dtypetorch.quint8",short,False,156.045063,0.000000 +PyTorch,functional.celu,"functional.celu_dims(512,512)_contigFalse_inplaceFalse_dtypetorch.qint8",short,False,446.178772,0.000000 +PyTorch,functional.celu,"functional.celu_dims(512,512)_contigFalse_inplaceFalse_dtypetorch.qint32",short,False,449.322654,0.000000 +PyTorch,functional.celu,"functional.celu_dims(256,1024)_contigFalse_inplaceFalse_dtypetorch.quint8",short,False,155.598436,0.000000 +PyTorch,functional.celu,"functional.celu_dims(256,1024)_contigFalse_inplaceFalse_dtypetorch.qint8",short,False,451.376561,0.000000 +PyTorch,functional.celu,"functional.celu_dims(256,1024)_contigFalse_inplaceFalse_dtypetorch.qint32",short,False,456.399200,0.000000 +PyTorch,add,add_N2_dtypetorch.quint8_contigFalse,short,False,54.525704,0.000000 +PyTorch,add,add_N2_dtypetorch.quint8_contigTrue,short,False,48.507417,0.000000 +PyTorch,add,add_N2_dtypetorch.qint8_contigFalse,short,False,54.165648,0.000000 
+PyTorch,add,add_N2_dtypetorch.qint8_contigTrue,short,False,49.270978,0.000000 +PyTorch,add,add_N2_dtypetorch.qint32_contigFalse,short,False,10.166548,0.000000 +PyTorch,add,add_N2_dtypetorch.qint32_contigTrue,short,False,9.839232,0.000000 +PyTorch,add,add_N8_dtypetorch.quint8_contigFalse,short,False,55.172433,0.000000 +PyTorch,add,add_N8_dtypetorch.quint8_contigTrue,short,False,46.703761,0.000000 +PyTorch,add,add_N8_dtypetorch.qint8_contigFalse,short,False,55.712299,0.000000 +PyTorch,add,add_N8_dtypetorch.qint8_contigTrue,short,False,47.370029,0.000000 +PyTorch,add,add_N8_dtypetorch.qint32_contigFalse,short,False,11.358310,0.000000 +PyTorch,add,add_N8_dtypetorch.qint32_contigTrue,short,False,11.571205,0.000000 +PyTorch,add,add_N64_dtypetorch.quint8_contigFalse,short,False,59.735500,0.000000 +PyTorch,add,add_N64_dtypetorch.quint8_contigTrue,short,False,47.242686,0.000000 +PyTorch,add,add_N64_dtypetorch.qint8_contigFalse,short,False,60.975918,0.000000 +PyTorch,add,add_N64_dtypetorch.qint8_contigTrue,short,False,47.022490,0.000000 +PyTorch,add,add_N64_dtypetorch.qint32_contigFalse,short,False,29.096942,0.000000 +PyTorch,add,add_N64_dtypetorch.qint32_contigTrue,short,False,89.559198,0.000000 +PyTorch,add,add_N512_dtypetorch.quint8_contigFalse,short,False,213.117569,0.000000 +PyTorch,add,add_N512_dtypetorch.quint8_contigTrue,short,False,58.900791,0.000000 +PyTorch,add,add_N512_dtypetorch.qint8_contigFalse,short,False,212.745501,0.000000 +PyTorch,add,add_N512_dtypetorch.qint8_contigTrue,short,False,58.136227,0.000000 +PyTorch,add,add_N512_dtypetorch.qint32_contigFalse,short,False,186.300471,0.000000 +PyTorch,add,add_N512_dtypetorch.qint32_contigTrue,short,False,690.767958,0.000000 +PyTorch,add_relu,add_relu_N2_dtypetorch.quint8_contigFalse,short,False,10.009465,0.000000 +PyTorch,add_relu,add_relu_N2_dtypetorch.quint8_contigTrue,short,False,9.746104,0.000000 +PyTorch,add_relu,add_relu_N2_dtypetorch.qint8_contigFalse,short,False,10.162506,0.000000 
+PyTorch,add_relu,add_relu_N2_dtypetorch.qint8_contigTrue,short,False,9.701948,0.000000 +PyTorch,add_relu,add_relu_N2_dtypetorch.qint32_contigFalse,short,False,10.097318,0.000000 +PyTorch,add_relu,add_relu_N2_dtypetorch.qint32_contigTrue,short,False,9.738773,0.000000 +PyTorch,add_relu,add_relu_N8_dtypetorch.quint8_contigFalse,short,False,11.193524,0.000000 +PyTorch,add_relu,add_relu_N8_dtypetorch.quint8_contigTrue,short,False,11.319229,0.000000 +PyTorch,add_relu,add_relu_N8_dtypetorch.qint8_contigFalse,short,False,11.153031,0.000000 +PyTorch,add_relu,add_relu_N8_dtypetorch.qint8_contigTrue,short,False,11.185324,0.000000 +PyTorch,add_relu,add_relu_N8_dtypetorch.qint32_contigFalse,short,False,11.368479,0.000000 +PyTorch,add_relu,add_relu_N8_dtypetorch.qint32_contigTrue,short,False,11.326698,0.000000 +PyTorch,add_relu,add_relu_N64_dtypetorch.quint8_contigFalse,short,False,29.288667,0.000000 +PyTorch,add_relu,add_relu_N64_dtypetorch.quint8_contigTrue,short,False,81.897881,0.000000 +PyTorch,add_relu,add_relu_N64_dtypetorch.qint8_contigFalse,short,False,39.738525,0.000000 +PyTorch,add_relu,add_relu_N64_dtypetorch.qint8_contigTrue,short,False,82.035375,0.000000 +PyTorch,add_relu,add_relu_N64_dtypetorch.qint32_contigFalse,short,False,43.063633,0.000000 +PyTorch,add_relu,add_relu_N64_dtypetorch.qint32_contigTrue,short,False,89.797751,0.000000 +PyTorch,add_relu,add_relu_N512_dtypetorch.quint8_contigFalse,short,False,186.276330,0.000000 +PyTorch,add_relu,add_relu_N512_dtypetorch.quint8_contigTrue,short,False,621.216089,0.000000 +PyTorch,add_relu,add_relu_N512_dtypetorch.qint8_contigFalse,short,False,397.837161,0.000000 +PyTorch,add_relu,add_relu_N512_dtypetorch.qint8_contigTrue,short,False,626.707880,0.000000 +PyTorch,add_relu,add_relu_N512_dtypetorch.qint32_contigFalse,short,False,399.039524,0.000000 +PyTorch,add_relu,add_relu_N512_dtypetorch.qint32_contigTrue,short,False,695.372335,0.000000 +PyTorch,mul,mul_N2_dtypetorch.quint8_contigFalse,short,False,10.792049,0.000000 
+PyTorch,mul,mul_N2_dtypetorch.quint8_contigTrue,short,False,10.337356,0.000000 +PyTorch,mul,mul_N2_dtypetorch.qint8_contigFalse,short,False,29.766997,0.000000 +PyTorch,mul,mul_N2_dtypetorch.qint8_contigTrue,short,False,10.670764,0.000000 +PyTorch,mul,mul_N2_dtypetorch.qint32_contigFalse,short,False,10.747730,0.000000 +PyTorch,mul,mul_N2_dtypetorch.qint32_contigTrue,short,False,10.272625,0.000000 +PyTorch,mul,mul_N8_dtypetorch.quint8_contigFalse,short,False,11.249079,0.000000 +PyTorch,mul,mul_N8_dtypetorch.quint8_contigTrue,short,False,10.184144,0.000000 +PyTorch,mul,mul_N8_dtypetorch.qint8_contigFalse,short,False,412.500754,0.000000 +PyTorch,mul,mul_N8_dtypetorch.qint8_contigTrue,short,False,380.488152,0.000000 +PyTorch,mul,mul_N8_dtypetorch.qint32_contigFalse,short,False,11.217967,0.000000 +PyTorch,mul,mul_N8_dtypetorch.qint32_contigTrue,short,False,10.372477,0.000000 +PyTorch,mul,mul_N64_dtypetorch.quint8_contigFalse,short,False,26.384046,0.000000 +PyTorch,mul,mul_N64_dtypetorch.quint8_contigTrue,short,False,13.281053,0.000000 +PyTorch,mul,mul_N64_dtypetorch.qint8_contigFalse,short,False,427.333217,0.000000 +PyTorch,mul,mul_N64_dtypetorch.qint8_contigTrue,short,False,378.800277,0.000000 +PyTorch,mul,mul_N64_dtypetorch.qint32_contigFalse,short,False,22.636102,0.000000 +PyTorch,mul,mul_N64_dtypetorch.qint32_contigTrue,short,False,13.891831,0.000000 +PyTorch,mul,mul_N512_dtypetorch.quint8_contigFalse,short,False,324.837860,0.000000 +PyTorch,mul,mul_N512_dtypetorch.quint8_contigTrue,short,False,70.655191,0.000000 +PyTorch,mul,mul_N512_dtypetorch.qint8_contigFalse,short,False,697.828340,0.000000 +PyTorch,mul,mul_N512_dtypetorch.qint8_contigTrue,short,False,414.893995,0.000000 +PyTorch,mul,mul_N512_dtypetorch.qint32_contigFalse,short,False,140.090565,0.000000 +PyTorch,mul,mul_N512_dtypetorch.qint32_contigTrue,short,False,72.970641,0.000000 +PyTorch,add_scalar,add_scalar_N2_dtypetorch.quint8_contigFalse,short,False,9.650154,0.000000 
+PyTorch,add_scalar,add_scalar_N2_dtypetorch.quint8_contigTrue,short,False,9.056958,0.000000 +PyTorch,add_scalar,add_scalar_N2_dtypetorch.qint8_contigFalse,short,False,10.032105,0.000000 +PyTorch,add_scalar,add_scalar_N2_dtypetorch.qint8_contigTrue,short,False,9.419741,0.000000 +PyTorch,add_scalar,add_scalar_N2_dtypetorch.qint32_contigFalse,short,False,9.857270,0.000000 +PyTorch,add_scalar,add_scalar_N2_dtypetorch.qint32_contigTrue,short,False,9.260383,0.000000 +PyTorch,add_scalar,add_scalar_N8_dtypetorch.quint8_contigFalse,short,False,10.275563,0.000000 +PyTorch,add_scalar,add_scalar_N8_dtypetorch.quint8_contigTrue,short,False,8.914322,0.000000 +PyTorch,add_scalar,add_scalar_N8_dtypetorch.qint8_contigFalse,short,False,9.973162,0.000000 +PyTorch,add_scalar,add_scalar_N8_dtypetorch.qint8_contigTrue,short,False,9.329676,0.000000 +PyTorch,add_scalar,add_scalar_N8_dtypetorch.qint32_contigFalse,short,False,9.742725,0.000000 +PyTorch,add_scalar,add_scalar_N8_dtypetorch.qint32_contigTrue,short,False,9.058522,0.000000 +PyTorch,add_scalar,add_scalar_N64_dtypetorch.quint8_contigFalse,short,False,20.745533,0.000000 +PyTorch,add_scalar,add_scalar_N64_dtypetorch.quint8_contigTrue,short,False,11.517188,0.000000 +PyTorch,add_scalar,add_scalar_N64_dtypetorch.qint8_contigFalse,short,False,14.588801,0.000000 +PyTorch,add_scalar,add_scalar_N64_dtypetorch.qint8_contigTrue,short,False,9.918611,0.000000 +PyTorch,add_scalar,add_scalar_N64_dtypetorch.qint32_contigFalse,short,False,13.542074,0.000000 +PyTorch,add_scalar,add_scalar_N64_dtypetorch.qint32_contigTrue,short,False,10.794776,0.000000 +PyTorch,add_scalar,add_scalar_N512_dtypetorch.quint8_contigFalse,short,False,120.869888,0.000000 +PyTorch,add_scalar,add_scalar_N512_dtypetorch.quint8_contigTrue,short,False,75.806970,0.000000 +PyTorch,add_scalar,add_scalar_N512_dtypetorch.qint8_contigFalse,short,False,81.201255,0.000000 +PyTorch,add_scalar,add_scalar_N512_dtypetorch.qint8_contigTrue,short,False,55.456395,0.000000 
+PyTorch,add_scalar,add_scalar_N512_dtypetorch.qint32_contigFalse,short,False,85.280151,0.000000 +PyTorch,add_scalar,add_scalar_N512_dtypetorch.qint32_contigTrue,short,False,59.971946,0.000000 +PyTorch,mul_scalar,mul_scalar_N2_dtypetorch.quint8_contigFalse,short,False,9.801843,0.000000 +PyTorch,mul_scalar,mul_scalar_N2_dtypetorch.quint8_contigTrue,short,False,9.290992,0.000000 +PyTorch,mul_scalar,mul_scalar_N2_dtypetorch.qint8_contigFalse,short,False,9.980126,0.000000 +PyTorch,mul_scalar,mul_scalar_N2_dtypetorch.qint8_contigTrue,short,False,9.359637,0.000000 +PyTorch,mul_scalar,mul_scalar_N2_dtypetorch.qint32_contigFalse,short,False,9.915617,0.000000 +PyTorch,mul_scalar,mul_scalar_N2_dtypetorch.qint32_contigTrue,short,False,9.210668,0.000000 +PyTorch,mul_scalar,mul_scalar_N8_dtypetorch.quint8_contigFalse,short,False,9.820922,0.000000 +PyTorch,mul_scalar,mul_scalar_N8_dtypetorch.quint8_contigTrue,short,False,9.130066,0.000000 +PyTorch,mul_scalar,mul_scalar_N8_dtypetorch.qint8_contigFalse,short,False,9.822860,0.000000 +PyTorch,mul_scalar,mul_scalar_N8_dtypetorch.qint8_contigTrue,short,False,9.208939,0.000000 +PyTorch,mul_scalar,mul_scalar_N8_dtypetorch.qint32_contigFalse,short,False,9.923802,0.000000 +PyTorch,mul_scalar,mul_scalar_N8_dtypetorch.qint32_contigTrue,short,False,9.228233,0.000000 +PyTorch,mul_scalar,mul_scalar_N64_dtypetorch.quint8_contigFalse,short,False,13.801614,0.000000 +PyTorch,mul_scalar,mul_scalar_N64_dtypetorch.quint8_contigTrue,short,False,9.730629,0.000000 +PyTorch,mul_scalar,mul_scalar_N64_dtypetorch.qint8_contigFalse,short,False,14.292015,0.000000 +PyTorch,mul_scalar,mul_scalar_N64_dtypetorch.qint8_contigTrue,short,False,9.772135,0.000000 +PyTorch,mul_scalar,mul_scalar_N64_dtypetorch.qint32_contigFalse,short,False,13.532725,0.000000 +PyTorch,mul_scalar,mul_scalar_N64_dtypetorch.qint32_contigTrue,short,False,10.971262,0.000000 +PyTorch,mul_scalar,mul_scalar_N512_dtypetorch.quint8_contigFalse,short,False,79.350580,0.000000 
+PyTorch,mul_scalar,mul_scalar_N512_dtypetorch.quint8_contigTrue,short,False,56.108255,0.000000 +PyTorch,mul_scalar,mul_scalar_N512_dtypetorch.qint8_contigFalse,short,False,80.221636,0.000000 +PyTorch,mul_scalar,mul_scalar_N512_dtypetorch.qint8_contigTrue,short,False,54.967161,0.000000 +PyTorch,mul_scalar,mul_scalar_N512_dtypetorch.qint32_contigFalse,short,False,85.677349,0.000000 +PyTorch,mul_scalar,mul_scalar_N512_dtypetorch.qint32_contigTrue,short,False,58.340807,0.000000 +PyTorch,qatEmbeddingBag,qatEmbeddingBag_embeddingbags10_dim64_modesum_input_size8_offset0_sparseFalse_include_last_offsetTrue_cpu,short,False,274.988859,0.000000 +PyTorch,qatEmbeddingBag,qatEmbeddingBag_embeddingbags10_dim64_modesum_input_size8_offset0_sparseFalse_include_last_offsetFalse_cpu,short,False,314.877017,0.000000 +PyTorch,qatEmbeddingBag,qatEmbeddingBag_embeddingbags10_dim64_modesum_input_size16_offset0_sparseFalse_include_last_offsetTrue_cpu,short,False,274.143065,0.000000 +PyTorch,qatEmbeddingBag,qatEmbeddingBag_embeddingbags10_dim64_modesum_input_size16_offset0_sparseFalse_include_last_offsetFalse_cpu,short,False,333.170297,0.000000 +PyTorch,qatEmbeddingBag,qatEmbeddingBag_embeddingbags10_dim64_modesum_input_size64_offset0_sparseFalse_include_last_offsetTrue_cpu,short,False,276.114808,0.000000 +PyTorch,qatEmbeddingBag,qatEmbeddingBag_embeddingbags10_dim64_modesum_input_size64_offset0_sparseFalse_include_last_offsetFalse_cpu,short,False,318.133386,0.000000 +PyTorch,qatEmbeddingBag,qatEmbeddingBag_embeddingbags120_dim64_modesum_input_size8_offset0_sparseFalse_include_last_offsetTrue_cpu,short,False,316.446400,0.000000 +PyTorch,qatEmbeddingBag,qatEmbeddingBag_embeddingbags120_dim64_modesum_input_size8_offset0_sparseFalse_include_last_offsetFalse_cpu,short,False,351.285540,0.000000 +PyTorch,qatEmbeddingBag,qatEmbeddingBag_embeddingbags120_dim64_modesum_input_size16_offset0_sparseFalse_include_last_offsetTrue_cpu,short,False,316.018478,0.000000 
+PyTorch,qatEmbeddingBag,qatEmbeddingBag_embeddingbags120_dim64_modesum_input_size16_offset0_sparseFalse_include_last_offsetFalse_cpu,short,False,351.023262,0.000000 +PyTorch,qatEmbeddingBag,qatEmbeddingBag_embeddingbags120_dim64_modesum_input_size64_offset0_sparseFalse_include_last_offsetTrue_cpu,short,False,314.584634,0.000000 +PyTorch,qatEmbeddingBag,qatEmbeddingBag_embeddingbags120_dim64_modesum_input_size64_offset0_sparseFalse_include_last_offsetFalse_cpu,short,False,348.879078,0.000000 +PyTorch,qatEmbeddingBag,qatEmbeddingBag_embeddingbags1000_dim64_modesum_input_size8_offset0_sparseFalse_include_last_offsetTrue_cpu,short,False,510.666462,0.000000 +PyTorch,qatEmbeddingBag,qatEmbeddingBag_embeddingbags1000_dim64_modesum_input_size8_offset0_sparseFalse_include_last_offsetFalse_cpu,short,False,546.541658,0.000000 +PyTorch,qatEmbeddingBag,qatEmbeddingBag_embeddingbags1000_dim64_modesum_input_size16_offset0_sparseFalse_include_last_offsetTrue_cpu,short,False,513.146251,0.000000 +PyTorch,qatEmbeddingBag,qatEmbeddingBag_embeddingbags1000_dim64_modesum_input_size16_offset0_sparseFalse_include_last_offsetFalse_cpu,short,False,544.085314,0.000000 +PyTorch,qatEmbeddingBag,qatEmbeddingBag_embeddingbags1000_dim64_modesum_input_size64_offset0_sparseFalse_include_last_offsetTrue_cpu,short,False,512.262547,0.000000 +PyTorch,qatEmbeddingBag,qatEmbeddingBag_embeddingbags1000_dim64_modesum_input_size64_offset0_sparseFalse_include_last_offsetFalse_cpu,short,False,563.350471,0.000000 +PyTorch,qatEmbeddingBag,qatEmbeddingBag_embeddingbags2300_dim64_modesum_input_size8_offset0_sparseFalse_include_last_offsetTrue_cpu,short,False,526.527040,0.000000 +PyTorch,qatEmbeddingBag,qatEmbeddingBag_embeddingbags2300_dim64_modesum_input_size8_offset0_sparseFalse_include_last_offsetFalse_cpu,short,False,561.490715,0.000000 +PyTorch,qatEmbeddingBag,qatEmbeddingBag_embeddingbags2300_dim64_modesum_input_size16_offset0_sparseFalse_include_last_offsetTrue_cpu,short,False,526.299266,0.000000 
+PyTorch,qatEmbeddingBag,qatEmbeddingBag_embeddingbags2300_dim64_modesum_input_size16_offset0_sparseFalse_include_last_offsetFalse_cpu,short,False,563.797929,0.000000 +PyTorch,qatEmbeddingBag,qatEmbeddingBag_embeddingbags2300_dim64_modesum_input_size64_offset0_sparseFalse_include_last_offsetTrue_cpu,short,False,533.919534,0.000000 +PyTorch,qatEmbeddingBag,qatEmbeddingBag_embeddingbags2300_dim64_modesum_input_size64_offset0_sparseFalse_include_last_offsetFalse_cpu,short,False,585.499031,0.000000 +PyTorch,qatEmbeddingBag,qatEmbeddingBag_embeddingbags10_dim64_modesum_input_size8_offset0_sparseFalse_include_last_offsetTrue_cpu_BACKWARD,short,True,77.160832,0.000000 +PyTorch,qatEmbeddingBag,qatEmbeddingBag_embeddingbags10_dim64_modesum_input_size8_offset0_sparseFalse_include_last_offsetFalse_cpu_BACKWARD,short,True,77.230151,0.000000 +PyTorch,qatEmbeddingBag,qatEmbeddingBag_embeddingbags10_dim64_modesum_input_size16_offset0_sparseFalse_include_last_offsetTrue_cpu_BACKWARD,short,True,77.935535,0.000000 +PyTorch,qatEmbeddingBag,qatEmbeddingBag_embeddingbags10_dim64_modesum_input_size16_offset0_sparseFalse_include_last_offsetFalse_cpu_BACKWARD,short,True,77.894121,0.000000 +PyTorch,qatEmbeddingBag,qatEmbeddingBag_embeddingbags10_dim64_modesum_input_size64_offset0_sparseFalse_include_last_offsetTrue_cpu_BACKWARD,short,True,81.645482,0.000000 +PyTorch,qatEmbeddingBag,qatEmbeddingBag_embeddingbags10_dim64_modesum_input_size64_offset0_sparseFalse_include_last_offsetFalse_cpu_BACKWARD,short,True,81.267530,0.000000 +PyTorch,qatEmbeddingBag,qatEmbeddingBag_embeddingbags120_dim64_modesum_input_size8_offset0_sparseFalse_include_last_offsetTrue_cpu_BACKWARD,short,True,87.730819,0.000000 +PyTorch,qatEmbeddingBag,qatEmbeddingBag_embeddingbags120_dim64_modesum_input_size8_offset0_sparseFalse_include_last_offsetFalse_cpu_BACKWARD,short,True,87.759078,0.000000 
+PyTorch,qatEmbeddingBag,qatEmbeddingBag_embeddingbags120_dim64_modesum_input_size16_offset0_sparseFalse_include_last_offsetTrue_cpu_BACKWARD,short,True,88.382237,0.000000 +PyTorch,qatEmbeddingBag,qatEmbeddingBag_embeddingbags120_dim64_modesum_input_size16_offset0_sparseFalse_include_last_offsetFalse_cpu_BACKWARD,short,True,88.687020,0.000000 +PyTorch,qatEmbeddingBag,qatEmbeddingBag_embeddingbags120_dim64_modesum_input_size64_offset0_sparseFalse_include_last_offsetTrue_cpu_BACKWARD,short,True,92.216803,0.000000 +PyTorch,qatEmbeddingBag,qatEmbeddingBag_embeddingbags120_dim64_modesum_input_size64_offset0_sparseFalse_include_last_offsetFalse_cpu_BACKWARD,short,True,92.051609,0.000000 +PyTorch,qatEmbeddingBag,qatEmbeddingBag_embeddingbags1000_dim64_modesum_input_size8_offset0_sparseFalse_include_last_offsetTrue_cpu_BACKWARD,short,True,318.113337,0.000000 +PyTorch,qatEmbeddingBag,qatEmbeddingBag_embeddingbags1000_dim64_modesum_input_size8_offset0_sparseFalse_include_last_offsetFalse_cpu_BACKWARD,short,True,316.527647,0.000000 +PyTorch,qatEmbeddingBag,qatEmbeddingBag_embeddingbags1000_dim64_modesum_input_size16_offset0_sparseFalse_include_last_offsetTrue_cpu_BACKWARD,short,True,311.871957,0.000000 +PyTorch,qatEmbeddingBag,qatEmbeddingBag_embeddingbags1000_dim64_modesum_input_size16_offset0_sparseFalse_include_last_offsetFalse_cpu_BACKWARD,short,True,316.786788,0.000000 +PyTorch,qatEmbeddingBag,qatEmbeddingBag_embeddingbags1000_dim64_modesum_input_size64_offset0_sparseFalse_include_last_offsetTrue_cpu_BACKWARD,short,True,318.008949,0.000000 +PyTorch,qatEmbeddingBag,qatEmbeddingBag_embeddingbags1000_dim64_modesum_input_size64_offset0_sparseFalse_include_last_offsetFalse_cpu_BACKWARD,short,True,318.298942,0.000000 +PyTorch,qatEmbeddingBag,qatEmbeddingBag_embeddingbags2300_dim64_modesum_input_size8_offset0_sparseFalse_include_last_offsetTrue_cpu_BACKWARD,short,True,309.078271,0.000000 
+PyTorch,qatEmbeddingBag,qatEmbeddingBag_embeddingbags2300_dim64_modesum_input_size8_offset0_sparseFalse_include_last_offsetFalse_cpu_BACKWARD,short,True,309.316080,0.000000 +PyTorch,qatEmbeddingBag,qatEmbeddingBag_embeddingbags2300_dim64_modesum_input_size16_offset0_sparseFalse_include_last_offsetTrue_cpu_BACKWARD,short,True,309.372130,0.000000 +PyTorch,qatEmbeddingBag,qatEmbeddingBag_embeddingbags2300_dim64_modesum_input_size16_offset0_sparseFalse_include_last_offsetFalse_cpu_BACKWARD,short,True,311.992863,0.000000 +PyTorch,qatEmbeddingBag,qatEmbeddingBag_embeddingbags2300_dim64_modesum_input_size64_offset0_sparseFalse_include_last_offsetTrue_cpu_BACKWARD,short,True,312.211778,0.000000 +PyTorch,qatEmbeddingBag,qatEmbeddingBag_embeddingbags2300_dim64_modesum_input_size64_offset0_sparseFalse_include_last_offsetFalse_cpu_BACKWARD,short,True,311.930870,0.000000 +PyTorch,qatEmbedding,qatEmbedding_num_embeddings10_embedding_dim64_input_size8_cpu,short,False,266.095368,0.000000 +PyTorch,qatEmbedding,qatEmbedding_num_embeddings10_embedding_dim64_input_size16_cpu,short,False,264.323879,0.000000 +PyTorch,qatEmbedding,qatEmbedding_num_embeddings10_embedding_dim64_input_size64_cpu,short,False,265.230784,0.000000 +PyTorch,qatEmbedding,qatEmbedding_num_embeddings120_embedding_dim64_input_size8_cpu,short,False,300.983800,0.000000 +PyTorch,qatEmbedding,qatEmbedding_num_embeddings120_embedding_dim64_input_size16_cpu,short,False,302.473380,0.000000 +PyTorch,qatEmbedding,qatEmbedding_num_embeddings120_embedding_dim64_input_size64_cpu,short,False,302.886389,0.000000 +PyTorch,qatEmbedding,qatEmbedding_num_embeddings1000_embedding_dim64_input_size8_cpu,short,False,497.948795,0.000000 +PyTorch,qatEmbedding,qatEmbedding_num_embeddings1000_embedding_dim64_input_size16_cpu,short,False,497.101363,0.000000 +PyTorch,qatEmbedding,qatEmbedding_num_embeddings1000_embedding_dim64_input_size64_cpu,short,False,498.723660,0.000000 
+PyTorch,qatEmbedding,qatEmbedding_num_embeddings2300_embedding_dim64_input_size8_cpu,short,False,516.198427,0.000000 +PyTorch,qatEmbedding,qatEmbedding_num_embeddings2300_embedding_dim64_input_size16_cpu,short,False,516.910952,0.000000 +PyTorch,qatEmbedding,qatEmbedding_num_embeddings2300_embedding_dim64_input_size64_cpu,short,False,518.768045,0.000000 +PyTorch,qatEmbedding,qatEmbedding_num_embeddings10_embedding_dim64_input_size8_cpu_BACKWARD,short,True,64.304382,0.000000 +PyTorch,qatEmbedding,qatEmbedding_num_embeddings10_embedding_dim64_input_size16_cpu_BACKWARD,short,True,65.962808,0.000000 +PyTorch,qatEmbedding,qatEmbedding_num_embeddings10_embedding_dim64_input_size64_cpu_BACKWARD,short,True,71.122468,0.000000 +PyTorch,qatEmbedding,qatEmbedding_num_embeddings120_embedding_dim64_input_size8_cpu_BACKWARD,short,True,73.623478,0.000000 +PyTorch,qatEmbedding,qatEmbedding_num_embeddings120_embedding_dim64_input_size16_cpu_BACKWARD,short,True,75.755343,0.000000 +PyTorch,qatEmbedding,qatEmbedding_num_embeddings120_embedding_dim64_input_size64_cpu_BACKWARD,short,True,81.115363,0.000000 +PyTorch,qatEmbedding,qatEmbedding_num_embeddings1000_embedding_dim64_input_size8_cpu_BACKWARD,short,True,295.989743,0.000000 +PyTorch,qatEmbedding,qatEmbedding_num_embeddings1000_embedding_dim64_input_size16_cpu_BACKWARD,short,True,296.732952,0.000000 +PyTorch,qatEmbedding,qatEmbedding_num_embeddings1000_embedding_dim64_input_size64_cpu_BACKWARD,short,True,303.545079,0.000000 +PyTorch,qatEmbedding,qatEmbedding_num_embeddings2300_embedding_dim64_input_size8_cpu_BACKWARD,short,True,332.342200,0.000000 +PyTorch,qatEmbedding,qatEmbedding_num_embeddings2300_embedding_dim64_input_size16_cpu_BACKWARD,short,True,333.213785,0.000000 +PyTorch,qatEmbedding,qatEmbedding_num_embeddings2300_embedding_dim64_input_size64_cpu_BACKWARD,short,True,339.762786,0.000000 +PyTorch,QBatchNorm1d,QBatchNorm1d_M1_N256_K3136_cpu_dtypetorch.qint8,short,False,1279.230735,0.000000 
+PyTorch,QBatchNorm2d,QBatchNorm2d_M1_N256_K3136_cpu_dtypetorch.qint8,short,False,1143.587020,0.000000 +PyTorch,qcat,qcat_M256_N512_K1_L2_dim0_contigall_dtypetorch.quint8,short,False,229.089037,0.000000 +PyTorch,qcat,qcat_M256_N512_K1_L2_dim0_contigall_dtypetorch.qint8,short,False,229.814037,0.000000 +PyTorch,qcat,qcat_M256_N512_K1_L2_dim0_contigall_dtypetorch.qint32,short,False,919.673338,0.000000 +PyTorch,qcat,qcat_M256_N512_K1_L2_dim0_contigone_dtypetorch.quint8,short,False,301.101660,0.000000 +PyTorch,qcat,qcat_M256_N512_K1_L2_dim0_contigone_dtypetorch.qint8,short,False,300.354370,0.000000 +PyTorch,qcat,qcat_M256_N512_K1_L2_dim0_contigone_dtypetorch.qint32,short,False,996.242370,0.000000 +PyTorch,qcat,qcat_M256_N512_K1_L2_dim0_contignone_dtypetorch.quint8,short,False,367.358463,0.000000 +PyTorch,qcat,qcat_M256_N512_K1_L2_dim0_contignone_dtypetorch.qint8,short,False,373.531795,0.000000 +PyTorch,qcat,qcat_M256_N512_K1_L2_dim0_contignone_dtypetorch.qint32,short,False,1071.199771,0.000000 +PyTorch,qcat,qcat_M512_N512_K2_L1_dim1_contigall_dtypetorch.quint8,short,False,355.003390,0.000000 +PyTorch,qcat,qcat_M512_N512_K2_L1_dim1_contigall_dtypetorch.qint8,short,False,357.724388,0.000000 +PyTorch,qcat,qcat_M512_N512_K2_L1_dim1_contigall_dtypetorch.qint32,short,False,1591.623679,0.000000 +PyTorch,qcat,qcat_M512_N512_K2_L1_dim1_contigone_dtypetorch.quint8,short,False,458.641811,0.000000 +PyTorch,qcat,qcat_M512_N512_K2_L1_dim1_contigone_dtypetorch.qint8,short,False,458.108343,0.000000 +PyTorch,qcat,qcat_M512_N512_K2_L1_dim1_contigone_dtypetorch.qint32,short,False,1715.952436,0.000000 +PyTorch,qcat,qcat_M512_N512_K2_L1_dim1_contignone_dtypetorch.quint8,short,False,556.800793,0.000000 +PyTorch,qcat,qcat_M512_N512_K2_L1_dim1_contignone_dtypetorch.qint8,short,False,557.022942,0.000000 +PyTorch,qcat,qcat_M512_N512_K2_L1_dim1_contignone_dtypetorch.qint32,short,False,1831.625177,0.000000 
+PyTorch,eq,eq_N8_dtypetorch.quint8_contigFalse_other_scalarFalse_out_variantFalse,short,False,10.659249,0.000000 +PyTorch,eq,eq_N8_dtypetorch.quint8_contigFalse_other_scalarFalse_out_variantTrue,short,False,24.488580,0.000000 +PyTorch,eq,eq_N8_dtypetorch.quint8_contigFalse_other_scalarTrue_out_variantFalse,short,False,14.062653,0.000000 +PyTorch,eq,eq_N8_dtypetorch.quint8_contigFalse_other_scalarTrue_out_variantTrue,short,False,29.175123,0.000000 +PyTorch,eq,eq_N8_dtypetorch.quint8_contigTrue_other_scalarFalse_out_variantFalse,short,False,7.031340,0.000000 +PyTorch,eq,eq_N8_dtypetorch.quint8_contigTrue_other_scalarFalse_out_variantTrue,short,False,18.240752,0.000000 +PyTorch,eq,eq_N8_dtypetorch.quint8_contigTrue_other_scalarTrue_out_variantFalse,short,False,10.901555,0.000000 +PyTorch,eq,eq_N8_dtypetorch.quint8_contigTrue_other_scalarTrue_out_variantTrue,short,False,23.333026,0.000000 +PyTorch,eq,eq_N8_dtypetorch.qint8_contigFalse_other_scalarFalse_out_variantFalse,short,False,10.366241,0.000000 +PyTorch,eq,eq_N8_dtypetorch.qint8_contigFalse_other_scalarFalse_out_variantTrue,short,False,23.646604,0.000000 +PyTorch,eq,eq_N8_dtypetorch.qint8_contigFalse_other_scalarTrue_out_variantFalse,short,False,14.343720,0.000000 +PyTorch,eq,eq_N8_dtypetorch.qint8_contigFalse_other_scalarTrue_out_variantTrue,short,False,28.861064,0.000000 +PyTorch,eq,eq_N8_dtypetorch.qint8_contigTrue_other_scalarFalse_out_variantFalse,short,False,6.998121,0.000000 +PyTorch,eq,eq_N8_dtypetorch.qint8_contigTrue_other_scalarFalse_out_variantTrue,short,False,17.624672,0.000000 +PyTorch,eq,eq_N8_dtypetorch.qint8_contigTrue_other_scalarTrue_out_variantFalse,short,False,10.924173,0.000000 +PyTorch,eq,eq_N8_dtypetorch.qint8_contigTrue_other_scalarTrue_out_variantTrue,short,False,23.223008,0.000000 +PyTorch,eq,eq_N8_dtypetorch.qint32_contigFalse_other_scalarFalse_out_variantFalse,short,False,10.916533,0.000000 
+PyTorch,eq,eq_N8_dtypetorch.qint32_contigFalse_other_scalarFalse_out_variantTrue,short,False,24.926139,0.000000 +PyTorch,eq,eq_N8_dtypetorch.qint32_contigFalse_other_scalarTrue_out_variantFalse,short,False,14.413789,0.000000 +PyTorch,eq,eq_N8_dtypetorch.qint32_contigFalse_other_scalarTrue_out_variantTrue,short,False,29.167968,0.000000 +PyTorch,eq,eq_N8_dtypetorch.qint32_contigTrue_other_scalarFalse_out_variantFalse,short,False,7.286591,0.000000 +PyTorch,eq,eq_N8_dtypetorch.qint32_contigTrue_other_scalarFalse_out_variantTrue,short,False,19.297183,0.000000 +PyTorch,eq,eq_N8_dtypetorch.qint32_contigTrue_other_scalarTrue_out_variantFalse,short,False,11.087414,0.000000 +PyTorch,eq,eq_N8_dtypetorch.qint32_contigTrue_other_scalarTrue_out_variantTrue,short,False,23.674432,0.000000 +PyTorch,eq,eq_N64_dtypetorch.quint8_contigFalse_other_scalarFalse_out_variantFalse,short,False,18.425990,0.000000 +PyTorch,eq,eq_N64_dtypetorch.quint8_contigFalse_other_scalarFalse_out_variantTrue,short,False,33.055810,0.000000 +PyTorch,eq,eq_N64_dtypetorch.quint8_contigFalse_other_scalarTrue_out_variantFalse,short,False,21.737632,0.000000 +PyTorch,eq,eq_N64_dtypetorch.quint8_contigFalse_other_scalarTrue_out_variantTrue,short,False,37.173348,0.000000 +PyTorch,eq,eq_N64_dtypetorch.quint8_contigTrue_other_scalarFalse_out_variantFalse,short,False,11.547812,0.000000 +PyTorch,eq,eq_N64_dtypetorch.quint8_contigTrue_other_scalarFalse_out_variantTrue,short,False,24.831548,0.000000 +PyTorch,eq,eq_N64_dtypetorch.quint8_contigTrue_other_scalarTrue_out_variantFalse,short,False,16.424478,0.000000 +PyTorch,eq,eq_N64_dtypetorch.quint8_contigTrue_other_scalarTrue_out_variantTrue,short,False,28.738332,0.000000 +PyTorch,eq,eq_N64_dtypetorch.qint8_contigFalse_other_scalarFalse_out_variantFalse,short,False,19.230981,0.000000 +PyTorch,eq,eq_N64_dtypetorch.qint8_contigFalse_other_scalarFalse_out_variantTrue,short,False,34.484918,0.000000 
+PyTorch,eq,eq_N64_dtypetorch.qint8_contigFalse_other_scalarTrue_out_variantFalse,short,False,22.740766,0.000000 +PyTorch,eq,eq_N64_dtypetorch.qint8_contigFalse_other_scalarTrue_out_variantTrue,short,False,38.301714,0.000000 +PyTorch,eq,eq_N64_dtypetorch.qint8_contigTrue_other_scalarFalse_out_variantFalse,short,False,10.705394,0.000000 +PyTorch,eq,eq_N64_dtypetorch.qint8_contigTrue_other_scalarFalse_out_variantTrue,short,False,24.413391,0.000000 +PyTorch,eq,eq_N64_dtypetorch.qint8_contigTrue_other_scalarTrue_out_variantFalse,short,False,16.401949,0.000000 +PyTorch,eq,eq_N64_dtypetorch.qint8_contigTrue_other_scalarTrue_out_variantTrue,short,False,28.602660,0.000000 +PyTorch,eq,eq_N64_dtypetorch.qint32_contigFalse_other_scalarFalse_out_variantFalse,short,False,28.037415,0.000000 +PyTorch,eq,eq_N64_dtypetorch.qint32_contigFalse_other_scalarFalse_out_variantTrue,short,False,43.889381,0.000000 +PyTorch,eq,eq_N64_dtypetorch.qint32_contigFalse_other_scalarTrue_out_variantFalse,short,False,27.580923,0.000000 +PyTorch,eq,eq_N64_dtypetorch.qint32_contigFalse_other_scalarTrue_out_variantTrue,short,False,43.491900,0.000000 +PyTorch,eq,eq_N64_dtypetorch.qint32_contigTrue_other_scalarFalse_out_variantFalse,short,False,21.994874,0.000000 +PyTorch,eq,eq_N64_dtypetorch.qint32_contigTrue_other_scalarFalse_out_variantTrue,short,False,34.649429,0.000000 +PyTorch,eq,eq_N64_dtypetorch.qint32_contigTrue_other_scalarTrue_out_variantFalse,short,False,20.859801,0.000000 +PyTorch,eq,eq_N64_dtypetorch.qint32_contigTrue_other_scalarTrue_out_variantTrue,short,False,33.119628,0.000000 +PyTorch,ne,ne_N8_dtypetorch.quint8_contigFalse_other_scalarFalse_out_variantFalse,short,False,10.472581,0.000000 +PyTorch,ne,ne_N8_dtypetorch.quint8_contigFalse_other_scalarFalse_out_variantTrue,short,False,24.114184,0.000000 +PyTorch,ne,ne_N8_dtypetorch.quint8_contigFalse_other_scalarTrue_out_variantFalse,short,False,14.017749,0.000000 
+PyTorch,ne,ne_N8_dtypetorch.quint8_contigFalse_other_scalarTrue_out_variantTrue,short,False,29.735235,0.000000 +PyTorch,ne,ne_N8_dtypetorch.quint8_contigTrue_other_scalarFalse_out_variantFalse,short,False,6.569071,0.000000 +PyTorch,ne,ne_N8_dtypetorch.quint8_contigTrue_other_scalarFalse_out_variantTrue,short,False,17.797276,0.000000 +PyTorch,ne,ne_N8_dtypetorch.quint8_contigTrue_other_scalarTrue_out_variantFalse,short,False,10.891585,0.000000 +PyTorch,ne,ne_N8_dtypetorch.quint8_contigTrue_other_scalarTrue_out_variantTrue,short,False,23.659451,0.000000 +PyTorch,ne,ne_N8_dtypetorch.qint8_contigFalse_other_scalarFalse_out_variantFalse,short,False,10.143022,0.000000 +PyTorch,ne,ne_N8_dtypetorch.qint8_contigFalse_other_scalarFalse_out_variantTrue,short,False,23.786464,0.000000 +PyTorch,ne,ne_N8_dtypetorch.qint8_contigFalse_other_scalarTrue_out_variantFalse,short,False,14.225867,0.000000 +PyTorch,ne,ne_N8_dtypetorch.qint8_contigFalse_other_scalarTrue_out_variantTrue,short,False,29.986286,0.000000 +PyTorch,ne,ne_N8_dtypetorch.qint8_contigTrue_other_scalarFalse_out_variantFalse,short,False,6.614645,0.000000 +PyTorch,ne,ne_N8_dtypetorch.qint8_contigTrue_other_scalarFalse_out_variantTrue,short,False,17.335371,0.000000 +PyTorch,ne,ne_N8_dtypetorch.qint8_contigTrue_other_scalarTrue_out_variantFalse,short,False,11.021240,0.000000 +PyTorch,ne,ne_N8_dtypetorch.qint8_contigTrue_other_scalarTrue_out_variantTrue,short,False,23.611790,0.000000 +PyTorch,ne,ne_N8_dtypetorch.qint32_contigFalse_other_scalarFalse_out_variantFalse,short,False,10.667795,0.000000 +PyTorch,ne,ne_N8_dtypetorch.qint32_contigFalse_other_scalarFalse_out_variantTrue,short,False,24.338721,0.000000 +PyTorch,ne,ne_N8_dtypetorch.qint32_contigFalse_other_scalarTrue_out_variantFalse,short,False,14.562054,0.000000 +PyTorch,ne,ne_N8_dtypetorch.qint32_contigFalse_other_scalarTrue_out_variantTrue,short,False,29.746058,0.000000 
+PyTorch,ne,ne_N8_dtypetorch.qint32_contigTrue_other_scalarFalse_out_variantFalse,short,False,7.040875,0.000000 +PyTorch,ne,ne_N8_dtypetorch.qint32_contigTrue_other_scalarFalse_out_variantTrue,short,False,18.537772,0.000000 +PyTorch,ne,ne_N8_dtypetorch.qint32_contigTrue_other_scalarTrue_out_variantFalse,short,False,11.289554,0.000000 +PyTorch,ne,ne_N8_dtypetorch.qint32_contigTrue_other_scalarTrue_out_variantTrue,short,False,24.121479,0.000000 +PyTorch,ne,ne_N64_dtypetorch.quint8_contigFalse_other_scalarFalse_out_variantFalse,short,False,17.736341,0.000000 +PyTorch,ne,ne_N64_dtypetorch.quint8_contigFalse_other_scalarFalse_out_variantTrue,short,False,32.487414,0.000000 +PyTorch,ne,ne_N64_dtypetorch.quint8_contigFalse_other_scalarTrue_out_variantFalse,short,False,20.927801,0.000000 +PyTorch,ne,ne_N64_dtypetorch.quint8_contigFalse_other_scalarTrue_out_variantTrue,short,False,36.157429,0.000000 +PyTorch,ne,ne_N64_dtypetorch.quint8_contigTrue_other_scalarFalse_out_variantFalse,short,False,11.152495,0.000000 +PyTorch,ne,ne_N64_dtypetorch.quint8_contigTrue_other_scalarFalse_out_variantTrue,short,False,24.151756,0.000000 +PyTorch,ne,ne_N64_dtypetorch.quint8_contigTrue_other_scalarTrue_out_variantFalse,short,False,15.921099,0.000000 +PyTorch,ne,ne_N64_dtypetorch.quint8_contigTrue_other_scalarTrue_out_variantTrue,short,False,28.827231,0.000000 +PyTorch,ne,ne_N64_dtypetorch.qint8_contigFalse_other_scalarFalse_out_variantFalse,short,False,18.198807,0.000000 +PyTorch,ne,ne_N64_dtypetorch.qint8_contigFalse_other_scalarFalse_out_variantTrue,short,False,33.871904,0.000000 +PyTorch,ne,ne_N64_dtypetorch.qint8_contigFalse_other_scalarTrue_out_variantFalse,short,False,21.828119,0.000000 +PyTorch,ne,ne_N64_dtypetorch.qint8_contigFalse_other_scalarTrue_out_variantTrue,short,False,38.920595,0.000000 +PyTorch,ne,ne_N64_dtypetorch.qint8_contigTrue_other_scalarFalse_out_variantFalse,short,False,11.054162,0.000000 
+PyTorch,ne,ne_N64_dtypetorch.qint8_contigTrue_other_scalarFalse_out_variantTrue,short,False,24.071486,0.000000 +PyTorch,ne,ne_N64_dtypetorch.qint8_contigTrue_other_scalarTrue_out_variantFalse,short,False,16.014435,0.000000 +PyTorch,ne,ne_N64_dtypetorch.qint8_contigTrue_other_scalarTrue_out_variantTrue,short,False,29.079400,0.000000 +PyTorch,ne,ne_N64_dtypetorch.qint32_contigFalse_other_scalarFalse_out_variantFalse,short,False,28.000709,0.000000 +PyTorch,ne,ne_N64_dtypetorch.qint32_contigFalse_other_scalarFalse_out_variantTrue,short,False,42.665661,0.000000 +PyTorch,ne,ne_N64_dtypetorch.qint32_contigFalse_other_scalarTrue_out_variantFalse,short,False,26.996536,0.000000 +PyTorch,ne,ne_N64_dtypetorch.qint32_contigFalse_other_scalarTrue_out_variantTrue,short,False,42.408350,0.000000 +PyTorch,ne,ne_N64_dtypetorch.qint32_contigTrue_other_scalarFalse_out_variantFalse,short,False,22.120757,0.000000 +PyTorch,ne,ne_N64_dtypetorch.qint32_contigTrue_other_scalarFalse_out_variantTrue,short,False,34.036985,0.000000 +PyTorch,ne,ne_N64_dtypetorch.qint32_contigTrue_other_scalarTrue_out_variantFalse,short,False,20.305630,0.000000 +PyTorch,ne,ne_N64_dtypetorch.qint32_contigTrue_other_scalarTrue_out_variantTrue,short,False,33.293711,0.000000 +PyTorch,lt,lt_N8_dtypetorch.quint8_contigFalse_other_scalarFalse_out_variantFalse,short,False,10.989175,0.000000 +PyTorch,lt,lt_N8_dtypetorch.quint8_contigFalse_other_scalarFalse_out_variantTrue,short,False,24.022303,0.000000 +PyTorch,lt,lt_N8_dtypetorch.quint8_contigFalse_other_scalarTrue_out_variantFalse,short,False,14.211976,0.000000 +PyTorch,lt,lt_N8_dtypetorch.quint8_contigFalse_other_scalarTrue_out_variantTrue,short,False,28.225586,0.000000 +PyTorch,lt,lt_N8_dtypetorch.quint8_contigTrue_other_scalarFalse_out_variantFalse,short,False,6.725662,0.000000 +PyTorch,lt,lt_N8_dtypetorch.quint8_contigTrue_other_scalarFalse_out_variantTrue,short,False,18.036751,0.000000 
+PyTorch,lt,lt_N8_dtypetorch.quint8_contigTrue_other_scalarTrue_out_variantFalse,short,False,11.195603,0.000000 +PyTorch,lt,lt_N8_dtypetorch.quint8_contigTrue_other_scalarTrue_out_variantTrue,short,False,23.173156,0.000000 +PyTorch,lt,lt_N8_dtypetorch.qint8_contigFalse_other_scalarFalse_out_variantFalse,short,False,10.922803,0.000000 +PyTorch,lt,lt_N8_dtypetorch.qint8_contigFalse_other_scalarFalse_out_variantTrue,short,False,24.063407,0.000000 +PyTorch,lt,lt_N8_dtypetorch.qint8_contigFalse_other_scalarTrue_out_variantFalse,short,False,14.478919,0.000000 +PyTorch,lt,lt_N8_dtypetorch.qint8_contigFalse_other_scalarTrue_out_variantTrue,short,False,28.725090,0.000000 +PyTorch,lt,lt_N8_dtypetorch.qint8_contigTrue_other_scalarFalse_out_variantFalse,short,False,6.556450,0.000000 +PyTorch,lt,lt_N8_dtypetorch.qint8_contigTrue_other_scalarFalse_out_variantTrue,short,False,17.992666,0.000000 +PyTorch,lt,lt_N8_dtypetorch.qint8_contigTrue_other_scalarTrue_out_variantFalse,short,False,11.041052,0.000000 +PyTorch,lt,lt_N8_dtypetorch.qint8_contigTrue_other_scalarTrue_out_variantTrue,short,False,23.128039,0.000000 +PyTorch,lt,lt_N8_dtypetorch.qint32_contigFalse_other_scalarFalse_out_variantFalse,short,False,10.908588,0.000000 +PyTorch,lt,lt_N8_dtypetorch.qint32_contigFalse_other_scalarFalse_out_variantTrue,short,False,24.932022,0.000000 +PyTorch,lt,lt_N8_dtypetorch.qint32_contigFalse_other_scalarTrue_out_variantFalse,short,False,14.509387,0.000000 +PyTorch,lt,lt_N8_dtypetorch.qint32_contigFalse_other_scalarTrue_out_variantTrue,short,False,28.507423,0.000000 +PyTorch,lt,lt_N8_dtypetorch.qint32_contigTrue_other_scalarFalse_out_variantFalse,short,False,6.991223,0.000000 +PyTorch,lt,lt_N8_dtypetorch.qint32_contigTrue_other_scalarFalse_out_variantTrue,short,False,18.883428,0.000000 +PyTorch,lt,lt_N8_dtypetorch.qint32_contigTrue_other_scalarTrue_out_variantFalse,short,False,11.340537,0.000000 
+PyTorch,lt,lt_N8_dtypetorch.qint32_contigTrue_other_scalarTrue_out_variantTrue,short,False,23.474580,0.000000 +PyTorch,lt,lt_N64_dtypetorch.quint8_contigFalse_other_scalarFalse_out_variantFalse,short,False,17.780582,0.000000 +PyTorch,lt,lt_N64_dtypetorch.quint8_contigFalse_other_scalarFalse_out_variantTrue,short,False,33.483268,0.000000 +PyTorch,lt,lt_N64_dtypetorch.quint8_contigFalse_other_scalarTrue_out_variantFalse,short,False,21.736950,0.000000 +PyTorch,lt,lt_N64_dtypetorch.quint8_contigFalse_other_scalarTrue_out_variantTrue,short,False,37.622393,0.000000 +PyTorch,lt,lt_N64_dtypetorch.quint8_contigTrue_other_scalarFalse_out_variantFalse,short,False,11.501619,0.000000 +PyTorch,lt,lt_N64_dtypetorch.quint8_contigTrue_other_scalarFalse_out_variantTrue,short,False,25.636465,0.000000 +PyTorch,lt,lt_N64_dtypetorch.quint8_contigTrue_other_scalarTrue_out_variantFalse,short,False,16.487000,0.000000 +PyTorch,lt,lt_N64_dtypetorch.quint8_contigTrue_other_scalarTrue_out_variantTrue,short,False,28.538948,0.000000 +PyTorch,lt,lt_N64_dtypetorch.qint8_contigFalse_other_scalarFalse_out_variantFalse,short,False,19.407710,0.000000 +PyTorch,lt,lt_N64_dtypetorch.qint8_contigFalse_other_scalarFalse_out_variantTrue,short,False,34.710407,0.000000 +PyTorch,lt,lt_N64_dtypetorch.qint8_contigFalse_other_scalarTrue_out_variantFalse,short,False,23.001715,0.000000 +PyTorch,lt,lt_N64_dtypetorch.qint8_contigFalse_other_scalarTrue_out_variantTrue,short,False,38.803145,0.000000 +PyTorch,lt,lt_N64_dtypetorch.qint8_contigTrue_other_scalarFalse_out_variantFalse,short,False,11.308907,0.000000 +PyTorch,lt,lt_N64_dtypetorch.qint8_contigTrue_other_scalarFalse_out_variantTrue,short,False,25.126098,0.000000 +PyTorch,lt,lt_N64_dtypetorch.qint8_contigTrue_other_scalarTrue_out_variantFalse,short,False,16.409281,0.000000 +PyTorch,lt,lt_N64_dtypetorch.qint8_contigTrue_other_scalarTrue_out_variantTrue,short,False,28.723077,0.000000 
+PyTorch,lt,lt_N64_dtypetorch.qint32_contigFalse_other_scalarFalse_out_variantFalse,short,False,28.078608,0.000000 +PyTorch,lt,lt_N64_dtypetorch.qint32_contigFalse_other_scalarFalse_out_variantTrue,short,False,43.862870,0.000000 +PyTorch,lt,lt_N64_dtypetorch.qint32_contigFalse_other_scalarTrue_out_variantFalse,short,False,28.342684,0.000000 +PyTorch,lt,lt_N64_dtypetorch.qint32_contigFalse_other_scalarTrue_out_variantTrue,short,False,45.247717,0.000000 +PyTorch,lt,lt_N64_dtypetorch.qint32_contigTrue_other_scalarFalse_out_variantFalse,short,False,22.467307,0.000000 +PyTorch,lt,lt_N64_dtypetorch.qint32_contigTrue_other_scalarFalse_out_variantTrue,short,False,35.229839,0.000000 +PyTorch,lt,lt_N64_dtypetorch.qint32_contigTrue_other_scalarTrue_out_variantFalse,short,False,20.828508,0.000000 +PyTorch,lt,lt_N64_dtypetorch.qint32_contigTrue_other_scalarTrue_out_variantTrue,short,False,34.281815,0.000000 +PyTorch,gt,gt_N8_dtypetorch.quint8_contigFalse_other_scalarFalse_out_variantFalse,short,False,10.201065,0.000000 +PyTorch,gt,gt_N8_dtypetorch.quint8_contigFalse_other_scalarFalse_out_variantTrue,short,False,24.046987,0.000000 +PyTorch,gt,gt_N8_dtypetorch.quint8_contigFalse_other_scalarTrue_out_variantFalse,short,False,13.518527,0.000000 +PyTorch,gt,gt_N8_dtypetorch.quint8_contigFalse_other_scalarTrue_out_variantTrue,short,False,28.247002,0.000000 +PyTorch,gt,gt_N8_dtypetorch.quint8_contigTrue_other_scalarFalse_out_variantFalse,short,False,6.413535,0.000000 +PyTorch,gt,gt_N8_dtypetorch.quint8_contigTrue_other_scalarFalse_out_variantTrue,short,False,17.443923,0.000000 +PyTorch,gt,gt_N8_dtypetorch.quint8_contigTrue_other_scalarTrue_out_variantFalse,short,False,10.946319,0.000000 +PyTorch,gt,gt_N8_dtypetorch.quint8_contigTrue_other_scalarTrue_out_variantTrue,short,False,23.251914,0.000000 +PyTorch,gt,gt_N8_dtypetorch.qint8_contigFalse_other_scalarFalse_out_variantFalse,short,False,9.841737,0.000000 
+PyTorch,gt,gt_N8_dtypetorch.qint8_contigFalse_other_scalarFalse_out_variantTrue,short,False,23.463844,0.000000 +PyTorch,gt,gt_N8_dtypetorch.qint8_contigFalse_other_scalarTrue_out_variantFalse,short,False,13.387307,0.000000 +PyTorch,gt,gt_N8_dtypetorch.qint8_contigFalse_other_scalarTrue_out_variantTrue,short,False,28.580578,0.000000 +PyTorch,gt,gt_N8_dtypetorch.qint8_contigTrue_other_scalarFalse_out_variantFalse,short,False,6.499470,0.000000 +PyTorch,gt,gt_N8_dtypetorch.qint8_contigTrue_other_scalarFalse_out_variantTrue,short,False,17.091755,0.000000 +PyTorch,gt,gt_N8_dtypetorch.qint8_contigTrue_other_scalarTrue_out_variantFalse,short,False,10.880642,0.000000 +PyTorch,gt,gt_N8_dtypetorch.qint8_contigTrue_other_scalarTrue_out_variantTrue,short,False,23.144200,0.000000 +PyTorch,gt,gt_N8_dtypetorch.qint32_contigFalse_other_scalarFalse_out_variantFalse,short,False,10.522574,0.000000 +PyTorch,gt,gt_N8_dtypetorch.qint32_contigFalse_other_scalarFalse_out_variantTrue,short,False,24.733810,0.000000 +PyTorch,gt,gt_N8_dtypetorch.qint32_contigFalse_other_scalarTrue_out_variantFalse,short,False,13.634346,0.000000 +PyTorch,gt,gt_N8_dtypetorch.qint32_contigFalse_other_scalarTrue_out_variantTrue,short,False,28.491347,0.000000 +PyTorch,gt,gt_N8_dtypetorch.qint32_contigTrue_other_scalarFalse_out_variantFalse,short,False,6.759546,0.000000 +PyTorch,gt,gt_N8_dtypetorch.qint32_contigTrue_other_scalarFalse_out_variantTrue,short,False,18.334460,0.000000 +PyTorch,gt,gt_N8_dtypetorch.qint32_contigTrue_other_scalarTrue_out_variantFalse,short,False,11.276761,0.000000 +PyTorch,gt,gt_N8_dtypetorch.qint32_contigTrue_other_scalarTrue_out_variantTrue,short,False,23.338620,0.000000 +PyTorch,gt,gt_N64_dtypetorch.quint8_contigFalse_other_scalarFalse_out_variantFalse,short,False,17.579850,0.000000 +PyTorch,gt,gt_N64_dtypetorch.quint8_contigFalse_other_scalarFalse_out_variantTrue,short,False,33.150634,0.000000 
+PyTorch,gt,gt_N64_dtypetorch.quint8_contigFalse_other_scalarTrue_out_variantFalse,short,False,21.018504,0.000000 +PyTorch,gt,gt_N64_dtypetorch.quint8_contigFalse_other_scalarTrue_out_variantTrue,short,False,37.094236,0.000000 +PyTorch,gt,gt_N64_dtypetorch.quint8_contigTrue_other_scalarFalse_out_variantFalse,short,False,10.386846,0.000000 +PyTorch,gt,gt_N64_dtypetorch.quint8_contigTrue_other_scalarFalse_out_variantTrue,short,False,24.705712,0.000000 +PyTorch,gt,gt_N64_dtypetorch.quint8_contigTrue_other_scalarTrue_out_variantFalse,short,False,16.199474,0.000000 +PyTorch,gt,gt_N64_dtypetorch.quint8_contigTrue_other_scalarTrue_out_variantTrue,short,False,28.768630,0.000000 +PyTorch,gt,gt_N64_dtypetorch.qint8_contigFalse_other_scalarFalse_out_variantFalse,short,False,18.496909,0.000000 +PyTorch,gt,gt_N64_dtypetorch.qint8_contigFalse_other_scalarFalse_out_variantTrue,short,False,34.266361,0.000000 +PyTorch,gt,gt_N64_dtypetorch.qint8_contigFalse_other_scalarTrue_out_variantFalse,short,False,22.630030,0.000000 +PyTorch,gt,gt_N64_dtypetorch.qint8_contigFalse_other_scalarTrue_out_variantTrue,short,False,38.576213,0.000000 +PyTorch,gt,gt_N64_dtypetorch.qint8_contigTrue_other_scalarFalse_out_variantFalse,short,False,10.491930,0.000000 +PyTorch,gt,gt_N64_dtypetorch.qint8_contigTrue_other_scalarFalse_out_variantTrue,short,False,23.950235,0.000000 +PyTorch,gt,gt_N64_dtypetorch.qint8_contigTrue_other_scalarTrue_out_variantFalse,short,False,15.528805,0.000000 +PyTorch,gt,gt_N64_dtypetorch.qint8_contigTrue_other_scalarTrue_out_variantTrue,short,False,28.809764,0.000000 +PyTorch,gt,gt_N64_dtypetorch.qint32_contigFalse_other_scalarFalse_out_variantFalse,short,False,27.852019,0.000000 +PyTorch,gt,gt_N64_dtypetorch.qint32_contigFalse_other_scalarFalse_out_variantTrue,short,False,43.631335,0.000000 +PyTorch,gt,gt_N64_dtypetorch.qint32_contigFalse_other_scalarTrue_out_variantFalse,short,False,28.047012,0.000000 
+PyTorch,gt,gt_N64_dtypetorch.qint32_contigFalse_other_scalarTrue_out_variantTrue,short,False,43.522750,0.000000 +PyTorch,gt,gt_N64_dtypetorch.qint32_contigTrue_other_scalarFalse_out_variantFalse,short,False,21.437350,0.000000 +PyTorch,gt,gt_N64_dtypetorch.qint32_contigTrue_other_scalarFalse_out_variantTrue,short,False,34.323098,0.000000 +PyTorch,gt,gt_N64_dtypetorch.qint32_contigTrue_other_scalarTrue_out_variantFalse,short,False,20.572556,0.000000 +PyTorch,gt,gt_N64_dtypetorch.qint32_contigTrue_other_scalarTrue_out_variantTrue,short,False,33.726399,0.000000 +PyTorch,le,le_N8_dtypetorch.quint8_contigFalse_other_scalarFalse_out_variantFalse,short,False,10.355769,0.000000 +PyTorch,le,le_N8_dtypetorch.quint8_contigFalse_other_scalarFalse_out_variantTrue,short,False,24.231171,0.000000 +PyTorch,le,le_N8_dtypetorch.quint8_contigFalse_other_scalarTrue_out_variantFalse,short,False,14.381682,0.000000 +PyTorch,le,le_N8_dtypetorch.quint8_contigFalse_other_scalarTrue_out_variantTrue,short,False,27.908206,0.000000 +PyTorch,le,le_N8_dtypetorch.quint8_contigTrue_other_scalarFalse_out_variantFalse,short,False,7.015842,0.000000 +PyTorch,le,le_N8_dtypetorch.quint8_contigTrue_other_scalarFalse_out_variantTrue,short,False,18.156515,0.000000 +PyTorch,le,le_N8_dtypetorch.quint8_contigTrue_other_scalarTrue_out_variantFalse,short,False,10.764506,0.000000 +PyTorch,le,le_N8_dtypetorch.quint8_contigTrue_other_scalarTrue_out_variantTrue,short,False,22.775082,0.000000 +PyTorch,le,le_N8_dtypetorch.qint8_contigFalse_other_scalarFalse_out_variantFalse,short,False,10.645387,0.000000 +PyTorch,le,le_N8_dtypetorch.qint8_contigFalse_other_scalarFalse_out_variantTrue,short,False,23.661967,0.000000 +PyTorch,le,le_N8_dtypetorch.qint8_contigFalse_other_scalarTrue_out_variantFalse,short,False,14.528062,0.000000 +PyTorch,le,le_N8_dtypetorch.qint8_contigFalse_other_scalarTrue_out_variantTrue,short,False,28.619186,0.000000 
+PyTorch,le,le_N8_dtypetorch.qint8_contigTrue_other_scalarFalse_out_variantFalse,short,False,6.821544,0.000000 +PyTorch,le,le_N8_dtypetorch.qint8_contigTrue_other_scalarFalse_out_variantTrue,short,False,17.372435,0.000000 +PyTorch,le,le_N8_dtypetorch.qint8_contigTrue_other_scalarTrue_out_variantFalse,short,False,10.892625,0.000000 +PyTorch,le,le_N8_dtypetorch.qint8_contigTrue_other_scalarTrue_out_variantTrue,short,False,22.654621,0.000000 +PyTorch,le,le_N8_dtypetorch.qint32_contigFalse_other_scalarFalse_out_variantFalse,short,False,10.859466,0.000000 +PyTorch,le,le_N8_dtypetorch.qint32_contigFalse_other_scalarFalse_out_variantTrue,short,False,24.897908,0.000000 +PyTorch,le,le_N8_dtypetorch.qint32_contigFalse_other_scalarTrue_out_variantFalse,short,False,14.472520,0.000000 +PyTorch,le,le_N8_dtypetorch.qint32_contigFalse_other_scalarTrue_out_variantTrue,short,False,27.655807,0.000000 +PyTorch,le,le_N8_dtypetorch.qint32_contigTrue_other_scalarFalse_out_variantFalse,short,False,7.103746,0.000000 +PyTorch,le,le_N8_dtypetorch.qint32_contigTrue_other_scalarFalse_out_variantTrue,short,False,18.891796,0.000000 +PyTorch,le,le_N8_dtypetorch.qint32_contigTrue_other_scalarTrue_out_variantFalse,short,False,11.237153,0.000000 +PyTorch,le,le_N8_dtypetorch.qint32_contigTrue_other_scalarTrue_out_variantTrue,short,False,23.076524,0.000000 +PyTorch,le,le_N64_dtypetorch.quint8_contigFalse_other_scalarFalse_out_variantFalse,short,False,18.089216,0.000000 +PyTorch,le,le_N64_dtypetorch.quint8_contigFalse_other_scalarFalse_out_variantTrue,short,False,33.345103,0.000000 +PyTorch,le,le_N64_dtypetorch.quint8_contigFalse_other_scalarTrue_out_variantFalse,short,False,21.725297,0.000000 +PyTorch,le,le_N64_dtypetorch.quint8_contigFalse_other_scalarTrue_out_variantTrue,short,False,35.991615,0.000000 +PyTorch,le,le_N64_dtypetorch.quint8_contigTrue_other_scalarFalse_out_variantFalse,short,False,12.072585,0.000000 
+PyTorch,le,le_N64_dtypetorch.quint8_contigTrue_other_scalarFalse_out_variantTrue,short,False,24.803279,0.000000 +PyTorch,le,le_N64_dtypetorch.quint8_contigTrue_other_scalarTrue_out_variantFalse,short,False,16.287302,0.000000 +PyTorch,le,le_N64_dtypetorch.quint8_contigTrue_other_scalarTrue_out_variantTrue,short,False,28.200946,0.000000 +PyTorch,le,le_N64_dtypetorch.qint8_contigFalse_other_scalarFalse_out_variantFalse,short,False,19.513103,0.000000 +PyTorch,le,le_N64_dtypetorch.qint8_contigFalse_other_scalarFalse_out_variantTrue,short,False,34.783793,0.000000 +PyTorch,le,le_N64_dtypetorch.qint8_contigFalse_other_scalarTrue_out_variantFalse,short,False,22.548814,0.000000 +PyTorch,le,le_N64_dtypetorch.qint8_contigFalse_other_scalarTrue_out_variantTrue,short,False,37.271383,0.000000 +PyTorch,le,le_N64_dtypetorch.qint8_contigTrue_other_scalarFalse_out_variantFalse,short,False,11.784068,0.000000 +PyTorch,le,le_N64_dtypetorch.qint8_contigTrue_other_scalarFalse_out_variantTrue,short,False,24.427171,0.000000 +PyTorch,le,le_N64_dtypetorch.qint8_contigTrue_other_scalarTrue_out_variantFalse,short,False,16.172816,0.000000 +PyTorch,le,le_N64_dtypetorch.qint8_contigTrue_other_scalarTrue_out_variantTrue,short,False,28.083668,0.000000 +PyTorch,le,le_N64_dtypetorch.qint32_contigFalse_other_scalarFalse_out_variantFalse,short,False,28.238695,0.000000 +PyTorch,le,le_N64_dtypetorch.qint32_contigFalse_other_scalarFalse_out_variantTrue,short,False,44.109961,0.000000 +PyTorch,le,le_N64_dtypetorch.qint32_contigFalse_other_scalarTrue_out_variantFalse,short,False,28.149361,0.000000 +PyTorch,le,le_N64_dtypetorch.qint32_contigFalse_other_scalarTrue_out_variantTrue,short,False,41.709949,0.000000 +PyTorch,le,le_N64_dtypetorch.qint32_contigTrue_other_scalarFalse_out_variantFalse,short,False,22.886642,0.000000 +PyTorch,le,le_N64_dtypetorch.qint32_contigTrue_other_scalarFalse_out_variantTrue,short,False,34.559269,0.000000 
+PyTorch,le,le_N64_dtypetorch.qint32_contigTrue_other_scalarTrue_out_variantFalse,short,False,20.791157,0.000000 +PyTorch,le,le_N64_dtypetorch.qint32_contigTrue_other_scalarTrue_out_variantTrue,short,False,33.302911,0.000000 +PyTorch,ge,ge_N8_dtypetorch.quint8_contigFalse_other_scalarFalse_out_variantFalse,short,False,10.306199,0.000000 +PyTorch,ge,ge_N8_dtypetorch.quint8_contigFalse_other_scalarFalse_out_variantTrue,short,False,23.398023,0.000000 +PyTorch,ge,ge_N8_dtypetorch.quint8_contigFalse_other_scalarTrue_out_variantFalse,short,False,14.367481,0.000000 +PyTorch,ge,ge_N8_dtypetorch.quint8_contigFalse_other_scalarTrue_out_variantTrue,short,False,29.014630,0.000000 +PyTorch,ge,ge_N8_dtypetorch.quint8_contigTrue_other_scalarFalse_out_variantFalse,short,False,6.389997,0.000000 +PyTorch,ge,ge_N8_dtypetorch.quint8_contigTrue_other_scalarFalse_out_variantTrue,short,False,17.330705,0.000000 +PyTorch,ge,ge_N8_dtypetorch.quint8_contigTrue_other_scalarTrue_out_variantFalse,short,False,10.804766,0.000000 +PyTorch,ge,ge_N8_dtypetorch.quint8_contigTrue_other_scalarTrue_out_variantTrue,short,False,23.171337,0.000000 +PyTorch,ge,ge_N8_dtypetorch.qint8_contigFalse_other_scalarFalse_out_variantFalse,short,False,10.069797,0.000000 +PyTorch,ge,ge_N8_dtypetorch.qint8_contigFalse_other_scalarFalse_out_variantTrue,short,False,23.063348,0.000000 +PyTorch,ge,ge_N8_dtypetorch.qint8_contigFalse_other_scalarTrue_out_variantFalse,short,False,14.393169,0.000000 +PyTorch,ge,ge_N8_dtypetorch.qint8_contigFalse_other_scalarTrue_out_variantTrue,short,False,29.074848,0.000000 +PyTorch,ge,ge_N8_dtypetorch.qint8_contigTrue_other_scalarFalse_out_variantFalse,short,False,6.426396,0.000000 +PyTorch,ge,ge_N8_dtypetorch.qint8_contigTrue_other_scalarFalse_out_variantTrue,short,False,16.922122,0.000000 +PyTorch,ge,ge_N8_dtypetorch.qint8_contigTrue_other_scalarTrue_out_variantFalse,short,False,10.935307,0.000000 
+PyTorch,ge,ge_N8_dtypetorch.qint8_contigTrue_other_scalarTrue_out_variantTrue,short,False,23.255825,0.000000 +PyTorch,ge,ge_N8_dtypetorch.qint32_contigFalse_other_scalarFalse_out_variantFalse,short,False,10.479719,0.000000 +PyTorch,ge,ge_N8_dtypetorch.qint32_contigFalse_other_scalarFalse_out_variantTrue,short,False,24.519697,0.000000 +PyTorch,ge,ge_N8_dtypetorch.qint32_contigFalse_other_scalarTrue_out_variantFalse,short,False,14.386574,0.000000 +PyTorch,ge,ge_N8_dtypetorch.qint32_contigFalse_other_scalarTrue_out_variantTrue,short,False,29.143988,0.000000 +PyTorch,ge,ge_N8_dtypetorch.qint32_contigTrue_other_scalarFalse_out_variantFalse,short,False,6.898638,0.000000 +PyTorch,ge,ge_N8_dtypetorch.qint32_contigTrue_other_scalarFalse_out_variantTrue,short,False,18.271767,0.000000 +PyTorch,ge,ge_N8_dtypetorch.qint32_contigTrue_other_scalarTrue_out_variantFalse,short,False,10.997651,0.000000 +PyTorch,ge,ge_N8_dtypetorch.qint32_contigTrue_other_scalarTrue_out_variantTrue,short,False,23.476497,0.000000 +PyTorch,ge,ge_N64_dtypetorch.quint8_contigFalse_other_scalarFalse_out_variantFalse,short,False,16.836825,0.000000 +PyTorch,ge,ge_N64_dtypetorch.quint8_contigFalse_other_scalarFalse_out_variantTrue,short,False,32.890492,0.000000 +PyTorch,ge,ge_N64_dtypetorch.quint8_contigFalse_other_scalarTrue_out_variantFalse,short,False,20.590077,0.000000 +PyTorch,ge,ge_N64_dtypetorch.quint8_contigFalse_other_scalarTrue_out_variantTrue,short,False,36.788412,0.000000 +PyTorch,ge,ge_N64_dtypetorch.quint8_contigTrue_other_scalarFalse_out_variantFalse,short,False,9.996323,0.000000 +PyTorch,ge,ge_N64_dtypetorch.quint8_contigTrue_other_scalarFalse_out_variantTrue,short,False,24.700884,0.000000 +PyTorch,ge,ge_N64_dtypetorch.quint8_contigTrue_other_scalarTrue_out_variantFalse,short,False,16.088683,0.000000 +PyTorch,ge,ge_N64_dtypetorch.quint8_contigTrue_other_scalarTrue_out_variantTrue,short,False,28.550079,0.000000 
+PyTorch,ge,ge_N64_dtypetorch.qint8_contigFalse_other_scalarFalse_out_variantFalse,short,False,18.296114,0.000000 +PyTorch,ge,ge_N64_dtypetorch.qint8_contigFalse_other_scalarFalse_out_variantTrue,short,False,34.263955,0.000000 +PyTorch,ge,ge_N64_dtypetorch.qint8_contigFalse_other_scalarTrue_out_variantFalse,short,False,21.947267,0.000000 +PyTorch,ge,ge_N64_dtypetorch.qint8_contigFalse_other_scalarTrue_out_variantTrue,short,False,38.622379,0.000000 +PyTorch,ge,ge_N64_dtypetorch.qint8_contigTrue_other_scalarFalse_out_variantFalse,short,False,10.075395,0.000000 +PyTorch,ge,ge_N64_dtypetorch.qint8_contigTrue_other_scalarFalse_out_variantTrue,short,False,24.391116,0.000000 +PyTorch,ge,ge_N64_dtypetorch.qint8_contigTrue_other_scalarTrue_out_variantFalse,short,False,15.990073,0.000000 +PyTorch,ge,ge_N64_dtypetorch.qint8_contigTrue_other_scalarTrue_out_variantTrue,short,False,28.557654,0.000000 +PyTorch,ge,ge_N64_dtypetorch.qint32_contigFalse_other_scalarFalse_out_variantFalse,short,False,28.126564,0.000000 +PyTorch,ge,ge_N64_dtypetorch.qint32_contigFalse_other_scalarFalse_out_variantTrue,short,False,43.531679,0.000000 +PyTorch,ge,ge_N64_dtypetorch.qint32_contigFalse_other_scalarTrue_out_variantFalse,short,False,26.983753,0.000000 +PyTorch,ge,ge_N64_dtypetorch.qint32_contigFalse_other_scalarTrue_out_variantTrue,short,False,43.014786,0.000000 +PyTorch,ge,ge_N64_dtypetorch.qint32_contigTrue_other_scalarFalse_out_variantFalse,short,False,21.464556,0.000000 +PyTorch,ge,ge_N64_dtypetorch.qint32_contigTrue_other_scalarFalse_out_variantTrue,short,False,34.336164,0.000000 +PyTorch,ge,ge_N64_dtypetorch.qint32_contigTrue_other_scalarTrue_out_variantFalse,short,False,20.083832,0.000000 +PyTorch,ge,ge_N64_dtypetorch.qint32_contigTrue_other_scalarTrue_out_variantTrue,short,False,33.717209,0.000000 +PyTorch,QConv1d,QConv1d_IC128_OC256_kernel3_stride1_N1_L64_cpu,short,False,2474.554141,0.000000 
+PyTorch,QConv1d,QConv1d_IC256_OC256_kernel3_stride2_N4_L64_cpu,short,False,10019.689350,0.000000 +PyTorch,QConv2d,QConv2d_IC256_OC256_kernel3_stride1_N1_H16_W16_G1_pad0_cpu,short,False,2819.508730,0.000000 +PyTorch,qembeddingbag_byte_prepack,qembeddingbag_byte_prepack_num_embeddings80_embedding_dim128,short,False,18.134076,0.000000 +PyTorch,qembeddingbag_byte_prepack,qembeddingbag_byte_prepack_num_embeddings80_embedding_dim256,short,False,34.939813,0.000000 +PyTorch,qembeddingbag_byte_prepack,qembeddingbag_byte_prepack_num_embeddings80_embedding_dim512,short,False,65.717219,0.000000 +PyTorch,qembeddingbag_4bit_prepack,qembeddingbag_4bit_prepack_num_embeddings80_embedding_dim128,short,False,36.029054,0.000000 +PyTorch,qembeddingbag_4bit_prepack,qembeddingbag_4bit_prepack_num_embeddings80_embedding_dim256,short,False,66.511117,0.000000 +PyTorch,qembeddingbag_4bit_prepack,qembeddingbag_4bit_prepack_num_embeddings80_embedding_dim512,short,False,128.594099,0.000000 +PyTorch,qembeddingbag_2bit_prepack,qembeddingbag_2bit_prepack_num_embeddings80_embedding_dim128,short,False,35.738603,0.000000 +PyTorch,qembeddingbag_2bit_prepack,qembeddingbag_2bit_prepack_num_embeddings80_embedding_dim256,short,False,67.034801,0.000000 +PyTorch,qembeddingbag_2bit_prepack,qembeddingbag_2bit_prepack_num_embeddings80_embedding_dim512,short,False,129.472195,0.000000 +PyTorch,qembeddingbag_byte_unpack,qembeddingbag_byte_unpack_num_embeddings80_embedding_dim128,short,False,6.597953,0.000000 +PyTorch,qembeddingbag_byte_unpack,qembeddingbag_byte_unpack_num_embeddings80_embedding_dim256,short,False,9.279742,0.000000 +PyTorch,qembeddingbag_byte_unpack,qembeddingbag_byte_unpack_num_embeddings80_embedding_dim512,short,False,12.878452,0.000000 +PyTorch,qembeddingbag_4bit_unpack,qembeddingbag_4bit_unpack_num_embeddings80_embedding_dim128,short,False,57.690957,0.000000 +PyTorch,qembeddingbag_4bit_unpack,qembeddingbag_4bit_unpack_num_embeddings80_embedding_dim256,short,False,109.143374,0.000000 
+PyTorch,qembeddingbag_4bit_unpack,qembeddingbag_4bit_unpack_num_embeddings80_embedding_dim512,short,False,211.718602,0.000000 +PyTorch,qembeddingbag_2bit_unpack,qembeddingbag_2bit_unpack_num_embeddings80_embedding_dim128,short,False,110.866952,0.000000 +PyTorch,qembeddingbag_2bit_unpack,qembeddingbag_2bit_unpack_num_embeddings80_embedding_dim256,short,False,213.131957,0.000000 +PyTorch,qembeddingbag_2bit_unpack,qembeddingbag_2bit_unpack_num_embeddings80_embedding_dim512,short,False,418.880093,0.000000 +PyTorch,qembeddingbag_byte_prepack,qembeddingbag_byte_prepack_num_embeddings80_embedding_dim128_batch_size10,short,False,206.945818,0.000000 +PyTorch,qembeddingbag_byte_prepack,qembeddingbag_byte_prepack_num_embeddings80_embedding_dim256_batch_size10,short,False,363.442792,0.000000 +PyTorch,qembeddingbag_byte_prepack,qembeddingbag_byte_prepack_num_embeddings80_embedding_dim512_batch_size10,short,False,666.987745,0.000000 +PyTorch,qembeddingbag_4bit_prepack,qembeddingbag_4bit_prepack_num_embeddings80_embedding_dim128_batch_size10,short,False,6.759820,0.000000 +PyTorch,qembeddingbag_4bit_prepack,qembeddingbag_4bit_prepack_num_embeddings80_embedding_dim256_batch_size10,short,False,6.655541,0.000000 +PyTorch,qembeddingbag_4bit_prepack,qembeddingbag_4bit_prepack_num_embeddings80_embedding_dim512_batch_size10,short,False,6.737512,0.000000 +PyTorch,qembeddingbag_2bit_prepack,qembeddingbag_2bit_prepack_num_embeddings80_embedding_dim128_batch_size10,short,False,6.743112,0.000000 +PyTorch,qembeddingbag_2bit_prepack,qembeddingbag_2bit_prepack_num_embeddings80_embedding_dim256_batch_size10,short,False,6.652576,0.000000 +PyTorch,qembeddingbag_2bit_prepack,qembeddingbag_2bit_prepack_num_embeddings80_embedding_dim512_batch_size10,short,False,6.841990,0.000000 +PyTorch,qembeddingbag_byte_unpack,qembeddingbag_byte_unpack_num_embeddings80_embedding_dim128_batch_size10,short,False,23.021744,0.000000 
+PyTorch,qembeddingbag_byte_unpack,qembeddingbag_byte_unpack_num_embeddings80_embedding_dim256_batch_size10,short,False,38.487234,0.000000 +PyTorch,qembeddingbag_byte_unpack,qembeddingbag_byte_unpack_num_embeddings80_embedding_dim512_batch_size10,short,False,71.024263,0.000000 +PyTorch,qembeddingbag_4bit_unpack,qembeddingbag_4bit_unpack_num_embeddings80_embedding_dim128_batch_size10,short,False,8.177698,0.000000 +PyTorch,qembeddingbag_4bit_unpack,qembeddingbag_4bit_unpack_num_embeddings80_embedding_dim256_batch_size10,short,False,8.039202,0.000000 +PyTorch,qembeddingbag_4bit_unpack,qembeddingbag_4bit_unpack_num_embeddings80_embedding_dim512_batch_size10,short,False,8.332832,0.000000 +PyTorch,qembeddingbag_2bit_unpack,qembeddingbag_2bit_unpack_num_embeddings80_embedding_dim128_batch_size10,short,False,11.874304,0.000000 +PyTorch,qembeddingbag_2bit_unpack,qembeddingbag_2bit_unpack_num_embeddings80_embedding_dim256_batch_size10,short,False,11.875088,0.000000 +PyTorch,qembeddingbag_2bit_unpack,qembeddingbag_2bit_unpack_num_embeddings80_embedding_dim512_batch_size10,short,False,11.973970,0.000000 +PyTorch,qEmbeddingBag,qEmbeddingBag_embeddingbags10_dim64_modesum_input_size8_offset0_sparseTrue_include_last_offsetTrue_cpu,short,False,37.749198,0.000000 +PyTorch,qEmbeddingBag,qEmbeddingBag_embeddingbags10_dim64_modesum_input_size8_offset0_sparseTrue_include_last_offsetFalse_cpu,short,False,37.918866,0.000000 +PyTorch,qEmbeddingBag,qEmbeddingBag_embeddingbags10_dim64_modesum_input_size8_offset0_sparseFalse_include_last_offsetTrue_cpu,short,False,37.601117,0.000000 +PyTorch,qEmbeddingBag,qEmbeddingBag_embeddingbags10_dim64_modesum_input_size8_offset0_sparseFalse_include_last_offsetFalse_cpu,short,False,37.524010,0.000000 +PyTorch,qEmbeddingBag,qEmbeddingBag_embeddingbags10_dim64_modesum_input_size16_offset0_sparseTrue_include_last_offsetTrue_cpu,short,False,37.579205,0.000000 
+PyTorch,qEmbeddingBag,qEmbeddingBag_embeddingbags10_dim64_modesum_input_size16_offset0_sparseTrue_include_last_offsetFalse_cpu,short,False,37.955366,0.000000 +PyTorch,qEmbeddingBag,qEmbeddingBag_embeddingbags10_dim64_modesum_input_size16_offset0_sparseFalse_include_last_offsetTrue_cpu,short,False,37.884045,0.000000 +PyTorch,qEmbeddingBag,qEmbeddingBag_embeddingbags10_dim64_modesum_input_size16_offset0_sparseFalse_include_last_offsetFalse_cpu,short,False,38.208370,0.000000 +PyTorch,qEmbeddingBag,qEmbeddingBag_embeddingbags10_dim64_modesum_input_size64_offset0_sparseTrue_include_last_offsetTrue_cpu,short,False,38.443378,0.000000 +PyTorch,qEmbeddingBag,qEmbeddingBag_embeddingbags10_dim64_modesum_input_size64_offset0_sparseTrue_include_last_offsetFalse_cpu,short,False,38.740487,0.000000 +PyTorch,qEmbeddingBag,qEmbeddingBag_embeddingbags10_dim64_modesum_input_size64_offset0_sparseFalse_include_last_offsetTrue_cpu,short,False,38.368374,0.000000 +PyTorch,qEmbeddingBag,qEmbeddingBag_embeddingbags10_dim64_modesum_input_size64_offset0_sparseFalse_include_last_offsetFalse_cpu,short,False,38.422703,0.000000 +PyTorch,qEmbeddingBag,qEmbeddingBag_embeddingbags120_dim64_modesum_input_size8_offset0_sparseTrue_include_last_offsetTrue_cpu,short,False,37.686129,0.000000 +PyTorch,qEmbeddingBag,qEmbeddingBag_embeddingbags120_dim64_modesum_input_size8_offset0_sparseTrue_include_last_offsetFalse_cpu,short,False,37.801677,0.000000 +PyTorch,qEmbeddingBag,qEmbeddingBag_embeddingbags120_dim64_modesum_input_size8_offset0_sparseFalse_include_last_offsetTrue_cpu,short,False,37.489407,0.000000 +PyTorch,qEmbeddingBag,qEmbeddingBag_embeddingbags120_dim64_modesum_input_size8_offset0_sparseFalse_include_last_offsetFalse_cpu,short,False,37.679521,0.000000 +PyTorch,qEmbeddingBag,qEmbeddingBag_embeddingbags120_dim64_modesum_input_size16_offset0_sparseTrue_include_last_offsetTrue_cpu,short,False,37.752840,0.000000 
+PyTorch,qEmbeddingBag,qEmbeddingBag_embeddingbags120_dim64_modesum_input_size16_offset0_sparseTrue_include_last_offsetFalse_cpu,short,False,37.905238,0.000000 +PyTorch,qEmbeddingBag,qEmbeddingBag_embeddingbags120_dim64_modesum_input_size16_offset0_sparseFalse_include_last_offsetTrue_cpu,short,False,37.819355,0.000000 +PyTorch,qEmbeddingBag,qEmbeddingBag_embeddingbags120_dim64_modesum_input_size16_offset0_sparseFalse_include_last_offsetFalse_cpu,short,False,38.130109,0.000000 +PyTorch,qEmbeddingBag,qEmbeddingBag_embeddingbags120_dim64_modesum_input_size64_offset0_sparseTrue_include_last_offsetTrue_cpu,short,False,38.408468,0.000000 +PyTorch,qEmbeddingBag,qEmbeddingBag_embeddingbags120_dim64_modesum_input_size64_offset0_sparseTrue_include_last_offsetFalse_cpu,short,False,38.747029,0.000000 +PyTorch,qEmbeddingBag,qEmbeddingBag_embeddingbags120_dim64_modesum_input_size64_offset0_sparseFalse_include_last_offsetTrue_cpu,short,False,38.404787,0.000000 +PyTorch,qEmbeddingBag,qEmbeddingBag_embeddingbags120_dim64_modesum_input_size64_offset0_sparseFalse_include_last_offsetFalse_cpu,short,False,38.502984,0.000000 +PyTorch,qEmbeddingBag,qEmbeddingBag_embeddingbags1000_dim64_modesum_input_size8_offset0_sparseTrue_include_last_offsetTrue_cpu,short,False,37.756773,0.000000 +PyTorch,qEmbeddingBag,qEmbeddingBag_embeddingbags1000_dim64_modesum_input_size8_offset0_sparseTrue_include_last_offsetFalse_cpu,short,False,37.893388,0.000000 +PyTorch,qEmbeddingBag,qEmbeddingBag_embeddingbags1000_dim64_modesum_input_size8_offset0_sparseFalse_include_last_offsetTrue_cpu,short,False,37.831078,0.000000 +PyTorch,qEmbeddingBag,qEmbeddingBag_embeddingbags1000_dim64_modesum_input_size8_offset0_sparseFalse_include_last_offsetFalse_cpu,short,False,37.867489,0.000000 +PyTorch,qEmbeddingBag,qEmbeddingBag_embeddingbags1000_dim64_modesum_input_size16_offset0_sparseTrue_include_last_offsetTrue_cpu,short,False,37.857305,0.000000 
+PyTorch,qEmbeddingBag,qEmbeddingBag_embeddingbags1000_dim64_modesum_input_size16_offset0_sparseTrue_include_last_offsetFalse_cpu,short,False,37.989236,0.000000 +PyTorch,qEmbeddingBag,qEmbeddingBag_embeddingbags1000_dim64_modesum_input_size16_offset0_sparseFalse_include_last_offsetTrue_cpu,short,False,37.809535,0.000000 +PyTorch,qEmbeddingBag,qEmbeddingBag_embeddingbags1000_dim64_modesum_input_size16_offset0_sparseFalse_include_last_offsetFalse_cpu,short,False,37.960946,0.000000 +PyTorch,qEmbeddingBag,qEmbeddingBag_embeddingbags1000_dim64_modesum_input_size64_offset0_sparseTrue_include_last_offsetTrue_cpu,short,False,38.544690,0.000000 +PyTorch,qEmbeddingBag,qEmbeddingBag_embeddingbags1000_dim64_modesum_input_size64_offset0_sparseTrue_include_last_offsetFalse_cpu,short,False,38.844939,0.000000 +PyTorch,qEmbeddingBag,qEmbeddingBag_embeddingbags1000_dim64_modesum_input_size64_offset0_sparseFalse_include_last_offsetTrue_cpu,short,False,38.371755,0.000000 +PyTorch,qEmbeddingBag,qEmbeddingBag_embeddingbags1000_dim64_modesum_input_size64_offset0_sparseFalse_include_last_offsetFalse_cpu,short,False,39.108865,0.000000 +PyTorch,qEmbeddingBag,qEmbeddingBag_embeddingbags2300_dim64_modesum_input_size8_offset0_sparseTrue_include_last_offsetTrue_cpu,short,False,37.655707,0.000000 +PyTorch,qEmbeddingBag,qEmbeddingBag_embeddingbags2300_dim64_modesum_input_size8_offset0_sparseTrue_include_last_offsetFalse_cpu,short,False,37.948385,0.000000 +PyTorch,qEmbeddingBag,qEmbeddingBag_embeddingbags2300_dim64_modesum_input_size8_offset0_sparseFalse_include_last_offsetTrue_cpu,short,False,37.677788,0.000000 +PyTorch,qEmbeddingBag,qEmbeddingBag_embeddingbags2300_dim64_modesum_input_size8_offset0_sparseFalse_include_last_offsetFalse_cpu,short,False,38.097931,0.000000 +PyTorch,qEmbeddingBag,qEmbeddingBag_embeddingbags2300_dim64_modesum_input_size16_offset0_sparseTrue_include_last_offsetTrue_cpu,short,False,37.906198,0.000000 
+PyTorch,qEmbeddingBag,qEmbeddingBag_embeddingbags2300_dim64_modesum_input_size16_offset0_sparseTrue_include_last_offsetFalse_cpu,short,False,38.246369,0.000000 +PyTorch,qEmbeddingBag,qEmbeddingBag_embeddingbags2300_dim64_modesum_input_size16_offset0_sparseFalse_include_last_offsetTrue_cpu,short,False,37.859952,0.000000 +PyTorch,qEmbeddingBag,qEmbeddingBag_embeddingbags2300_dim64_modesum_input_size16_offset0_sparseFalse_include_last_offsetFalse_cpu,short,False,38.499342,0.000000 +PyTorch,qEmbeddingBag,qEmbeddingBag_embeddingbags2300_dim64_modesum_input_size64_offset0_sparseTrue_include_last_offsetTrue_cpu,short,False,38.788211,0.000000 +PyTorch,qEmbeddingBag,qEmbeddingBag_embeddingbags2300_dim64_modesum_input_size64_offset0_sparseTrue_include_last_offsetFalse_cpu,short,False,38.998297,0.000000 +PyTorch,qEmbeddingBag,qEmbeddingBag_embeddingbags2300_dim64_modesum_input_size64_offset0_sparseFalse_include_last_offsetTrue_cpu,short,False,38.683481,0.000000 +PyTorch,qEmbeddingBag,qEmbeddingBag_embeddingbags2300_dim64_modesum_input_size64_offset0_sparseFalse_include_last_offsetFalse_cpu,short,False,38.536436,0.000000 +PyTorch,QGroupNormBenchmark,"QGroupNormBenchmark_dims(32,8,16)_num_groups2_dtypetorch.qint8",short,False,58.164334,0.000000 +PyTorch,QGroupNormBenchmark,"QGroupNormBenchmark_dims(32,8,16)_num_groups4_dtypetorch.qint8",short,False,57.796211,0.000000 +PyTorch,QGroupNormBenchmark,"QGroupNormBenchmark_dims(32,8,56,56)_num_groups2_dtypetorch.qint8",short,False,1148.216412,0.000000 +PyTorch,QGroupNormBenchmark,"QGroupNormBenchmark_dims(32,8,56,56)_num_groups4_dtypetorch.qint8",short,False,1148.804126,0.000000 +PyTorch,QInstanceNormBenchmark,"QInstanceNormBenchmark_dims(32,8,16)_dtypetorch.qint8",short,False,57.575234,0.000000 +PyTorch,QInstanceNormBenchmark,"QInstanceNormBenchmark_dims(32,8,56,56)_dtypetorch.qint8",short,False,1147.707670,0.000000 
+PyTorch,q_interpolate,q_interpolate_M32_N32_K32_dtypetorch.quint8_modenearest_scale0.5_contigTrue,short,False,7.150264,0.000000 +PyTorch,q_interpolate,q_interpolate_M32_N32_K32_dtypetorch.quint8_modebilinear_scale0.5_contigTrue,short,False,9.218789,0.000000 +PyTorch,q_interpolate,q_interpolate_M32_N32_K32_dtypetorch.quint8_modenearest_scale2.0_contigTrue,short,False,7.490512,0.000000 +PyTorch,q_interpolate,q_interpolate_M32_N32_K32_dtypetorch.quint8_modebilinear_scale2.0_contigTrue,short,False,9.314491,0.000000 +PyTorch,q_interpolate,q_interpolate_M3_N720_K1280_dtypetorch.quint8_modebilinear_scale0.83333_contigTrue,short,False,66.910531,0.000000 +PyTorch,QLayerNormBenchmark,"QLayerNormBenchmark_dims(1,8,16)_dtypetorch.qint8",short,False,15.853110,0.000000 +PyTorch,QLayerNormBenchmark,"QLayerNormBenchmark_dims(8,8,16)_dtypetorch.qint8",short,False,62.647792,0.000000 +PyTorch,QLayerNormBenchmark,"QLayerNormBenchmark_dims(32,8,16)_dtypetorch.qint8",short,False,66.094037,0.000000 +PyTorch,QLayerNormBenchmark,"QLayerNormBenchmark_dims(64,128,56,56)_dtypetorch.qint8",short,False,51655.592280,0.000000 +PyTorch,QLinear,QLinear_N1_IN1_OUT1_cpu,short,False,48.466068,0.000000 +PyTorch,QLinear,QLinear_N4_IN256_OUT128_cpu,short,False,97.047966,0.000000 +PyTorch,QLinear,QLinear_N16_IN512_OUT256_cpu,short,False,92.013699,0.000000 +PyTorch,QDynamicLinear,QDynamicLinear_N1_IN1_OUT1_cpu,short,False,55.162945,0.000000 +PyTorch,QDynamicLinear,QDynamicLinear_N4_IN256_OUT128_cpu,short,False,181.460491,0.000000 +PyTorch,QDynamicLinear,QDynamicLinear_N16_IN512_OUT256_cpu,short,False,186.868091,0.000000 +PyTorch,MinMaxObserver,MinMaxObserver_C3_M512_N512_dtypetorch.quint8_cpu_qschemetorch.per_tensor_affine,short,False,178.683642,0.000000 +PyTorch,MinMaxObserver,MinMaxObserver_C3_M512_N512_dtypetorch.quint8_cpu_qschemetorch.per_tensor_symmetric,short,False,165.985880,0.000000 
+PyTorch,MovingAverageMinMaxObserver,MovingAverageMinMaxObserver_C3_M512_N512_dtypetorch.quint8_cpu_qschemetorch.per_tensor_affine,short,False,209.793412,0.000000 +PyTorch,MovingAverageMinMaxObserver,MovingAverageMinMaxObserver_C3_M512_N512_dtypetorch.quint8_cpu_qschemetorch.per_tensor_symmetric,short,False,199.116115,0.000000 +PyTorch,PerChannelMinMaxObserver,PerChannelMinMaxObserver_C3_M512_N512_dtypetorch.quint8_cpu_qschemetorch.per_channel_affine,short,False,383.567212,0.000000 +PyTorch,PerChannelMinMaxObserver,PerChannelMinMaxObserver_C3_M512_N512_dtypetorch.quint8_cpu_qschemetorch.per_channel_symmetric,short,False,386.658467,0.000000 +PyTorch,MovingAveragePerChannelMinMaxObserver,MovingAveragePerChannelMinMaxObserver_C3_M512_N512_dtypetorch.quint8_cpu_qschemetorch.per_channel_affine,short,False,406.231582,0.000000 +PyTorch,MovingAveragePerChannelMinMaxObserver,MovingAveragePerChannelMinMaxObserver_C3_M512_N512_dtypetorch.quint8_cpu_qschemetorch.per_channel_symmetric,short,False,424.846136,0.000000 +PyTorch,HistogramObserver,HistogramObserver_C3_M512_N512_dtypetorch.quint8_cpu_qschemetorch.per_tensor_affine,short,False,1852.950257,0.000000 +PyTorch,HistogramObserver,HistogramObserver_C3_M512_N512_dtypetorch.quint8_cpu_qschemetorch.per_tensor_symmetric,short,False,1886.575278,0.000000 +PyTorch,HistogramObserverCalculateQparams,HistogramObserverCalculateQparams_C3_M512_N512_dtypetorch.quint8_cpu_qschemetorch.per_tensor_affine,short,False,1916.034661,0.000000 +PyTorch,HistogramObserverCalculateQparams,HistogramObserverCalculateQparams_C3_M512_N512_dtypetorch.quint8_cpu_qschemetorch.per_tensor_symmetric,short,False,1848.436297,0.000000 +PyTorch,QAdaptiveAvgPool2dBenchmark,"QAdaptiveAvgPool2dBenchmark_N4_C3_input_size(224,224)_output_size(112,112)_contigTrue_dtypetorch.qint32",short,False,125.012330,0.000000 
+PyTorch,QAdaptiveAvgPool2dBenchmark,"QAdaptiveAvgPool2dBenchmark_N4_C3_input_size(224,224)_output_size(112,112)_contigTrue_dtypetorch.qint8",short,False,120.338743,0.000000 +PyTorch,QAdaptiveAvgPool2dBenchmark,"QAdaptiveAvgPool2dBenchmark_N4_C3_input_size(224,224)_output_size(112,112)_contigTrue_dtypetorch.quint8",short,False,120.237932,0.000000 +PyTorch,QAvgPool2dBenchmark,"QAvgPool2dBenchmark_C1_H3_W3_k(3,3)_s(1,1)_p(0,0)_N2_contigTrue_dtypetorch.qint32",short,False,58.290125,0.000000 +PyTorch,QAvgPool2dBenchmark,"QAvgPool2dBenchmark_C1_H3_W3_k(3,3)_s(1,1)_p(0,0)_N2_contigTrue_dtypetorch.qint8",short,False,56.845484,0.000000 +PyTorch,QAvgPool2dBenchmark,"QAvgPool2dBenchmark_C1_H3_W3_k(3,3)_s(1,1)_p(0,0)_N2_contigTrue_dtypetorch.quint8",short,False,57.068030,0.000000 +PyTorch,QMaxPool2dBenchmark,"QMaxPool2dBenchmark_C1_H3_W3_k(3,3)_s(1,1)_p(0,0)_N2_contigTrue_dtypetorch.qint32",short,False,62.013425,0.000000 +PyTorch,QMaxPool2dBenchmark,"QMaxPool2dBenchmark_C1_H3_W3_k(3,3)_s(1,1)_p(0,0)_N2_contigTrue_dtypetorch.qint8",short,False,61.332599,0.000000 +PyTorch,QMaxPool2dBenchmark,"QMaxPool2dBenchmark_C1_H3_W3_k(3,3)_s(1,1)_p(0,0)_N2_contigTrue_dtypetorch.quint8",short,False,60.981402,0.000000 +PyTorch,QLSTM,QLSTM_I1_H3_NL1_BTrue_DFalse_dtypetorch.qint8,short,False,20708.077910,0.000000 +PyTorch,QLSTM,QLSTM_I1_H3_NL1_BTrue_DTrue_dtypetorch.qint8,short,False,41009.405290,0.000000 +PyTorch,QLSTM,QLSTM_I5_H7_NL4_BTrue_DFalse_dtypetorch.qint8,short,False,81385.994580,0.000000 +PyTorch,QLSTM,QLSTM_I5_H7_NL4_BTrue_DTrue_dtypetorch.qint8,short,False,162347.641390,0.000000 +PyTorch,QMethodTensorInputCopyBenchmark,QMethodTensorInputCopyBenchmark_M32_N32_dtypetorch.quint8_contigFalse,short,False,0.884224,0.000000 +PyTorch,QMethodTensorInputCopyBenchmark,QMethodTensorInputCopyBenchmark_M32_N32_dtypetorch.quint8_contigTrue,short,False,0.881290,0.000000 +PyTorch,QuantizePerTensor,QuantizePerTensor_C3_M512_N512_dtypetorch.quint8_modeQ,short,False,139.818657,0.000000 
+PyTorch,DequantizePerTensor,DequantizePerTensor_C3_M512_N512_dtypetorch.quint8_modeD,short,False,111.856445,0.000000 +PyTorch,QuantizePerChannel,QuantizePerChannel_C3_M512_N512_dtypetorch.quint8_modeQ_axis0,short,False,137.870248,0.000000 +PyTorch,DequantizePerChannel,DequantizePerChannel_C3_M512_N512_dtypetorch.quint8_modeD_axis0,short,False,295.384286,0.000000 +PyTorch,FakeQuantize,FakeQuantize_N1_C3_H512_W512_zero_point_dtypetorch.int32_cpu,short,False,498.468140,0.000000 +PyTorch,learnable_kernel_tensor,learnable_kernel_tensor_N1_C3_H512_W512_zero_point_dtypetorch.int32_nbits4_cpu,short,False,212.106189,0.000000 +PyTorch,learnable_kernel_tensor,learnable_kernel_tensor_N1_C3_H512_W512_zero_point_dtypetorch.int32_nbits8_cpu,short,False,212.103393,0.000000 +PyTorch,original_kernel_tensor,original_kernel_tensor_N1_C3_H512_W512_zero_point_dtypetorch.int32_nbits4_cpu,short,False,210.769552,0.000000 +PyTorch,original_kernel_tensor,original_kernel_tensor_N1_C3_H512_W512_zero_point_dtypetorch.int32_nbits8_cpu,short,False,210.336579,0.000000 +PyTorch,learnable_kernel_tensor,learnable_kernel_tensor_N1_C3_H512_W512_zero_point_dtypetorch.int32_nbits4_cpu_bwdall_BACKWARD,short,True,645.670738,0.000000 +PyTorch,learnable_kernel_tensor,learnable_kernel_tensor_N1_C3_H512_W512_zero_point_dtypetorch.int32_nbits4_cpu_bwd1_BACKWARD,short,True,646.979930,0.000000 +PyTorch,learnable_kernel_tensor,learnable_kernel_tensor_N1_C3_H512_W512_zero_point_dtypetorch.int32_nbits4_cpu_bwd2_BACKWARD,short,True,648.774775,0.000000 +PyTorch,learnable_kernel_tensor,learnable_kernel_tensor_N1_C3_H512_W512_zero_point_dtypetorch.int32_nbits4_cpu_bwd3_BACKWARD,short,True,647.536140,0.000000 +PyTorch,learnable_kernel_tensor,learnable_kernel_tensor_N1_C3_H512_W512_zero_point_dtypetorch.int32_nbits8_cpu_bwdall_BACKWARD,short,True,645.420480,0.000000 +PyTorch,learnable_kernel_tensor,learnable_kernel_tensor_N1_C3_H512_W512_zero_point_dtypetorch.int32_nbits8_cpu_bwd1_BACKWARD,short,True,647.989360,0.000000 
+PyTorch,learnable_kernel_tensor,learnable_kernel_tensor_N1_C3_H512_W512_zero_point_dtypetorch.int32_nbits8_cpu_bwd2_BACKWARD,short,True,648.279117,0.000000 +PyTorch,learnable_kernel_tensor,learnable_kernel_tensor_N1_C3_H512_W512_zero_point_dtypetorch.int32_nbits8_cpu_bwd3_BACKWARD,short,True,648.012305,0.000000 +PyTorch,original_kernel_tensor,original_kernel_tensor_N1_C3_H512_W512_zero_point_dtypetorch.int32_nbits4_cpu_bwdall_BACKWARD,short,True,396.607204,0.000000 +PyTorch,original_kernel_tensor,original_kernel_tensor_N1_C3_H512_W512_zero_point_dtypetorch.int32_nbits4_cpu_bwd1_BACKWARD,short,True,396.439610,0.000000 +PyTorch,original_kernel_tensor,original_kernel_tensor_N1_C3_H512_W512_zero_point_dtypetorch.int32_nbits4_cpu_bwd2_BACKWARD,short,True,398.157875,0.000000 +PyTorch,original_kernel_tensor,original_kernel_tensor_N1_C3_H512_W512_zero_point_dtypetorch.int32_nbits4_cpu_bwd3_BACKWARD,short,True,393.582596,0.000000 +PyTorch,original_kernel_tensor,original_kernel_tensor_N1_C3_H512_W512_zero_point_dtypetorch.int32_nbits8_cpu_bwdall_BACKWARD,short,True,394.932475,0.000000 +PyTorch,original_kernel_tensor,original_kernel_tensor_N1_C3_H512_W512_zero_point_dtypetorch.int32_nbits8_cpu_bwd1_BACKWARD,short,True,398.150060,0.000000 +PyTorch,original_kernel_tensor,original_kernel_tensor_N1_C3_H512_W512_zero_point_dtypetorch.int32_nbits8_cpu_bwd2_BACKWARD,short,True,394.573905,0.000000 +PyTorch,original_kernel_tensor,original_kernel_tensor_N1_C3_H512_W512_zero_point_dtypetorch.int32_nbits8_cpu_bwd3_BACKWARD,short,True,389.742169,0.000000 +PyTorch,learnable_kernel_channel,learnable_kernel_channel_N1_C3_H512_W512_zero_point_dtypetorch.int32_nbits4_cpu,short,False,462.132270,0.000000 +PyTorch,learnable_kernel_channel,learnable_kernel_channel_N1_C3_H512_W512_zero_point_dtypetorch.int32_nbits8_cpu,short,False,460.794395,0.000000 +PyTorch,original_kernel_channel,original_kernel_channel_N1_C3_H512_W512_zero_point_dtypetorch.int32_nbits4_cpu,short,False,454.659963,0.000000 
+PyTorch,original_kernel_channel,original_kernel_channel_N1_C3_H512_W512_zero_point_dtypetorch.int32_nbits8_cpu,short,False,450.819046,0.000000 +PyTorch,learnable_kernel_channel,learnable_kernel_channel_N1_C3_H512_W512_zero_point_dtypetorch.int32_nbits4_cpu_bwdall_BACKWARD,short,True,727.548224,0.000000 +PyTorch,learnable_kernel_channel,learnable_kernel_channel_N1_C3_H512_W512_zero_point_dtypetorch.int32_nbits4_cpu_bwd1_BACKWARD,short,True,732.767646,0.000000 +PyTorch,learnable_kernel_channel,learnable_kernel_channel_N1_C3_H512_W512_zero_point_dtypetorch.int32_nbits4_cpu_bwd2_BACKWARD,short,True,731.549638,0.000000 +PyTorch,learnable_kernel_channel,learnable_kernel_channel_N1_C3_H512_W512_zero_point_dtypetorch.int32_nbits4_cpu_bwd3_BACKWARD,short,True,732.523360,0.000000 +PyTorch,learnable_kernel_channel,learnable_kernel_channel_N1_C3_H512_W512_zero_point_dtypetorch.int32_nbits8_cpu_bwdall_BACKWARD,short,True,734.845672,0.000000 +PyTorch,learnable_kernel_channel,learnable_kernel_channel_N1_C3_H512_W512_zero_point_dtypetorch.int32_nbits8_cpu_bwd1_BACKWARD,short,True,734.484530,0.000000 +PyTorch,learnable_kernel_channel,learnable_kernel_channel_N1_C3_H512_W512_zero_point_dtypetorch.int32_nbits8_cpu_bwd2_BACKWARD,short,True,731.358856,0.000000 +PyTorch,learnable_kernel_channel,learnable_kernel_channel_N1_C3_H512_W512_zero_point_dtypetorch.int32_nbits8_cpu_bwd3_BACKWARD,short,True,732.279545,0.000000 +PyTorch,original_kernel_channel,original_kernel_channel_N1_C3_H512_W512_zero_point_dtypetorch.int32_nbits4_cpu_bwdall_BACKWARD,short,True,392.022089,0.000000 +PyTorch,original_kernel_channel,original_kernel_channel_N1_C3_H512_W512_zero_point_dtypetorch.int32_nbits4_cpu_bwd1_BACKWARD,short,True,396.691596,0.000000 +PyTorch,original_kernel_channel,original_kernel_channel_N1_C3_H512_W512_zero_point_dtypetorch.int32_nbits8_cpu_bwdall_BACKWARD,short,True,395.044202,0.000000 
+PyTorch,original_kernel_channel,original_kernel_channel_N1_C3_H512_W512_zero_point_dtypetorch.int32_nbits8_cpu_bwd1_BACKWARD,short,True,393.618618,0.000000 +PyTorch,q_argsort,q_argsort_M512_N512_dtypetorch.quint8,short,False,498.230444,0.000000 +PyTorch,q_clone,q_clone_M512_N512_dtypetorch.quint8,short,False,54.217228,0.000000 +PyTorch,q_mean,q_mean_M512_N512_dtypetorch.quint8,short,False,98.299090,0.000000 +PyTorch,q_relu,q_relu_M512_N512_dtypetorch.quint8,short,False,50.626535,0.000000 +PyTorch,q_relu_,q_relu__M512_N512_dtypetorch.quint8,short,False,50.900865,0.000000 +PyTorch,q_sort,q_sort_M512_N512_dtypetorch.quint8,short,False,489.762199,0.000000 +PyTorch,qtopk,qtopk_M512_N512_k5_dtypetorch.quint8,short,False,106.761619,0.000000 +PyTorch,abs,abs_M512_N512_cpu,short,False,57.051424,0.000000 +PyTorch,abs_,abs__M512_N512_cpu,short,False,52.200911,0.000000 +PyTorch,acos,acos_M512_N512_cpu,short,False,163.152278,0.000000 +PyTorch,acos_,acos__M512_N512_cpu,short,False,154.986924,0.000000 +PyTorch,argsort,argsort_M512_N512_cpu,short,False,1293.551670,0.000000 +PyTorch,asin,asin_M512_N512_cpu,short,False,143.466299,0.000000 +PyTorch,asin_,asin__M512_N512_cpu,short,False,138.166554,0.000000 +PyTorch,atan,atan_M512_N512_cpu,short,False,183.999280,0.000000 +PyTorch,atan_,atan__M512_N512_cpu,short,False,178.477300,0.000000 +PyTorch,ceil,ceil_M512_N512_cpu,short,False,53.237791,0.000000 +PyTorch,ceil_,ceil__M512_N512_cpu,short,False,51.146127,0.000000 +PyTorch,clamp,clamp_M512_N512_cpu,short,False,57.982160,0.000000 +PyTorch,clone,clone_M512_N512_cpu,short,False,55.928251,0.000000 +PyTorch,cos,cos_M512_N512_cpu,short,False,153.934110,0.000000 +PyTorch,cos_,cos__M512_N512_cpu,short,False,149.205590,0.000000 +PyTorch,cosh,cosh_M512_N512_cpu,short,False,233.610736,0.000000 +PyTorch,digamma,digamma_M512_N512_cpu,short,False,512.670916,0.000000 +PyTorch,erf,erf_M512_N512_cpu,short,False,248.115065,0.000000 +PyTorch,erf_,erf__M512_N512_cpu,short,False,245.928480,0.000000 
+PyTorch,erfc,erfc_M512_N512_cpu,short,False,471.492698,0.000000 +PyTorch,erfc_,erfc__M512_N512_cpu,short,False,466.460295,0.000000 +PyTorch,erfinv,erfinv_M512_N512_cpu,short,False,1359.954587,0.000000 +PyTorch,exp,exp_M512_N512_cpu,short,False,102.685068,0.000000 +PyTorch,exp_,exp__M512_N512_cpu,short,False,98.656667,0.000000 +PyTorch,expm1,expm1_M512_N512_cpu,short,False,224.464036,0.000000 +PyTorch,expm1_,expm1__M512_N512_cpu,short,False,220.063117,0.000000 +PyTorch,floor,floor_M512_N512_cpu,short,False,53.244395,0.000000 +PyTorch,floor_,floor__M512_N512_cpu,short,False,51.672797,0.000000 +PyTorch,frac,frac_M512_N512_cpu,short,False,55.433832,0.000000 +PyTorch,frac_,frac__M512_N512_cpu,short,False,51.270698,0.000000 +PyTorch,gelu,gelu_M512_N512_cpu,short,False,156.736075,0.000000 +PyTorch,hardshrink,hardshrink_M512_N512_cpu,short,False,57.883780,0.000000 +PyTorch,lgamma,lgamma_M512_N512_cpu,short,False,853.460615,0.000000 +PyTorch,log,log_M512_N512_cpu,short,False,154.847541,0.000000 +PyTorch,log10,log10_M512_N512_cpu,short,False,163.334617,0.000000 +PyTorch,log10_,log10__M512_N512_cpu,short,False,157.360735,0.000000 +PyTorch,log1p,log1p_M512_N512_cpu,short,False,163.516254,0.000000 +PyTorch,log1p_,log1p__M512_N512_cpu,short,False,159.639356,0.000000 +PyTorch,log2,log2_M512_N512_cpu,short,False,163.969243,0.000000 +PyTorch,log2_,log2__M512_N512_cpu,short,False,159.835136,0.000000 +PyTorch,log_,log__M512_N512_cpu,short,False,150.952504,0.000000 +PyTorch,logit,logit_M512_N512_cpu,short,False,177.961690,0.000000 +PyTorch,logit_,logit__M512_N512_cpu,short,False,172.351381,0.000000 +PyTorch,neg,neg_M512_N512_cpu,short,False,55.097290,0.000000 +PyTorch,neg_,neg__M512_N512_cpu,short,False,50.983444,0.000000 +PyTorch,reciprocal,reciprocal_M512_N512_cpu,short,False,63.374416,0.000000 +PyTorch,reciprocal_,reciprocal__M512_N512_cpu,short,False,58.360915,0.000000 +PyTorch,relu,relu_M512_N512_cpu,short,False,55.350610,0.000000 
+PyTorch,relu_,relu__M512_N512_cpu,short,False,52.531514,0.000000 +PyTorch,round,round_M512_N512_cpu,short,False,54.882808,0.000000 +PyTorch,round_,round__M512_N512_cpu,short,False,51.705845,0.000000 +PyTorch,rsqrt,rsqrt_M512_N512_cpu,short,False,72.353625,0.000000 +PyTorch,rsqrt_,rsqrt__M512_N512_cpu,short,False,67.110910,0.000000 +PyTorch,sigmoid,sigmoid_M512_N512_cpu,short,False,101.934045,0.000000 +PyTorch,sigmoid_,sigmoid__M512_N512_cpu,short,False,101.207989,0.000000 +PyTorch,sign,sign_M512_N512_cpu,short,False,57.157465,0.000000 +PyTorch,sgn,sgn_M512_N512_cpu,short,False,56.892450,0.000000 +PyTorch,sin,sin_M512_N512_cpu,short,False,129.825713,0.000000 +PyTorch,sin_,sin__M512_N512_cpu,short,False,124.252865,0.000000 +PyTorch,sinh,sinh_M512_N512_cpu,short,False,237.181745,0.000000 +PyTorch,sqrt,sqrt_M512_N512_cpu,short,False,55.643847,0.000000 +PyTorch,sqrt_,sqrt__M512_N512_cpu,short,False,51.970346,0.000000 +PyTorch,square,square_M512_N512_cpu,short,False,56.493474,0.000000 +PyTorch,square_,square__M512_N512_cpu,short,False,53.660946,0.000000 +PyTorch,tan,tan_M512_N512_cpu,short,False,212.381058,0.000000 +PyTorch,tan_,tan__M512_N512_cpu,short,False,209.302840,0.000000 +PyTorch,tanh,tanh_M512_N512_cpu,short,False,254.571910,0.000000 +PyTorch,tanh_,tanh__M512_N512_cpu,short,False,250.419008,0.000000 +PyTorch,trunc,trunc_M512_N512_cpu,short,False,50.202160,0.000000 +PyTorch,trunc_,trunc__M512_N512_cpu,short,False,48.335770,0.000000 +PyTorch,unique,unique_M512_N512_cpu,short,False,18881.017060,0.000000 +PyTorch,zero_,zero__M512_N512_cpu,short,False,48.573353,0.000000 +PyTorch,bernoulli_,bernoulli__M512_N512_cpu,short,False,2761.902873,0.000000 +PyTorch,cauchy_,cauchy__M512_N512_cpu,short,False,6134.592810,0.000000 +PyTorch,digamma_,digamma__M512_N512_cpu,short,False,968.574541,0.000000 +PyTorch,exponential_,exponential__M512_N512_cpu,short,False,4554.747990,0.000000 +PyTorch,normal_,normal__M512_N512_cpu,short,False,1969.108666,0.000000 
+PyTorch,random_,random__M512_N512_cpu,short,False,742.022216,0.000000 +PyTorch,sign_,sign__M512_N512_cpu,short,False,53.070620,0.000000 +PyTorch,uniform_,uniform__M512_N512_cpu,short,False,719.128405,0.000000 +PyTorch,half,half_M512_N512_cpu,short,False,56.301074,0.000000 +PyTorch,long,long_M512_N512_cpu,short,False,69.495610,0.000000 diff --git a/benchmarks/operator_benchmark/pt/conv_test.py b/benchmarks/operator_benchmark/pt/conv_test.py index 93b4942cea2b..65baf47e0d67 100644 --- a/benchmarks/operator_benchmark/pt/conv_test.py +++ b/benchmarks/operator_benchmark/pt/conv_test.py @@ -38,12 +38,16 @@ class ConvTranspose1dBenchmark(op_bench.TorchBenchmarkBase): op_bench.generate_pt_test( configs.conv_1d_configs_short + configs.conv_1d_configs_long, Conv1dBenchmark ) -op_bench.generate_pt_test( - configs.convtranspose_1d_configs_short - + configs.conv_1d_configs_short - + configs.conv_1d_configs_long, - ConvTranspose1dBenchmark, -) + + +if not torch.backends.mkldnn.is_acl_available(): + # convtranspose1d crashes with ACL, see https://github.com/pytorch/pytorch/issues/165654 + op_bench.generate_pt_test( + configs.convtranspose_1d_configs_short + + configs.conv_1d_configs_short + + configs.conv_1d_configs_long, + ConvTranspose1dBenchmark, + ) """