Update slow tests (#145206)

This PR is auto-generated weekly by [this action](https://github.com/pytorch/pytorch/blob/main/.github/workflows/weekly.yml).
Update the list of slow tests.
Pull Request resolved: https://github.com/pytorch/pytorch/pull/145206
Approved by: https://github.com/pytorchbot
This commit is contained in:
PyTorch UpdateBot 2025-01-27 11:40:39 +00:00 committed by PyTorch MergeBot
parent e6c1e6e20e
commit 7b6029dcc2

View File

@ -1,308 +1,308 @@
{
"EndToEndLSTM (__main__.RNNTest)": 219.01666768391928,
"MultiheadAttention (__main__.ModulesTest)": 174.21966552734375,
"test_AllenaiLongformerBase_repro_cpu (__main__.CpuHalideTests)": 216.12166341145834,
"test__adaptive_avg_pool2d (__main__.CPUReproTests)": 164.42666710747613,
"test_adaptive_max_pool2d1_cpu (__main__.CpuHalideTests)": 113.75033569335938,
"test_after_aot_cpu_runtime_error (__main__.MinifierIsolateTests)": 61.27166620890299,
"test_alexnet_prefix_cpu (__main__.CpuHalideTests)": 191.17266845703125,
"test_aot_autograd_exhaustive_nn_functional_max_pool2d_cpu_float32 (__main__.TestEagerFusionOpInfoCPU)": 76.49633280436198,
"test_aot_autograd_symbolic_exhaustive_linalg_svd_cpu_float32 (__main__.TestEagerFusionOpInfoCPU)": 63.89333470662435,
"test_aot_autograd_symbolic_exhaustive_nn_functional_max_pool1d_cpu_float32 (__main__.TestEagerFusionOpInfoCPU)": 93.37866719563802,
"test_aot_autograd_symbolic_exhaustive_nn_functional_max_pool2d_cpu_float32 (__main__.TestEagerFusionOpInfoCPU)": 177.83633677164713,
"test_aot_autograd_symbolic_exhaustive_nn_functional_max_pool3d_cpu_float32 (__main__.TestEagerFusionOpInfoCPU)": 113.58966573079427,
"test_aot_autograd_symbolic_exhaustive_svd_cpu_float32 (__main__.TestEagerFusionOpInfoCPU)": 61.64871397472563,
"test_aot_autograd_symbolic_module_exhaustive_nn_TransformerDecoderLayer_cpu_float32 (__main__.TestEagerFusionModuleInfoCPU)": 119.6356684366862,
"test_avg_pool3d_backward2_cpu (__main__.CpuTests)": 511.6263732910156,
"test_avg_pool3d_backward2_cuda (__main__.GPUTests)": 95.9540008544922,
"test_avg_pool3d_backward2_dynamic_shapes_cpu (__main__.DynamicShapesCodegenCpuTests)": 501.61433580186633,
"test_avg_pool3d_backward2_dynamic_shapes_cpu (__main__.DynamicShapesCpuTests)": 510.3060031467014,
"test_avg_pool3d_backward2_dynamic_shapes_cuda (__main__.DynamicShapesGPUTests)": 129.74549865722656,
"test_avg_pool3d_backward_cpu (__main__.CpuHalideTests)": 62.59933344523112,
"test_backward_nn_functional_multi_head_attention_forward_cpu_float32 (__main__.TestCompositeComplianceCPU)": 80.09766642252605,
"test_backward_nn_functional_multi_head_attention_forward_cuda_float32 (__main__.TestCompositeComplianceCUDA)": 71.14580078125,
"test_basic_cpu (__main__.EfficientConvBNEvalCpuTests)": 314.9518737792969,
"test_basic_cuda (__main__.EfficientConvBNEvalGpuTests)": 192.08616892496744,
"test_builtin_equivalent_funcs (__main__.TorchFunctionModeTests)": 91.91841388570852,
"test_collect_callgrind (__main__.TestBenchmarkUtils)": 359.6031265258789,
"test_comprehensive_constant_pad_nd_cpu_float16 (__main__.TestInductorOpInfoCPU)": 70.37266794840495,
"test_comprehensive_constant_pad_nd_cpu_float32 (__main__.TestInductorOpInfoCPU)": 76.47233327229817,
"test_comprehensive_constant_pad_nd_cpu_float64 (__main__.TestInductorOpInfoCPU)": 68.93833414713542,
"test_comprehensive_constant_pad_nd_cpu_int32 (__main__.TestInductorOpInfoCPU)": 66.1010004679362,
"test_comprehensive_constant_pad_nd_cpu_int64 (__main__.TestInductorOpInfoCPU)": 69.34066772460938,
"test_comprehensive_diff_cpu_bool (__main__.TestInductorOpInfoCPU)": 103.67199961344402,
"test_comprehensive_diff_cpu_float32 (__main__.TestInductorOpInfoCPU)": 103.93333435058594,
"test_comprehensive_diff_cpu_float64 (__main__.TestInductorOpInfoCPU)": 101.26199849446614,
"test_comprehensive_diff_cpu_int32 (__main__.TestInductorOpInfoCPU)": 103.43300120035808,
"test_comprehensive_diff_cpu_int64 (__main__.TestInductorOpInfoCPU)": 102.98933410644531,
"test_comprehensive_diff_cuda_complex128 (__main__.TestDecompCUDA)": 95.76133346557617,
"test_comprehensive_diff_cuda_complex64 (__main__.TestDecompCUDA)": 139.30020141601562,
"test_comprehensive_diff_cuda_float32 (__main__.TestDecompCUDA)": 64.03244484795465,
"test_comprehensive_diff_cuda_float64 (__main__.TestDecompCUDA)": 61.661333084106445,
"test_comprehensive_dist_cpu_float16 (__main__.TestInductorOpInfoCPU)": 92.57433319091797,
"test_comprehensive_dist_cpu_float32 (__main__.TestInductorOpInfoCPU)": 80.80066935221355,
"test_comprehensive_dist_cpu_float64 (__main__.TestInductorOpInfoCPU)": 84.26466623942058,
"test_comprehensive_eye_cpu_bool (__main__.TestInductorOpInfoCPU)": 124.48333231608073,
"test_comprehensive_eye_cpu_float16 (__main__.TestInductorOpInfoCPU)": 127.46799723307292,
"test_comprehensive_eye_cpu_float32 (__main__.TestInductorOpInfoCPU)": 120.62799835205078,
"test_comprehensive_eye_cpu_float64 (__main__.TestInductorOpInfoCPU)": 136.93400065104166,
"test_comprehensive_eye_cpu_int32 (__main__.TestInductorOpInfoCPU)": 129.24666595458984,
"test_comprehensive_eye_cpu_int64 (__main__.TestInductorOpInfoCPU)": 123.21799977620442,
"test_comprehensive_grid_sampler_2d_cpu_bfloat16 (__main__.TestDecompCPU)": 72.43999989827473,
"test_comprehensive_grid_sampler_2d_cpu_float16 (__main__.TestDecompCPU)": 71.22533162434895,
"test_comprehensive_grid_sampler_2d_cpu_float16 (__main__.TestInductorOpInfoCPU)": 84.48433430989583,
"test_comprehensive_grid_sampler_2d_cpu_float32 (__main__.TestDecompCPU)": 328.62400309244794,
"test_comprehensive_grid_sampler_2d_cpu_float32 (__main__.TestInductorOpInfoCPU)": 82.0076675415039,
"test_comprehensive_grid_sampler_2d_cpu_float64 (__main__.TestDecompCPU)": 322.2469991048177,
"test_comprehensive_grid_sampler_2d_cpu_float64 (__main__.TestInductorOpInfoCPU)": 82.78066762288411,
"test_comprehensive_grid_sampler_2d_cuda_bfloat16 (__main__.TestDecompCUDA)": 257.7654978434245,
"test_comprehensive_grid_sampler_2d_cuda_float16 (__main__.TestDecompCUDA)": 290.05539855957034,
"test_comprehensive_grid_sampler_2d_cuda_float32 (__main__.TestDecompCUDA)": 1175.2658386230469,
"test_comprehensive_grid_sampler_2d_cuda_float32 (__main__.TestInductorOpInfoCUDA)": 71.83983357747395,
"test_comprehensive_grid_sampler_2d_cuda_float64 (__main__.TestDecompCUDA)": 988.3565165201823,
"test_comprehensive_grid_sampler_2d_cuda_float64 (__main__.TestInductorOpInfoCUDA)": 79.0331662495931,
"test_comprehensive_linalg_lu_solve_cuda_float32 (__main__.TestInductorOpInfoCUDA)": 82.20579986572265,
"test_comprehensive_linalg_lu_solve_cuda_float64 (__main__.TestInductorOpInfoCUDA)": 76.20133209228516,
"test_comprehensive_linalg_solve_triangular_cuda_float32 (__main__.TestInductorOpInfoCUDA)": 70.49620056152344,
"test_comprehensive_linalg_solve_triangular_cuda_float64 (__main__.TestInductorOpInfoCUDA)": 69.98949940999348,
"test_comprehensive_linalg_svd_cuda_complex128 (__main__.TestDecompCUDA)": 66.22066752115886,
"test_comprehensive_linalg_svd_cuda_complex64 (__main__.TestDecompCUDA)": 62.03222105238173,
"test_comprehensive_linalg_vector_norm_cpu_float16 (__main__.TestInductorOpInfoCPU)": 198.07999674479166,
"test_comprehensive_linalg_vector_norm_cpu_float32 (__main__.TestInductorOpInfoCPU)": 204.8566691080729,
"test_comprehensive_linalg_vector_norm_cpu_float64 (__main__.TestInductorOpInfoCPU)": 197.94000244140625,
"test_comprehensive_linalg_vector_norm_cuda_float32 (__main__.TestInductorOpInfoCUDA)": 72.01380004882813,
"test_comprehensive_linalg_vector_norm_cuda_float64 (__main__.TestInductorOpInfoCUDA)": 70.19919967651367,
"test_comprehensive_logspace_cpu_float32 (__main__.TestInductorOpInfoCPU)": 426.4303283691406,
"test_comprehensive_logspace_cpu_float64 (__main__.TestInductorOpInfoCPU)": 422.5133361816406,
"test_comprehensive_logspace_cpu_int32 (__main__.TestInductorOpInfoCPU)": 410.77333577473956,
"test_comprehensive_logspace_cpu_int64 (__main__.TestInductorOpInfoCPU)": 399.1383361816406,
"test_comprehensive_logspace_cuda_float32 (__main__.TestInductorOpInfoCUDA)": 69.45479888916016,
"test_comprehensive_logspace_cuda_float64 (__main__.TestInductorOpInfoCUDA)": 67.26920013427734,
"test_comprehensive_masked_amax_cpu_float16 (__main__.TestInductorOpInfoCPU)": 97.7530008951823,
"test_comprehensive_masked_amax_cpu_float32 (__main__.TestInductorOpInfoCPU)": 92.8076655069987,
"test_comprehensive_masked_amax_cpu_float64 (__main__.TestInductorOpInfoCPU)": 104.97799936930339,
"test_comprehensive_masked_amax_cpu_int32 (__main__.TestInductorOpInfoCPU)": 90.8633321126302,
"test_comprehensive_masked_amax_cpu_int64 (__main__.TestInductorOpInfoCPU)": 90.08966827392578,
"test_comprehensive_masked_amin_cpu_float16 (__main__.TestInductorOpInfoCPU)": 93.20333353678386,
"test_comprehensive_masked_amin_cpu_float32 (__main__.TestInductorOpInfoCPU)": 94.15066782633464,
"test_comprehensive_masked_amin_cpu_float64 (__main__.TestInductorOpInfoCPU)": 94.77933247884114,
"test_comprehensive_masked_amin_cpu_int32 (__main__.TestInductorOpInfoCPU)": 90.3489990234375,
"test_comprehensive_masked_amin_cpu_int64 (__main__.TestInductorOpInfoCPU)": 95.64933522542317,
"test_comprehensive_masked_mean_cpu_float16 (__main__.TestInductorOpInfoCPU)": 97.31866455078125,
"test_comprehensive_masked_mean_cpu_float32 (__main__.TestInductorOpInfoCPU)": 93.01966603597005,
"test_comprehensive_masked_mean_cpu_float64 (__main__.TestInductorOpInfoCPU)": 96.31433359781902,
"test_comprehensive_masked_norm_cpu_float16 (__main__.TestInductorOpInfoCPU)": 469.4216715494792,
"test_comprehensive_masked_norm_cpu_float32 (__main__.TestInductorOpInfoCPU)": 452.2100016276042,
"test_comprehensive_masked_norm_cpu_float64 (__main__.TestInductorOpInfoCPU)": 454.2533264160156,
"test_comprehensive_masked_norm_cuda_float16 (__main__.TestInductorOpInfoCUDA)": 159.33299865722657,
"test_comprehensive_masked_norm_cuda_float32 (__main__.TestInductorOpInfoCUDA)": 158.02383422851562,
"test_comprehensive_masked_norm_cuda_float64 (__main__.TestInductorOpInfoCUDA)": 152.2355972290039,
"test_comprehensive_masked_prod_cpu_bool (__main__.TestInductorOpInfoCPU)": 88.12666575113933,
"test_comprehensive_masked_prod_cpu_float16 (__main__.TestInductorOpInfoCPU)": 97.00100199381511,
"test_comprehensive_masked_prod_cpu_float32 (__main__.TestInductorOpInfoCPU)": 91.61366526285808,
"test_comprehensive_masked_prod_cpu_float64 (__main__.TestInductorOpInfoCPU)": 94.33899943033855,
"test_comprehensive_masked_prod_cpu_int32 (__main__.TestInductorOpInfoCPU)": 93.58066813151042,
"test_comprehensive_masked_prod_cpu_int64 (__main__.TestInductorOpInfoCPU)": 86.63633219401042,
"test_comprehensive_masked_sum_cpu_bool (__main__.TestInductorOpInfoCPU)": 87.10366821289062,
"test_comprehensive_masked_sum_cpu_float16 (__main__.TestInductorOpInfoCPU)": 91.91966756184895,
"test_comprehensive_masked_sum_cpu_float32 (__main__.TestInductorOpInfoCPU)": 89.0056660970052,
"test_comprehensive_masked_sum_cpu_float64 (__main__.TestInductorOpInfoCPU)": 95.69266764322917,
"test_comprehensive_masked_sum_cpu_int32 (__main__.TestInductorOpInfoCPU)": 96.12366739908855,
"test_comprehensive_masked_sum_cpu_int64 (__main__.TestInductorOpInfoCPU)": 85.56033325195312,
"test_comprehensive_nn_functional_gaussian_nll_loss_cuda_float32 (__main__.TestDecompCUDA)": 94.3606669108073,
"test_comprehensive_nn_functional_gaussian_nll_loss_cuda_float64 (__main__.TestDecompCUDA)": 91.39319915771485,
"test_comprehensive_nn_functional_glu_cpu_float16 (__main__.TestInductorOpInfoCPU)": 75.17366790771484,
"test_comprehensive_nn_functional_glu_cpu_float32 (__main__.TestInductorOpInfoCPU)": 73.51633199055989,
"test_comprehensive_nn_functional_glu_cpu_float64 (__main__.TestInductorOpInfoCPU)": 72.20166524251302,
"test_comprehensive_nn_functional_grid_sample_cpu_float32 (__main__.TestDecompCPU)": 85.47899881998698,
"test_comprehensive_nn_functional_grid_sample_cpu_float64 (__main__.TestDecompCPU)": 82.7643305460612,
"test_comprehensive_nn_functional_grid_sample_cuda_float16 (__main__.TestDecompCUDA)": 71.34377839830186,
"test_comprehensive_nn_functional_grid_sample_cuda_float32 (__main__.TestDecompCUDA)": 245.36333211263022,
"test_comprehensive_nn_functional_grid_sample_cuda_float64 (__main__.TestDecompCUDA)": 217.09620056152343,
"test_comprehensive_nn_functional_interpolate_bicubic_cpu_uint8 (__main__.TestInductorOpInfoCPU)": 67.65433247884114,
"test_comprehensive_nn_functional_interpolate_bicubic_cuda_float32 (__main__.TestInductorOpInfoCUDA)": 76.41720123291016,
"test_comprehensive_nn_functional_interpolate_bicubic_cuda_float64 (__main__.TestInductorOpInfoCUDA)": 76.63816706339519,
"test_comprehensive_nn_functional_interpolate_trilinear_cuda_float32 (__main__.TestDecompCUDA)": 74.07599767049153,
"test_comprehensive_nn_functional_interpolate_trilinear_cuda_float64 (__main__.TestDecompCUDA)": 76.38788816663954,
"test_comprehensive_nn_functional_max_pool1d_cpu_float16 (__main__.TestInductorOpInfoCPU)": 183.63033040364584,
"test_comprehensive_nn_functional_max_pool1d_cpu_float32 (__main__.TestInductorOpInfoCPU)": 185.07866923014322,
"test_comprehensive_nn_functional_max_pool1d_cpu_float64 (__main__.TestInductorOpInfoCPU)": 181.17666625976562,
"test_comprehensive_nn_functional_max_pool2d_cpu_float16 (__main__.TestInductorOpInfoCPU)": 951.9180094401041,
"test_comprehensive_nn_functional_max_pool2d_cpu_float32 (__main__.TestInductorOpInfoCPU)": 898.5603230794271,
"test_comprehensive_nn_functional_max_pool2d_cpu_float64 (__main__.TestInductorOpInfoCPU)": 872.6630045572916,
"test_comprehensive_nn_functional_max_pool2d_cpu_int32 (__main__.TestInductorOpInfoCPU)": 867.6906534830729,
"test_comprehensive_nn_functional_max_pool2d_cpu_int64 (__main__.TestInductorOpInfoCPU)": 846.8659871419271,
"test_comprehensive_nn_functional_max_pool2d_cuda_float16 (__main__.TestInductorOpInfoCUDA)": 905.4492065429688,
"test_comprehensive_nn_functional_max_pool2d_cuda_float32 (__main__.TestInductorOpInfoCUDA)": 921.333994547526,
"test_comprehensive_nn_functional_max_pool2d_cuda_float64 (__main__.TestInductorOpInfoCUDA)": 893.0242065429687,
"test_comprehensive_nn_functional_max_pool3d_cuda_float32 (__main__.TestInductorOpInfoCUDA)": 65.94383303324382,
"test_comprehensive_nn_functional_max_pool3d_cuda_float64 (__main__.TestInductorOpInfoCUDA)": 61.17511134677463,
"test_comprehensive_nn_functional_max_unpool2d_cpu_float16 (__main__.TestInductorOpInfoCPU)": 197.9020029703776,
"test_comprehensive_nn_functional_max_unpool2d_cpu_float32 (__main__.TestInductorOpInfoCPU)": 202.92266845703125,
"test_comprehensive_nn_functional_max_unpool2d_cpu_float64 (__main__.TestInductorOpInfoCPU)": 198.81666564941406,
"test_comprehensive_nn_functional_max_unpool2d_cuda_float16 (__main__.TestInductorOpInfoCUDA)": 63.80933380126953,
"test_comprehensive_nn_functional_max_unpool2d_cuda_float32 (__main__.TestInductorOpInfoCUDA)": 99.99519958496094,
"test_comprehensive_nn_functional_max_unpool2d_cuda_float64 (__main__.TestInductorOpInfoCUDA)": 114.78399912516277,
"test_comprehensive_nn_functional_max_unpool3d_cpu_float16 (__main__.TestInductorOpInfoCPU)": 127.79300181070964,
"test_comprehensive_nn_functional_max_unpool3d_cpu_float32 (__main__.TestInductorOpInfoCPU)": 136.90966288248697,
"test_comprehensive_nn_functional_max_unpool3d_cpu_float64 (__main__.TestInductorOpInfoCPU)": 144.04033406575522,
"test_comprehensive_nn_functional_pad_constant_cpu_float16 (__main__.TestInductorOpInfoCPU)": 68.3290023803711,
"test_comprehensive_nn_functional_pad_constant_cpu_float32 (__main__.TestInductorOpInfoCPU)": 70.11433410644531,
"test_comprehensive_nn_functional_pad_constant_cpu_float64 (__main__.TestInductorOpInfoCPU)": 72.62233479817708,
"test_comprehensive_nn_functional_pad_constant_cpu_int32 (__main__.TestInductorOpInfoCPU)": 70.95999908447266,
"test_comprehensive_nn_functional_pad_constant_cpu_int64 (__main__.TestInductorOpInfoCPU)": 67.1433334350586,
"test_comprehensive_nn_functional_poisson_nll_loss_cpu_float16 (__main__.TestInductorOpInfoCPU)": 116.43599955240886,
"test_comprehensive_nn_functional_poisson_nll_loss_cpu_float32 (__main__.TestInductorOpInfoCPU)": 122.10533142089844,
"test_comprehensive_nn_functional_poisson_nll_loss_cpu_float64 (__main__.TestInductorOpInfoCPU)": 133.65133412679037,
"test_comprehensive_nn_functional_poisson_nll_loss_cpu_int32 (__main__.TestInductorOpInfoCPU)": 110.69800313313802,
"test_comprehensive_nn_functional_poisson_nll_loss_cpu_int64 (__main__.TestInductorOpInfoCPU)": 111.77166748046875,
"test_comprehensive_nn_functional_unfold_cpu_bool (__main__.TestInductorOpInfoCPU)": 127.3866704305013,
"test_comprehensive_nn_functional_unfold_cpu_float16 (__main__.TestInductorOpInfoCPU)": 233.09599812825522,
"test_comprehensive_nn_functional_unfold_cpu_float32 (__main__.TestInductorOpInfoCPU)": 234.11399841308594,
"test_comprehensive_nn_functional_unfold_cpu_float64 (__main__.TestInductorOpInfoCPU)": 226.98400370279947,
"test_comprehensive_nn_functional_unfold_cuda_float16 (__main__.TestInductorOpInfoCUDA)": 89.39950052897136,
"test_comprehensive_nn_functional_unfold_cuda_float32 (__main__.TestInductorOpInfoCUDA)": 74.69460067749023,
"test_comprehensive_nn_functional_unfold_cuda_float64 (__main__.TestInductorOpInfoCUDA)": 81.90066719055176,
"test_comprehensive_ormqr_cuda_complex128 (__main__.TestDecompCUDA)": 116.8889986673991,
"test_comprehensive_ormqr_cuda_complex64 (__main__.TestDecompCUDA)": 110.37666575113933,
"test_comprehensive_ormqr_cuda_float32 (__main__.TestDecompCUDA)": 74.48516654968262,
"test_comprehensive_ormqr_cuda_float32 (__main__.TestInductorOpInfoCUDA)": 122.96380004882812,
"test_comprehensive_ormqr_cuda_float64 (__main__.TestDecompCUDA)": 64.73344463772244,
"test_comprehensive_ormqr_cuda_float64 (__main__.TestInductorOpInfoCUDA)": 93.02200164794922,
"test_comprehensive_svd_cuda_complex128 (__main__.TestDecompCUDA)": 68.18680038452149,
"test_comprehensive_svd_cuda_complex64 (__main__.TestDecompCUDA)": 67.39633263481988,
"test_cond_autograd_nested (__main__.TestControlFlow)": 84.44266510009766,
"test_constructor_autograd_SparseBSC_cuda (__main__.TestSparseAnyCUDA)": 377.3101666768392,
"test_constructor_autograd_SparseBSR_cuda (__main__.TestSparseAnyCUDA)": 100.73100026448567,
"test_constructor_autograd_SparseCSC_cuda (__main__.TestSparseAnyCUDA)": 83.851500193278,
"test_constructor_autograd_SparseCSR_cuda (__main__.TestSparseAnyCUDA)": 67.7853323618571,
"test_conv1d_basic (__main__.TestXNNPACKConv1dTransformPass)": 328.25274181365967,
"test_conv1d_with_relu_fc (__main__.TestXNNPACKConv1dTransformPass)": 447.28986740112305,
"test_conv2d_unary_cpu_cpp_wrapper (__main__.TestCppWrapper)": 107.9556655883789,
"test_correctness_AdamW_use_closure_False_cuda_float32 (__main__.CompiledOptimizerParityTestsCUDA)": 64.6594009399414,
"test_correctness_AdamW_use_closure_True_cuda_float32 (__main__.CompiledOptimizerParityTestsCUDA)": 112.1166000366211,
"test_correctness_Adam_use_closure_False_cuda_float32 (__main__.CompiledOptimizerParityTestsCUDA)": 62.93920059204102,
"test_correctness_Adam_use_closure_True_cuda_float32 (__main__.CompiledOptimizerParityTestsCUDA)": 112.84459991455078,
"test_correctness_NAdam_use_closure_True_cuda_float32 (__main__.CompiledOptimizerParityTestsCUDA)": 69.20719985961914,
"test_correctness_RAdam_use_closure_True_cuda_float32 (__main__.CompiledOptimizerParityTestsCUDA)": 60.54666709899902,
"test_count_nonzero_all (__main__.TestBool)": 595.4372219509548,
"test_custom_module_lstm (__main__.TestQuantizedOps)": 522.6370048522949,
"test_dispatch_symbolic_meta_outplace_all_strides_nn_functional_gaussian_nll_loss_cuda_float32 (__main__.TestMetaCUDA)": 86.56959991455078,
"test_distributed_checkpoint_state_dict_type0_cuda (__main__.TestDistributedCheckpointCUDA)": 107.90633074442546,
"test_dtensor_op_db_nn_functional_gaussian_nll_loss_cpu_float32 (__main__.TestDTensorOpsCPU)": 89.07333119710286,
"test_eig_check_magma_cuda_float32 (__main__.TestLinalgCUDA)": 242.41000003814696,
"test_fail_creation_ops.py (__main__.TestTyping)": 63.9422492980957,
"test_fail_random.py (__main__.TestTyping)": 72.27856661478678,
"test_fn_fwgrad_bwgrad_cumprod_cuda_complex128 (__main__.TestFwdGradientsCUDA)": 81.51600036621093,
"test_fn_gradgrad_cumprod_cuda_complex128 (__main__.TestBwdGradientsCUDA)": 81.64050038655598,
"test_fn_gradgrad_map_nested_cpu_float64 (__main__.TestBwdGradientsCPU)": 84.40933481852214,
"test_fn_gradgrad_map_triple_nested_cpu_float64 (__main__.TestBwdGradientsCPU)": 539.1473388671875,
"test_fn_gradgrad_map_triple_nested_cuda_float64 (__main__.TestBwdGradientsCUDA)": 357.4328358968099,
"test_fuse_large_params_cpu (__main__.CpuTests)": 62.61687517166138,
"test_fuse_large_params_dynamic_shapes_cpu (__main__.DynamicShapesCodegenCpuTests)": 95.7061243057251,
"test_fuse_large_params_dynamic_shapes_cpu (__main__.DynamicShapesCpuTests)": 98.63437461853027,
"test_fuse_large_params_dynamic_shapes_cuda (__main__.DynamicShapesCodegenGPUTests)": 68.34640045166016,
"test_fuse_large_params_dynamic_shapes_cuda (__main__.DynamicShapesGPUTests)": 71.67316754659016,
"test_get_future_result (__main__.NcclErrorHandlingTest)": 70.02166509628296,
"test_grad_nn_Transformer_cuda_float64 (__main__.TestModuleCUDA)": 85.97466659545898,
"test_gradgrad_nn_LSTM_eval_mode_cuda_float64 (__main__.TestModuleCUDA)": 106.56066385904948,
"test_gradgrad_nn_LSTM_train_mode_cuda_float64 (__main__.TestModuleCUDA)": 100.10433451334636,
"test_gradgrad_nn_TransformerDecoderLayer_cuda_float64 (__main__.TestModuleCUDA)": 197.9608357747396,
"test_gradgrad_nn_TransformerEncoder_eval_mode_cuda_float64 (__main__.TestModuleCUDA)": 121.5308354695638,
"test_gradgrad_nn_TransformerEncoder_train_mode_cuda_float64 (__main__.TestModuleCUDA)": 138.2099978129069,
"test_grid_sampler_2d_cpu (__main__.CpuHalideTests)": 184.44500223795572,
"test_group_norm (__main__.TestQuantizedOps)": 103.21900272369385,
"test_indirect_device_assert (__main__.TritonCodeGenTests)": 217.30499776204428,
"test_inductor_no_recursionerror_on_for_loops_dynamic_shapes (__main__.DynamicShapesReproTests)": 75.90662479400635,
"test_inplace_gradgrad_cumprod_cuda_complex128 (__main__.TestBwdGradientsCUDA)": 113.31633122762044,
"test_inputs_overlapping_with_mutation_stress_dynamic_shapes (__main__.DynamicShapesAotAutogradFallbackTests)": 138.96125316619873,
"test_jit_cuda_archflags (__main__.TestCppExtensionJIT)": 110.0633316040039,
"test_linalg_solve_triangular_large_cuda_complex128 (__main__.TestLinalgCUDA)": 724.2651733398437,
"test_linalg_solve_triangular_large_cuda_complex64 (__main__.TestLinalgCUDA)": 65.02860107421876,
"test_linalg_solve_triangular_large_cuda_float64 (__main__.TestLinalgCUDA)": 81.81559906005859,
"test_linear (__main__.TestStaticQuantizedModule)": 160.7091144985623,
"test_linear_binary_cpp_wrapper (__main__.TestCppWrapper)": 67.73933283487956,
"test_linear_binary_dynamic_shapes_cpp_wrapper (__main__.DynamicShapesCppWrapperCpuTests)": 71.7346674601237,
"test_lobpcg_ortho_cuda_float64 (__main__.TestLinalgCUDA)": 165.26700077056884,
"test_lstm_cpu (__main__.TestMkldnnCPU)": 65.87166595458984,
"test_many_overlapping_inputs_does_not_explode_guards_dynamic_shapes (__main__.DynamicShapesReproTests)": 116.96750068664551,
"test_matmul_small_brute_force_tunableop_cuda_float32 (__main__.TestLinalgCUDA)": 157.28033447265625,
"test_matmul_small_brute_force_tunableop_cuda_float64 (__main__.TestLinalgCUDA)": 272.11766815185547,
"test_max_autotune_cutlass_backend_addmm_dynamic_False_max_autotune_gemm_backends_ATen,Triton,CUTLASS (__main__.TestCutlassBackend)": 85.9010009765625,
"test_max_pool2d_with_indices_backward4_dynamic_shapes_cpu (__main__.DynamicShapesCodegenCpuTests)": 65.27966647677951,
"test_max_pool2d_with_indices_backward4_dynamic_shapes_cpu (__main__.DynamicShapesCpuTests)": 65.34055582682292,
"test_memory_format_operators_cpu (__main__.TestTorchDeviceTypeCPU)": 73.96219524472124,
"test_memory_format_operators_cuda (__main__.TestTorchDeviceTypeCUDA)": 74.76016703496377,
"test_nccl_non_blocking_wait_with_barrier (__main__.NcclErrorHandlingTest)": 128.86683146158853,
"test_proper_exit (__main__.TestDataLoader)": 225.54483795166016,
"test_proper_exit (__main__.TestDataLoaderPersistentWorkers)": 229.0020014444987,
"test_qat_conv2d_unary (__main__.TestQuantizePT2EX86Inductor)": 155.29989030626086,
"test_qat_conv_bn_fusion_no_conv_bias (__main__.TestQuantizePT2EQAT_ConvBn1d)": 60.57449994768415,
"test_qat_conv_bn_fusion_no_conv_bias (__main__.TestQuantizePT2EQAT_ConvBn2d)": 60.53676169259207,
"test_qat_mobilenet_v2 (__main__.TestQuantizePT2EQATModels)": 86.17025089263916,
"test_qlinear_add_int8_mixed_bf16_use_relu_False_is_qat_False_is_dynamic_False (__main__.TestPatternMatcher)": 66.87833150227864,
"test_qlinear_add_int8_mixed_bf16_use_relu_False_is_qat_False_is_dynamic_True (__main__.TestPatternMatcher)": 64.44400024414062,
"test_qlinear_add_int8_mixed_bf16_use_relu_False_is_qat_True_is_dynamic_False (__main__.TestPatternMatcher)": 63.335001627604164,
"test_qlinear_add_int8_mixed_bf16_use_relu_False_is_qat_True_is_dynamic_True (__main__.TestPatternMatcher)": 65.24266688028972,
"test_qlinear_add_int8_mixed_bf16_use_relu_False_is_qat_True_is_dynamic_True_cpp_wrapper (__main__.TestCppWrapper)": 60.08399963378906,
"test_qlinear_add_int8_mixed_bf16_use_relu_True_is_qat_False_is_dynamic_False (__main__.TestPatternMatcher)": 69.76100158691406,
"test_qlinear_add_int8_mixed_bf16_use_relu_True_is_qat_False_is_dynamic_True (__main__.TestPatternMatcher)": 68.71633402506511,
"test_qlinear_add_int8_mixed_bf16_use_relu_True_is_qat_False_is_dynamic_True_cpp_wrapper (__main__.TestCppWrapper)": 60.00833384195963,
"test_qlinear_add_int8_mixed_bf16_use_relu_True_is_qat_True_is_dynamic_False (__main__.TestPatternMatcher)": 66.8259989420573,
"test_qlinear_add_int8_mixed_bf16_use_relu_True_is_qat_True_is_dynamic_True (__main__.TestPatternMatcher)": 68.65233103434245,
"test_quick_core_backward__unsafe_masked_index_cpu_float64 (__main__.TestDecompCPU)": 409.33233642578125,
"test_quick_core_backward__unsafe_masked_index_cuda_float64 (__main__.TestDecompCUDA)": 719.1711730957031,
"test_quick_core_backward__unsafe_masked_index_put_accumulate_cpu_float64 (__main__.TestDecompCPU)": 555.447998046875,
"test_quick_core_backward__unsafe_masked_index_put_accumulate_cuda_float64 (__main__.TestDecompCUDA)": 1191.0525004069011,
"test_quick_core_backward_expand_copy_cuda_float64 (__main__.TestDecompCUDA)": 74.82050132751465,
"test_quick_core_backward_nn_functional_max_unpool3d_grad_cpu_float64 (__main__.TestDecompCPU)": 68.36066818237305,
"test_quick_core_backward_nn_functional_max_unpool3d_grad_cuda_float64 (__main__.TestDecompCUDA)": 282.41783905029297,
"test_quick_core_backward_roll_cpu_float64 (__main__.TestDecompCPU)": 96.43233489990234,
"test_quick_core_backward_roll_cuda_float64 (__main__.TestDecompCUDA)": 181.66466522216797,
"test_quick_core_backward_select_scatter_cpu_float64 (__main__.TestDecompCPU)": 61.32693277994792,
"test_quick_core_backward_select_scatter_cuda_float64 (__main__.TestDecompCUDA)": 115.47833251953125,
"test_quick_core_backward_split_with_sizes_copy_cpu_float64 (__main__.TestDecompCPU)": 77.8719991048177,
"test_quick_core_backward_split_with_sizes_copy_cuda_float64 (__main__.TestDecompCUDA)": 136.78380126953124,
"test_quick_core_backward_std_cuda_float64 (__main__.TestDecompCUDA)": 91.93119964599609,
"test_replicatepad_64bit_indexing_cuda_float16 (__main__.TestNNDeviceTypeCUDA)": 67.2739995320638,
"test_rosenbrock_sparse_with_lrsched_False_SGD_cuda_float64 (__main__.TestOptimRenewedCUDA)": 84.41359996795654,
"test_rosenbrock_sparse_with_lrsched_True_SGD_cuda_float64 (__main__.TestOptimRenewedCUDA)": 76.8560001373291,
"test_save_load_large_string_attribute (__main__.TestSaveLoad)": 105.95299911499023,
"test_shuffler_iterdatapipe (__main__.IntegrationTestDataLoaderDataPipe)": 149.1056645711263,
"test_slow_tasks (__main__.TestFunctionalAutogradBenchmark)": 137.01250076293945,
"test_sort_stable_cpu (__main__.CpuTritonTests)": 72.2096659342448,
"test_split_cumsum_cpu (__main__.CpuTritonTests)": 89.40066528320312,
"test_svd_lowrank_cuda_complex128 (__main__.TestLinalgCUDA)": 199.06099891662598,
"test_terminate_handler_on_crash (__main__.TestTorch)": 99.10455474588606,
"test_terminate_signal (__main__.ForkTest)": 135.61289005643792,
"test_terminate_signal (__main__.ParallelForkServerShouldWorkTest)": 135.77333214630684,
"test_terminate_signal (__main__.SpawnTest)": 138.1917757458157,
"test_torchvision_smoke (__main__.TestTensorBoardPytorchGraph)": 70.92737340927124,
"test_transformer_backend_inductor_fullgraph_True (__main__.TestFullyShardCompile)": 105.59533309936523,
"test_transpose_copy (__main__.CPUReproTests)": 60.39411163330078,
"test_triton_bsr_scatter_mm_blocksize_64_cuda_bfloat16 (__main__.TestSparseCompressedTritonKernelsCUDA)": 71.22266642252605,
"test_triton_bsr_scatter_mm_blocksize_64_cuda_float32 (__main__.TestSparseCompressedTritonKernelsCUDA)": 227.48333231608072,
"test_triton_bsr_softmax_cuda_bfloat16 (__main__.TestSparseCompressedTritonKernelsCUDA)": 162.58349990844727,
"test_triton_bsr_softmax_cuda_float16 (__main__.TestSparseCompressedTritonKernelsCUDA)": 146.57499821980795,
"test_triton_bsr_softmax_cuda_float32 (__main__.TestSparseCompressedTritonKernelsCUDA)": 121.54083251953125,
"test_unary_ops (__main__.TestTEFuserDynamic)": 169.8456654018826,
"test_unary_ops (__main__.TestTEFuserStatic)": 152.63955561319986,
"test_upsample_bicubic2d_cpu (__main__.CpuHalideTests)": 96.07833353678386,
"test_variant_consistency_jit_nn_functional_max_pool2d_cpu_float32 (__main__.TestJitCPU)": 91.68333435058594,
"test_variant_consistency_jit_nn_functional_max_pool2d_cuda_float32 (__main__.TestJitCUDA)": 75.80999908447265,
"test_vmapjvpvjp_linalg_lu_solve_cuda_float32 (__main__.TestOperatorsCUDA)": 78.79200045267741,
"test_vmapjvpvjp_linalg_multi_dot_cuda_float32 (__main__.TestOperatorsCUDA)": 67.70660095214843,
"test_vmapjvpvjp_linalg_solve_triangular_cuda_float32 (__main__.TestOperatorsCUDA)": 61.0824998219808,
"test_vmapjvpvjp_linalg_svd_cuda_float32 (__main__.TestOperatorsCUDA)": 68.92850049336751,
"test_vmapjvpvjp_max_pool2d_with_indices_backward_cpu_float32 (__main__.TestOperatorsCPU)": 67.91666666666667,
"test_vmapjvpvjp_max_pool2d_with_indices_backward_cuda_float32 (__main__.TestOperatorsCUDA)": 73.6173324584961,
"test_vmapjvpvjp_nn_functional_conv2d_cpu_float32 (__main__.TestOperatorsCPU)": 60.76257124401274,
"test_vmapjvpvjp_nn_functional_max_pool2d_cpu_float32 (__main__.TestOperatorsCPU)": 71.23704710460845,
"test_vmapjvpvjp_nn_functional_max_pool2d_cuda_float32 (__main__.TestOperatorsCUDA)": 65.04120025634765,
"test_vmapjvpvjp_svd_cuda_float32 (__main__.TestOperatorsCUDA)": 72.83116722106934,
"test_vmapjvpvjp_unbind_cpu_float32 (__main__.TestOperatorsCPU)": 61.08738090878441,
"test_vmapjvpvjp_unbind_cuda_float32 (__main__.TestOperatorsCUDA)": 67.91599960327149,
"test_vmapvjpvjp_meshgrid_list_of_tensors_cuda_float32 (__main__.TestOperatorsCUDA)": 72.0385004679362,
"test_vmapvjpvjp_meshgrid_variadic_tensors_cuda_float32 (__main__.TestOperatorsCUDA)": 72.64249928792317,
"test_vmapvjpvjp_nn_functional_bilinear_cuda_float32 (__main__.TestOperatorsCUDA)": 124.12919769287109
"EndToEndLSTM (__main__.RNNTest)": 218.46899922688803,
"MultiheadAttention (__main__.ModulesTest)": 173.65766398111978,
"test_AllenaiLongformerBase_repro_cpu (__main__.CpuHalideTests)": 215.72766621907553,
"test__adaptive_avg_pool2d (__main__.CPUReproTests)": 160.06233300103082,
"test_adaptive_max_pool2d1_cpu (__main__.CpuHalideTests)": 114.19766489664714,
"test_after_aot_cpu_runtime_error (__main__.MinifierIsolateTests)": 62.27711062961154,
"test_alexnet_prefix_cpu (__main__.CpuHalideTests)": 191.4193318684896,
"test_aot_autograd_exhaustive_nn_functional_max_pool2d_cpu_float32 (__main__.TestEagerFusionOpInfoCPU)": 113.02799733479817,
"test_aot_autograd_symbolic_exhaustive_linalg_svd_cpu_float32 (__main__.TestEagerFusionOpInfoCPU)": 66.00233332316081,
"test_aot_autograd_symbolic_exhaustive_nn_functional_max_pool1d_cpu_float32 (__main__.TestEagerFusionOpInfoCPU)": 120.18766530354817,
"test_aot_autograd_symbolic_exhaustive_nn_functional_max_pool2d_cpu_float32 (__main__.TestEagerFusionOpInfoCPU)": 141.22733561197916,
"test_aot_autograd_symbolic_exhaustive_nn_functional_max_pool3d_cpu_float32 (__main__.TestEagerFusionOpInfoCPU)": 103.69833119710286,
"test_aot_autograd_symbolic_module_exhaustive_nn_TransformerDecoderLayer_cpu_float32 (__main__.TestEagerFusionModuleInfoCPU)": 130.41566721598306,
"test_avg_pool3d_backward2_cpu (__main__.CpuTests)": 487.44966973198785,
"test_avg_pool3d_backward2_cuda (__main__.GPUTests)": 94.76033147176106,
"test_avg_pool3d_backward2_dynamic_shapes_cpu (__main__.DynamicShapesCodegenCpuTests)": 490.70132785373266,
"test_avg_pool3d_backward2_dynamic_shapes_cpu (__main__.DynamicShapesCpuTests)": 496.97710503472223,
"test_avg_pool3d_backward2_dynamic_shapes_cuda (__main__.DynamicShapesGPUTests)": 124.80966567993164,
"test_avg_pool3d_backward_cpu (__main__.CpuHalideTests)": 61.59099833170573,
"test_backward_nn_functional_multi_head_attention_forward_cpu_float32 (__main__.TestCompositeComplianceCPU)": 87.07666778564453,
"test_backward_nn_functional_multi_head_attention_forward_cuda_float32 (__main__.TestCompositeComplianceCUDA)": 68.67283248901367,
"test_basic_cpu (__main__.EfficientConvBNEvalCpuTests)": 244.37422349717883,
"test_basic_cuda (__main__.EfficientConvBNEvalGpuTests)": 161.94966761271158,
"test_builtin_equivalent_funcs (__main__.TorchFunctionModeTests)": 91.85369873046875,
"test_checkpoint_cast (__main__.TestFxToOnnx)": 367.8630065917969,
"test_collect_callgrind (__main__.TestBenchmarkUtils)": 357.23644680447046,
"test_comprehensive_constant_pad_nd_cpu_float16 (__main__.TestInductorOpInfoCPU)": 69.92699940999348,
"test_comprehensive_constant_pad_nd_cpu_float32 (__main__.TestInductorOpInfoCPU)": 75.00166575113933,
"test_comprehensive_constant_pad_nd_cpu_float64 (__main__.TestInductorOpInfoCPU)": 68.49166615804036,
"test_comprehensive_constant_pad_nd_cpu_int32 (__main__.TestInductorOpInfoCPU)": 65.78366597493489,
"test_comprehensive_constant_pad_nd_cpu_int64 (__main__.TestInductorOpInfoCPU)": 68.89199829101562,
"test_comprehensive_diff_cpu_bool (__main__.TestInductorOpInfoCPU)": 102.89200083414714,
"test_comprehensive_diff_cpu_float32 (__main__.TestInductorOpInfoCPU)": 102.76666768391927,
"test_comprehensive_diff_cpu_float64 (__main__.TestInductorOpInfoCPU)": 100.1219991048177,
"test_comprehensive_diff_cpu_int32 (__main__.TestInductorOpInfoCPU)": 102.89499918619792,
"test_comprehensive_diff_cpu_int64 (__main__.TestInductorOpInfoCPU)": 100.64933522542317,
"test_comprehensive_diff_cuda_complex128 (__main__.TestDecompCUDA)": 86.70000076293945,
"test_comprehensive_diff_cuda_complex64 (__main__.TestDecompCUDA)": 82.97133509318034,
"test_comprehensive_diff_cuda_float32 (__main__.TestDecompCUDA)": 98.83016777038574,
"test_comprehensive_diff_cuda_float64 (__main__.TestDecompCUDA)": 63.6163330078125,
"test_comprehensive_dist_cpu_float16 (__main__.TestInductorOpInfoCPU)": 80.70999908447266,
"test_comprehensive_dist_cpu_float32 (__main__.TestInductorOpInfoCPU)": 80.09666697184245,
"test_comprehensive_dist_cpu_float64 (__main__.TestInductorOpInfoCPU)": 85.40266927083333,
"test_comprehensive_eye_cpu_bool (__main__.TestInductorOpInfoCPU)": 124.63333384195964,
"test_comprehensive_eye_cpu_float16 (__main__.TestInductorOpInfoCPU)": 118.93233235677083,
"test_comprehensive_eye_cpu_float32 (__main__.TestInductorOpInfoCPU)": 119.12733459472656,
"test_comprehensive_eye_cpu_float64 (__main__.TestInductorOpInfoCPU)": 139.26000467936197,
"test_comprehensive_eye_cpu_int32 (__main__.TestInductorOpInfoCPU)": 129.03466796875,
"test_comprehensive_eye_cpu_int64 (__main__.TestInductorOpInfoCPU)": 121.75833129882812,
"test_comprehensive_grid_sampler_2d_cpu_bfloat16 (__main__.TestDecompCPU)": 69.67933400472005,
"test_comprehensive_grid_sampler_2d_cpu_float16 (__main__.TestDecompCPU)": 82.40866597493489,
"test_comprehensive_grid_sampler_2d_cpu_float16 (__main__.TestInductorOpInfoCPU)": 84.81233215332031,
"test_comprehensive_grid_sampler_2d_cpu_float32 (__main__.TestDecompCPU)": 357.16966756184894,
"test_comprehensive_grid_sampler_2d_cpu_float32 (__main__.TestInductorOpInfoCPU)": 85.7066650390625,
"test_comprehensive_grid_sampler_2d_cpu_float64 (__main__.TestDecompCPU)": 349.5823262532552,
"test_comprehensive_grid_sampler_2d_cpu_float64 (__main__.TestInductorOpInfoCPU)": 82.29266611735027,
"test_comprehensive_grid_sampler_2d_cuda_bfloat16 (__main__.TestDecompCUDA)": 262.3520024617513,
"test_comprehensive_grid_sampler_2d_cuda_float16 (__main__.TestDecompCUDA)": 247.61383819580078,
"test_comprehensive_grid_sampler_2d_cuda_float32 (__main__.TestDecompCUDA)": 1042.3961690266926,
"test_comprehensive_grid_sampler_2d_cuda_float32 (__main__.TestInductorOpInfoCUDA)": 70.3201675415039,
"test_comprehensive_grid_sampler_2d_cuda_float64 (__main__.TestDecompCUDA)": 1023.5723164876302,
"test_comprehensive_grid_sampler_2d_cuda_float64 (__main__.TestInductorOpInfoCUDA)": 73.51150004069011,
"test_comprehensive_linalg_lu_solve_cuda_float32 (__main__.TestInductorOpInfoCUDA)": 78.84833399454753,
"test_comprehensive_linalg_lu_solve_cuda_float64 (__main__.TestInductorOpInfoCUDA)": 71.58949788411458,
"test_comprehensive_linalg_solve_triangular_cuda_float32 (__main__.TestInductorOpInfoCUDA)": 71.51049931844075,
"test_comprehensive_linalg_solve_triangular_cuda_float64 (__main__.TestInductorOpInfoCUDA)": 66.26499875386556,
"test_comprehensive_linalg_svd_cuda_complex128 (__main__.TestDecompCUDA)": 63.65166664123535,
"test_comprehensive_linalg_vector_norm_cpu_float16 (__main__.TestInductorOpInfoCPU)": 194.29166158040366,
"test_comprehensive_linalg_vector_norm_cpu_float32 (__main__.TestInductorOpInfoCPU)": 205.24866739908853,
"test_comprehensive_linalg_vector_norm_cpu_float64 (__main__.TestInductorOpInfoCPU)": 196.55799865722656,
"test_comprehensive_linalg_vector_norm_cuda_float32 (__main__.TestInductorOpInfoCUDA)": 74.55249977111816,
"test_comprehensive_linalg_vector_norm_cuda_float64 (__main__.TestInductorOpInfoCUDA)": 75.83016713460286,
"test_comprehensive_logspace_cpu_float32 (__main__.TestInductorOpInfoCPU)": 422.2393290201823,
"test_comprehensive_logspace_cpu_float64 (__main__.TestInductorOpInfoCPU)": 419.15733846028644,
"test_comprehensive_logspace_cpu_int32 (__main__.TestInductorOpInfoCPU)": 407.1983337402344,
"test_comprehensive_logspace_cpu_int64 (__main__.TestInductorOpInfoCPU)": 396.66066487630206,
"test_comprehensive_logspace_cuda_float32 (__main__.TestInductorOpInfoCUDA)": 75.42149861653645,
"test_comprehensive_logspace_cuda_float64 (__main__.TestInductorOpInfoCUDA)": 75.69333330790202,
"test_comprehensive_masked_amax_cpu_float16 (__main__.TestInductorOpInfoCPU)": 97.0836664835612,
"test_comprehensive_masked_amax_cpu_float32 (__main__.TestInductorOpInfoCPU)": 92.19766743977864,
"test_comprehensive_masked_amax_cpu_float64 (__main__.TestInductorOpInfoCPU)": 101.15033213297527,
"test_comprehensive_masked_amax_cpu_int32 (__main__.TestInductorOpInfoCPU)": 89.56966908772786,
"test_comprehensive_masked_amax_cpu_int64 (__main__.TestInductorOpInfoCPU)": 88.81166585286458,
"test_comprehensive_masked_amin_cpu_float16 (__main__.TestInductorOpInfoCPU)": 95.51766713460286,
"test_comprehensive_masked_amin_cpu_float32 (__main__.TestInductorOpInfoCPU)": 94.93733469645183,
"test_comprehensive_masked_amin_cpu_float64 (__main__.TestInductorOpInfoCPU)": 94.22766367594402,
"test_comprehensive_masked_amin_cpu_int32 (__main__.TestInductorOpInfoCPU)": 90.8259989420573,
"test_comprehensive_masked_amin_cpu_int64 (__main__.TestInductorOpInfoCPU)": 92.13633473714192,
"test_comprehensive_masked_mean_cpu_float16 (__main__.TestInductorOpInfoCPU)": 95.29866536458333,
"test_comprehensive_masked_mean_cpu_float32 (__main__.TestInductorOpInfoCPU)": 92.53700256347656,
"test_comprehensive_masked_mean_cpu_float64 (__main__.TestInductorOpInfoCPU)": 95.22733306884766,
"test_comprehensive_masked_norm_cpu_float16 (__main__.TestInductorOpInfoCPU)": 471.0916748046875,
"test_comprehensive_masked_norm_cpu_float32 (__main__.TestInductorOpInfoCPU)": 446.25799560546875,
"test_comprehensive_masked_norm_cpu_float64 (__main__.TestInductorOpInfoCPU)": 446.1899922688802,
"test_comprehensive_masked_norm_cuda_float16 (__main__.TestInductorOpInfoCUDA)": 167.7551638285319,
"test_comprehensive_masked_norm_cuda_float32 (__main__.TestInductorOpInfoCUDA)": 148.79099909464517,
"test_comprehensive_masked_norm_cuda_float64 (__main__.TestInductorOpInfoCUDA)": 162.5819994608561,
"test_comprehensive_masked_prod_cpu_bool (__main__.TestInductorOpInfoCPU)": 88.22800191243489,
"test_comprehensive_masked_prod_cpu_float16 (__main__.TestInductorOpInfoCPU)": 95.65499877929688,
"test_comprehensive_masked_prod_cpu_float32 (__main__.TestInductorOpInfoCPU)": 90.88400014241536,
"test_comprehensive_masked_prod_cpu_float64 (__main__.TestInductorOpInfoCPU)": 94.00266520182292,
"test_comprehensive_masked_prod_cpu_int32 (__main__.TestInductorOpInfoCPU)": 91.75599924723308,
"test_comprehensive_masked_prod_cpu_int64 (__main__.TestInductorOpInfoCPU)": 85.58166758219402,
"test_comprehensive_masked_sum_cpu_bool (__main__.TestInductorOpInfoCPU)": 87.07266743977864,
"test_comprehensive_masked_sum_cpu_float16 (__main__.TestInductorOpInfoCPU)": 91.46266428629558,
"test_comprehensive_masked_sum_cpu_float32 (__main__.TestInductorOpInfoCPU)": 88.94800059000652,
"test_comprehensive_masked_sum_cpu_float64 (__main__.TestInductorOpInfoCPU)": 94.90433502197266,
"test_comprehensive_masked_sum_cpu_int32 (__main__.TestInductorOpInfoCPU)": 99.29966735839844,
"test_comprehensive_masked_sum_cpu_int64 (__main__.TestInductorOpInfoCPU)": 85.29933166503906,
"test_comprehensive_nn_functional_gaussian_nll_loss_cuda_float32 (__main__.TestDecompCUDA)": 110.91299947102864,
"test_comprehensive_nn_functional_gaussian_nll_loss_cuda_float64 (__main__.TestDecompCUDA)": 87.41866683959961,
"test_comprehensive_nn_functional_glu_cpu_float16 (__main__.TestInductorOpInfoCPU)": 73.81366729736328,
"test_comprehensive_nn_functional_glu_cpu_float32 (__main__.TestInductorOpInfoCPU)": 72.70933532714844,
"test_comprehensive_nn_functional_glu_cpu_float64 (__main__.TestInductorOpInfoCPU)": 71.70566813151042,
"test_comprehensive_nn_functional_grid_sample_cpu_float32 (__main__.TestDecompCPU)": 101.97566731770833,
"test_comprehensive_nn_functional_grid_sample_cpu_float64 (__main__.TestDecompCPU)": 79.01466878255208,
"test_comprehensive_nn_functional_grid_sample_cuda_bfloat16 (__main__.TestDecompCUDA)": 60.61944495307075,
"test_comprehensive_nn_functional_grid_sample_cuda_float32 (__main__.TestDecompCUDA)": 249.51266479492188,
"test_comprehensive_nn_functional_grid_sample_cuda_float64 (__main__.TestDecompCUDA)": 204.8530019124349,
"test_comprehensive_nn_functional_interpolate_bicubic_cpu_uint8 (__main__.TestInductorOpInfoCPU)": 71.11166636149089,
"test_comprehensive_nn_functional_interpolate_bicubic_cuda_float32 (__main__.TestInductorOpInfoCUDA)": 79.37683359781902,
"test_comprehensive_nn_functional_interpolate_bicubic_cuda_float64 (__main__.TestInductorOpInfoCUDA)": 75.29683430989583,
"test_comprehensive_nn_functional_interpolate_trilinear_cuda_float32 (__main__.TestDecompCUDA)": 75.37983131408691,
"test_comprehensive_nn_functional_interpolate_trilinear_cuda_float64 (__main__.TestDecompCUDA)": 71.4200013478597,
"test_comprehensive_nn_functional_max_pool1d_cpu_float16 (__main__.TestInductorOpInfoCPU)": 182.4503377278646,
"test_comprehensive_nn_functional_max_pool1d_cpu_float32 (__main__.TestInductorOpInfoCPU)": 182.4470011393229,
"test_comprehensive_nn_functional_max_pool1d_cpu_float64 (__main__.TestInductorOpInfoCPU)": 180.7423299153646,
"test_comprehensive_nn_functional_max_pool2d_cpu_float16 (__main__.TestInductorOpInfoCPU)": 947.5219930013021,
"test_comprehensive_nn_functional_max_pool2d_cpu_float32 (__main__.TestInductorOpInfoCPU)": 888.4380086263021,
"test_comprehensive_nn_functional_max_pool2d_cpu_float64 (__main__.TestInductorOpInfoCPU)": 872.6106770833334,
"test_comprehensive_nn_functional_max_pool2d_cpu_int32 (__main__.TestInductorOpInfoCPU)": 873.1863199869791,
"test_comprehensive_nn_functional_max_pool2d_cpu_int64 (__main__.TestInductorOpInfoCPU)": 836.9976806640625,
"test_comprehensive_nn_functional_max_pool2d_cuda_float16 (__main__.TestInductorOpInfoCUDA)": 914.9636637369791,
"test_comprehensive_nn_functional_max_pool2d_cuda_float32 (__main__.TestInductorOpInfoCUDA)": 865.170664469401,
"test_comprehensive_nn_functional_max_pool2d_cuda_float64 (__main__.TestInductorOpInfoCUDA)": 921.9736531575521,
"test_comprehensive_nn_functional_max_pool3d_cuda_float64 (__main__.TestInductorOpInfoCUDA)": 61.38200124104818,
"test_comprehensive_nn_functional_max_unpool2d_cpu_float16 (__main__.TestInductorOpInfoCPU)": 194.47033182779947,
"test_comprehensive_nn_functional_max_unpool2d_cpu_float32 (__main__.TestInductorOpInfoCPU)": 201.79733276367188,
"test_comprehensive_nn_functional_max_unpool2d_cpu_float64 (__main__.TestInductorOpInfoCPU)": 196.93966674804688,
"test_comprehensive_nn_functional_max_unpool2d_cuda_float16 (__main__.TestInductorOpInfoCUDA)": 111.52166557312012,
"test_comprehensive_nn_functional_max_unpool2d_cuda_float32 (__main__.TestInductorOpInfoCUDA)": 113.46616617838542,
"test_comprehensive_nn_functional_max_unpool2d_cuda_float64 (__main__.TestInductorOpInfoCUDA)": 107.02900060017903,
"test_comprehensive_nn_functional_max_unpool3d_cpu_float16 (__main__.TestInductorOpInfoCPU)": 126.29766845703125,
"test_comprehensive_nn_functional_max_unpool3d_cpu_float32 (__main__.TestInductorOpInfoCPU)": 137.279665629069,
"test_comprehensive_nn_functional_max_unpool3d_cpu_float64 (__main__.TestInductorOpInfoCPU)": 156.32100423177084,
"test_comprehensive_nn_functional_pad_constant_cpu_float16 (__main__.TestInductorOpInfoCPU)": 68.2356669108073,
"test_comprehensive_nn_functional_pad_constant_cpu_float32 (__main__.TestInductorOpInfoCPU)": 68.04666392008464,
"test_comprehensive_nn_functional_pad_constant_cpu_float64 (__main__.TestInductorOpInfoCPU)": 72.65566762288411,
"test_comprehensive_nn_functional_pad_constant_cpu_int32 (__main__.TestInductorOpInfoCPU)": 71.84566497802734,
"test_comprehensive_nn_functional_pad_constant_cpu_int64 (__main__.TestInductorOpInfoCPU)": 67.30033365885417,
"test_comprehensive_nn_functional_poisson_nll_loss_cpu_float16 (__main__.TestInductorOpInfoCPU)": 116.07533264160156,
"test_comprehensive_nn_functional_poisson_nll_loss_cpu_float32 (__main__.TestInductorOpInfoCPU)": 121.11599985758464,
"test_comprehensive_nn_functional_poisson_nll_loss_cpu_float64 (__main__.TestInductorOpInfoCPU)": 126.1576639811198,
"test_comprehensive_nn_functional_poisson_nll_loss_cpu_int32 (__main__.TestInductorOpInfoCPU)": 111.02566528320312,
"test_comprehensive_nn_functional_poisson_nll_loss_cpu_int64 (__main__.TestInductorOpInfoCPU)": 110.67699940999348,
"test_comprehensive_nn_functional_unfold_cpu_bool (__main__.TestInductorOpInfoCPU)": 122.94300079345703,
"test_comprehensive_nn_functional_unfold_cpu_float16 (__main__.TestInductorOpInfoCPU)": 232.5183308919271,
"test_comprehensive_nn_functional_unfold_cpu_float32 (__main__.TestInductorOpInfoCPU)": 226.49100240071616,
"test_comprehensive_nn_functional_unfold_cpu_float64 (__main__.TestInductorOpInfoCPU)": 225.53233337402344,
"test_comprehensive_nn_functional_unfold_cuda_float16 (__main__.TestInductorOpInfoCUDA)": 80.8669999440511,
"test_comprehensive_nn_functional_unfold_cuda_float32 (__main__.TestInductorOpInfoCUDA)": 84.27566655476888,
"test_comprehensive_nn_functional_unfold_cuda_float64 (__main__.TestInductorOpInfoCUDA)": 78.59099960327148,
"test_comprehensive_ormqr_cuda_complex128 (__main__.TestDecompCUDA)": 97.90700022379558,
"test_comprehensive_ormqr_cuda_complex64 (__main__.TestDecompCUDA)": 116.58016713460286,
"test_comprehensive_ormqr_cuda_float32 (__main__.TestDecompCUDA)": 64.93249829610188,
"test_comprehensive_ormqr_cuda_float32 (__main__.TestInductorOpInfoCUDA)": 103.83033243815105,
"test_comprehensive_ormqr_cuda_float64 (__main__.TestDecompCUDA)": 61.22433217366537,
"test_comprehensive_ormqr_cuda_float64 (__main__.TestInductorOpInfoCUDA)": 95.78066635131836,
"test_comprehensive_svd_cuda_complex128 (__main__.TestDecompCUDA)": 68.0203348795573,
"test_comprehensive_svd_cuda_complex64 (__main__.TestDecompCUDA)": 67.12083435058594,
"test_cond_autograd_nested (__main__.TestControlFlow)": 86.52511257595486,
"test_constructor_autograd_SparseBSC_cuda (__main__.TestSparseAnyCUDA)": 124.19883473714192,
"test_constructor_autograd_SparseBSR_cuda (__main__.TestSparseAnyCUDA)": 124.81499989827473,
"test_constructor_autograd_SparseCSC_cuda (__main__.TestSparseAnyCUDA)": 96.18599955240886,
"test_constructor_autograd_SparseCSR_cuda (__main__.TestSparseAnyCUDA)": 80.51999982198079,
"test_conv1d_basic (__main__.TestXNNPACKConv1dTransformPass)": 281.4985597398546,
"test_conv1d_with_relu_fc (__main__.TestXNNPACKConv1dTransformPass)": 490.7274458143446,
"test_conv2d_unary_cpu_cpp_wrapper (__main__.TestCppWrapper)": 109.75666809082031,
"test_correctness_AdamW_use_closure_False_cuda_float32 (__main__.CompiledOptimizerParityTestsCUDA)": 65.37083371480306,
"test_correctness_AdamW_use_closure_True_cuda_float32 (__main__.CompiledOptimizerParityTestsCUDA)": 116.6316655476888,
"test_correctness_Adam_use_closure_False_cuda_float32 (__main__.CompiledOptimizerParityTestsCUDA)": 64.48250007629395,
"test_correctness_Adam_use_closure_True_cuda_float32 (__main__.CompiledOptimizerParityTestsCUDA)": 117.85650126139323,
"test_correctness_NAdam_use_closure_True_cuda_float32 (__main__.CompiledOptimizerParityTestsCUDA)": 68.24049949645996,
"test_correctness_RAdam_use_closure_True_cuda_float32 (__main__.CompiledOptimizerParityTestsCUDA)": 60.16349983215332,
"test_count_nonzero_all (__main__.TestBool)": 626.1464369032118,
"test_custom_module_lstm (__main__.TestQuantizedOps)": 652.5093282063802,
"test_ddp_uneven_inputs (__main__.TestDistBackendWithSpawn)": 187.38933286815882,
"test_dispatch_symbolic_meta_outplace_all_strides_nn_functional_gaussian_nll_loss_cuda_float32 (__main__.TestMetaCUDA)": 79.42466608683269,
"test_eig_check_magma_cuda_float32 (__main__.TestLinalgCUDA)": 160.03483472267786,
"test_error_detection_and_propagation (__main__.NcclErrorHandlingTest)": 68.09466552734375,
"test_fail_creation_ops.py (__main__.TestTyping)": 61.745555029975044,
"test_fail_torch_size.py (__main__.TestTyping)": 72.09073282877604,
"test_fn_fwgrad_bwgrad_cumprod_cuda_complex128 (__main__.TestFwdGradientsCUDA)": 83.79666646321614,
"test_fn_gradgrad_cumprod_cuda_complex128 (__main__.TestBwdGradientsCUDA)": 102.75433349609375,
"test_fn_gradgrad_map_nested_cpu_float64 (__main__.TestBwdGradientsCPU)": 81.12766520182292,
"test_fn_gradgrad_map_nested_cuda_float64 (__main__.TestBwdGradientsCUDA)": 60.80604753040132,
"test_fn_gradgrad_map_triple_nested_cpu_float64 (__main__.TestBwdGradientsCPU)": 555.7903238932291,
"test_fn_gradgrad_map_triple_nested_cuda_float64 (__main__.TestBwdGradientsCUDA)": 383.1684977213542,
"test_fuse_large_params_cpu (__main__.CpuTests)": 62.148888481987846,
"test_fuse_large_params_dynamic_shapes_cpu (__main__.DynamicShapesCodegenCpuTests)": 90.62955390082465,
"test_fuse_large_params_dynamic_shapes_cpu (__main__.DynamicShapesCpuTests)": 93.76555548773871,
"test_fuse_large_params_dynamic_shapes_cuda (__main__.DynamicShapesCodegenGPUTests)": 61.563334147135414,
"test_fuse_large_params_dynamic_shapes_cuda (__main__.DynamicShapesGPUTests)": 70.02099990844727,
"test_grad_nn_Transformer_cuda_float64 (__main__.TestModuleCUDA)": 88.94833374023438,
"test_gradgrad_nn_LSTM_eval_mode_cuda_float64 (__main__.TestModuleCUDA)": 96.77166748046875,
"test_gradgrad_nn_LSTM_train_mode_cuda_float64 (__main__.TestModuleCUDA)": 94.92766825358073,
"test_gradgrad_nn_TransformerDecoderLayer_cuda_float64 (__main__.TestModuleCUDA)": 188.36566670735678,
"test_gradgrad_nn_TransformerEncoder_eval_mode_cuda_float64 (__main__.TestModuleCUDA)": 111.22516632080078,
"test_gradgrad_nn_TransformerEncoder_train_mode_cuda_float64 (__main__.TestModuleCUDA)": 130.82799911499023,
"test_gradgrad_nn_Transformer_cuda_float64 (__main__.TestModuleCUDA)": 551.7034359886533,
"test_grid_sampler_2d_cpu (__main__.CpuHalideTests)": 185.3376668294271,
"test_group_norm (__main__.TestQuantizedOps)": 127.55677774217394,
"test_indexing (__main__.TestAutogradWithCompiledAutograd)": 60.10233349270291,
"test_indirect_device_assert (__main__.TritonCodeGenTests)": 206.19866434733072,
"test_inductor_no_recursionerror_on_for_loops_dynamic_shapes (__main__.DynamicShapesReproTests)": 69.05733447604709,
"test_inplace_gradgrad_cumprod_cuda_complex128 (__main__.TestBwdGradientsCUDA)": 120.87516657511394,
"test_inputs_overlapping_with_mutation_stress_dynamic_shapes (__main__.DynamicShapesAotAutogradFallbackTests)": 136.26755608452692,
"test_jit_cuda_archflags (__main__.TestCppExtensionJIT)": 110.98100026448567,
"test_linalg_solve_triangular_large_cuda_complex128 (__main__.TestLinalgCUDA)": 632.4976641337076,
"test_linalg_solve_triangular_large_cuda_complex64 (__main__.TestLinalgCUDA)": 77.85983276367188,
"test_linalg_solve_triangular_large_cuda_float64 (__main__.TestLinalgCUDA)": 80.80400117238362,
"test_linear (__main__.TestStaticQuantizedModule)": 184.62911393907336,
"test_linear_binary_cpp_wrapper (__main__.TestCppWrapper)": 64.92466862996419,
"test_linear_binary_dynamic_shapes_cpp_wrapper (__main__.DynamicShapesCppWrapperCpuTests)": 68.9913330078125,
"test_linear_relu (__main__.TestStaticQuantizedModule)": 61.6213057386663,
"test_lobpcg_ortho_cuda_float64 (__main__.TestLinalgCUDA)": 86.48916784922282,
"test_lstm_cpu (__main__.TestMkldnnCPU)": 74.93866475423177,
"test_many_overlapping_inputs_does_not_explode_guards_dynamic_shapes (__main__.DynamicShapesReproTests)": 107.84700096978082,
"test_matmul_small_brute_force_tunableop_cuda_float32 (__main__.TestLinalgCUDA)": 226.24600219726562,
"test_matmul_small_brute_force_tunableop_cuda_float64 (__main__.TestLinalgCUDA)": 73.07600021362305,
"test_max_autotune_cutlass_backend_addmm_dynamic_False_max_autotune_gemm_backends_ATen,Triton,CUTLASS (__main__.TestCutlassBackend)": 84.08666483561198,
"test_max_pool2d_with_indices_backward4_dynamic_shapes_cpu (__main__.DynamicShapesCodegenCpuTests)": 61.81711112128364,
"test_max_pool2d_with_indices_backward4_dynamic_shapes_cpu (__main__.DynamicShapesCpuTests)": 63.886444091796875,
"test_proper_exit (__main__.TestDataLoader)": 230.7673314412435,
"test_proper_exit (__main__.TestDataLoaderPersistentWorkers)": 231.44683074951172,
"test_put_cuda_uint8 (__main__.TestTorchDeviceTypeCUDA)": 122.29238058200905,
"test_python_ref_executor__refs_special_zeta_executor_aten_cuda_float64 (__main__.TestCommonCUDA)": 67.51911120944553,
"test_qat_conv2d_unary (__main__.TestQuantizePT2EX86Inductor)": 144.9381103515625,
"test_qat_conv_bn_fusion_no_conv_bias (__main__.TestQuantizePT2EQAT_ConvBn1d)": 60.54057139442081,
"test_qat_mobilenet_v2 (__main__.TestQuantizePT2EQATModels)": 118.08699883355035,
"test_qlinear_add_int8_mixed_bf16_use_relu_False_is_qat_False_is_dynamic_False (__main__.TestPatternMatcher)": 66.50499979654948,
"test_qlinear_add_int8_mixed_bf16_use_relu_False_is_qat_False_is_dynamic_True (__main__.TestPatternMatcher)": 64.51799901326497,
"test_qlinear_add_int8_mixed_bf16_use_relu_False_is_qat_True_is_dynamic_False (__main__.TestPatternMatcher)": 69.84199905395508,
"test_qlinear_add_int8_mixed_bf16_use_relu_False_is_qat_True_is_dynamic_True (__main__.TestPatternMatcher)": 63.13400141398112,
"test_qlinear_add_int8_mixed_bf16_use_relu_True_is_qat_False_is_dynamic_False (__main__.TestPatternMatcher)": 63.60199864705404,
"test_qlinear_add_int8_mixed_bf16_use_relu_True_is_qat_False_is_dynamic_True (__main__.TestPatternMatcher)": 63.15833282470703,
"test_qlinear_add_int8_mixed_bf16_use_relu_True_is_qat_True_is_dynamic_False (__main__.TestPatternMatcher)": 61.97133255004883,
"test_qlinear_add_int8_mixed_bf16_use_relu_True_is_qat_True_is_dynamic_True (__main__.TestPatternMatcher)": 64.73333358764648,
"test_quick_core_backward__unsafe_masked_index_cpu_float64 (__main__.TestDecompCPU)": 329.5066630045573,
"test_quick_core_backward__unsafe_masked_index_cuda_float64 (__main__.TestDecompCUDA)": 700.787851969401,
"test_quick_core_backward__unsafe_masked_index_put_accumulate_cpu_float64 (__main__.TestDecompCPU)": 558.64599609375,
"test_quick_core_backward__unsafe_masked_index_put_accumulate_cuda_float64 (__main__.TestDecompCUDA)": 1100.5410054524739,
"test_quick_core_backward_expand_copy_cuda_float64 (__main__.TestDecompCUDA)": 61.14266777038574,
"test_quick_core_backward_nn_functional_max_unpool3d_grad_cpu_float64 (__main__.TestDecompCPU)": 64.54199854532878,
"test_quick_core_backward_nn_functional_max_unpool3d_grad_cuda_float64 (__main__.TestDecompCUDA)": 208.8625005086263,
"test_quick_core_backward_roll_cpu_float64 (__main__.TestDecompCPU)": 82.12933349609375,
"test_quick_core_backward_roll_cuda_float64 (__main__.TestDecompCUDA)": 190.0106684366862,
"test_quick_core_backward_select_scatter_cuda_float64 (__main__.TestDecompCUDA)": 117.40333302815755,
"test_quick_core_backward_split_cuda_float64 (__main__.TestDecompCUDA)": 61.65533320109049,
"test_quick_core_backward_split_with_sizes_copy_cpu_float64 (__main__.TestDecompCPU)": 67.09733327229817,
"test_quick_core_backward_split_with_sizes_copy_cuda_float64 (__main__.TestDecompCUDA)": 131.47850036621094,
"test_quick_core_backward_std_cuda_float64 (__main__.TestDecompCUDA)": 85.52533340454102,
"test_replicatepad_64bit_indexing_cuda_float16 (__main__.TestNNDeviceTypeCUDA)": 65.21066792805989,
"test_rosenbrock_sparse_with_lrsched_False_SGD_cuda_float64 (__main__.TestOptimRenewedCUDA)": 74.87366692225139,
"test_rosenbrock_sparse_with_lrsched_True_SGD_cuda_float64 (__main__.TestOptimRenewedCUDA)": 115.06016937891643,
"test_save_load_large_string_attribute (__main__.TestSaveLoad)": 109.29100290934245,
"test_shuffler_iterdatapipe (__main__.IntegrationTestDataLoaderDataPipe)": 133.14933607313367,
"test_slow_tasks (__main__.TestFunctionalAutogradBenchmark)": 141.9941143459744,
"test_sum_all_cpu_float64 (__main__.TestReductionsCPU)": 247.04196393972745,
"test_svd_lowrank_cuda_complex128 (__main__.TestLinalgCUDA)": 184.8358294169108,
"test_terminate_handler_on_crash (__main__.TestTorch)": 100.0895553694831,
"test_terminate_signal (__main__.ForkTest)": 136.60211210780673,
"test_terminate_signal (__main__.ParallelForkServerShouldWorkTest)": 135.93655212471882,
"test_terminate_signal (__main__.SpawnTest)": 138.0366676648458,
"test_torchvision_smoke (__main__.TestTensorBoardPytorchGraph)": 102.0588902367486,
"test_train_parity_multi_group (__main__.TestFullyShard1DTrainingCore)": 123.50458236188085,
"test_triton_bsr_scatter_mm_blocksize_64_cuda_bfloat16 (__main__.TestSparseCompressedTritonKernelsCUDA)": 71.75666618347168,
"test_triton_bsr_scatter_mm_blocksize_64_cuda_float16 (__main__.TestSparseCompressedTritonKernelsCUDA)": 61.13249969482422,
"test_triton_bsr_scatter_mm_blocksize_64_cuda_float32 (__main__.TestSparseCompressedTritonKernelsCUDA)": 83.78299967447917,
"test_triton_bsr_softmax_cuda_bfloat16 (__main__.TestSparseCompressedTritonKernelsCUDA)": 160.55816777547201,
"test_triton_bsr_softmax_cuda_float16 (__main__.TestSparseCompressedTritonKernelsCUDA)": 145.50849787394205,
"test_triton_bsr_softmax_cuda_float32 (__main__.TestSparseCompressedTritonKernelsCUDA)": 116.74900182088216,
"test_unary_ops (__main__.TestTEFuserDynamic)": 172.8575553894043,
"test_unary_ops (__main__.TestTEFuserStatic)": 155.1940016216702,
"test_unwaited (__main__.CommTest)": 60.710333506266274,
"test_upsample_bicubic2d_cpu (__main__.CpuHalideTests)": 96.18333435058594,
"test_variant_consistency_jit_nn_functional_max_pool2d_cpu_float32 (__main__.TestJitCPU)": 88.48500061035156,
"test_variant_consistency_jit_nn_functional_max_pool2d_cuda_float32 (__main__.TestJitCUDA)": 75.4156665802002,
"test_vec_compare_op_cpu_only (__main__.CPUReproTests)": 64.22761005825467,
"test_vmapjvpvjp_diff_cuda_float32 (__main__.TestOperatorsCUDA)": 70.61666700575087,
"test_vmapjvpvjp_linalg_lu_solve_cuda_float32 (__main__.TestOperatorsCUDA)": 76.22133445739746,
"test_vmapjvpvjp_linalg_multi_dot_cuda_float32 (__main__.TestOperatorsCUDA)": 95.06100145975749,
"test_vmapjvpvjp_linalg_pinv_singular_cuda_float32 (__main__.TestOperatorsCUDA)": 66.50466728210449,
"test_vmapjvpvjp_linalg_solve_triangular_cuda_float32 (__main__.TestOperatorsCUDA)": 86.0706672668457,
"test_vmapjvpvjp_linalg_svd_cuda_float32 (__main__.TestOperatorsCUDA)": 83.06883366902669,
"test_vmapjvpvjp_max_pool2d_with_indices_backward_cpu_float32 (__main__.TestOperatorsCPU)": 86.38833363850911,
"test_vmapjvpvjp_max_pool2d_with_indices_backward_cuda_float32 (__main__.TestOperatorsCUDA)": 67.0398343404134,
"test_vmapjvpvjp_nn_functional_conv2d_cpu_float32 (__main__.TestOperatorsCPU)": 64.79333368937175,
"test_vmapjvpvjp_nn_functional_max_pool2d_cpu_float32 (__main__.TestOperatorsCPU)": 70.52966817220052,
"test_vmapjvpvjp_nn_functional_max_pool2d_cuda_float32 (__main__.TestOperatorsCUDA)": 76.59099833170573,
"test_vmapjvpvjp_svd_cuda_float32 (__main__.TestOperatorsCUDA)": 76.7548344930013,
"test_vmapjvpvjp_unbind_cpu_float32 (__main__.TestOperatorsCPU)": 65.50899887084961,
"test_vmapjvpvjp_unbind_cuda_float32 (__main__.TestOperatorsCUDA)": 86.91949971516927,
"test_vmapvjpvjp_meshgrid_list_of_tensors_cuda_float32 (__main__.TestOperatorsCUDA)": 174.04599571228027,
"test_vmapvjpvjp_meshgrid_variadic_tensors_cuda_float32 (__main__.TestOperatorsCUDA)": 72.79299926757812,
"test_vmapvjpvjp_nn_functional_bilinear_cuda_float32 (__main__.TestOperatorsCUDA)": 131.72166697184244
}