forked from pytorch/pytorch
-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathslow_tests.json
More file actions
277 lines (277 loc) · 29.3 KB
/
Copy pathslow_tests.json
File metadata and controls
277 lines (277 loc) · 29.3 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
{
"EndToEndLSTM (__main__.RNNTest)": 193.73400370279947,
"MultiheadAttention (__main__.ModulesTest)": 144.85599772135416,
"test_3mm_add (__main__.TestTritonDotReduction)": 129.92483266194662,
"test__adaptive_avg_pool2d (__main__.CPUReproTests)": 90.46566390991211,
"test_aot_autograd_disable_functionalization_exhaustive_nn_functional_max_pool2d_cpu_float32 (__main__.TestEagerFusionOpInfoCPU)": 77.86966705322266,
"test_aot_autograd_disable_functionalization_symbolic_exhaustive_nn_functional_max_pool1d_cpu_float32 (__main__.TestEagerFusionOpInfoCPU)": 127.5673319498698,
"test_aot_autograd_disable_functionalization_symbolic_exhaustive_nn_functional_max_pool2d_cpu_float32 (__main__.TestEagerFusionOpInfoCPU)": 204.36866760253906,
"test_aot_autograd_disable_functionalization_symbolic_exhaustive_nn_functional_max_pool3d_cpu_float32 (__main__.TestEagerFusionOpInfoCPU)": 123.83066304524739,
"test_aot_autograd_disable_functionalization_symbolic_exhaustive_svd_cpu_float32 (__main__.TestEagerFusionOpInfoCPU)": 66.83466720581055,
"test_aot_autograd_exhaustive_nn_functional_max_pool2d_cpu_float32 (__main__.TestEagerFusionOpInfoCPU)": 72.18625852796767,
"test_aot_autograd_symbolic_exhaustive_linalg_svd_cpu_float32 (__main__.TestEagerFusionOpInfoCPU)": 77.01166534423828,
"test_aot_autograd_symbolic_exhaustive_masked_norm_cpu_float32 (__main__.TestEagerFusionOpInfoCPU)": 62.44844436645508,
"test_aot_autograd_symbolic_exhaustive_nn_functional_max_pool1d_cpu_float32 (__main__.TestEagerFusionOpInfoCPU)": 156.3863321940104,
"test_aot_autograd_symbolic_exhaustive_nn_functional_max_pool2d_cpu_float32 (__main__.TestEagerFusionOpInfoCPU)": 203.4173329671224,
"test_aot_autograd_symbolic_exhaustive_nn_functional_max_pool3d_cpu_float32 (__main__.TestEagerFusionOpInfoCPU)": 105.20900217692058,
"test_aot_autograd_symbolic_exhaustive_nn_functional_unfold_cpu_float32 (__main__.TestEagerFusionOpInfoCPU)": 65.38600158691406,
"test_aot_autograd_symbolic_exhaustive_ormqr_cpu_float32 (__main__.TestEagerFusionOpInfoCPU)": 83.66033426920573,
"test_aot_autograd_symbolic_exhaustive_svd_cpu_float32 (__main__.TestEagerFusionOpInfoCPU)": 101.71733093261719,
"test_aot_autograd_symbolic_module_exhaustive_nn_TransformerDecoderLayer_cpu_float32 (__main__.TestEagerFusionModuleInfoCPU)": 127.03733317057292,
"test_associative_scan_partial_grad_combine_mode_generic_compile_mode_compile_dynamic_shape_reverse_False_cpu (__main__.AssociativeScanTests)": 88.39666748046875,
"test_associative_scan_partial_grad_combine_mode_generic_compile_mode_compile_dynamic_shape_reverse_True_cpu (__main__.AssociativeScanTests)": 102.40783437093098,
"test_avg_pool3d_backward2_cpu (__main__.CpuTests)": 763.9162445068359,
"test_avg_pool3d_backward2_cuda (__main__.GPUTests)": 152.19875049591064,
"test_avg_pool3d_backward2_dynamic_shapes_cpu (__main__.DynamicShapesCodegenCpuTests)": 514.7272237141927,
"test_avg_pool3d_backward2_dynamic_shapes_cpu (__main__.DynamicShapesCpuTests)": 520.711890326606,
"test_avg_pool3d_backward2_dynamic_shapes_cuda (__main__.DynamicShapesCodegenGPUTests)": 64.15366808573405,
"test_avg_pool3d_backward2_dynamic_shapes_cuda (__main__.DynamicShapesGPUTests)": 128.34783426920572,
"test_backward_nn_functional_multi_head_attention_forward_cpu_float32 (__main__.TestCompositeComplianceCPU)": 71.84533437093098,
"test_backward_nn_functional_multi_head_attention_forward_cuda_float32 (__main__.TestCompositeComplianceCUDA)": 64.79450035095215,
"test_baddmm_search_space_EXHAUSTIVE (__main__.TestMaxAutotune)": 112.79600016276042,
"test_basic_cpu (__main__.EfficientConvBNEvalCpuTests)": 226.9800008138021,
"test_basic_cuda (__main__.EfficientConvBNEvalGpuTests)": 173.3750025431315,
"test_cat_2k_args (__main__.TestTEFuserDynamic)": 131.654914483428,
"test_checkpointing_without_reentrant_input_requires_grad_False (__main__.TestAutogradWithCompiledAutograd)": 347.29089016384546,
"test_checkpointing_without_reentrant_input_requires_grad_True (__main__.TestAutogradWithCompiledAutograd)": 448.10833062065973,
"test_collect_callgrind (__main__.TestBenchmarkUtils)": 285.1102227105035,
"test_compiled_dtensor_op_db_nn_functional_max_pool2d_cpu_float32 (__main__.TestCompiledDTensorOpsCPU)": 92.9769999186198,
"test_compiled_dtensor_op_db_nn_functional_poisson_nll_loss_cpu_float32 (__main__.TestCompiledDTensorOpsCPU)": 64.3003323872884,
"test_comprehensive_diff_cuda_complex128 (__main__.TestDecompCUDA)": 100.02783330281575,
"test_comprehensive_diff_cuda_complex64 (__main__.TestDecompCUDA)": 97.7408332824707,
"test_comprehensive_diff_cuda_float32 (__main__.TestDecompCUDA)": 67.63183339436848,
"test_comprehensive_diff_cuda_float64 (__main__.TestDecompCUDA)": 66.48316637674968,
"test_comprehensive_grid_sampler_2d_cpu_bfloat16 (__main__.TestDecompCPU)": 89.89199829101562,
"test_comprehensive_grid_sampler_2d_cpu_float16 (__main__.TestDecompCPU)": 90.3046646118164,
"test_comprehensive_grid_sampler_2d_cpu_float32 (__main__.TestDecompCPU)": 432.8856608072917,
"test_comprehensive_grid_sampler_2d_cpu_float64 (__main__.TestDecompCPU)": 431.4099934895833,
"test_comprehensive_grid_sampler_2d_cuda_bfloat16 (__main__.TestDecompCUDA)": 244.3134994506836,
"test_comprehensive_grid_sampler_2d_cuda_float16 (__main__.TestDecompCUDA)": 277.8193359375,
"test_comprehensive_grid_sampler_2d_cuda_float32 (__main__.TestDecompCUDA)": 1243.374491373698,
"test_comprehensive_grid_sampler_2d_cuda_float32 (__main__.TestInductorOpInfoCUDA)": 71.73899968465169,
"test_comprehensive_grid_sampler_2d_cuda_float64 (__main__.TestDecompCUDA)": 1143.0853271484375,
"test_comprehensive_grid_sampler_2d_cuda_float64 (__main__.TestInductorOpInfoCUDA)": 75.46933364868164,
"test_comprehensive_linalg_lu_cuda_float32 (__main__.TestInductorOpInfoCUDA)": 66.4915000597636,
"test_comprehensive_linalg_lu_cuda_float64 (__main__.TestInductorOpInfoCUDA)": 67.09683386484782,
"test_comprehensive_linalg_lu_factor_cuda_float64 (__main__.TestInductorOpInfoCUDA)": 62.22633425394694,
"test_comprehensive_linalg_lu_factor_ex_cuda_float32 (__main__.TestInductorOpInfoCUDA)": 62.32066790262858,
"test_comprehensive_linalg_lu_factor_ex_cuda_float64 (__main__.TestInductorOpInfoCUDA)": 62.156500498453774,
"test_comprehensive_linalg_lu_solve_cuda_float32 (__main__.TestInductorOpInfoCUDA)": 80.1408322652181,
"test_comprehensive_linalg_lu_solve_cuda_float64 (__main__.TestInductorOpInfoCUDA)": 79.4061648050944,
"test_comprehensive_linalg_matrix_norm_cuda_float32 (__main__.TestInductorOpInfoCUDA)": 95.98250071207683,
"test_comprehensive_linalg_matrix_norm_cuda_float64 (__main__.TestInductorOpInfoCUDA)": 94.55149968465169,
"test_comprehensive_linalg_norm_cuda_float16 (__main__.TestInductorOpInfoCUDA)": 98.94500128428142,
"test_comprehensive_linalg_norm_cuda_float32 (__main__.TestInductorOpInfoCUDA)": 115.80650011698405,
"test_comprehensive_linalg_norm_cuda_float64 (__main__.TestInductorOpInfoCUDA)": 115.1416654586792,
"test_comprehensive_linalg_norm_subgradients_at_zero_cuda_float16 (__main__.TestInductorOpInfoCUDA)": 87.03200038274129,
"test_comprehensive_linalg_norm_subgradients_at_zero_cuda_float32 (__main__.TestInductorOpInfoCUDA)": 110.46916611989339,
"test_comprehensive_linalg_norm_subgradients_at_zero_cuda_float64 (__main__.TestInductorOpInfoCUDA)": 111.24783261617024,
"test_comprehensive_linalg_solve_triangular_cuda_float32 (__main__.TestInductorOpInfoCUDA)": 83.31766764322917,
"test_comprehensive_linalg_solve_triangular_cuda_float64 (__main__.TestInductorOpInfoCUDA)": 80.25166447957356,
"test_comprehensive_linalg_svd_cuda_complex128 (__main__.TestDecompCUDA)": 69.97166570027669,
"test_comprehensive_linalg_svd_cuda_complex64 (__main__.TestDecompCUDA)": 68.84450022379558,
"test_comprehensive_linalg_svd_cuda_float32 (__main__.TestInductorOpInfoCUDA)": 96.60883108774821,
"test_comprehensive_linalg_svd_cuda_float64 (__main__.TestInductorOpInfoCUDA)": 93.79333368937175,
"test_comprehensive_linalg_vector_norm_cuda_float32 (__main__.TestInductorOpInfoCUDA)": 256.18433062235516,
"test_comprehensive_linalg_vector_norm_cuda_float64 (__main__.TestInductorOpInfoCUDA)": 248.46516863505045,
"test_comprehensive_logspace_cuda_float32 (__main__.TestInductorOpInfoCUDA)": 74.78166580200195,
"test_comprehensive_logspace_cuda_float64 (__main__.TestInductorOpInfoCUDA)": 69.59733327229817,
"test_comprehensive_masked_norm_cuda_float16 (__main__.TestInductorOpInfoCUDA)": 117.71599960327148,
"test_comprehensive_masked_norm_cuda_float32 (__main__.TestInductorOpInfoCUDA)": 113.31033579508464,
"test_comprehensive_masked_norm_cuda_float64 (__main__.TestInductorOpInfoCUDA)": 114.37183252970378,
"test_comprehensive_max_pool2d_with_indices_backward_cpu_float64 (__main__.TestDecompCPU)": 64.0938326517741,
"test_comprehensive_nn_functional_conv_transpose3d_cuda_complex128 (__main__.TestDecompCUDA)": 63.42050043741862,
"test_comprehensive_nn_functional_conv_transpose3d_cuda_complex64 (__main__.TestDecompCUDA)": 63.77633285522461,
"test_comprehensive_nn_functional_gaussian_nll_loss_cpu_float32 (__main__.TestDecompCPU)": 61.52166620890299,
"test_comprehensive_nn_functional_gaussian_nll_loss_cuda_float32 (__main__.TestDecompCUDA)": 118.71116765340169,
"test_comprehensive_nn_functional_gaussian_nll_loss_cuda_float64 (__main__.TestDecompCUDA)": 125.97533289591472,
"test_comprehensive_nn_functional_grid_sample_cpu_float32 (__main__.TestDecompCPU)": 110.10399881998698,
"test_comprehensive_nn_functional_grid_sample_cpu_float64 (__main__.TestDecompCPU)": 119.12533315022786,
"test_comprehensive_nn_functional_grid_sample_cuda_bfloat16 (__main__.TestDecompCUDA)": 63.85616683959961,
"test_comprehensive_nn_functional_grid_sample_cuda_float32 (__main__.TestDecompCUDA)": 263.6338348388672,
"test_comprehensive_nn_functional_grid_sample_cuda_float64 (__main__.TestDecompCUDA)": 260.0433349609375,
"test_comprehensive_nn_functional_interpolate_bicubic_cuda_float32 (__main__.TestDecompCUDA)": 80.7168337504069,
"test_comprehensive_nn_functional_interpolate_bicubic_cuda_float32 (__main__.TestInductorOpInfoCUDA)": 83.66033426920573,
"test_comprehensive_nn_functional_interpolate_bicubic_cuda_float64 (__main__.TestDecompCUDA)": 78.34583409627278,
"test_comprehensive_nn_functional_interpolate_bicubic_cuda_float64 (__main__.TestInductorOpInfoCUDA)": 83.96233240763347,
"test_comprehensive_nn_functional_interpolate_trilinear_cuda_float32 (__main__.TestDecompCUDA)": 120.8836669921875,
"test_comprehensive_nn_functional_interpolate_trilinear_cuda_float64 (__main__.TestDecompCUDA)": 124.52166748046875,
"test_comprehensive_nn_functional_max_pool2d_cuda_float16 (__main__.TestInductorOpInfoCUDA)": 819.3448282877604,
"test_comprehensive_nn_functional_max_pool2d_cuda_float32 (__main__.TestInductorOpInfoCUDA)": 800.9398295084635,
"test_comprehensive_nn_functional_max_pool2d_cuda_float64 (__main__.TestInductorOpInfoCUDA)": 798.9723409016927,
"test_comprehensive_nn_functional_max_pool3d_cuda_float32 (__main__.TestInductorOpInfoCUDA)": 650.4093424479166,
"test_comprehensive_nn_functional_max_pool3d_cuda_float64 (__main__.TestInductorOpInfoCUDA)": 672.7261657714844,
"test_comprehensive_nn_functional_max_unpool2d_cuda_float16 (__main__.TestInductorOpInfoCUDA)": 70.85333506266277,
"test_comprehensive_nn_functional_max_unpool2d_cuda_float32 (__main__.TestInductorOpInfoCUDA)": 73.07083384195964,
"test_comprehensive_nn_functional_max_unpool2d_cuda_float64 (__main__.TestInductorOpInfoCUDA)": 73.60183334350586,
"test_comprehensive_ormqr_cpu_complex128 (__main__.TestDecompCPU)": 63.091583251953125,
"test_comprehensive_ormqr_cuda_complex128 (__main__.TestDecompCUDA)": 119.43050130208333,
"test_comprehensive_ormqr_cuda_complex64 (__main__.TestDecompCUDA)": 129.18349838256836,
"test_comprehensive_ormqr_cuda_float32 (__main__.TestDecompCUDA)": 73.39383252461751,
"test_comprehensive_ormqr_cuda_float32 (__main__.TestInductorOpInfoCUDA)": 77.46083196004231,
"test_comprehensive_ormqr_cuda_float64 (__main__.TestDecompCUDA)": 100.95350011189778,
"test_comprehensive_ormqr_cuda_float64 (__main__.TestInductorOpInfoCUDA)": 76.22900009155273,
"test_comprehensive_svd_cuda_complex128 (__main__.TestDecompCUDA)": 76.60616556803386,
"test_comprehensive_svd_cuda_complex64 (__main__.TestDecompCUDA)": 72.88816579182942,
"test_comprehensive_svd_lowrank_cuda_complex128 (__main__.TestDecompCUDA)": 66.14150047302246,
"test_comprehensive_svd_lowrank_cuda_complex64 (__main__.TestDecompCUDA)": 71.52549870808919,
"test_constructor_autograd_SparseBSC_cuda (__main__.TestSparseAnyCUDA)": 103.31566747029622,
"test_constructor_autograd_SparseBSR_cuda (__main__.TestSparseAnyCUDA)": 90.61466598510742,
"test_conv1d_basic (__main__.TestXNNPACKConv1dTransformPass)": 85.5044453938802,
"test_conv1d_with_relu_fc (__main__.TestXNNPACKConv1dTransformPass)": 186.80122545030383,
"test_conv2d_binary_broadcast_shapes_cpu (__main__.TestPatternMatcherGenericCPU)": 73.75333404541016,
"test_conv3d_binary_broadcast_shapes_cpu (__main__.TestPatternMatcherGenericCPU)": 165.67066955566406,
"test_conv3d_binary_dynamic_shapes_cpu (__main__.TestDynamicPatternMatcherGenericCPU)": 69.34033330281575,
"test_conv3d_unary_dynamic_shapes_cpu (__main__.TestDynamicPatternMatcherGenericCPU)": 73.0816667344835,
"test_conv_bn_fuse_cpu (__main__.CpuTests)": 62.08125019073486,
"test_conv_unary_fusion_nnc (__main__.TestMkldnnFusion)": 82.00311109754774,
"test_correctness_AdamW_use_closure_True_cuda_float32 (__main__.CompiledOptimizerParityTestsCUDA)": 89.69633356730144,
"test_correctness_Adam_use_closure_True_cuda_float32 (__main__.CompiledOptimizerParityTestsCUDA)": 88.30749893188477,
"test_count_nonzero_all (__main__.TestBool)": 654.9627821180555,
"test_create_rand_mask_from_inputs_dynamic_shapes (__main__.DynamicShapesReproTests)": 92.5728333791097,
"test_dijkstra_expand_single_dim_strategy_to_mesh_hard_4d (__main__.TestDijkstraExpandSingleDimStrategy)": 303.05066935221356,
"test_dispatch_symbolic_meta_outplace_all_strides_nn_functional_gaussian_nll_loss_cuda_float32 (__main__.TestMetaCUDA)": 95.07450103759766,
"test_dtensor_op_db__native_batch_norm_legit_cpu_float32 (__main__.TestMultiThreadedDTensorOpsCPU)": 172.50000508626303,
"test_dtensor_op_db_native_batch_norm_cpu_float32 (__main__.TestMultiThreadedDTensorOpsCPU)": 200.29400126139322,
"test_dtensor_op_db_nn_functional_batch_norm_cpu_float32 (__main__.TestMultiThreadedDTensorOpsCPU)": 199.36066691080728,
"test_dtensor_op_db_nn_functional_binary_cross_entropy_with_logits_cpu_float32 (__main__.TestMultiThreadedDTensorOpsCPU)": 183.6556650797526,
"test_eager_sequence_nr_dynamic_shapes (__main__.DynamicShapesAotAutogradFallbackTests)": 195.9025821685791,
"test_fail_arithmetic_ops.py (__main__.TestTyping)": 85.94689008924696,
"test_fail_random.py (__main__.TestTyping)": 363.56556599934896,
"test_fail_torch_size.py (__main__.TestTyping)": 114.58616725787675,
"test_fn_fwgrad_bwgrad_cumprod_cuda_complex128 (__main__.TestFwdGradientsCUDA)": 83.33750025431316,
"test_fn_gradgrad_cumprod_cuda_complex128 (__main__.TestBwdGradientsCUDA)": 103.71716690063477,
"test_fuse_large_params_cpu (__main__.CpuTests)": 92.53525161743164,
"test_fuse_large_params_cuda (__main__.GPUTests)": 62.06562566757202,
"test_fuse_large_params_dynamic_shapes_cpu (__main__.DynamicShapesCodegenCpuTests)": 156.92011176215277,
"test_fuse_large_params_dynamic_shapes_cpu (__main__.DynamicShapesCpuTests)": 158.4638909233941,
"test_fuse_large_params_dynamic_shapes_cuda (__main__.DynamicShapesCodegenGPUTests)": 135.43400065104166,
"test_fuse_large_params_dynamic_shapes_cuda (__main__.DynamicShapesGPUTests)": 132.73733266194662,
"test_grad_nn_Transformer_cpu_float64 (__main__.TestModuleCPU)": 84.30703392028809,
"test_grad_nn_Transformer_cuda_float64 (__main__.TestModuleCUDA)": 80.69633356730144,
"test_gradgrad_nn_TransformerDecoderLayer_cuda_float64 (__main__.TestModuleCUDA)": 190.28999837239584,
"test_gradgrad_nn_TransformerEncoder_eval_mode_cuda_float64 (__main__.TestModuleCUDA)": 113.35149892171223,
"test_gradgrad_nn_TransformerEncoder_train_mode_cuda_float64 (__main__.TestModuleCUDA)": 123.2726656595866,
"test_gradgrad_nn_Transformer_cuda_float64 (__main__.TestModuleCUDA)": 494.573003133138,
"test_graph_based_redistribute_cost (__main__.DistributeWithDeviceOrderTest)": 67.4446652730306,
"test_graph_based_redistribute_cost (__main__.DistributeWithDeviceOrderTestWithLocalTensor)": 62.11899948120117,
"test_indirect_device_assert (__main__.TritonCodeGenTests)": 325.7254994710286,
"test_inplace_gradgrad_cumprod_cuda_complex128 (__main__.TestBwdGradientsCUDA)": 83.06583404541016,
"test_inputs_overlapping_with_mutation_stress_dynamic_shapes (__main__.DynamicShapesAotAutogradFallbackTests)": 122.00066714816623,
"test_jit_cuda_archflags (__main__.TestCppExtensionJIT)": 86.76616668701172,
"test_linalg_solve_triangular_large_cuda_complex128 (__main__.TestLinalgCUDA)": 1066.7661743164062,
"test_linalg_solve_triangular_large_cuda_complex64 (__main__.TestLinalgCUDA)": 72.56916681925456,
"test_linalg_solve_triangular_large_cuda_float64 (__main__.TestLinalgCUDA)": 151.44950103759766,
"test_linear_binary_cpp_wrapper (__main__.TestCppWrapper)": 140.42566935221353,
"test_linear_binary_dynamic_shapes_cpp_wrapper (__main__.DynamicShapesCppWrapperCpuTests)": 150.54800160725912,
"test_longformer_chunk_dynamic_shapes (__main__.DynamicShapesReproTests)": 104.55644395616319,
"test_low_memory_max_pool_dilation_1_dim_3_use_block_ptr_False_cpu_halide (__main__.HalideCpuTests)": 583.5033365885416,
"test_low_memory_max_pool_dilation_2_dim_3_use_block_ptr_False_cpu_halide (__main__.HalideCpuTests)": 516.3889973958334,
"test_lstm_cpu (__main__.TestMkldnnCPU)": 68.73433176676433,
"test_many_overlapping_inputs_does_not_explode_guards_dynamic_shapes (__main__.DynamicShapesReproTests)": 108.97577582465277,
"test_max_autotune_remote_caching_dynamic_True (__main__.TestMaxAutotuneRemoteCache)": 61.8836669921875,
"test_memory_format_operators_cuda (__main__.TestTorchDeviceTypeCUDA)": 125.83300018310547,
"test_ops_composition_names_cpu (__main__.TestTestParametrizationDeviceTypeCPU)": 157.14929997324944,
"test_ops_decorator_applies_op_and_param_specific_decorators_cpu (__main__.TestTestParametrizationDeviceTypeCPU)": 189.11739701827366,
"test_pattern_matcher_multi_user_cpu (__main__.CpuTritonTests)": 143.3016611735026,
"test_pq_vs_full_expansion_data_driven (__main__.TestDijkstraExpandSingleDimStrategy)": 881.4066772460938,
"test_proper_exit (__main__.TestDataLoader)": 219.32978057861328,
"test_proper_exit (__main__.TestDataLoaderPersistentWorkers)": 229.30333031548395,
"test_python_ref__refs_special_zeta_cuda_float64 (__main__.TestCommonCUDA)": 74.98866653442383,
"test_python_ref_executor__refs_special_zeta_executor_aten_cuda_float64 (__main__.TestCommonCUDA)": 89.93916702270508,
"test_quick_core_backward__unsafe_masked_index_cpu_float64 (__main__.TestDecompCPU)": 556.7093302408854,
"test_quick_core_backward__unsafe_masked_index_cuda_float64 (__main__.TestDecompCUDA)": 1110.48583984375,
"test_quick_core_backward__unsafe_masked_index_put_accumulate_cpu_float64 (__main__.TestDecompCPU)": 813.156005859375,
"test_quick_core_backward__unsafe_masked_index_put_accumulate_cuda_float64 (__main__.TestDecompCUDA)": 1398.7890014648438,
"test_quick_core_backward_nn_functional_max_unpool3d_grad_cpu_float64 (__main__.TestDecompCPU)": 84.88433329264323,
"test_quick_core_backward_nn_functional_max_unpool3d_grad_cuda_float64 (__main__.TestDecompCUDA)": 268.56183369954425,
"test_quick_core_backward_roll_cpu_float64 (__main__.TestDecompCPU)": 127.7530008951823,
"test_quick_core_backward_roll_cuda_float64 (__main__.TestDecompCUDA)": 241.10733795166016,
"test_quick_core_backward_select_scatter_cpu_float64 (__main__.TestDecompCPU)": 77.3393325805664,
"test_quick_core_backward_select_scatter_cuda_float64 (__main__.TestDecompCUDA)": 143.2455037434896,
"test_quick_core_backward_split_cuda_float64 (__main__.TestDecompCUDA)": 69.18416849772136,
"test_quick_core_backward_split_with_sizes_copy_cpu_float64 (__main__.TestDecompCPU)": 105.94433339436848,
"test_quick_core_backward_split_with_sizes_copy_cuda_float64 (__main__.TestDecompCUDA)": 174.2881647745768,
"test_quick_core_backward_std_cpu_float64 (__main__.TestDecompCPU)": 77.57733408610027,
"test_quick_core_backward_std_cuda_float64 (__main__.TestDecompCUDA)": 158.21883392333984,
"test_register_spills_cuda (__main__.BenchmarkFusionGpuTest)": 108.23566563924153,
"test_resize_as_cuda (__main__.GPUTests)": 89.16333452860515,
"test_resize_cuda (__main__.GPUTests)": 67.50366735458374,
"test_reveal_opt_size.py (__main__.TestTyping)": 60.49586756983772,
"test_run2run_determinism_model_name_BertForMaskedLM_training_or_inference_inference_precision_amp (__main__.DeterministicTest)": 104.33299763997395,
"test_run2run_determinism_model_name_BertForMaskedLM_training_or_inference_inference_precision_bfloat16 (__main__.DeterministicTest)": 64.46683311462402,
"test_run2run_determinism_model_name_BertForMaskedLM_training_or_inference_training_precision_amp (__main__.DeterministicTest)": 198.3463338216146,
"test_run2run_determinism_model_name_BertForMaskedLM_training_or_inference_training_precision_bfloat16 (__main__.DeterministicTest)": 153.71866353352866,
"test_run2run_determinism_model_name_BertForMaskedLM_training_or_inference_training_precision_float16 (__main__.DeterministicTest)": 167.72516632080078,
"test_run2run_determinism_model_name_BertForMaskedLM_training_or_inference_training_precision_float32 (__main__.DeterministicTest)": 188.2213338216146,
"test_run2run_determinism_model_name_DistillGPT2_training_or_inference_training_precision_amp (__main__.DeterministicTest)": 82.31683349609375,
"test_run2run_determinism_model_name_DistillGPT2_training_or_inference_training_precision_bfloat16 (__main__.DeterministicTest)": 115.22916666666667,
"test_run2run_determinism_model_name_DistillGPT2_training_or_inference_training_precision_float16 (__main__.DeterministicTest)": 84.5586649576823,
"test_run2run_determinism_model_name_DistillGPT2_training_or_inference_training_precision_float32 (__main__.DeterministicTest)": 122.09583409627278,
"test_run2run_determinism_model_name_GoogleFnet_training_or_inference_training_precision_amp (__main__.DeterministicTest)": 95.04883448282878,
"test_run2run_determinism_model_name_GoogleFnet_training_or_inference_training_precision_bfloat16 (__main__.DeterministicTest)": 94.20300165812175,
"test_run2run_determinism_model_name_GoogleFnet_training_or_inference_training_precision_float16 (__main__.DeterministicTest)": 118.3158327738444,
"test_run2run_determinism_model_name_GoogleFnet_training_or_inference_training_precision_float32 (__main__.DeterministicTest)": 119.6198336283366,
"test_runtime_checks_large_cpu (__main__.AOTInductorTestABICompatibleCpu)": 70.40016682942708,
"test_runtime_checks_large_cpu_with_stack_allocation (__main__.AOTInductorTestABICompatibleCpuWithStackAllocation)": 70.30955590142145,
"test_runtime_checks_large_cuda (__main__.AOTInductorTestABICompatibleGpu)": 171.0409952799479,
"test_sdpa_kernel_ctx_manager2_dynamic_shapes (__main__.DynamicShapesCtxManagerTests)": 106.9195556640625,
"test_searchsorted_cuda (__main__.GPUTests)": 82.54333392779033,
"test_shared_memory_pruning_addmm_bfloat16_mat1_transposed_False_mat2_transposed_False_use_tma_False (__main__.TestTemplateConfigPruning)": 143.74433390299478,
"test_shared_memory_pruning_addmm_bfloat16_mat1_transposed_False_mat2_transposed_True_use_tma_False (__main__.TestTemplateConfigPruning)": 143.3086675008138,
"test_shared_memory_pruning_addmm_bfloat16_mat1_transposed_True_mat2_transposed_False_use_tma_False (__main__.TestTemplateConfigPruning)": 143.81799825032553,
"test_shared_memory_pruning_addmm_bfloat16_mat1_transposed_True_mat2_transposed_True_use_tma_False (__main__.TestTemplateConfigPruning)": 144.1403350830078,
"test_shared_memory_pruning_addmm_float32_mat1_transposed_False_mat2_transposed_False_use_tma_False (__main__.TestTemplateConfigPruning)": 153.8959986368815,
"test_shared_memory_pruning_addmm_float32_mat1_transposed_False_mat2_transposed_True_use_tma_False (__main__.TestTemplateConfigPruning)": 159.3713353474935,
"test_shared_memory_pruning_addmm_float32_mat1_transposed_True_mat2_transposed_False_use_tma_False (__main__.TestTemplateConfigPruning)": 151.32366689046225,
"test_shared_memory_pruning_addmm_float32_mat1_transposed_True_mat2_transposed_True_use_tma_False (__main__.TestTemplateConfigPruning)": 151.53400166829428,
"test_shared_memory_pruning_mm_bfloat16_mat1_transposed_False_mat2_transposed_False_use_tma_False (__main__.TestTemplateConfigPruning)": 137.7143351236979,
"test_shared_memory_pruning_mm_bfloat16_mat1_transposed_False_mat2_transposed_True_use_tma_False (__main__.TestTemplateConfigPruning)": 137.6969985961914,
"test_shared_memory_pruning_mm_bfloat16_mat1_transposed_True_mat2_transposed_False_use_tma_False (__main__.TestTemplateConfigPruning)": 139.831662495931,
"test_shared_memory_pruning_mm_bfloat16_mat1_transposed_True_mat2_transposed_True_use_tma_False (__main__.TestTemplateConfigPruning)": 138.6189982096354,
"test_shared_memory_pruning_mm_float32_mat1_transposed_False_mat2_transposed_False_use_tma_False (__main__.TestTemplateConfigPruning)": 149.81566874186197,
"test_shared_memory_pruning_mm_float32_mat1_transposed_False_mat2_transposed_True_use_tma_False (__main__.TestTemplateConfigPruning)": 154.44766743977866,
"test_shared_memory_pruning_mm_float32_mat1_transposed_True_mat2_transposed_False_use_tma_False (__main__.TestTemplateConfigPruning)": 146.81933085123697,
"test_shared_memory_pruning_mm_float32_mat1_transposed_True_mat2_transposed_True_use_tma_False (__main__.TestTemplateConfigPruning)": 147.39400227864584,
"test_shuffler_iterdatapipe (__main__.IntegrationTestDataLoaderDataPipe)": 122.32033454047308,
"test_slow_tasks (__main__.TestFunctionalAutogradBenchmark)": 124.18311055501302,
"test_softmax_cpu_float64 (__main__.TestSparseCPU)": 60.396761218706764,
"test_sort_bool_cpu (__main__.CpuTritonTests)": 348.36634318033856,
"test_sort_dynamic_shape_with_check_cuda (__main__.TestInductorDynamicCUDA)": 112.24066670735677,
"test_sort_stable_cuda (__main__.GPUTests)": 126.56412506103516,
"test_sort_transpose_cpu (__main__.CpuTritonTests)": 376.54832967122394,
"test_svd_lowrank_cuda_complex128 (__main__.TestLinalgCUDA)": 327.46799723307294,
"test_tensorwise_scaling_acceptable_input_dims_M_1024_K_1024_N_2048_persistent_matmul_False_cpu (__main__.TestFP8LoweringCPU)": 75.4329337477684,
"test_terminate_handler_on_crash (__main__.TestTorch)": 207.00677956475153,
"test_terminate_signal (__main__.ForkTest)": 232.13122049967447,
"test_terminate_signal (__main__.ParallelForkServerShouldWorkTest)": 232.00266604953342,
"test_terminate_signal (__main__.SpawnTest)": 222.40377510918512,
"test_torch_size_tensor_index_scalar_constant_dynamic_shapes (__main__.DynamicShapesMiscTests)": 601.1639200846354,
"test_train_parity_multi_group (__main__.TestFullyShard1DTrainingCore)": 174.3316650390625,
"test_train_parity_multi_group_cpu_offload_eager (__main__.TestFullyShard1DTrainingCore)": 61.27133305867513,
"test_train_parity_multi_group_unshard_async_op (__main__.TestFullyShard1DTrainingCore)": 64.80400085449219,
"test_triton_bsr_scatter_mm_blocksize_64_cuda_float32 (__main__.TestSparseCompressedTritonKernelsCUDA)": 87.95033391316731,
"test_triton_bsr_softmax_cuda_bfloat16 (__main__.TestSparseCompressedTritonKernelsCUDA)": 254.8540013631185,
"test_triton_bsr_softmax_cuda_float16 (__main__.TestSparseCompressedTritonKernelsCUDA)": 256.1475016276042,
"test_triton_bsr_softmax_cuda_float32 (__main__.TestSparseCompressedTritonKernelsCUDA)": 194.4748331705729,
"test_tuning_pool_timeout (__main__.TestTuningProcessPool)": 126.16133371988933,
"test_unbacked_dtensor_op_db_clamp_cpu_float32 (__main__.TestUnbackedDTensorOpsCPU)": 96.5290018717448,
"test_unbind (__main__.TestVmapOperators)": 82.44380033289393,
"test_variant_consistency_jit_nn_functional_max_pool2d_cpu_float32 (__main__.TestJitCPU)": 88.58866628011067,
"test_variant_consistency_jit_nn_functional_max_pool2d_cuda_float32 (__main__.TestJitCUDA)": 78.71033223470052,
"test_vec_compare_op_cpu_only (__main__.CPUReproTests)": 62.92533323499892,
"test_views1_cuda (__main__.GPUTests)": 106.26166693369548,
"test_vmapjvpvjp_linalg_lstsq_grad_oriented_cpu_float32 (__main__.TestOperatorsCPU)": 113.2413330078125,
"test_vmapjvpvjp_linalg_lu_solve_cpu_float32 (__main__.TestOperatorsCPU)": 68.83388929013853,
"test_vmapjvpvjp_linalg_lu_solve_cuda_float32 (__main__.TestOperatorsCUDA)": 67.28550148010254,
"test_vmapjvpvjp_max_pool2d_with_indices_backward_cpu_float32 (__main__.TestOperatorsCPU)": 86.25900014241536,
"test_vmapjvpvjp_max_pool2d_with_indices_backward_cuda_float32 (__main__.TestOperatorsCUDA)": 78.42966588338216,
"test_vmapjvpvjp_nn_functional_conv2d_cpu_float32 (__main__.TestOperatorsCPU)": 69.55499903361003,
"test_vmapjvpvjp_nn_functional_max_pool2d_cpu_float32 (__main__.TestOperatorsCPU)": 89.97300211588542,
"test_vmapjvpvjp_nn_functional_max_pool2d_cuda_float32 (__main__.TestOperatorsCUDA)": 79.44366709391277,
"test_vmapjvpvjp_unbind_cpu_float32 (__main__.TestOperatorsCPU)": 66.21299997965495,
"test_vmapjvpvjp_unbind_cuda_float32 (__main__.TestOperatorsCUDA)": 81.87016677856445,
"test_vmapvjpvjp_meshgrid_list_of_tensors_cuda_float32 (__main__.TestOperatorsCUDA)": 82.90099970499675,
"test_vmapvjpvjp_meshgrid_variadic_tensors_cuda_float32 (__main__.TestOperatorsCUDA)": 81.67116800944011,
"test_vmapvjpvjp_nn_functional_bilinear_cuda_float32 (__main__.TestOperatorsCUDA)": 110.1931660970052
}