forked from pytorch/pytorch
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathslow_tests.json
301 lines (301 loc) · 30.3 KB
/
slow_tests.json
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
{
"test_AllenaiLongformerBase_repro_cpu (__main__.CpuHalideTests)": 217.4143320719401,
"test__adaptive_avg_pool2d (__main__.CPUReproTests)": 166.39100392659506,
"test_adaptive_max_pool2d1_cpu (__main__.CpuHalideTests)": 114.1923344930013,
"test_after_aot_cpu_runtime_error (__main__.MinifierIsolateTests)": 63.9750010172526,
"test_alexnet_prefix_cpu (__main__.CpuHalideTests)": 192.23033142089844,
"test_aot_autograd_symbolic_exhaustive_linalg_svd_cpu_float32 (__main__.TestEagerFusionOpInfoCPU)": 61.99166671435038,
"test_aot_autograd_symbolic_exhaustive_nn_functional_max_pool1d_cpu_float32 (__main__.TestEagerFusionOpInfoCPU)": 69.81999969482422,
"test_aot_autograd_symbolic_exhaustive_nn_functional_max_pool2d_cpu_float32 (__main__.TestEagerFusionOpInfoCPU)": 124.89299774169922,
"test_aot_autograd_symbolic_exhaustive_nn_functional_max_pool3d_cpu_float32 (__main__.TestEagerFusionOpInfoCPU)": 76.3479995727539,
"test_aot_autograd_symbolic_exhaustive_svd_cpu_float32 (__main__.TestEagerFusionOpInfoCPU)": 63.36962493260702,
"test_aot_autograd_symbolic_module_exhaustive_nn_TransformerDecoderLayer_cpu_float32 (__main__.TestEagerFusionModuleInfoCPU)": 81.5479965209961,
"test_associative_scan_dim_reverse_False_combine_mode_generic_cpu (__main__.TestControlFlow)": 67.8025016784668,
"test_associative_scan_dim_reverse_True_combine_mode_generic_cpu (__main__.TestControlFlow)": 66.13800048828125,
"test_avg_pool3d_backward2_cpu (__main__.CpuTests)": 478.62633260091144,
"test_avg_pool3d_backward2_cuda (__main__.GPUTests)": 93.62950134277344,
"test_avg_pool3d_backward2_dynamic_shapes_cpu (__main__.DynamicShapesCodegenCpuTests)": 506.30767822265625,
"test_avg_pool3d_backward2_dynamic_shapes_cpu (__main__.DynamicShapesCpuTests)": 491.98000081380206,
"test_avg_pool3d_backward2_dynamic_shapes_cuda (__main__.DynamicShapesCodegenGPUTests)": 64.00250053405762,
"test_avg_pool3d_backward2_dynamic_shapes_cuda (__main__.DynamicShapesGPUTests)": 121.60200500488281,
"test_avg_pool3d_backward_cpu (__main__.CpuHalideTests)": 61.75266647338867,
"test_backward_nn_functional_multi_head_attention_forward_cpu_float32 (__main__.TestCompositeComplianceCPU)": 78.88500213623047,
"test_backward_nn_functional_multi_head_attention_forward_cuda_float32 (__main__.TestCompositeComplianceCUDA)": 86.18000030517578,
"test_basic_cpu (__main__.EfficientConvBNEvalCpuTests)": 258.5509999593099,
"test_basic_cuda (__main__.EfficientConvBNEvalGpuTests)": 185.53849411010742,
"test_builtin_equivalent_funcs (__main__.TorchFunctionModeTests)": 106.2084831730012,
"test_captured_score_mod_aot_eager_gradcheck_score_mod_name__head_offset_mode_eager (__main__.TestFlexAttention)": 168.5279998779297,
"test_checkpoint_cast (__main__.TestFxToOnnx)": 367.0326639811198,
"test_collect_callgrind (__main__.TestBenchmarkUtils)": 445.89332071940106,
"test_comprehensive_constant_pad_nd_cpu_float16 (__main__.TestInductorOpInfoCPU)": 77.9749984741211,
"test_comprehensive_constant_pad_nd_cpu_float32 (__main__.TestInductorOpInfoCPU)": 79.8239974975586,
"test_comprehensive_constant_pad_nd_cpu_float64 (__main__.TestInductorOpInfoCPU)": 85.11900329589844,
"test_comprehensive_constant_pad_nd_cpu_int32 (__main__.TestInductorOpInfoCPU)": 76.80500030517578,
"test_comprehensive_constant_pad_nd_cpu_int64 (__main__.TestInductorOpInfoCPU)": 85.15299987792969,
"test_comprehensive_diff_cpu_bool (__main__.TestInductorOpInfoCPU)": 120.29299926757812,
"test_comprehensive_diff_cpu_float32 (__main__.TestInductorOpInfoCPU)": 124.5790023803711,
"test_comprehensive_diff_cpu_float64 (__main__.TestInductorOpInfoCPU)": 117.91300201416016,
"test_comprehensive_diff_cpu_int32 (__main__.TestInductorOpInfoCPU)": 114.56999969482422,
"test_comprehensive_diff_cpu_int64 (__main__.TestInductorOpInfoCPU)": 112.50800323486328,
"test_comprehensive_diff_cuda_complex128 (__main__.TestDecompCUDA)": 84.26350212097168,
"test_comprehensive_diff_cuda_complex64 (__main__.TestDecompCUDA)": 78.46549987792969,
"test_comprehensive_diff_cuda_float32 (__main__.TestDecompCUDA)": 67.1016674041748,
"test_comprehensive_diff_cuda_float64 (__main__.TestDecompCUDA)": 65.60141595204671,
"test_comprehensive_dist_cpu_float16 (__main__.TestInductorOpInfoCPU)": 92.52999877929688,
"test_comprehensive_dist_cpu_float32 (__main__.TestInductorOpInfoCPU)": 97.3219985961914,
"test_comprehensive_dist_cpu_float64 (__main__.TestInductorOpInfoCPU)": 95.83000183105469,
"test_comprehensive_eye_cpu_bool (__main__.TestInductorOpInfoCPU)": 144.24400329589844,
"test_comprehensive_eye_cpu_float16 (__main__.TestInductorOpInfoCPU)": 144.09800720214844,
"test_comprehensive_eye_cpu_float32 (__main__.TestInductorOpInfoCPU)": 140.6179962158203,
"test_comprehensive_eye_cpu_float64 (__main__.TestInductorOpInfoCPU)": 147.72799682617188,
"test_comprehensive_eye_cpu_int32 (__main__.TestInductorOpInfoCPU)": 148.1300048828125,
"test_comprehensive_eye_cpu_int64 (__main__.TestInductorOpInfoCPU)": 140.44900512695312,
"test_comprehensive_grid_sampler_2d_cpu_float32 (__main__.TestDecompCPU)": 336.2829895019531,
"test_comprehensive_grid_sampler_2d_cpu_float32 (__main__.TestInductorOpInfoCPU)": 79.47200012207031,
"test_comprehensive_grid_sampler_2d_cpu_float64 (__main__.TestDecompCPU)": 332.3320007324219,
"test_comprehensive_grid_sampler_2d_cpu_float64 (__main__.TestInductorOpInfoCPU)": 87.55799865722656,
"test_comprehensive_grid_sampler_2d_cuda_bfloat16 (__main__.TestDecompCUDA)": 198.34749603271484,
"test_comprehensive_grid_sampler_2d_cuda_float16 (__main__.TestDecompCUDA)": 179.73450469970703,
"test_comprehensive_grid_sampler_2d_cuda_float32 (__main__.TestDecompCUDA)": 967.4775085449219,
"test_comprehensive_grid_sampler_2d_cuda_float64 (__main__.TestDecompCUDA)": 694.5654907226562,
"test_comprehensive_linalg_svd_cuda_complex128 (__main__.TestDecompCUDA)": 66.58891677856445,
"test_comprehensive_linalg_svd_cuda_complex64 (__main__.TestDecompCUDA)": 65.6439167658488,
"test_comprehensive_linalg_vector_norm_cpu_float16 (__main__.TestInductorOpInfoCPU)": 227.33700561523438,
"test_comprehensive_linalg_vector_norm_cpu_float32 (__main__.TestInductorOpInfoCPU)": 216.9149932861328,
"test_comprehensive_linalg_vector_norm_cpu_float64 (__main__.TestInductorOpInfoCPU)": 232.6009979248047,
"test_comprehensive_logspace_cpu_float32 (__main__.TestInductorOpInfoCPU)": 481.40899658203125,
"test_comprehensive_logspace_cpu_float64 (__main__.TestInductorOpInfoCPU)": 471.8290100097656,
"test_comprehensive_logspace_cpu_int32 (__main__.TestInductorOpInfoCPU)": 486.5690002441406,
"test_comprehensive_logspace_cpu_int64 (__main__.TestInductorOpInfoCPU)": 463.9100036621094,
"test_comprehensive_masked_amax_cpu_float16 (__main__.TestInductorOpInfoCPU)": 110.54100036621094,
"test_comprehensive_masked_amax_cpu_float32 (__main__.TestInductorOpInfoCPU)": 108.97200012207031,
"test_comprehensive_masked_amax_cpu_float64 (__main__.TestInductorOpInfoCPU)": 102.99299621582031,
"test_comprehensive_masked_amax_cpu_int32 (__main__.TestInductorOpInfoCPU)": 101.9540023803711,
"test_comprehensive_masked_amax_cpu_int64 (__main__.TestInductorOpInfoCPU)": 113.29900360107422,
"test_comprehensive_masked_amin_cpu_float16 (__main__.TestInductorOpInfoCPU)": 109.6259994506836,
"test_comprehensive_masked_amin_cpu_float32 (__main__.TestInductorOpInfoCPU)": 108.30999755859375,
"test_comprehensive_masked_amin_cpu_float64 (__main__.TestInductorOpInfoCPU)": 116.44100189208984,
"test_comprehensive_masked_amin_cpu_int32 (__main__.TestInductorOpInfoCPU)": 109.46900177001953,
"test_comprehensive_masked_amin_cpu_int64 (__main__.TestInductorOpInfoCPU)": 104.93399810791016,
"test_comprehensive_masked_mean_cpu_bool (__main__.TestInductorOpInfoCPU)": 114.0250015258789,
"test_comprehensive_masked_mean_cpu_float16 (__main__.TestInductorOpInfoCPU)": 101.22699737548828,
"test_comprehensive_masked_mean_cpu_float32 (__main__.TestInductorOpInfoCPU)": 107.9739990234375,
"test_comprehensive_masked_mean_cpu_float64 (__main__.TestInductorOpInfoCPU)": 99.99700164794922,
"test_comprehensive_masked_mean_cpu_int32 (__main__.TestInductorOpInfoCPU)": 101.21099853515625,
"test_comprehensive_masked_mean_cpu_int64 (__main__.TestInductorOpInfoCPU)": 101.0739974975586,
"test_comprehensive_masked_norm_cpu_float16 (__main__.TestInductorOpInfoCPU)": 520.8800048828125,
"test_comprehensive_masked_norm_cpu_float32 (__main__.TestInductorOpInfoCPU)": 519.7890014648438,
"test_comprehensive_masked_norm_cpu_float64 (__main__.TestInductorOpInfoCPU)": 537.2009887695312,
"test_comprehensive_masked_norm_cuda_float16 (__main__.TestInductorOpInfoCUDA)": 133.04099655151367,
"test_comprehensive_masked_norm_cuda_float32 (__main__.TestInductorOpInfoCUDA)": 152.52900314331055,
"test_comprehensive_masked_norm_cuda_float64 (__main__.TestInductorOpInfoCUDA)": 152.47850036621094,
"test_comprehensive_masked_prod_cpu_bool (__main__.TestInductorOpInfoCPU)": 106.46099853515625,
"test_comprehensive_masked_prod_cpu_float16 (__main__.TestInductorOpInfoCPU)": 109.83699798583984,
"test_comprehensive_masked_prod_cpu_float32 (__main__.TestInductorOpInfoCPU)": 103.9739990234375,
"test_comprehensive_masked_prod_cpu_float64 (__main__.TestInductorOpInfoCPU)": 105.8479995727539,
"test_comprehensive_masked_prod_cpu_int32 (__main__.TestInductorOpInfoCPU)": 102.44999694824219,
"test_comprehensive_masked_prod_cpu_int64 (__main__.TestInductorOpInfoCPU)": 105.66799926757812,
"test_comprehensive_masked_sum_cpu_bool (__main__.TestInductorOpInfoCPU)": 106.78600311279297,
"test_comprehensive_masked_sum_cpu_float16 (__main__.TestInductorOpInfoCPU)": 105.28500366210938,
"test_comprehensive_masked_sum_cpu_float32 (__main__.TestInductorOpInfoCPU)": 103.47899627685547,
"test_comprehensive_masked_sum_cpu_float64 (__main__.TestInductorOpInfoCPU)": 103.16100311279297,
"test_comprehensive_masked_sum_cpu_int32 (__main__.TestInductorOpInfoCPU)": 109.84500122070312,
"test_comprehensive_masked_sum_cpu_int64 (__main__.TestInductorOpInfoCPU)": 101.93699645996094,
"test_comprehensive_nn_functional_gaussian_nll_loss_cuda_float32 (__main__.TestDecompCUDA)": 81.2234992980957,
"test_comprehensive_nn_functional_gaussian_nll_loss_cuda_float64 (__main__.TestDecompCUDA)": 74.54800033569336,
"test_comprehensive_nn_functional_glu_cpu_float16 (__main__.TestInductorOpInfoCPU)": 81.26899719238281,
"test_comprehensive_nn_functional_glu_cpu_float32 (__main__.TestInductorOpInfoCPU)": 79.93000030517578,
"test_comprehensive_nn_functional_glu_cpu_float64 (__main__.TestInductorOpInfoCPU)": 81.04100036621094,
"test_comprehensive_nn_functional_grid_sample_cpu_float32 (__main__.TestDecompCPU)": 92.6050033569336,
"test_comprehensive_nn_functional_grid_sample_cpu_float64 (__main__.TestDecompCPU)": 104.4520034790039,
"test_comprehensive_nn_functional_grid_sample_cuda_bfloat16 (__main__.TestDecompCUDA)": 60.700416564941406,
"test_comprehensive_nn_functional_grid_sample_cuda_float32 (__main__.TestDecompCUDA)": 178.74700164794922,
"test_comprehensive_nn_functional_grid_sample_cuda_float64 (__main__.TestDecompCUDA)": 274.27099609375,
"test_comprehensive_nn_functional_interpolate_trilinear_cuda_float32 (__main__.TestDecompCUDA)": 61.93400192260742,
"test_comprehensive_nn_functional_interpolate_trilinear_cuda_float64 (__main__.TestDecompCUDA)": 61.11149978637695,
"test_comprehensive_nn_functional_max_pool1d_cpu_float16 (__main__.TestInductorOpInfoCPU)": 175.85699462890625,
"test_comprehensive_nn_functional_max_pool1d_cpu_float32 (__main__.TestInductorOpInfoCPU)": 168.17300415039062,
"test_comprehensive_nn_functional_max_pool1d_cpu_float64 (__main__.TestInductorOpInfoCPU)": 165.5489959716797,
"test_comprehensive_nn_functional_max_pool2d_cpu_float16 (__main__.TestInductorOpInfoCPU)": 923.7789916992188,
"test_comprehensive_nn_functional_max_pool2d_cpu_float32 (__main__.TestInductorOpInfoCPU)": 884.5230102539062,
"test_comprehensive_nn_functional_max_pool2d_cpu_float64 (__main__.TestInductorOpInfoCPU)": 881.906982421875,
"test_comprehensive_nn_functional_max_pool2d_cpu_int32 (__main__.TestInductorOpInfoCPU)": 842.1710205078125,
"test_comprehensive_nn_functional_max_pool2d_cpu_int64 (__main__.TestInductorOpInfoCPU)": 848.0770263671875,
"test_comprehensive_nn_functional_max_pool2d_cuda_float16 (__main__.TestInductorOpInfoCUDA)": 752.0610046386719,
"test_comprehensive_nn_functional_max_pool2d_cuda_float32 (__main__.TestInductorOpInfoCUDA)": 753.4309997558594,
"test_comprehensive_nn_functional_max_pool2d_cuda_float64 (__main__.TestInductorOpInfoCUDA)": 838.5154724121094,
"test_comprehensive_nn_functional_max_unpool2d_cpu_float16 (__main__.TestInductorOpInfoCPU)": 221.04100036621094,
"test_comprehensive_nn_functional_max_unpool2d_cpu_float32 (__main__.TestInductorOpInfoCPU)": 234.07400512695312,
"test_comprehensive_nn_functional_max_unpool2d_cpu_float64 (__main__.TestInductorOpInfoCPU)": 231.1929931640625,
"test_comprehensive_nn_functional_max_unpool2d_cuda_float16 (__main__.TestInductorOpInfoCUDA)": 78.63642120361328,
"test_comprehensive_nn_functional_max_unpool2d_cuda_float32 (__main__.TestInductorOpInfoCUDA)": 76.75510486803557,
"test_comprehensive_nn_functional_max_unpool2d_cuda_float64 (__main__.TestInductorOpInfoCUDA)": 77.19105228624846,
"test_comprehensive_nn_functional_max_unpool3d_cpu_float16 (__main__.TestInductorOpInfoCPU)": 153.2100067138672,
"test_comprehensive_nn_functional_max_unpool3d_cpu_float32 (__main__.TestInductorOpInfoCPU)": 149.39599609375,
"test_comprehensive_nn_functional_max_unpool3d_cpu_float64 (__main__.TestInductorOpInfoCPU)": 146.4810028076172,
"test_comprehensive_nn_functional_pad_constant_cpu_float16 (__main__.TestInductorOpInfoCPU)": 75.3740005493164,
"test_comprehensive_nn_functional_pad_constant_cpu_float32 (__main__.TestInductorOpInfoCPU)": 88.25800323486328,
"test_comprehensive_nn_functional_pad_constant_cpu_float64 (__main__.TestInductorOpInfoCPU)": 77.86799621582031,
"test_comprehensive_nn_functional_pad_constant_cpu_int32 (__main__.TestInductorOpInfoCPU)": 85.75399780273438,
"test_comprehensive_nn_functional_pad_constant_cpu_int64 (__main__.TestInductorOpInfoCPU)": 75.73500061035156,
"test_comprehensive_nn_functional_poisson_nll_loss_cpu_float16 (__main__.TestInductorOpInfoCPU)": 134.7989959716797,
"test_comprehensive_nn_functional_poisson_nll_loss_cpu_float32 (__main__.TestInductorOpInfoCPU)": 125.13800048828125,
"test_comprehensive_nn_functional_poisson_nll_loss_cpu_float64 (__main__.TestInductorOpInfoCPU)": 138.28500366210938,
"test_comprehensive_nn_functional_poisson_nll_loss_cpu_int32 (__main__.TestInductorOpInfoCPU)": 127.2229995727539,
"test_comprehensive_nn_functional_poisson_nll_loss_cpu_int64 (__main__.TestInductorOpInfoCPU)": 124.50499725341797,
"test_comprehensive_nn_functional_unfold_cpu_bool (__main__.TestInductorOpInfoCPU)": 141.44400024414062,
"test_comprehensive_nn_functional_unfold_cpu_float16 (__main__.TestInductorOpInfoCPU)": 255.00599670410156,
"test_comprehensive_nn_functional_unfold_cpu_float32 (__main__.TestInductorOpInfoCPU)": 257.2449951171875,
"test_comprehensive_nn_functional_unfold_cpu_float64 (__main__.TestInductorOpInfoCPU)": 252.31399536132812,
"test_comprehensive_ormqr_cuda_complex128 (__main__.TestDecompCUDA)": 113.76800155639648,
"test_comprehensive_ormqr_cuda_complex64 (__main__.TestDecompCUDA)": 91.2755012512207,
"test_comprehensive_ormqr_cuda_float32 (__main__.TestDecompCUDA)": 72.64516703287761,
"test_comprehensive_ormqr_cuda_float32 (__main__.TestInductorOpInfoCUDA)": 119.41699981689453,
"test_comprehensive_ormqr_cuda_float64 (__main__.TestInductorOpInfoCUDA)": 69.64147366975483,
"test_comprehensive_svd_cuda_complex128 (__main__.TestDecompCUDA)": 73.99099953969319,
"test_comprehensive_svd_cuda_complex64 (__main__.TestDecompCUDA)": 65.03750038146973,
"test_comprehensive_svd_lowrank_cuda_complex128 (__main__.TestDecompCUDA)": 64.99233373006184,
"test_comprehensive_svd_lowrank_cuda_complex64 (__main__.TestDecompCUDA)": 64.825332959493,
"test_cond_autograd_nested (__main__.TestControlFlow)": 78.28133392333984,
"test_constructor_autograd_SparseBSC_cuda (__main__.TestSparseAnyCUDA)": 85.54650115966797,
"test_constructor_autograd_SparseBSR_cuda (__main__.TestSparseAnyCUDA)": 77.20849990844727,
"test_constructor_autograd_SparseCSC_cuda (__main__.TestSparseAnyCUDA)": 66.02849769592285,
"test_constructor_autograd_SparseCSR_cuda (__main__.TestSparseAnyCUDA)": 90.93049621582031,
"test_conv1d_basic (__main__.TestXNNPACKConv1dTransformPass)": 217.32833099365234,
"test_conv1d_with_relu_fc (__main__.TestXNNPACKConv1dTransformPass)": 434.2860107421875,
"test_conv2d_unary_cpu_cpp_wrapper (__main__.TestCppWrapper)": 279.1969909667969,
"test_conv_freezing_cpu_with_stack_allocation (__main__.AOTInductorTestABICompatibleCpuWithStackAllocation)": 63.11627990722656,
"test_correctness_NAdam_use_closure_True_cuda_float32 (__main__.CompiledOptimizerParityTestsCUDA)": 77.31900215148926,
"test_correctness_RAdam_use_closure_True_cuda_float32 (__main__.CompiledOptimizerParityTestsCUDA)": 62.60299987792969,
"test_count_nonzero_all (__main__.TestBool)": 663.2940063476562,
"test_custom_module_lstm (__main__.TestQuantizedOps)": 205.06800333658853,
"test_ddp_uneven_inputs (__main__.TestDistBackendWithSpawn)": 185.50533405939737,
"test_deconv_freezing_cpu_with_stack_allocation (__main__.AOTInductorTestABICompatibleCpuWithStackAllocation)": 60.336119651794434,
"test_dispatch_symbolic_meta_outplace_all_strides_nn_functional_gaussian_nll_loss_cuda_float32 (__main__.TestMetaCUDA)": 80.5359992980957,
"test_eig_check_magma_cuda_float32 (__main__.TestLinalgCUDA)": 62.61600172519684,
"test_fail_creation_ops.py (__main__.TestTyping)": 64.10633341471355,
"test_fail_random.py (__main__.TestTyping)": 73.96077489852905,
"test_fn_fwgrad_bwgrad_cumprod_cuda_complex128 (__main__.TestFwdGradientsCUDA)": 63.15999794006348,
"test_fn_gradgrad_cumprod_cuda_complex128 (__main__.TestBwdGradientsCUDA)": 69.70149993896484,
"test_fn_gradgrad_map_nested_cpu_float64 (__main__.TestBwdGradientsCPU)": 88.06099700927734,
"test_fn_gradgrad_map_nested_cuda_float64 (__main__.TestBwdGradientsCUDA)": 66.5104997808283,
"test_fn_gradgrad_map_triple_nested_cpu_float64 (__main__.TestBwdGradientsCPU)": 490.46099853515625,
"test_fn_gradgrad_map_triple_nested_cuda_float64 (__main__.TestBwdGradientsCUDA)": 309.78050231933594,
"test_fuse_large_params_dynamic_shapes_cpu (__main__.DynamicShapesCodegenCpuTests)": 78.52733357747395,
"test_fuse_large_params_dynamic_shapes_cpu (__main__.DynamicShapesCpuTests)": 77.23800150553386,
"test_fuse_large_params_dynamic_shapes_cuda (__main__.DynamicShapesCodegenGPUTests)": 72.49049758911133,
"test_fuse_large_params_dynamic_shapes_cuda (__main__.DynamicShapesGPUTests)": 61.91749954223633,
"test_grad_nn_Transformer_cuda_float64 (__main__.TestModuleCUDA)": 85.50300216674805,
"test_gradgrad_nn_LSTM_eval_mode_cuda_float64 (__main__.TestModuleCUDA)": 105.5469970703125,
"test_gradgrad_nn_LSTM_train_mode_cuda_float64 (__main__.TestModuleCUDA)": 84.302001953125,
"test_gradgrad_nn_TransformerDecoderLayer_cuda_float64 (__main__.TestModuleCUDA)": 178.19400024414062,
"test_gradgrad_nn_TransformerEncoder_eval_mode_cuda_float64 (__main__.TestModuleCUDA)": 120.38199996948242,
"test_gradgrad_nn_TransformerEncoder_train_mode_cuda_float64 (__main__.TestModuleCUDA)": 130.34649658203125,
"test_grid_sampler_2d_cpu (__main__.CpuHalideTests)": 188.41600036621094,
"test_index_select_cuda_float8_e4m3fnuz (__main__.TestTorchDeviceTypeCUDA)": 67.98859901059419,
"test_index_select_cuda_float8_e5m2fnuz (__main__.TestTorchDeviceTypeCUDA)": 68.28252009976656,
"test_indexing (__main__.TestAutogradWithCompiledAutograd)": 66.04966608683269,
"test_indirect_device_assert (__main__.TritonCodeGenTests)": 186.83200073242188,
"test_inductor_no_recursionerror_on_for_loops_dynamic_shapes (__main__.DynamicShapesReproTests)": 62.57789257594517,
"test_inplace_gradgrad_cumprod_cuda_complex128 (__main__.TestBwdGradientsCUDA)": 73.21549987792969,
"test_jit_cuda_archflags (__main__.TestCppExtensionJIT)": 144.78700256347656,
"test_linalg_solve_triangular_large_cuda_complex128 (__main__.TestLinalgCUDA)": 590.2300109863281,
"test_linalg_solve_triangular_large_cuda_complex64 (__main__.TestLinalgCUDA)": 67.87849998474121,
"test_linalg_solve_triangular_large_cuda_float64 (__main__.TestLinalgCUDA)": 69.79699993133545,
"test_linear (__main__.TestStaticQuantizedModule)": 165.18300247192383,
"test_linear_binary_cpp_wrapper (__main__.TestCppWrapper)": 175.40899658203125,
"test_linear_binary_dynamic_shapes_cpp_wrapper (__main__.DynamicShapesCppWrapperCpuTests)": 170.81900024414062,
"test_linear_packed_cpp_wrapper (__main__.TestCppWrapper)": 80.76100158691406,
"test_linear_packed_dynamic_shapes_cpp_wrapper (__main__.DynamicShapesCppWrapperCpuTests)": 76.26699829101562,
"test_linear_relu (__main__.TestStaticQuantizedModule)": 60.553001403808594,
"test_load_from_view_buffer (__main__.TestFlexAttention)": 92.79700034005302,
"test_lobpcg_ortho_cuda_float64 (__main__.TestLinalgCUDA)": 62.85261689699613,
"test_max_autotune (__main__.TestFlexAttention)": 76.35428619384766,
"test_max_autotune_cutlass_backend_addmm_dynamic_False_max_autotune_gemm_backends_ATen,Triton,CUTLASS (__main__.TestCutlassBackend)": 87.5459976196289,
"test_max_pool2d_with_indices_backward4_dynamic_shapes_cpu (__main__.DynamicShapesCodegenCpuTests)": 64.43099848429362,
"test_max_pool2d_with_indices_backward4_dynamic_shapes_cpu (__main__.DynamicShapesCpuTests)": 62.10766728719076,
"test_mixed_mm_exhaustive_dtypes (__main__.TestPatternMatcher)": 90.12800025939941,
"test_output_match_max_pool2d_with_indices_backward_cpu_bfloat16 (__main__.TestConsistencyCPU)": 60.4490000406901,
"test_proper_exit (__main__.TestDataLoader)": 214.47549438476562,
"test_proper_exit (__main__.TestDataLoaderPersistentWorkers)": 212.3499984741211,
"test_qconv2d_add_cpu_cpp_wrapper (__main__.TestCppWrapper)": 60.95766671498617,
"test_qconv2d_add_cpu_dynamic_shapes_cpp_wrapper (__main__.DynamicShapesCppWrapperCpuTests)": 62.85099951426188,
"test_qconv2d_add_relu_cpu_cpp_wrapper (__main__.TestCppWrapper)": 61.30074977874756,
"test_qconv2d_add_relu_cpu_dynamic_shapes_cpp_wrapper (__main__.DynamicShapesCppWrapperCpuTests)": 64.02558294932048,
"test_qlinear_add_int8_mixed_bf16_use_relu_False_is_qat_False_is_dynamic_False (__main__.TestPatternMatcher)": 60.128166834513344,
"test_qlinear_add_int8_mixed_bf16_use_relu_False_is_qat_False_is_dynamic_False_cpp_wrapper (__main__.TestCppWrapper)": 113.4209976196289,
"test_qlinear_add_int8_mixed_bf16_use_relu_False_is_qat_False_is_dynamic_False_dynamic_shapes_cpp_wrapper (__main__.DynamicShapesCppWrapperCpuTests)": 113.31400299072266,
"test_qlinear_add_int8_mixed_bf16_use_relu_False_is_qat_False_is_dynamic_True_cpp_wrapper (__main__.TestCppWrapper)": 141.7570037841797,
"test_qlinear_add_int8_mixed_bf16_use_relu_False_is_qat_False_is_dynamic_True_dynamic_shapes_cpp_wrapper (__main__.DynamicShapesCppWrapperCpuTests)": 112.85099792480469,
"test_qlinear_add_int8_mixed_bf16_use_relu_False_is_qat_True_is_dynamic_False_cpp_wrapper (__main__.TestCppWrapper)": 108.26799774169922,
"test_qlinear_add_int8_mixed_bf16_use_relu_False_is_qat_True_is_dynamic_False_dynamic_shapes_cpp_wrapper (__main__.DynamicShapesCppWrapperCpuTests)": 112.7490005493164,
"test_qlinear_add_int8_mixed_bf16_use_relu_False_is_qat_True_is_dynamic_True_cpp_wrapper (__main__.TestCppWrapper)": 112.31099700927734,
"test_qlinear_add_int8_mixed_bf16_use_relu_False_is_qat_True_is_dynamic_True_dynamic_shapes_cpp_wrapper (__main__.DynamicShapesCppWrapperCpuTests)": 111.48500061035156,
"test_qlinear_add_int8_mixed_bf16_use_relu_True_is_qat_False_is_dynamic_False (__main__.TestPatternMatcher)": 62.4573335647583,
"test_qlinear_add_int8_mixed_bf16_use_relu_True_is_qat_False_is_dynamic_False_cpp_wrapper (__main__.TestCppWrapper)": 111.9219970703125,
"test_qlinear_add_int8_mixed_bf16_use_relu_True_is_qat_False_is_dynamic_False_dynamic_shapes_cpp_wrapper (__main__.DynamicShapesCppWrapperCpuTests)": 112.73999786376953,
"test_qlinear_add_int8_mixed_bf16_use_relu_True_is_qat_False_is_dynamic_True (__main__.TestPatternMatcher)": 60.87241554260254,
"test_qlinear_add_int8_mixed_bf16_use_relu_True_is_qat_False_is_dynamic_True_cpp_wrapper (__main__.TestCppWrapper)": 114.99500274658203,
"test_qlinear_add_int8_mixed_bf16_use_relu_True_is_qat_False_is_dynamic_True_dynamic_shapes_cpp_wrapper (__main__.DynamicShapesCppWrapperCpuTests)": 111.69499969482422,
"test_qlinear_add_int8_mixed_bf16_use_relu_True_is_qat_True_is_dynamic_False_cpp_wrapper (__main__.TestCppWrapper)": 109.68599700927734,
"test_qlinear_add_int8_mixed_bf16_use_relu_True_is_qat_True_is_dynamic_False_dynamic_shapes_cpp_wrapper (__main__.DynamicShapesCppWrapperCpuTests)": 109.4990005493164,
"test_qlinear_add_int8_mixed_bf16_use_relu_True_is_qat_True_is_dynamic_True (__main__.TestPatternMatcher)": 60.729000091552734,
"test_qlinear_add_int8_mixed_bf16_use_relu_True_is_qat_True_is_dynamic_True_cpp_wrapper (__main__.TestCppWrapper)": 115.64600372314453,
"test_qlinear_add_int8_mixed_bf16_use_relu_True_is_qat_True_is_dynamic_True_dynamic_shapes_cpp_wrapper (__main__.DynamicShapesCppWrapperCpuTests)": 112.4219970703125,
"test_qrnncell (__main__.TestDynamicQuantizedOps)": 63.147268639753264,
"test_quick_core_backward__unsafe_masked_index_cpu_float64 (__main__.TestDecompCPU)": 413.0690002441406,
"test_quick_core_backward__unsafe_masked_index_cuda_float64 (__main__.TestDecompCUDA)": 630.9710083007812,
"test_quick_core_backward__unsafe_masked_index_put_accumulate_cpu_float64 (__main__.TestDecompCPU)": 571.0189819335938,
"test_quick_core_backward__unsafe_masked_index_put_accumulate_cuda_float64 (__main__.TestDecompCUDA)": 851.6174926757812,
"test_quick_core_backward_expand_copy_cuda_float64 (__main__.TestDecompCUDA)": 74.7632490793864,
"test_quick_core_backward_nn_functional_max_unpool3d_grad_cpu_float64 (__main__.TestDecompCPU)": 78.52200317382812,
"test_quick_core_backward_nn_functional_max_unpool3d_grad_cuda_float64 (__main__.TestDecompCUDA)": 200.74200439453125,
"test_quick_core_backward_roll_cpu_float64 (__main__.TestDecompCPU)": 107.08300018310547,
"test_quick_core_backward_roll_cuda_float64 (__main__.TestDecompCUDA)": 150.26499938964844,
"test_quick_core_backward_select_scatter_cuda_float64 (__main__.TestDecompCUDA)": 98.96500015258789,
"test_quick_core_backward_split_with_sizes_copy_cpu_float64 (__main__.TestDecompCPU)": 74.80500030517578,
"test_quick_core_backward_split_with_sizes_copy_cuda_float64 (__main__.TestDecompCUDA)": 118.8329963684082,
"test_quick_core_backward_std_cuda_float64 (__main__.TestDecompCUDA)": 82.09700012207031,
"test_replicatepad_64bit_indexing_cuda_float16 (__main__.TestNNDeviceTypeCUDA)": 324.70098876953125,
"test_rosenbrock_sparse_with_lrsched_False_SGD_cuda_float64 (__main__.TestOptimRenewedCUDA)": 86.34838581085205,
"test_rosenbrock_sparse_with_lrsched_True_SGD_cuda_float64 (__main__.TestOptimRenewedCUDA)": 76.88300371170044,
"test_save_load_large_string_attribute (__main__.TestSaveLoad)": 93.64399719238281,
"test_shuffler_iterdatapipe (__main__.IntegrationTestDataLoaderDataPipe)": 151.77233378092447,
"test_slow_tasks (__main__.TestFunctionalAutogradBenchmark)": 129.88999684651694,
"test_sort_bool_cpu (__main__.CpuTritonTests)": 340.2829996744792,
"test_sum_all_cpu_float64 (__main__.TestReductionsCPU)": 164.725030376971,
"test_svd_lowrank_cuda_complex128 (__main__.TestLinalgCUDA)": 141.5560052394867,
"test_terminate_handler_on_crash (__main__.TestTorch)": 71.76799805959065,
"test_terminate_signal (__main__.ForkTest)": 105.02499709029992,
"test_terminate_signal (__main__.ParallelForkServerShouldWorkTest)": 105.14500128229459,
"test_terminate_signal (__main__.SpawnTest)": 107.84633318583171,
"test_train_parity_multi_group (__main__.TestFullyShard1DTrainingCore)": 124.47291040041654,
"test_transpose_copy (__main__.CPUReproTests)": 63.25933329264323,
"test_triton_bsr_scatter_mm_blocksize_64_cuda_bfloat16 (__main__.TestSparseCompressedTritonKernelsCUDA)": 81.10850143432617,
"test_triton_bsr_scatter_mm_blocksize_64_cuda_float16 (__main__.TestSparseCompressedTritonKernelsCUDA)": 69.84850120544434,
"test_triton_bsr_scatter_mm_blocksize_64_cuda_float32 (__main__.TestSparseCompressedTritonKernelsCUDA)": 74.66350173950195,
"test_triton_bsr_softmax_cuda_bfloat16 (__main__.TestSparseCompressedTritonKernelsCUDA)": 139.77949905395508,
"test_triton_bsr_softmax_cuda_float16 (__main__.TestSparseCompressedTritonKernelsCUDA)": 133.375,
"test_triton_bsr_softmax_cuda_float32 (__main__.TestSparseCompressedTritonKernelsCUDA)": 121.22699737548828,
"test_unary_ops (__main__.TestTEFuserDynamic)": 228.66966756184897,
"test_unary_ops (__main__.TestTEFuserStatic)": 204.28700065612793,
"test_upsample_bicubic2d_cpu (__main__.CpuHalideTests)": 95.69666544596355,
"test_variant_consistency_jit_nn_functional_max_pool2d_cpu_float32 (__main__.TestJitCPU)": 85.29199981689453,
"test_variant_consistency_jit_nn_functional_max_pool2d_cuda_float32 (__main__.TestJitCUDA)": 68.83450126647949,
"test_vmapjvpvjp_diff_cuda_float32 (__main__.TestOperatorsCUDA)": 60.5719234759991,
"test_vmapjvpvjp_linalg_lu_solve_cpu_float32 (__main__.TestOperatorsCPU)": 67.02274974187215,
"test_vmapjvpvjp_linalg_lu_solve_cuda_float32 (__main__.TestOperatorsCUDA)": 78.4694995880127,
"test_vmapjvpvjp_linalg_multi_dot_cuda_float32 (__main__.TestOperatorsCUDA)": 72.39323043823242,
"test_vmapjvpvjp_linalg_solve_triangular_cuda_float32 (__main__.TestOperatorsCUDA)": 67.01423028799204,
"test_vmapjvpvjp_linalg_svd_cuda_float32 (__main__.TestOperatorsCUDA)": 74.47176947960487,
"test_vmapjvpvjp_max_pool2d_with_indices_backward_cpu_float32 (__main__.TestOperatorsCPU)": 64.39900207519531,
"test_vmapjvpvjp_max_pool2d_with_indices_backward_cuda_float32 (__main__.TestOperatorsCUDA)": 63.3494987487793,
"test_vmapjvpvjp_nn_functional_max_pool2d_cpu_float32 (__main__.TestOperatorsCPU)": 71.36399841308594,
"test_vmapjvpvjp_nn_functional_max_pool2d_cuda_float32 (__main__.TestOperatorsCUDA)": 71.33700180053711,
"test_vmapjvpvjp_svd_cuda_float32 (__main__.TestOperatorsCUDA)": 60.809499740600586,
"test_vmapjvpvjp_unbind_cpu_float32 (__main__.TestOperatorsCPU)": 71.86699676513672,
"test_vmapjvpvjp_unbind_cuda_float32 (__main__.TestOperatorsCUDA)": 77.49649810791016,
"test_vmapvjpvjp_meshgrid_list_of_tensors_cuda_float32 (__main__.TestOperatorsCUDA)": 66.41450119018555,
"test_vmapvjpvjp_meshgrid_variadic_tensors_cuda_float32 (__main__.TestOperatorsCUDA)": 67.54150009155273,
"test_vmapvjpvjp_nn_functional_bilinear_cuda_float32 (__main__.TestOperatorsCUDA)": 127.17300033569336
}