forked from pytorch/pytorch
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathslow_tests.json
328 lines (328 loc) · 33.2 KB
/
slow_tests.json
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
{
"EndToEndLSTM (__main__.RNNTest)": 224.2776641845703,
"MultiheadAttention (__main__.ModulesTest)": 170.8386688232422,
"test_AllenaiLongformerBase_repro_cpu (__main__.CpuHalideTests)": 215.9730021158854,
"test__adaptive_avg_pool2d (__main__.CPUReproTests)": 190.66033342149524,
"test_adaptive_max_pool2d1_cpu (__main__.CpuHalideTests)": 114.27133433024089,
"test_after_aot_cpu_runtime_error (__main__.MinifierIsolateTests)": 71.38377804226346,
"test_alexnet_prefix_cpu (__main__.CpuHalideTests)": 191.32866414388022,
"test_aot_autograd_exhaustive_nn_functional_max_pool2d_cpu_float32 (__main__.TestEagerFusionOpInfoCPU)": 67.06866836547852,
"test_aot_autograd_symbolic_exhaustive_linalg_svd_cpu_float32 (__main__.TestEagerFusionOpInfoCPU)": 60.106476193382626,
"test_aot_autograd_symbolic_exhaustive_nn_functional_max_pool1d_cpu_float32 (__main__.TestEagerFusionOpInfoCPU)": 92.41733296712239,
"test_aot_autograd_symbolic_exhaustive_nn_functional_max_pool2d_cpu_float32 (__main__.TestEagerFusionOpInfoCPU)": 153.84766642252603,
"test_aot_autograd_symbolic_exhaustive_nn_functional_max_pool3d_cpu_float32 (__main__.TestEagerFusionOpInfoCPU)": 85.03233337402344,
"test_aot_autograd_symbolic_module_exhaustive_nn_TransformerDecoderLayer_cpu_float32 (__main__.TestEagerFusionModuleInfoCPU)": 84.20766703287761,
"test_avg_pool3d_backward2_cpu (__main__.CpuTests)": 510.78777398003473,
"test_avg_pool3d_backward2_cuda (__main__.GPUTests)": 97.41633224487305,
"test_avg_pool3d_backward2_dynamic_shapes_cpu (__main__.DynamicShapesCodegenCpuTests)": 510.7107747395833,
"test_avg_pool3d_backward2_dynamic_shapes_cpu (__main__.DynamicShapesCpuTests)": 507.0798814561632,
"test_avg_pool3d_backward2_dynamic_shapes_cuda (__main__.DynamicShapesGPUTests)": 124.66699981689453,
"test_avg_pool3d_backward_cpu (__main__.CpuHalideTests)": 62.02766672770182,
"test_backward_nn_functional_multi_head_attention_forward_cpu_float32 (__main__.TestCompositeComplianceCPU)": 65.31933339436848,
"test_backward_nn_functional_multi_head_attention_forward_cuda_float32 (__main__.TestCompositeComplianceCUDA)": 64.8836669921875,
"test_basic_cpu (__main__.EfficientConvBNEvalCpuTests)": 279.31766594780817,
"test_basic_cuda (__main__.EfficientConvBNEvalGpuTests)": 196.89432907104492,
"test_builtin_equivalent_funcs (__main__.TorchFunctionModeTests)": 104.88957105364118,
"test_checkpoint_cast (__main__.TestFxToOnnx)": 363.49000040690106,
"test_collect_callgrind (__main__.TestBenchmarkUtils)": 374.91833157009546,
"test_comprehensive_constant_pad_nd_cpu_float16 (__main__.TestInductorOpInfoCPU)": 82.49566650390625,
"test_comprehensive_constant_pad_nd_cpu_float32 (__main__.TestInductorOpInfoCPU)": 82.13433329264323,
"test_comprehensive_constant_pad_nd_cpu_float64 (__main__.TestInductorOpInfoCPU)": 81.46333312988281,
"test_comprehensive_constant_pad_nd_cpu_int32 (__main__.TestInductorOpInfoCPU)": 86.26499938964844,
"test_comprehensive_constant_pad_nd_cpu_int64 (__main__.TestInductorOpInfoCPU)": 78.45066579182942,
"test_comprehensive_diff_cpu_bool (__main__.TestInductorOpInfoCPU)": 120.62533315022786,
"test_comprehensive_diff_cpu_float32 (__main__.TestInductorOpInfoCPU)": 120.60333251953125,
"test_comprehensive_diff_cpu_float64 (__main__.TestInductorOpInfoCPU)": 112.93033345540364,
"test_comprehensive_diff_cpu_int32 (__main__.TestInductorOpInfoCPU)": 118.08499908447266,
"test_comprehensive_diff_cpu_int64 (__main__.TestInductorOpInfoCPU)": 123.97566731770833,
"test_comprehensive_diff_cuda_complex128 (__main__.TestDecompCUDA)": 81.66700108846028,
"test_comprehensive_diff_cuda_complex64 (__main__.TestDecompCUDA)": 79.4769999186198,
"test_comprehensive_diff_cuda_float64 (__main__.TestDecompCUDA)": 64.5281252861023,
"test_comprehensive_dist_cpu_float16 (__main__.TestInductorOpInfoCPU)": 96.58866628011067,
"test_comprehensive_dist_cpu_float32 (__main__.TestInductorOpInfoCPU)": 91.72833251953125,
"test_comprehensive_dist_cpu_float64 (__main__.TestInductorOpInfoCPU)": 93.73600006103516,
"test_comprehensive_eye_cpu_bool (__main__.TestInductorOpInfoCPU)": 151.32967122395834,
"test_comprehensive_eye_cpu_float16 (__main__.TestInductorOpInfoCPU)": 143.57733662923178,
"test_comprehensive_eye_cpu_float32 (__main__.TestInductorOpInfoCPU)": 141.9923299153646,
"test_comprehensive_eye_cpu_float64 (__main__.TestInductorOpInfoCPU)": 142.34900410970053,
"test_comprehensive_eye_cpu_int32 (__main__.TestInductorOpInfoCPU)": 143.60033671061197,
"test_comprehensive_eye_cpu_int64 (__main__.TestInductorOpInfoCPU)": 149.10132853190103,
"test_comprehensive_grid_sampler_2d_cpu_bfloat16 (__main__.TestDecompCPU)": 81.41033426920573,
"test_comprehensive_grid_sampler_2d_cpu_float16 (__main__.TestDecompCPU)": 81.97200012207031,
"test_comprehensive_grid_sampler_2d_cpu_float16 (__main__.TestInductorOpInfoCPU)": 84.08200073242188,
"test_comprehensive_grid_sampler_2d_cpu_float32 (__main__.TestDecompCPU)": 347.4583333333333,
"test_comprehensive_grid_sampler_2d_cpu_float32 (__main__.TestInductorOpInfoCPU)": 83.02366638183594,
"test_comprehensive_grid_sampler_2d_cpu_float64 (__main__.TestDecompCPU)": 328.58299763997394,
"test_comprehensive_grid_sampler_2d_cpu_float64 (__main__.TestInductorOpInfoCPU)": 92.41300201416016,
"test_comprehensive_grid_sampler_2d_cuda_bfloat16 (__main__.TestDecompCUDA)": 206.7806625366211,
"test_comprehensive_grid_sampler_2d_cuda_float16 (__main__.TestDecompCUDA)": 201.07150268554688,
"test_comprehensive_grid_sampler_2d_cuda_float32 (__main__.TestDecompCUDA)": 838.8346659342448,
"test_comprehensive_grid_sampler_2d_cuda_float64 (__main__.TestDecompCUDA)": 846.4761555989584,
"test_comprehensive_linalg_lu_solve_cuda_float32 (__main__.TestInductorOpInfoCUDA)": 87.954833984375,
"test_comprehensive_linalg_lu_solve_cuda_float64 (__main__.TestInductorOpInfoCUDA)": 71.02933311462402,
"test_comprehensive_linalg_norm_cpu_float32 (__main__.TestInductorOpInfoCPU)": 64.14100011189778,
"test_comprehensive_linalg_norm_cpu_float64 (__main__.TestInductorOpInfoCPU)": 63.77633412679037,
"test_comprehensive_linalg_solve_triangular_cuda_float32 (__main__.TestInductorOpInfoCUDA)": 71.52133178710938,
"test_comprehensive_linalg_solve_triangular_cuda_float64 (__main__.TestInductorOpInfoCUDA)": 64.97216606140137,
"test_comprehensive_linalg_svd_cuda_complex128 (__main__.TestDecompCUDA)": 65.3273328145345,
"test_comprehensive_linalg_vector_norm_cpu_float16 (__main__.TestInductorOpInfoCPU)": 227.3056640625,
"test_comprehensive_linalg_vector_norm_cpu_float32 (__main__.TestInductorOpInfoCPU)": 217.87433369954428,
"test_comprehensive_linalg_vector_norm_cpu_float64 (__main__.TestInductorOpInfoCPU)": 235.36133321126303,
"test_comprehensive_linalg_vector_norm_cuda_float32 (__main__.TestInductorOpInfoCUDA)": 69.16516621907552,
"test_comprehensive_linalg_vector_norm_cuda_float64 (__main__.TestInductorOpInfoCUDA)": 70.0791670481364,
"test_comprehensive_logspace_cpu_float32 (__main__.TestInductorOpInfoCPU)": 471.6073303222656,
"test_comprehensive_logspace_cpu_float64 (__main__.TestInductorOpInfoCPU)": 482.71632893880206,
"test_comprehensive_logspace_cpu_int32 (__main__.TestInductorOpInfoCPU)": 484.3889973958333,
"test_comprehensive_logspace_cpu_int64 (__main__.TestInductorOpInfoCPU)": 478.03033447265625,
"test_comprehensive_logspace_cuda_float32 (__main__.TestInductorOpInfoCUDA)": 83.64666748046875,
"test_comprehensive_logspace_cuda_float64 (__main__.TestInductorOpInfoCUDA)": 81.86583391825359,
"test_comprehensive_masked_amax_cpu_float16 (__main__.TestInductorOpInfoCPU)": 109.95899963378906,
"test_comprehensive_masked_amax_cpu_float32 (__main__.TestInductorOpInfoCPU)": 107.42000071207683,
"test_comprehensive_masked_amax_cpu_float64 (__main__.TestInductorOpInfoCPU)": 112.86100006103516,
"test_comprehensive_masked_amax_cpu_int32 (__main__.TestInductorOpInfoCPU)": 111.37566630045573,
"test_comprehensive_masked_amax_cpu_int64 (__main__.TestInductorOpInfoCPU)": 106.12166849772136,
"test_comprehensive_masked_amin_cpu_float16 (__main__.TestInductorOpInfoCPU)": 110.41200002034505,
"test_comprehensive_masked_amin_cpu_float32 (__main__.TestInductorOpInfoCPU)": 107.4979985555013,
"test_comprehensive_masked_amin_cpu_float64 (__main__.TestInductorOpInfoCPU)": 108.29533386230469,
"test_comprehensive_masked_amin_cpu_int32 (__main__.TestInductorOpInfoCPU)": 101.06366729736328,
"test_comprehensive_masked_amin_cpu_int64 (__main__.TestInductorOpInfoCPU)": 111.66866556803386,
"test_comprehensive_masked_argmax_cpu_float16 (__main__.TestInductorOpInfoCPU)": 65.20666631062825,
"test_comprehensive_masked_argmax_cpu_float32 (__main__.TestInductorOpInfoCPU)": 66.2469991048177,
"test_comprehensive_masked_argmax_cpu_float64 (__main__.TestInductorOpInfoCPU)": 62.26433308919271,
"test_comprehensive_masked_argmax_cpu_int32 (__main__.TestInductorOpInfoCPU)": 65.90833282470703,
"test_comprehensive_masked_argmin_cpu_float16 (__main__.TestInductorOpInfoCPU)": 67.25066884358723,
"test_comprehensive_masked_argmin_cpu_float32 (__main__.TestInductorOpInfoCPU)": 63.0856679280599,
"test_comprehensive_masked_argmin_cpu_float64 (__main__.TestInductorOpInfoCPU)": 64.3423334757487,
"test_comprehensive_masked_argmin_cpu_int32 (__main__.TestInductorOpInfoCPU)": 62.418999989827476,
"test_comprehensive_masked_argmin_cpu_int64 (__main__.TestInductorOpInfoCPU)": 61.3716672261556,
"test_comprehensive_masked_mean_cpu_bool (__main__.TestInductorOpInfoCPU)": 107.6316655476888,
"test_comprehensive_masked_mean_cpu_float16 (__main__.TestInductorOpInfoCPU)": 105.95433298746745,
"test_comprehensive_masked_mean_cpu_float32 (__main__.TestInductorOpInfoCPU)": 108.12066650390625,
"test_comprehensive_masked_mean_cpu_float64 (__main__.TestInductorOpInfoCPU)": 107.28466542561848,
"test_comprehensive_masked_mean_cpu_int32 (__main__.TestInductorOpInfoCPU)": 107.82733408610027,
"test_comprehensive_masked_mean_cpu_int64 (__main__.TestInductorOpInfoCPU)": 103.07533264160156,
"test_comprehensive_masked_norm_cpu_float16 (__main__.TestInductorOpInfoCPU)": 530.9063313802084,
"test_comprehensive_masked_norm_cpu_float32 (__main__.TestInductorOpInfoCPU)": 531.5923258463541,
"test_comprehensive_masked_norm_cpu_float64 (__main__.TestInductorOpInfoCPU)": 522.8729858398438,
"test_comprehensive_masked_norm_cuda_float16 (__main__.TestInductorOpInfoCUDA)": 170.60566584269205,
"test_comprehensive_masked_norm_cuda_float32 (__main__.TestInductorOpInfoCUDA)": 148.06033198038736,
"test_comprehensive_masked_norm_cuda_float64 (__main__.TestInductorOpInfoCUDA)": 149.73183059692383,
"test_comprehensive_masked_prod_cpu_bool (__main__.TestInductorOpInfoCPU)": 106.41500091552734,
"test_comprehensive_masked_prod_cpu_float16 (__main__.TestInductorOpInfoCPU)": 109.46266428629558,
"test_comprehensive_masked_prod_cpu_float32 (__main__.TestInductorOpInfoCPU)": 108.69433339436848,
"test_comprehensive_masked_prod_cpu_float64 (__main__.TestInductorOpInfoCPU)": 111.31100209554036,
"test_comprehensive_masked_prod_cpu_int32 (__main__.TestInductorOpInfoCPU)": 103.59366607666016,
"test_comprehensive_masked_prod_cpu_int64 (__main__.TestInductorOpInfoCPU)": 98.89466603597005,
"test_comprehensive_masked_sum_cpu_bool (__main__.TestInductorOpInfoCPU)": 111.9769999186198,
"test_comprehensive_masked_sum_cpu_float16 (__main__.TestInductorOpInfoCPU)": 113.90066782633464,
"test_comprehensive_masked_sum_cpu_float32 (__main__.TestInductorOpInfoCPU)": 105.57700093587239,
"test_comprehensive_masked_sum_cpu_float64 (__main__.TestInductorOpInfoCPU)": 105.22766621907552,
"test_comprehensive_masked_sum_cpu_int32 (__main__.TestInductorOpInfoCPU)": 104.93033345540364,
"test_comprehensive_masked_sum_cpu_int64 (__main__.TestInductorOpInfoCPU)": 102.3076680501302,
"test_comprehensive_nn_functional_gaussian_nll_loss_cuda_float32 (__main__.TestDecompCUDA)": 78.71599960327148,
"test_comprehensive_nn_functional_gaussian_nll_loss_cuda_float64 (__main__.TestDecompCUDA)": 81.63083330790202,
"test_comprehensive_nn_functional_glu_cpu_float16 (__main__.TestInductorOpInfoCPU)": 83.04366556803386,
"test_comprehensive_nn_functional_glu_cpu_float32 (__main__.TestInductorOpInfoCPU)": 82.60833231608073,
"test_comprehensive_nn_functional_glu_cpu_float64 (__main__.TestInductorOpInfoCPU)": 82.17033386230469,
"test_comprehensive_nn_functional_grid_sample_cpu_float32 (__main__.TestDecompCPU)": 86.39266713460286,
"test_comprehensive_nn_functional_grid_sample_cpu_float64 (__main__.TestDecompCPU)": 87.72166442871094,
"test_comprehensive_nn_functional_grid_sample_cuda_float32 (__main__.TestDecompCUDA)": 179.57733662923178,
"test_comprehensive_nn_functional_grid_sample_cuda_float64 (__main__.TestDecompCUDA)": 199.76399993896484,
"test_comprehensive_nn_functional_interpolate_bicubic_cpu_uint8 (__main__.TestInductorOpInfoCPU)": 63.46200052897135,
"test_comprehensive_nn_functional_interpolate_bicubic_cuda_float32 (__main__.TestInductorOpInfoCUDA)": 78.04750061035156,
"test_comprehensive_nn_functional_interpolate_bicubic_cuda_float64 (__main__.TestInductorOpInfoCUDA)": 75.1818339029948,
"test_comprehensive_nn_functional_interpolate_trilinear_cuda_float32 (__main__.TestDecompCUDA)": 63.27016639709473,
"test_comprehensive_nn_functional_interpolate_trilinear_cuda_float64 (__main__.TestDecompCUDA)": 80.72016716003418,
"test_comprehensive_nn_functional_max_pool1d_cpu_float16 (__main__.TestInductorOpInfoCPU)": 188.21700032552084,
"test_comprehensive_nn_functional_max_pool1d_cpu_float32 (__main__.TestInductorOpInfoCPU)": 189.15300496419272,
"test_comprehensive_nn_functional_max_pool1d_cpu_float64 (__main__.TestInductorOpInfoCPU)": 191.53266398111978,
"test_comprehensive_nn_functional_max_pool2d_cpu_float16 (__main__.TestInductorOpInfoCPU)": 1001.8180135091146,
"test_comprehensive_nn_functional_max_pool2d_cpu_float32 (__main__.TestInductorOpInfoCPU)": 941.7516682942709,
"test_comprehensive_nn_functional_max_pool2d_cpu_float64 (__main__.TestInductorOpInfoCPU)": 957.2676798502604,
"test_comprehensive_nn_functional_max_pool2d_cpu_int32 (__main__.TestInductorOpInfoCPU)": 884.413330078125,
"test_comprehensive_nn_functional_max_pool2d_cpu_int64 (__main__.TestInductorOpInfoCPU)": 917.0406697591146,
"test_comprehensive_nn_functional_max_pool2d_cuda_float16 (__main__.TestInductorOpInfoCUDA)": 882.3416646321615,
"test_comprehensive_nn_functional_max_pool2d_cuda_float32 (__main__.TestInductorOpInfoCUDA)": 891.5490112304688,
"test_comprehensive_nn_functional_max_pool2d_cuda_float64 (__main__.TestInductorOpInfoCUDA)": 951.3874918619791,
"test_comprehensive_nn_functional_max_unpool2d_cpu_float16 (__main__.TestInductorOpInfoCPU)": 217.1499989827474,
"test_comprehensive_nn_functional_max_unpool2d_cpu_float32 (__main__.TestInductorOpInfoCPU)": 226.78500366210938,
"test_comprehensive_nn_functional_max_unpool2d_cpu_float64 (__main__.TestInductorOpInfoCPU)": 220.6536661783854,
"test_comprehensive_nn_functional_max_unpool2d_cuda_float16 (__main__.TestInductorOpInfoCUDA)": 62.534000396728516,
"test_comprehensive_nn_functional_max_unpool2d_cuda_float32 (__main__.TestInductorOpInfoCUDA)": 115.53050104777019,
"test_comprehensive_nn_functional_max_unpool2d_cuda_float64 (__main__.TestInductorOpInfoCUDA)": 111.29116821289062,
"test_comprehensive_nn_functional_max_unpool3d_cpu_float16 (__main__.TestInductorOpInfoCPU)": 147.32699584960938,
"test_comprehensive_nn_functional_max_unpool3d_cpu_float32 (__main__.TestInductorOpInfoCPU)": 146.26766459147134,
"test_comprehensive_nn_functional_max_unpool3d_cpu_float64 (__main__.TestInductorOpInfoCPU)": 149.46000162760416,
"test_comprehensive_nn_functional_pad_constant_cpu_float16 (__main__.TestInductorOpInfoCPU)": 80.33966827392578,
"test_comprehensive_nn_functional_pad_constant_cpu_float32 (__main__.TestInductorOpInfoCPU)": 77.02700297037761,
"test_comprehensive_nn_functional_pad_constant_cpu_float64 (__main__.TestInductorOpInfoCPU)": 78.06666564941406,
"test_comprehensive_nn_functional_pad_constant_cpu_int32 (__main__.TestInductorOpInfoCPU)": 66.0947225358751,
"test_comprehensive_nn_functional_pad_constant_cpu_int64 (__main__.TestInductorOpInfoCPU)": 79.26499938964844,
"test_comprehensive_nn_functional_poisson_nll_loss_cpu_float16 (__main__.TestInductorOpInfoCPU)": 141.70166524251303,
"test_comprehensive_nn_functional_poisson_nll_loss_cpu_float32 (__main__.TestInductorOpInfoCPU)": 142.16866811116537,
"test_comprehensive_nn_functional_poisson_nll_loss_cpu_float64 (__main__.TestInductorOpInfoCPU)": 128.4029998779297,
"test_comprehensive_nn_functional_poisson_nll_loss_cpu_int32 (__main__.TestInductorOpInfoCPU)": 124.0116678873698,
"test_comprehensive_nn_functional_poisson_nll_loss_cpu_int64 (__main__.TestInductorOpInfoCPU)": 126.01200103759766,
"test_comprehensive_nn_functional_unfold_cpu_bool (__main__.TestInductorOpInfoCPU)": 151.81866963704428,
"test_comprehensive_nn_functional_unfold_cpu_float16 (__main__.TestInductorOpInfoCPU)": 264.4179992675781,
"test_comprehensive_nn_functional_unfold_cpu_float32 (__main__.TestInductorOpInfoCPU)": 267.08266194661456,
"test_comprehensive_nn_functional_unfold_cpu_float64 (__main__.TestInductorOpInfoCPU)": 265.7936604817708,
"test_comprehensive_nn_functional_unfold_cuda_float16 (__main__.TestInductorOpInfoCUDA)": 85.77500025431316,
"test_comprehensive_nn_functional_unfold_cuda_float32 (__main__.TestInductorOpInfoCUDA)": 78.86816660563152,
"test_comprehensive_nn_functional_unfold_cuda_float64 (__main__.TestInductorOpInfoCUDA)": 79.76916758219402,
"test_comprehensive_ormqr_cuda_complex128 (__main__.TestDecompCUDA)": 95.18166605631511,
"test_comprehensive_ormqr_cuda_complex64 (__main__.TestDecompCUDA)": 91.77883275349934,
"test_comprehensive_ormqr_cuda_float32 (__main__.TestDecompCUDA)": 60.81966654459635,
"test_comprehensive_ormqr_cuda_float32 (__main__.TestInductorOpInfoCUDA)": 119.70216623942058,
"test_comprehensive_ormqr_cuda_float64 (__main__.TestInductorOpInfoCUDA)": 93.25683466593425,
"test_comprehensive_svd_cuda_complex128 (__main__.TestDecompCUDA)": 70.70699964250836,
"test_comprehensive_svd_lowrank_cuda_complex128 (__main__.TestDecompCUDA)": 61.070499420166016,
"test_cond_autograd_nested (__main__.TestControlFlow)": 79.72944344414606,
"test_constructor_autograd_SparseBSC_cuda (__main__.TestSparseAnyCUDA)": 117.21133550008138,
"test_constructor_autograd_SparseBSR_cuda (__main__.TestSparseAnyCUDA)": 95.2274996439616,
"test_constructor_autograd_SparseCSC_cuda (__main__.TestSparseAnyCUDA)": 77.67016474405925,
"test_constructor_autograd_SparseCSR_cuda (__main__.TestSparseAnyCUDA)": 69.53000020980835,
"test_conv1d_basic (__main__.TestXNNPACKConv1dTransformPass)": 198.49655405680338,
"test_conv1d_with_relu_fc (__main__.TestXNNPACKConv1dTransformPass)": 447.2755482991536,
"test_conv2d_unary_cpu_cpp_wrapper (__main__.TestCppWrapper)": 268.80133056640625,
"test_conv3d_cuda (__main__.AOTInductorTestABICompatibleGpu)": 135.77333323160806,
"test_conv_bn_fuse_dynamic_shapes_cpu (__main__.DynamicShapesCpuTests)": 60.003444247775604,
"test_conv_transpose_with_output_size_and_no_batch_dim_ConvTranspose3d_cuda (__main__.TestConvolutionNNDeviceTypeCUDA)": 114.27466656515996,
"test_correctness_AdamW_use_closure_False_cuda_float32 (__main__.CompiledOptimizerParityTestsCUDA)": 72.10799980163574,
"test_correctness_AdamW_use_closure_True_cuda_float32 (__main__.CompiledOptimizerParityTestsCUDA)": 123.51449966430664,
"test_correctness_Adam_use_closure_False_cuda_float32 (__main__.CompiledOptimizerParityTestsCUDA)": 67.44266573588054,
"test_correctness_Adam_use_closure_True_cuda_float32 (__main__.CompiledOptimizerParityTestsCUDA)": 124.48583348592122,
"test_correctness_NAdam_use_closure_True_cuda_float32 (__main__.CompiledOptimizerParityTestsCUDA)": 72.73799896240234,
"test_count_nonzero_all (__main__.TestBool)": 613.8192070855034,
"test_custom_module_lstm (__main__.TestQuantizedOps)": 387.75410630967883,
"test_ddp_uneven_inputs (__main__.TestDistBackendWithSpawn)": 186.20633189876875,
"test_dispatch_symbolic_meta_outplace_all_strides_nn_functional_gaussian_nll_loss_cuda_float32 (__main__.TestMetaCUDA)": 84.25950113932292,
"test_eig_check_magma_cuda_float32 (__main__.TestLinalgCUDA)": 152.92416445414224,
"test_fail_creation_ops.py (__main__.TestTyping)": 75.64839254106793,
"test_fn_fwgrad_bwgrad_cumprod_cuda_complex128 (__main__.TestFwdGradientsCUDA)": 70.79500071207683,
"test_fn_gradgrad_cumprod_cuda_complex128 (__main__.TestBwdGradientsCUDA)": 79.6708329518636,
"test_fn_gradgrad_map_nested_cpu_float64 (__main__.TestBwdGradientsCPU)": 77.31333414713542,
"test_fn_gradgrad_map_nested_cuda_float64 (__main__.TestBwdGradientsCUDA)": 60.696099281311035,
"test_fn_gradgrad_map_triple_nested_cpu_float64 (__main__.TestBwdGradientsCPU)": 461.1873270670573,
"test_fn_gradgrad_map_triple_nested_cuda_float64 (__main__.TestBwdGradientsCUDA)": 339.5521697998047,
"test_fuse_large_params_cpu (__main__.CpuTests)": 63.09900029500326,
"test_fuse_large_params_dynamic_shapes_cpu (__main__.DynamicShapesCodegenCpuTests)": 92.18155585394965,
"test_fuse_large_params_dynamic_shapes_cpu (__main__.DynamicShapesCpuTests)": 96.59077707926433,
"test_fuse_large_params_dynamic_shapes_cuda (__main__.DynamicShapesCodegenGPUTests)": 63.364166259765625,
"test_fuse_large_params_dynamic_shapes_cuda (__main__.DynamicShapesGPUTests)": 67.6820011138916,
"test_grad_nn_Transformer_cuda_float64 (__main__.TestModuleCUDA)": 80.87316767374675,
"test_gradgrad_nn_LSTM_eval_mode_cuda_float64 (__main__.TestModuleCUDA)": 99.19066619873047,
"test_gradgrad_nn_LSTM_train_mode_cuda_float64 (__main__.TestModuleCUDA)": 95.8260014851888,
"test_gradgrad_nn_TransformerDecoderLayer_cuda_float64 (__main__.TestModuleCUDA)": 184.47216796875,
"test_gradgrad_nn_TransformerEncoder_eval_mode_cuda_float64 (__main__.TestModuleCUDA)": 113.43166605631511,
"test_gradgrad_nn_TransformerEncoder_train_mode_cuda_float64 (__main__.TestModuleCUDA)": 125.3043327331543,
"test_grid_sampler_2d_cpu (__main__.CpuHalideTests)": 186.22100321451822,
"test_indexing (__main__.TestAutogradWithCompiledAutograd)": 70.04255633884006,
"test_indirect_device_assert (__main__.TritonCodeGenTests)": 189.80333455403647,
"test_inductor_no_recursionerror_on_for_loops_dynamic_shapes (__main__.DynamicShapesReproTests)": 72.33966615464952,
"test_inplace_gradgrad_cumprod_cuda_complex128 (__main__.TestBwdGradientsCUDA)": 80.61100006103516,
"test_inputs_overlapping_with_mutation_stress_dynamic_shapes (__main__.DynamicShapesAotAutogradFallbackTests)": 140.90377638075086,
"test_jit_cuda_archflags (__main__.TestCppExtensionJIT)": 111.77066548665364,
"test_linalg_solve_triangular_large_cuda_complex128 (__main__.TestLinalgCUDA)": 565.1104965209961,
"test_linalg_solve_triangular_large_cuda_complex64 (__main__.TestLinalgCUDA)": 71.39283434549968,
"test_linalg_solve_triangular_large_cuda_float64 (__main__.TestLinalgCUDA)": 65.84149837493896,
"test_linear (__main__.TestStaticQuantizedModule)": 147.759886847602,
"test_linear_binary_cpp_wrapper (__main__.TestCppWrapper)": 164.447998046875,
"test_linear_binary_dynamic_shapes_cpp_wrapper (__main__.DynamicShapesCppWrapperCpuTests)": 167.55933125813803,
"test_linear_binary_folding_cpu (__main__.FreezingCpuTests)": 60.865777757432724,
"test_linear_packed_cpp_wrapper (__main__.TestCppWrapper)": 81.31299845377605,
"test_linear_packed_dynamic_shapes_cpp_wrapper (__main__.DynamicShapesCppWrapperCpuTests)": 76.33000183105469,
"test_lobpcg_ortho_cuda_float64 (__main__.TestLinalgCUDA)": 76.25166829427083,
"test_lstm_cpu (__main__.TestMkldnnCPU)": 84.14966710408528,
"test_many_overlapping_inputs_does_not_explode_guards_dynamic_shapes (__main__.DynamicShapesReproTests)": 109.88477749294705,
"test_max_autotune_cutlass_backend_addmm_dynamic_False_max_autotune_gemm_backends_ATen,Triton,CUTLASS (__main__.TestCutlassBackend)": 84.41333262125652,
"test_max_pool2d_with_indices_backward4_dynamic_shapes_cpu (__main__.DynamicShapesCodegenCpuTests)": 64.33055538601346,
"test_max_pool2d_with_indices_backward4_dynamic_shapes_cpu (__main__.DynamicShapesCpuTests)": 63.2979990641276,
"test_mixed_mm_exhaustive_dtypes (__main__.TestPatternMatcher)": 67.55066744486491,
"test_proper_exit (__main__.TestDataLoader)": 224.79383595784506,
"test_proper_exit (__main__.TestDataLoaderPersistentWorkers)": 217.4080022176107,
"test_put_cuda_uint8 (__main__.TestTorchDeviceTypeCUDA)": 103.19804314888704,
"test_python_ref_executor__refs_special_zeta_executor_aten_cuda_float64 (__main__.TestCommonCUDA)": 60.95939979553223,
"test_qconv2d_add_cpu_cpp_wrapper (__main__.TestCppWrapper)": 62.51866658528646,
"test_qconv2d_add_cpu_dynamic_shapes_cpp_wrapper (__main__.DynamicShapesCppWrapperCpuTests)": 63.23300043741862,
"test_qconv2d_add_relu_cpu_cpp_wrapper (__main__.TestCppWrapper)": 62.45500055948893,
"test_qconv2d_add_relu_cpu_dynamic_shapes_cpp_wrapper (__main__.DynamicShapesCppWrapperCpuTests)": 63.74866739908854,
"test_qlinear_add_int8_mixed_bf16_use_relu_False_is_qat_False_is_dynamic_False (__main__.TestPatternMatcher)": 73.47400156656902,
"test_qlinear_add_int8_mixed_bf16_use_relu_False_is_qat_False_is_dynamic_False_cpp_wrapper (__main__.TestCppWrapper)": 111.55533345540364,
"test_qlinear_add_int8_mixed_bf16_use_relu_False_is_qat_False_is_dynamic_False_dynamic_shapes_cpp_wrapper (__main__.DynamicShapesCppWrapperCpuTests)": 113.39233144124348,
"test_qlinear_add_int8_mixed_bf16_use_relu_False_is_qat_False_is_dynamic_True (__main__.TestPatternMatcher)": 71.40777672661676,
"test_qlinear_add_int8_mixed_bf16_use_relu_False_is_qat_False_is_dynamic_True_cpp_wrapper (__main__.TestCppWrapper)": 114.24800109863281,
"test_qlinear_add_int8_mixed_bf16_use_relu_False_is_qat_False_is_dynamic_True_dynamic_shapes_cpp_wrapper (__main__.DynamicShapesCppWrapperCpuTests)": 113.41766611735027,
"test_qlinear_add_int8_mixed_bf16_use_relu_False_is_qat_True_is_dynamic_False (__main__.TestPatternMatcher)": 65.87688954671223,
"test_qlinear_add_int8_mixed_bf16_use_relu_False_is_qat_True_is_dynamic_False_cpp_wrapper (__main__.TestCppWrapper)": 107.47800191243489,
"test_qlinear_add_int8_mixed_bf16_use_relu_False_is_qat_True_is_dynamic_False_dynamic_shapes_cpp_wrapper (__main__.DynamicShapesCppWrapperCpuTests)": 113.447998046875,
"test_qlinear_add_int8_mixed_bf16_use_relu_False_is_qat_True_is_dynamic_True (__main__.TestPatternMatcher)": 68.04311116536458,
"test_qlinear_add_int8_mixed_bf16_use_relu_False_is_qat_True_is_dynamic_True_cpp_wrapper (__main__.TestCppWrapper)": 115.14266459147136,
"test_qlinear_add_int8_mixed_bf16_use_relu_False_is_qat_True_is_dynamic_True_dynamic_shapes_cpp_wrapper (__main__.DynamicShapesCppWrapperCpuTests)": 115.07366434733073,
"test_qlinear_add_int8_mixed_bf16_use_relu_True_is_qat_False_is_dynamic_False (__main__.TestPatternMatcher)": 76.1270014444987,
"test_qlinear_add_int8_mixed_bf16_use_relu_True_is_qat_False_is_dynamic_False_cpp_wrapper (__main__.TestCppWrapper)": 113.39599863688152,
"test_qlinear_add_int8_mixed_bf16_use_relu_True_is_qat_False_is_dynamic_False_dynamic_shapes_cpp_wrapper (__main__.DynamicShapesCppWrapperCpuTests)": 114.23433176676433,
"test_qlinear_add_int8_mixed_bf16_use_relu_True_is_qat_False_is_dynamic_True (__main__.TestPatternMatcher)": 71.46933237711589,
"test_qlinear_add_int8_mixed_bf16_use_relu_True_is_qat_False_is_dynamic_True_cpp_wrapper (__main__.TestCppWrapper)": 113.58066813151042,
"test_qlinear_add_int8_mixed_bf16_use_relu_True_is_qat_False_is_dynamic_True_dynamic_shapes_cpp_wrapper (__main__.DynamicShapesCppWrapperCpuTests)": 110.88400014241536,
"test_qlinear_add_int8_mixed_bf16_use_relu_True_is_qat_True_is_dynamic_False (__main__.TestPatternMatcher)": 65.69477844238281,
"test_qlinear_add_int8_mixed_bf16_use_relu_True_is_qat_True_is_dynamic_False_cpp_wrapper (__main__.TestCppWrapper)": 107.49266560872395,
"test_qlinear_add_int8_mixed_bf16_use_relu_True_is_qat_True_is_dynamic_False_dynamic_shapes_cpp_wrapper (__main__.DynamicShapesCppWrapperCpuTests)": 114.12266540527344,
"test_qlinear_add_int8_mixed_bf16_use_relu_True_is_qat_True_is_dynamic_True (__main__.TestPatternMatcher)": 75.25133514404297,
"test_qlinear_add_int8_mixed_bf16_use_relu_True_is_qat_True_is_dynamic_True_cpp_wrapper (__main__.TestCppWrapper)": 115.43599955240886,
"test_qlinear_add_int8_mixed_bf16_use_relu_True_is_qat_True_is_dynamic_True_dynamic_shapes_cpp_wrapper (__main__.DynamicShapesCppWrapperCpuTests)": 113.93733215332031,
"test_quick_core_backward__unsafe_masked_index_cpu_float64 (__main__.TestDecompCPU)": 319.4066670735677,
"test_quick_core_backward__unsafe_masked_index_cuda_float64 (__main__.TestDecompCUDA)": 617.1271667480469,
"test_quick_core_backward__unsafe_masked_index_put_accumulate_cpu_float64 (__main__.TestDecompCPU)": 555.4753214518229,
"test_quick_core_backward__unsafe_masked_index_put_accumulate_cuda_float64 (__main__.TestDecompCUDA)": 895.808827718099,
"test_quick_core_backward_nn_functional_max_unpool3d_grad_cpu_float64 (__main__.TestDecompCPU)": 71.04066721598308,
"test_quick_core_backward_nn_functional_max_unpool3d_grad_cuda_float64 (__main__.TestDecompCUDA)": 186.27233378092447,
"test_quick_core_backward_roll_cpu_float64 (__main__.TestDecompCPU)": 93.46799977620442,
"test_quick_core_backward_roll_cuda_float64 (__main__.TestDecompCUDA)": 146.96949895222983,
"test_quick_core_backward_select_scatter_cuda_float64 (__main__.TestDecompCUDA)": 101.87816492716472,
"test_quick_core_backward_split_cuda_float64 (__main__.TestDecompCUDA)": 60.058855874197825,
"test_quick_core_backward_split_with_sizes_copy_cpu_float64 (__main__.TestDecompCPU)": 74.16299947102864,
"test_quick_core_backward_split_with_sizes_copy_cuda_float64 (__main__.TestDecompCUDA)": 117.55266952514648,
"test_quick_core_backward_std_cuda_float64 (__main__.TestDecompCUDA)": 80.77400080362956,
"test_replicatepad_64bit_indexing_cuda_float16 (__main__.TestNNDeviceTypeCUDA)": 332.54766845703125,
"test_rosenbrock_sparse_with_lrsched_False_SGD_cuda_float64 (__main__.TestOptimRenewedCUDA)": 90.56116612752278,
"test_rosenbrock_sparse_with_lrsched_True_SGD_cuda_float64 (__main__.TestOptimRenewedCUDA)": 102.87433195114136,
"test_save_load_large_string_attribute (__main__.TestSaveLoad)": 114.60433197021484,
"test_shuffler_iterdatapipe (__main__.IntegrationTestDataLoaderDataPipe)": 163.62533145480685,
"test_slow_tasks (__main__.TestFunctionalAutogradBenchmark)": 107.40444437662761,
"test_sum_all_cpu_float64 (__main__.TestReductionsCPU)": 284.4367377569002,
"test_svd_lowrank_cuda_complex128 (__main__.TestLinalgCUDA)": 157.5870008468628,
"test_terminate_handler_on_crash (__main__.TestTorch)": 97.66699902216594,
"test_terminate_signal (__main__.ForkTest)": 130.4108906057146,
"test_terminate_signal (__main__.ParallelForkServerShouldWorkTest)": 130.55344214538732,
"test_terminate_signal (__main__.SpawnTest)": 133.65200106302896,
"test_train_parity_multi_group (__main__.TestFullyShard1DTrainingCore)": 117.12999943544855,
"test_transpose_copy (__main__.CPUReproTests)": 75.40855577256944,
"test_triton_bsr_scatter_mm_blocksize_64_cuda_bfloat16 (__main__.TestSparseCompressedTritonKernelsCUDA)": 63.13999875386556,
"test_triton_bsr_scatter_mm_blocksize_64_cuda_float32 (__main__.TestSparseCompressedTritonKernelsCUDA)": 66.69533348083496,
"test_triton_bsr_softmax_cuda_bfloat16 (__main__.TestSparseCompressedTritonKernelsCUDA)": 160.92549896240234,
"test_triton_bsr_softmax_cuda_float16 (__main__.TestSparseCompressedTritonKernelsCUDA)": 147.94483184814453,
"test_triton_bsr_softmax_cuda_float32 (__main__.TestSparseCompressedTritonKernelsCUDA)": 119.7986691792806,
"test_unary_ops (__main__.TestTEFuserDynamic)": 190.41244761149088,
"test_unary_ops (__main__.TestTEFuserStatic)": 165.1259978612264,
"test_upsample_bicubic2d_cpu (__main__.CpuHalideTests)": 96.73766581217448,
"test_variant_consistency_jit_nn_functional_max_pool2d_cpu_float32 (__main__.TestJitCPU)": 88.42266591389973,
"test_variant_consistency_jit_nn_functional_max_pool2d_cuda_float32 (__main__.TestJitCUDA)": 71.24600028991699,
"test_vec_bitwise (__main__.CPUReproTests)": 63.55355538262261,
"test_vec_compare_op_cpu_only (__main__.CPUReproTests)": 66.54970640294692,
"test_views1_dynamic_shapes_cpu (__main__.DynamicShapesCpuTests)": 61.20033391316732,
"test_vmapjvpvjp_linalg_lu_solve_cpu_float32 (__main__.TestOperatorsCPU)": 60.52709543137323,
"test_vmapjvpvjp_linalg_lu_solve_cuda_float32 (__main__.TestOperatorsCUDA)": 70.6786657969157,
"test_vmapjvpvjp_linalg_multi_dot_cuda_float32 (__main__.TestOperatorsCUDA)": 72.03637456893921,
"test_vmapjvpvjp_linalg_solve_triangular_cuda_float32 (__main__.TestOperatorsCUDA)": 68.06242861066546,
"test_vmapjvpvjp_linalg_svd_cuda_float32 (__main__.TestOperatorsCUDA)": 62.29850069681803,
"test_vmapjvpvjp_max_pool2d_with_indices_backward_cpu_float32 (__main__.TestOperatorsCPU)": 99.96300252278645,
"test_vmapjvpvjp_max_pool2d_with_indices_backward_cuda_float32 (__main__.TestOperatorsCUDA)": 73.61033248901367,
"test_vmapjvpvjp_nn_functional_max_pool2d_cpu_float32 (__main__.TestOperatorsCPU)": 69.7383321126302,
"test_vmapjvpvjp_nn_functional_max_pool2d_cuda_float32 (__main__.TestOperatorsCUDA)": 67.93116633097331,
"test_vmapjvpvjp_svd_cuda_float32 (__main__.TestOperatorsCUDA)": 67.69150098164876,
"test_vmapjvpvjp_unbind_cuda_float32 (__main__.TestOperatorsCUDA)": 75.51783498128255,
"test_vmapvjpvjp_meshgrid_list_of_tensors_cuda_float32 (__main__.TestOperatorsCUDA)": 71.56416575113933,
"test_vmapvjpvjp_meshgrid_variadic_tensors_cuda_float32 (__main__.TestOperatorsCUDA)": 71.6493345896403,
"test_vmapvjpvjp_nn_functional_bilinear_cuda_float32 (__main__.TestOperatorsCUDA)": 132.8029988606771
}