forked from pytorch/pytorch
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathslow_tests.json
303 lines (303 loc) · 29.8 KB
/
slow_tests.json
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
{
"EndToEndLSTM (__main__.RNNTest)": 229.8376668294271,
"MultiheadAttention (__main__.ModulesTest)": 174.3863321940104,
"test_AllenaiLongformerBase_repro_cpu (__main__.CpuHalideTests)": 215.5643310546875,
"test__adaptive_avg_pool2d (__main__.CPUReproTests)": 161.98111300998264,
"test_adaptive_max_pool2d1_cpu (__main__.CpuHalideTests)": 113.75666809082031,
"test_after_aot_cpu_runtime_error (__main__.MinifierIsolateTests)": 64.25511169433594,
"test_alexnet_prefix_cpu (__main__.CpuHalideTests)": 191.23233032226562,
"test_aot_autograd_exhaustive_nn_functional_max_pool2d_cpu_float32 (__main__.TestEagerFusionOpInfoCPU)": 79.67633438110352,
"test_aot_autograd_symbolic_exhaustive_nn_functional_max_pool1d_cpu_float32 (__main__.TestEagerFusionOpInfoCPU)": 101.65633138020833,
"test_aot_autograd_symbolic_exhaustive_nn_functional_max_pool2d_cpu_float32 (__main__.TestEagerFusionOpInfoCPU)": 173.72899881998697,
"test_aot_autograd_symbolic_exhaustive_nn_functional_max_pool3d_cpu_float32 (__main__.TestEagerFusionOpInfoCPU)": 108.35699971516927,
"test_aot_autograd_symbolic_module_exhaustive_nn_TransformerDecoderLayer_cpu_float32 (__main__.TestEagerFusionModuleInfoCPU)": 110.7040023803711,
"test_avg_pool3d_backward2_cpu (__main__.CpuTests)": 500.4296705457899,
"test_avg_pool3d_backward2_cuda (__main__.GPUTests)": 96.10950088500977,
"test_avg_pool3d_backward2_dynamic_shapes_cpu (__main__.DynamicShapesCodegenCpuTests)": 509.93289862738715,
"test_avg_pool3d_backward2_dynamic_shapes_cpu (__main__.DynamicShapesCpuTests)": 500.96044582790796,
"test_avg_pool3d_backward2_dynamic_shapes_cuda (__main__.DynamicShapesGPUTests)": 127.26850001017253,
"test_avg_pool3d_backward_cpu (__main__.CpuHalideTests)": 61.640332539876304,
"test_backward_nn_functional_multi_head_attention_forward_cpu_float32 (__main__.TestCompositeComplianceCPU)": 76.84266662597656,
"test_backward_nn_functional_multi_head_attention_forward_cuda_float32 (__main__.TestCompositeComplianceCUDA)": 69.95100021362305,
"test_basic_cpu (__main__.EfficientConvBNEvalCpuTests)": 317.9998897976345,
"test_basic_cuda (__main__.EfficientConvBNEvalGpuTests)": 113.68183263142903,
"test_builtin_equivalent_funcs (__main__.TorchFunctionModeTests)": 89.66218733787537,
"test_collect_callgrind (__main__.TestBenchmarkUtils)": 349.2376641167535,
"test_comprehensive_constant_pad_nd_cpu_float16 (__main__.TestInductorOpInfoCPU)": 68.63999938964844,
"test_comprehensive_constant_pad_nd_cpu_float32 (__main__.TestInductorOpInfoCPU)": 75.47799936930339,
"test_comprehensive_constant_pad_nd_cpu_float64 (__main__.TestInductorOpInfoCPU)": 67.66733296712239,
"test_comprehensive_constant_pad_nd_cpu_int32 (__main__.TestInductorOpInfoCPU)": 64.68133290608723,
"test_comprehensive_constant_pad_nd_cpu_int64 (__main__.TestInductorOpInfoCPU)": 67.66033426920573,
"test_comprehensive_diff_cpu_bool (__main__.TestInductorOpInfoCPU)": 102.59533437093098,
"test_comprehensive_diff_cpu_float32 (__main__.TestInductorOpInfoCPU)": 100.57566833496094,
"test_comprehensive_diff_cpu_float64 (__main__.TestInductorOpInfoCPU)": 98.92966715494792,
"test_comprehensive_diff_cpu_int32 (__main__.TestInductorOpInfoCPU)": 103.16966501871745,
"test_comprehensive_diff_cpu_int64 (__main__.TestInductorOpInfoCPU)": 99.22633616129558,
"test_comprehensive_diff_cuda_complex128 (__main__.TestDecompCUDA)": 88.25283177693684,
"test_comprehensive_diff_cuda_complex64 (__main__.TestDecompCUDA)": 91.74633280436198,
"test_comprehensive_diff_cuda_float32 (__main__.TestDecompCUDA)": 62.82866668701172,
"test_comprehensive_diff_cuda_float64 (__main__.TestDecompCUDA)": 62.4391663869222,
"test_comprehensive_dist_cpu_float16 (__main__.TestInductorOpInfoCPU)": 80.94733428955078,
"test_comprehensive_dist_cpu_float32 (__main__.TestInductorOpInfoCPU)": 79.75499979654948,
"test_comprehensive_dist_cpu_float64 (__main__.TestInductorOpInfoCPU)": 84.87999979654948,
"test_comprehensive_eye_cpu_bool (__main__.TestInductorOpInfoCPU)": 124.50833384195964,
"test_comprehensive_eye_cpu_float16 (__main__.TestInductorOpInfoCPU)": 119.09133656819661,
"test_comprehensive_eye_cpu_float32 (__main__.TestInductorOpInfoCPU)": 118.83500162760417,
"test_comprehensive_eye_cpu_float64 (__main__.TestInductorOpInfoCPU)": 137.94300333658853,
"test_comprehensive_eye_cpu_int32 (__main__.TestInductorOpInfoCPU)": 132.7836710611979,
"test_comprehensive_eye_cpu_int64 (__main__.TestInductorOpInfoCPU)": 119.86732991536458,
"test_comprehensive_grid_sampler_2d_cpu_bfloat16 (__main__.TestDecompCPU)": 72.27933502197266,
"test_comprehensive_grid_sampler_2d_cpu_float16 (__main__.TestDecompCPU)": 77.07999928792317,
"test_comprehensive_grid_sampler_2d_cpu_float16 (__main__.TestInductorOpInfoCPU)": 86.1326675415039,
"test_comprehensive_grid_sampler_2d_cpu_float32 (__main__.TestDecompCPU)": 330.5853271484375,
"test_comprehensive_grid_sampler_2d_cpu_float32 (__main__.TestInductorOpInfoCPU)": 81.49166615804036,
"test_comprehensive_grid_sampler_2d_cpu_float64 (__main__.TestDecompCPU)": 393.1456604003906,
"test_comprehensive_grid_sampler_2d_cpu_float64 (__main__.TestInductorOpInfoCPU)": 81.26866658528645,
"test_comprehensive_grid_sampler_2d_cuda_bfloat16 (__main__.TestDecompCUDA)": 245.7971623738607,
"test_comprehensive_grid_sampler_2d_cuda_float16 (__main__.TestDecompCUDA)": 274.08716837565106,
"test_comprehensive_grid_sampler_2d_cuda_float32 (__main__.TestDecompCUDA)": 1144.0211791992188,
"test_comprehensive_grid_sampler_2d_cuda_float32 (__main__.TestInductorOpInfoCUDA)": 79.30233256022136,
"test_comprehensive_grid_sampler_2d_cuda_float64 (__main__.TestDecompCUDA)": 1103.6513366699219,
"test_comprehensive_grid_sampler_2d_cuda_float64 (__main__.TestInductorOpInfoCUDA)": 85.02083333333333,
"test_comprehensive_linalg_lu_solve_cuda_float32 (__main__.TestInductorOpInfoCUDA)": 68.16633478800456,
"test_comprehensive_linalg_lu_solve_cuda_float64 (__main__.TestInductorOpInfoCUDA)": 66.05233383178711,
"test_comprehensive_linalg_solve_triangular_cuda_float32 (__main__.TestInductorOpInfoCUDA)": 66.81266657511394,
"test_comprehensive_linalg_svd_cuda_complex128 (__main__.TestDecompCUDA)": 62.804999669392906,
"test_comprehensive_linalg_svd_cuda_complex64 (__main__.TestDecompCUDA)": 62.844091242009945,
"test_comprehensive_linalg_vector_norm_cpu_float16 (__main__.TestInductorOpInfoCPU)": 194.66766866048178,
"test_comprehensive_linalg_vector_norm_cpu_float32 (__main__.TestInductorOpInfoCPU)": 205.99666849772134,
"test_comprehensive_linalg_vector_norm_cpu_float64 (__main__.TestInductorOpInfoCPU)": 195.67166646321616,
"test_comprehensive_linalg_vector_norm_cuda_float32 (__main__.TestInductorOpInfoCUDA)": 69.10999870300293,
"test_comprehensive_linalg_vector_norm_cuda_float64 (__main__.TestInductorOpInfoCUDA)": 65.0721664428711,
"test_comprehensive_logspace_cpu_float32 (__main__.TestInductorOpInfoCPU)": 414.8839925130208,
"test_comprehensive_logspace_cpu_float64 (__main__.TestInductorOpInfoCPU)": 412.32166544596356,
"test_comprehensive_logspace_cpu_int32 (__main__.TestInductorOpInfoCPU)": 401.39966837565106,
"test_comprehensive_logspace_cpu_int64 (__main__.TestInductorOpInfoCPU)": 390.77866617838544,
"test_comprehensive_logspace_cuda_float32 (__main__.TestInductorOpInfoCUDA)": 78.93299929300944,
"test_comprehensive_logspace_cuda_float64 (__main__.TestInductorOpInfoCUDA)": 72.82900110880534,
"test_comprehensive_masked_amax_cpu_float16 (__main__.TestInductorOpInfoCPU)": 96.87200164794922,
"test_comprehensive_masked_amax_cpu_float32 (__main__.TestInductorOpInfoCPU)": 92.11366780598958,
"test_comprehensive_masked_amax_cpu_float64 (__main__.TestInductorOpInfoCPU)": 100.53333282470703,
"test_comprehensive_masked_amax_cpu_int32 (__main__.TestInductorOpInfoCPU)": 90.97166442871094,
"test_comprehensive_masked_amax_cpu_int64 (__main__.TestInductorOpInfoCPU)": 87.79233296712239,
"test_comprehensive_masked_amin_cpu_float16 (__main__.TestInductorOpInfoCPU)": 94.58599853515625,
"test_comprehensive_masked_amin_cpu_float32 (__main__.TestInductorOpInfoCPU)": 93.4509989420573,
"test_comprehensive_masked_amin_cpu_float64 (__main__.TestInductorOpInfoCPU)": 94.32966613769531,
"test_comprehensive_masked_amin_cpu_int32 (__main__.TestInductorOpInfoCPU)": 90.03700256347656,
"test_comprehensive_masked_amin_cpu_int64 (__main__.TestInductorOpInfoCPU)": 93.39566802978516,
"test_comprehensive_masked_mean_cpu_float16 (__main__.TestInductorOpInfoCPU)": 98.01566823323567,
"test_comprehensive_masked_mean_cpu_float32 (__main__.TestInductorOpInfoCPU)": 90.41866556803386,
"test_comprehensive_masked_mean_cpu_float64 (__main__.TestInductorOpInfoCPU)": 95.50266774495442,
"test_comprehensive_masked_norm_cpu_float16 (__main__.TestInductorOpInfoCPU)": 467.54233805338544,
"test_comprehensive_masked_norm_cpu_float32 (__main__.TestInductorOpInfoCPU)": 443.7260030110677,
"test_comprehensive_masked_norm_cpu_float64 (__main__.TestInductorOpInfoCPU)": 446.0713297526042,
"test_comprehensive_masked_norm_cuda_float16 (__main__.TestInductorOpInfoCUDA)": 150.5536677042643,
"test_comprehensive_masked_norm_cuda_float32 (__main__.TestInductorOpInfoCUDA)": 140.2658322652181,
"test_comprehensive_masked_norm_cuda_float64 (__main__.TestInductorOpInfoCUDA)": 153.99183400472006,
"test_comprehensive_masked_prod_cpu_bool (__main__.TestInductorOpInfoCPU)": 88.32300059000652,
"test_comprehensive_masked_prod_cpu_float16 (__main__.TestInductorOpInfoCPU)": 97.0759989420573,
"test_comprehensive_masked_prod_cpu_float32 (__main__.TestInductorOpInfoCPU)": 91.01266733805339,
"test_comprehensive_masked_prod_cpu_float64 (__main__.TestInductorOpInfoCPU)": 93.87366739908855,
"test_comprehensive_masked_prod_cpu_int32 (__main__.TestInductorOpInfoCPU)": 92.1096674601237,
"test_comprehensive_masked_prod_cpu_int64 (__main__.TestInductorOpInfoCPU)": 84.76466623942058,
"test_comprehensive_masked_sum_cpu_bool (__main__.TestInductorOpInfoCPU)": 86.6510009765625,
"test_comprehensive_masked_sum_cpu_float16 (__main__.TestInductorOpInfoCPU)": 90.11199951171875,
"test_comprehensive_masked_sum_cpu_float32 (__main__.TestInductorOpInfoCPU)": 88.02433268229167,
"test_comprehensive_masked_sum_cpu_float64 (__main__.TestInductorOpInfoCPU)": 97.89900207519531,
"test_comprehensive_masked_sum_cpu_int32 (__main__.TestInductorOpInfoCPU)": 95.11266581217448,
"test_comprehensive_masked_sum_cpu_int64 (__main__.TestInductorOpInfoCPU)": 84.61399841308594,
"test_comprehensive_nn_functional_gaussian_nll_loss_cuda_float32 (__main__.TestDecompCUDA)": 89.23933283487956,
"test_comprehensive_nn_functional_gaussian_nll_loss_cuda_float64 (__main__.TestDecompCUDA)": 115.32566706339519,
"test_comprehensive_nn_functional_glu_cpu_float16 (__main__.TestInductorOpInfoCPU)": 74.7903340657552,
"test_comprehensive_nn_functional_glu_cpu_float32 (__main__.TestInductorOpInfoCPU)": 71.64700063069661,
"test_comprehensive_nn_functional_glu_cpu_float64 (__main__.TestInductorOpInfoCPU)": 71.22733052571614,
"test_comprehensive_nn_functional_grid_sample_cpu_float32 (__main__.TestDecompCPU)": 90.17799886067708,
"test_comprehensive_nn_functional_grid_sample_cpu_float64 (__main__.TestDecompCPU)": 79.68099975585938,
"test_comprehensive_nn_functional_grid_sample_cuda_bfloat16 (__main__.TestDecompCUDA)": 75.66366704305013,
"test_comprehensive_nn_functional_grid_sample_cuda_float32 (__main__.TestDecompCUDA)": 277.0806655883789,
"test_comprehensive_nn_functional_grid_sample_cuda_float64 (__main__.TestDecompCUDA)": 260.9174982706706,
"test_comprehensive_nn_functional_interpolate_bicubic_cpu_uint8 (__main__.TestInductorOpInfoCPU)": 70.82966613769531,
"test_comprehensive_nn_functional_interpolate_bicubic_cuda_float32 (__main__.TestInductorOpInfoCUDA)": 70.04833285013835,
"test_comprehensive_nn_functional_interpolate_bicubic_cuda_float64 (__main__.TestDecompCUDA)": 61.33900139548562,
"test_comprehensive_nn_functional_interpolate_bicubic_cuda_float64 (__main__.TestInductorOpInfoCUDA)": 68.59516588846843,
"test_comprehensive_nn_functional_interpolate_trilinear_cuda_float32 (__main__.TestDecompCUDA)": 75.75699869791667,
"test_comprehensive_nn_functional_interpolate_trilinear_cuda_float64 (__main__.TestDecompCUDA)": 75.6755002339681,
"test_comprehensive_nn_functional_max_pool1d_cpu_float16 (__main__.TestInductorOpInfoCPU)": 180.02766927083334,
"test_comprehensive_nn_functional_max_pool1d_cpu_float32 (__main__.TestInductorOpInfoCPU)": 178.16299947102866,
"test_comprehensive_nn_functional_max_pool1d_cpu_float64 (__main__.TestInductorOpInfoCPU)": 174.13199869791666,
"test_comprehensive_nn_functional_max_pool2d_cpu_float16 (__main__.TestInductorOpInfoCPU)": 940.4483235677084,
"test_comprehensive_nn_functional_max_pool2d_cpu_float32 (__main__.TestInductorOpInfoCPU)": 888.3410034179688,
"test_comprehensive_nn_functional_max_pool2d_cpu_float64 (__main__.TestInductorOpInfoCPU)": 869.0559895833334,
"test_comprehensive_nn_functional_max_pool2d_cpu_int32 (__main__.TestInductorOpInfoCPU)": 858.8390096028646,
"test_comprehensive_nn_functional_max_pool2d_cpu_int64 (__main__.TestInductorOpInfoCPU)": 838.17333984375,
"test_comprehensive_nn_functional_max_pool2d_cuda_float16 (__main__.TestInductorOpInfoCUDA)": 823.9383341471354,
"test_comprehensive_nn_functional_max_pool2d_cuda_float32 (__main__.TestInductorOpInfoCUDA)": 819.8829956054688,
"test_comprehensive_nn_functional_max_pool2d_cuda_float64 (__main__.TestInductorOpInfoCUDA)": 788.756337483724,
"test_comprehensive_nn_functional_max_unpool2d_cpu_float16 (__main__.TestInductorOpInfoCPU)": 193.07699584960938,
"test_comprehensive_nn_functional_max_unpool2d_cpu_float32 (__main__.TestInductorOpInfoCPU)": 201.44400024414062,
"test_comprehensive_nn_functional_max_unpool2d_cpu_float64 (__main__.TestInductorOpInfoCPU)": 196.91666666666666,
"test_comprehensive_nn_functional_max_unpool2d_cuda_float16 (__main__.TestInductorOpInfoCUDA)": 68.22283299763997,
"test_comprehensive_nn_functional_max_unpool2d_cuda_float32 (__main__.TestInductorOpInfoCUDA)": 63.90866661071777,
"test_comprehensive_nn_functional_max_unpool2d_cuda_float64 (__main__.TestInductorOpInfoCUDA)": 63.90783373514811,
"test_comprehensive_nn_functional_max_unpool3d_cpu_float16 (__main__.TestInductorOpInfoCPU)": 124.9623311360677,
"test_comprehensive_nn_functional_max_unpool3d_cpu_float32 (__main__.TestInductorOpInfoCPU)": 131.98700205485025,
"test_comprehensive_nn_functional_max_unpool3d_cpu_float64 (__main__.TestInductorOpInfoCPU)": 138.47733306884766,
"test_comprehensive_nn_functional_pad_constant_cpu_float16 (__main__.TestInductorOpInfoCPU)": 68.03933207194011,
"test_comprehensive_nn_functional_pad_constant_cpu_float32 (__main__.TestInductorOpInfoCPU)": 70.57266743977864,
"test_comprehensive_nn_functional_pad_constant_cpu_float64 (__main__.TestInductorOpInfoCPU)": 75.55066680908203,
"test_comprehensive_nn_functional_pad_constant_cpu_int32 (__main__.TestInductorOpInfoCPU)": 69.642333984375,
"test_comprehensive_nn_functional_pad_constant_cpu_int64 (__main__.TestInductorOpInfoCPU)": 67.43800099690755,
"test_comprehensive_nn_functional_poisson_nll_loss_cpu_float16 (__main__.TestInductorOpInfoCPU)": 114.35599772135417,
"test_comprehensive_nn_functional_poisson_nll_loss_cpu_float32 (__main__.TestInductorOpInfoCPU)": 124.9423319498698,
"test_comprehensive_nn_functional_poisson_nll_loss_cpu_float64 (__main__.TestInductorOpInfoCPU)": 136.78433481852213,
"test_comprehensive_nn_functional_poisson_nll_loss_cpu_int32 (__main__.TestInductorOpInfoCPU)": 110.93899790445964,
"test_comprehensive_nn_functional_poisson_nll_loss_cpu_int64 (__main__.TestInductorOpInfoCPU)": 110.34000142415364,
"test_comprehensive_nn_functional_unfold_cpu_bool (__main__.TestInductorOpInfoCPU)": 122.99199930826823,
"test_comprehensive_nn_functional_unfold_cpu_float16 (__main__.TestInductorOpInfoCPU)": 230.59066772460938,
"test_comprehensive_nn_functional_unfold_cpu_float32 (__main__.TestInductorOpInfoCPU)": 227.24933369954428,
"test_comprehensive_nn_functional_unfold_cpu_float64 (__main__.TestInductorOpInfoCPU)": 225.70667012532553,
"test_comprehensive_ormqr_cuda_complex128 (__main__.TestDecompCUDA)": 107.86883290608723,
"test_comprehensive_ormqr_cuda_complex64 (__main__.TestDecompCUDA)": 108.24150085449219,
"test_comprehensive_ormqr_cuda_float32 (__main__.TestDecompCUDA)": 95.49149958292644,
"test_comprehensive_ormqr_cuda_float32 (__main__.TestInductorOpInfoCUDA)": 76.73016738891602,
"test_comprehensive_ormqr_cuda_float64 (__main__.TestDecompCUDA)": 91.6338342030843,
"test_comprehensive_ormqr_cuda_float64 (__main__.TestInductorOpInfoCUDA)": 67.95566622416179,
"test_comprehensive_svd_cuda_complex128 (__main__.TestDecompCUDA)": 63.92883427937826,
"test_comprehensive_svd_cuda_complex64 (__main__.TestDecompCUDA)": 65.45333417256673,
"test_comprehensive_svd_lowrank_cuda_complex128 (__main__.TestDecompCUDA)": 63.04145466197621,
"test_cond_autograd_nested (__main__.TestControlFlow)": 84.39266798231337,
"test_constructor_autograd_SparseBSC_cuda (__main__.TestSparseAnyCUDA)": 99.29249954223633,
"test_constructor_autograd_SparseBSR_cuda (__main__.TestSparseAnyCUDA)": 92.76100031534831,
"test_constructor_autograd_SparseCSC_cuda (__main__.TestSparseAnyCUDA)": 81.06300099690755,
"test_constructor_autograd_SparseCSR_cuda (__main__.TestSparseAnyCUDA)": 66.52983283996582,
"test_conv1d_basic (__main__.TestXNNPACKConv1dTransformPass)": 292.93544430202905,
"test_conv1d_with_relu_fc (__main__.TestXNNPACKConv1dTransformPass)": 548.6971079508463,
"test_conv2d_unary_cpu_cpp_wrapper (__main__.TestCppWrapper)": 112.78833516438802,
"test_correctness_AdamW_use_closure_True_cuda_float32 (__main__.CompiledOptimizerParityTestsCUDA)": 68.85216522216797,
"test_correctness_Adam_use_closure_True_cuda_float32 (__main__.CompiledOptimizerParityTestsCUDA)": 69.27016703287761,
"test_count_nonzero_all (__main__.TestBool)": 635.0664469401041,
"test_cpu_gpu_parity_nn_LSTM_train_mode_cuda_float32 (__main__.TestModuleCUDA)": 84.12447796821594,
"test_cpu_gpu_parity_nn_TransformerDecoderLayer_cuda_float64 (__main__.TestModuleCUDA)": 80.2692408466339,
"test_custom_module_lstm (__main__.TestQuantizedOps)": 715.1571180555555,
"test_dispatch_symbolic_meta_outplace_all_strides_nn_functional_gaussian_nll_loss_cuda_float32 (__main__.TestMetaCUDA)": 84.22466659545898,
"test_dtensor_op_db_nn_functional_gaussian_nll_loss_cpu_float32 (__main__.TestDTensorOpsCPU)": 88.48233286539714,
"test_eig_check_magma_cuda_float32 (__main__.TestLinalgCUDA)": 151.56516675154367,
"test_fail_creation_ops.py (__main__.TestTyping)": 63.455668131510414,
"test_fail_random.py (__main__.TestTyping)": 71.26243758201599,
"test_fd_pool (__main__.TestMultiprocessing)": 230.95768259252822,
"test_fn_fwgrad_bwgrad_cumprod_cuda_complex128 (__main__.TestFwdGradientsCUDA)": 108.64000066121419,
"test_fn_gradgrad_cumprod_cuda_complex128 (__main__.TestBwdGradientsCUDA)": 83.54533386230469,
"test_fn_gradgrad_map_nested_cpu_float64 (__main__.TestBwdGradientsCPU)": 80.67066701253255,
"test_fn_gradgrad_map_triple_nested_cpu_float64 (__main__.TestBwdGradientsCPU)": 519.6433308919271,
"test_fn_gradgrad_map_triple_nested_cuda_float64 (__main__.TestBwdGradientsCUDA)": 350.8470001220703,
"test_fs_pool (__main__.TestMultiprocessing)": 221.22149885328193,
"test_fuse_large_params_cpu (__main__.CpuTests)": 64.83366605970595,
"test_fuse_large_params_dynamic_shapes_cpu (__main__.DynamicShapesCodegenCpuTests)": 92.46333397759332,
"test_fuse_large_params_dynamic_shapes_cpu (__main__.DynamicShapesCpuTests)": 94.84700096978082,
"test_fuse_large_params_dynamic_shapes_cuda (__main__.DynamicShapesCodegenGPUTests)": 60.2641658782959,
"test_fuse_large_params_dynamic_shapes_cuda (__main__.DynamicShapesGPUTests)": 71.67599932352702,
"test_grad_nn_Transformer_cuda_float64 (__main__.TestModuleCUDA)": 83.3826675415039,
"test_gradgrad_nn_LSTM_eval_mode_cuda_float64 (__main__.TestModuleCUDA)": 103.91466522216797,
"test_gradgrad_nn_LSTM_train_mode_cuda_float64 (__main__.TestModuleCUDA)": 98.07433319091797,
"test_gradgrad_nn_TransformerDecoderLayer_cuda_float64 (__main__.TestModuleCUDA)": 201.58099873860678,
"test_gradgrad_nn_TransformerEncoder_eval_mode_cuda_float64 (__main__.TestModuleCUDA)": 117.05183410644531,
"test_gradgrad_nn_TransformerEncoder_train_mode_cuda_float64 (__main__.TestModuleCUDA)": 136.53083419799805,
"test_gradgrad_nn_Transformer_cuda_float64 (__main__.TestModuleCUDA)": 539.1756591796875,
"test_grid_sampler_2d_cpu (__main__.CpuHalideTests)": 184.60066731770834,
"test_group_norm (__main__.TestQuantizedOps)": 259.0011165406969,
"test_indirect_device_assert (__main__.TritonCodeGenTests)": 206.87767028808594,
"test_inductor_no_recursionerror_on_for_loops_dynamic_shapes (__main__.DynamicShapesReproTests)": 71.92555491129558,
"test_inplace_gradgrad_cumprod_cuda_complex128 (__main__.TestBwdGradientsCUDA)": 98.36466598510742,
"test_inputs_overlapping_with_mutation_stress_dynamic_shapes (__main__.DynamicShapesAotAutogradFallbackTests)": 140.90577697753906,
"test_jit_cuda_archflags (__main__.TestCppExtensionJIT)": 110.23900095621745,
"test_linalg_solve_triangular_large_cuda_complex128 (__main__.TestLinalgCUDA)": 725.4639994303385,
"test_linalg_solve_triangular_large_cuda_complex64 (__main__.TestLinalgCUDA)": 86.55833307902019,
"test_linalg_solve_triangular_large_cuda_float64 (__main__.TestLinalgCUDA)": 74.77583281199138,
"test_linear (__main__.TestStaticQuantizedModule)": 207.24822658962674,
"test_linear_binary_cpp_wrapper (__main__.TestCppWrapper)": 77.41833241780598,
"test_linear_binary_dynamic_shapes_cpp_wrapper (__main__.DynamicShapesCppWrapperCpuTests)": 71.99099731445312,
"test_lobpcg_ortho_cuda_float64 (__main__.TestLinalgCUDA)": 69.14899937311809,
"test_lstm_cpu (__main__.TestMkldnnCPU)": 62.205334981282554,
"test_many_overlapping_inputs_does_not_explode_guards_dynamic_shapes (__main__.DynamicShapesReproTests)": 113.46911027696397,
"test_matmul_small_brute_force_tunableop_cuda_float32 (__main__.TestLinalgCUDA)": 151.8993352254232,
"test_matmul_small_brute_force_tunableop_cuda_float64 (__main__.TestLinalgCUDA)": 102.19766489664714,
"test_max_autotune_cutlass_backend_addmm_dynamic_False_max_autotune_gemm_backends_ATen,Triton,CUTLASS (__main__.TestCutlassBackend)": 84.22100067138672,
"test_max_pool2d_with_indices_backward4_dynamic_shapes_cpu (__main__.DynamicShapesCodegenCpuTests)": 66.08288955688477,
"test_max_pool2d_with_indices_backward4_dynamic_shapes_cpu (__main__.DynamicShapesCpuTests)": 62.84855482313368,
"test_memory_format_operators_cpu (__main__.TestTorchDeviceTypeCPU)": 72.30622436437342,
"test_memory_format_operators_cuda (__main__.TestTorchDeviceTypeCUDA)": 62.60639995098114,
"test_nccl_non_blocking_wait_with_barrier (__main__.NcclErrorHandlingTest)": 69.72633361816406,
"test_proper_exit (__main__.TestDataLoader)": 237.19650014241537,
"test_proper_exit (__main__.TestDataLoaderPersistentWorkers)": 230.95833333333334,
"test_python_ref_executor__refs_special_zeta_executor_aten_cuda_float64 (__main__.TestCommonCUDA)": 70.70466740926106,
"test_qat_conv2d_unary (__main__.TestQuantizePT2EX86Inductor)": 138.95155673556857,
"test_qat_conv_bn_fusion_no_conv_bias (__main__.TestQuantizePT2EQAT_ConvBn1d)": 60.11243165623058,
"test_qat_conv_bn_fusion_no_conv_bias (__main__.TestQuantizePT2EQAT_ConvBn2d)": 61.581181569532916,
"test_qat_mobilenet_v2 (__main__.TestQuantizePT2EQATModels)": 127.35777876112196,
"test_qlinear_add_int8_mixed_bf16_use_relu_False_is_qat_False_is_dynamic_False (__main__.TestPatternMatcher)": 70.5979995727539,
"test_qlinear_add_int8_mixed_bf16_use_relu_False_is_qat_False_is_dynamic_True (__main__.TestPatternMatcher)": 69.97799936930339,
"test_qlinear_add_int8_mixed_bf16_use_relu_False_is_qat_True_is_dynamic_False (__main__.TestPatternMatcher)": 66.7726656595866,
"test_qlinear_add_int8_mixed_bf16_use_relu_False_is_qat_True_is_dynamic_True (__main__.TestPatternMatcher)": 68.88433074951172,
"test_qlinear_add_int8_mixed_bf16_use_relu_True_is_qat_False_is_dynamic_False (__main__.TestPatternMatcher)": 67.21099853515625,
"test_qlinear_add_int8_mixed_bf16_use_relu_True_is_qat_False_is_dynamic_True (__main__.TestPatternMatcher)": 69.03100077311198,
"test_qlinear_add_int8_mixed_bf16_use_relu_True_is_qat_True_is_dynamic_False (__main__.TestPatternMatcher)": 62.612998962402344,
"test_qlinear_add_int8_mixed_bf16_use_relu_True_is_qat_True_is_dynamic_True (__main__.TestPatternMatcher)": 63.65299987792969,
"test_quick_core_backward__unsafe_masked_index_cpu_float64 (__main__.TestDecompCPU)": 335.8753255208333,
"test_quick_core_backward__unsafe_masked_index_cuda_float64 (__main__.TestDecompCUDA)": 834.5986633300781,
"test_quick_core_backward__unsafe_masked_index_put_accumulate_cpu_float64 (__main__.TestDecompCPU)": 602.1336669921875,
"test_quick_core_backward__unsafe_masked_index_put_accumulate_cuda_float64 (__main__.TestDecompCUDA)": 1085.4853210449219,
"test_quick_core_backward_expand_copy_cuda_float64 (__main__.TestDecompCUDA)": 65.60950088500977,
"test_quick_core_backward_nn_functional_max_unpool3d_grad_cpu_float64 (__main__.TestDecompCPU)": 62.46066665649414,
"test_quick_core_backward_nn_functional_max_unpool3d_grad_cuda_float64 (__main__.TestDecompCUDA)": 239.0338363647461,
"test_quick_core_backward_roll_cpu_float64 (__main__.TestDecompCPU)": 81.54566701253255,
"test_quick_core_backward_roll_cuda_float64 (__main__.TestDecompCUDA)": 166.99566396077475,
"test_quick_core_backward_select_scatter_cpu_float64 (__main__.TestDecompCPU)": 61.585000864664714,
"test_quick_core_backward_select_scatter_cuda_float64 (__main__.TestDecompCUDA)": 117.33700180053711,
"test_quick_core_backward_split_with_sizes_copy_cpu_float64 (__main__.TestDecompCPU)": 66.107666015625,
"test_quick_core_backward_split_with_sizes_copy_cuda_float64 (__main__.TestDecompCUDA)": 143.55617014567056,
"test_quick_core_backward_std_cuda_float64 (__main__.TestDecompCUDA)": 91.47516632080078,
"test_register_spills_cuda (__main__.BenchmarkFusionCudaTest)": 143.4055004119873,
"test_replicatepad_64bit_indexing_cuda_float16 (__main__.TestNNDeviceTypeCUDA)": 67.73799896240234,
"test_rosenbrock_sparse_with_lrsched_False_SGD_cuda_float64 (__main__.TestOptimRenewedCUDA)": 70.45216703414917,
"test_rosenbrock_sparse_with_lrsched_True_SGD_cuda_float64 (__main__.TestOptimRenewedCUDA)": 65.28933238983154,
"test_save_load_large_string_attribute (__main__.TestSaveLoad)": 120.74533589680989,
"test_shuffler_iterdatapipe (__main__.IntegrationTestDataLoaderDataPipe)": 155.53277503119574,
"test_slow_tasks (__main__.TestFunctionalAutogradBenchmark)": 129.1546664767795,
"test_sort_stable_cpu (__main__.CpuTritonTests)": 75.61966451009114,
"test_split_cumsum_cpu (__main__.CpuTritonTests)": 89.57633209228516,
"test_svd_lowrank_cuda_complex128 (__main__.TestLinalgCUDA)": 284.7176678975423,
"test_terminate_handler_on_crash (__main__.TestTorch)": 99.32500106758542,
"test_terminate_signal (__main__.ForkTest)": 135.51877644244166,
"test_terminate_signal (__main__.ParallelForkServerShouldWorkTest)": 135.61988737020226,
"test_terminate_signal (__main__.SpawnTest)": 139.34744204415216,
"test_torchvision_smoke (__main__.TestTensorBoardPytorchGraph)": 68.02822134229872,
"test_transformer_backend_inductor_fullgraph_True (__main__.TestFullyShardCompile)": 94.83091672261556,
"test_triton_bsr_scatter_mm_blocksize_64_cuda_bfloat16 (__main__.TestSparseCompressedTritonKernelsCUDA)": 75.27783266703288,
"test_triton_bsr_scatter_mm_blocksize_64_cuda_float16 (__main__.TestSparseCompressedTritonKernelsCUDA)": 73.52566719055176,
"test_triton_bsr_scatter_mm_blocksize_64_cuda_float32 (__main__.TestSparseCompressedTritonKernelsCUDA)": 83.69283294677734,
"test_triton_bsr_softmax_cuda_bfloat16 (__main__.TestSparseCompressedTritonKernelsCUDA)": 147.2941665649414,
"test_triton_bsr_softmax_cuda_float16 (__main__.TestSparseCompressedTritonKernelsCUDA)": 142.57616678873697,
"test_triton_bsr_softmax_cuda_float32 (__main__.TestSparseCompressedTritonKernelsCUDA)": 114.45883178710938,
"test_unary_ops (__main__.TestTEFuserDynamic)": 169.01544358995227,
"test_unary_ops (__main__.TestTEFuserStatic)": 157.99788665771484,
"test_upsample_bicubic2d_cpu (__main__.CpuHalideTests)": 96.2423324584961,
"test_variant_consistency_jit_nn_functional_max_pool2d_cpu_float32 (__main__.TestJitCPU)": 106.31300099690755,
"test_variant_consistency_jit_nn_functional_max_pool2d_cuda_float32 (__main__.TestJitCUDA)": 76.04600079854329,
"test_vmapjvpvjp_diff_cuda_float32 (__main__.TestOperatorsCUDA)": 115.88433456420898,
"test_vmapjvpvjp_linalg_lu_solve_cpu_float32 (__main__.TestOperatorsCPU)": 62.22219094775972,
"test_vmapjvpvjp_linalg_lu_solve_cuda_float32 (__main__.TestOperatorsCUDA)": 125.32350031534831,
"test_vmapjvpvjp_linalg_multi_dot_cuda_float32 (__main__.TestOperatorsCUDA)": 103.6671651204427,
"test_vmapjvpvjp_linalg_pinv_singular_cuda_float32 (__main__.TestOperatorsCUDA)": 69.03966649373372,
"test_vmapjvpvjp_linalg_solve_triangular_cuda_float32 (__main__.TestOperatorsCUDA)": 91.00933456420898,
"test_vmapjvpvjp_linalg_svd_cuda_float32 (__main__.TestOperatorsCUDA)": 81.13250096638997,
"test_vmapjvpvjp_max_pool2d_with_indices_backward_cpu_float32 (__main__.TestOperatorsCPU)": 79.8989995320638,
"test_vmapjvpvjp_max_pool2d_with_indices_backward_cuda_float32 (__main__.TestOperatorsCUDA)": 108.6731669108073,
"test_vmapjvpvjp_nn_functional_conv2d_cpu_float32 (__main__.TestOperatorsCPU)": 67.12433369954427,
"test_vmapjvpvjp_nn_functional_max_pool2d_cpu_float32 (__main__.TestOperatorsCPU)": 67.46600087483723,
"test_vmapjvpvjp_nn_functional_max_pool2d_cuda_float32 (__main__.TestOperatorsCUDA)": 95.02799860636394,
"test_vmapjvpvjp_svd_cuda_float32 (__main__.TestOperatorsCUDA)": 80.12366612752278,
"test_vmapjvpvjp_unbind_cuda_float32 (__main__.TestOperatorsCUDA)": 96.86916478474934,
"test_vmapvjpvjp_meshgrid_list_of_tensors_cuda_float32 (__main__.TestOperatorsCUDA)": 89.35266621907552,
"test_vmapvjpvjp_meshgrid_variadic_tensors_cuda_float32 (__main__.TestOperatorsCUDA)": 77.13216654459636,
"test_vmapvjpvjp_nn_functional_bilinear_cuda_float32 (__main__.TestOperatorsCUDA)": 130.6520029703776
}