forked from pytorch/pytorch
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathslow_tests.json
301 lines (301 loc) · 29.8 KB
/
slow_tests.json
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
{
"EndToEndLSTM (__main__.RNNTest)": 219.46766662597656,
"MultiheadAttention (__main__.ModulesTest)": 169.47866821289062,
"test_AllenaiLongformerBase_repro_cpu (__main__.CpuHalideTests)": 216.27999877929688,
"test__adaptive_avg_pool2d (__main__.CPUReproTests)": 165.0509999593099,
"test_adaptive_max_pool2d1_cpu (__main__.CpuHalideTests)": 113.8866678873698,
"test_after_aot_cpu_runtime_error (__main__.MinifierIsolateTests)": 70.31311077541775,
"test_alexnet_prefix_cpu (__main__.CpuHalideTests)": 191.36766560872397,
"test_aot_autograd_exhaustive_nn_functional_max_pool2d_cpu_float32 (__main__.TestEagerFusionOpInfoCPU)": 89.71233622233073,
"test_aot_autograd_symbolic_exhaustive_linalg_svd_cpu_float32 (__main__.TestEagerFusionOpInfoCPU)": 61.4735240028018,
"test_aot_autograd_symbolic_exhaustive_nn_functional_max_pool1d_cpu_float32 (__main__.TestEagerFusionOpInfoCPU)": 103.21633402506511,
"test_aot_autograd_symbolic_exhaustive_nn_functional_max_pool2d_cpu_float32 (__main__.TestEagerFusionOpInfoCPU)": 146.38499450683594,
"test_aot_autograd_symbolic_exhaustive_nn_functional_max_pool3d_cpu_float32 (__main__.TestEagerFusionOpInfoCPU)": 129.224001566569,
"test_aot_autograd_symbolic_module_exhaustive_nn_TransformerDecoderLayer_cpu_float32 (__main__.TestEagerFusionModuleInfoCPU)": 108.40233103434245,
"test_avg_pool3d_backward2_cpu (__main__.CpuTests)": 498.59322781032984,
"test_avg_pool3d_backward2_cuda (__main__.GPUTests)": 92.98616536458333,
"test_avg_pool3d_backward2_dynamic_shapes_cpu (__main__.DynamicShapesCodegenCpuTests)": 520.0223253038195,
"test_avg_pool3d_backward2_dynamic_shapes_cpu (__main__.DynamicShapesCpuTests)": 490.79644775390625,
"test_avg_pool3d_backward2_dynamic_shapes_cuda (__main__.DynamicShapesGPUTests)": 127.05033493041992,
"test_avg_pool3d_backward_cpu (__main__.CpuHalideTests)": 61.50299962361654,
"test_backward_nn_functional_multi_head_attention_forward_cpu_float32 (__main__.TestCompositeComplianceCPU)": 98.69633483886719,
"test_backward_nn_functional_multi_head_attention_forward_cuda_float32 (__main__.TestCompositeComplianceCUDA)": 64.9518330891927,
"test_basic_cpu (__main__.EfficientConvBNEvalCpuTests)": 279.4083319769965,
"test_basic_cuda (__main__.EfficientConvBNEvalGpuTests)": 195.9913330078125,
"test_builtin_equivalent_funcs (__main__.TorchFunctionModeTests)": 91.77583312988281,
"test_checkpoint_cast (__main__.TestFxToOnnx)": 364.96433512369794,
"test_collect_callgrind (__main__.TestBenchmarkUtils)": 401.74522908528644,
"test_comprehensive_constant_pad_nd_cpu_float16 (__main__.TestInductorOpInfoCPU)": 67.7816670735677,
"test_comprehensive_constant_pad_nd_cpu_float32 (__main__.TestInductorOpInfoCPU)": 69.75166575113933,
"test_comprehensive_constant_pad_nd_cpu_float64 (__main__.TestInductorOpInfoCPU)": 69.05133310953777,
"test_comprehensive_constant_pad_nd_cpu_int32 (__main__.TestInductorOpInfoCPU)": 74.81366729736328,
"test_comprehensive_constant_pad_nd_cpu_int64 (__main__.TestInductorOpInfoCPU)": 68.60000101725261,
"test_comprehensive_diff_cpu_bool (__main__.TestInductorOpInfoCPU)": 99.66566721598308,
"test_comprehensive_diff_cpu_float32 (__main__.TestInductorOpInfoCPU)": 99.96100107828777,
"test_comprehensive_diff_cpu_float64 (__main__.TestInductorOpInfoCPU)": 110.81066640218098,
"test_comprehensive_diff_cpu_int32 (__main__.TestInductorOpInfoCPU)": 100.76133473714192,
"test_comprehensive_diff_cpu_int64 (__main__.TestInductorOpInfoCPU)": 100.9336675008138,
"test_comprehensive_diff_cuda_complex128 (__main__.TestDecompCUDA)": 77.31899960835774,
"test_comprehensive_diff_cuda_complex64 (__main__.TestDecompCUDA)": 72.48116683959961,
"test_comprehensive_diff_cuda_float64 (__main__.TestDecompCUDA)": 62.056999630398224,
"test_comprehensive_dist_cpu_float16 (__main__.TestInductorOpInfoCPU)": 81.28766632080078,
"test_comprehensive_dist_cpu_float32 (__main__.TestInductorOpInfoCPU)": 98.3143310546875,
"test_comprehensive_dist_cpu_float64 (__main__.TestInductorOpInfoCPU)": 81.50999959309895,
"test_comprehensive_eye_cpu_bool (__main__.TestInductorOpInfoCPU)": 122.5760014851888,
"test_comprehensive_eye_cpu_float16 (__main__.TestInductorOpInfoCPU)": 123.51399993896484,
"test_comprehensive_eye_cpu_float32 (__main__.TestInductorOpInfoCPU)": 123.28799947102864,
"test_comprehensive_eye_cpu_float64 (__main__.TestInductorOpInfoCPU)": 116.3173344930013,
"test_comprehensive_eye_cpu_int32 (__main__.TestInductorOpInfoCPU)": 127.82066853841145,
"test_comprehensive_eye_cpu_int64 (__main__.TestInductorOpInfoCPU)": 122.68233235677083,
"test_comprehensive_grid_sampler_2d_cpu_bfloat16 (__main__.TestDecompCPU)": 71.04600016276042,
"test_comprehensive_grid_sampler_2d_cpu_float16 (__main__.TestDecompCPU)": 72.89833323160808,
"test_comprehensive_grid_sampler_2d_cpu_float16 (__main__.TestInductorOpInfoCPU)": 87.18833414713542,
"test_comprehensive_grid_sampler_2d_cpu_float32 (__main__.TestDecompCPU)": 332.75,
"test_comprehensive_grid_sampler_2d_cpu_float32 (__main__.TestInductorOpInfoCPU)": 82.85866800944011,
"test_comprehensive_grid_sampler_2d_cpu_float64 (__main__.TestDecompCPU)": 324.677001953125,
"test_comprehensive_grid_sampler_2d_cpu_float64 (__main__.TestInductorOpInfoCPU)": 82.86733500162761,
"test_comprehensive_grid_sampler_2d_cuda_bfloat16 (__main__.TestDecompCUDA)": 225.34333292643228,
"test_comprehensive_grid_sampler_2d_cuda_float16 (__main__.TestDecompCUDA)": 213.00050099690756,
"test_comprehensive_grid_sampler_2d_cuda_float32 (__main__.TestDecompCUDA)": 799.3779805501302,
"test_comprehensive_grid_sampler_2d_cuda_float32 (__main__.TestInductorOpInfoCUDA)": 66.84477806091309,
"test_comprehensive_grid_sampler_2d_cuda_float64 (__main__.TestDecompCUDA)": 866.621348063151,
"test_comprehensive_grid_sampler_2d_cuda_float64 (__main__.TestInductorOpInfoCUDA)": 71.03261015150282,
"test_comprehensive_linalg_lu_solve_cuda_float32 (__main__.TestInductorOpInfoCUDA)": 81.06816736857097,
"test_comprehensive_linalg_lu_solve_cuda_float64 (__main__.TestInductorOpInfoCUDA)": 74.70916748046875,
"test_comprehensive_linalg_norm_cpu_float32 (__main__.TestInductorOpInfoCPU)": 62.993333180745445,
"test_comprehensive_linalg_solve_triangular_cuda_float32 (__main__.TestInductorOpInfoCUDA)": 70.3303337097168,
"test_comprehensive_linalg_solve_triangular_cuda_float64 (__main__.TestInductorOpInfoCUDA)": 67.46933364868164,
"test_comprehensive_linalg_svd_cuda_complex128 (__main__.TestDecompCUDA)": 61.75588862101237,
"test_comprehensive_linalg_svd_cuda_float32 (__main__.TestInductorOpInfoCUDA)": 65.74423844473702,
"test_comprehensive_linalg_vector_norm_cpu_float16 (__main__.TestInductorOpInfoCPU)": 201.85233561197916,
"test_comprehensive_linalg_vector_norm_cpu_float32 (__main__.TestInductorOpInfoCPU)": 194.9086659749349,
"test_comprehensive_linalg_vector_norm_cpu_float64 (__main__.TestInductorOpInfoCPU)": 190.51400248209634,
"test_comprehensive_linalg_vector_norm_cuda_float32 (__main__.TestInductorOpInfoCUDA)": 71.40916570027669,
"test_comprehensive_linalg_vector_norm_cuda_float64 (__main__.TestInductorOpInfoCUDA)": 72.34516588846843,
"test_comprehensive_logspace_cpu_float32 (__main__.TestInductorOpInfoCPU)": 424.54433186848956,
"test_comprehensive_logspace_cpu_float64 (__main__.TestInductorOpInfoCPU)": 418.6923319498698,
"test_comprehensive_logspace_cpu_int32 (__main__.TestInductorOpInfoCPU)": 407.38100179036456,
"test_comprehensive_logspace_cpu_int64 (__main__.TestInductorOpInfoCPU)": 414.07567342122394,
"test_comprehensive_logspace_cuda_float32 (__main__.TestInductorOpInfoCUDA)": 72.58716646830241,
"test_comprehensive_logspace_cuda_float64 (__main__.TestInductorOpInfoCUDA)": 71.60583305358887,
"test_comprehensive_masked_amax_cpu_float16 (__main__.TestInductorOpInfoCPU)": 98.01300048828125,
"test_comprehensive_masked_amax_cpu_float32 (__main__.TestInductorOpInfoCPU)": 98.23099772135417,
"test_comprehensive_masked_amax_cpu_float64 (__main__.TestInductorOpInfoCPU)": 97.51233418782552,
"test_comprehensive_masked_amax_cpu_int32 (__main__.TestInductorOpInfoCPU)": 86.70733388264973,
"test_comprehensive_masked_amax_cpu_int64 (__main__.TestInductorOpInfoCPU)": 89.51366933186848,
"test_comprehensive_masked_amin_cpu_float16 (__main__.TestInductorOpInfoCPU)": 105.18199920654297,
"test_comprehensive_masked_amin_cpu_float32 (__main__.TestInductorOpInfoCPU)": 95.83666483561198,
"test_comprehensive_masked_amin_cpu_float64 (__main__.TestInductorOpInfoCPU)": 92.2943344116211,
"test_comprehensive_masked_amin_cpu_int32 (__main__.TestInductorOpInfoCPU)": 87.82800038655598,
"test_comprehensive_masked_amin_cpu_int64 (__main__.TestInductorOpInfoCPU)": 92.68299865722656,
"test_comprehensive_masked_mean_cpu_bool (__main__.TestInductorOpInfoCPU)": 93.73733520507812,
"test_comprehensive_masked_mean_cpu_float16 (__main__.TestInductorOpInfoCPU)": 91.7943344116211,
"test_comprehensive_masked_mean_cpu_float32 (__main__.TestInductorOpInfoCPU)": 94.1106669108073,
"test_comprehensive_masked_mean_cpu_float64 (__main__.TestInductorOpInfoCPU)": 96.00266520182292,
"test_comprehensive_masked_mean_cpu_int32 (__main__.TestInductorOpInfoCPU)": 87.82233174641927,
"test_comprehensive_masked_mean_cpu_int64 (__main__.TestInductorOpInfoCPU)": 88.46933237711589,
"test_comprehensive_masked_norm_cpu_float16 (__main__.TestInductorOpInfoCPU)": 464.55799357096356,
"test_comprehensive_masked_norm_cpu_float32 (__main__.TestInductorOpInfoCPU)": 447.74900309244794,
"test_comprehensive_masked_norm_cpu_float64 (__main__.TestInductorOpInfoCPU)": 456.7113342285156,
"test_comprehensive_masked_norm_cuda_float16 (__main__.TestInductorOpInfoCUDA)": 154.5738321940104,
"test_comprehensive_masked_norm_cuda_float32 (__main__.TestInductorOpInfoCUDA)": 150.77416610717773,
"test_comprehensive_masked_norm_cuda_float64 (__main__.TestInductorOpInfoCUDA)": 154.37033081054688,
"test_comprehensive_masked_prod_cpu_bool (__main__.TestInductorOpInfoCPU)": 91.66699981689453,
"test_comprehensive_masked_prod_cpu_float16 (__main__.TestInductorOpInfoCPU)": 91.7576675415039,
"test_comprehensive_masked_prod_cpu_float32 (__main__.TestInductorOpInfoCPU)": 90.7316665649414,
"test_comprehensive_masked_prod_cpu_float64 (__main__.TestInductorOpInfoCPU)": 95.60099792480469,
"test_comprehensive_masked_prod_cpu_int32 (__main__.TestInductorOpInfoCPU)": 92.26300048828125,
"test_comprehensive_masked_prod_cpu_int64 (__main__.TestInductorOpInfoCPU)": 96.61333465576172,
"test_comprehensive_masked_sum_cpu_bool (__main__.TestInductorOpInfoCPU)": 93.01033274332683,
"test_comprehensive_masked_sum_cpu_float16 (__main__.TestInductorOpInfoCPU)": 93.30700174967448,
"test_comprehensive_masked_sum_cpu_float32 (__main__.TestInductorOpInfoCPU)": 88.70266469319661,
"test_comprehensive_masked_sum_cpu_float64 (__main__.TestInductorOpInfoCPU)": 92.54333241780598,
"test_comprehensive_masked_sum_cpu_int32 (__main__.TestInductorOpInfoCPU)": 87.5500005086263,
"test_comprehensive_masked_sum_cpu_int64 (__main__.TestInductorOpInfoCPU)": 87.24099985758464,
"test_comprehensive_nn_functional_gaussian_nll_loss_cuda_float32 (__main__.TestDecompCUDA)": 80.62266667683919,
"test_comprehensive_nn_functional_gaussian_nll_loss_cuda_float64 (__main__.TestDecompCUDA)": 76.97283172607422,
"test_comprehensive_nn_functional_glu_cpu_float16 (__main__.TestInductorOpInfoCPU)": 70.61966959635417,
"test_comprehensive_nn_functional_glu_cpu_float32 (__main__.TestInductorOpInfoCPU)": 72.37833404541016,
"test_comprehensive_nn_functional_glu_cpu_float64 (__main__.TestInductorOpInfoCPU)": 73.80133310953777,
"test_comprehensive_nn_functional_grid_sample_cpu_float32 (__main__.TestDecompCPU)": 86.89166768391927,
"test_comprehensive_nn_functional_grid_sample_cpu_float64 (__main__.TestDecompCPU)": 82.6780014038086,
"test_comprehensive_nn_functional_grid_sample_cuda_float32 (__main__.TestDecompCUDA)": 176.4113337198893,
"test_comprehensive_nn_functional_grid_sample_cuda_float64 (__main__.TestDecompCUDA)": 214.0199991861979,
"test_comprehensive_nn_functional_interpolate_bicubic_cpu_uint8 (__main__.TestInductorOpInfoCPU)": 63.2706667582194,
"test_comprehensive_nn_functional_interpolate_bicubic_cuda_float32 (__main__.TestInductorOpInfoCUDA)": 76.66699981689453,
"test_comprehensive_nn_functional_interpolate_bicubic_cuda_float64 (__main__.TestInductorOpInfoCUDA)": 78.13366572062175,
"test_comprehensive_nn_functional_interpolate_trilinear_cuda_float32 (__main__.TestDecompCUDA)": 60.39116668701172,
"test_comprehensive_nn_functional_max_pool1d_cpu_float16 (__main__.TestInductorOpInfoCPU)": 180.94299825032553,
"test_comprehensive_nn_functional_max_pool1d_cpu_float32 (__main__.TestInductorOpInfoCPU)": 175.80900065104166,
"test_comprehensive_nn_functional_max_pool1d_cpu_float64 (__main__.TestInductorOpInfoCPU)": 180.89766947428384,
"test_comprehensive_nn_functional_max_pool2d_cpu_float16 (__main__.TestInductorOpInfoCPU)": 911.5263264973959,
"test_comprehensive_nn_functional_max_pool2d_cpu_float32 (__main__.TestInductorOpInfoCPU)": 856.4086507161459,
"test_comprehensive_nn_functional_max_pool2d_cpu_float64 (__main__.TestInductorOpInfoCPU)": 861.1319986979166,
"test_comprehensive_nn_functional_max_pool2d_cpu_int32 (__main__.TestInductorOpInfoCPU)": 811.5753377278646,
"test_comprehensive_nn_functional_max_pool2d_cpu_int64 (__main__.TestInductorOpInfoCPU)": 812.4466756184896,
"test_comprehensive_nn_functional_max_pool2d_cuda_float16 (__main__.TestInductorOpInfoCUDA)": 900.7944946289062,
"test_comprehensive_nn_functional_max_pool2d_cuda_float32 (__main__.TestInductorOpInfoCUDA)": 891.2928365071615,
"test_comprehensive_nn_functional_max_pool2d_cuda_float64 (__main__.TestInductorOpInfoCUDA)": 881.6221618652344,
"test_comprehensive_nn_functional_max_pool3d_cuda_float32 (__main__.TestInductorOpInfoCUDA)": 61.039167404174805,
"test_comprehensive_nn_functional_max_unpool2d_cpu_float16 (__main__.TestInductorOpInfoCPU)": 196.0623321533203,
"test_comprehensive_nn_functional_max_unpool2d_cpu_float32 (__main__.TestInductorOpInfoCPU)": 199.98533630371094,
"test_comprehensive_nn_functional_max_unpool2d_cpu_float64 (__main__.TestInductorOpInfoCPU)": 198.8000030517578,
"test_comprehensive_nn_functional_max_unpool2d_cuda_float16 (__main__.TestInductorOpInfoCUDA)": 64.23733266194661,
"test_comprehensive_nn_functional_max_unpool2d_cuda_float32 (__main__.TestInductorOpInfoCUDA)": 108.72433535257976,
"test_comprehensive_nn_functional_max_unpool2d_cuda_float64 (__main__.TestInductorOpInfoCUDA)": 111.18783378601074,
"test_comprehensive_nn_functional_max_unpool3d_cpu_float16 (__main__.TestInductorOpInfoCPU)": 124.12099965413411,
"test_comprehensive_nn_functional_max_unpool3d_cpu_float32 (__main__.TestInductorOpInfoCPU)": 126.78400166829427,
"test_comprehensive_nn_functional_max_unpool3d_cpu_float64 (__main__.TestInductorOpInfoCPU)": 120.3459981282552,
"test_comprehensive_nn_functional_pad_constant_cpu_float16 (__main__.TestInductorOpInfoCPU)": 67.20533498128255,
"test_comprehensive_nn_functional_pad_constant_cpu_float32 (__main__.TestInductorOpInfoCPU)": 66.45566813151042,
"test_comprehensive_nn_functional_pad_constant_cpu_float64 (__main__.TestInductorOpInfoCPU)": 68.84399922688802,
"test_comprehensive_nn_functional_pad_constant_cpu_int32 (__main__.TestInductorOpInfoCPU)": 69.10233306884766,
"test_comprehensive_nn_functional_pad_constant_cpu_int64 (__main__.TestInductorOpInfoCPU)": 68.74000040690105,
"test_comprehensive_nn_functional_poisson_nll_loss_cpu_float16 (__main__.TestInductorOpInfoCPU)": 111.74500020345052,
"test_comprehensive_nn_functional_poisson_nll_loss_cpu_float32 (__main__.TestInductorOpInfoCPU)": 114.41833241780598,
"test_comprehensive_nn_functional_poisson_nll_loss_cpu_float64 (__main__.TestInductorOpInfoCPU)": 115.6923319498698,
"test_comprehensive_nn_functional_poisson_nll_loss_cpu_int32 (__main__.TestInductorOpInfoCPU)": 109.80566660563152,
"test_comprehensive_nn_functional_poisson_nll_loss_cpu_int64 (__main__.TestInductorOpInfoCPU)": 111.232666015625,
"test_comprehensive_nn_functional_unfold_cpu_bool (__main__.TestInductorOpInfoCPU)": 126.32433573404948,
"test_comprehensive_nn_functional_unfold_cpu_float16 (__main__.TestInductorOpInfoCPU)": 230.50366719563803,
"test_comprehensive_nn_functional_unfold_cpu_float32 (__main__.TestInductorOpInfoCPU)": 225.89800008138022,
"test_comprehensive_nn_functional_unfold_cpu_float64 (__main__.TestInductorOpInfoCPU)": 234.7806650797526,
"test_comprehensive_nn_functional_unfold_cuda_float16 (__main__.TestInductorOpInfoCUDA)": 88.63733291625977,
"test_comprehensive_nn_functional_unfold_cuda_float32 (__main__.TestInductorOpInfoCUDA)": 79.86999893188477,
"test_comprehensive_nn_functional_unfold_cuda_float64 (__main__.TestInductorOpInfoCUDA)": 79.93016560872395,
"test_comprehensive_ormqr_cuda_complex128 (__main__.TestDecompCUDA)": 95.21299997965495,
"test_comprehensive_ormqr_cuda_complex64 (__main__.TestDecompCUDA)": 95.24533462524414,
"test_comprehensive_ormqr_cuda_float32 (__main__.TestDecompCUDA)": 64.44333351982965,
"test_comprehensive_ormqr_cuda_float32 (__main__.TestInductorOpInfoCUDA)": 125.76116689046223,
"test_comprehensive_ormqr_cuda_float64 (__main__.TestInductorOpInfoCUDA)": 94.32383346557617,
"test_comprehensive_pca_lowrank_cuda_float32 (__main__.TestInductorOpInfoCUDA)": 61.655999501546226,
"test_comprehensive_svd_cuda_complex128 (__main__.TestDecompCUDA)": 70.27366595798068,
"test_cond_autograd_nested (__main__.TestControlFlow)": 81.88900078667535,
"test_constructor_autograd_SparseBSC_cuda (__main__.TestSparseAnyCUDA)": 96.96666463216145,
"test_constructor_autograd_SparseBSR_cuda (__main__.TestSparseAnyCUDA)": 88.90266672770183,
"test_constructor_autograd_SparseCSC_cuda (__main__.TestSparseAnyCUDA)": 79.97699864705403,
"test_constructor_autograd_SparseCSR_cuda (__main__.TestSparseAnyCUDA)": 68.06366644965277,
"test_conv1d_basic (__main__.TestXNNPACKConv1dTransformPass)": 254.99877505832248,
"test_conv1d_with_relu_fc (__main__.TestXNNPACKConv1dTransformPass)": 507.52999708387586,
"test_conv2d_unary_cpu_cpp_wrapper (__main__.TestCppWrapper)": 107.21133168538411,
"test_conv3d_cuda (__main__.AOTInductorTestABICompatibleGpu)": 136.8423309326172,
"test_conv_transpose_with_output_size_and_no_batch_dim_ConvTranspose3d_cuda (__main__.TestConvolutionNNDeviceTypeCUDA)": 113.85933323142429,
"test_correctness_AdamW_use_closure_False_cuda_float32 (__main__.CompiledOptimizerParityTestsCUDA)": 71.10966618855794,
"test_correctness_AdamW_use_closure_True_cuda_float32 (__main__.CompiledOptimizerParityTestsCUDA)": 125.75316747029622,
"test_correctness_Adam_use_closure_False_cuda_float32 (__main__.CompiledOptimizerParityTestsCUDA)": 66.65999984741211,
"test_correctness_Adam_use_closure_True_cuda_float32 (__main__.CompiledOptimizerParityTestsCUDA)": 124.35716883341472,
"test_correctness_NAdam_use_closure_True_cuda_float32 (__main__.CompiledOptimizerParityTestsCUDA)": 73.58849906921387,
"test_correctness_RAdam_use_closure_True_cuda_float32 (__main__.CompiledOptimizerParityTestsCUDA)": 66.45283317565918,
"test_count_nonzero_all (__main__.TestBool)": 617.1689995659722,
"test_custom_module_lstm (__main__.TestQuantizedOps)": 664.0513475206163,
"test_ddp_uneven_inputs (__main__.TestDistBackendWithSpawn)": 187.03833151112,
"test_dispatch_symbolic_meta_outplace_all_strides_nn_functional_gaussian_nll_loss_cuda_float32 (__main__.TestMetaCUDA)": 78.59683481852214,
"test_eig_check_magma_cuda_float32 (__main__.TestLinalgCUDA)": 107.13233160972595,
"test_fail_creation_ops.py (__main__.TestTyping)": 70.02577718098958,
"test_fn_fwgrad_bwgrad_cumprod_cuda_complex128 (__main__.TestFwdGradientsCUDA)": 73.22516695658366,
"test_fn_gradgrad_cumprod_cuda_complex128 (__main__.TestBwdGradientsCUDA)": 79.56483395894368,
"test_fn_gradgrad_map_nested_cpu_float64 (__main__.TestBwdGradientsCPU)": 79.16999816894531,
"test_fn_gradgrad_map_nested_cuda_float64 (__main__.TestBwdGradientsCUDA)": 60.46457127162388,
"test_fn_gradgrad_map_triple_nested_cpu_float64 (__main__.TestBwdGradientsCPU)": 479.10866292317706,
"test_fn_gradgrad_map_triple_nested_cuda_float64 (__main__.TestBwdGradientsCUDA)": 328.49000040690106,
"test_fuse_large_params_cpu (__main__.CpuTests)": 62.572333017985024,
"test_fuse_large_params_dynamic_shapes_cpu (__main__.DynamicShapesCodegenCpuTests)": 95.0957785712348,
"test_fuse_large_params_dynamic_shapes_cpu (__main__.DynamicShapesCpuTests)": 92.28288947211371,
"test_fuse_large_params_dynamic_shapes_cuda (__main__.DynamicShapesCodegenGPUTests)": 62.00849978129069,
"test_fuse_large_params_dynamic_shapes_cuda (__main__.DynamicShapesGPUTests)": 70.89133262634277,
"test_grad_nn_Transformer_cuda_float64 (__main__.TestModuleCUDA)": 100.23983383178711,
"test_gradgrad_nn_LSTM_eval_mode_cuda_float64 (__main__.TestModuleCUDA)": 89.625,
"test_gradgrad_nn_LSTM_train_mode_cuda_float64 (__main__.TestModuleCUDA)": 98.70733133951823,
"test_gradgrad_nn_TransformerDecoderLayer_cuda_float64 (__main__.TestModuleCUDA)": 201.46100107828775,
"test_gradgrad_nn_TransformerEncoder_eval_mode_cuda_float64 (__main__.TestModuleCUDA)": 106.39683278401692,
"test_gradgrad_nn_TransformerEncoder_train_mode_cuda_float64 (__main__.TestModuleCUDA)": 119.79433186848958,
"test_grid_sampler_2d_cpu (__main__.CpuHalideTests)": 184.58466593424478,
"test_group_norm (__main__.TestQuantizedOps)": 154.95144324832492,
"test_indexing (__main__.TestAutogradWithCompiledAutograd)": 63.33833312988281,
"test_indirect_device_assert (__main__.TritonCodeGenTests)": 205.21300252278647,
"test_inductor_no_recursionerror_on_for_loops_dynamic_shapes (__main__.DynamicShapesReproTests)": 72.85577816433377,
"test_inplace_gradgrad_cumprod_cuda_complex128 (__main__.TestBwdGradientsCUDA)": 76.04250017801921,
"test_inputs_overlapping_with_mutation_stress_dynamic_shapes (__main__.DynamicShapesAotAutogradFallbackTests)": 132.01866658528647,
"test_jit_cuda_archflags (__main__.TestCppExtensionJIT)": 110.27666727701823,
"test_linalg_solve_triangular_large_cuda_complex128 (__main__.TestLinalgCUDA)": 751.6446736653646,
"test_linalg_solve_triangular_large_cuda_complex64 (__main__.TestLinalgCUDA)": 81.81849988301595,
"test_linalg_solve_triangular_large_cuda_float64 (__main__.TestLinalgCUDA)": 105.56516583760579,
"test_linear (__main__.TestStaticQuantizedModule)": 149.91877788967557,
"test_linear_binary_cpp_wrapper (__main__.TestCppWrapper)": 63.99366887410482,
"test_linear_binary_dynamic_shapes_cpp_wrapper (__main__.DynamicShapesCppWrapperCpuTests)": 70.03766632080078,
"test_lobpcg_ortho_cuda_float64 (__main__.TestLinalgCUDA)": 63.89849980672201,
"test_lstm_cpu (__main__.TestMkldnnCPU)": 85.00599924723308,
"test_many_overlapping_inputs_does_not_explode_guards_dynamic_shapes (__main__.DynamicShapesReproTests)": 110.84377882215712,
"test_max_autotune_cutlass_backend_addmm_dynamic_False_max_autotune_gemm_backends_ATen,Triton,CUTLASS (__main__.TestCutlassBackend)": 85.677001953125,
"test_max_pool2d_with_indices_backward4_dynamic_shapes_cpu (__main__.DynamicShapesCodegenCpuTests)": 65.46966637505426,
"test_max_pool2d_with_indices_backward4_dynamic_shapes_cpu (__main__.DynamicShapesCpuTests)": 70.02422290378146,
"test_proper_exit (__main__.TestDataLoader)": 224.50216929117838,
"test_proper_exit (__main__.TestDataLoaderPersistentWorkers)": 222.4308344523112,
"test_put_cuda_uint8 (__main__.TestTorchDeviceTypeCUDA)": 106.03500138300781,
"test_qat_conv2d_unary (__main__.TestQuantizePT2EX86Inductor)": 147.721556769477,
"test_qat_conv_bn_fusion_no_conv_bias (__main__.TestQuantizePT2EQAT_ConvBn1d)": 61.008500235421316,
"test_qat_mobilenet_v2 (__main__.TestQuantizePT2EQATModels)": 115.49899927775066,
"test_qlinear_add_int8_mixed_bf16_use_relu_False_is_qat_False_is_dynamic_False (__main__.TestPatternMatcher)": 66.43100229899089,
"test_qlinear_add_int8_mixed_bf16_use_relu_False_is_qat_False_is_dynamic_True (__main__.TestPatternMatcher)": 63.0869992574056,
"test_qlinear_add_int8_mixed_bf16_use_relu_False_is_qat_True_is_dynamic_False (__main__.TestPatternMatcher)": 61.70333353678385,
"test_qlinear_add_int8_mixed_bf16_use_relu_False_is_qat_True_is_dynamic_True (__main__.TestPatternMatcher)": 63.64599863688151,
"test_qlinear_add_int8_mixed_bf16_use_relu_False_is_qat_True_is_dynamic_True_cpp_wrapper (__main__.TestCppWrapper)": 61.72699991861979,
"test_qlinear_add_int8_mixed_bf16_use_relu_True_is_qat_False_is_dynamic_False (__main__.TestPatternMatcher)": 65.73533376057942,
"test_qlinear_add_int8_mixed_bf16_use_relu_True_is_qat_False_is_dynamic_True (__main__.TestPatternMatcher)": 65.25733184814453,
"test_qlinear_add_int8_mixed_bf16_use_relu_True_is_qat_False_is_dynamic_True_cpp_wrapper (__main__.TestCppWrapper)": 65.21399943033855,
"test_qlinear_add_int8_mixed_bf16_use_relu_True_is_qat_True_is_dynamic_False (__main__.TestPatternMatcher)": 62.35166676839193,
"test_qlinear_add_int8_mixed_bf16_use_relu_True_is_qat_True_is_dynamic_True (__main__.TestPatternMatcher)": 64.92533365885417,
"test_quick_core_backward__unsafe_masked_index_cpu_float64 (__main__.TestDecompCPU)": 323.0256652832031,
"test_quick_core_backward__unsafe_masked_index_cuda_float64 (__main__.TestDecompCUDA)": 610.8551737467448,
"test_quick_core_backward__unsafe_masked_index_put_accumulate_cpu_float64 (__main__.TestDecompCPU)": 578.0780029296875,
"test_quick_core_backward__unsafe_masked_index_put_accumulate_cuda_float64 (__main__.TestDecompCUDA)": 908.8040059407552,
"test_quick_core_backward_expand_copy_cuda_float64 (__main__.TestDecompCUDA)": 63.164167404174805,
"test_quick_core_backward_nn_functional_max_unpool3d_grad_cpu_float64 (__main__.TestDecompCPU)": 71.40266672770183,
"test_quick_core_backward_nn_functional_max_unpool3d_grad_cuda_float64 (__main__.TestDecompCUDA)": 190.56116739908853,
"test_quick_core_backward_roll_cpu_float64 (__main__.TestDecompCPU)": 99.84366607666016,
"test_quick_core_backward_roll_cuda_float64 (__main__.TestDecompCUDA)": 146.57849884033203,
"test_quick_core_backward_select_scatter_cuda_float64 (__main__.TestDecompCUDA)": 106.22333272298177,
"test_quick_core_backward_split_with_sizes_copy_cpu_float64 (__main__.TestDecompCPU)": 78.19633483886719,
"test_quick_core_backward_split_with_sizes_copy_cuda_float64 (__main__.TestDecompCUDA)": 120.21533584594727,
"test_quick_core_backward_std_cuda_float64 (__main__.TestDecompCUDA)": 79.77816708882649,
"test_replicatepad_64bit_indexing_cuda_float16 (__main__.TestNNDeviceTypeCUDA)": 321.36501057942706,
"test_reveal_module_list.py (__main__.TestTyping)": 72.51449979146322,
"test_rosenbrock_sparse_with_lrsched_False_SGD_cuda_float64 (__main__.TestOptimRenewedCUDA)": 91.87500222524007,
"test_rosenbrock_sparse_with_lrsched_True_SGD_cuda_float64 (__main__.TestOptimRenewedCUDA)": 77.79533227284749,
"test_save_load_large_string_attribute (__main__.TestSaveLoad)": 100.04700215657552,
"test_shuffler_iterdatapipe (__main__.IntegrationTestDataLoaderDataPipe)": 156.44644504123264,
"test_slow_tasks (__main__.TestFunctionalAutogradBenchmark)": 134.18555365668402,
"test_sum_all_cpu_float64 (__main__.TestReductionsCPU)": 250.51736919509455,
"test_svd_lowrank_cuda_complex128 (__main__.TestLinalgCUDA)": 312.72400482495624,
"test_terminate_handler_on_crash (__main__.TestTorch)": 97.63710957103305,
"test_terminate_signal (__main__.ForkTest)": 131.67122051285372,
"test_terminate_signal (__main__.ParallelForkServerShouldWorkTest)": 131.79988540377883,
"test_terminate_signal (__main__.SpawnTest)": 136.1091101964315,
"test_torchvision_smoke (__main__.TestTensorBoardPytorchGraph)": 118.95789125230577,
"test_train_parity_multi_group (__main__.TestFullyShard1DTrainingCore)": 120.38550086468847,
"test_transpose_copy (__main__.CPUReproTests)": 65.14377784729004,
"test_triton_bsr_scatter_mm_blocksize_64_cuda_bfloat16 (__main__.TestSparseCompressedTritonKernelsCUDA)": 63.66099993387858,
"test_triton_bsr_scatter_mm_blocksize_64_cuda_float32 (__main__.TestSparseCompressedTritonKernelsCUDA)": 67.12950007120769,
"test_triton_bsr_softmax_cuda_bfloat16 (__main__.TestSparseCompressedTritonKernelsCUDA)": 150.93133417765299,
"test_triton_bsr_softmax_cuda_float16 (__main__.TestSparseCompressedTritonKernelsCUDA)": 143.80083465576172,
"test_triton_bsr_softmax_cuda_float32 (__main__.TestSparseCompressedTritonKernelsCUDA)": 117.82416661580403,
"test_unary_ops (__main__.TestTEFuserDynamic)": 173.55711110432944,
"test_unary_ops (__main__.TestTEFuserStatic)": 157.19500075446234,
"test_upsample_bicubic2d_cpu (__main__.CpuHalideTests)": 95.58333333333333,
"test_variant_consistency_jit_nn_functional_max_pool2d_cpu_float32 (__main__.TestJitCPU)": 88.76866658528645,
"test_variant_consistency_jit_nn_functional_max_pool2d_cuda_float32 (__main__.TestJitCUDA)": 71.89466667175293,
"test_vec_compare_op_cpu_only (__main__.CPUReproTests)": 63.601333406236435,
"test_vmapjvpvjp_linalg_lu_solve_cpu_float32 (__main__.TestOperatorsCPU)": 61.569332122802734,
"test_vmapjvpvjp_linalg_lu_solve_cuda_float32 (__main__.TestOperatorsCUDA)": 74.65683237711589,
"test_vmapjvpvjp_linalg_multi_dot_cuda_float32 (__main__.TestOperatorsCUDA)": 60.34216562906901,
"test_vmapjvpvjp_linalg_solve_triangular_cuda_float32 (__main__.TestOperatorsCUDA)": 67.27466668023004,
"test_vmapjvpvjp_linalg_svd_cuda_float32 (__main__.TestOperatorsCUDA)": 63.331000010172524,
"test_vmapjvpvjp_max_pool2d_with_indices_backward_cpu_float32 (__main__.TestOperatorsCPU)": 87.71066538492839,
"test_vmapjvpvjp_max_pool2d_with_indices_backward_cuda_float32 (__main__.TestOperatorsCUDA)": 66.45183372497559,
"test_vmapjvpvjp_nn_functional_max_pool2d_cuda_float32 (__main__.TestOperatorsCUDA)": 68.36833190917969,
"test_vmapjvpvjp_svd_cuda_float32 (__main__.TestOperatorsCUDA)": 62.6788330078125,
"test_vmapjvpvjp_unbind_cuda_float32 (__main__.TestOperatorsCUDA)": 70.41216532389323,
"test_vmapvjpvjp_meshgrid_list_of_tensors_cuda_float32 (__main__.TestOperatorsCUDA)": 72.4555009206136,
"test_vmapvjpvjp_meshgrid_variadic_tensors_cuda_float32 (__main__.TestOperatorsCUDA)": 72.33916727701823,
"test_vmapvjpvjp_nn_functional_bilinear_cuda_float32 (__main__.TestOperatorsCUDA)": 129.25900014241537
}