|
SingleSource/Benchmarks/Misc/flops-6
|
9801.26% |
1.288 |
127.556 |
0.177 |
521.77% |
0.177 |
|
SingleSource/Benchmarks/Misc/flops-8
|
9386.33% |
1.349 |
128.001 |
0.132 |
513.92% |
0.132 |
|
SingleSource/Benchmarks/Misc/flops-5
|
6288.81% |
1.997 |
127.591 |
0.546 |
511.11% |
0.546 |
|
MultiSource/Benchmarks/DOE-ProxyApps-C++/HACCKernels/HACCKernels
|
4970.35% |
1.810 |
91.779 |
0.223 |
290.82% |
0.223 |
|
MicroBenchmarks/LCALS/SubsetARawLoops/lcalsARaw.test:BM_VOL3D_CALC_RAW/2
|
3661.88% |
8.283 |
311.604 |
0.603 |
-0.95% |
0.603 |
|
MicroBenchmarks/LCALS/SubsetALambdaLoops/lcalsALambda.test:BM_VOL3D_CALC_LAMBDA/2
|
3624.83% |
8.283 |
308.518 |
2.978 |
-1.42% |
2.978 |
|
MicroBenchmarks/LCALS/SubsetARawLoops/lcalsARaw.test:BM_VOL3D_CALC_RAW/1
|
3315.60% |
248.795 |
8497.849 |
18.428 |
-1.59% |
18.428 |
|
MicroBenchmarks/LCALS/SubsetALambdaLoops/lcalsALambda.test:BM_VOL3D_CALC_LAMBDA/1
|
3289.61% |
248.636 |
8427.804 |
82.795 |
-1.75% |
82.795 |
|
MicroBenchmarks/LCALS/SubsetARawLoops/lcalsARaw.test:BM_VOL3D_CALC_RAW/0
|
2816.03% |
1223.650 |
35681.985 |
175.712 |
-1.85% |
175.712 |
|
MicroBenchmarks/LCALS/SubsetALambdaLoops/lcalsALambda.test:BM_VOL3D_CALC_LAMBDA/0
|
2813.97% |
1219.274 |
35529.289 |
283.687 |
-1.58% |
283.687 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecInLoopFrom_uint16_t_To_uint8_t_
|
2276.56% |
1890.490 |
44928.572 |
1890.724 |
2.27% |
1890.724 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecWithAddInLoopFrom_uint16_t_To_uint8_t_
|
2011.53% |
3000.297 |
63352.256 |
1483.487 |
19.00% |
1483.487 |
|
MicroBenchmarks/LCALS/SubsetCRawLoops/lcalsCRaw.test:BM_EOS_RAW/171
|
1746.87% |
0.880 |
16.251 |
0.717 |
-1.10% |
0.717 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecWithAddInLoopFrom_uint8_t_To_uint16_t_
|
1720.26% |
3390.155 |
61709.495 |
348.154 |
0.52% |
348.154 |
|
MicroBenchmarks/LCALS/SubsetALambdaLoops/lcalsALambda.test:BM_FIR_LAMBDA/44217
|
1694.12% |
331.118 |
5940.643 |
171.096 |
-2.90% |
171.096 |
|
MicroBenchmarks/LCALS/SubsetALambdaLoops/lcalsALambda.test:BM_FIR_LAMBDA/171
|
1689.39% |
1.168 |
20.903 |
0.591 |
-3.62% |
0.591 |
|
MicroBenchmarks/LCALS/SubsetARawLoops/lcalsARaw.test:BM_FIR_RAW/44217
|
1687.37% |
331.201 |
5919.790 |
89.926 |
-5.22% |
89.926 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchAutoVecForBigLoopTC15
|
1686.18% |
14.391 |
257.054 |
5.467 |
-1.65% |
5.467 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchAutoVecForLoopTC15
|
1685.26% |
14.391 |
256.914 |
5.600 |
-2.17% |
5.600 |
|
MicroBenchmarks/LCALS/SubsetARawLoops/lcalsARaw.test:BM_FIR_RAW/171
|
1683.30% |
1.169 |
20.850 |
0.287 |
-5.38% |
0.287 |
|
MicroBenchmarks/LCALS/SubsetALambdaLoops/lcalsALambda.test:BM_FIR_LAMBDA/5001
|
1635.63% |
38.623 |
670.354 |
18.596 |
-3.26% |
18.596 |
|
MicroBenchmarks/LCALS/SubsetARawLoops/lcalsARaw.test:BM_FIR_RAW/5001
|
1609.55% |
39.051 |
667.599 |
9.719 |
-5.42% |
9.719 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecWithAddInLoopFrom_uint64_t_To_uint8_t_
|
1517.31% |
18919.674 |
305989.861 |
4649.748 |
-2.73% |
4649.748 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchAutoVecForBigLoopTC31
|
1503.92% |
24.406 |
391.454 |
11.481 |
-2.35% |
11.481 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchAutoVecForLoopTC31
|
1501.04% |
24.405 |
390.733 |
11.839 |
-2.41% |
11.839 |
|
MicroBenchmarks/LCALS/SubsetCRawLoops/lcalsCRaw.test:BM_EOS_RAW/5001
|
1495.92% |
29.639 |
473.016 |
21.030 |
0.11% |
21.030 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecInLoopFrom_uint8_t_To_uint16_t_
|
1448.77% |
2179.732 |
33758.948 |
253.158 |
-8.55% |
253.158 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecInLoopFrom_uint8_t_To_uint32_t_
|
1414.47% |
4341.093 |
65744.358 |
2500.811 |
6.90% |
2500.811 |
|
MicroBenchmarks/LCALS/SubsetCRawLoops/lcalsCRaw.test:BM_EOS_RAW/44217
|
1404.28% |
277.610 |
4176.028 |
197.323 |
-0.02% |
197.323 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecInLoopFrom_uint64_t_To_uint8_t_
|
1364.84% |
15598.689 |
228496.136 |
15404.146 |
0.52% |
15404.146 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecInLoopFrom_uint16_t_To_uint32_t_
|
1351.81% |
4354.072 |
63212.752 |
1760.211 |
-4.46% |
1760.211 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchAutoVecForLoopTC63
|
1322.45% |
46.912 |
667.297 |
6.440 |
0.47% |
6.440 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecWithAddInLoopWithVW8From_uint8_t_To_uint16_t_
|
1322.41% |
5797.885 |
82469.425 |
990.751 |
0.26% |
990.751 |
|
SingleSource/Benchmarks/Dhrystone/fldry
|
1318.35% |
0.192 |
2.728 |
0.010 |
-0.17% |
0.010 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchAutoVecForBigLoopTC63
|
1302.96% |
45.948 |
644.634 |
15.582 |
-2.62% |
15.582 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForLoopWithReductionAutoVecTC63
|
1290.19% |
43.172 |
600.176 |
4.400 |
0.27% |
4.400 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForLoopWithReductionAutoVecTC31
|
1282.65% |
30.658 |
423.893 |
5.455 |
0.09% |
5.455 |
|
MicroBenchmarks/LCALS/SubsetCRawLoops/lcalsCRaw.test:BM_HYDRO_1D_RAW/171
|
1282.59% |
0.442 |
6.117 |
0.580 |
-2.70% |
0.580 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForLoopWithReductionAutoVecTC127
|
1282.00% |
68.205 |
942.587 |
8.601 |
0.21% |
8.601 |
|
MicroBenchmarks/LoopVectorization/LoopEpilogueVectorizationBenchmarks.test:benchReductionAutoVec<uint16_t>/127
|
1266.20% |
139.529 |
1906.241 |
75.044 |
-4.79% |
75.044 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecInLoopFrom_uint16_t_To_uint64_t_
|
1255.13% |
8707.607 |
117999.573 |
949.611 |
0.91% |
949.611 |
|
MicroBenchmarks/LCALS/SubsetBLambdaLoops/lcalsBLambda.test:BM_MULADDSUB_LAMBDA/171
|
1238.49% |
0.437 |
5.855 |
0.077 |
-2.19% |
0.077 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForBigLoopWithReductionAutoVecTC15
|
1216.27% |
49.432 |
650.656 |
11.916 |
-15.01% |
11.916 |
|
MicroBenchmarks/LCALS/SubsetBRawLoops/lcalsBRaw.test:BM_MULADDSUB_RAW/171
|
1212.89% |
0.436 |
5.729 |
0.187 |
-2.64% |
0.187 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecWithAddInLoopFrom_uint32_t_To_uint8_t_
|
1197.44% |
9428.280 |
122326.349 |
4644.392 |
-4.77% |
4644.392 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchAutoVecForLoopTC127
|
1190.89% |
88.755 |
1145.733 |
50.600 |
-3.01% |
50.600 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecInLoopFrom_uint8_t_To_uint64_t_
|
1183.88% |
8702.692 |
111732.159 |
6512.675 |
0.99% |
6512.675 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchAutoVecForBigLoopTC127
|
1177.79% |
89.544 |
1144.177 |
42.134 |
-3.11% |
42.134 |
|
MicroBenchmarks/LoopVectorization/LoopEpilogueVectorizationBenchmarks.test:benchReductionAutoVec<uint8_t>/127
|
1161.06% |
139.529 |
1759.539 |
68.036 |
-2.26% |
68.036 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecInLoopFrom_uint32_t_To_uint8_t_
|
1140.16% |
8357.009 |
103640.225 |
4198.778 |
1.61% |
4198.778 |
|
MicroBenchmarks/LoopVectorization/LoopEpilogueVectorizationBenchmarks.test:benchReductionAutoVec<uint32_t>/127
|
1133.49% |
138.284 |
1705.716 |
60.354 |
-1.90% |
60.354 |
|
MicroBenchmarks/ImageProcessing/Dilate/Dilate.test:BENCHMARK_DILATE/1024
|
1129.79% |
6758.784 |
83118.520 |
1181.392 |
0.59% |
1181.392 |
|
SingleSource/Benchmarks/Misc/flops
|
1125.25% |
13.477 |
165.122 |
0.400 |
294.75% |
0.400 |
|
SingleSource/Benchmarks/Misc/oourafft
|
1119.81% |
14.305 |
174.488 |
0.954 |
-0.90% |
0.954 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForBigLoopWithReductionAutoVecTC31
|
1117.32% |
85.103 |
1035.971 |
26.591 |
-7.43% |
26.591 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchAutoVecForLoopTC32
|
1112.80% |
24.490 |
297.010 |
7.242 |
1.43% |
7.242 |
|
MicroBenchmarks/LCALS/SubsetCRawLoops/lcalsCRaw.test:BM_FIRST_DIFF_RAW/171
|
1089.29% |
0.262 |
3.113 |
0.249 |
-3.76% |
0.249 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchAutoVecForBigLoopTC32
|
1083.77% |
24.402 |
288.867 |
10.487 |
0.64% |
10.487 |
|
SingleSource/Benchmarks/Misc/fp-convert
|
1081.75% |
3.099 |
36.624 |
0.051 |
-0.75% |
0.051 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchAutoVecForLoopTC128
|
1053.45% |
89.946 |
1037.473 |
41.211 |
-1.06% |
41.211 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchAutoVecForBigLoopTC128
|
1052.70% |
89.612 |
1032.961 |
43.606 |
-1.54% |
43.606 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecWithAddInLoopFrom_uint64_t_To_uint16_t_
|
1052.25% |
17851.278 |
205691.638 |
7715.332 |
0.99% |
7715.332 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchAutoVecForLoopTC64
|
1044.44% |
46.794 |
535.531 |
18.585 |
-0.84% |
18.585 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecWithAddInLoopWithVW16From_uint8_t_To_uint16_t_
|
1038.20% |
4621.096 |
52597.287 |
393.670 |
-0.18% |
393.670 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForLoopWithReductionAutoVecTC15
|
1033.99% |
24.402 |
276.712 |
2.428 |
0.97% |
2.428 |
|
MicroBenchmarks/LCALS/SubsetALambdaLoops/lcalsALambda.test:BM_PRESSURE_CALC_LAMBDA/171
|
1024.03% |
1.085 |
12.199 |
0.128 |
-0.76% |
0.128 |
|
MicroBenchmarks/LoopVectorization/LoopEpilogueVectorizationBenchmarks.test:benchReductionAutoVec<uint16_t>/65
|
1015.99% |
95.731 |
1068.357 |
46.230 |
-4.93% |
46.230 |
|
MicroBenchmarks/LCALS/SubsetBLambdaLoops/lcalsBLambda.test:BM_INIT3_LAMBDA/171
|
1015.18% |
0.436 |
4.858 |
0.095 |
-5.41% |
0.095 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchAutoVecForBigLoopTC64
|
1003.65% |
47.954 |
529.242 |
21.161 |
-1.91% |
21.161 |
|
MicroBenchmarks/LCALS/SubsetCRawLoops/lcalsCRaw.test:BM_HYDRO_1D_RAW/5001
|
989.63% |
16.265 |
177.232 |
16.604 |
-2.45% |
16.604 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchAutoVecForLoopTC16
|
989.21% |
14.392 |
156.756 |
2.492 |
0.18% |
2.492 |
|
MicroBenchmarks/LCALS/SubsetARawLoops/lcalsARaw.test:BM_PRESSURE_CALC_RAW/171
|
981.33% |
1.085 |
11.737 |
0.263 |
-5.93% |
0.263 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForLoopWithReductionAutoVecTC128
|
975.82% |
68.207 |
733.781 |
5.303 |
-0.49% |
5.303 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecWithAddInLoopFrom_uint8_t_To_uint32_t_
|
974.82% |
10034.386 |
107851.111 |
3941.263 |
1.09% |
3941.263 |
|
MicroBenchmarks/LCALS/SubsetBRawLoops/lcalsBRaw.test:BM_INIT3_RAW/171
|
972.74% |
0.442 |
4.736 |
0.208 |
-0.53% |
0.208 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecInLoopFrom_uint64_t_To_uint16_t_
|
971.72% |
15521.098 |
166343.106 |
9922.150 |
2.47% |
9922.150 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForBigLoopWithReductionAutoVecTC63
|
971.44% |
156.456 |
1676.334 |
17.946 |
-7.47% |
17.946 |
|
MicroBenchmarks/LoopVectorization/LoopEpilogueVectorizationBenchmarks.test:benchReductionAutoVec<uint8_t>/65
|
942.48% |
95.737 |
998.034 |
39.521 |
-1.34% |
39.521 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecInLoopWithVW8From_uint16_t_To_uint8_t_
|
929.65% |
4742.357 |
48829.817 |
1105.744 |
-1.16% |
1105.744 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecInLoopWithVW8From_uint8_t_To_uint16_t_
|
927.82% |
4538.270 |
46645.173 |
294.568 |
0.76% |
294.568 |
|
MultiSource/Benchmarks/TSVC/GlobalDataFlow-flt/GlobalDataFlow-flt
|
917.89% |
7.050 |
71.756 |
0.155 |
0.95% |
0.155 |
|
MicroBenchmarks/LoopVectorization/LoopEpilogueVectorizationBenchmarks.test:benchReductionAutoVec<uint32_t>/65
|
908.34% |
94.487 |
952.744 |
31.962 |
-1.21% |
31.962 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchAutoVecForBigLoopTC16
|
904.42% |
15.016 |
150.827 |
4.585 |
-2.07% |
4.585 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecWithAddInLoopFrom_uint8_t_To_uint64_t_
|
901.50% |
19236.546 |
192654.753 |
14635.796 |
-3.21% |
14635.796 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecWithAddInLoopWithVW8From_uint16_t_To_uint8_t_
|
897.84% |
6772.587 |
67579.757 |
776.643 |
0.99% |
776.643 |
|
MicroBenchmarks/LoopVectorization/LoopEpilogueVectorizationBenchmarks.test:benchAutoVec<uint32_t>/127
|
893.41% |
119.502 |
1187.138 |
51.758 |
-0.25% |
51.758 |
|
SingleSource/Benchmarks/Shootout-C++/Shootout-C++-matrix
|
891.67% |
1.295 |
12.840 |
0.263 |
-4.79% |
0.263 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForBigLoopWithReductionAutoVecTC127
|
885.42% |
299.154 |
2947.924 |
28.408 |
-7.33% |
28.408 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecWithAddInLoopFrom_uint16_t_To_uint64_t_
|
867.14% |
19651.933 |
190061.316 |
7521.425 |
-4.54% |
7521.425 |
|
MicroBenchmarks/LCALS/SubsetCRawLoops/lcalsCRaw.test:BM_HYDRO_1D_RAW/44217
|
865.69% |
162.762 |
1571.778 |
147.486 |
-2.35% |
147.486 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW4LoopTC128
|
857.74% |
159.576 |
1528.319 |
32.838 |
-1.08% |
32.838 |
|
MicroBenchmarks/LoopVectorization/LoopEpilogueVectorizationBenchmarks.test:benchAutoVec<uint16_t>/127
|
839.64% |
78.824 |
740.659 |
30.917 |
-0.88% |
30.917 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForLoopWithReductionAutoVecTC64
|
815.69% |
43.171 |
395.308 |
4.983 |
-0.57% |
4.983 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecWithAddInLoopFrom_uint32_t_To_uint16_t_
|
812.11% |
9435.304 |
86060.131 |
4602.814 |
-7.50% |
4602.814 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecWithAddInLoopFrom_uint64_t_To_uint32_t_
|
809.81% |
18561.686 |
168876.556 |
2135.792 |
-0.36% |
2135.792 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW4LoopTC64
|
807.14% |
86.970 |
788.938 |
14.950 |
-0.65% |
14.950 |
|
MultiSource/Benchmarks/TSVC/Searching-flt/Searching-flt
|
806.98% |
5.262 |
47.728 |
0.969 |
-2.90% |
0.969 |
|
MicroBenchmarks/SLPVectorization/SLPVectorizationBenchmarks.test:benchmark_xor_no_runtime_checks_needed<4, int>
|
798.58% |
6.257 |
56.222 |
1.885 |
-0.67% |
1.885 |
|
SingleSource/Benchmarks/Shootout/Shootout-matrix
|
795.22% |
3.183 |
28.495 |
0.637 |
-0.54% |
0.637 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW4LoopTC128
|
792.44% |
173.323 |
1546.797 |
22.973 |
-0.04% |
22.973 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForBigLoopWithReductionAutoVecTC128
|
779.02% |
299.144 |
2629.529 |
24.022 |
-6.23% |
24.022 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecWithAddInLoopFrom_uint16_t_To_uint32_t_
|
770.36% |
11258.543 |
97989.946 |
6107.084 |
2.48% |
6107.084 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForBigLoopWithReductionAutoVecTC64
|
765.70% |
156.062 |
1351.035 |
12.373 |
-5.95% |
12.373 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW4LoopTC64
|
754.56% |
93.232 |
796.726 |
10.818 |
0.08% |
10.818 |
|
SingleSource/Benchmarks/Polybench/stencils/jacobi-1d/jacobi-1d
|
750.42% |
0.015 |
0.130 |
0.001 |
-4.71% |
0.001 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecWithAddInLoopWithVW16From_uint16_t_To_uint8_t_
|
746.50% |
4435.106 |
37542.956 |
1498.156 |
0.49% |
1498.156 |
|
MicroBenchmarks/SLPVectorization/SLPVectorizationBenchmarks.test:benchmark_multiply_accumulate_no_runtime_checks_needed<2, double>
|
744.47% |
8.759 |
73.971 |
0.919 |
2.25% |
0.919 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW4LoopTC32
|
744.16% |
50.684 |
427.852 |
10.021 |
-0.40% |
10.021 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForBigLoopWithReductionAutoVecTC32
|
736.21% |
85.105 |
711.656 |
11.259 |
-5.02% |
11.259 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecWithAddInLoopFrom_uint32_t_To_uint64_t_
|
730.19% |
21723.998 |
180349.954 |
3230.656 |
0.00% |
3230.656 |
|
MultiSource/Benchmarks/TSVC/Symbolics-flt/Symbolics-flt
|
725.96% |
4.862 |
40.156 |
0.010 |
2.57% |
0.010 |
|
MicroBenchmarks/LoopVectorization/LoopEpilogueVectorizationBenchmarks.test:benchAutoVec<uint32_t>/65
|
721.47% |
88.074 |
723.498 |
28.856 |
0.14% |
28.856 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW4LoopTC32
|
709.81% |
53.191 |
430.743 |
7.291 |
1.27% |
7.291 |
|
SingleSource/Benchmarks/Adobe-C++/simple_types_constant_folding
|
704.03% |
1.326 |
10.665 |
0.152 |
-3.28% |
0.152 |
|
MicroBenchmarks/SLPVectorization/SLPVectorizationBenchmarks.test:benchmark_add_xor_no_runtime_checks_needed<4, int>
|
703.96% |
8.760 |
70.423 |
2.266 |
-1.66% |
2.266 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecInLoopFrom_uint32_t_To_uint16_t_
|
694.44% |
8258.628 |
65609.880 |
5455.568 |
-0.93% |
5455.568 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecInLoopFrom_uint32_t_To_uint64_t_
|
691.71% |
15070.480 |
119314.226 |
1743.330 |
-0.34% |
1743.330 |
|
MicroBenchmarks/LCALS/SubsetCRawLoops/lcalsCRaw.test:BM_BAND_LIN_EQ_RAW/171
|
681.09% |
0.373 |
2.913 |
0.129 |
0.34% |
0.129 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForBigLoopWithReductionAutoVecTC16
|
674.89% |
49.433 |
383.048 |
7.874 |
-4.49% |
7.874 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecInLoopFrom_uint64_t_To_uint32_t_
|
672.52% |
15753.054 |
121695.234 |
694.378 |
0.77% |
694.378 |
|
MicroBenchmarks/LCALS/SubsetARawLoops/lcalsARaw.test:BM_PRESSURE_CALC_RAW/5001
|
657.96% |
44.479 |
337.137 |
6.954 |
-5.96% |
6.954 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW4LoopTC127
|
651.70% |
194.604 |
1462.833 |
46.861 |
0.10% |
46.861 |
|
MultiSource/Benchmarks/TSVC/Symbolics-dbl/Symbolics-dbl
|
651.43% |
9.296 |
69.854 |
0.094 |
3.18% |
0.094 |
|
MultiSource/Benchmarks/TSVC/Equivalencing-flt/Equivalencing-flt
|
645.84% |
3.296 |
24.585 |
0.013 |
-0.62% |
0.013 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecInLoopWithVW16From_uint16_t_To_uint8_t_
|
643.06% |
3810.779 |
28316.422 |
363.841 |
2.33% |
363.841 |
|
SingleSource/Benchmarks/Linpack/linpack-pc
|
642.18% |
6.928 |
51.416 |
0.140 |
-6.74% |
0.140 |
|
MicroBenchmarks/LoopVectorization/LoopEpilogueVectorizationBenchmarks.test:benchAutoVec<uint16_t>/65
|
638.90% |
67.578 |
499.331 |
15.180 |
-0.31% |
15.180 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForLoopWithReductionAutoVecTC32
|
638.78% |
30.659 |
226.500 |
7.015 |
-0.77% |
7.015 |
|
MicroBenchmarks/harris/harris.test:BENCHMARK_HARRIS/2048/2048
|
633.42% |
178359.603 |
1308119.880 |
24954.905 |
-0.22% |
24954.905 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecWithAddInLoopWithVW8From_uint8_t_To_uint32_t_
|
630.24% |
12371.067 |
90339.086 |
991.032 |
0.12% |
991.032 |
|
MicroBenchmarks/LCALS/SubsetALambdaLoops/lcalsALambda.test:BM_PRESSURE_CALC_LAMBDA/5001
|
625.26% |
48.554 |
352.139 |
3.846 |
-1.24% |
3.846 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW4BigLoopWithReductionTC128
|
616.94% |
537.591 |
3854.202 |
121.859 |
-2.04% |
121.859 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW4LoopTC128
|
614.32% |
214.632 |
1533.165 |
45.787 |
-1.15% |
45.787 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW4BigLoopWithReductionTC128
|
613.91% |
548.865 |
3918.378 |
63.120 |
-0.91% |
63.120 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW4LoopWithReductionTC128
|
606.66% |
77.592 |
548.315 |
15.460 |
-4.04% |
15.460 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecInLoopWithVW16From_uint8_t_To_uint16_t_
|
601.41% |
3757.235 |
26353.644 |
352.655 |
-0.70% |
352.655 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW4LoopTC64
|
599.95% |
113.253 |
792.706 |
19.107 |
-0.36% |
19.107 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW4LoopTC16
|
599.57% |
33.161 |
231.986 |
2.679 |
-0.32% |
2.679 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW4LoopTC32
|
595.96% |
61.318 |
426.752 |
9.157 |
0.65% |
9.157 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW4BigLoopWithReductionTC64
|
595.84% |
282.252 |
1964.013 |
57.198 |
-1.70% |
57.198 |
|
MicroBenchmarks/SLPVectorization/SLPVectorizationBenchmarks.test:benchmark_multiply_accumulate_no_runtime_checks_needed<4, double>
|
595.20% |
13.139 |
91.342 |
1.447 |
-1.32% |
1.447 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchAutoVecForBigLoopTC7
|
594.96% |
14.391 |
100.010 |
4.721 |
-1.95% |
4.721 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW4BigLoopWithReductionTC64
|
594.53% |
288.351 |
2002.682 |
26.202 |
-0.14% |
26.202 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecWithAddInLoopWithVW8From_uint16_t_To_uint32_t_
|
594.36% |
12481.936 |
86669.171 |
240.393 |
0.43% |
240.393 |
|
MultiSource/Benchmarks/McCat/18-imp/imp
|
591.04% |
0.159 |
1.101 |
0.001 |
8.63% |
0.001 |
|
MicroBenchmarks/LCALS/SubsetCRawLoops/lcalsCRaw.test:BM_FIRST_DIFF_RAW/5001
|
586.84% |
13.033 |
89.513 |
7.251 |
-3.87% |
7.251 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW4LoopTC16
|
583.55% |
32.535 |
222.394 |
3.106 |
-0.55% |
3.106 |
|
MicroBenchmarks/SLPVectorization/SLPVectorizationBenchmarks.test:benchmark_multiply_accumulate_no_runtime_checks_needed<3, double>
|
581.91% |
12.514 |
85.332 |
0.445 |
-2.52% |
0.445 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchAutoVecForLoopTC7
|
581.85% |
14.391 |
98.124 |
4.160 |
-1.86% |
4.160 |
|
SingleSource/Benchmarks/Misc/perlin
|
577.91% |
6.661 |
45.157 |
0.958 |
-3.81% |
0.958 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW4LoopTC127
|
573.48% |
203.351 |
1369.526 |
48.914 |
-0.52% |
48.914 |
|
MicroBenchmarks/ImageProcessing/Dilate/Dilate.test:BENCHMARK_DILATE/128
|
570.78% |
202.298 |
1356.973 |
15.706 |
-0.31% |
15.706 |
|
MicroBenchmarks/LoopVectorization/LoopEpilogueVectorizationBenchmarks.test:benchAutoVec<uint8_t>/127
|
570.40% |
58.822 |
394.338 |
16.332 |
0.63% |
16.332 |
|
MicroBenchmarks/ImageProcessing/Dilate/Dilate.test:BENCHMARK_DILATE/512
|
567.15% |
3131.526 |
20891.861 |
265.576 |
0.29% |
265.576 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecInLoopWithVW8From_uint8_t_To_uint32_t_
|
565.22% |
7077.856 |
47083.516 |
332.477 |
0.28% |
332.477 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW4LoopTC127
|
563.96% |
225.273 |
1495.731 |
68.636 |
-0.78% |
68.636 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW4BigLoopWithReductionTC32
|
559.26% |
154.558 |
1018.940 |
21.797 |
-0.72% |
21.797 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW4BigLoopWithReductionTC32
|
551.99% |
157.992 |
1030.095 |
28.786 |
-0.11% |
28.786 |
|
MultiSource/Benchmarks/TSVC/ControlLoops-flt/ControlLoops-flt
|
549.53% |
5.526 |
35.895 |
0.073 |
-0.03% |
0.073 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecInLoopWithVW8From_uint16_t_To_uint32_t_
|
548.97% |
7455.977 |
48387.154 |
330.944 |
-1.34% |
330.944 |
|
SingleSource/Benchmarks/Polybench/stencils/heat-3d/heat-3d
|
542.94% |
25.120 |
161.505 |
1.253 |
2.19% |
1.253 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW1BigLoopWithReductionTC128
|
540.15% |
603.960 |
3866.228 |
126.132 |
-3.41% |
126.132 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchAutoVecForLoopTC4
|
539.42% |
14.391 |
92.017 |
3.237 |
-1.79% |
3.237 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW4BigLoopWithReductionTC128
|
538.51% |
603.937 |
3856.195 |
94.115 |
-1.84% |
94.115 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW4LoopWithReductionTC128
|
536.88% |
85.722 |
545.945 |
16.105 |
-1.30% |
16.105 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW4LoopTC16
|
536.37% |
36.290 |
230.939 |
3.803 |
0.12% |
3.803 |
|
MultiSource/Benchmarks/TSVC/Equivalencing-dbl/Equivalencing-dbl
|
535.39% |
7.029 |
44.663 |
0.129 |
0.10% |
0.129 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW4BigLoopWithReductionTC127
|
532.61% |
577.712 |
3654.639 |
113.488 |
-1.89% |
113.488 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW1BigLoopWithReductionTC64
|
528.24% |
313.450 |
1969.205 |
59.759 |
-2.57% |
59.759 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW4BigLoopWithReductionTC64
|
526.68% |
313.509 |
1964.687 |
43.256 |
-1.42% |
43.256 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW4LoopTC63
|
525.30% |
114.507 |
716.010 |
18.680 |
-0.38% |
18.680 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW4LoopWithReductionTC64
|
525.15% |
47.552 |
297.270 |
7.738 |
-4.36% |
7.738 |
|
SingleSource/Benchmarks/Stanford/FloatMM
|
524.92% |
0.407 |
2.545 |
0.008 |
-0.05% |
0.008 |
|
MicroBenchmarks/SLPVectorization/SLPVectorizationBenchmarks.test:benchmark_xor_no_runtime_checks_needed<16, int>
|
524.40% |
16.894 |
105.488 |
3.003 |
-0.64% |
3.003 |
|
MicroBenchmarks/LCALS/SubsetALambdaLoops/lcalsALambda.test:BM_PRESSURE_CALC_LAMBDA/44217
|
517.01% |
509.043 |
3140.858 |
26.258 |
-0.35% |
26.258 |
|
MultiSource/Benchmarks/TSVC/Searching-dbl/Searching-dbl
|
516.65% |
9.115 |
56.206 |
0.471 |
-0.31% |
0.471 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchAutoVecForLoopTC3
|
516.57% |
14.390 |
88.726 |
3.428 |
-1.14% |
3.428 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchAutoVecForBigLoopTC3
|
515.83% |
14.391 |
88.622 |
3.909 |
0.21% |
3.909 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW4BigLoopWithReductionTC32
|
514.25% |
168.328 |
1033.958 |
13.508 |
1.54% |
13.508 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW4LoopTC63
|
508.44% |
123.890 |
753.792 |
30.490 |
-0.03% |
30.490 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW4BigLoopWithReductionTC127
|
508.24% |
618.961 |
3764.790 |
83.117 |
-1.53% |
83.117 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW1BigLoopWithReductionTC127
|
508.05% |
618.411 |
3760.266 |
126.365 |
-3.32% |
126.365 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchAutoVecForBigLoopTC4
|
507.01% |
15.014 |
91.139 |
3.712 |
-0.76% |
3.712 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW4LoopWithReductionTC127
|
505.46% |
87.567 |
530.179 |
12.001 |
-1.78% |
12.001 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW1BigLoopWithReductionTC32
|
505.20% |
168.331 |
1018.736 |
34.633 |
-3.15% |
34.633 |
|
SingleSource/Benchmarks/Polybench/stencils/fdtd-2d/fdtd-2d
|
500.98% |
20.444 |
122.863 |
0.467 |
-0.19% |
0.467 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchAutoVecForLoopTC2
|
499.77% |
14.391 |
86.315 |
3.403 |
-1.38% |
3.403 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForBigLoopWithReductionAutoVecTC7
|
496.68% |
49.439 |
294.992 |
6.906 |
-3.27% |
6.906 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchAutoVecForBigLoopTC8
|
492.29% |
15.016 |
88.941 |
0.945 |
0.28% |
0.945 |
|
MultiSource/Applications/sgefa/sgefa
|
491.27% |
0.617 |
3.650 |
0.014 |
2.99% |
0.014 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchAutoVecForLoopTC8
|
488.94% |
14.392 |
84.761 |
1.641 |
1.06% |
1.641 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW4BigLoopWithReductionTC16
|
481.92% |
90.730 |
527.980 |
10.299 |
-0.57% |
10.299 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecWithAddInLoopWithVW8From_uint32_t_To_uint8_t_
|
481.17% |
14416.905 |
83787.377 |
2327.001 |
-9.88% |
2327.001 |
|
MicroBenchmarks/LCALS/SubsetARawLoops/lcalsARaw.test:BM_PRESSURE_CALC_RAW/44217
|
477.18% |
519.241 |
2996.979 |
58.419 |
-6.14% |
58.419 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecInLoopWithVW8From_uint32_t_To_uint8_t_
|
476.45% |
11255.297 |
64880.728 |
481.130 |
-9.57% |
481.130 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW4BigLoopWithReductionTC16
|
474.50% |
92.864 |
533.508 |
7.201 |
-0.50% |
7.201 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchAutoVecForBigLoopTC2
|
473.20% |
15.017 |
86.077 |
3.133 |
-1.07% |
3.133 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW4LoopTC8
|
469.34% |
23.151 |
131.806 |
0.951 |
1.66% |
0.951 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW1BigLoopWithReductionTC63
|
469.09% |
327.944 |
1866.298 |
49.132 |
-2.68% |
49.132 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW4BigLoopWithReductionTC63
|
468.50% |
328.196 |
1865.788 |
34.744 |
-1.00% |
34.744 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW4BigLoopWithReductionTC16
|
466.82% |
95.733 |
542.628 |
4.925 |
0.85% |
4.925 |
|
MultiSource/Benchmarks/MiBench/consumer-lame/consumer-lame
|
462.51% |
0.610 |
3.434 |
0.026 |
-2.49% |
0.026 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW1BigLoopWithReductionTC16
|
462.47% |
95.736 |
538.487 |
9.419 |
-0.28% |
9.419 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForLoopWithReductionAutoVecTC16
|
458.02% |
24.402 |
136.170 |
4.865 |
0.49% |
4.865 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW4BigLoopWithReductionTC127
|
451.84% |
632.552 |
3490.673 |
55.436 |
-1.22% |
55.436 |
|
MicroBenchmarks/LCALS/SubsetBLambdaLoops/lcalsBLambda.test:BM_MULADDSUB_LAMBDA/5001
|
450.58% |
30.673 |
168.878 |
2.519 |
-2.13% |
2.519 |
|
MicroBenchmarks/SLPVectorization/SLPVectorizationBenchmarks.test:benchmark_add_xor_no_runtime_checks_needed<16, int>
|
450.14% |
24.401 |
134.241 |
4.953 |
-3.35% |
4.953 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW4LoopTC8
|
444.78% |
23.776 |
129.527 |
1.797 |
0.17% |
1.797 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW4BigLoopWithReductionTC63
|
444.75% |
322.722 |
1758.023 |
48.933 |
-1.42% |
48.933 |
|
MultiSource/Benchmarks/TSVC/GlobalDataFlow-dbl/GlobalDataFlow-dbl
|
437.85% |
19.335 |
103.996 |
3.066 |
35.10% |
3.066 |
|
MultiSource/Benchmarks/DOE-ProxyApps-C/SimpleMOC/SimpleMOC
|
433.64% |
10.815 |
57.714 |
0.072 |
-0.34% |
0.072 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW4LoopWithReductionTC64
|
432.01% |
55.687 |
296.260 |
8.077 |
-1.15% |
8.077 |
|
MicroBenchmarks/ImageProcessing/Dilate/Dilate.test:BENCHMARK_DILATE/256
|
429.71% |
999.274 |
5293.279 |
66.644 |
0.37% |
66.644 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForBigLoopWithReductionAutoVecTC4
|
427.45% |
49.434 |
260.742 |
5.757 |
-2.92% |
5.757 |
|
MultiSource/Benchmarks/DOE-ProxyApps-C++/HPCCG/HPCCG
|
426.83% |
4.046 |
21.317 |
0.108 |
0.32% |
0.108 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW4LoopTC31
|
425.53% |
71.957 |
378.152 |
12.183 |
0.05% |
12.183 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecWithAddInLoopWithVW8From_uint32_t_To_uint16_t_
|
425.16% |
13475.983 |
70770.060 |
2584.736 |
-4.54% |
2584.736 |
|
SingleSource/Benchmarks/Adobe-C++/simple_types_loop_invariant
|
421.40% |
1.840 |
9.593 |
0.047 |
-1.36% |
0.047 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW4LoopWithReductionTC32
|
420.78% |
34.413 |
179.216 |
0.107 |
-1.57% |
0.107 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecInLoopWithVW8From_uint32_t_To_uint16_t_
|
418.81% |
9791.554 |
50799.700 |
89.867 |
0.51% |
89.867 |
|
MultiSource/Benchmarks/TSVC/ControlLoops-dbl/ControlLoops-dbl
|
417.12% |
11.305 |
58.458 |
0.491 |
-1.19% |
0.491 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW4BigLoopWithReductionTC31
|
409.76% |
182.844 |
932.065 |
27.296 |
-1.59% |
27.296 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW1BigLoopWithReductionTC31
|
409.35% |
182.731 |
930.731 |
21.602 |
0.07% |
21.602 |
|
MicroBenchmarks/ImageProcessing/Dither/Dither.test:BENCHMARK_ORDERED_DITHER/512/3
|
405.18% |
3207.727 |
16204.633 |
349.072 |
-2.77% |
349.072 |
|
SingleSource/Benchmarks/Polybench/linear-algebra/solvers/durbin/durbin
|
403.39% |
0.045 |
0.229 |
0.001 |
0.50% |
0.001 |
|
SingleSource/Benchmarks/BenchmarkGame/puzzle
|
402.81% |
0.919 |
4.621 |
0.013 |
18.98% |
0.013 |
|
MicroBenchmarks/LCALS/SubsetBRawLoops/lcalsBRaw.test:BM_MULADDSUB_RAW/5001
|
402.67% |
32.869 |
165.221 |
5.834 |
-2.15% |
5.834 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForBigLoopWithReductionAutoVecTC3
|
401.31% |
49.429 |
247.792 |
4.767 |
-3.78% |
4.767 |
|
External/SPEC/CINT2017rate/525.x264_r/525.x264_r
|
400.07% |
130.371 |
651.949 |
1.740 |
4.53% |
1.740 |
|
MicroBenchmarks/LCALS/SubsetCRawLoops/lcalsCRaw.test:BM_FIRST_DIFF_RAW/44217
|
390.64% |
161.562 |
792.680 |
63.552 |
-3.99% |
63.552 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW1BigLoopWithReductionTC8
|
390.22% |
59.445 |
291.409 |
1.865 |
1.25% |
1.865 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW4BigLoopWithReductionTC8
|
387.94% |
58.192 |
283.938 |
4.463 |
-0.83% |
4.463 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW4BigLoopWithReductionTC8
|
386.91% |
59.443 |
289.436 |
4.344 |
-0.41% |
4.344 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW4LoopWithReductionTC63
|
382.80% |
57.498 |
277.601 |
4.223 |
-2.38% |
4.223 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW4LoopTC63
|
380.06% |
130.710 |
627.487 |
19.101 |
0.25% |
19.101 |
|
MicroBenchmarks/LoopVectorization/LoopEpilogueVectorizationBenchmarks.test:benchAutoVec<uint8_t>/65
|
379.58% |
54.457 |
261.166 |
12.415 |
-0.28% |
12.415 |
|
MicroBenchmarks/ImageProcessing/Blur/blur.test:BENCHMARK_boxBlurKernel/1024
|
379.15% |
29556.094 |
141617.955 |
2215.568 |
0.05% |
2215.568 |
|
MicroBenchmarks/ImageProcessing/Dither/Dither.test:BENCHMARK_ORDERED_DITHER/256/3
|
378.26% |
851.722 |
4073.451 |
77.403 |
-2.24% |
77.403 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW1BigLoopWithReductionTC64
|
377.48% |
675.889 |
3227.226 |
66.760 |
-0.36% |
66.760 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW1BigLoopWithReductionTC128
|
375.81% |
1336.804 |
6360.672 |
152.783 |
-1.08% |
152.783 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchAutoVecForLoopTC1
|
375.12% |
14.395 |
68.393 |
2.757 |
0.00% |
2.757 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForBigLoopWithReductionAutoVecTC2
|
374.94% |
49.429 |
234.760 |
6.029 |
-5.38% |
6.029 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchAutoVecForBigLoopTC1
|
374.68% |
14.390 |
68.309 |
2.569 |
-0.11% |
2.569 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW1BigLoopWithReductionTC32
|
373.50% |
345.418 |
1635.563 |
57.681 |
-0.51% |
57.681 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW4LoopWithReductionTC127
|
373.27% |
106.048 |
501.891 |
12.840 |
-0.48% |
12.840 |
|
MultiSource/Benchmarks/FreeBench/pifft/pifft
|
371.64% |
0.362 |
1.709 |
0.008 |
-0.89% |
0.008 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW1BigLoopWithReductionTC16
|
371.63% |
180.209 |
849.918 |
11.654 |
0.51% |
11.654 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW1BigLoopWithReductionTC127
|
371.33% |
1329.952 |
6268.513 |
147.054 |
-1.20% |
147.054 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW4LoopTC4
|
370.97% |
17.521 |
82.519 |
1.102 |
1.34% |
1.102 |
|
SingleSource/Benchmarks/Misc-C++/stepanov_v1p2
|
368.51% |
13.509 |
63.290 |
0.385 |
-2.47% |
0.385 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW1BigLoopWithReductionTC63
|
368.03% |
668.829 |
3130.299 |
64.076 |
-0.80% |
64.076 |
|
MicroBenchmarks/ImageProcessing/Interpolation/Interpolation.test:BENCHMARK_BICUBIC_INTERPOLATION/16
|
367.15% |
283.748 |
1325.540 |
12.888 |
-2.31% |
12.888 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW1BigLoopWithReductionTC31
|
366.97% |
338.536 |
1580.853 |
39.006 |
-0.32% |
39.006 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW1LoopWithReductionTC128
|
364.78% |
119.505 |
555.435 |
17.191 |
-0.58% |
17.191 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW4LoopWithReductionTC128
|
364.54% |
119.504 |
555.147 |
16.239 |
-0.76% |
16.239 |
|
MicroBenchmarks/ImageProcessing/Interpolation/Interpolation.test:BENCHMARK_BICUBIC_INTERPOLATION/32
|
362.73% |
1416.071 |
6552.652 |
79.183 |
-2.99% |
79.183 |
|
MicroBenchmarks/ImageProcessing/Interpolation/Interpolation.test:BENCHMARK_BICUBIC_INTERPOLATION/64
|
362.61% |
6267.862 |
28995.480 |
403.701 |
-2.94% |
403.701 |
|
MicroBenchmarks/ImageProcessing/Interpolation/Interpolation.test:BENCHMARK_BICUBIC_INTERPOLATION/256
|
360.90% |
108754.750 |
501247.697 |
5344.299 |
-2.22% |
5344.299 |
|
MicroBenchmarks/ImageProcessing/Dither/Dither.test:BENCHMARK_ORDERED_DITHER/128/3
|
360.46% |
222.211 |
1023.187 |
19.352 |
-2.36% |
19.352 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW1BigLoopWithReductionTC8
|
357.02% |
97.617 |
446.129 |
4.536 |
-0.16% |
4.536 |
|
MicroBenchmarks/ImageProcessing/Interpolation/Interpolation.test:BENCHMARK_BICUBIC_INTERPOLATION/128
|
356.98% |
26612.856 |
121616.427 |
1668.028 |
-3.00% |
1668.028 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW4LoopWithReductionTC127
|
354.43% |
120.133 |
545.917 |
14.588 |
-0.23% |
14.588 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW1LoopWithReductionTC127
|
353.45% |
120.136 |
544.760 |
16.052 |
-0.53% |
16.052 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecWithAddInLoopWithVW16From_uint8_t_To_uint32_t_
|
351.69% |
12989.769 |
58672.961 |
547.303 |
0.14% |
547.303 |
|
MicroBenchmarks/ImageProcessing/Blur/blur.test:BENCHMARK_boxBlurKernel/512
|
349.85% |
7687.093 |
34580.268 |
119.025 |
-0.43% |
119.025 |
|
MultiSource/Benchmarks/FreeBench/neural/neural
|
349.52% |
0.248 |
1.116 |
0.006 |
-0.01% |
0.006 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW4LoopTC31
|
348.32% |
74.460 |
333.820 |
4.636 |
0.22% |
4.636 |
|
MicroBenchmarks/ImageProcessing/Blur/blur.test:BENCHMARK_GAUSSIAN_BLUR/128
|
347.23% |
5206.448 |
23284.756 |
366.226 |
0.54% |
366.226 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW1BigLoopWithReductionTC4
|
342.65% |
56.314 |
249.273 |
1.046 |
0.03% |
1.046 |
|
MicroBenchmarks/LoopInterchange/LoopInterchange.test:BENCHMARK_LI1
|
342.37% |
1554.411 |
6876.268 |
610.644 |
-9.80% |
610.644 |
|
SingleSource/Benchmarks/Polybench/stencils/jacobi-2d/jacobi-2d
|
339.11% |
33.524 |
147.206 |
1.818 |
-2.89% |
1.818 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForLoopWithReductionAutoVecTC7
|
337.52% |
24.402 |
106.762 |
2.680 |
-1.27% |
2.680 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW1BigLoopWithReductionTC15
|
334.63% |
173.356 |
753.453 |
10.292 |
0.29% |
10.292 |
|
MicroBenchmarks/ImageProcessing/Blur/blur.test:BENCHMARK_GAUSSIAN_BLUR/256
|
334.41% |
22898.707 |
99474.062 |
1659.063 |
0.66% |
1659.063 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW1LoopWithReductionTC64
|
333.87% |
69.450 |
301.325 |
8.829 |
-0.61% |
8.829 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW4LoopWithReductionTC64
|
333.16% |
69.458 |
300.865 |
7.686 |
-0.43% |
7.686 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForBigLoopWithReductionAutoVecTC8
|
332.86% |
49.431 |
213.968 |
4.246 |
-4.25% |
4.246 |
|
MultiSource/Benchmarks/DOE-ProxyApps-C++/miniFE/miniFE
|
332.33% |
17.064 |
73.772 |
0.781 |
-3.51% |
0.781 |
|
MultiSource/Benchmarks/TSVC/InductionVariable-flt/InductionVariable-flt
|
331.46% |
11.003 |
47.475 |
0.234 |
0.38% |
0.234 |
|
MicroBenchmarks/ImageProcessing/Blur/blur.test:BENCHMARK_GAUSSIAN_BLUR/512
|
329.75% |
95514.756 |
410477.756 |
6749.371 |
-0.60% |
6749.371 |
|
MultiSource/Benchmarks/TSVC/CrossingThresholds-flt/CrossingThresholds-flt
|
328.13% |
11.072 |
47.405 |
0.148 |
-1.46% |
0.148 |
|
MicroBenchmarks/LCALS/SubsetBLambdaLoops/lcalsBLambda.test:BM_INIT3_LAMBDA/5001
|
327.08% |
32.805 |
140.102 |
2.782 |
-5.05% |
2.782 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW4BigLoopWithReductionTC31
|
322.07% |
195.056 |
823.271 |
17.123 |
0.52% |
17.123 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW4BigLoopWithReductionTC63
|
321.66% |
372.123 |
1569.098 |
19.889 |
-0.71% |
19.889 |
|
MicroBenchmarks/LCALS/SubsetARawLoops/lcalsARaw.test:BM_DEL_DOT_VEC_2D_RAW/0
|
320.86% |
1861.021 |
7832.275 |
53.168 |
0.09% |
53.168 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW4LoopWithReductionTC32
|
319.81% |
40.673 |
170.750 |
1.109 |
1.50% |
1.109 |
|
MicroBenchmarks/LCALS/SubsetALambdaLoops/lcalsALambda.test:BM_DEL_DOT_VEC_2D_LAMBDA/0
|
319.62% |
1863.854 |
7821.104 |
12.618 |
0.02% |
12.618 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForLoopWithReductionAutoVecTC4
|
319.22% |
24.404 |
102.304 |
2.193 |
-0.71% |
2.193 |
|
MicroBenchmarks/ImageProcessing/Blur/blur.test:BENCHMARK_boxBlurKernel/256
|
319.16% |
1999.450 |
8380.934 |
60.336 |
-0.36% |
60.336 |
|
SingleSource/Benchmarks/CoyoteBench/lpbench
|
316.37% |
13.652 |
56.841 |
0.178 |
0.32% |
0.178 |
|
MicroBenchmarks/ImageProcessing/Blur/blur.test:BENCHMARK_boxBlurKernel/128
|
315.93% |
466.202 |
1939.054 |
22.665 |
-1.26% |
22.665 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW4LoopWithReductionTC63
|
315.85% |
70.077 |
291.417 |
7.631 |
0.19% |
7.631 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForLoopWithReductionAutoVecTC3
|
315.48% |
24.401 |
101.383 |
2.117 |
0.48% |
2.117 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW1LoopWithReductionTC63
|
313.55% |
70.079 |
289.813 |
7.950 |
-0.26% |
7.950 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecWithAddInLoopWithVW16From_uint16_t_To_uint32_t_
|
312.00% |
13273.054 |
54685.606 |
567.112 |
-0.45% |
567.112 |
|
MicroBenchmarks/LCALS/SubsetALambdaLoops/lcalsALambda.test:BM_DEL_DOT_VEC_2D_LAMBDA/1
|
311.00% |
297.386 |
1222.241 |
0.790 |
0.06% |
0.790 |
|
MicroBenchmarks/LCALS/SubsetARawLoops/lcalsARaw.test:BM_DEL_DOT_VEC_2D_RAW/1
|
310.80% |
297.449 |
1221.931 |
1.337 |
0.08% |
1.337 |
|
MicroBenchmarks/LCALS/SubsetARawLoops/lcalsARaw.test:BM_DEL_DOT_VEC_2D_RAW/2
|
309.43% |
3.621 |
14.826 |
0.004 |
0.04% |
0.004 |
|
MicroBenchmarks/LCALS/SubsetALambdaLoops/lcalsALambda.test:BM_DEL_DOT_VEC_2D_LAMBDA/2
|
309.35% |
3.621 |
14.823 |
0.022 |
-0.03% |
0.022 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW4LoopTC15
|
306.92% |
46.926 |
190.954 |
3.503 |
1.35% |
3.503 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForLoopWithReductionAutoVecTC2
|
305.28% |
24.402 |
98.898 |
2.180 |
-0.37% |
2.180 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW1BigLoopWithReductionTC4
|
304.17% |
41.299 |
166.915 |
1.186 |
-1.78% |
1.186 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecInLoopWithVW16From_uint8_t_To_uint32_t_
|
302.31% |
6626.974 |
26661.266 |
262.836 |
-1.06% |
262.836 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW4LoopWithReductionTC32
|
302.19% |
44.426 |
178.676 |
1.596 |
2.04% |
1.596 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW1LoopWithReductionTC32
|
298.85% |
44.423 |
177.183 |
1.975 |
1.45% |
1.975 |
|
MultiSource/Benchmarks/mediabench/mpeg2/mpeg2dec/mpeg2decode
|
298.13% |
0.030 |
0.119 |
0.000 |
4.65% |
0.000 |
|
SingleSource/Benchmarks/Misc-C++/oopack_v1p8
|
297.47% |
0.522 |
2.074 |
0.015 |
-2.05% |
0.015 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW1BigLoopWithReductionTC2
|
295.86% |
34.412 |
136.226 |
2.290 |
0.66% |
2.290 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW4BigLoopWithReductionTC4
|
295.22% |
41.299 |
163.219 |
3.434 |
0.81% |
3.434 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecInLoopWithVW16From_uint16_t_To_uint32_t_
|
295.12% |
7104.559 |
28071.817 |
519.438 |
0.98% |
519.438 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW4BigLoopWithReductionTC15
|
294.03% |
110.123 |
433.924 |
3.712 |
1.33% |
3.712 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW1BigLoopWithReductionTC15
|
292.61% |
110.128 |
432.381 |
4.922 |
0.53% |
4.922 |
|
MicroBenchmarks/LCALS/SubsetCRawLoops/lcalsCRaw.test:BM_BAND_LIN_EQ_RAW/44217
|
290.65% |
170.647 |
666.633 |
30.241 |
2.36% |
30.241 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecWithAddInLoopWithVW8From_uint8_t_To_uint64_t_
|
288.61% |
23400.669 |
90937.688 |
1522.056 |
-0.97% |
1522.056 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForLoopWithReductionAutoVecTC8
|
283.94% |
24.401 |
93.684 |
3.605 |
1.11% |
3.605 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW1BigLoopWithReductionTC7
|
283.11% |
90.720 |
347.562 |
4.465 |
0.06% |
4.465 |
|
SingleSource/Benchmarks/Adobe-C++/stepanov_abstraction
|
282.63% |
11.940 |
45.684 |
0.252 |
-1.60% |
0.252 |
|
MicroBenchmarks/LCALS/SubsetBLambdaLoops/lcalsBLambda.test:BM_MULADDSUB_LAMBDA/44217
|
280.77% |
392.899 |
1496.056 |
18.137 |
-2.27% |
18.137 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForLoopWithReductionAutoVecTC1
|
280.03% |
24.401 |
92.734 |
3.359 |
0.35% |
3.359 |
|
MultiSource/Benchmarks/Prolangs-C/bison/mybison
|
279.73% |
0.010 |
0.040 |
0.000 |
0.15% |
0.000 |
|
MicroBenchmarks/LCALS/SubsetBRawLoops/lcalsBRaw.test:BM_MULADDSUB_RAW/44217
|
278.31% |
386.252 |
1461.227 |
57.942 |
-1.05% |
57.942 |
|
MicroBenchmarks/ImageProcessing/Blur/blur.test:BENCHMARK_GAUSSIAN_BLUR/1024
|
274.87% |
444966.498 |
1668065.416 |
26783.959 |
0.62% |
26783.959 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecWithAddInLoopWithVW8From_uint64_t_To_uint8_t_
|
273.88% |
26618.536 |
99520.910 |
1552.040 |
-10.02% |
1552.040 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForBigLoopWithReductionAutoVecTC1
|
273.64% |
49.432 |
184.699 |
5.395 |
-6.12% |
5.395 |
|
MultiSource/Benchmarks/TSVC/Expansion-flt/Expansion-flt
|
269.48% |
12.959 |
47.880 |
0.185 |
-8.50% |
0.185 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW4LoopWithReductionTC31
|
265.82% |
45.049 |
164.798 |
1.294 |
1.49% |
1.294 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecWithAddInLoopWithVW8From_uint64_t_To_uint16_t_
|
263.72% |
25456.784 |
92592.031 |
1809.507 |
-1.58% |
1809.507 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW4LoopWithReductionTC16
|
262.64% |
28.162 |
102.125 |
1.782 |
-8.43% |
1.782 |
|
SingleSource/Benchmarks/Shootout/Shootout-methcall
|
260.97% |
11.059 |
39.918 |
0.023 |
-0.09% |
0.023 |
|
SingleSource/Benchmarks/Stanford/Oscar
|
260.29% |
0.010 |
0.037 |
0.000 |
-0.56% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecWithAddInLoopWithVW8From_uint16_t_To_uint64_t_
|
259.04% |
25535.265 |
91680.679 |
1120.981 |
1.02% |
1120.981 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecWithAddInLoopWithVW16From_uint32_t_To_uint8_t_
|
258.78% |
13256.415 |
47561.053 |
1218.737 |
-9.52% |
1218.737 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW1LoopWithReductionTC31
|
258.37% |
45.053 |
161.456 |
2.536 |
-0.24% |
2.536 |
|
MicroBenchmarks/LCALS/SubsetCRawLoops/lcalsCRaw.test:BM_BAND_LIN_EQ_RAW/5001
|
255.84% |
21.158 |
75.288 |
3.574 |
-0.80% |
3.574 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecInLoopWithVW8From_uint16_t_To_uint64_t_
|
255.82% |
13508.214 |
48065.224 |
469.370 |
0.60% |
469.370 |
|
MultiSource/Benchmarks/TSVC/Expansion-dbl/Expansion-dbl
|
253.21% |
20.926 |
73.913 |
0.146 |
-9.93% |
0.146 |
|
SingleSource/Benchmarks/Stanford/RealMM
|
251.99% |
0.006 |
0.020 |
0.000 |
-2.49% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecInLoopWithVW8From_uint8_t_To_uint64_t_
|
248.18% |
13351.372 |
46486.492 |
468.606 |
-0.55% |
468.606 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW4LoopWithReductionTC31
|
245.56% |
44.430 |
153.536 |
1.156 |
-2.93% |
1.156 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecInLoopWithVW16From_uint32_t_To_uint8_t_
|
245.08% |
11194.264 |
38629.344 |
761.789 |
-9.56% |
761.789 |
|
SingleSource/Benchmarks/Polybench/linear-algebra/kernels/atax/atax
|
243.09% |
0.111 |
0.380 |
0.001 |
10.74% |
0.001 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecInLoopWithVW8From_uint64_t_To_uint8_t_
|
242.90% |
22921.174 |
78595.854 |
1687.790 |
-11.59% |
1687.790 |
|
MultiSource/Benchmarks/TSVC/ControlFlow-dbl/ControlFlow-dbl
|
235.46% |
24.480 |
82.120 |
1.771 |
-2.83% |
1.771 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW4LoopWithReductionTC16
|
232.32% |
31.912 |
106.050 |
0.581 |
2.65% |
0.581 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecWithAddInLoopWithVW8From_uint32_t_To_uint64_t_
|
231.46% |
25629.754 |
84953.661 |
2160.809 |
-5.04% |
2160.809 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW4LoopWithReductionTC63
|
231.26% |
76.087 |
252.050 |
5.433 |
-0.08% |
5.433 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecWithAddInLoopWithVW16From_uint8_t_To_uint64_t_
|
229.16% |
22741.309 |
74854.871 |
776.645 |
18.88% |
776.645 |
|
MicroBenchmarks/LCALS/SubsetBRawLoops/lcalsBRaw.test:BM_INIT3_RAW/5001
|
228.66% |
41.551 |
136.561 |
6.236 |
-0.49% |
6.236 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecWithAddInLoopWithVW16From_uint16_t_To_uint64_t_
|
226.86% |
23706.007 |
77486.622 |
1163.780 |
27.04% |
1163.780 |
|
MultiSource/Benchmarks/BitBench/uuencode/uuencode
|
226.85% |
0.035 |
0.113 |
0.001 |
-0.68% |
0.001 |
|
External/SPEC/CFP2017rate/538.imagick_r/538.imagick_r
|
220.49% |
292.125 |
936.234 |
1.733 |
-2.70% |
1.733 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW1LoopWithReductionTC16
|
220.41% |
31.909 |
102.241 |
2.779 |
-0.57% |
2.779 |
|
MicroBenchmarks/SLPVectorization/SLPVectorizationBenchmarks.test:benchmark_multiply_accumulate_runtime_checks_fail<3, double>
|
218.20% |
15.016 |
47.782 |
1.465 |
0.01% |
1.465 |
|
SingleSource/Benchmarks/Adobe-C++/loop_unroll
|
218.15% |
4.122 |
13.113 |
0.013 |
0.03% |
0.013 |
|
SingleSource/Benchmarks/Shootout/Shootout-ary3
|
217.34% |
3.718 |
11.800 |
0.264 |
-9.26% |
0.264 |
|
MultiSource/Benchmarks/Rodinia/srad/srad
|
217.24% |
1.751 |
5.557 |
0.026 |
-0.16% |
0.026 |
|
SingleSource/Benchmarks/Shootout-C++/Shootout-C++-ary3
|
216.75% |
3.755 |
11.894 |
0.252 |
-2.31% |
0.252 |
|
SingleSource/Benchmarks/BenchmarkGame/spectral-norm
|
215.12% |
1.577 |
4.970 |
0.010 |
-32.96% |
0.010 |
|
MicroBenchmarks/LCALS/SubsetBLambdaLoops/lcalsBLambda.test:BM_INIT3_LAMBDA/44217
|
213.20% |
396.838 |
1242.916 |
25.029 |
-5.16% |
25.029 |
|
MultiSource/Benchmarks/TSVC/LinearDependence-flt/LinearDependence-flt
|
212.24% |
14.797 |
46.201 |
0.249 |
0.21% |
0.249 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:BENCHMARK_acosf_autovec_float_
|
211.94% |
845.160 |
2636.353 |
59.792 |
-0.79% |
59.792 |
|
MicroBenchmarks/LCALS/SubsetBRawLoops/lcalsBRaw.test:BM_INIT3_RAW/44217
|
211.02% |
388.787 |
1209.197 |
56.361 |
-0.56% |
56.361 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:BENCHMARK_acosf_novec_float_
|
210.91% |
845.032 |
2627.281 |
73.886 |
-1.17% |
73.886 |
|
MultiSource/Benchmarks/TSVC/LoopRerolling-dbl/LoopRerolling-dbl
|
209.13% |
15.762 |
48.725 |
1.807 |
-0.55% |
1.807 |
|
MicroBenchmarks/SLPVectorization/SLPVectorizationBenchmarks.test:benchmark_multiply_accumulate_runtime_checks_pass<2, double>
|
208.63% |
10.011 |
30.896 |
0.167 |
-0.04% |
0.167 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW4LoopWithReductionTC16
|
207.76% |
33.162 |
102.059 |
1.883 |
-0.09% |
1.883 |
|
SingleSource/Benchmarks/Polybench/linear-algebra/blas/symm/symm
|
207.60% |
0.007 |
0.023 |
0.000 |
-1.95% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:BENCHMARK_sinhf_autovec_float_
|
207.12% |
2242.828 |
6888.138 |
13.999 |
0.15% |
13.999 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecWithAddInLoopWithVW16From_uint32_t_To_uint16_t_
|
206.72% |
13402.118 |
41107.599 |
797.843 |
1.04% |
797.843 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecInLoopWithVW8From_uint64_t_To_uint16_t_
|
205.70% |
21956.060 |
67119.891 |
213.601 |
-8.51% |
213.601 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:BENCHMARK_sinhf_novec_float_
|
205.17% |
2242.014 |
6841.965 |
31.372 |
0.37% |
31.372 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecWithAddInLoopWithVW8From_uint64_t_To_uint32_t_
|
201.88% |
26121.349 |
78856.155 |
366.439 |
9.03% |
366.439 |
|
MicroBenchmarks/LCALS/SubsetCRawLoops/lcalsCRaw.test:BM_HYDRO_2D_RAW/171
|
201.02% |
91.312 |
274.872 |
9.635 |
0.33% |
9.635 |
|
MultiSource/Benchmarks/FreeBench/mason/mason
|
200.35% |
0.534 |
1.605 |
0.006 |
-0.76% |
0.006 |
|
MicroBenchmarks/SLPVectorization/SLPVectorizationBenchmarks.test:benchmark_multiply_accumulate_runtime_checks_fail<2, double>
|
197.40% |
13.139 |
39.075 |
0.188 |
-0.04% |
0.188 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecWithAddInLoopWithVW16From_uint32_t_To_uint64_t_
|
197.22% |
25269.972 |
75108.580 |
1244.318 |
34.33% |
1244.318 |
|
MultiSource/Benchmarks/TSVC/InductionVariable-dbl/InductionVariable-dbl
|
196.53% |
22.105 |
65.548 |
2.368 |
-6.06% |
2.368 |
|
MultiSource/Benchmarks/TSVC/LoopRerolling-flt/LoopRerolling-flt
|
191.12% |
11.643 |
33.894 |
0.569 |
-3.95% |
0.569 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW4LoopWithReductionTC15
|
191.02% |
32.552 |
94.732 |
0.345 |
2.41% |
0.345 |
|
MultiSource/Benchmarks/VersaBench/beamformer/beamformer
|
188.71% |
3.844 |
11.098 |
0.021 |
-0.57% |
0.021 |
|
MicroBenchmarks/ImageProcessing/Dither/Dither.test:BENCHMARK_ORDERED_DITHER/512/2
|
188.10% |
3696.957 |
10650.754 |
199.038 |
-1.81% |
199.038 |
|
MicroBenchmarks/ImageProcessing/Dither/Dither.test:BENCHMARK_ORDERED_DITHER/512/4
|
184.28% |
3744.814 |
10645.873 |
245.538 |
-1.91% |
245.538 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW1BigLoopWithReductionTC3
|
183.85% |
49.432 |
140.314 |
2.450 |
-0.18% |
2.450 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW4LoopWithReductionTC1
|
183.71% |
11.262 |
31.952 |
1.206 |
36.87% |
1.206 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW4BigLoopTC16
|
183.17% |
232.290 |
657.788 |
5.289 |
-0.22% |
5.289 |
|
SingleSource/Benchmarks/Shootout-C++/Shootout-C++-methcall
|
183.12% |
14.609 |
41.361 |
0.048 |
-0.10% |
0.048 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW4LoopWithReductionTC8
|
182.52% |
25.029 |
70.711 |
1.273 |
-11.47% |
1.273 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW1LoopWithReductionTC15
|
180.94% |
32.535 |
91.405 |
1.582 |
0.08% |
1.582 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW4LoopWithReductionTC8
|
179.76% |
25.654 |
71.769 |
0.657 |
1.15% |
0.657 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW4BigLoopTC32
|
179.52% |
458.733 |
1282.251 |
14.953 |
0.12% |
14.953 |
|
MicroBenchmarks/ImageProcessing/Dither/Dither.test:BENCHMARK_ORDERED_DITHER/512/8
|
178.59% |
3820.767 |
10644.233 |
234.923 |
-1.80% |
234.923 |
|
MultiSource/Benchmarks/Prolangs-C++/city/city
|
175.97% |
0.019 |
0.052 |
0.001 |
-1.13% |
0.001 |
|
MicroBenchmarks/ImageProcessing/Dither/Dither.test:BENCHMARK_ORDERED_DITHER/256/2
|
174.97% |
973.559 |
2676.970 |
70.480 |
-1.40% |
70.480 |
|
MultiSource/Benchmarks/DOE-ProxyApps-C/miniGMG/miniGMG
|
174.73% |
4.608 |
12.660 |
0.280 |
-0.78% |
0.280 |
|
MultiSource/Benchmarks/SciMark2-C/scimark2
|
174.08% |
108.017 |
296.051 |
1.040 |
1.13% |
1.040 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW1LoopWithReductionTC8
|
174.02% |
25.653 |
70.293 |
1.363 |
-0.11% |
1.363 |
|
SingleSource/Benchmarks/BenchmarkGame/n-body
|
171.90% |
2.167 |
5.891 |
0.014 |
-0.62% |
0.014 |
|
MicroBenchmarks/LCALS/SubsetBRawLoops/lcalsBRaw.test:BM_TRAP_INT_RAW/171
|
170.68% |
2.512 |
6.799 |
0.273 |
-0.05% |
0.273 |
|
MicroBenchmarks/ImageProcessing/Dither/Dither.test:BENCHMARK_ORDERED_DITHER/256/4
|
170.17% |
989.360 |
2672.981 |
61.583 |
-2.03% |
61.583 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW4BigLoopTC128
|
168.61% |
1808.861 |
4858.782 |
103.362 |
-1.81% |
103.362 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW1LoopWithReductionTC1
|
168.22% |
11.889 |
31.887 |
1.212 |
36.37% |
1.212 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW4BigLoopTC64
|
167.82% |
920.033 |
2464.077 |
47.476 |
-1.42% |
47.476 |
|
MicroBenchmarks/LCALS/SubsetBRawLoops/lcalsBRaw.test:BM_TRAP_INT_RAW/5001
|
167.72% |
72.035 |
192.852 |
8.624 |
-0.28% |
8.624 |
|
MicroBenchmarks/LCALS/SubsetBRawLoops/lcalsBRaw.test:BM_TRAP_INT_RAW/44217
|
167.30% |
636.410 |
1701.092 |
72.299 |
-0.22% |
72.299 |
|
MicroBenchmarks/LCALS/SubsetCRawLoops/lcalsCRaw.test:BM_PIC_1D_RAW/171
|
167.22% |
7.634 |
20.400 |
0.837 |
0.16% |
0.837 |
|
MicroBenchmarks/ImageProcessing/Dither/Dither.test:BENCHMARK_ORDERED_DITHER/256/8
|
166.80% |
1011.505 |
2698.675 |
34.848 |
-1.11% |
34.848 |
|
MicroBenchmarks/ImageProcessing/Dither/Dither.test:BENCHMARK_ORDERED_DITHER/128/2
|
164.62% |
254.596 |
673.702 |
12.525 |
-1.26% |
12.525 |
|
MicroBenchmarks/ImageProcessing/Dither/Dither.test:BENCHMARK_ORDERED_DITHER/128/4
|
163.32% |
256.177 |
674.572 |
15.211 |
-0.86% |
15.211 |
|
MultiSource/Applications/JM/lencod/lencod
|
163.29% |
28.841 |
75.936 |
0.417 |
11.06% |
0.417 |
|
MicroBenchmarks/LCALS/SubsetBLambdaLoops/lcalsBLambda.test:BM_TRAP_INT_LAMBDA/171
|
163.09% |
2.512 |
6.608 |
0.087 |
-1.07% |
0.087 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW1LoopWithReductionTC1
|
162.48% |
8.135 |
21.352 |
0.806 |
0.18% |
0.806 |
|
MultiSource/Benchmarks/mediabench/jpeg/jpeg-6a/cjpeg
|
161.95% |
0.013 |
0.034 |
0.000 |
0.00% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW4LoopTC31
|
161.46% |
94.475 |
247.020 |
3.283 |
-0.08% |
3.283 |
|
MicroBenchmarks/LCALS/SubsetBLambdaLoops/lcalsBLambda.test:BM_TRAP_INT_LAMBDA/5001
|
159.99% |
72.053 |
187.333 |
2.783 |
-0.82% |
2.783 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecInLoopWithVW16From_uint32_t_To_uint16_t_
|
159.58% |
11626.925 |
30181.264 |
628.710 |
0.58% |
628.710 |
|
MicroBenchmarks/LCALS/SubsetBLambdaLoops/lcalsBLambda.test:BM_TRAP_INT_LAMBDA/44217
|
159.45% |
636.397 |
1651.150 |
28.192 |
-1.55% |
28.192 |
|
MicroBenchmarks/ImageProcessing/Dither/Dither.test:BENCHMARK_ORDERED_DITHER/128/8
|
158.17% |
260.963 |
673.739 |
15.923 |
-0.77% |
15.923 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:BENCHMARK_acos_autovec_double_
|
157.45% |
1016.477 |
2616.940 |
36.360 |
-0.19% |
36.360 |
|
SingleSource/Benchmarks/Misc/evalloop
|
156.55% |
2.281 |
5.852 |
0.021 |
-0.05% |
0.021 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW4LoopTC15
|
156.24% |
54.443 |
139.506 |
1.459 |
0.90% |
1.459 |
|
SingleSource/Benchmarks/Misc-C++/Large/ray
|
156.21% |
12.160 |
31.154 |
0.700 |
-3.44% |
0.700 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW4LoopTC7
|
155.63% |
34.413 |
87.972 |
0.637 |
1.62% |
0.637 |
|
MicroBenchmarks/SLPVectorization/SLPVectorizationBenchmarks.test:benchmark_xor_runtime_checks_pass<4, int>
|
155.08% |
8.762 |
22.351 |
0.053 |
-0.25% |
0.053 |
|
MicroBenchmarks/ImageProcessing/Interpolation/Interpolation.test:BENCHMARK_BILINEAR_INTERPOLATION/32
|
153.74% |
482.548 |
1224.414 |
16.884 |
0.86% |
16.884 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:BENCHMARK_asinf_novec_float_
|
153.61% |
1011.746 |
2565.936 |
40.941 |
-1.68% |
40.941 |
|
MicroBenchmarks/ImageProcessing/Interpolation/Interpolation.test:BENCHMARK_BILINEAR_INTERPOLATION/64
|
153.36% |
1954.856 |
4952.767 |
59.987 |
1.01% |
59.987 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:BENCHMARK_acos_novec_double_
|
152.90% |
1016.413 |
2570.508 |
47.002 |
0.10% |
47.002 |
|
MicroBenchmarks/ImageProcessing/Interpolation/Interpolation.test:BENCHMARK_BILINEAR_INTERPOLATION/16
|
152.33% |
117.697 |
296.986 |
5.432 |
-0.00% |
5.432 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecInLoopWithVW8From_uint32_t_To_uint64_t_
|
152.31% |
19625.761 |
49517.641 |
871.675 |
1.17% |
871.675 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecInLoopWithVW8From_uint64_t_To_uint32_t_
|
152.18% |
20360.427 |
51344.945 |
498.250 |
0.63% |
498.250 |
|
MultiSource/Applications/lambda-0.1.3/lambda
|
151.44% |
14.335 |
36.045 |
0.307 |
-1.38% |
0.307 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW4LoopWithReductionTC2
|
150.30% |
13.141 |
32.892 |
0.984 |
35.40% |
0.984 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:BENCHMARK_asinf_autovec_float_
|
150.10% |
1010.730 |
2527.804 |
56.644 |
-3.15% |
56.644 |
|
MultiSource/Benchmarks/Rodinia/hotspot/hotspot
|
149.22% |
2.068 |
5.155 |
0.049 |
-2.92% |
0.049 |
|
MicroBenchmarks/ImageProcessing/Interpolation/Interpolation.test:BENCHMARK_BILINEAR_INTERPOLATION/256
|
149.17% |
32057.543 |
79878.367 |
1113.630 |
1.17% |
1113.630 |
|
MicroBenchmarks/ImageProcessing/Interpolation/Interpolation.test:BENCHMARK_BILINEAR_INTERPOLATION/128
|
147.96% |
8043.830 |
19945.741 |
256.150 |
1.54% |
256.150 |
|
SingleSource/Benchmarks/Misc/revertBits
|
146.97% |
0.641 |
1.584 |
0.003 |
-19.47% |
0.003 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW4BigLoopWithReductionTC31
|
146.17% |
241.989 |
595.702 |
9.956 |
0.13% |
9.956 |
|
MultiSource/Benchmarks/TSVC/LinearDependence-dbl/LinearDependence-dbl
|
145.13% |
24.571 |
60.230 |
0.912 |
-0.07% |
0.912 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW4LoopWithReductionTC4
|
144.06% |
22.526 |
54.976 |
0.977 |
1.21% |
0.977 |
|
MultiSource/Benchmarks/MiBench/security-rijndael/security-rijndael
|
143.98% |
0.308 |
0.752 |
0.015 |
-8.69% |
0.015 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW4BigLoopWithReductionTC7
|
140.72% |
73.835 |
177.734 |
5.599 |
-0.53% |
5.599 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW1LoopWithReductionTC4
|
140.30% |
22.526 |
54.129 |
1.166 |
-0.29% |
1.166 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW4BigLoopWithReductionTC15
|
139.84% |
130.774 |
313.647 |
4.822 |
-1.68% |
4.822 |
|
MicroBenchmarks/SLPVectorization/SLPVectorizationBenchmarks.test:benchmark_multiply_accumulate_runtime_checks_pass<3, double>
|
139.38% |
15.016 |
35.946 |
0.141 |
0.08% |
0.141 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW1BigLoopWithReductionTC7
|
139.29% |
73.835 |
176.682 |
3.389 |
-0.08% |
3.389 |
|
MicroBenchmarks/LCALS/SubsetARawLoops/lcalsARaw.test:BM_ENERGY_CALC_RAW/171
|
138.88% |
14.169 |
33.848 |
0.119 |
-1.13% |
0.119 |
|
MicroBenchmarks/LCALS/SubsetALambdaLoops/lcalsALambda.test:BM_ENERGY_CALC_LAMBDA/171
|
137.31% |
14.144 |
33.564 |
0.772 |
-0.54% |
0.772 |
|
MultiSource/Benchmarks/nbench/nbench
|
134.29% |
6.144 |
14.396 |
0.245 |
-2.22% |
0.245 |
|
MultiSource/Benchmarks/TSVC/StatementReordering-flt/StatementReordering-flt
|
131.57% |
14.261 |
33.023 |
0.014 |
52.60% |
0.014 |
|
MicroBenchmarks/SLPVectorization/SLPVectorizationBenchmarks.test:benchmark_multiply_accumulate_runtime_checks_fail<4, double>
|
129.58% |
20.647 |
47.403 |
0.069 |
-0.04% |
0.069 |
|
MultiSource/Benchmarks/TSVC/ControlFlow-flt/ControlFlow-flt
|
128.76% |
30.814 |
70.490 |
0.513 |
-0.54% |
0.513 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW1LoopWithReductionTC7
|
126.56% |
26.279 |
59.536 |
2.168 |
3.02% |
2.168 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:BENCHMARK_sinf_novec_float_
|
124.16% |
1158.484 |
2596.849 |
36.864 |
-2.05% |
36.864 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:BENCHMARK_sinf_autovec_float_
|
122.82% |
1158.515 |
2581.428 |
47.500 |
-0.31% |
47.500 |
|
MultiSource/Benchmarks/PAQ8p/paq8p
|
122.34% |
165.774 |
368.582 |
3.537 |
-1.05% |
3.537 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW4LoopWithReductionTC3
|
122.03% |
15.327 |
34.031 |
1.091 |
35.74% |
1.091 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW4LoopWithReductionTC7
|
121.70% |
26.646 |
59.074 |
2.528 |
-0.47% |
2.528 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW1LoopWithReductionTC2
|
120.89% |
10.011 |
22.113 |
0.634 |
-0.06% |
0.634 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW4LoopWithReductionTC15
|
119.30% |
37.090 |
81.339 |
3.011 |
-10.45% |
3.011 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:BENCHMARK_cosf_novec_float_
|
117.75% |
1010.664 |
2200.670 |
22.327 |
-0.49% |
22.327 |
|
SingleSource/Benchmarks/Adobe-C++/stepanov_vector
|
117.21% |
8.110 |
17.616 |
0.155 |
-0.90% |
0.155 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:BENCHMARK_cosf_autovec_float_
|
116.65% |
1010.625 |
2189.530 |
22.245 |
0.06% |
22.245 |
|
MicroBenchmarks/LCALS/SubsetARawLoops/lcalsARaw.test:BM_ENERGY_CALC_RAW/5001
|
113.29% |
457.167 |
975.092 |
4.777 |
-1.43% |
4.777 |
|
MicroBenchmarks/LCALS/SubsetALambdaLoops/lcalsALambda.test:BM_ENERGY_CALC_LAMBDA/5001
|
111.65% |
456.570 |
966.351 |
24.573 |
-1.53% |
24.573 |
|
MicroBenchmarks/SLPVectorization/SLPVectorizationBenchmarks.test:benchmark_xor_runtime_checks_fail<4, int>
|
110.36% |
10.644 |
22.391 |
0.044 |
-0.33% |
0.044 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW4LoopWithReductionTC31
|
109.50% |
60.069 |
125.842 |
0.865 |
0.23% |
0.865 |
|
SingleSource/Benchmarks/Polybench/linear-algebra/kernels/doitgen/doitgen
|
109.29% |
12.677 |
26.532 |
0.072 |
-3.08% |
0.072 |
|
MultiSource/Benchmarks/TSVC/CrossingThresholds-dbl/CrossingThresholds-dbl
|
109.13% |
28.070 |
58.704 |
1.168 |
-0.39% |
1.168 |
|
MultiSource/Benchmarks/TSVC/NodeSplitting-flt/NodeSplitting-flt
|
106.42% |
17.842 |
36.829 |
0.035 |
-0.07% |
0.035 |
|
MultiSource/Benchmarks/McCat/05-eks/eks
|
103.40% |
0.016 |
0.033 |
0.000 |
-0.27% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW4BigLoopTC16
|
102.73% |
324.162 |
657.166 |
11.579 |
-0.19% |
11.579 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW4LoopWithReductionTC1
|
102.27% |
11.262 |
22.780 |
0.845 |
-28.63% |
0.845 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW1LoopWithReductionTC1
|
101.72% |
11.263 |
22.720 |
0.899 |
0.03% |
0.899 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW4BigLoopTC32
|
101.25% |
628.757 |
1265.367 |
27.008 |
-0.53% |
27.008 |
|
SingleSource/Benchmarks/Misc-C++/mandel-text
|
100.86% |
4.244 |
8.524 |
0.014 |
-0.26% |
0.014 |
|
MultiSource/Benchmarks/mediabench/g721/g721encode/encode
|
100.61% |
0.098 |
0.197 |
0.002 |
6.91% |
0.002 |
|
MicroBenchmarks/ImageProcessing/Dither/Dither.test:BENCHMARK_FLOYD_DITHER/512
|
100.54% |
6824.997 |
13686.628 |
187.753 |
-4.74% |
187.753 |
|
MultiSource/Applications/hbd/hbd
|
100.07% |
0.015 |
0.029 |
0.000 |
-0.20% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:BENCHMARK_asin_novec_double_
|
99.99% |
1211.601 |
2423.023 |
40.907 |
-1.57% |
40.907 |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<2, GreaterThanZero, Mid>
|
99.46% |
56743.288 |
113181.775 |
647.899 |
48.70% |
647.899 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:BENCHMARK_asin_autovec_double_
|
99.04% |
1212.371 |
2413.051 |
51.438 |
-2.52% |
51.438 |
|
SingleSource/Benchmarks/Stanford/Puzzle
|
97.51% |
0.203 |
0.400 |
0.002 |
0.10% |
0.002 |
|
MicroBenchmarks/LCALS/SubsetARawLoops/lcalsARaw.test:BM_ENERGY_CALC_RAW/44217
|
97.15% |
4368.480 |
8612.380 |
54.226 |
-1.35% |
54.226 |
|
MicroBenchmarks/harris/harris.test:BENCHMARK_HARRIS/256/256
|
95.99% |
10472.455 |
20524.617 |
211.117 |
-0.55% |
211.117 |
|
MultiSource/Benchmarks/mediabench/gsm/toast/toast
|
95.76% |
0.086 |
0.168 |
0.001 |
-2.79% |
0.001 |
|
MultiSource/Benchmarks/MiBench/consumer-jpeg/consumer-jpeg
|
95.32% |
0.016 |
0.032 |
0.000 |
-3.77% |
0.000 |
|
MicroBenchmarks/harris/harris.test:BENCHMARK_HARRIS/512/512
|
94.80% |
42225.127 |
82255.905 |
621.088 |
-0.15% |
621.088 |
|
SingleSource/Benchmarks/Misc/dt
|
94.64% |
1.861 |
3.622 |
0.079 |
-2.38% |
0.079 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW4BigLoopTC64
|
94.56% |
1258.359 |
2448.275 |
69.369 |
-2.38% |
69.369 |
|
MicroBenchmarks/LCALS/SubsetALambdaLoops/lcalsALambda.test:BM_ENERGY_CALC_LAMBDA/44217
|
93.54% |
4416.871 |
8548.377 |
214.660 |
-1.16% |
214.660 |
|
MicroBenchmarks/harris/harris.test:BENCHMARK_HARRIS/1024/1024
|
93.44% |
169846.239 |
328551.320 |
2471.770 |
-0.49% |
2471.770 |
|
MicroBenchmarks/ImageProcessing/AnisotropicDiffusion/AnisotropicDiffusion.test:BENCHMARK_ANISTROPIC_DIFFUSION/32
|
93.41% |
2177.895 |
4212.285 |
38.488 |
-3.78% |
38.488 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW4BigLoopTC8
|
93.24% |
179.690 |
347.237 |
7.121 |
0.93% |
7.121 |
|
MicroBenchmarks/ImageProcessing/AnisotropicDiffusion/AnisotropicDiffusion.test:BENCHMARK_ANISTROPIC_DIFFUSION/64
|
93.16% |
9961.463 |
19241.633 |
176.075 |
-3.87% |
176.075 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:BENCHMARK_expf_novec_float_
|
91.74% |
902.621 |
1730.689 |
25.973 |
-0.26% |
25.973 |
|
MicroBenchmarks/ImageProcessing/AnisotropicDiffusion/AnisotropicDiffusion.test:BENCHMARK_ANISTROPIC_DIFFUSION/128
|
91.56% |
43112.976 |
82586.215 |
769.737 |
-3.84% |
769.737 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW4LoopWithReductionTC1
|
90.89% |
11.889 |
22.696 |
0.916 |
-0.47% |
0.916 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW4BigLoopTC128
|
90.06% |
2541.619 |
4830.505 |
149.405 |
-2.60% |
149.405 |
|
MicroBenchmarks/ImageProcessing/Dither/Dither.test:BENCHMARK_FLOYD_DITHER/256
|
89.52% |
1793.443 |
3398.876 |
59.387 |
-4.73% |
59.387 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:BENCHMARK_expf_autovec_float_
|
89.15% |
914.201 |
1729.251 |
21.151 |
0.82% |
21.151 |
|
MicroBenchmarks/LCALS/SubsetARawLoops/lcalsARaw.test:BM_COUPLE_RAW/2
|
89.06% |
10.961 |
20.722 |
0.075 |
-0.28% |
0.075 |
|
SingleSource/Benchmarks/CoyoteBench/almabench
|
88.82% |
37.316 |
70.459 |
0.174 |
-0.90% |
0.174 |
|
External/SPEC/CFP2017rate/508.namd_r/508.namd_r
|
87.92% |
221.291 |
415.855 |
0.689 |
-1.16% |
0.689 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecWithAddInLoopWithVW16From_uint64_t_To_uint8_t_
|
87.69% |
30357.854 |
56978.941 |
1796.798 |
-24.55% |
1796.798 |
|
MultiSource/Benchmarks/Prolangs-C/agrep/agrep
|
87.45% |
0.012 |
0.022 |
0.000 |
0.32% |
0.000 |
|
MicroBenchmarks/LCALS/SubsetALambdaLoops/lcalsALambda.test:BM_COUPLE_LAMBDA/2
|
87.22% |
10.917 |
20.439 |
0.139 |
-0.15% |
0.139 |
|
MultiSource/Benchmarks/MiBench/telecomm-gsm/telecomm-gsm
|
85.58% |
0.659 |
1.223 |
0.003 |
-2.52% |
0.003 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:BENCHMARK_atanf_autovec_float_
|
85.31% |
1581.765 |
2931.144 |
22.052 |
-0.54% |
22.052 |
|
MicroBenchmarks/ImageProcessing/Dither/Dither.test:BENCHMARK_FLOYD_DITHER/128
|
85.21% |
452.985 |
838.983 |
14.855 |
-4.68% |
14.855 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:BENCHMARK_atanf_novec_float_
|
85.16% |
1583.489 |
2931.986 |
28.540 |
-0.74% |
28.540 |
|
MicroBenchmarks/ImageProcessing/AnisotropicDiffusion/AnisotropicDiffusion.test:BENCHMARK_ANISTROPIC_DIFFUSION/256
|
84.66% |
184824.114 |
341287.256 |
2814.993 |
-3.74% |
2814.993 |
|
MicroBenchmarks/LCALS/SubsetARawLoops/lcalsARaw.test:BM_COUPLE_RAW/1
|
84.65% |
1394.542 |
2575.064 |
10.548 |
-0.51% |
10.548 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW4LoopTC1
|
82.29% |
12.517 |
22.818 |
0.881 |
0.69% |
0.881 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW4BigLoopTC8
|
82.09% |
195.717 |
356.380 |
7.075 |
0.35% |
7.075 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW4LoopTC1
|
81.93% |
12.515 |
22.768 |
0.859 |
0.87% |
0.859 |
|
MicroBenchmarks/LCALS/SubsetALambdaLoops/lcalsALambda.test:BM_COUPLE_LAMBDA/1
|
81.37% |
1397.283 |
2534.263 |
36.717 |
-0.27% |
36.717 |
|
MicroBenchmarks/LCALS/SubsetARawLoops/lcalsARaw.test:BM_COUPLE_RAW/0
|
80.65% |
8317.009 |
15024.932 |
34.976 |
-0.44% |
34.976 |
|
MultiSource/Benchmarks/MallocBench/gs/gs
|
80.26% |
0.137 |
0.247 |
0.000 |
1.07% |
0.000 |
|
MultiSource/Benchmarks/FreeBench/distray/distray
|
79.70% |
0.447 |
0.803 |
0.004 |
-0.54% |
0.004 |
|
MicroBenchmarks/LCALS/SubsetALambdaLoops/lcalsALambda.test:BM_COUPLE_LAMBDA/0
|
79.39% |
8232.558 |
14768.049 |
122.336 |
-0.33% |
122.336 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:BENCHMARK_cos_autovec_double_
|
79.18% |
2393.456 |
4288.489 |
79.171 |
0.32% |
79.171 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW1LoopWithReductionTC2
|
78.98% |
13.139 |
23.516 |
0.723 |
-0.44% |
0.723 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW1LoopWithReductionTC2
|
78.48% |
13.153 |
23.475 |
0.699 |
-0.04% |
0.699 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecWithAddInLoopWithVW16From_uint64_t_To_uint16_t_
|
78.47% |
29637.872 |
52894.501 |
75.289 |
-26.01% |
75.289 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW4LoopWithReductionTC2
|
78.35% |
13.199 |
23.542 |
0.769 |
-28.27% |
0.769 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:BENCHMARK_sinh_novec_double_
|
78.29% |
2481.125 |
4423.576 |
48.659 |
-1.27% |
48.659 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:BENCHMARK_cos_novec_double_
|
78.22% |
2393.141 |
4265.117 |
84.314 |
-0.59% |
84.314 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW1LoopWithReductionTC3
|
78.03% |
13.008 |
23.157 |
0.699 |
0.73% |
0.699 |
|
MultiSource/Benchmarks/TSVC/NodeSplitting-dbl/NodeSplitting-dbl
|
77.52% |
26.055 |
46.252 |
0.026 |
1.30% |
0.026 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecInLoopWithVW16From_uint16_t_To_uint64_t_
|
76.64% |
18444.083 |
32578.735 |
639.522 |
-28.09% |
639.522 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW4LoopTC1
|
75.16% |
13.140 |
23.016 |
2.006 |
0.00% |
2.006 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:BENCHMARK_sinh_autovec_double_
|
74.91% |
2481.375 |
4340.098 |
95.721 |
-2.15% |
95.721 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW4BigLoopTC16
|
74.59% |
377.105 |
658.380 |
9.679 |
-0.11% |
9.679 |
|
SingleSource/Benchmarks/BenchmarkGame/partialsums
|
73.70% |
1.057 |
1.836 |
0.005 |
-0.69% |
0.005 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:BENCHMARK_exp_autovec_double_
|
72.87% |
1128.378 |
1950.588 |
5.965 |
-0.24% |
5.965 |
|
MultiSource/Applications/oggenc/oggenc
|
72.72% |
0.395 |
0.681 |
0.003 |
-0.36% |
0.003 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:BENCHMARK_cbrt_novec_double_
|
72.69% |
3148.754 |
5437.435 |
49.036 |
-0.93% |
49.036 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecInLoopWithVW16From_uint8_t_To_uint64_t_
|
71.62% |
17786.071 |
30525.057 |
283.416 |
-28.90% |
283.416 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:BENCHMARK_cbrt_autovec_double_
|
70.26% |
3149.155 |
5361.902 |
109.289 |
0.84% |
109.289 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:BENCHMARK_exp_novec_double_
|
69.75% |
1128.795 |
1916.097 |
22.503 |
-0.60% |
22.503 |
|
SingleSource/Benchmarks/Shootout/Shootout-fib2
|
69.60% |
5.814 |
9.861 |
0.168 |
-0.19% |
0.168 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW4BigLoopTC32
|
69.38% |
750.661 |
1271.446 |
20.313 |
-0.25% |
20.313 |
|
External/SPEC/CINT2017rate/523.xalancbmk_r/523.xalancbmk_r
|
68.40% |
229.235 |
386.022 |
45.044 |
-0.32% |
45.044 |
|
SingleSource/Benchmarks/Misc/mandel-2
|
68.18% |
2.535 |
4.263 |
0.011 |
0.00% |
0.011 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW4BigLoopTC64
|
67.94% |
1461.368 |
2454.208 |
64.076 |
-1.15% |
64.076 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:BENCHMARK_sin_novec_double_
|
66.85% |
2370.819 |
3955.675 |
145.620 |
0.80% |
145.620 |
|
SingleSource/Benchmarks/Misc/whetstone
|
66.39% |
3.086 |
5.134 |
0.153 |
-0.35% |
0.153 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:BENCHMARK_sin_autovec_double_
|
65.99% |
2370.684 |
3935.019 |
135.160 |
0.37% |
135.160 |
|
MultiSource/Benchmarks/McCat/08-main/main
|
65.69% |
0.143 |
0.237 |
0.001 |
-0.17% |
0.001 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW4BigLoopTC4
|
64.81% |
114.180 |
188.184 |
2.503 |
-0.11% |
2.503 |
|
MicroBenchmarks/LCALS/SubsetCRawLoops/lcalsCRaw.test:BM_PIC_1D_RAW/5001
|
64.65% |
356.939 |
587.713 |
27.851 |
0.04% |
27.851 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW4BigLoopTC128
|
64.17% |
2963.051 |
4864.518 |
126.908 |
-1.04% |
126.908 |
|
SingleSource/Benchmarks/Misc/flops-3
|
63.33% |
9.000 |
14.700 |
0.059 |
-0.29% |
0.059 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW4LoopWithReductionTC2
|
61.94% |
14.588 |
23.624 |
0.858 |
0.14% |
0.858 |
|
SingleSource/Benchmarks/Shootout-C++/Shootout-C++-fibo
|
61.93% |
5.819 |
9.424 |
0.040 |
-0.41% |
0.040 |
|
SingleSource/Benchmarks/Polybench/linear-algebra/solvers/trisolv/trisolv
|
61.19% |
0.071 |
0.114 |
0.001 |
55.86% |
0.001 |
|
MultiSource/Benchmarks/Bullet/bullet
|
61.11% |
31.107 |
50.118 |
0.050 |
1.00% |
0.050 |
|
SingleSource/Benchmarks/BenchmarkGame/recursive
|
60.66% |
3.760 |
6.041 |
0.014 |
-0.02% |
0.014 |
|
MicroBenchmarks/SLPVectorization/SLPVectorizationBenchmarks.test:benchmark_multiply_accumulate_runtime_checks_pass<4, double>
|
60.24% |
20.647 |
33.084 |
0.903 |
-20.07% |
0.903 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW1LoopWithReductionTC4
|
59.19% |
15.017 |
23.904 |
0.676 |
0.17% |
0.676 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW1LoopWithReductionTC4
|
59.13% |
15.642 |
24.892 |
0.802 |
0.44% |
0.802 |
|
MicroBenchmarks/ImageProcessing/BilateralFiltering/BilateralFilter.test:BENCHMARK_BILATERAL_FILTER/32/4
|
58.11% |
1951.588 |
3085.587 |
18.274 |
-2.01% |
18.274 |
|
MicroBenchmarks/ImageProcessing/BilateralFiltering/BilateralFilter.test:BENCHMARK_BILATERAL_FILTER/64/4
|
58.03% |
8966.196 |
14169.643 |
91.117 |
-1.94% |
91.117 |
|
MicroBenchmarks/ImageProcessing/BilateralFiltering/BilateralFilter.test:BENCHMARK_BILATERAL_FILTER/16/4
|
57.99% |
358.482 |
566.356 |
4.241 |
-1.59% |
4.241 |
|
MultiSource/Benchmarks/tramp3d-v4/tramp3d-v4
|
57.54% |
1.092 |
1.720 |
0.018 |
-0.72% |
0.018 |
|
SingleSource/Benchmarks/SmallPT/smallpt
|
57.34% |
30.189 |
47.499 |
0.064 |
0.30% |
0.064 |
|
SingleSource/Benchmarks/Shootout/Shootout-ackermann
|
57.30% |
0.020 |
0.031 |
0.000 |
-1.20% |
0.000 |
|
MultiSource/Benchmarks/TSVC/IndirectAddressing-flt/IndirectAddressing-flt
|
56.15% |
17.970 |
28.061 |
0.064 |
0.04% |
0.064 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW4LoopWithReductionTC3
|
55.45% |
15.852 |
24.643 |
0.966 |
-0.22% |
0.966 |
|
SingleSource/Benchmarks/Polybench/linear-algebra/kernels/bicg/bicg
|
55.29% |
0.174 |
0.271 |
0.001 |
9.74% |
0.001 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW4BigLoopTC127
|
54.69% |
2800.223 |
4331.777 |
86.335 |
-1.62% |
86.335 |
|
MicroBenchmarks/ImageProcessing/BilateralFiltering/BilateralFilter.test:BENCHMARK_BILATERAL_FILTER/32/2
|
54.08% |
558.083 |
859.921 |
7.176 |
-2.56% |
7.176 |
|
MicroBenchmarks/ImageProcessing/BilateralFiltering/BilateralFilter.test:BENCHMARK_BILATERAL_FILTER/64/2
|
54.07% |
2387.492 |
3678.514 |
8.106 |
-2.42% |
8.106 |
|
MultiSource/Benchmarks/DOE-ProxyApps-C++/PENNANT/PENNANT
|
53.90% |
4.914 |
7.563 |
0.026 |
-0.08% |
0.026 |
|
MicroBenchmarks/LCALS/SubsetCRawLoops/lcalsCRaw.test:BM_GEN_LIN_RECUR_RAW/171
|
53.76% |
2.155 |
3.314 |
0.111 |
-0.09% |
0.111 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:BENCHMARK_atan_autovec_double_
|
53.75% |
2060.157 |
3167.519 |
47.322 |
-0.33% |
47.322 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW4BigLoopTC127
|
53.61% |
2972.877 |
4566.545 |
131.976 |
-2.54% |
131.976 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:BENCHMARK_atan_novec_double_
|
53.54% |
2060.772 |
3164.049 |
62.017 |
-0.74% |
62.017 |
|
SingleSource/Benchmarks/Misc/flops-4
|
53.09% |
4.405 |
6.743 |
0.029 |
-0.07% |
0.029 |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<8, LessThanZero, First>
|
52.77% |
11861.667 |
18121.535 |
182.380 |
0.04% |
182.380 |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<8, EqZero, First>
|
52.51% |
11861.063 |
18089.895 |
187.757 |
-0.18% |
187.757 |
|
SingleSource/Benchmarks/Misc/fbench
|
52.42% |
6.034 |
9.197 |
0.071 |
0.17% |
0.071 |
|
MicroBenchmarks/ImageProcessing/BilateralFiltering/BilateralFilter.test:BENCHMARK_BILATERAL_FILTER/16/2
|
52.30% |
123.210 |
187.644 |
0.228 |
-2.32% |
0.228 |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<8, GreaterThanZero, First>
|
52.22% |
11863.827 |
18059.535 |
179.092 |
-0.07% |
179.092 |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<4, GreaterThanZero, First>
|
52.05% |
23714.872 |
36058.971 |
194.945 |
-0.10% |
194.945 |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<31, EqZero, First>
|
51.88% |
3213.253 |
4880.313 |
16.385 |
-0.34% |
16.385 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW1LoopWithReductionTC3
|
51.73% |
16.268 |
24.684 |
0.831 |
-0.14% |
0.831 |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<31, GreaterThanZero, First>
|
51.59% |
3213.501 |
4871.360 |
15.822 |
0.21% |
15.822 |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<63, EqZero, First>
|
51.52% |
1592.025 |
2412.269 |
4.243 |
0.05% |
4.243 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW4LoopWithReductionTC3
|
51.14% |
16.270 |
24.590 |
0.748 |
-27.08% |
0.748 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW4BigLoopTC127
|
51.02% |
3117.324 |
4707.918 |
129.877 |
-1.55% |
129.877 |
|
SingleSource/Benchmarks/Misc/mandel
|
50.90% |
3.331 |
5.027 |
0.012 |
-0.33% |
0.012 |
|
MicroBenchmarks/LCALS/SubsetCRawLoops/lcalsCRaw.test:BM_FIRST_SUM_RAW/171
|
50.63% |
0.469 |
0.707 |
0.029 |
-0.26% |
0.029 |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<6, LessThanZero, First>
|
50.38% |
16009.198 |
24074.143 |
261.881 |
0.16% |
261.881 |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<6, GreaterThanZero, First>
|
50.32% |
16011.241 |
24067.736 |
247.278 |
-0.10% |
247.278 |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<63, GreaterThanZero, First>
|
50.17% |
1592.882 |
2391.993 |
10.986 |
0.68% |
10.986 |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<6, EqZero, First>
|
50.06% |
16009.914 |
24024.250 |
137.177 |
-0.06% |
137.177 |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<2, LessThanZero, First>
|
50.00% |
48065.142 |
72098.601 |
476.502 |
-0.41% |
476.502 |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<3, GreaterThanZero, First>
|
49.88% |
32250.954 |
48338.728 |
247.314 |
-0.03% |
247.314 |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<3, EqZero, First>
|
49.78% |
32254.742 |
48311.527 |
193.706 |
-0.13% |
193.706 |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<3, LessThanZero, First>
|
49.75% |
32251.353 |
48297.630 |
324.170 |
0.06% |
324.170 |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<5, EqZero, First>
|
49.54% |
19353.197 |
28940.380 |
113.679 |
0.13% |
113.679 |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<15, GreaterThanZero, First>
|
49.43% |
6454.724 |
9645.334 |
84.959 |
-0.12% |
84.959 |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<15, EqZero, First>
|
49.39% |
6454.709 |
9642.868 |
95.870 |
0.20% |
95.870 |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<7, EqZero, First>
|
49.33% |
13826.647 |
20647.815 |
205.819 |
0.04% |
205.819 |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<5, LessThanZero, First>
|
49.26% |
19354.169 |
28887.732 |
117.792 |
0.10% |
117.792 |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<5, GreaterThanZero, First>
|
49.13% |
19352.671 |
28861.455 |
135.496 |
-0.21% |
135.496 |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<15, LessThanZero, First>
|
49.01% |
6454.684 |
9618.391 |
115.677 |
-0.57% |
115.677 |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<7, GreaterThanZero, First>
|
49.00% |
13824.610 |
20598.273 |
244.458 |
-0.32% |
244.458 |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<7, LessThanZero, First>
|
48.96% |
13824.492 |
20593.364 |
231.485 |
-0.30% |
231.485 |
|
SingleSource/Benchmarks/Misc-C++-EH/spirit
|
48.79% |
19.751 |
29.386 |
0.762 |
-0.05% |
0.762 |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<31, LessThanZero, First>
|
48.35% |
3283.422 |
4870.909 |
17.645 |
0.03% |
17.645 |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<4, LessThanZero, First>
|
48.33% |
24356.915 |
36127.963 |
170.040 |
-0.12% |
170.040 |
|
SingleSource/Benchmarks/Shootout/Shootout-lists
|
48.26% |
11.054 |
16.388 |
0.102 |
1.69% |
0.102 |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<63, LessThanZero, First>
|
48.19% |
1615.276 |
2393.667 |
14.176 |
-0.87% |
14.176 |
|
MultiSource/Benchmarks/TSVC/Recurrences-flt/Recurrences-flt
|
48.00% |
7.652 |
11.325 |
0.026 |
-0.45% |
0.026 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW4LoopTC2
|
47.16% |
16.268 |
23.941 |
0.745 |
-0.32% |
0.745 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW4LoopTC2
|
46.75% |
16.268 |
23.874 |
0.750 |
0.16% |
0.750 |
|
MultiSource/Benchmarks/Prolangs-C++/life/life
|
45.18% |
5.259 |
7.635 |
0.150 |
-0.56% |
0.150 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW4LoopTC2
|
44.98% |
16.893 |
24.492 |
0.779 |
0.27% |
0.779 |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<2, GreaterThanZero, First>
|
44.75% |
49985.848 |
72353.637 |
477.020 |
0.16% |
477.020 |
|
MultiSource/Benchmarks/MiBench/telecomm-FFT/telecomm-fft
|
44.43% |
0.148 |
0.214 |
0.001 |
-0.54% |
0.001 |
|
MultiSource/Benchmarks/Prolangs-C++/simul/simul
|
44.19% |
0.028 |
0.041 |
0.000 |
-0.56% |
0.000 |
|
MultiSource/Benchmarks/DOE-ProxyApps-C/CoMD/CoMD
|
43.80% |
9.999 |
14.379 |
0.030 |
1.67% |
0.030 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW4BigLoopTC63
|
43.80% |
1617.345 |
2325.735 |
53.928 |
-1.01% |
53.928 |
|
MultiSource/Benchmarks/Ptrdist/anagram/anagram
|
43.17% |
3.786 |
5.420 |
0.085 |
-10.28% |
0.085 |
|
MultiSource/Benchmarks/Prolangs-C++/employ/employ
|
43.12% |
0.030 |
0.043 |
0.001 |
-1.13% |
0.001 |
|
MultiSource/Benchmarks/Olden/bh/bh
|
42.97% |
5.260 |
7.520 |
0.088 |
-0.84% |
0.088 |
|
SingleSource/Benchmarks/Shootout/Shootout-sieve
|
42.39% |
13.963 |
19.882 |
0.038 |
0.14% |
0.038 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW4LoopWithReductionTC4
|
42.22% |
17.868 |
25.412 |
0.857 |
0.11% |
0.857 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW1LoopWithReductionTC3
|
41.50% |
17.520 |
24.791 |
0.802 |
0.21% |
0.802 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:BENCHMARK_erff_autovec_float_
|
40.44% |
744.338 |
1045.324 |
12.304 |
-0.59% |
12.304 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:BENCHMARK_erff_novec_float_
|
40.34% |
744.134 |
1044.296 |
12.395 |
-0.71% |
12.395 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW4LoopWithReductionTC4
|
39.90% |
18.145 |
25.386 |
0.799 |
-27.22% |
0.799 |
|
MicroBenchmarks/SLPVectorization/SLPVectorizationBenchmarks.test:benchmark_add_xor_runtime_checks_pass<4, int>
|
39.86% |
16.773 |
23.459 |
0.085 |
0.02% |
0.085 |
|
MicroBenchmarks/SLPVectorization/SLPVectorizationBenchmarks.test:benchmark_add_xor_runtime_checks_fail<4, int>
|
39.56% |
16.833 |
23.492 |
0.098 |
0.54% |
0.098 |
|
MicroBenchmarks/LCALS/SubsetCRawLoops/lcalsCRaw.test:BM_ICCG_RAW/171
|
38.76% |
1.584 |
2.197 |
0.144 |
-0.32% |
0.144 |
|
MultiSource/Benchmarks/TSVC/IndirectAddressing-dbl/IndirectAddressing-dbl
|
38.39% |
19.836 |
27.452 |
0.072 |
-1.99% |
0.072 |
|
MultiSource/Benchmarks/MiBench/automotive-susan/automotive-susan
|
37.82% |
0.288 |
0.398 |
0.001 |
-9.26% |
0.001 |
|
SingleSource/Benchmarks/Misc/flops-1
|
34.90% |
9.000 |
12.141 |
0.029 |
-0.21% |
0.029 |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<3, GreaterThanZero, Mid>
|
34.70% |
37281.748 |
50218.107 |
349.976 |
0.06% |
349.976 |
|
External/SPEC/CFP2017rate/510.parest_r/510.parest_r
|
34.37% |
333.570 |
448.222 |
1.882 |
-1.53% |
1.882 |
|
MultiSource/Benchmarks/McCat/01-qbsort/qbsort
|
34.25% |
0.198 |
0.266 |
0.000 |
-0.09% |
0.000 |
|
MultiSource/Benchmarks/VersaBench/ecbdes/ecbdes
|
34.22% |
5.365 |
7.200 |
0.076 |
7.29% |
0.076 |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<3, EqZero, Mid>
|
34.21% |
37405.777 |
50203.667 |
421.032 |
0.04% |
421.032 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecInLoopWithVW16From_uint32_t_To_uint64_t_
|
34.19% |
24564.068 |
32963.729 |
432.044 |
-26.92% |
432.044 |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<3, LessThanZero, Mid>
|
33.75% |
37625.287 |
50325.392 |
271.360 |
0.06% |
271.360 |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<2, LessThanZero, Mid>
|
33.52% |
56546.080 |
75502.453 |
277.845 |
0.05% |
277.845 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW1LoopWithReductionTC8
|
33.26% |
21.561 |
28.732 |
0.897 |
3.57% |
0.897 |
|
SingleSource/Benchmarks/Misc/flops-2
|
33.01% |
2.792 |
3.713 |
0.013 |
-0.03% |
0.013 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:BENCHMARK_erf_novec_double_
|
32.99% |
897.684 |
1193.817 |
12.428 |
-0.70% |
12.428 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:BENCHMARK_erf_autovec_double_
|
32.52% |
899.581 |
1192.085 |
9.490 |
-0.76% |
9.490 |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<2, GreaterThanZero, Last>
|
32.44% |
56781.287 |
75199.261 |
370.441 |
-0.37% |
370.441 |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<2, LessThanZero, Last>
|
32.32% |
56706.213 |
75034.420 |
449.239 |
0.19% |
449.239 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecInLoopWithVW16From_uint64_t_To_uint8_t_
|
30.66% |
37094.350 |
48468.816 |
276.917 |
-45.03% |
276.917 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW4BigLoopTC63
|
29.32% |
1691.490 |
2187.510 |
57.260 |
-1.86% |
57.260 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW1LoopWithReductionTC7
|
28.75% |
20.648 |
26.584 |
0.929 |
-0.02% |
0.929 |
|
SingleSource/Benchmarks/Dhrystone/dry
|
28.20% |
0.150 |
0.193 |
0.001 |
-0.45% |
0.001 |
|
External/SPEC/CFP2017rate/511.povray_r/511.povray_r
|
27.92% |
33.531 |
42.891 |
0.304 |
-2.62% |
0.304 |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<16, GreaterThanZero, None>
|
27.84% |
8175.671 |
10451.800 |
31.554 |
0.39% |
31.554 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW1LoopWithReductionTC7
|
27.18% |
22.528 |
28.650 |
0.153 |
2.65% |
0.153 |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<16, GreaterThanZero, Mid>
|
26.89% |
8512.213 |
10801.243 |
41.804 |
-0.08% |
41.804 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW4BigLoopWithReductionTC1
|
25.98% |
22.525 |
28.377 |
1.167 |
8.44% |
1.167 |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<16, LessThanZero, None>
|
25.65% |
8336.407 |
10474.561 |
10.474 |
0.26% |
10.474 |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<16, EqZero, None>
|
25.21% |
8321.591 |
10419.351 |
47.860 |
-0.00% |
47.860 |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<16, EqZero, Mid>
|
24.79% |
8640.605 |
10782.436 |
37.213 |
-0.10% |
37.213 |
|
MultiSource/Benchmarks/DOE-ProxyApps-C/miniAMR/miniAMR
|
24.64% |
3.318 |
4.136 |
0.071 |
-1.72% |
0.071 |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<32, EqZero, None>
|
24.64% |
4407.954 |
5494.118 |
20.328 |
-0.48% |
20.328 |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<2, GreaterThanZero, None>
|
24.55% |
61494.423 |
76593.816 |
318.181 |
0.08% |
318.181 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW4BigLoopTC31
|
24.43% |
909.186 |
1131.325 |
18.614 |
-0.71% |
18.614 |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<2, LessThanZero, None>
|
24.22% |
61399.693 |
76270.830 |
506.244 |
0.21% |
506.244 |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<32, EqZero, Mid>
|
23.49% |
4491.063 |
5546.191 |
19.912 |
0.52% |
19.912 |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<32, GreaterThanZero, None>
|
23.18% |
4495.548 |
5537.762 |
14.330 |
0.01% |
14.330 |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<3, EqZero, Last>
|
22.94% |
42075.446 |
51728.720 |
252.757 |
0.09% |
252.757 |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<16, LessThanZero, Mid>
|
22.67% |
8816.268 |
10814.557 |
22.873 |
0.10% |
22.873 |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<16, EqZero, First>
|
22.40% |
8335.815 |
10202.861 |
20.626 |
0.25% |
20.626 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW4LoopTC3
|
22.22% |
20.647 |
25.236 |
0.777 |
0.67% |
0.777 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW4LoopTC3
|
22.11% |
20.647 |
25.213 |
0.786 |
0.71% |
0.786 |
|
SingleSource/Benchmarks/Shootout-C++/EH/Shootout-C++-except
|
21.91% |
1.528 |
1.862 |
0.007 |
-0.44% |
0.007 |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<4, GreaterThanZero, Mid>
|
21.64% |
31811.596 |
38695.458 |
240.354 |
-0.15% |
240.354 |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<3, GreaterThanZero, Last>
|
21.63% |
42483.727 |
51674.460 |
291.318 |
0.20% |
291.318 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW4LoopTC3
|
21.55% |
21.273 |
25.857 |
0.779 |
0.21% |
0.779 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW1LoopWithReductionTC8
|
21.53% |
22.525 |
27.375 |
0.948 |
0.05% |
0.948 |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<5, LessThanZero, Mid>
|
21.42% |
25621.227 |
31109.422 |
113.072 |
-0.09% |
113.072 |
|
MicroBenchmarks/LCALS/SubsetCRawLoops/lcalsCRaw.test:BM_GEN_LIN_RECUR_RAW/5001
|
21.40% |
79.618 |
96.653 |
3.331 |
-0.11% |
3.331 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW4LoopWithReductionTC7
|
21.33% |
23.161 |
28.100 |
1.114 |
0.64% |
1.114 |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<4, LessThanZero, Mid>
|
21.22% |
32012.693 |
38806.213 |
225.367 |
-0.02% |
225.367 |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<3, LessThanZero, Last>
|
21.18% |
42707.892 |
51753.448 |
219.858 |
-0.15% |
219.858 |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<16, GreaterThanZero, First>
|
21.16% |
8336.386 |
10100.745 |
49.039 |
-0.18% |
49.039 |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<32, LessThanZero, Mid>
|
20.92% |
4530.375 |
5478.082 |
18.373 |
0.50% |
18.373 |
|
MultiSource/Benchmarks/Ptrdist/bc/bc
|
20.87% |
1.578 |
1.908 |
0.013 |
-1.31% |
0.013 |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<64, EqZero, First>
|
20.80% |
2128.362 |
2571.142 |
1.718 |
-0.01% |
1.718 |
|
MultiSource/Benchmarks/MallocBench/espresso/espresso
|
20.53% |
1.295 |
1.561 |
0.003 |
-0.56% |
0.003 |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<5, GreaterThanZero, Mid>
|
20.51% |
25693.123 |
30962.023 |
190.374 |
-0.10% |
190.374 |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<32, GreaterThanZero, First>
|
20.30% |
4251.338 |
5114.430 |
1.247 |
0.02% |
1.247 |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<32, LessThanZero, First>
|
20.17% |
4251.470 |
5108.781 |
13.676 |
0.11% |
13.676 |
|
MultiSource/Applications/sqlite3/sqlite3
|
20.02% |
12.973 |
15.571 |
0.214 |
-0.67% |
0.214 |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<5, EqZero, Mid>
|
20.01% |
25848.182 |
31020.251 |
183.002 |
-0.02% |
183.002 |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<32, LessThanZero, None>
|
19.92% |
4599.851 |
5516.057 |
19.435 |
-0.22% |
19.435 |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<64, LessThanZero, First>
|
19.77% |
2128.181 |
2548.975 |
8.213 |
0.17% |
8.213 |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<32, EqZero, First>
|
19.76% |
4251.514 |
5091.745 |
18.324 |
0.27% |
18.324 |
|
MicroBenchmarks/LCALS/SubsetCRawLoops/lcalsCRaw.test:BM_TRIDIAG_ELIM_RAW/171
|
18.82% |
0.967 |
1.149 |
0.054 |
-0.38% |
0.054 |
|
SingleSource/Benchmarks/Shootout-C++/Shootout-C++-moments
|
18.29% |
0.343 |
0.406 |
0.004 |
0.92% |
0.004 |
|
MicroBenchmarks/LCALS/SubsetCRawLoops/lcalsCRaw.test:BM_INT_PREDICT_RAW/171
|
18.21% |
6.917 |
8.176 |
0.327 |
0.08% |
0.327 |
|
MicroBenchmarks/LCALS/SubsetCRawLoops/lcalsCRaw.test:BM_TRIDIAG_ELIM_RAW/44217
|
18.20% |
252.366 |
298.308 |
14.065 |
-0.16% |
14.065 |
|
MicroBenchmarks/LCALS/SubsetCRawLoops/lcalsCRaw.test:BM_TRIDIAG_ELIM_RAW/5001
|
18.17% |
28.474 |
33.648 |
1.649 |
-0.15% |
1.649 |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<64, GreaterThanZero, First>
|
18.03% |
2165.771 |
2556.178 |
3.943 |
-0.14% |
3.943 |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<3, EqZero, None>
|
18.02% |
44466.656 |
52477.834 |
484.094 |
0.00% |
484.094 |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<32, GreaterThanZero, Mid>
|
17.87% |
4652.530 |
5484.122 |
20.625 |
0.44% |
20.625 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW4LoopWithReductionTC7
|
17.38% |
23.776 |
27.909 |
1.191 |
-25.03% |
1.191 |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<3, LessThanZero, None>
|
16.35% |
45251.516 |
52651.285 |
266.433 |
-0.07% |
266.433 |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<3, GreaterThanZero, None>
|
16.02% |
45226.113 |
52471.708 |
356.874 |
-0.17% |
356.874 |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<16, LessThanZero, First>
|
15.86% |
8762.519 |
10152.449 |
31.108 |
-0.06% |
31.108 |
|
MultiSource/Benchmarks/MiBench/automotive-basicmath/automotive-basicmath
|
15.77% |
1.242 |
1.438 |
0.008 |
-0.33% |
0.008 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW1BigLoopWithReductionTC1
|
15.64% |
20.022 |
23.154 |
0.769 |
-0.25% |
0.769 |
|
SingleSource/Benchmarks/Misc/richards_benchmark
|
15.64% |
2.001 |
2.313 |
0.005 |
-1.11% |
0.005 |
|
External/SPEC/CINT2017rate/531.deepsjeng_r/531.deepsjeng_r
|
15.11% |
279.708 |
321.974 |
1.454 |
-0.27% |
1.454 |
|
MultiSource/Benchmarks/DOE-ProxyApps-C/RSBench/rsbench
|
14.35% |
2.221 |
2.540 |
0.010 |
-1.12% |
0.010 |
|
SingleSource/Benchmarks/Shootout-C++/Shootout-C++-ackermann
|
14.17% |
4.183 |
4.775 |
0.012 |
-0.19% |
0.012 |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<6, LessThanZero, Mid>
|
13.90% |
23477.431 |
26741.257 |
280.460 |
0.03% |
280.460 |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<7, GreaterThanZero, Mid>
|
13.86% |
20142.134 |
22934.298 |
195.043 |
-0.03% |
195.043 |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<6, GreaterThanZero, Mid>
|
13.77% |
23481.511 |
26715.338 |
254.879 |
-0.12% |
254.879 |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<6, EqZero, Mid>
|
13.69% |
23478.009 |
26691.127 |
128.688 |
0.05% |
128.688 |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<4, GreaterThanZero, Last>
|
13.61% |
35252.476 |
40051.048 |
249.741 |
0.02% |
249.741 |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<4, LessThanZero, Last>
|
13.59% |
35251.066 |
40042.790 |
224.907 |
-0.19% |
224.907 |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<7, EqZero, Mid>
|
13.54% |
20140.903 |
22867.315 |
217.166 |
-0.38% |
217.166 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW4LoopWithReductionTC8
|
13.48% |
25.402 |
28.827 |
1.284 |
-0.47% |
1.284 |
|
External/SPEC/CFP2017rate/544.nab_r/544.nab_r
|
13.36% |
479.793 |
543.913 |
1.956 |
1.62% |
1.956 |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<7, LessThanZero, Mid>
|
13.21% |
20236.870 |
22909.470 |
225.209 |
0.05% |
225.209 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecWithAddInLoopWithVW16From_uint64_t_To_uint32_t_
|
12.98% |
38448.267 |
43439.555 |
559.360 |
-42.74% |
559.360 |
|
MultiSource/Benchmarks/FreeBench/fourinarow/fourinarow
|
12.70% |
0.652 |
0.735 |
0.001 |
-7.24% |
0.001 |
|
MultiSource/Benchmarks/TSVC/Reductions-flt/Reductions-flt
|
12.61% |
10.840 |
12.207 |
0.033 |
-0.22% |
0.033 |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<4, GreaterThanZero, None>
|
11.50% |
36522.989 |
40724.839 |
231.884 |
0.05% |
231.884 |
|
SingleSource/Benchmarks/BenchmarkGame/fannkuch
|
11.33% |
5.399 |
6.011 |
0.034 |
-1.77% |
0.034 |
|
SingleSource/Benchmarks/Misc/pi
|
11.24% |
1.782 |
1.982 |
0.004 |
0.43% |
0.004 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW1BigLoopWithReductionTC1
|
11.22% |
22.525 |
25.051 |
0.916 |
-0.20% |
0.916 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW4BigLoopWithReductionTC1
|
10.58% |
22.525 |
24.909 |
0.884 |
0.20% |
0.884 |
|
MultiSource/Applications/aha/aha
|
10.58% |
4.626 |
5.116 |
0.015 |
-0.01% |
0.015 |
|
External/SPEC/CINT2017rate/541.leela_r/541.leela_r
|
10.42% |
231.003 |
255.069 |
0.859 |
-0.46% |
0.859 |
|
MultiSource/Applications/lua/lua
|
9.98% |
81.680 |
89.832 |
0.407 |
0.34% |
0.407 |
|
MicroBenchmarks/Builtins/Int128/Builtins.test:BM_DivideIntrinsic128SmallDivisor<__int128_t>
|
9.91% |
75.931 |
83.459 |
0.292 |
-0.25% |
0.292 |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<4, LessThanZero, None>
|
9.67% |
37236.789 |
40837.369 |
233.237 |
0.02% |
233.237 |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<64, GreaterThanZero, Mid>
|
9.42% |
2728.306 |
2985.393 |
6.710 |
0.07% |
6.710 |
|
SingleSource/Benchmarks/Polybench/linear-algebra/blas/gemver/gemver
|
8.22% |
0.499 |
0.540 |
0.003 |
2.66% |
0.003 |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<8, GreaterThanZero, Mid>
|
8.01% |
19231.074 |
20770.727 |
202.953 |
0.02% |
202.953 |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<8, LessThanZero, Mid>
|
7.92% |
19241.577 |
20765.532 |
176.007 |
-0.02% |
176.007 |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<64, EqZero, Mid>
|
7.90% |
2765.597 |
2984.137 |
4.564 |
-0.01% |
4.564 |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<64, LessThanZero, Mid>
|
7.80% |
2768.933 |
2984.806 |
4.400 |
1.05% |
4.400 |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<64, GreaterThanZero, None>
|
7.40% |
2969.257 |
3189.128 |
3.929 |
-0.27% |
3.929 |
|
SingleSource/Benchmarks/Misc-C++/Large/sphereflake
|
7.36% |
20.022 |
21.497 |
0.046 |
-1.17% |
0.046 |
|
SingleSource/Benchmarks/Shootout-C++/Shootout-C++-lists
|
7.35% |
21.154 |
22.707 |
0.109 |
-0.14% |
0.109 |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<5, LessThanZero, Last>
|
6.75% |
31140.637 |
33243.134 |
147.429 |
0.18% |
147.429 |
|
MultiSource/Applications/viterbi/viterbi
|
6.69% |
12.263 |
13.084 |
0.146 |
-1.16% |
0.146 |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<5, EqZero, Last>
|
6.47% |
31141.072 |
33156.884 |
155.408 |
-0.02% |
155.408 |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<64, EqZero, None>
|
6.42% |
2983.928 |
3175.591 |
8.453 |
-0.30% |
8.453 |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<5, GreaterThanZero, Last>
|
6.42% |
31140.834 |
33139.438 |
171.784 |
-0.23% |
171.784 |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<8, EqZero, Mid>
|
6.20% |
19519.382 |
20729.108 |
208.106 |
-0.11% |
208.106 |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<5, GreaterThanZero, None>
|
5.93% |
31971.434 |
33867.040 |
132.879 |
-0.10% |
132.879 |
|
MultiSource/Benchmarks/Olden/em3d/em3d
|
5.79% |
8.361 |
8.846 |
0.015 |
0.03% |
0.015 |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<5, EqZero, None>
|
5.73% |
32010.276 |
33844.226 |
162.130 |
-0.03% |
162.130 |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<64, LessThanZero, None>
|
5.59% |
3008.574 |
3176.686 |
7.017 |
0.21% |
7.017 |
|
MultiSource/Benchmarks/DOE-ProxyApps-C++/CLAMR/CLAMR
|
5.52% |
12.390 |
13.074 |
0.036 |
-1.14% |
0.036 |
|
MultiSource/Applications/JM/ldecod/ldecod
|
5.47% |
0.212 |
0.223 |
0.002 |
0.26% |
0.002 |
|
MicroBenchmarks/Builtins/Int128/Builtins.test:BM_DivideIntrinsic128UniformDivisor<__int128_t>
|
4.61% |
65.970 |
69.012 |
1.165 |
0.10% |
1.165 |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<5, LessThanZero, None>
|
4.34% |
32285.569 |
33687.866 |
348.750 |
-0.44% |
348.750 |
|
SingleSource/Benchmarks/Misc/ReedSolomon
|
4.06% |
20.846 |
21.692 |
0.056 |
0.51% |
0.056 |
|
MultiSource/Benchmarks/MiBench/telecomm-CRC32/telecomm-CRC32
|
3.92% |
0.631 |
0.656 |
0.002 |
0.13% |
0.002 |
|
MicroBenchmarks/Builtins/Int128/Builtins.test:BM_RemainderIntrinsic128SmallDivisor<__uint128_t>
|
3.55% |
71.836 |
74.389 |
0.237 |
0.31% |
0.237 |
|
MultiSource/Benchmarks/mafft/pairlocalalign
|
3.10% |
93.075 |
95.962 |
0.859 |
0.27% |
0.859 |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<32, GreaterThanZero, Last>
|
3.06% |
6855.346 |
7064.813 |
25.393 |
-0.60% |
25.393 |
|
MultiSource/Benchmarks/TSVC/Recurrences-dbl/Recurrences-dbl
|
2.77% |
10.376 |
10.663 |
0.016 |
1.25% |
0.016 |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<32, EqZero, Last>
|
2.63% |
6905.605 |
7087.273 |
14.137 |
-0.28% |
14.137 |
|
MultiSource/Benchmarks/Ptrdist/yacr2/yacr2
|
1.68% |
2.222 |
2.260 |
0.004 |
-1.44% |
0.004 |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<16, GreaterThanZero, Last>
|
1.58% |
12984.081 |
13188.639 |
49.094 |
0.05% |
49.094 |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<16, LessThanZero, Last>
|
1.50% |
13000.329 |
13195.637 |
35.870 |
0.02% |
35.870 |