|
MicroBenchmarks/LCALS/SubsetCRawLoops/lcalsCRaw.test:BM_HYDRO_2D_RAW/44217
|
-70.30% |
105029.018 |
31197.401 |
- |
0.00% |
- |
|
MicroBenchmarks/LCALS/SubsetCRawLoops/lcalsCRaw.test:BM_HYDRO_2D_RAW/5001
|
-67.84% |
10789.124 |
3469.796 |
- |
0.00% |
- |
|
MicroBenchmarks/LCALS/SubsetCRawLoops/lcalsCRaw.test:BM_PIC_1D_RAW/44217
|
-60.42% |
15160.259 |
6001.153 |
- |
0.00% |
- |
|
MicroBenchmarks/LCALS/SubsetCLambdaLoops/lcalsCLambda.test:BM_INT_PREDICT_LAMBDA/44217
|
-57.58% |
19660.889 |
8339.562 |
- |
0.00% |
- |
|
MicroBenchmarks/LCALS/SubsetCRawLoops/lcalsCRaw.test:BM_INT_PREDICT_RAW/44217
|
-57.53% |
19675.317 |
8355.328 |
- |
0.00% |
- |
|
MicroBenchmarks/LCALS/SubsetCRawLoops/lcalsCRaw.test:BM_INT_PREDICT_RAW/5001
|
-54.88% |
1942.895 |
876.581 |
- |
0.00% |
- |
|
MicroBenchmarks/LCALS/SubsetCLambdaLoops/lcalsCLambda.test:BM_INT_PREDICT_LAMBDA/5001
|
-54.61% |
2025.294 |
919.314 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecInLoopWithVW16From_uint64_t_To_uint32_t_
|
-50.26% |
38182.912 |
18990.380 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecInLoopWithVW16From_uint64_t_To_uint8_t_
|
-48.72% |
37094.350 |
19022.232 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecInLoopWithVW16From_uint64_t_To_uint16_t_
|
-47.89% |
39588.288 |
20629.776 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW4BigLoopTC128
|
-46.70% |
1808.861 |
964.100 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW4BigLoopTC64
|
-46.19% |
920.033 |
495.090 |
- |
0.00% |
- |
|
MicroBenchmarks/LCALS/SubsetCRawLoops/lcalsCRaw.test:BM_DIFF_PREDICT_RAW/44217
|
-42.86% |
25399.187 |
14512.682 |
- |
0.00% |
- |
|
MicroBenchmarks/LCALS/SubsetCLambdaLoops/lcalsCLambda.test:BM_DIFF_PREDICT_LAMBDA/44217
|
-42.23% |
25144.537 |
14526.194 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW4BigLoopTC32
|
-41.75% |
458.733 |
267.203 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecWithAddInLoopWithVW16From_uint64_t_To_uint32_t_
|
-41.47% |
38448.267 |
22504.374 |
- |
0.00% |
- |
|
SingleSource/Benchmarks/Adobe-C++/loop_unroll
|
-40.26% |
4.122 |
2.463 |
- |
0.00% |
- |
|
MicroBenchmarks/LCALS/SubsetCRawLoops/lcalsCRaw.test:BM_FIRST_DIFF_RAW/44217
|
-39.96% |
161.562 |
96.995 |
- |
0.00% |
- |
|
MicroBenchmarks/LCALS/SubsetCRawLoops/lcalsCRaw.test:BM_DIFF_PREDICT_RAW/5001
|
-39.90% |
2685.832 |
1614.084 |
- |
0.00% |
- |
|
MicroBenchmarks/LCALS/SubsetCLambdaLoops/lcalsCLambda.test:BM_DIFF_PREDICT_LAMBDA/5001
|
-39.84% |
2652.634 |
1595.945 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW4BigLoopTC16
|
-39.65% |
232.290 |
140.188 |
- |
0.00% |
- |
|
MicroBenchmarks/LCALS/SubsetCLambdaLoops/lcalsCLambda.test:BM_FIRST_DIFF_LAMBDA/44217
|
-39.19% |
159.393 |
96.930 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecWithAddInLoopWithVW16From_uint64_t_To_uint8_t_
|
-33.06% |
30357.854 |
20320.632 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecWithAddInLoopWithVW16From_uint64_t_To_uint16_t_
|
-32.71% |
29637.872 |
19942.718 |
- |
0.00% |
- |
|
MicroBenchmarks/LCALS/SubsetCLambdaLoops/lcalsCLambda.test:BM_PIC_2D_LAMBDA/5001
|
-30.81% |
1305.946 |
903.637 |
- |
0.00% |
- |
|
MicroBenchmarks/LCALS/SubsetCLambdaLoops/lcalsCLambda.test:BM_PIC_2D_LAMBDA/44217
|
-29.48% |
12727.964 |
8975.357 |
- |
0.00% |
- |
|
MicroBenchmarks/LCALS/SubsetCRawLoops/lcalsCRaw.test:BM_PIC_2D_RAW/44217
|
-28.34% |
12578.137 |
9013.505 |
- |
0.00% |
- |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<4, EqZero, None>
|
-27.99% |
16025.244 |
11540.078 |
- |
0.00% |
- |
|
MicroBenchmarks/LCALS/SubsetCLambdaLoops/lcalsCLambda.test:BM_FIRST_SUM_LAMBDA/44217
|
-27.20% |
182.840 |
133.110 |
- |
0.00% |
- |
|
MicroBenchmarks/LCALS/SubsetCRawLoops/lcalsCRaw.test:BM_PIC_2D_RAW/5001
|
-26.35% |
1201.801 |
885.115 |
- |
0.00% |
- |
|
MicroBenchmarks/LCALS/SubsetCRawLoops/lcalsCRaw.test:BM_FIRST_SUM_RAW/44217
|
-23.23% |
172.218 |
132.219 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecInLoopWithVW16From_uint32_t_To_uint16_t_
|
-22.69% |
11626.925 |
8989.037 |
- |
0.00% |
- |
|
MultiSource/Benchmarks/Fhourstones/fhourstones
|
-21.64% |
10.882 |
8.527 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecWithAddInLoopWithVW8From_uint64_t_To_uint8_t_
|
-20.69% |
26618.536 |
21111.229 |
- |
0.00% |
- |
|
MultiSource/Benchmarks/Trimaran/enc-pc1/enc-pc1
|
-20.19% |
1.105 |
0.882 |
- |
0.00% |
- |
|
MicroBenchmarks/LCALS/SubsetBRawLoops/lcalsBRaw.test:BM_INIT3_RAW/5001
|
-19.67% |
41.551 |
33.376 |
- |
0.00% |
- |
|
MicroBenchmarks/ImageProcessing/Interpolation/Interpolation.test:BENCHMARK_BICUBIC_INTERPOLATION/64
|
-19.31% |
6267.862 |
5057.401 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW4BigLoopTC8
|
-19.30% |
179.690 |
145.006 |
- |
0.00% |
- |
|
MicroBenchmarks/ImageProcessing/Interpolation/Interpolation.test:BENCHMARK_BICUBIC_INTERPOLATION/16
|
-19.27% |
283.748 |
229.084 |
- |
0.00% |
- |
|
MicroBenchmarks/ImageProcessing/Interpolation/Interpolation.test:BENCHMARK_BICUBIC_INTERPOLATION/32
|
-19.26% |
1416.071 |
1143.266 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW4BigLoopTC127
|
-19.20% |
2800.223 |
2262.622 |
- |
0.00% |
- |
|
MicroBenchmarks/ImageProcessing/Interpolation/Interpolation.test:BENCHMARK_BICUBIC_INTERPOLATION/128
|
-19.19% |
26612.856 |
21507.066 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecInLoopWithVW16From_uint16_t_To_uint8_t_
|
-19.18% |
3810.779 |
3079.920 |
- |
0.00% |
- |
|
MicroBenchmarks/ImageProcessing/Interpolation/Interpolation.test:BENCHMARK_BICUBIC_INTERPOLATION/256
|
-19.12% |
108754.750 |
87963.823 |
- |
0.00% |
- |
|
MicroBenchmarks/LCALS/SubsetARawLoops/lcalsARaw.test:BM_PRESSURE_CALC_RAW/44217
|
-19.04% |
519.241 |
420.384 |
- |
0.00% |
- |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<2, EqZero, None>
|
-18.72% |
20510.022 |
16670.168 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecWithAddInLoopWithVW8From_uint64_t_To_uint16_t_
|
-18.48% |
25456.784 |
20751.691 |
- |
0.00% |
- |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<4, EqZero, Mid>
|
-18.17% |
14102.946 |
11540.302 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW1BigLoopWithReductionTC128
|
-18.07% |
1336.804 |
1095.242 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW1BigLoopWithReductionTC64
|
-17.93% |
675.889 |
554.715 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW1BigLoopWithReductionTC127
|
-17.74% |
1329.952 |
1094.017 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW1BigLoopWithReductionTC32
|
-17.72% |
345.418 |
284.227 |
- |
0.00% |
- |
|
SingleSource/Benchmarks/Misc/himenobmtxpa
|
-17.64% |
10.199 |
8.400 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW1BigLoopWithReductionTC16
|
-17.31% |
180.209 |
149.009 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW1BigLoopWithReductionTC63
|
-17.29% |
668.829 |
553.171 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecInLoopWithVW8From_uint32_t_To_uint64_t_
|
-16.73% |
19625.761 |
16341.574 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecWithAddInLoopWithVW16From_uint32_t_To_uint16_t_
|
-16.51% |
13402.118 |
11188.815 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW1BigLoopWithReductionTC31
|
-16.45% |
338.536 |
282.854 |
- |
0.00% |
- |
|
MicroBenchmarks/ImageProcessing/Interpolation/Interpolation.test:BENCHMARK_BILINEAR_INTERPOLATION/128
|
-16.42% |
8043.830 |
6722.657 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW1BigLoopWithReductionTC8
|
-16.28% |
97.617 |
81.730 |
- |
0.00% |
- |
|
MicroBenchmarks/ImageProcessing/Interpolation/Interpolation.test:BENCHMARK_BILINEAR_INTERPOLATION/256
|
-16.24% |
32057.543 |
26851.285 |
- |
0.00% |
- |
|
MicroBenchmarks/LCALS/SubsetALambdaLoops/lcalsALambda.test:BM_PRESSURE_CALC_LAMBDA/44217
|
-16.09% |
509.043 |
427.136 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecInLoopWithVW16From_uint32_t_To_uint8_t_
|
-16.05% |
11194.264 |
9397.592 |
- |
0.00% |
- |
|
MicroBenchmarks/ImageProcessing/Interpolation/Interpolation.test:BENCHMARK_BILINEAR_INTERPOLATION/32
|
-16.04% |
482.548 |
405.141 |
- |
0.00% |
- |
|
MicroBenchmarks/ImageProcessing/Interpolation/Interpolation.test:BENCHMARK_BILINEAR_INTERPOLATION/64
|
-15.97% |
1954.856 |
1642.673 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecWithAddInLoopWithVW8From_uint64_t_To_uint32_t_
|
-15.88% |
26121.349 |
21972.179 |
- |
0.00% |
- |
|
MicroBenchmarks/ImageProcessing/Interpolation/Interpolation.test:BENCHMARK_BILINEAR_INTERPOLATION/16
|
-15.71% |
117.697 |
99.208 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW4BigLoopTC128
|
-15.58% |
2541.619 |
2145.574 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecInLoopWithVW8From_uint64_t_To_uint16_t_
|
-15.45% |
21956.060 |
18564.179 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecInLoopWithVW16From_uint16_t_To_uint32_t_
|
-15.45% |
7104.559 |
6007.252 |
- |
0.00% |
- |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<2, EqZero, Mid>
|
-15.39% |
16671.027 |
14105.094 |
- |
0.00% |
- |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<2, EqZero, First>
|
-15.38% |
16666.378 |
14103.399 |
- |
0.00% |
- |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<2, EqZero, Last>
|
-15.38% |
16666.234 |
14103.665 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW1BigLoopWithReductionTC4
|
-15.37% |
56.314 |
47.659 |
- |
0.00% |
- |
|
SingleSource/Benchmarks/Polybench/linear-algebra/kernels/mvt/mvt
|
-15.25% |
0.881 |
0.747 |
- |
0.00% |
- |
|
MultiSource/Benchmarks/VersaBench/dbms/dbms
|
-15.24% |
10.335 |
8.760 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecInLoopWithVW16From_uint32_t_To_uint64_t_
|
-15.23% |
24564.068 |
20823.220 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW1BigLoopWithReductionTC15
|
-14.82% |
173.356 |
147.670 |
- |
0.00% |
- |
|
MicroBenchmarks/LCALS/SubsetCRawLoops/lcalsCRaw.test:BM_FIRST_SUM_RAW/5001
|
-14.69% |
20.824 |
17.764 |
- |
0.00% |
- |
|
External/SPEC/CFP2017rate/508.namd_r/508.namd_r
|
-14.64% |
221.291 |
188.899 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecInLoopWithVW8From_uint64_t_To_uint8_t_
|
-14.48% |
22921.174 |
19601.480 |
- |
0.00% |
- |
|
MicroBenchmarks/LCALS/SubsetALambdaLoops/lcalsALambda.test:BM_PRESSURE_CALC_LAMBDA/5001
|
-14.39% |
48.554 |
41.565 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForBigLoopWithReductionAutoVecTC127
|
-14.09% |
299.154 |
257.018 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForBigLoopWithReductionAutoVecTC128
|
-14.03% |
299.144 |
257.181 |
- |
0.00% |
- |
|
SingleSource/Benchmarks/Misc-C++/stepanov_container
|
-14.00% |
29.467 |
25.342 |
- |
0.00% |
- |
|
MultiSource/Benchmarks/Olden/mst/mst
|
-13.74% |
0.890 |
0.768 |
- |
0.00% |
- |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<4, EqZero, Last>
|
-13.63% |
14103.393 |
12180.789 |
- |
0.00% |
- |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<4, EqZero, First>
|
-13.63% |
14102.713 |
12180.987 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW4BigLoopTC64
|
-13.57% |
1258.359 |
1087.656 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecInLoopWithVW8From_uint32_t_To_uint8_t_
|
-13.36% |
11255.297 |
9752.036 |
- |
0.00% |
- |
|
MultiSource/Benchmarks/McCat/12-IOtest/iotest
|
-13.29% |
1.883 |
1.632 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecInLoopWithVW8From_uint16_t_To_uint32_t_
|
-13.17% |
7455.977 |
6474.142 |
- |
0.00% |
- |
|
SingleSource/Benchmarks/Shootout/Shootout-hash
|
-13.06% |
43.072 |
37.446 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecInLoopWithVW16From_uint8_t_To_uint16_t_
|
-13.05% |
3757.235 |
3266.842 |
- |
0.00% |
- |
|
MicroBenchmarks/LCALS/SubsetCLambdaLoops/lcalsCLambda.test:BM_FIRST_DIFF_LAMBDA/5001
|
-12.81% |
12.953 |
11.294 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW1BigLoopWithReductionTC2
|
-12.72% |
34.412 |
30.035 |
- |
0.00% |
- |
|
SingleSource/Benchmarks/BenchmarkGame/nsieve-bits
|
-12.61% |
10.907 |
9.531 |
- |
0.00% |
- |
|
SingleSource/Benchmarks/Polybench/datamining/correlation/correlation
|
-12.49% |
109.559 |
95.870 |
- |
0.00% |
- |
|
SingleSource/Benchmarks/Polybench/medley/nussinov/nussinov
|
-12.47% |
324.080 |
283.666 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW4LoopTC4
|
-12.43% |
17.521 |
15.343 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecInLoopWithVW16From_uint16_t_To_uint64_t_
|
-12.38% |
18444.083 |
16160.400 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW4BigLoopTC127
|
-12.28% |
2972.877 |
2607.685 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW4LoopWithReductionTC8
|
-12.19% |
25.654 |
22.527 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW1LoopWithReductionTC8
|
-12.19% |
25.653 |
22.527 |
- |
0.00% |
- |
|
SingleSource/Benchmarks/Shootout/Shootout-heapsort
|
-12.09% |
24.067 |
21.157 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW1BigLoopWithReductionTC7
|
-11.71% |
90.720 |
80.094 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW4BigLoopTC32
|
-11.46% |
628.757 |
556.691 |
- |
0.00% |
- |
|
SingleSource/Benchmarks/Shootout-C++/Shootout-C++-heapsort
|
-11.33% |
23.768 |
21.074 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW1LoopWithReductionTC4
|
-11.11% |
22.526 |
20.022 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW4LoopWithReductionTC4
|
-11.11% |
22.526 |
20.024 |
- |
0.00% |
- |
|
MicroBenchmarks/ImageProcessing/Blur/blur.test:BENCHMARK_boxBlurKernel/128
|
-11.04% |
466.202 |
414.716 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW4LoopTC7
|
-10.91% |
34.413 |
30.659 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW4LoopTC8
|
-10.90% |
23.151 |
20.628 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecInLoopWithVW8From_uint16_t_To_uint64_t_
|
-10.83% |
13508.214 |
12045.107 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW4LoopWithReductionTC7
|
-10.76% |
26.646 |
23.778 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopEpilogueVectorizationBenchmarks.test:benchAutoVec<uint8_t>/127
|
-10.64% |
58.822 |
52.560 |
- |
0.00% |
- |
|
MicroBenchmarks/LCALS/SubsetCRawLoops/lcalsCRaw.test:BM_HYDRO_2D_RAW/171
|
-10.58% |
91.312 |
81.652 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecWithAddInLoopWithVW8From_uint16_t_To_uint64_t_
|
-10.53% |
25535.265 |
22846.808 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW4LoopTC8
|
-10.51% |
23.776 |
21.276 |
- |
0.00% |
- |
|
SingleSource/Benchmarks/Polybench/linear-algebra/blas/gemver/gemver
|
-10.43% |
0.499 |
0.447 |
- |
0.00% |
- |
|
MicroBenchmarks/LCALS/SubsetCLambdaLoops/lcalsCLambda.test:BM_FIRST_SUM_LAMBDA/5001
|
-10.42% |
20.266 |
18.153 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForBigLoopWithReductionAutoVecTC64
|
-10.41% |
156.062 |
139.812 |
- |
0.00% |
- |
|
MultiSource/Benchmarks/TSVC/Packing-flt/Packing-flt
|
-10.40% |
35.898 |
32.164 |
- |
0.00% |
- |
|
MultiSource/Benchmarks/llubenchmark/llu
|
-10.27% |
60.093 |
53.924 |
- |
0.00% |
- |
|
MicroBenchmarks/LCALS/SubsetCLambdaLoops/lcalsCLambda.test:BM_ADI_LAMBDA/5001
|
-10.14% |
2434.327 |
2187.530 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecWithAddInLoopWithVW16From_uint8_t_To_uint32_t_
|
-10.07% |
12989.769 |
11681.254 |
- |
0.00% |
- |
|
MultiSource/Benchmarks/McCat/17-bintr/bintr
|
-10.03% |
1.264 |
1.137 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForBigLoopWithReductionAutoVecTC63
|
-10.02% |
156.456 |
140.783 |
- |
0.00% |
- |
|
MultiSource/Benchmarks/Fhourstones-3.1/fhourstones3.1
|
-9.94% |
3.966 |
3.572 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW4LoopWithReductionTC2
|
-9.92% |
14.588 |
13.140 |
- |
0.00% |
- |
|
MultiSource/Applications/minisat/minisat
|
-9.91% |
63.672 |
57.360 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW4LoopWithReductionTC16
|
-9.80% |
31.912 |
28.783 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW1LoopWithReductionTC16
|
-9.80% |
31.909 |
28.782 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW4LoopWithReductionTC15
|
-9.66% |
32.552 |
29.409 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW1LoopWithReductionTC15
|
-9.61% |
32.535 |
29.409 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW1LoopWithReductionTC7
|
-9.52% |
26.279 |
23.777 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecInLoopWithVW8From_uint64_t_To_uint32_t_
|
-9.43% |
20360.427 |
18439.500 |
- |
0.00% |
- |
|
MultiSource/Benchmarks/FreeBench/pifft/pifft
|
-9.41% |
0.362 |
0.328 |
- |
0.00% |
- |
|
MultiSource/Benchmarks/Ptrdist/ft/ft
|
-9.28% |
3.970 |
3.601 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecInLoopWithVW16From_uint8_t_To_uint32_t_
|
-9.27% |
6626.974 |
6012.631 |
- |
0.00% |
- |
|
MultiSource/Benchmarks/SciMark2-C/scimark2
|
-9.17% |
108.017 |
98.116 |
- |
0.00% |
- |
|
SingleSource/Benchmarks/Polybench/linear-algebra/solvers/ludcmp/ludcmp
|
-9.12% |
1322.060 |
1201.520 |
- |
0.00% |
- |
|
MultiSource/Benchmarks/McCat/09-vor/vor
|
-9.10% |
0.643 |
0.585 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecWithAddInLoopWithVW16From_uint32_t_To_uint8_t_
|
-9.05% |
13256.415 |
12056.599 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecInLoopFrom_uint32_t_To_uint8_t_
|
-9.03% |
8357.009 |
7601.993 |
- |
0.00% |
- |
|
MultiSource/Benchmarks/Olden/bisort/bisort
|
-8.97% |
3.595 |
3.273 |
- |
0.00% |
- |
|
MicroBenchmarks/SLPVectorization/SLPVectorizationBenchmarks.test:benchmark_add_xor_runtime_checks_fail<4, int>
|
-8.93% |
16.833 |
15.329 |
- |
0.00% |
- |
|
SingleSource/Benchmarks/Shootout-C++/Shootout-C++-hash
|
-8.89% |
3.886 |
3.541 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW4BigLoopTC63
|
-8.86% |
1900.105 |
1731.737 |
- |
0.00% |
- |
|
MicroBenchmarks/LCALS/SubsetCLambdaLoops/lcalsCLambda.test:BM_DIFF_PREDICT_LAMBDA/171
|
-8.78% |
12.334 |
11.252 |
- |
0.00% |
- |
|
MicroBenchmarks/SLPVectorization/SLPVectorizationBenchmarks.test:benchmark_add_xor_runtime_checks_pass<4, int>
|
-8.61% |
16.773 |
15.329 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW4BigLoopTC63
|
-8.60% |
1691.490 |
1546.028 |
- |
0.00% |
- |
|
External/SPEC/CINT2017rate/520.omnetpp_r/520.omnetpp_r
|
-8.57% |
650.814 |
595.026 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchAutoVecForBigLoopTC64
|
-8.38% |
47.954 |
43.936 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecInLoopWithVW8From_uint8_t_To_uint32_t_
|
-8.33% |
7077.856 |
6488.245 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecInLoopWithVW8From_uint8_t_To_uint64_t_
|
-8.31% |
13351.372 |
12242.498 |
- |
0.00% |
- |
|
MultiSource/Benchmarks/PAQ8p/paq8p
|
-8.28% |
165.774 |
152.049 |
- |
0.00% |
- |
|
MultiSource/Benchmarks/7zip/7zip-benchmark
|
-8.16% |
30.900 |
28.378 |
- |
0.00% |
- |
|
External/SPEC/CINT2017rate/502.gcc_r/502.gcc_r
|
-8.14% |
428.379 |
393.500 |
- |
0.00% |
- |
|
MicroBenchmarks/ImageProcessing/Blur/blur.test:BENCHMARK_GAUSSIAN_BLUR/256
|
-8.12% |
22898.707 |
21039.915 |
- |
0.00% |
- |
|
SingleSource/Benchmarks/Polybench/stencils/adi/adi
|
-8.07% |
138.875 |
127.664 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW4BigLoopTC16
|
-8.07% |
324.162 |
297.996 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecWithAddInLoopFrom_uint16_t_To_uint8_t_
|
-7.97% |
3000.297 |
2761.230 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW4LoopTC15
|
-7.97% |
46.926 |
43.187 |
- |
0.00% |
- |
|
MicroBenchmarks/LCALS/SubsetCRawLoops/lcalsCRaw.test:BM_ADI_RAW/5001
|
-7.90% |
2442.380 |
2249.501 |
- |
0.00% |
- |
|
SingleSource/Benchmarks/CoyoteBench/fftbench
|
-7.84% |
9.330 |
8.598 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecWithAddInLoopWithVW8From_uint32_t_To_uint16_t_
|
-7.83% |
13475.983 |
12421.321 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchAutoVecForBigLoopTC128
|
-7.79% |
89.612 |
82.628 |
- |
0.00% |
- |
|
MultiSource/Benchmarks/Ptrdist/anagram/anagram
|
-7.69% |
3.786 |
3.495 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW4LoopTC16
|
-7.69% |
32.535 |
30.034 |
- |
0.00% |
- |
|
MultiSource/Benchmarks/Trimaran/enc-md5/enc-md5
|
-7.68% |
3.507 |
3.238 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW4LoopTC16
|
-7.61% |
33.161 |
30.639 |
- |
0.00% |
- |
|
External/SPEC/CFP2017rate/519.lbm_r/519.lbm_r
|
-7.60% |
214.032 |
197.775 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForBigLoopWithReductionAutoVecTC32
|
-7.59% |
85.105 |
78.646 |
- |
0.00% |
- |
|
MicroBenchmarks/ImageProcessing/Blur/blur.test:BENCHMARK_GAUSSIAN_BLUR/128
|
-7.47% |
5206.448 |
4817.267 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchAutoVecForBigLoopTC127
|
-7.47% |
89.544 |
82.853 |
- |
0.00% |
- |
|
MicroBenchmarks/LCALS/SubsetCRawLoops/lcalsCRaw.test:BM_DIFF_PREDICT_RAW/171
|
-7.45% |
12.359 |
11.438 |
- |
0.00% |
- |
|
MicroBenchmarks/LCALS/SubsetCLambdaLoops/lcalsCLambda.test:BM_FIRST_DIFF_LAMBDA/171
|
-7.45% |
0.263 |
0.243 |
- |
0.00% |
- |
|
SingleSource/Benchmarks/CoyoteBench/huffbench
|
-7.43% |
41.722 |
38.623 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecWithAddInLoopFrom_uint64_t_To_uint16_t_
|
-7.37% |
17851.278 |
16535.421 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchAutoVecForLoopTC128
|
-7.28% |
89.946 |
83.394 |
- |
0.00% |
- |
|
MicroBenchmarks/ImageProcessing/Blur/blur.test:BENCHMARK_GAUSSIAN_BLUR/512
|
-7.27% |
95514.756 |
88571.823 |
- |
0.00% |
- |
|
MicroBenchmarks/LCALS/SubsetCLambdaLoops/lcalsCLambda.test:BM_BAND_LIN_EQ_LAMBDA/44217
|
-7.21% |
179.441 |
166.508 |
- |
0.00% |
- |
|
MicroBenchmarks/ImageProcessing/Blur/blur.test:BENCHMARK_boxBlurKernel/512
|
-7.13% |
7687.093 |
7139.272 |
- |
0.00% |
- |
|
MicroBenchmarks/LCALS/SubsetCRawLoops/lcalsCRaw.test:BM_FIRST_DIFF_RAW/171
|
-7.08% |
0.262 |
0.243 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW1LoopWithReductionTC32
|
-7.04% |
44.423 |
41.295 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW4LoopWithReductionTC32
|
-7.04% |
44.426 |
41.297 |
- |
0.00% |
- |
|
SingleSource/Benchmarks/Misc/pi
|
-7.02% |
1.782 |
1.657 |
- |
0.00% |
- |
|
MultiSource/Benchmarks/DOE-ProxyApps-C/XSBench/XSBench
|
-6.95% |
18.793 |
17.486 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW1LoopWithReductionTC31
|
-6.95% |
45.053 |
41.922 |
- |
0.00% |
- |
|
MicroBenchmarks/ImageProcessing/Dilate/Dilate.test:BENCHMARK_DILATE/128
|
-6.94% |
202.298 |
188.268 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW4LoopWithReductionTC31
|
-6.93% |
45.049 |
41.927 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW4LoopTC16
|
-6.88% |
36.290 |
33.792 |
- |
0.00% |
- |
|
SingleSource/Benchmarks/Polybench/linear-algebra/blas/syr2k/syr2k
|
-6.86% |
203.159 |
189.223 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecWithAddInLoopWithVW8From_uint32_t_To_uint8_t_
|
-6.85% |
14416.905 |
13428.704 |
- |
0.00% |
- |
|
MultiSource/Benchmarks/Ptrdist/yacr2/yacr2
|
-6.84% |
2.222 |
2.070 |
- |
0.00% |
- |
|
MultiSource/Benchmarks/TSVC/CrossingThresholds-dbl/CrossingThresholds-dbl
|
-6.74% |
28.070 |
26.179 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchAutoVecForLoopTC127
|
-6.73% |
88.755 |
82.786 |
- |
0.00% |
- |
|
MicroBenchmarks/LCALS/SubsetCRawLoops/lcalsCRaw.test:BM_FIRST_DIFF_RAW/5001
|
-6.51% |
13.033 |
12.184 |
- |
0.00% |
- |
|
SingleSource/Benchmarks/Polybench/linear-algebra/blas/syrk/syrk
|
-6.47% |
87.448 |
81.788 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForLoopWithReductionAutoVecTC128
|
-6.43% |
68.207 |
63.821 |
- |
0.00% |
- |
|
SingleSource/Benchmarks/Polybench/linear-algebra/blas/trmm/trmm
|
-6.42% |
61.782 |
57.813 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForLoopWithReductionAutoVecTC127
|
-6.42% |
68.205 |
63.828 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchAutoVecForLoopTC63
|
-6.36% |
46.912 |
43.929 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW1BigLoopWithReductionTC3
|
-6.33% |
49.432 |
46.305 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopEpilogueVectorizationBenchmarks.test:benchReductionAutoVec<uint8_t>/127
|
-6.28% |
139.529 |
130.768 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW1BigLoopWithReductionTC1
|
-6.24% |
20.022 |
18.772 |
- |
0.00% |
- |
|
MultiSource/Benchmarks/TSVC/LinearDependence-flt/LinearDependence-flt
|
-6.21% |
14.797 |
13.878 |
- |
0.00% |
- |
|
MultiSource/Applications/SPASS/SPASS
|
-6.08% |
123.358 |
115.860 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecWithAddInLoopFrom_uint32_t_To_uint16_t_
|
-6.05% |
9435.304 |
8864.186 |
- |
0.00% |
- |
|
MicroBenchmarks/LCALS/SubsetALambdaLoops/lcalsALambda.test:BM_ENERGY_CALC_LAMBDA/5001
|
-5.91% |
456.570 |
429.596 |
- |
0.00% |
- |
|
MicroBenchmarks/ImageProcessing/Blur/blur.test:BENCHMARK_boxBlurKernel/1024
|
-5.89% |
29556.094 |
27814.753 |
- |
0.00% |
- |
|
MultiSource/Benchmarks/Olden/perimeter/perimeter
|
-5.87% |
1.119 |
1.054 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW4LoopTC3
|
-5.87% |
21.273 |
20.024 |
- |
0.00% |
- |
|
MultiSource/Benchmarks/NPB-serial/is/is
|
-5.85% |
25.302 |
23.822 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopEpilogueVectorizationBenchmarks.test:benchAutoVec<uint32_t>/127
|
-5.75% |
119.502 |
112.625 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchAutoVecForLoopTC64
|
-5.74% |
46.794 |
44.110 |
- |
0.00% |
- |
|
SingleSource/Benchmarks/Misc-C++/Large/sphereflake
|
-5.74% |
20.022 |
18.874 |
- |
0.00% |
- |
|
SingleSource/Benchmarks/BenchmarkGame/puzzle
|
-5.67% |
0.919 |
0.867 |
- |
0.00% |
- |
|
MultiSource/Benchmarks/Olden/health/health
|
-5.61% |
1.645 |
1.553 |
- |
0.00% |
- |
|
MicroBenchmarks/LCALS/SubsetCRawLoops/lcalsCRaw.test:BM_ADI_RAW/44217
|
-5.58% |
21791.977 |
20575.594 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopEpilogueVectorizationBenchmarks.test:benchAutoVec<uint16_t>/65
|
-5.56% |
67.578 |
63.820 |
- |
0.00% |
- |
|
MultiSource/Benchmarks/TSVC/IndirectAddressing-flt/IndirectAddressing-flt
|
-5.55% |
17.970 |
16.973 |
- |
0.00% |
- |
|
SingleSource/Benchmarks/Misc/salsa20
|
-5.47% |
14.937 |
14.120 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopEpilogueVectorizationBenchmarks.test:benchReductionAutoVec<uint32_t>/127
|
-5.43% |
138.284 |
130.781 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopEpilogueVectorizationBenchmarks.test:benchReductionAutoVec<uint16_t>/127
|
-5.38% |
139.529 |
132.023 |
- |
0.00% |
- |
|
MultiSource/Benchmarks/Olden/voronoi/voronoi
|
-5.32% |
1.408 |
1.333 |
- |
0.00% |
- |
|
MicroBenchmarks/LCALS/SubsetCLambdaLoops/lcalsCLambda.test:BM_HYDRO_2D_LAMBDA/171
|
-5.30% |
88.627 |
83.933 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW4LoopWithReductionTC1
|
-5.27% |
11.889 |
11.263 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW4LoopWithReductionTC3
|
-5.26% |
15.852 |
15.018 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW4LoopTC31
|
-5.22% |
71.957 |
68.203 |
- |
0.00% |
- |
|
MicroBenchmarks/harris/harris.test:BENCHMARK_HARRIS/256/256
|
-5.19% |
10472.455 |
9928.558 |
- |
0.00% |
- |
|
SingleSource/Benchmarks/McGill/chomp
|
-5.17% |
12.873 |
12.207 |
- |
0.00% |
- |
|
MicroBenchmarks/SLPVectorization/SLPVectorizationBenchmarks.test:benchmark_add_xor_no_runtime_checks_needed<16, int>
|
-5.13% |
24.401 |
23.151 |
- |
0.00% |
- |
|
MicroBenchmarks/LCALS/SubsetBRawLoops/lcalsBRaw.test:BM_MULADDSUB_RAW/171
|
-5.08% |
0.436 |
0.414 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecInLoopWithVW16From_uint8_t_To_uint64_t_
|
-5.06% |
17786.071 |
16886.360 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW4BigLoopTC4
|
-4.87% |
114.180 |
108.622 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecWithAddInLoopFrom_uint64_t_To_uint32_t_
|
-4.87% |
18561.686 |
17658.271 |
- |
0.00% |
- |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<16, LessThanZero, First>
|
-4.85% |
8762.519 |
8337.639 |
- |
0.00% |
- |
|
MicroBenchmarks/ImageProcessing/Blur/blur.test:BENCHMARK_GAUSSIAN_BLUR/1024
|
-4.85% |
444966.498 |
423392.602 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW4BigLoopTC31
|
-4.82% |
1058.953 |
1007.944 |
- |
0.00% |
- |
|
MicroBenchmarks/LCALS/SubsetCLambdaLoops/lcalsCLambda.test:BM_ADI_LAMBDA/44217
|
-4.80% |
21729.175 |
20686.995 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecWithAddInLoopWithVW16From_uint16_t_To_uint32_t_
|
-4.79% |
13273.054 |
12637.807 |
- |
0.00% |
- |
|
MultiSource/Benchmarks/MiBench/telecomm-gsm/telecomm-gsm
|
-4.75% |
0.659 |
0.628 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW4LoopTC32
|
-4.75% |
53.191 |
50.665 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW4LoopTC4
|
-4.70% |
25.653 |
24.448 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchAutoVecForBigLoopTC63
|
-4.68% |
45.948 |
43.798 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW4LoopTC15
|
-4.61% |
54.443 |
51.936 |
- |
0.00% |
- |
|
MicroBenchmarks/SLPVectorization/SLPVectorizationBenchmarks.test:benchmark_add_xor_runtime_checks_pass<16, int>
|
-4.60% |
54.439 |
51.933 |
- |
0.00% |
- |
|
MicroBenchmarks/SLPVectorization/SLPVectorizationBenchmarks.test:benchmark_add_xor_runtime_checks_fail<16, int>
|
-4.60% |
54.438 |
51.933 |
- |
0.00% |
- |
|
MultiSource/Benchmarks/TSVC/Equivalencing-dbl/Equivalencing-dbl
|
-4.59% |
7.029 |
6.707 |
- |
0.00% |
- |
|
MultiSource/Benchmarks/TSVC/Equivalencing-flt/Equivalencing-flt
|
-4.58% |
3.296 |
3.145 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopEpilogueVectorizationBenchmarks.test:benchReductionAutoVec<uint8_t>/65
|
-4.58% |
95.737 |
91.355 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW4BigLoopWithReductionTC128
|
-4.56% |
548.865 |
523.823 |
- |
0.00% |
- |
|
MicroBenchmarks/LCALS/SubsetBRawLoops/lcalsBRaw.test:BM_INIT3_RAW/171
|
-4.54% |
0.442 |
0.421 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW4LoopTC63
|
-4.54% |
123.890 |
118.262 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW4LoopWithReductionTC64
|
-4.51% |
69.458 |
66.327 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW1LoopWithReductionTC64
|
-4.50% |
69.450 |
66.326 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW1LoopWithReductionTC63
|
-4.47% |
70.079 |
66.949 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW4LoopWithReductionTC63
|
-4.46% |
70.077 |
66.951 |
- |
0.00% |
- |
|
SingleSource/Benchmarks/Shootout-C++/Shootout-C++-hash2
|
-4.45% |
9.143 |
8.736 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecWithAddInLoopFrom_uint32_t_To_uint64_t_
|
-4.42% |
21723.998 |
20764.651 |
- |
0.00% |
- |
|
MicroBenchmarks/harris/harris.test:BENCHMARK_HARRIS/512/512
|
-4.39% |
42225.127 |
40371.264 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForLoopWithReductionAutoVecTC63
|
-4.34% |
43.172 |
41.297 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForLoopWithReductionAutoVecTC64
|
-4.34% |
43.171 |
41.296 |
- |
0.00% |
- |
|
SingleSource/Benchmarks/Polybench/stencils/heat-3d/heat-3d
|
-4.33% |
25.120 |
24.032 |
- |
0.00% |
- |
|
MicroBenchmarks/LCALS/SubsetCLambdaLoops/lcalsCLambda.test:BM_PIC_2D_LAMBDA/171
|
-4.23% |
13.817 |
13.232 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecWithAddInLoopFrom_uint64_t_To_uint8_t_
|
-4.21% |
18919.674 |
18122.269 |
- |
0.00% |
- |
|
MicroBenchmarks/LCALS/SubsetCRawLoops/lcalsCRaw.test:BM_PIC_2D_RAW/171
|
-4.20% |
13.800 |
13.220 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchAutoVecForBigLoopTC2
|
-4.17% |
15.017 |
14.391 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchAutoVecForBigLoopTC8
|
-4.16% |
15.016 |
14.392 |
- |
0.00% |
- |
|
MultiSource/Benchmarks/DOE-ProxyApps-C/SimpleMOC/SimpleMOC
|
-4.15% |
10.815 |
10.367 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchAutoVecForBigLoopTC4
|
-4.14% |
15.014 |
14.392 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopEpilogueVectorizationBenchmarks.test:benchAutoVec<uint32_t>/65
|
-4.09% |
88.074 |
84.474 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW1LoopWithReductionTC4
|
-4.08% |
15.017 |
14.404 |
- |
0.00% |
- |
|
MultiSource/Benchmarks/tramp3d-v4/tramp3d-v4
|
-4.08% |
1.092 |
1.047 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW4LoopTC32
|
-4.08% |
61.318 |
58.819 |
- |
0.00% |
- |
|
MultiSource/Applications/obsequi/Obsequi
|
-4.04% |
7.770 |
7.456 |
- |
0.00% |
- |
|
SingleSource/Benchmarks/Polybench/stencils/jacobi-2d/jacobi-2d
|
-3.99% |
33.524 |
32.187 |
- |
0.00% |
- |
|
MicroBenchmarks/LCALS/SubsetCRawLoops/lcalsCRaw.test:BM_DISC_ORD_RAW/44217
|
-3.98% |
6270.326 |
6020.569 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW4LoopTC2
|
-3.98% |
16.893 |
16.221 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW4LoopWithReductionTC8
|
-3.93% |
25.402 |
24.403 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW4LoopWithReductionTC4
|
-3.90% |
17.868 |
17.172 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW4LoopTC64
|
-3.86% |
113.253 |
108.880 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW1LoopWithReductionTC3
|
-3.84% |
16.268 |
15.643 |
- |
0.00% |
- |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<2, GreaterThanZero, First>
|
-3.84% |
49985.848 |
48064.650 |
- |
0.00% |
- |
|
MicroBenchmarks/ImageProcessing/Blur/blur.test:BENCHMARK_boxBlurKernel/256
|
-3.83% |
1999.450 |
1922.773 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForBigLoopWithReductionAutoVecTC4
|
-3.80% |
49.434 |
47.555 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW1LoopWithReductionTC3
|
-3.79% |
13.008 |
12.514 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForBigLoopWithReductionAutoVecTC1
|
-3.79% |
49.432 |
47.559 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForBigLoopWithReductionAutoVecTC3
|
-3.79% |
49.429 |
47.557 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForBigLoopWithReductionAutoVecTC2
|
-3.78% |
49.429 |
47.560 |
- |
0.00% |
- |
|
MultiSource/Benchmarks/Olden/bh/bh
|
-3.71% |
5.260 |
5.065 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW4LoopTC32
|
-3.71% |
50.684 |
48.805 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForBigLoopWithReductionAutoVecTC31
|
-3.57% |
85.103 |
82.067 |
- |
0.00% |
- |
|
MicroBenchmarks/ImageProcessing/Dither/Dither.test:BENCHMARK_FLOYD_DITHER/256
|
-3.56% |
1793.443 |
1729.634 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW4BigLoopWithReductionTC1
|
-3.50% |
22.694 |
21.900 |
- |
0.00% |
- |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<32, GreaterThanZero, Mid>
|
-3.46% |
4652.530 |
4491.496 |
- |
0.00% |
- |
|
MultiSource/Benchmarks/Olden/tsp/tsp
|
-3.45% |
4.900 |
4.731 |
- |
0.00% |
- |
|
MicroBenchmarks/LCALS/SubsetARawLoops/lcalsARaw.test:BM_ENERGY_CALC_RAW/5001
|
-3.39% |
457.167 |
441.649 |
- |
0.00% |
- |
|
MicroBenchmarks/LCALS/SubsetARawLoops/lcalsARaw.test:BM_ENERGY_CALC_RAW/171
|
-3.36% |
14.169 |
13.693 |
- |
0.00% |
- |
|
MicroBenchmarks/LCALS/SubsetCRawLoops/lcalsCRaw.test:BM_PIC_1D_RAW/5001
|
-3.36% |
356.939 |
344.955 |
- |
0.00% |
- |
|
MicroBenchmarks/ImageProcessing/Dither/Dither.test:BENCHMARK_FLOYD_DITHER/128
|
-3.33% |
452.985 |
437.889 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW4LoopTC7
|
-3.32% |
37.541 |
36.293 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW4LoopTC31
|
-3.31% |
74.460 |
71.992 |
- |
0.00% |
- |
|
SingleSource/Benchmarks/Polybench/linear-algebra/solvers/lu/lu
|
-3.28% |
1288.970 |
1246.650 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopEpilogueVectorizationBenchmarks.test:benchReductionAutoVec<uint16_t>/65
|
-3.26% |
95.731 |
92.608 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW4BigLoopWithReductionTC8
|
-3.22% |
58.192 |
56.318 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecInLoopWithVW8From_uint32_t_To_uint16_t_
|
-3.18% |
9791.554 |
9479.939 |
- |
0.00% |
- |
|
MultiSource/Applications/ClamAV/clamscan
|
-3.16% |
0.475 |
0.460 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW4LoopTC1
|
-3.08% |
13.140 |
12.735 |
- |
0.00% |
- |
|
MicroBenchmarks/LCALS/SubsetALambdaLoops/lcalsALambda.test:BM_ENERGY_CALC_LAMBDA/171
|
-3.07% |
14.144 |
13.709 |
- |
0.00% |
- |
|
External/SPEC/CINT2017rate/531.deepsjeng_r/531.deepsjeng_r
|
-3.06% |
279.708 |
271.158 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchVecWithRuntimeChecks4PointersDBeforeA/1000
|
-3.06% |
5019568.331 |
4866135.403 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecInLoopFrom_uint32_t_To_uint16_t_
|
-3.05% |
8258.628 |
8006.532 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW1LoopWithReductionTC7
|
-3.02% |
20.648 |
20.024 |
- |
0.00% |
- |
|
MultiSource/Benchmarks/Rodinia/pathfinder/pathfinder
|
-2.99% |
1.272 |
1.233 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW1LoopWithReductionTC32
|
-2.98% |
52.579 |
51.014 |
- |
0.00% |
- |
|
MultiSource/Benchmarks/DOE-ProxyApps-C++/PENNANT/PENNANT
|
-2.96% |
4.914 |
4.769 |
- |
0.00% |
- |
|
MultiSource/Benchmarks/TSVC/GlobalDataFlow-dbl/GlobalDataFlow-dbl
|
-2.95% |
19.335 |
18.765 |
- |
0.00% |
- |
|
External/SPEC/CFP2017rate/544.nab_r/544.nab_r
|
-2.94% |
479.793 |
465.693 |
- |
0.00% |
- |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<63, EqZero, None>
|
-2.94% |
4744.171 |
4604.860 |
- |
0.00% |
- |
|
MultiSource/Benchmarks/TSVC/Symbolics-flt/Symbolics-flt
|
-2.93% |
4.862 |
4.719 |
- |
0.00% |
- |
|
MultiSource/Benchmarks/FreeBench/pcompress2/pcompress2
|
-2.89% |
0.400 |
0.389 |
- |
0.00% |
- |
|
SingleSource/Benchmarks/Misc/perlin
|
-2.88% |
6.661 |
6.469 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW4LoopTC8
|
-2.87% |
41.923 |
40.721 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:BENCHMARK_acosf_autovec_float_
|
-2.85% |
845.160 |
821.040 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:BENCHMARK_acosf_novec_float_
|
-2.83% |
845.032 |
821.090 |
- |
0.00% |
- |
|
MultiSource/Benchmarks/BitBench/drop3/drop3
|
-2.83% |
0.747 |
0.726 |
- |
0.00% |
- |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<64, EqZero, Mid>
|
-2.79% |
2765.597 |
2688.377 |
- |
0.00% |
- |
|
MultiSource/Benchmarks/Rodinia/backprop/backprop
|
-2.79% |
32.019 |
31.125 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecWithAddInLoopWithVW8From_uint32_t_To_uint64_t_
|
-2.74% |
25629.754 |
24927.689 |
- |
0.00% |
- |
|
SingleSource/Benchmarks/Misc/revertBits
|
-2.73% |
0.641 |
0.624 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW4LoopTC64
|
-2.71% |
93.232 |
90.708 |
- |
0.00% |
- |
|
MultiSource/Applications/lua/lua
|
-2.66% |
81.680 |
79.505 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW4BigLoopWithReductionTC64
|
-2.66% |
288.351 |
280.691 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopEpilogueVectorizationBenchmarks.test:benchReductionAutoVec<uint32_t>/65
|
-2.66% |
94.487 |
91.977 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW4BigLoopWithReductionTC32
|
-2.64% |
157.992 |
153.815 |
- |
0.00% |
- |
|
MultiSource/Benchmarks/DOE-ProxyApps-C++/miniFE/miniFE
|
-2.63% |
17.064 |
16.616 |
- |
0.00% |
- |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<4, LessThanZero, First>
|
-2.62% |
24356.915 |
23719.012 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW1LoopWithReductionTC128
|
-2.62% |
119.505 |
116.376 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW1LoopWithReductionTC64
|
-2.61% |
93.169 |
90.736 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW1LoopWithReductionTC127
|
-2.61% |
120.136 |
117.004 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW4LoopWithReductionTC128
|
-2.61% |
119.504 |
116.388 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW4LoopWithReductionTC127
|
-2.59% |
120.133 |
117.021 |
- |
0.00% |
- |
|
MultiSource/Benchmarks/TSVC/ControlLoops-flt/ControlLoops-flt
|
-2.59% |
5.526 |
5.383 |
- |
0.00% |
- |
|
External/SPEC/CFP2017rate/511.povray_r/511.povray_r
|
-2.58% |
33.531 |
32.665 |
- |
0.00% |
- |
|
MicroBenchmarks/harris/harris.test:BENCHMARK_HARRIS/2048/2048
|
-2.58% |
178359.603 |
173763.687 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW4LoopWithReductionTC7
|
-2.55% |
23.776 |
23.169 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW4LoopTC127
|
-2.50% |
225.273 |
219.640 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW4LoopWithReductionTC8
|
-2.50% |
25.029 |
24.404 |
- |
0.00% |
- |
|
MultiSource/Benchmarks/mafft/pairlocalalign
|
-2.46% |
93.075 |
90.786 |
- |
0.00% |
- |
|
MultiSource/Applications/JM/lencod/lencod
|
-2.45% |
28.841 |
28.134 |
- |
0.00% |
- |
|
MultiSource/Benchmarks/DOE-ProxyApps-C++/HPCCG/HPCCG
|
-2.39% |
4.046 |
3.949 |
- |
0.00% |
- |
|
MicroBenchmarks/ImageProcessing/Dither/Dither.test:BENCHMARK_ORDERED_DITHER/128/3
|
-2.38% |
222.211 |
216.921 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopEpilogueVectorizationBenchmarks.test:benchAutoVec<uint16_t>/127
|
-2.37% |
78.824 |
76.960 |
- |
0.00% |
- |
|
SingleSource/Benchmarks/Shootout/Shootout-matrix
|
-2.35% |
3.183 |
3.108 |
- |
0.00% |
- |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<32, LessThanZero, None>
|
-2.35% |
4599.851 |
4491.713 |
- |
0.00% |
- |
|
MicroBenchmarks/LCALS/SubsetCRawLoops/lcalsCRaw.test:BM_PLANCKIAN_RAW/44217
|
-2.34% |
4511.846 |
4406.043 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW4LoopWithReductionTC4
|
-2.33% |
18.145 |
17.723 |
- |
0.00% |
- |
|
MicroBenchmarks/LCALS/SubsetCLambdaLoops/lcalsCLambda.test:BM_MAT_X_MAT_LAMBDA/171
|
-2.33% |
2611.310 |
2550.583 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchAutoVecForBigLoopTC16
|
-2.25% |
15.016 |
14.679 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecWithAddInLoopFrom_uint8_t_To_uint64_t_
|
-2.24% |
19236.546 |
18804.742 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW4LoopTC63
|
-2.18% |
114.507 |
112.008 |
- |
0.00% |
- |
|
SingleSource/Benchmarks/Misc/flops-1
|
-2.18% |
9.000 |
8.804 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW4LoopWithReductionTC15
|
-2.15% |
37.090 |
36.292 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW4LoopWithReductionTC63
|
-2.14% |
76.087 |
74.457 |
- |
0.00% |
- |
|
MultiSource/Benchmarks/Olden/treeadd/treeadd
|
-2.09% |
1.001 |
0.981 |
- |
0.00% |
- |
|
External/SPEC/CINT2017rate/557.xz_r/557.xz_r
|
-2.09% |
217.205 |
212.674 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW1BigLoopWithReductionTC2
|
-2.08% |
30.033 |
29.409 |
- |
0.00% |
- |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<2, GreaterThanZero, None>
|
-2.08% |
61494.423 |
60217.132 |
- |
0.00% |
- |
|
MultiSource/Benchmarks/Prolangs-C++/primes/primes
|
-2.06% |
1.061 |
1.039 |
- |
0.00% |
- |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<5, EqZero, Mid>
|
-2.04% |
25848.182 |
25320.375 |
- |
0.00% |
- |
|
MultiSource/Benchmarks/VersaBench/ecbdes/ecbdes
|
-2.04% |
5.365 |
5.255 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForLoopWithReductionAutoVecTC31
|
-2.04% |
30.658 |
30.033 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForLoopWithReductionAutoVecTC32
|
-2.04% |
30.659 |
30.034 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW4LoopTC128
|
-2.03% |
214.632 |
210.268 |
- |
0.00% |
- |
|
MicroBenchmarks/LCALS/SubsetCRawLoops/lcalsCRaw.test:BM_INNER_PROD_RAW/44217
|
-2.03% |
362.171 |
354.830 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecInLoopFrom_uint64_t_To_uint16_t_
|
-2.02% |
15521.098 |
15207.319 |
- |
0.00% |
- |
|
MultiSource/Benchmarks/TSVC/LoopRerolling-flt/LoopRerolling-flt
|
-2.02% |
11.643 |
11.408 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:BENCHMARK_erf_autovec_double_
|
-2.00% |
899.581 |
881.587 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW4LoopTC31
|
-1.98% |
94.475 |
92.606 |
- |
0.00% |
- |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<31, EqZero, Mid>
|
-1.98% |
7881.836 |
7725.967 |
- |
0.00% |
- |
|
SingleSource/Benchmarks/Misc-C++/Large/ray
|
-1.94% |
12.160 |
11.924 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW4LoopWithReductionTC16
|
-1.89% |
33.162 |
32.537 |
- |
0.00% |
- |
|
External/SPEC/CFP2017rate/526.blender_r/526.blender_r
|
-1.88% |
881.195 |
864.660 |
- |
0.00% |
- |
|
MicroBenchmarks/SLPVectorization/SLPVectorizationBenchmarks.test:benchmark_xor_no_runtime_checks_needed<16, int>
|
-1.86% |
16.894 |
16.580 |
- |
0.00% |
- |
|
MultiSource/Benchmarks/DOE-ProxyApps-C/CoMD/CoMD
|
-1.85% |
9.999 |
9.814 |
- |
0.00% |
- |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<3, LessThanZero, None>
|
-1.83% |
45251.516 |
44424.584 |
- |
0.00% |
- |
|
MultiSource/Applications/siod/siod
|
-1.82% |
8.028 |
7.882 |
- |
0.00% |
- |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<16, LessThanZero, Mid>
|
-1.81% |
8816.268 |
8656.938 |
- |
0.00% |
- |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<2, GreaterThanZero, Last>
|
-1.80% |
56781.287 |
55756.634 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW4LoopTC15
|
-1.78% |
70.080 |
68.829 |
- |
0.00% |
- |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<16, EqZero, None>
|
-1.77% |
8321.591 |
8174.550 |
- |
0.00% |
- |
|
MultiSource/Applications/sgefa/sgefa
|
-1.77% |
0.617 |
0.606 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW1LoopWithReductionTC15
|
-1.76% |
35.667 |
35.039 |
- |
0.00% |
- |
|
MicroBenchmarks/LCALS/SubsetALambdaLoops/lcalsALambda.test:BM_ENERGY_CALC_LAMBDA/44217
|
-1.75% |
4416.871 |
4339.556 |
- |
0.00% |
- |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<2, GreaterThanZero, Mid>
|
-1.74% |
56743.288 |
55754.487 |
- |
0.00% |
- |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<64, GreaterThanZero, First>
|
-1.73% |
2165.771 |
2128.292 |
- |
0.00% |
- |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<16, EqZero, Mid>
|
-1.67% |
8640.605 |
8496.280 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW1LoopWithReductionTC16
|
-1.66% |
37.540 |
36.915 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchVecWithRuntimeChecks4PointersDBeforeA/32
|
-1.60% |
166201.655 |
163534.472 |
- |
0.00% |
- |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<5, GreaterThanZero, Mid>
|
-1.58% |
25693.123 |
25287.385 |
- |
0.00% |
- |
|
MultiSource/Benchmarks/ASCI_Purple/SMG2000/smg2000
|
-1.58% |
18.897 |
18.599 |
- |
0.00% |
- |
|
MicroBenchmarks/LCALS/SubsetARawLoops/lcalsARaw.test:BM_DEL_DOT_VEC_2D_RAW/1
|
-1.56% |
297.449 |
292.794 |
- |
0.00% |
- |
|
SingleSource/Benchmarks/Misc/mandel-2
|
-1.56% |
2.535 |
2.495 |
- |
0.00% |
- |
|
MicroBenchmarks/LCALS/SubsetALambdaLoops/lcalsALambda.test:BM_DEL_DOT_VEC_2D_LAMBDA/1
|
-1.55% |
297.386 |
292.765 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW4LoopWithReductionTC32
|
-1.54% |
40.673 |
40.045 |
- |
0.00% |
- |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<3, GreaterThanZero, None>
|
-1.54% |
45226.113 |
44531.070 |
- |
0.00% |
- |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<63, GreaterThanZero, Last>
|
-1.53% |
4800.750 |
4727.443 |
- |
0.00% |
- |
|
MicroBenchmarks/LCALS/SubsetARawLoops/lcalsARaw.test:BM_FIR_RAW/171
|
-1.49% |
1.169 |
1.152 |
- |
0.00% |
- |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<32, GreaterThanZero, None>
|
-1.48% |
4495.548 |
4429.118 |
- |
0.00% |
- |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<8, EqZero, Mid>
|
-1.48% |
19519.382 |
19231.215 |
- |
0.00% |
- |
|
MultiSource/Benchmarks/Rodinia/hotspot/hotspot
|
-1.47% |
2.068 |
2.038 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW4LoopWithReductionTC127
|
-1.47% |
106.048 |
104.489 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW4LoopTC128
|
-1.45% |
173.323 |
170.816 |
- |
0.00% |
- |
|
MultiSource/Applications/sqlite3/sqlite3
|
-1.42% |
12.973 |
12.789 |
- |
0.00% |
- |
|
MicroBenchmarks/LCALS/SubsetALambdaLoops/lcalsALambda.test:BM_FIR_LAMBDA/171
|
-1.41% |
1.168 |
1.152 |
- |
0.00% |
- |
|
MultiSource/Benchmarks/TSVC/ControlLoops-dbl/ControlLoops-dbl
|
-1.40% |
11.305 |
11.147 |
- |
0.00% |
- |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<64, LessThanZero, Mid>
|
-1.38% |
2768.933 |
2730.821 |
- |
0.00% |
- |
|
MicroBenchmarks/LCALS/SubsetBLambdaLoops/lcalsBLambda.test:BM_MULADDSUB_LAMBDA/44217
|
-1.34% |
392.899 |
387.615 |
- |
0.00% |
- |
|
MicroBenchmarks/LCALS/SubsetARawLoops/lcalsARaw.test:BM_PRESSURE_CALC_RAW/5001
|
-1.31% |
44.479 |
43.897 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecWithAddInLoopFrom_uint8_t_To_uint16_t_
|
-1.31% |
3390.155 |
3345.854 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW4LoopWithReductionTC3
|
-1.30% |
16.270 |
16.058 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:BENCHMARK_expf_autovec_float_
|
-1.28% |
914.201 |
902.532 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW4LoopTC127
|
-1.28% |
194.604 |
192.120 |
- |
0.00% |
- |
|
External/SPEC/CINT2017rate/541.leela_r/541.leela_r
|
-1.27% |
231.003 |
228.080 |
- |
0.00% |
- |
|
MicroBenchmarks/LCALS/SubsetCRawLoops/lcalsCRaw.test:BM_MAT_X_MAT_RAW/5001
|
-1.24% |
755504.580 |
746105.622 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopInterchange/LoopInterchange.test:BENCHMARK_LI1
|
-1.24% |
1554.411 |
1535.127 |
- |
0.00% |
- |
|
SingleSource/Benchmarks/Shootout-C++/Shootout-C++-lists1
|
-1.23% |
1.029 |
1.017 |
- |
0.00% |
- |
|
SingleSource/Benchmarks/SmallPT/smallpt
|
-1.22% |
30.189 |
29.819 |
- |
0.00% |
- |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<64, LessThanZero, None>
|
-1.22% |
3008.574 |
2971.881 |
- |
0.00% |
- |
|
MicroBenchmarks/LCALS/SubsetCRawLoops/lcalsCRaw.test:BM_INT_PREDICT_RAW/171
|
-1.22% |
6.917 |
6.833 |
- |
0.00% |
- |
|
MicroBenchmarks/LCALS/SubsetBLambdaLoops/lcalsBLambda.test:BM_INIT3_LAMBDA/44217
|
-1.22% |
396.838 |
392.014 |
- |
0.00% |
- |
|
MultiSource/Benchmarks/DOE-ProxyApps-C++/CLAMR/CLAMR
|
-1.21% |
12.390 |
12.240 |
- |
0.00% |
- |
|
MicroBenchmarks/MemFunctions/MemFunctions.test:BM_MemCmp<32, LessThanZero, Last>
|
-1.20% |
7034.778 |
6950.555 |
- |
0.00% |
- |
|
MicroBenchmarks/LCALS/SubsetCLambdaLoops/lcalsCLambda.test:BM_PLANCKIAN_LAMBDA/44217
|
-1.17% |
4443.094 |
4391.204 |
- |
0.00% |
- |
|
MicroBenchmarks/LCALS/SubsetCLambdaLoops/lcalsCLambda.test:BM_INT_PREDICT_LAMBDA/171
|
-1.14% |
6.918 |
6.839 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW4LoopWithReductionTC64
|
-1.12% |
55.687 |
55.062 |
- |
0.00% |
- |
|
MultiSource/Benchmarks/MallocBench/cfrac/cfrac
|
-1.11% |
2.801 |
2.770 |
- |
0.00% |
- |
|
MicroBenchmarks/LCALS/SubsetCLambdaLoops/lcalsCLambda.test:BM_HYDRO_1D_LAMBDA/5001
|
-1.11% |
16.577 |
16.393 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW1LoopWithReductionTC128
|
-1.10% |
172.715 |
170.813 |
- |
0.00% |
- |
|
MicroBenchmarks/LCALS/SubsetALambdaLoops/lcalsALambda.test:BM_DEL_DOT_VEC_2D_LAMBDA/0
|
-1.10% |
1863.854 |
1843.360 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW4BigLoopTC1
|
-1.09% |
102.417 |
101.304 |
- |
0.00% |
- |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW4LoopWithReductionTC31
|
-1.04% |
60.069 |
59.445 |
- |
0.00% |
- |
|
MicroBenchmarks/LCALS/SubsetCRawLoops/lcalsCRaw.test:BM_BAND_LIN_EQ_RAW/44217
|
-1.02% |
170.647 |
168.903 |
- |
0.00% |
- |
|
MicroBenchmarks/LCALS/SubsetALambdaLoops/lcalsALambda.test:BM_COUPLE_LAMBDA/1
|
-1.00% |
1397.283 |
1383.269 |
- |
0.00% |
- |