|
SingleSource/Benchmarks/Misc/revertBits
Profile
|
18304.31% |
0.002 |
0.427 |
0.000 |
16911.16% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_no_early_exit_two_loads<uint8_t>/16
|
34.38% |
29.784 |
40.025 |
0.000 |
34.39% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_early_exit_taken_mid_two_loads<uint8_t>/28
|
33.02% |
27.401 |
36.450 |
0.001 |
33.03% |
0.001 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_no_early_exit_two_loads<uint8_t>/28
|
32.05% |
49.797 |
65.757 |
0.000 |
32.05% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_early_exit_taken_mid_two_loads<uint8_t>/51
|
31.24% |
45.745 |
60.037 |
0.001 |
31.24% |
0.001 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_no_early_exit_two_loads<uint8_t>/10
|
31.02% |
20.729 |
27.160 |
0.000 |
31.02% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_no_early_exit_two_loads<uint8_t>/51
|
30.53% |
88.160 |
115.073 |
0.001 |
30.52% |
0.001 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_no_early_exit_two_loads<uint8_t>/999
|
28.35% |
1678.367 |
2154.208 |
0.029 |
28.35% |
0.029 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_no_early_exit_two_loads<uint32_t>/999
|
28.21% |
1679.022 |
2152.751 |
0.029 |
28.21% |
0.029 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_early_exit_taken_mid_two_loads<uint32_t>/999
|
27.81% |
847.744 |
1083.515 |
0.013 |
27.80% |
0.013 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_no_early_exit_two_loads<uint8_t>/256
|
27.63% |
439.599 |
561.063 |
0.007 |
27.62% |
0.007 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_no_early_exit_two_loads<uint32_t>/256
|
27.31% |
439.597 |
559.635 |
0.006 |
27.30% |
0.006 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_no_early_exit_two_loads<uint32_t>/51
|
27.29% |
88.159 |
112.215 |
0.001 |
27.29% |
0.001 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_early_exit_taken_mid_two_loads<uint8_t>/16
|
26.91% |
18.584 |
23.586 |
0.000 |
26.90% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_no_early_exit_two_loads<uint32_t>/28
|
26.31% |
49.796 |
62.898 |
0.001 |
26.30% |
0.001 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_early_exit_taken_mid_two_loads<uint32_t>/256
|
25.91% |
228.770 |
288.039 |
0.048 |
25.91% |
0.048 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_early_exit_taken_mid_two_loads<uint32_t>/51
|
24.99% |
45.748 |
57.180 |
0.001 |
24.99% |
0.001 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_early_exit_taken_mid_two_loads<uint8_t>/999
|
24.93% |
868.986 |
1085.662 |
0.027 |
24.79% |
0.027 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_no_early_exit_two_loads<uint32_t>/16
|
23.80% |
30.022 |
37.166 |
0.000 |
23.80% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_early_exit_taken_mid_two_loads<uint32_t>/28
|
22.60% |
27.400 |
33.593 |
0.000 |
22.60% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_early_exit_taken_mid_single_load<uint64_t>/10
|
20.00% |
10.721 |
12.865 |
0.000 |
20.19% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_early_exit_taken_mid_two_loads<uint8_t>/10
|
19.99% |
14.296 |
17.153 |
0.000 |
19.98% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecInLoopWithVW16From_uint16_t_To_uint64_t_
|
19.79% |
11940.475 |
14303.004 |
73.573 |
19.86% |
73.573 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecInLoopFrom_uint16_t_To_uint64_t_
|
19.78% |
11941.271 |
14303.813 |
73.356 |
19.87% |
73.356 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecInLoopWithVW8From_uint16_t_To_uint64_t_
|
19.78% |
11941.092 |
14303.085 |
74.175 |
19.86% |
74.175 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecInLoopWithVW8From_uint32_t_To_uint16_t_
|
19.57% |
11961.382 |
14302.139 |
0.257 |
19.57% |
0.257 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecInLoopWithVW16From_uint32_t_To_uint16_t_
|
19.56% |
11961.880 |
14301.853 |
0.518 |
19.57% |
0.518 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecInLoopFrom_uint32_t_To_uint16_t_
|
19.55% |
11963.265 |
14302.174 |
0.111 |
19.57% |
0.111 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_no_early_exit_single_load<uint64_t>/10
|
18.31% |
16.916 |
20.013 |
0.000 |
18.30% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_early_exit_taken_first_two_loads<uint16_t>/10
|
16.60% |
4.289 |
5.001 |
0.001 |
16.61% |
0.001 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_early_exit_taken_first_two_loads<uint16_t>/51
|
16.55% |
4.289 |
4.998 |
0.002 |
16.55% |
0.002 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_early_exit_taken_first_two_loads<uint16_t>/999
|
16.54% |
4.289 |
4.998 |
0.002 |
16.54% |
0.002 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_early_exit_taken_first_two_loads<uint16_t>/256
|
16.54% |
4.289 |
4.998 |
0.002 |
16.54% |
0.002 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_early_exit_taken_first_two_loads<uint16_t>/16
|
16.54% |
4.289 |
4.998 |
0.000 |
16.54% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_early_exit_taken_first_two_loads<uint16_t>/28
|
16.33% |
4.289 |
4.989 |
0.006 |
16.33% |
0.006 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_early_exit_taken_mid_two_loads<uint8_t>/256
|
16.01% |
250.126 |
290.183 |
0.014 |
16.71% |
0.014 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_early_exit_taken_mid_two_loads<uint32_t>/16
|
15.99% |
17.869 |
20.728 |
0.000 |
15.99% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW4BigLoopTC1
|
15.77% |
12.093 |
13.999 |
0.003 |
15.75% |
0.003 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW4BigLoopTC1
|
14.47% |
12.226 |
13.996 |
0.005 |
14.51% |
0.005 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_early_exit_taken_mid_single_load<uint64_t>/16
|
14.32% |
15.005 |
17.154 |
0.000 |
14.31% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW4LoopTC1
|
14.28% |
5.003 |
5.718 |
0.000 |
14.27% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchAutoVecForBigLoopTC1
|
14.27% |
5.004 |
5.718 |
0.000 |
14.27% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW4LoopTC1
|
14.27% |
5.004 |
5.718 |
0.000 |
14.28% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchAutoVecForLoopTC1
|
14.27% |
5.004 |
5.718 |
0.000 |
14.28% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW4LoopTC1
|
14.27% |
5.004 |
5.718 |
0.000 |
14.28% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW4BigLoopTC1
|
14.20% |
12.149 |
13.875 |
0.062 |
12.09% |
0.062 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_no_early_exit_two_loads<uint32_t>/10
|
13.32% |
21.444 |
24.301 |
0.000 |
13.33% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchAutoVecForLoopTC4
|
13.32% |
10.722 |
12.150 |
0.000 |
13.33% |
0.000 |
|
SingleSource/Benchmarks/Polybench/linear-algebra/blas/gemver/gemver
Profile
|
13.17% |
0.280 |
0.316 |
0.004 |
17.80% |
0.004 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecWithAddInLoopWithVW16From_uint64_t_To_uint8_t_
|
12.33% |
19098.563 |
21452.988 |
3.450 |
12.28% |
3.450 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecWithAddInLoopFrom_uint64_t_To_uint8_t_
|
12.29% |
19103.986 |
21452.682 |
3.967 |
12.29% |
3.967 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecWithAddInLoopWithVW8From_uint64_t_To_uint8_t_
|
12.29% |
19104.634 |
21452.927 |
3.679 |
12.29% |
3.679 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_no_early_exit_single_load<uint64_t>/16
|
12.14% |
25.494 |
28.590 |
0.000 |
12.14% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_early_exit_taken_mid_single_load<uint64_t>/28
|
9.16% |
23.571 |
25.731 |
0.001 |
9.18% |
0.001 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW4LoopWithReductionTC4
|
9.08% |
7.863 |
8.577 |
0.000 |
9.08% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_no_early_exit_three_loads<uint16_t>/999
|
9.05% |
2630.249 |
2868.186 |
0.063 |
9.04% |
0.063 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_no_early_exit_three_loads<uint16_t>/256
|
8.87% |
683.367 |
744.015 |
0.017 |
8.87% |
0.017 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_no_early_exit_three_loads<uint16_t>/51
|
8.85% |
137.239 |
149.380 |
0.003 |
8.85% |
0.003 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_early_exit_taken_mid_three_loads<uint16_t>/999
|
8.83% |
1326.648 |
1443.760 |
0.023 |
8.82% |
0.023 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_no_early_exit_three_loads<uint16_t>/28
|
8.66% |
76.958 |
83.625 |
0.001 |
8.66% |
0.001 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_no_early_exit_three_loads<uint16_t>/16
|
8.37% |
45.507 |
49.317 |
0.001 |
8.37% |
0.001 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW4LoopTC7
|
8.32% |
17.155 |
18.583 |
0.000 |
8.32% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_early_exit_taken_mid_three_loads<uint16_t>/256
|
8.27% |
353.850 |
383.097 |
0.004 |
8.26% |
0.004 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_no_early_exit_three_loads<uint16_t>/10
|
8.00% |
29.782 |
32.164 |
0.000 |
8.00% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_early_exit_taken_mid_three_loads<uint16_t>/51
|
7.71% |
71.005 |
76.476 |
0.001 |
7.70% |
0.001 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchAutoVecForLoopTC3
|
7.69% |
9.292 |
10.006 |
0.000 |
7.68% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW4LoopTC3
|
7.68% |
9.292 |
10.006 |
0.000 |
7.68% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchAutoVecForBigLoopTC3
|
7.68% |
9.292 |
10.006 |
0.000 |
7.68% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW4LoopTC3
|
7.68% |
9.292 |
10.006 |
0.000 |
7.68% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW4LoopTC3
|
7.68% |
9.293 |
10.006 |
0.000 |
7.68% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchAutoVecForBigLoopTC8
|
7.39% |
19.300 |
20.727 |
0.000 |
7.40% |
0.000 |
|
SingleSource/Benchmarks/CoyoteBench/huffbench
Profile
|
7.31% |
45.945 |
49.304 |
0.011 |
7.33% |
0.011 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_no_early_exit_single_load<uint64_t>/28
|
7.26% |
42.648 |
45.744 |
0.000 |
7.26% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_early_exit_taken_mid_three_loads<uint16_t>/28
|
6.77% |
42.172 |
45.028 |
0.000 |
6.77% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW4LoopTC4
|
6.66% |
10.721 |
11.435 |
0.000 |
6.66% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchAutoVecForBigLoopTC4
|
6.66% |
10.722 |
11.436 |
0.000 |
6.65% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW4LoopTC4
|
6.66% |
10.722 |
11.436 |
0.000 |
6.65% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW4LoopTC4
|
6.65% |
10.722 |
11.436 |
0.000 |
6.65% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopEpilogueVectorizationBenchmarks.test:benchAutoVec<uint32_t>/65
|
6.52% |
141.526 |
150.750 |
0.279 |
6.52% |
0.279 |
|
MicroBenchmarks/LoopVectorization/LoopEpilogueVectorizationBenchmarks.test:benchReductionAutoVec<uint8_t>/127
|
6.23% |
150.167 |
159.523 |
0.203 |
6.20% |
0.203 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW4LoopTC64
|
6.16% |
139.377 |
147.969 |
0.061 |
6.16% |
0.061 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_early_exit_taken_mid_single_load<uint64_t>/51
|
6.09% |
39.075 |
41.455 |
0.000 |
6.09% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_early_exit_taken_mid_three_loads<uint16_t>/16
|
5.40% |
26.447 |
27.875 |
0.000 |
5.39% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_early_exit_taken_mid_two_loads<uint32_t>/10
|
5.25% |
13.582 |
14.295 |
0.000 |
5.26% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecInLoopWithVW8From_uint64_t_To_uint16_t_
|
5.24% |
13602.161 |
14315.594 |
187.219 |
5.24% |
187.219 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecInLoopFrom_uint64_t_To_uint16_t_
|
5.24% |
13603.391 |
14316.805 |
186.467 |
5.24% |
186.467 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecInLoopWithVW16From_uint64_t_To_uint16_t_
|
5.24% |
13603.075 |
14315.928 |
186.840 |
5.25% |
186.840 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW4BigLoopTC8
|
4.39% |
72.667 |
75.860 |
0.036 |
4.36% |
0.036 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_early_exit_taken_first_three_loads<uint16_t>/28
|
4.35% |
5.480 |
5.718 |
0.000 |
4.34% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_early_exit_taken_first_three_loads<uint16_t>/256
|
4.34% |
5.480 |
5.718 |
0.000 |
4.34% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_early_exit_taken_first_three_loads<uint16_t>/999
|
4.34% |
5.480 |
5.718 |
0.000 |
4.34% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_early_exit_taken_first_three_loads<uint16_t>/10
|
4.34% |
5.480 |
5.718 |
0.000 |
4.34% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_early_exit_taken_first_three_loads<uint8_t>/10
|
4.34% |
5.480 |
5.718 |
0.000 |
4.34% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_early_exit_taken_first_three_loads<uint16_t>/16
|
4.34% |
5.480 |
5.718 |
0.000 |
4.33% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_early_exit_taken_first_three_loads<uint8_t>/51
|
4.34% |
5.480 |
5.718 |
0.000 |
4.34% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_early_exit_taken_first_three_loads<uint16_t>/51
|
4.34% |
5.480 |
5.718 |
0.000 |
4.34% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_early_exit_taken_first_three_loads<uint8_t>/999
|
4.34% |
5.480 |
5.718 |
0.000 |
4.33% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_early_exit_taken_first_three_loads<uint8_t>/16
|
4.34% |
5.480 |
5.718 |
0.000 |
4.34% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_early_exit_taken_first_three_loads<uint8_t>/28
|
4.34% |
5.480 |
5.718 |
0.000 |
4.33% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_early_exit_taken_first_three_loads<uint8_t>/256
|
4.34% |
5.480 |
5.718 |
0.000 |
4.34% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_early_exit_taken_mid_single_load<uint16_t>/256
|
4.20% |
197.268 |
205.543 |
0.340 |
4.19% |
0.340 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:BENCHMARK_single_csa_nested_cond_load_novec_int32_t_
|
4.19% |
856602.689 |
892468.112 |
1478.792 |
4.11% |
1478.792 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW4LoopTC7
|
4.16% |
17.154 |
17.868 |
0.000 |
4.16% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchAutoVecForLoopTC7
|
4.16% |
17.155 |
17.868 |
0.000 |
4.16% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW4LoopTC7
|
4.15% |
17.155 |
17.867 |
0.001 |
4.15% |
0.001 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_no_early_exit_single_load<uint64_t>/51
|
4.01% |
75.589 |
78.622 |
0.001 |
3.99% |
0.001 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchAutoVecForBigLoopTC7
|
3.99% |
17.870 |
18.583 |
0.000 |
3.99% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_early_exit_taken_mid_three_loads<uint16_t>/10
|
3.84% |
18.584 |
19.298 |
0.000 |
3.83% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW4LoopTC8
|
3.70% |
19.299 |
20.013 |
0.000 |
3.69% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:BENCHMARK_single_csa_nested_cond_load_autovec_int32_t_
|
3.69% |
859045.343 |
890767.561 |
1222.262 |
3.85% |
1222.262 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW4LoopTC8
|
3.69% |
19.299 |
20.012 |
0.001 |
3.69% |
0.001 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchAutoVecForLoopTC8
|
3.69% |
19.299 |
20.012 |
0.001 |
3.69% |
0.001 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_no_early_exit_two_loads<uint16_t>/10
|
3.56% |
20.015 |
20.728 |
0.000 |
3.56% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW4LoopTC8
|
3.56% |
20.014 |
20.726 |
0.001 |
3.56% |
0.001 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW4LoopTC2
|
3.44% |
6.909 |
7.147 |
0.000 |
3.44% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW4LoopTC2
|
3.44% |
6.909 |
7.147 |
0.000 |
3.44% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchAutoVecForLoopTC2
|
3.44% |
6.910 |
7.147 |
0.000 |
3.44% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchAutoVecForBigLoopTC2
|
3.44% |
6.910 |
7.147 |
0.000 |
3.44% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW4LoopTC2
|
3.44% |
6.910 |
7.147 |
0.000 |
3.44% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_early_exit_taken_mid_single_load<uint32_t>/256
|
3.02% |
198.016 |
203.996 |
0.069 |
3.03% |
0.069 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW4LoopTC15
|
2.08% |
34.308 |
35.022 |
0.000 |
2.08% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW4LoopTC15
|
2.08% |
34.308 |
35.021 |
0.001 |
2.08% |
0.001 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchAutoVecForBigLoopTC15
|
2.08% |
34.309 |
35.021 |
0.001 |
2.08% |
0.001 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchAutoVecForBigLoopTC16
|
1.95% |
36.454 |
37.166 |
0.000 |
1.95% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW4LoopTC16
|
1.95% |
36.455 |
37.166 |
0.000 |
1.95% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW4LoopTC16
|
1.95% |
36.455 |
37.165 |
0.002 |
1.95% |
0.002 |
|
MicroBenchmarks/ImageProcessing/Dither/Dither.test:BENCHMARK_FLOYD_DITHER/512
|
1.95% |
4818.234 |
4912.049 |
22.847 |
0.47% |
22.847 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW4LoopTC16
|
1.95% |
36.455 |
37.165 |
0.001 |
1.95% |
0.001 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchAutoVecForLoopTC16
|
1.94% |
36.457 |
37.166 |
0.001 |
1.95% |
0.001 |
|
MultiSource/Applications/sqlite3/sqlite3
Profile
|
1.81% |
7.561 |
7.699 |
0.014 |
2.25% |
0.014 |
|
External/SPEC/CINT2017rate/523.xalancbmk_r/523.xalancbmk_r
Profile
|
1.42% |
154.449 |
156.642 |
0.438 |
-0.76% |
0.438 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW4BigLoopWithReductionTC1
|
1.39% |
9.292 |
9.421 |
0.015 |
1.38% |
0.015 |
|
MicroBenchmarks/LoopVectorization/LoopEpilogueVectorizationBenchmarks.test:benchReductionAutoVec<uint16_t>/127
|
1.34% |
145.990 |
147.950 |
0.081 |
1.20% |
0.081 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:BENCHMARK_erff_autovec_float_
|
1.17% |
525.128 |
531.260 |
0.210 |
1.13% |
0.210 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW1BigLoopWithReductionTC8
|
1.16% |
40.980 |
41.455 |
0.000 |
1.16% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForBigLoopWithReductionAutoVecTC8
|
1.16% |
40.979 |
41.454 |
0.001 |
1.15% |
0.001 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW1BigLoopWithReductionTC8
|
1.16% |
40.978 |
41.453 |
0.001 |
1.15% |
0.001 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW4BigLoopWithReductionTC8
|
1.16% |
40.980 |
41.453 |
0.001 |
1.15% |
0.001 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW4BigLoopWithReductionTC8
|
1.15% |
40.981 |
41.454 |
0.001 |
1.15% |
0.001 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW4BigLoopWithReductionTC8
|
1.15% |
40.981 |
41.454 |
0.001 |
1.15% |
0.001 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW1BigLoopWithReductionTC8
|
1.15% |
40.980 |
41.453 |
0.001 |
1.15% |
0.001 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_early_exit_taken_mid_single_load<uint16_t>/999
|
1.14% |
727.658 |
735.958 |
0.342 |
1.14% |
0.342 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW4LoopTC31
|
1.04% |
68.618 |
69.329 |
0.001 |
1.03% |
0.001 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchAutoVecForLoopTC31
|
1.03% |
68.622 |
69.329 |
0.001 |
1.04% |
0.001 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchAutoVecForBigLoopTC31
|
1.03% |
68.621 |
69.327 |
0.002 |
1.03% |
0.002 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW4LoopTC31
|
1.03% |
68.622 |
69.328 |
0.002 |
1.03% |
0.002 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW4LoopTC31
|
1.03% |
68.621 |
69.327 |
0.003 |
1.03% |
0.003 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW4LoopTC64
|
1.02% |
139.380 |
140.801 |
0.002 |
1.02% |
0.002 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW4LoopTC32
|
1.00% |
70.762 |
71.471 |
0.001 |
1.00% |
0.001 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW4LoopTC32
|
1.00% |
70.766 |
71.475 |
0.000 |
1.00% |
0.000 |
|
MultiSource/Applications/lambda-0.1.3/lambda
Profile
|
1.00% |
9.319 |
9.412 |
0.021 |
0.28% |
0.021 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchAutoVecForLoopTC32
|
1.00% |
70.767 |
71.475 |
0.002 |
1.00% |
0.002 |