|
SingleSource/Benchmarks/Misc/revertBits
Profile
|
16899.20% |
0.003 |
0.427 |
0.000 |
16899.20% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_no_early_exit_two_loads<uint8_t>/16
|
34.38% |
29.783 |
40.023 |
0.000 |
34.38% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_early_exit_taken_mid_two_loads<uint8_t>/28
|
33.02% |
27.401 |
36.449 |
0.001 |
33.02% |
0.001 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_no_early_exit_two_loads<uint8_t>/28
|
32.04% |
49.798 |
65.753 |
0.001 |
32.04% |
0.001 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_early_exit_taken_mid_two_loads<uint8_t>/51
|
31.23% |
45.746 |
60.034 |
0.001 |
31.23% |
0.001 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_no_early_exit_two_loads<uint8_t>/10
|
31.01% |
20.729 |
27.158 |
0.001 |
31.01% |
0.001 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_no_early_exit_two_loads<uint8_t>/51
|
30.52% |
88.161 |
115.067 |
0.005 |
30.52% |
0.005 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_no_early_exit_two_loads<uint8_t>/999
|
28.35% |
1678.368 |
2154.138 |
0.048 |
28.34% |
0.048 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_no_early_exit_two_loads<uint32_t>/999
|
28.21% |
1679.053 |
2152.697 |
0.044 |
28.21% |
0.044 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_early_exit_taken_mid_two_loads<uint32_t>/999
|
27.80% |
847.795 |
1083.508 |
0.021 |
27.80% |
0.021 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_no_early_exit_two_loads<uint8_t>/256
|
27.62% |
439.611 |
561.033 |
0.116 |
27.62% |
0.116 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_no_early_exit_two_loads<uint32_t>/256
|
27.30% |
439.600 |
559.625 |
0.007 |
27.30% |
0.007 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_no_early_exit_two_loads<uint32_t>/51
|
27.28% |
88.159 |
112.211 |
0.002 |
27.28% |
0.002 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_early_exit_taken_mid_two_loads<uint8_t>/16
|
26.90% |
18.585 |
23.585 |
0.001 |
26.90% |
0.001 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_no_early_exit_two_loads<uint32_t>/28
|
26.30% |
49.799 |
62.895 |
0.001 |
26.30% |
0.001 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_early_exit_taken_mid_two_loads<uint32_t>/256
|
25.92% |
228.740 |
288.029 |
0.006 |
25.91% |
0.006 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_early_exit_taken_mid_two_loads<uint8_t>/999
|
25.31% |
866.313 |
1085.617 |
0.033 |
24.79% |
0.033 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_early_exit_taken_mid_two_loads<uint32_t>/51
|
24.99% |
45.747 |
57.178 |
0.002 |
24.98% |
0.002 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_no_early_exit_two_loads<uint32_t>/16
|
23.80% |
30.021 |
37.166 |
0.000 |
23.79% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_early_exit_taken_mid_two_loads<uint32_t>/28
|
22.59% |
27.401 |
33.592 |
0.001 |
22.60% |
0.001 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_early_exit_taken_mid_single_load<uint64_t>/10
|
19.99% |
10.722 |
12.865 |
0.000 |
20.19% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_early_exit_taken_mid_two_loads<uint8_t>/10
|
19.98% |
14.296 |
17.153 |
0.000 |
19.98% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecInLoopWithVW16From_uint16_t_To_uint64_t_
|
19.93% |
11925.437 |
14301.788 |
9.930 |
19.85% |
9.930 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecInLoopWithVW8From_uint16_t_To_uint64_t_
|
19.92% |
11925.510 |
14301.639 |
11.327 |
19.85% |
11.327 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecInLoopFrom_uint16_t_To_uint64_t_
|
19.92% |
11926.264 |
14301.659 |
8.914 |
19.85% |
8.914 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecInLoopWithVW16From_uint32_t_To_uint16_t_
|
19.57% |
11961.435 |
14302.107 |
0.409 |
19.57% |
0.409 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecInLoopFrom_uint32_t_To_uint16_t_
|
19.57% |
11961.641 |
14302.086 |
0.080 |
19.57% |
0.080 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecInLoopWithVW8From_uint32_t_To_uint16_t_
|
19.57% |
11961.690 |
14302.072 |
0.154 |
19.57% |
0.154 |
|
SingleSource/Benchmarks/Polybench/linear-algebra/blas/gemver/gemver
Profile
|
18.75% |
0.274 |
0.325 |
0.003 |
21.12% |
0.003 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_no_early_exit_single_load<uint64_t>/10
|
18.30% |
16.916 |
20.013 |
0.000 |
18.30% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_early_exit_taken_mid_two_loads<uint8_t>/256
|
17.34% |
247.281 |
290.167 |
0.007 |
16.71% |
0.007 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_early_exit_taken_first_two_loads<uint16_t>/999
|
16.54% |
4.289 |
4.998 |
0.002 |
16.54% |
0.002 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_early_exit_taken_first_two_loads<uint16_t>/51
|
16.44% |
4.289 |
4.994 |
0.004 |
16.44% |
0.004 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_early_exit_taken_first_two_loads<uint16_t>/16
|
16.44% |
4.289 |
4.994 |
0.002 |
16.44% |
0.002 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_early_exit_taken_first_two_loads<uint16_t>/28
|
16.43% |
4.289 |
4.994 |
0.003 |
16.43% |
0.003 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_early_exit_taken_first_two_loads<uint16_t>/10
|
16.33% |
4.289 |
4.989 |
0.005 |
16.33% |
0.005 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_early_exit_taken_first_two_loads<uint16_t>/256
|
16.32% |
4.289 |
4.989 |
0.005 |
16.32% |
0.005 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_early_exit_taken_mid_two_loads<uint32_t>/16
|
15.98% |
17.871 |
20.727 |
0.001 |
15.98% |
0.001 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW4BigLoopTC1
|
15.72% |
12.096 |
13.998 |
0.002 |
15.74% |
0.002 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW4BigLoopTC1
|
14.50% |
12.224 |
13.997 |
0.005 |
14.52% |
0.005 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchAutoVecForLoopTC1
|
14.28% |
5.004 |
5.718 |
0.000 |
14.28% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW4LoopTC1
|
14.27% |
5.004 |
5.718 |
0.000 |
14.28% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW4LoopTC1
|
14.27% |
5.004 |
5.718 |
0.000 |
14.27% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_early_exit_taken_mid_single_load<uint64_t>/16
|
14.27% |
15.011 |
17.153 |
0.000 |
14.31% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchAutoVecForBigLoopTC1
|
14.27% |
5.004 |
5.718 |
0.000 |
14.27% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW4LoopTC1
|
14.26% |
5.004 |
5.718 |
0.000 |
14.28% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW4BigLoopTC1
|
13.65% |
12.224 |
13.892 |
0.049 |
12.23% |
0.049 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_no_early_exit_two_loads<uint32_t>/10
|
13.32% |
21.444 |
24.301 |
0.001 |
13.32% |
0.001 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchAutoVecForLoopTC4
|
13.32% |
10.722 |
12.150 |
0.000 |
13.32% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecWithAddInLoopFrom_uint64_t_To_uint8_t_
|
12.35% |
19095.132 |
21452.433 |
0.387 |
12.29% |
0.387 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecWithAddInLoopWithVW8From_uint64_t_To_uint8_t_
|
12.30% |
19103.303 |
21452.250 |
0.273 |
12.28% |
0.273 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecWithAddInLoopWithVW16From_uint64_t_To_uint8_t_
|
12.29% |
19105.332 |
21452.617 |
0.323 |
12.28% |
0.323 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_no_early_exit_single_load<uint64_t>/16
|
12.14% |
25.494 |
28.589 |
0.000 |
12.14% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_early_exit_taken_mid_single_load<uint64_t>/28
|
9.38% |
23.523 |
25.730 |
0.000 |
9.17% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW4LoopWithReductionTC4
|
9.08% |
7.863 |
8.577 |
0.000 |
9.09% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_no_early_exit_three_loads<uint16_t>/999
|
9.04% |
2630.350 |
2868.105 |
0.056 |
9.03% |
0.056 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_no_early_exit_three_loads<uint16_t>/256
|
8.86% |
683.412 |
743.993 |
0.027 |
8.87% |
0.027 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_no_early_exit_three_loads<uint16_t>/51
|
8.84% |
137.239 |
149.375 |
0.005 |
8.84% |
0.005 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_early_exit_taken_mid_three_loads<uint16_t>/999
|
8.83% |
1326.643 |
1443.729 |
0.036 |
8.82% |
0.036 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_no_early_exit_three_loads<uint16_t>/28
|
8.65% |
76.961 |
83.621 |
0.002 |
8.66% |
0.002 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_no_early_exit_three_loads<uint16_t>/16
|
8.37% |
45.508 |
49.316 |
0.001 |
8.37% |
0.001 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW4LoopTC7
|
8.32% |
17.155 |
18.582 |
0.000 |
8.32% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_early_exit_taken_mid_three_loads<uint16_t>/256
|
8.27% |
353.819 |
383.095 |
0.003 |
8.26% |
0.003 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_no_early_exit_three_loads<uint16_t>/10
|
7.99% |
29.783 |
32.162 |
0.001 |
8.00% |
0.001 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_early_exit_taken_mid_three_loads<uint16_t>/51
|
7.71% |
71.003 |
76.475 |
0.001 |
7.70% |
0.001 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW4LoopTC3
|
7.68% |
9.292 |
10.006 |
0.000 |
7.68% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchAutoVecForLoopTC3
|
7.68% |
9.293 |
10.006 |
0.000 |
7.68% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW4LoopTC3
|
7.68% |
9.292 |
10.006 |
0.000 |
7.68% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW4LoopTC3
|
7.68% |
9.293 |
10.006 |
0.000 |
7.68% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchAutoVecForBigLoopTC3
|
7.68% |
9.293 |
10.006 |
0.000 |
7.68% |
0.000 |
|
SingleSource/Benchmarks/CoyoteBench/huffbench
Profile
|
7.40% |
45.917 |
49.315 |
0.013 |
7.35% |
0.013 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchAutoVecForBigLoopTC8
|
7.40% |
19.300 |
20.728 |
0.000 |
7.40% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_no_early_exit_single_load<uint64_t>/28
|
7.26% |
42.647 |
45.743 |
0.001 |
7.25% |
0.001 |
|
MicroBenchmarks/LoopVectorization/LoopEpilogueVectorizationBenchmarks.test:benchAutoVec<uint32_t>/65
|
6.87% |
141.527 |
151.244 |
0.135 |
6.87% |
0.135 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_early_exit_taken_mid_three_loads<uint16_t>/28
|
6.77% |
42.174 |
45.028 |
0.000 |
6.77% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchAutoVecForBigLoopTC4
|
6.66% |
10.722 |
11.436 |
0.000 |
6.65% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW4LoopTC4
|
6.66% |
10.722 |
11.436 |
0.000 |
6.66% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW4LoopTC4
|
6.66% |
10.722 |
11.436 |
0.000 |
6.66% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW4LoopTC4
|
6.65% |
10.722 |
11.435 |
0.000 |
6.65% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW4LoopTC64
|
6.16% |
139.392 |
147.975 |
0.054 |
6.16% |
0.054 |
|
MicroBenchmarks/LoopVectorization/LoopEpilogueVectorizationBenchmarks.test:benchReductionAutoVec<uint8_t>/127
|
6.10% |
150.192 |
159.356 |
0.272 |
6.09% |
0.272 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_early_exit_taken_mid_single_load<uint64_t>/51
|
6.08% |
39.076 |
41.453 |
0.001 |
6.08% |
0.001 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_early_exit_taken_mid_three_loads<uint16_t>/16
|
5.39% |
26.448 |
27.874 |
0.001 |
5.39% |
0.001 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecInLoopWithVW8From_uint64_t_To_uint16_t_
|
5.28% |
13596.431 |
14314.369 |
1.701 |
5.23% |
1.701 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_early_exit_taken_mid_two_loads<uint32_t>/10
|
5.25% |
13.581 |
14.295 |
0.000 |
5.25% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecInLoopWithVW16From_uint64_t_To_uint16_t_
|
5.25% |
13599.305 |
14313.290 |
1.758 |
5.23% |
1.758 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecInLoopFrom_uint64_t_To_uint16_t_
|
5.25% |
13602.305 |
14316.351 |
0.954 |
5.24% |
0.954 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW4BigLoopTC8
|
4.91% |
72.253 |
75.804 |
0.103 |
4.29% |
0.103 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:BENCHMARK_single_csa_nested_cond_load_novec_int32_t_
|
4.80% |
857768.382 |
898921.895 |
15317.619 |
4.86% |
15317.619 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_early_exit_taken_first_three_loads<uint16_t>/10
|
4.34% |
5.480 |
5.718 |
0.000 |
4.34% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_early_exit_taken_first_three_loads<uint16_t>/999
|
4.34% |
5.480 |
5.718 |
0.000 |
4.34% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_early_exit_taken_first_three_loads<uint16_t>/51
|
4.34% |
5.480 |
5.718 |
0.000 |
4.34% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_early_exit_taken_first_three_loads<uint8_t>/16
|
4.34% |
5.480 |
5.718 |
0.000 |
4.34% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_early_exit_taken_first_three_loads<uint8_t>/51
|
4.34% |
5.480 |
5.718 |
0.000 |
4.34% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_early_exit_taken_first_three_loads<uint16_t>/256
|
4.34% |
5.480 |
5.718 |
0.000 |
4.33% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_early_exit_taken_first_three_loads<uint16_t>/28
|
4.33% |
5.480 |
5.718 |
0.000 |
4.34% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_early_exit_taken_first_three_loads<uint16_t>/16
|
4.33% |
5.480 |
5.718 |
0.000 |
4.33% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_early_exit_taken_first_three_loads<uint8_t>/10
|
4.33% |
5.480 |
5.718 |
0.000 |
4.33% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_early_exit_taken_first_three_loads<uint8_t>/999
|
4.33% |
5.480 |
5.718 |
0.000 |
4.33% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_early_exit_taken_first_three_loads<uint8_t>/28
|
4.32% |
5.481 |
5.718 |
0.000 |
4.33% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_early_exit_taken_first_three_loads<uint8_t>/256
|
4.31% |
5.482 |
5.718 |
0.000 |
4.34% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_early_exit_taken_mid_single_load<uint16_t>/256
|
4.24% |
197.290 |
205.660 |
0.299 |
4.25% |
0.299 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW4LoopTC7
|
4.16% |
17.155 |
17.869 |
0.000 |
4.16% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchAutoVecForLoopTC7
|
4.16% |
17.155 |
17.869 |
0.000 |
4.16% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW4LoopTC7
|
4.15% |
17.155 |
17.868 |
0.000 |
4.15% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_no_early_exit_single_load<uint64_t>/51
|
4.03% |
75.575 |
78.620 |
0.001 |
3.99% |
0.001 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchAutoVecForBigLoopTC7
|
3.99% |
17.870 |
18.583 |
0.000 |
3.99% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_early_exit_taken_mid_three_loads<uint16_t>/10
|
3.83% |
18.585 |
19.297 |
0.000 |
3.83% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW4LoopTC8
|
3.69% |
19.299 |
20.012 |
0.000 |
3.70% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchAutoVecForLoopTC8
|
3.69% |
19.300 |
20.012 |
0.001 |
3.69% |
0.001 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW4LoopTC8
|
3.69% |
19.300 |
20.012 |
0.001 |
3.69% |
0.001 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW4LoopTC8
|
3.56% |
20.014 |
20.727 |
0.000 |
3.56% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_no_early_exit_two_loads<uint16_t>/10
|
3.56% |
20.014 |
20.727 |
0.001 |
3.56% |
0.001 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW4LoopTC2
|
3.44% |
6.910 |
7.147 |
0.000 |
3.44% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW4LoopTC2
|
3.44% |
6.910 |
7.147 |
0.000 |
3.44% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchAutoVecForBigLoopTC2
|
3.44% |
6.910 |
7.147 |
0.000 |
3.44% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW4LoopTC2
|
3.44% |
6.910 |
7.147 |
0.000 |
3.44% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchAutoVecForLoopTC2
|
3.44% |
6.910 |
7.147 |
0.000 |
3.44% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_early_exit_taken_mid_single_load<uint32_t>/256
|
3.04% |
198.020 |
204.034 |
0.021 |
3.05% |
0.021 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW4LoopTC15
|
2.08% |
34.309 |
35.021 |
0.001 |
2.08% |
0.001 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW4LoopTC15
|
2.07% |
34.311 |
35.021 |
0.001 |
2.07% |
0.001 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchAutoVecForBigLoopTC15
|
2.07% |
34.311 |
35.021 |
0.000 |
2.08% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecInLoopWithVW16From_uint64_t_To_uint32_t_
|
1.96% |
14079.213 |
14354.472 |
0.354 |
-1.70% |
0.354 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchAutoVecForBigLoopTC16
|
1.95% |
36.456 |
37.167 |
0.000 |
1.95% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchAutoVecForLoopTC16
|
1.95% |
36.456 |
37.167 |
0.000 |
1.95% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW4LoopTC16
|
1.95% |
36.455 |
37.166 |
0.001 |
1.95% |
0.001 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW4LoopTC16
|
1.95% |
36.456 |
37.166 |
0.000 |
1.95% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW4LoopTC16
|
1.95% |
36.456 |
37.166 |
0.000 |
1.96% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecInLoopFrom_uint64_t_To_uint32_t_
|
1.92% |
14080.270 |
14351.216 |
1.098 |
-1.70% |
1.098 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:benchForTruncOrZextVecInLoopWithVW8From_uint64_t_To_uint32_t_
|
1.92% |
14080.198 |
14350.451 |
1.578 |
-1.72% |
1.578 |
|
MicroBenchmarks/LoopVectorization/LoopEpilogueVectorizationBenchmarks.test:benchReductionAutoVec<uint16_t>/127
|
1.42% |
145.922 |
147.988 |
0.015 |
1.23% |
0.015 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW4BigLoopWithReductionTC1
|
1.40% |
9.292 |
9.422 |
0.016 |
1.21% |
0.016 |
|
External/SPEC/CINT2017rate/523.xalancbmk_r/523.xalancbmk_r
Profile
|
1.38% |
154.765 |
156.899 |
0.069 |
-0.59% |
0.069 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW4BigLoopWithReductionTC1
|
1.21% |
9.292 |
9.405 |
0.026 |
1.03% |
0.026 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW1BigLoopWithReductionTC8
|
1.16% |
40.980 |
41.455 |
0.000 |
1.15% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW4BigLoopWithReductionTC8
|
1.16% |
40.981 |
41.455 |
0.000 |
1.16% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW4BigLoopWithReductionTC8
|
1.16% |
40.981 |
41.454 |
0.000 |
1.16% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopVectorizationBenchmarks.test:autovec_early_exit_taken_mid_single_load<uint16_t>/999
|
1.15% |
727.646 |
736.049 |
0.267 |
1.15% |
0.267 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForBigLoopWithReductionAutoVecTC8
|
1.15% |
40.980 |
41.453 |
0.001 |
1.15% |
0.001 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW4BigLoopWithReductionTC8
|
1.15% |
40.981 |
41.454 |
0.001 |
1.15% |
0.001 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW1BigLoopWithReductionTC8
|
1.15% |
40.981 |
41.454 |
0.001 |
1.15% |
0.001 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW1BigLoopWithReductionTC8
|
1.15% |
40.981 |
41.454 |
0.000 |
1.16% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW1LoopWithReductionTC2
|
1.10% |
5.439 |
5.499 |
0.003 |
-0.50% |
0.003 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchAutoVecForLoopTC31
|
1.03% |
68.622 |
69.331 |
0.001 |
1.04% |
0.001 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC1VW4LoopTC31
|
1.03% |
68.622 |
69.329 |
0.000 |
1.03% |
0.000 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW4LoopTC31
|
1.03% |
68.622 |
69.328 |
0.001 |
1.03% |
0.001 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW4LoopTC31
|
1.03% |
68.623 |
69.328 |
0.002 |
1.03% |
0.002 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchAutoVecForBigLoopTC31
|
1.03% |
68.622 |
69.327 |
0.002 |
1.03% |
0.002 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC4VW4LoopTC64
|
1.01% |
139.388 |
140.799 |
0.003 |
1.02% |
0.003 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchAutoVecForLoopTC32
|
1.00% |
70.763 |
71.474 |
0.001 |
1.00% |
0.001 |
|
MicroBenchmarks/LoopVectorization/LoopInterleavingBenchmarks.test:benchForIC2VW4LoopTC32
|
1.00% |
70.766 |
71.474 |
0.001 |
1.00% |
0.001 |