RAPP Compute Tuning Report


Best generic

Best SWAR

Best SIMD
Linux gcc1-power7.osuosl.org 3.17.2-200.fc20.ppc64p7 #1 SMP Wed Feb 18 20:59:33 MST 2015 ppc64 ppc64 ppc64 GNU/Linux
Function
Relative Execution Speed (0% to 100%)
Gain
rc_bitblt_wa_copy_bin

1.07
rc_bitblt_vm_copy_bin

1.58
rc_bitblt_vm_not_bin

1.46
rc_bitblt_vm_and_bin

1.62
rc_bitblt_vm_or_bin

1.58
rc_bitblt_vm_xor_bin

1.75
rc_bitblt_vm_nand_bin

1.50
rc_bitblt_vm_nor_bin

1.64
rc_bitblt_vm_xnor_bin

1.60
rc_bitblt_vm_andn_bin

1.68
rc_bitblt_vm_orn_bin

1.51
rc_bitblt_vm_nandn_bin

1.58
rc_bitblt_vm_norn_bin

1.61
rc_bitblt_va_copy_bin

1.01
rc_bitblt_va_not_bin

1.15
rc_bitblt_va_and_bin

1.16
rc_bitblt_va_or_bin

1.03
rc_bitblt_va_xor_bin

1.11
rc_bitblt_va_nand_bin

1.10
rc_bitblt_va_nor_bin

1.21
rc_bitblt_va_xnor_bin

1.02
rc_bitblt_va_andn_bin

1.13
rc_bitblt_va_orn_bin

1.07
rc_bitblt_va_nandn_bin

1.11
rc_bitblt_va_norn_bin

1.15
rc_pixop_set_u8

1.47
rc_pixop_not_u8

9.41
rc_pixop_flip_u8

10.30
rc_pixop_abs_u8

6.07
rc_pixop_addc_u8

15.81
rc_pixop_lerpc_u8

26.83
rc_pixop_lerpnc_u8

14.59
rc_pixop_add_u8

14.86
rc_pixop_avg_u8

9.70
rc_pixop_sub_u8

11.55
rc_pixop_subh_u8

9.82
rc_pixop_suba_u8

10.22
rc_pixop_lerp_u8

8.32
rc_pixop_lerpn_u8

8.03
rc_pixop_lerpi_u8

8.84
rc_pixop_norm_u8

5.74
rc_type_u8_to_bin

4.77
rc_type_bin_to_u8

4.10
rc_thresh_gt_u8

5.79
rc_thresh_lt_u8

5.64
rc_thresh_gtlt_u8

6.10
rc_thresh_ltgt_u8

6.14
rc_thresh_gt_pixel_u8

6.04
rc_thresh_lt_pixel_u8

5.96
rc_thresh_gtlt_pixel_u8

6.22
rc_thresh_ltgt_pixel_u8

6.21
rc_stat_sum_bin

2.59
rc_stat_sum_u8

2.59
rc_stat_sum2_u8

3.95
rc_stat_xsum_u8

6.85
rc_stat_min_bin

1.23
rc_stat_max_bin

1.03
rc_stat_min_u8

22.20
rc_stat_max_u8

21.85
rc_reduce_1x2_u8

6.39
rc_reduce_2x1_u8

10.09
rc_reduce_2x2_u8

5.05
rc_filter_diff_1x2_horz_u8

9.11
rc_filter_diff_1x2_horz_abs_u8

10.77
rc_filter_diff_2x1_vert_u8

11.35
rc_filter_diff_2x1_vert_abs_u8

12.53
rc_filter_diff_2x2_magn_u8

12.56
rc_filter_sobel_3x3_horz_u8

6.39
rc_filter_sobel_3x3_horz_abs_u8

10.86
rc_filter_sobel_3x3_vert_u8

6.16
rc_filter_sobel_3x3_vert_abs_u8

7.86
rc_filter_sobel_3x3_magn_u8

6.85
rc_filter_gauss_3x3_u8

7.39
rc_filter_laplace_3x3_u8

5.13
rc_filter_laplace_3x3_abs_u8

9.72
rc_filter_highpass_3x3_u8

4.32
rc_filter_highpass_3x3_abs_u8

8.65
rc_margin_horz_bin

1.14
rc_cond_set_u8

1.94
rc_cond_addc_u8

2.52
rc_cond_subc_u8

3.27
rc_cond_copy_u8

2.01
rc_cond_add_u8

3.06