diff options
author | commit-bot@chromium.org <commit-bot@chromium.org@2bbb7eff-a529-9590-31e7-b0007b416f81> | 2013-10-16 16:24:08 +0000 |
---|---|---|
committer | commit-bot@chromium.org <commit-bot@chromium.org@2bbb7eff-a529-9590-31e7-b0007b416f81> | 2013-10-16 16:24:08 +0000 |
commit | b4c29c536374cdc8657838744002e8a770dff871 (patch) | |
tree | 99afdb344eae113f1d96a562e128245ab64b3e6f /src/opts/SkColor_opts_neon.h | |
parent | 8b66abb9bc78fd031334f565c9394f4fdc99811b (diff) |
ARM Skia NEON patches - 30 - Xfermode: NEON modeprocs
Xfermode: NEON implementation of SIMD procs
This patch contains a NEON implementation for a number of Xfermodes.
It provides a big speedup on Xfermode benchmarks (currently up to 3x
with gcc4.7 but up to 10x when gcc produces optimal code for it).
Signed-off-by: Kévin PETIT <kevin.petit@arm.com>
BUG=
Committed: http://code.google.com/p/skia/source/detail?r=11777
R=djsollen@google.com, mtklein@google.com, reed@google.com, robertphillips@google.com
Author: kevin.petit.arm@gmail.com
Review URL: https://codereview.chromium.org/26627004
git-svn-id: http://skia.googlecode.com/svn/trunk@11813 2bbb7eff-a529-9590-31e7-b0007b416f81
Diffstat (limited to 'src/opts/SkColor_opts_neon.h')
-rw-r--r-- | src/opts/SkColor_opts_neon.h | 21 |
1 files changed, 21 insertions, 0 deletions
diff --git a/src/opts/SkColor_opts_neon.h b/src/opts/SkColor_opts_neon.h index 7e3057d14c..cd9e8133e2 100644 --- a/src/opts/SkColor_opts_neon.h +++ b/src/opts/SkColor_opts_neon.h @@ -3,9 +3,30 @@ #include "SkTypes.h" +#include <arm_neon.h> + #define NEON_A (SK_A32_SHIFT / 8) #define NEON_R (SK_R32_SHIFT / 8) #define NEON_G (SK_G32_SHIFT / 8) #define NEON_B (SK_B32_SHIFT / 8) +static inline uint16x8_t SkAlpha255To256_neon8(uint8x8_t alpha) { + return vaddw_u8(vdupq_n_u16(1), alpha); +} + +static inline uint8x8_t SkAlphaMul_neon8(uint8x8_t color, uint16x8_t scale) { + return vshrn_n_u16(vmovl_u8(color) * scale, 8); +} + +static inline uint8x8x4_t SkAlphaMulQ_neon8(uint8x8x4_t color, uint16x8_t scale) { + uint8x8x4_t ret; + + ret.val[NEON_A] = SkAlphaMul_neon8(color.val[NEON_A], scale); + ret.val[NEON_R] = SkAlphaMul_neon8(color.val[NEON_R], scale); + ret.val[NEON_G] = SkAlphaMul_neon8(color.val[NEON_G], scale); + ret.val[NEON_B] = SkAlphaMul_neon8(color.val[NEON_B], scale); + + return ret; +} + #endif /* #ifndef SkColor_opts_neon_DEFINED */ |