aboutsummaryrefslogtreecommitdiffhomepage
path: root/src/opts/SkColor_opts_neon.h
diff options
context:
space:
mode:
authorGravatar commit-bot@chromium.org <commit-bot@chromium.org@2bbb7eff-a529-9590-31e7-b0007b416f81>2013-10-17 16:29:34 +0000
committerGravatar commit-bot@chromium.org <commit-bot@chromium.org@2bbb7eff-a529-9590-31e7-b0007b416f81>2013-10-17 16:29:34 +0000
commitcd7992ba55e8b87580f54e7c19fc033bed01640d (patch)
tree4de48a483e2fd3c2337957c337c6624f092bdeb3 /src/opts/SkColor_opts_neon.h
parent521a46750d87d3d206617d05d917ad6aad242ca4 (diff)
ARM Skia NEON patches - 30 - Xfermode: NEON modeprocs
Xfermode: NEON implementation of SIMD procs This patch contains a NEON implementation for a number of Xfermodes. It provides a big speedup on Xfermode benchmarks (currently up to 3x with gcc4.7 but up to 10x when gcc produces optimal code for it). Signed-off-by: Kévin PETIT <kevin.petit@arm.com> BUG= Committed: http://code.google.com/p/skia/source/detail?r=11777 Committed: http://code.google.com/p/skia/source/detail?r=11813 R=djsollen@google.com, mtklein@google.com, reed@google.com, robertphillips@google.com Author: kevin.petit.arm@gmail.com Review URL: https://codereview.chromium.org/26627004 git-svn-id: http://skia.googlecode.com/svn/trunk@11843 2bbb7eff-a529-9590-31e7-b0007b416f81
Diffstat (limited to 'src/opts/SkColor_opts_neon.h')
-rw-r--r--src/opts/SkColor_opts_neon.h21
1 files changed, 21 insertions, 0 deletions
diff --git a/src/opts/SkColor_opts_neon.h b/src/opts/SkColor_opts_neon.h
index 7e3057d14c..cd9e8133e2 100644
--- a/src/opts/SkColor_opts_neon.h
+++ b/src/opts/SkColor_opts_neon.h
@@ -3,9 +3,30 @@
#include "SkTypes.h"
+#include <arm_neon.h>
+
#define NEON_A (SK_A32_SHIFT / 8)
#define NEON_R (SK_R32_SHIFT / 8)
#define NEON_G (SK_G32_SHIFT / 8)
#define NEON_B (SK_B32_SHIFT / 8)
+static inline uint16x8_t SkAlpha255To256_neon8(uint8x8_t alpha) {
+ return vaddw_u8(vdupq_n_u16(1), alpha);
+}
+
+static inline uint8x8_t SkAlphaMul_neon8(uint8x8_t color, uint16x8_t scale) {
+ return vshrn_n_u16(vmovl_u8(color) * scale, 8);
+}
+
+static inline uint8x8x4_t SkAlphaMulQ_neon8(uint8x8x4_t color, uint16x8_t scale) {
+ uint8x8x4_t ret;
+
+ ret.val[NEON_A] = SkAlphaMul_neon8(color.val[NEON_A], scale);
+ ret.val[NEON_R] = SkAlphaMul_neon8(color.val[NEON_R], scale);
+ ret.val[NEON_G] = SkAlphaMul_neon8(color.val[NEON_G], scale);
+ ret.val[NEON_B] = SkAlphaMul_neon8(color.val[NEON_B], scale);
+
+ return ret;
+}
+
#endif /* #ifndef SkColor_opts_neon_DEFINED */