aboutsummaryrefslogtreecommitdiffhomepage
path: root/src/opts/SkXfermode_opts_arm.cpp
blob: db5d5317e3d6f5bbb2b8da170b6d96cdbe2fa3e6 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
#include "SkXfermode.h"
#include "SkXfermode_proccoeff.h"
#include "SkColorPriv.h"
#include "SkUtilsArm.h"

#if !SK_ARM_NEON_IS_NONE

#include <arm_neon.h>

////////////////////////////////////////////////////////////////////////////////

typedef uint8x8x4_t (*SkXfermodeProcSIMD)(uint8x8x4_t src, uint8x8x4_t dst);

class SkNEONProcCoeffXfermode : public SkProcCoeffXfermode {
public:
    SkNEONProcCoeffXfermode(const ProcCoeff& rec, SkXfermode::Mode mode,
                            SkXfermodeProcSIMD procSIMD)
            : INHERITED(rec, mode), fProcSIMD(procSIMD) {}

    virtual void xfer32(SkPMColor dst[], const SkPMColor src[], int count,
                        const SkAlpha aa[]) const SK_OVERRIDE;

    SK_DEVELOPER_TO_STRING()
    SK_DECLARE_PUBLIC_FLATTENABLE_DESERIALIZATION_PROCS(SkNEONProcCoeffXfermode)

private:
    SkNEONProcCoeffXfermode(SkFlattenableReadBuffer& buffer)
        : INHERITED(buffer) {

        fProcSIMD = NULL;
        if (!buffer.isCrossProcess()) {
            fProcSIMD = (SkXfermodeProcSIMD)buffer.readFunctionPtr();
        }
    }

    virtual void flatten(SkFlattenableWriteBuffer& buffer) const SK_OVERRIDE;

    SkXfermodeProcSIMD fProcSIMD;
    typedef SkProcCoeffXfermode INHERITED;
};


void SkNEONProcCoeffXfermode::xfer32(SkPMColor dst[], const SkPMColor src[],
                                     int count, const SkAlpha aa[]) const {
    SkASSERT(dst && src && count >= 0);

    SkXfermodeProc proc = this->getProc();
    SkXfermodeProcSIMD procSIMD = fProcSIMD;

    if (NULL == aa) {
        // Unrolled NEON code
        while (count >= 8) {
            uint8x8x4_t vsrc, vdst, vres;

            asm volatile (
                "vld4.u8    %h[vsrc], [%[src]]!  \t\n"
                "vld4.u8    %h[vdst], [%[dst]]   \t\n"
                : [vsrc] "=w" (vsrc), [vdst] "=w" (vdst)
                : [src] "r" (src), [dst] "r" (dst)
                :
            );

            vres = procSIMD(vsrc, vdst);

            vst4_u8((uint8_t*)dst, vres);

            count -= 8;
            dst += 8;
        }
        // Leftovers
        for (int i = 0; i < count; i++) {
            dst[i] = proc(src[i], dst[i]);
        }
    } else {
        for (int i = count - 1; i >= 0; --i) {
            unsigned a = aa[i];
            if (0 != a) {
                SkPMColor dstC = dst[i];
                SkPMColor C = proc(src[i], dstC);
                if (a != 0xFF) {
                    C = SkFourByteInterp(C, dstC, a);
                }
                dst[i] = C;
            }
        }
    }
}

#ifdef SK_DEVELOPER
void SkNEONProcCoeffXfermode::toString(SkString* str) const {
    this->INHERITED::toString(str);
}
#endif

void SkNEONProcCoeffXfermode::flatten(SkFlattenableWriteBuffer& buffer) const {
    this->INHERITED::flatten(buffer);
    if (!buffer.isCrossProcess()) {
        buffer.writeFunctionPtr((void*)fProcSIMD);
    }
}

////////////////////////////////////////////////////////////////////////////////

SkXfermodeProcSIMD gNEONXfermodeProcs[] = {
    [SkXfermode::kClear_Mode]   = NULL,
    [SkXfermode::kSrc_Mode]     = NULL,
    [SkXfermode::kDst_Mode]     = NULL,
    [SkXfermode::kSrcOver_Mode] = NULL,
    [SkXfermode::kDstOver_Mode] = NULL,
    [SkXfermode::kSrcIn_Mode]   = NULL,
    [SkXfermode::kDstIn_Mode]   = NULL,
    [SkXfermode::kSrcOut_Mode]  = NULL,
    [SkXfermode::kDstOut_Mode]  = NULL,
    [SkXfermode::kSrcATop_Mode] = NULL,
    [SkXfermode::kDstATop_Mode] = NULL,
    [SkXfermode::kXor_Mode]     = NULL,
    [SkXfermode::kPlus_Mode]    = NULL,
    [SkXfermode::kModulate_Mode]= NULL,
    [SkXfermode::kScreen_Mode]  = NULL,

    [SkXfermode::kOverlay_Mode]    = NULL,
    [SkXfermode::kDarken_Mode]     = NULL,
    [SkXfermode::kLighten_Mode]    = NULL,
    [SkXfermode::kColorDodge_Mode] = NULL,
    [SkXfermode::kColorBurn_Mode]  = NULL,
    [SkXfermode::kHardLight_Mode]  = NULL,
    [SkXfermode::kSoftLight_Mode]  = NULL,
    [SkXfermode::kDifference_Mode] = NULL,
    [SkXfermode::kExclusion_Mode]  = NULL,
    [SkXfermode::kMultiply_Mode]   = NULL,

    [SkXfermode::kHue_Mode]        = NULL,
    [SkXfermode::kSaturation_Mode] = NULL,
    [SkXfermode::kColor_Mode]      = NULL,
    [SkXfermode::kLuminosity_Mode] = NULL,
};

SK_COMPILE_ASSERT(
    SK_ARRAY_COUNT(gNEONXfermodeProcs) == SkXfermode::kLastMode + 1,
    mode_count_arm
);

#endif

SkProcCoeffXfermode* SkPlatformXfermodeFactory(const ProcCoeff& rec,
                                               SkXfermode::Mode mode) {
#if !SK_ARM_NEON_IS_NONE
    #if SK_ARM_NEON_IS_DYNAMIC
    if ((sk_cpu_arm_has_neon()) && (gNEONXfermodeProcs[mode] != NULL)) {
    #elif SK_ARM_NEON_IS_ALWAYS
    if (gNEONXfermodeProcs[mode] != NULL) {
    #endif
        return SkNEW_ARGS(SkNEONProcCoeffXfermode,
                          (rec, mode, gNEONXfermodeProcs[mode]));
    }
#endif
    return NULL;
}