diff options
Diffstat (limited to 'src/core/SkPMFloat.h')
-rw-r--r-- | src/core/SkPMFloat.h | 68 |
1 files changed, 28 insertions, 40 deletions
diff --git a/src/core/SkPMFloat.h b/src/core/SkPMFloat.h index 66262a8916..27f6f78f26 100644 --- a/src/core/SkPMFloat.h +++ b/src/core/SkPMFloat.h @@ -11,13 +11,7 @@ #include "SkTypes.h" #include "SkColor.h" #include "SkColorPriv.h" -#include "Sk4x.h" - -#if SK_CPU_SSE_LEVEL >= SK_CPU_SSE_LEVEL_SSE2 - #include <immintrin.h> -#elif defined(SK_ARM_HAS_NEON) - #include <arm_neon.h> -#endif +#include "SkNx.h" // A pre-multiplied color storing each component in the same order as SkPMColor, // but as a float in the range [0, 255]. @@ -29,29 +23,25 @@ public: // May be more efficient than one at a time. No special alignment assumed for SkPMColors. static void From4PMColors(const SkPMColor[4], SkPMFloat*, SkPMFloat*, SkPMFloat*, SkPMFloat*); - explicit SkPMFloat(SkPMColor); - SkPMFloat(float a, float r, float g, float b) { - // TODO: faster when specialized? - fColor[SK_A32_SHIFT / 8] = a; - fColor[SK_R32_SHIFT / 8] = r; - fColor[SK_G32_SHIFT / 8] = g; - fColor[SK_B32_SHIFT / 8] = b; - } - // Uninitialized. SkPMFloat() {} + explicit SkPMFloat(SkPMColor); + SkPMFloat(float a, float r, float g, float b) + #ifdef SK_PMCOLOR_IS_RGBA + : fColors(r,g,b,a) {} + #else + : fColors(b,g,r,a) {} + #endif - SkPMFloat(const SkPMFloat& that) { *this = that; } - SkPMFloat& operator=(const SkPMFloat& that); - // Freely autoconvert between SkPMFloat and Sk4f. They're always byte-for-byte identical. - /*implicit*/ SkPMFloat(const Sk4f& fs) { fs.storeAligned(fColor); } - /*implicit*/ operator Sk4f() const { return Sk4f::LoadAligned(fColor); } + // Freely autoconvert between SkPMFloat and Sk4s. + /*implicit*/ SkPMFloat(const Sk4s& fs) { fColors = fs; } + /*implicit*/ operator Sk4s() const { return fColors; } - float a() const { return fColor[SK_A32_SHIFT / 8]; } - float r() const { return fColor[SK_R32_SHIFT / 8]; } - float g() const { return fColor[SK_G32_SHIFT / 8]; } - float b() const { return fColor[SK_B32_SHIFT / 8]; } + float a() const { return fColors[SK_A32_SHIFT / 8]; } + float r() const { return fColors[SK_R32_SHIFT / 8]; } + float g() const { return fColors[SK_G32_SHIFT / 8]; } + float b() const { return fColors[SK_B32_SHIFT / 8]; } // get() and clamped() round component values to the nearest integer. SkPMColor get() const; // May SkASSERT(this->isValid()). Some implementations may clamp. @@ -75,24 +65,22 @@ public: } private: - union { - float fColor[4]; -#if SK_CPU_SSE_LEVEL >= SK_CPU_SSE_LEVEL_SSE2 - __m128 fColors; -#elif defined(SK_ARM_HAS_NEON) - float32x4_t fColors; -#endif - }; + Sk4s fColors; }; -#if SK_CPU_SSE_LEVEL >= SK_CPU_SSE_LEVEL_SSSE3 - #include "../opts/SkPMFloat_SSSE3.h" -#elif SK_CPU_SSE_LEVEL >= SK_CPU_SSE_LEVEL_SSE2 - #include "../opts/SkPMFloat_SSE2.h" -#elif defined(SK_ARM_HAS_NEON) - #include "../opts/SkPMFloat_neon.h" -#else +#ifdef SKNX_NO_SIMD + // Platform implementations of SkPMFloat assume Sk4s uses SSE or NEON. _none is generic. #include "../opts/SkPMFloat_none.h" +#else + #if SK_CPU_SSE_LEVEL >= SK_CPU_SSE_LEVEL_SSSE3 + #include "../opts/SkPMFloat_SSSE3.h" + #elif SK_CPU_SSE_LEVEL >= SK_CPU_SSE_LEVEL_SSE2 + #include "../opts/SkPMFloat_SSE2.h" + #elif defined(SK_ARM_HAS_NEON) + #include "../opts/SkPMFloat_neon.h" + #else + #include "../opts/SkPMFloat_none.h" + #endif #endif #endif//SkPM_DEFINED |