diff options
Diffstat (limited to 'src/opts/SkNx_neon.h')
-rw-r--r-- | src/opts/SkNx_neon.h | 13 |
1 files changed, 13 insertions, 0 deletions
diff --git a/src/opts/SkNx_neon.h b/src/opts/SkNx_neon.h index 660b92c6b0..cf149862c5 100644 --- a/src/opts/SkNx_neon.h +++ b/src/opts/SkNx_neon.h @@ -223,9 +223,22 @@ public: SkNf() {} explicit SkNf(float val) : fVec(vdupq_n_f32(val)) {} static SkNf Load(const float vals[4]) { return vld1q_f32(vals); } + static SkNf FromBytes(const uint8_t vals[4]) { + uint8x8_t fix8 = (uint8x8_t)vld1_dup_u32((const uint32_t*)vals); + uint16x8_t fix8_16 = vmovl_u8(fix8); + uint32x4_t fix8_32 = vmovl_u16(vget_low_u16(fix8_16)); + return SkNf(vcvtq_f32_u32(fix8_32)); + } + SkNf(float a, float b, float c, float d) { fVec = (float32x4_t) { a, b, c, d }; } void store(float vals[4]) const { vst1q_f32(vals, fVec); } + void toBytes(uint8_t bytes[4]) const { + uint32x4_t fix8_32 = vcvtq_u32_f32(fVec); + uint16x4_t fix8_16 = vqmovn_u32(fix8_32); + uint8x8_t fix8 = vqmovn_u16(vcombine_u16(fix8_16, vdup_n_u16(0))); + vst1_lane_u32((uint32_t*)bytes, (uint32x2_t)fix8, 0); + } SkNi<4, int> castTrunc() const { return vcvtq_s32_f32(fVec); } |