aboutsummaryrefslogtreecommitdiffhomepage
path: root/src/opts/SkNx_neon.h
diff options
context:
space:
mode:
Diffstat (limited to 'src/opts/SkNx_neon.h')
-rw-r--r--src/opts/SkNx_neon.h13
1 files changed, 13 insertions, 0 deletions
diff --git a/src/opts/SkNx_neon.h b/src/opts/SkNx_neon.h
index 660b92c6b0..cf149862c5 100644
--- a/src/opts/SkNx_neon.h
+++ b/src/opts/SkNx_neon.h
@@ -223,9 +223,22 @@ public:
SkNf() {}
explicit SkNf(float val) : fVec(vdupq_n_f32(val)) {}
static SkNf Load(const float vals[4]) { return vld1q_f32(vals); }
+ static SkNf FromBytes(const uint8_t vals[4]) {
+ uint8x8_t fix8 = (uint8x8_t)vld1_dup_u32((const uint32_t*)vals);
+ uint16x8_t fix8_16 = vmovl_u8(fix8);
+ uint32x4_t fix8_32 = vmovl_u16(vget_low_u16(fix8_16));
+ return SkNf(vcvtq_f32_u32(fix8_32));
+ }
+
SkNf(float a, float b, float c, float d) { fVec = (float32x4_t) { a, b, c, d }; }
void store(float vals[4]) const { vst1q_f32(vals, fVec); }
+ void toBytes(uint8_t bytes[4]) const {
+ uint32x4_t fix8_32 = vcvtq_u32_f32(fVec);
+ uint16x4_t fix8_16 = vqmovn_u32(fix8_32);
+ uint8x8_t fix8 = vqmovn_u16(vcombine_u16(fix8_16, vdup_n_u16(0)));
+ vst1_lane_u32((uint32_t*)bytes, (uint32x2_t)fix8, 0);
+ }
SkNi<4, int> castTrunc() const { return vcvtq_s32_f32(fVec); }