diff options
author | mtklein <mtklein@chromium.org> | 2016-01-19 12:20:01 -0800 |
---|---|---|
committer | Commit bot <commit-bot@chromium.org> | 2016-01-19 12:20:01 -0800 |
commit | 3bd5aba2a0e165997f683cf3aa306661e71464f6 (patch) | |
tree | 3feb6581aa6a48f7dc538eb1183dbaf06e580704 /src/opts/SkNx_sse.h | |
parent | bda86098ab2784968d0a1222dd1f4c18d18fe050 (diff) |
SkNx miplevel building
All sizes approximately twice as fast.
Before:
micros bench
1649.35 mipmap_build_512x512 nonrendering
1824.42 mipmap_build_511x512 nonrendering
2100.66 ? mipmap_build_512x511 nonrendering
2375.94 mipmap_build_511x511 nonrendering
After:
micros bench
730.32 ! mipmap_build_512x512 nonrendering
922.12 mipmap_build_511x512 nonrendering
999.07 mipmap_build_512x511 nonrendering
1342.93 ! mipmap_build_511x511 nonrendering
BUG=skia:
GOLD_TRYBOT_URL= https://gold.skia.org/search2?unt=true&query=source_type%3Dgm&master=false&issue=1606013003
CQ_EXTRA_TRYBOTS=client.skia:Test-Ubuntu-GCC-GCE-CPU-AVX2-x86_64-Release-SKNX_NO_SIMD-Trybot
Review URL: https://codereview.chromium.org/1606013003
Diffstat (limited to 'src/opts/SkNx_sse.h')
-rw-r--r-- | src/opts/SkNx_sse.h | 8 |
1 files changed, 8 insertions, 0 deletions
diff --git a/src/opts/SkNx_sse.h b/src/opts/SkNx_sse.h
index c6163b6a80..a17d988ee7 100644
--- a/src/opts/SkNx_sse.h
+++ b/src/opts/SkNx_sse.h
@@ -379,6 +379,14 @@ static inline void Sk4f_ToBytes(uint8_t bytes[16],
     _mm_cvttps_epi32(d.fVec))));
 }
 
+template<> inline Sk4h SkNx_cast<uint16_t, uint8_t, 4>(const Sk4b& src) {
+    return _mm_unpacklo_epi8(src.fVec, _mm_setzero_si128());
+}
+
+template<> inline Sk4b SkNx_cast<uint8_t, uint16_t, 4>(const Sk4h& src) {
+    return _mm_packus_epi16(src.fVec, src.fVec);
+}
+
 } // namespace |