aboutsummaryrefslogtreecommitdiffhomepage
path: root/src/jumper/SkJumper_generated_win.S
diff options
context:
space:
mode:
authorGravatar Mike Klein <mtklein@chromium.org>2017-08-30 09:22:50 -0400
committerGravatar Skia Commit-Bot <skia-commit-bot@chromium.org>2017-08-30 14:39:02 +0000
commit64dc4f6d4f73a890f0b2b29e68d7accd664fde87 (patch)
treee9d0d4be34f8861d96d318bc081a7a06bdfe2272 /src/jumper/SkJumper_generated_win.S
parenta523d2d1554441a79319eb46960d7b5c2dc85d9d (diff)
remove 8-bit Params struct
I'm not sure why I wrote this to use a Params struct originally, but we should have plenty of registers in _8bit to pass everything directly and avoid the stack. Even once we enable the 8-bit pipeline on 32-bit x86, we'll have 4 general purpose registers and 4 vector registers to use, precisely what we're using here. Change-Id: I3e51ab73186edcdcb8bfaa6cc99d9516db7c032a Reviewed-on: https://skia-review.googlesource.com/40771 Reviewed-by: Florin Malita <fmalita@chromium.org> Commit-Queue: Mike Klein <mtklein@chromium.org>
Diffstat (limited to 'src/jumper/SkJumper_generated_win.S')
-rw-r--r--src/jumper/SkJumper_generated_win.S7737
1 files changed, 3864 insertions, 3873 deletions
diff --git a/src/jumper/SkJumper_generated_win.S b/src/jumper/SkJumper_generated_win.S
index 08d4a3ab07..297922c68a 100644
--- a/src/jumper/SkJumper_generated_win.S
+++ b/src/jumper/SkJumper_generated_win.S
@@ -99,15 +99,15 @@ _sk_seed_shader_hsw LABEL PROC
DB 197,249,110,194 ; vmovd %edx,%xmm0
DB 196,226,125,88,192 ; vpbroadcastd %xmm0,%ymm0
DB 197,252,91,192 ; vcvtdq2ps %ymm0,%ymm0
- DB 196,226,125,24,13,138,191,2,0 ; vbroadcastss 0x2bf8a(%rip),%ymm1 # 2c0e0 <_sk_overlay_sse2_8bit+0x46b>
+ DB 196,226,125,24,13,198,190,2,0 ; vbroadcastss 0x2bec6(%rip),%ymm1 # 2c01c <_sk_overlay_sse2_8bit+0x46c>
DB 197,252,88,193 ; vaddps %ymm1,%ymm0,%ymm0
- DB 197,252,88,5,30,193,2,0 ; vaddps 0x2c11e(%rip),%ymm0,%ymm0 # 2c280 <_sk_overlay_sse2_8bit+0x60b>
+ DB 197,252,88,5,94,192,2,0 ; vaddps 0x2c05e(%rip),%ymm0,%ymm0 # 2c1c0 <_sk_overlay_sse2_8bit+0x610>
DB 197,249,110,209 ; vmovd %ecx,%xmm2
DB 196,226,125,88,210 ; vpbroadcastd %xmm2,%ymm2
DB 197,252,91,210 ; vcvtdq2ps %ymm2,%ymm2
DB 197,236,88,201 ; vaddps %ymm1,%ymm2,%ymm1
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,21,102,191,2,0 ; vbroadcastss 0x2bf66(%rip),%ymm2 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,226,125,24,21,162,190,2,0 ; vbroadcastss 0x2bea2(%rip),%ymm2 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 197,228,87,219 ; vxorps %ymm3,%ymm3,%ymm3
DB 197,220,87,228 ; vxorps %ymm4,%ymm4,%ymm4
DB 197,212,87,237 ; vxorps %ymm5,%ymm5,%ymm5
@@ -120,17 +120,17 @@ _sk_dither_hsw LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 197,121,110,194 ; vmovd %edx,%xmm8
DB 196,66,125,88,192 ; vpbroadcastd %xmm8,%ymm8
- DB 197,61,254,5,249,192,2,0 ; vpaddd 0x2c0f9(%rip),%ymm8,%ymm8 # 2c2a0 <_sk_overlay_sse2_8bit+0x62b>
+ DB 197,61,254,5,57,192,2,0 ; vpaddd 0x2c039(%rip),%ymm8,%ymm8 # 2c1e0 <_sk_overlay_sse2_8bit+0x630>
DB 197,121,110,201 ; vmovd %ecx,%xmm9
DB 196,66,125,88,201 ; vpbroadcastd %xmm9,%ymm9
DB 196,65,53,239,200 ; vpxor %ymm8,%ymm9,%ymm9
- DB 196,98,125,88,21,42,191,2,0 ; vpbroadcastd 0x2bf2a(%rip),%ymm10 # 2c0e8 <_sk_overlay_sse2_8bit+0x473>
+ DB 196,98,125,88,21,102,190,2,0 ; vpbroadcastd 0x2be66(%rip),%ymm10 # 2c024 <_sk_overlay_sse2_8bit+0x474>
DB 196,65,53,219,218 ; vpand %ymm10,%ymm9,%ymm11
DB 196,193,37,114,243,5 ; vpslld $0x5,%ymm11,%ymm11
DB 196,65,61,219,210 ; vpand %ymm10,%ymm8,%ymm10
DB 196,193,45,114,242,4 ; vpslld $0x4,%ymm10,%ymm10
- DB 196,98,125,88,37,15,191,2,0 ; vpbroadcastd 0x2bf0f(%rip),%ymm12 # 2c0ec <_sk_overlay_sse2_8bit+0x477>
- DB 196,98,125,88,45,10,191,2,0 ; vpbroadcastd 0x2bf0a(%rip),%ymm13 # 2c0f0 <_sk_overlay_sse2_8bit+0x47b>
+ DB 196,98,125,88,37,75,190,2,0 ; vpbroadcastd 0x2be4b(%rip),%ymm12 # 2c028 <_sk_overlay_sse2_8bit+0x478>
+ DB 196,98,125,88,45,70,190,2,0 ; vpbroadcastd 0x2be46(%rip),%ymm13 # 2c02c <_sk_overlay_sse2_8bit+0x47c>
DB 196,65,53,219,245 ; vpand %ymm13,%ymm9,%ymm14
DB 196,193,13,114,246,2 ; vpslld $0x2,%ymm14,%ymm14
DB 196,65,61,219,237 ; vpand %ymm13,%ymm8,%ymm13
@@ -145,8 +145,8 @@ _sk_dither_hsw LABEL PROC
DB 196,65,61,235,194 ; vpor %ymm10,%ymm8,%ymm8
DB 196,65,61,235,193 ; vpor %ymm9,%ymm8,%ymm8
DB 196,65,124,91,192 ; vcvtdq2ps %ymm8,%ymm8
- DB 196,98,125,24,13,188,190,2,0 ; vbroadcastss 0x2bebc(%rip),%ymm9 # 2c0f4 <_sk_overlay_sse2_8bit+0x47f>
- DB 196,98,125,24,21,183,190,2,0 ; vbroadcastss 0x2beb7(%rip),%ymm10 # 2c0f8 <_sk_overlay_sse2_8bit+0x483>
+ DB 196,98,125,24,13,248,189,2,0 ; vbroadcastss 0x2bdf8(%rip),%ymm9 # 2c030 <_sk_overlay_sse2_8bit+0x480>
+ DB 196,98,125,24,21,243,189,2,0 ; vbroadcastss 0x2bdf3(%rip),%ymm10 # 2c034 <_sk_overlay_sse2_8bit+0x484>
DB 196,66,61,184,209 ; vfmadd231ps %ymm9,%ymm8,%ymm10
DB 196,98,125,24,0 ; vbroadcastss (%rax),%ymm8
DB 196,65,44,89,192 ; vmulps %ymm8,%ymm10,%ymm8
@@ -176,7 +176,7 @@ _sk_uniform_color_hsw LABEL PROC
PUBLIC _sk_black_color_hsw
_sk_black_color_hsw LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,29,63,190,2,0 ; vbroadcastss 0x2be3f(%rip),%ymm3 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,226,125,24,29,123,189,2,0 ; vbroadcastss 0x2bd7b(%rip),%ymm3 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 197,252,87,192 ; vxorps %ymm0,%ymm0,%ymm0
DB 197,244,87,201 ; vxorps %ymm1,%ymm1,%ymm1
DB 197,236,87,210 ; vxorps %ymm2,%ymm2,%ymm2
@@ -185,7 +185,7 @@ _sk_black_color_hsw LABEL PROC
PUBLIC _sk_white_color_hsw
_sk_white_color_hsw LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,5,38,190,2,0 ; vbroadcastss 0x2be26(%rip),%ymm0 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,226,125,24,5,98,189,2,0 ; vbroadcastss 0x2bd62(%rip),%ymm0 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 197,252,40,200 ; vmovaps %ymm0,%ymm1
DB 197,252,40,208 ; vmovaps %ymm0,%ymm2
DB 197,252,40,216 ; vmovaps %ymm0,%ymm3
@@ -223,7 +223,7 @@ _sk_clear_hsw LABEL PROC
PUBLIC _sk_srcatop_hsw
_sk_srcatop_hsw LABEL PROC
DB 197,252,89,199 ; vmulps %ymm7,%ymm0,%ymm0
- DB 196,98,125,24,5,197,189,2,0 ; vbroadcastss 0x2bdc5(%rip),%ymm8 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,98,125,24,5,1,189,2,0 ; vbroadcastss 0x2bd01(%rip),%ymm8 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 197,60,92,195 ; vsubps %ymm3,%ymm8,%ymm8
DB 196,226,61,184,196 ; vfmadd231ps %ymm4,%ymm8,%ymm0
DB 197,244,89,207 ; vmulps %ymm7,%ymm1,%ymm1
@@ -237,7 +237,7 @@ _sk_srcatop_hsw LABEL PROC
PUBLIC _sk_dstatop_hsw
_sk_dstatop_hsw LABEL PROC
- DB 196,98,125,24,5,148,189,2,0 ; vbroadcastss 0x2bd94(%rip),%ymm8 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,98,125,24,5,208,188,2,0 ; vbroadcastss 0x2bcd0(%rip),%ymm8 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 197,60,92,199 ; vsubps %ymm7,%ymm8,%ymm8
DB 197,188,89,192 ; vmulps %ymm0,%ymm8,%ymm0
DB 196,226,101,184,196 ; vfmadd231ps %ymm4,%ymm3,%ymm0
@@ -270,7 +270,7 @@ _sk_dstin_hsw LABEL PROC
PUBLIC _sk_srcout_hsw
_sk_srcout_hsw LABEL PROC
- DB 196,98,125,24,5,55,189,2,0 ; vbroadcastss 0x2bd37(%rip),%ymm8 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,98,125,24,5,115,188,2,0 ; vbroadcastss 0x2bc73(%rip),%ymm8 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 197,60,92,199 ; vsubps %ymm7,%ymm8,%ymm8
DB 197,188,89,192 ; vmulps %ymm0,%ymm8,%ymm0
DB 197,188,89,201 ; vmulps %ymm1,%ymm8,%ymm1
@@ -281,7 +281,7 @@ _sk_srcout_hsw LABEL PROC
PUBLIC _sk_dstout_hsw
_sk_dstout_hsw LABEL PROC
- DB 196,226,125,24,5,22,189,2,0 ; vbroadcastss 0x2bd16(%rip),%ymm0 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,226,125,24,5,82,188,2,0 ; vbroadcastss 0x2bc52(%rip),%ymm0 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 197,252,92,219 ; vsubps %ymm3,%ymm0,%ymm3
DB 197,228,89,196 ; vmulps %ymm4,%ymm3,%ymm0
DB 197,228,89,205 ; vmulps %ymm5,%ymm3,%ymm1
@@ -292,7 +292,7 @@ _sk_dstout_hsw LABEL PROC
PUBLIC _sk_srcover_hsw
_sk_srcover_hsw LABEL PROC
- DB 196,98,125,24,5,245,188,2,0 ; vbroadcastss 0x2bcf5(%rip),%ymm8 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,98,125,24,5,49,188,2,0 ; vbroadcastss 0x2bc31(%rip),%ymm8 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 197,60,92,195 ; vsubps %ymm3,%ymm8,%ymm8
DB 196,194,93,184,192 ; vfmadd231ps %ymm8,%ymm4,%ymm0
DB 196,194,85,184,200 ; vfmadd231ps %ymm8,%ymm5,%ymm1
@@ -303,7 +303,7 @@ _sk_srcover_hsw LABEL PROC
PUBLIC _sk_dstover_hsw
_sk_dstover_hsw LABEL PROC
- DB 196,98,125,24,5,208,188,2,0 ; vbroadcastss 0x2bcd0(%rip),%ymm8 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,98,125,24,5,12,188,2,0 ; vbroadcastss 0x2bc0c(%rip),%ymm8 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 197,60,92,199 ; vsubps %ymm7,%ymm8,%ymm8
DB 196,226,61,168,196 ; vfmadd213ps %ymm4,%ymm8,%ymm0
DB 196,226,61,168,205 ; vfmadd213ps %ymm5,%ymm8,%ymm1
@@ -323,7 +323,7 @@ _sk_modulate_hsw LABEL PROC
PUBLIC _sk_multiply_hsw
_sk_multiply_hsw LABEL PROC
- DB 196,98,125,24,5,151,188,2,0 ; vbroadcastss 0x2bc97(%rip),%ymm8 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,98,125,24,5,211,187,2,0 ; vbroadcastss 0x2bbd3(%rip),%ymm8 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 197,60,92,207 ; vsubps %ymm7,%ymm8,%ymm9
DB 197,52,89,208 ; vmulps %ymm0,%ymm9,%ymm10
DB 197,60,92,195 ; vsubps %ymm3,%ymm8,%ymm8
@@ -344,7 +344,7 @@ _sk_multiply_hsw LABEL PROC
PUBLIC _sk_plus__hsw
_sk_plus__hsw LABEL PROC
DB 197,252,88,196 ; vaddps %ymm4,%ymm0,%ymm0
- DB 196,98,125,24,5,70,188,2,0 ; vbroadcastss 0x2bc46(%rip),%ymm8 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,98,125,24,5,130,187,2,0 ; vbroadcastss 0x2bb82(%rip),%ymm8 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 196,193,124,93,192 ; vminps %ymm8,%ymm0,%ymm0
DB 197,244,88,205 ; vaddps %ymm5,%ymm1,%ymm1
DB 196,193,116,93,200 ; vminps %ymm8,%ymm1,%ymm1
@@ -370,7 +370,7 @@ _sk_screen_hsw LABEL PROC
PUBLIC _sk_xor__hsw
_sk_xor__hsw LABEL PROC
- DB 196,98,125,24,5,241,187,2,0 ; vbroadcastss 0x2bbf1(%rip),%ymm8 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,98,125,24,5,45,187,2,0 ; vbroadcastss 0x2bb2d(%rip),%ymm8 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 197,60,92,207 ; vsubps %ymm7,%ymm8,%ymm9
DB 197,180,89,192 ; vmulps %ymm0,%ymm9,%ymm0
DB 197,60,92,195 ; vsubps %ymm3,%ymm8,%ymm8
@@ -402,7 +402,7 @@ _sk_darken_hsw LABEL PROC
DB 197,100,89,206 ; vmulps %ymm6,%ymm3,%ymm9
DB 196,193,108,95,209 ; vmaxps %ymm9,%ymm2,%ymm2
DB 197,188,92,210 ; vsubps %ymm2,%ymm8,%ymm2
- DB 196,98,125,24,5,117,187,2,0 ; vbroadcastss 0x2bb75(%rip),%ymm8 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,98,125,24,5,177,186,2,0 ; vbroadcastss 0x2bab1(%rip),%ymm8 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 197,60,92,195 ; vsubps %ymm3,%ymm8,%ymm8
DB 196,194,69,184,216 ; vfmadd231ps %ymm8,%ymm7,%ymm3
DB 72,173 ; lods %ds:(%rsi),%rax
@@ -425,7 +425,7 @@ _sk_lighten_hsw LABEL PROC
DB 197,100,89,206 ; vmulps %ymm6,%ymm3,%ymm9
DB 196,193,108,93,209 ; vminps %ymm9,%ymm2,%ymm2
DB 197,188,92,210 ; vsubps %ymm2,%ymm8,%ymm2
- DB 196,98,125,24,5,32,187,2,0 ; vbroadcastss 0x2bb20(%rip),%ymm8 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,98,125,24,5,92,186,2,0 ; vbroadcastss 0x2ba5c(%rip),%ymm8 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 197,60,92,195 ; vsubps %ymm3,%ymm8,%ymm8
DB 196,194,69,184,216 ; vfmadd231ps %ymm8,%ymm7,%ymm3
DB 72,173 ; lods %ds:(%rsi),%rax
@@ -451,7 +451,7 @@ _sk_difference_hsw LABEL PROC
DB 196,193,108,93,209 ; vminps %ymm9,%ymm2,%ymm2
DB 197,236,88,210 ; vaddps %ymm2,%ymm2,%ymm2
DB 197,188,92,210 ; vsubps %ymm2,%ymm8,%ymm2
- DB 196,98,125,24,5,191,186,2,0 ; vbroadcastss 0x2babf(%rip),%ymm8 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,98,125,24,5,251,185,2,0 ; vbroadcastss 0x2b9fb(%rip),%ymm8 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 197,60,92,195 ; vsubps %ymm3,%ymm8,%ymm8
DB 196,194,69,184,216 ; vfmadd231ps %ymm8,%ymm7,%ymm3
DB 72,173 ; lods %ds:(%rsi),%rax
@@ -471,7 +471,7 @@ _sk_exclusion_hsw LABEL PROC
DB 197,236,89,214 ; vmulps %ymm6,%ymm2,%ymm2
DB 197,236,88,210 ; vaddps %ymm2,%ymm2,%ymm2
DB 197,188,92,210 ; vsubps %ymm2,%ymm8,%ymm2
- DB 196,98,125,24,5,121,186,2,0 ; vbroadcastss 0x2ba79(%rip),%ymm8 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,98,125,24,5,181,185,2,0 ; vbroadcastss 0x2b9b5(%rip),%ymm8 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 197,60,92,195 ; vsubps %ymm3,%ymm8,%ymm8
DB 196,194,69,184,216 ; vfmadd231ps %ymm8,%ymm7,%ymm3
DB 72,173 ; lods %ds:(%rsi),%rax
@@ -479,7 +479,7 @@ _sk_exclusion_hsw LABEL PROC
PUBLIC _sk_colorburn_hsw
_sk_colorburn_hsw LABEL PROC
- DB 196,98,125,24,5,99,186,2,0 ; vbroadcastss 0x2ba63(%rip),%ymm8 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,98,125,24,5,159,185,2,0 ; vbroadcastss 0x2b99f(%rip),%ymm8 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 197,60,92,207 ; vsubps %ymm7,%ymm8,%ymm9
DB 197,52,89,216 ; vmulps %ymm0,%ymm9,%ymm11
DB 196,65,44,87,210 ; vxorps %ymm10,%ymm10,%ymm10
@@ -535,7 +535,7 @@ _sk_colorburn_hsw LABEL PROC
PUBLIC _sk_colordodge_hsw
_sk_colordodge_hsw LABEL PROC
DB 196,65,60,87,192 ; vxorps %ymm8,%ymm8,%ymm8
- DB 196,98,125,24,13,115,185,2,0 ; vbroadcastss 0x2b973(%rip),%ymm9 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,98,125,24,13,175,184,2,0 ; vbroadcastss 0x2b8af(%rip),%ymm9 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 197,52,92,215 ; vsubps %ymm7,%ymm9,%ymm10
DB 197,44,89,216 ; vmulps %ymm0,%ymm10,%ymm11
DB 197,52,92,203 ; vsubps %ymm3,%ymm9,%ymm9
@@ -586,7 +586,7 @@ _sk_colordodge_hsw LABEL PROC
PUBLIC _sk_hardlight_hsw
_sk_hardlight_hsw LABEL PROC
- DB 196,98,125,24,5,141,184,2,0 ; vbroadcastss 0x2b88d(%rip),%ymm8 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,98,125,24,5,201,183,2,0 ; vbroadcastss 0x2b7c9(%rip),%ymm8 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 197,60,92,215 ; vsubps %ymm7,%ymm8,%ymm10
DB 197,44,89,216 ; vmulps %ymm0,%ymm10,%ymm11
DB 197,60,92,195 ; vsubps %ymm3,%ymm8,%ymm8
@@ -635,7 +635,7 @@ _sk_hardlight_hsw LABEL PROC
PUBLIC _sk_overlay_hsw
_sk_overlay_hsw LABEL PROC
- DB 196,98,125,24,5,193,183,2,0 ; vbroadcastss 0x2b7c1(%rip),%ymm8 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,98,125,24,5,253,182,2,0 ; vbroadcastss 0x2b6fd(%rip),%ymm8 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 197,60,92,215 ; vsubps %ymm7,%ymm8,%ymm10
DB 197,44,89,216 ; vmulps %ymm0,%ymm10,%ymm11
DB 197,60,92,195 ; vsubps %ymm3,%ymm8,%ymm8
@@ -695,10 +695,10 @@ _sk_softlight_hsw LABEL PROC
DB 196,65,20,88,197 ; vaddps %ymm13,%ymm13,%ymm8
DB 196,65,60,88,192 ; vaddps %ymm8,%ymm8,%ymm8
DB 196,66,61,168,192 ; vfmadd213ps %ymm8,%ymm8,%ymm8
- DB 196,98,125,24,29,216,182,2,0 ; vbroadcastss 0x2b6d8(%rip),%ymm11 # 2c0fc <_sk_overlay_sse2_8bit+0x487>
+ DB 196,98,125,24,29,20,182,2,0 ; vbroadcastss 0x2b614(%rip),%ymm11 # 2c038 <_sk_overlay_sse2_8bit+0x488>
DB 196,65,20,88,227 ; vaddps %ymm11,%ymm13,%ymm12
DB 196,65,28,89,192 ; vmulps %ymm8,%ymm12,%ymm8
- DB 196,98,125,24,37,201,182,2,0 ; vbroadcastss 0x2b6c9(%rip),%ymm12 # 2c100 <_sk_overlay_sse2_8bit+0x48b>
+ DB 196,98,125,24,37,5,182,2,0 ; vbroadcastss 0x2b605(%rip),%ymm12 # 2c03c <_sk_overlay_sse2_8bit+0x48c>
DB 196,66,21,184,196 ; vfmadd231ps %ymm12,%ymm13,%ymm8
DB 196,65,124,82,245 ; vrsqrtps %ymm13,%ymm14
DB 196,65,124,83,246 ; vrcpps %ymm14,%ymm14
@@ -708,7 +708,7 @@ _sk_softlight_hsw LABEL PROC
DB 197,4,194,255,2 ; vcmpleps %ymm7,%ymm15,%ymm15
DB 196,67,13,74,240,240 ; vblendvps %ymm15,%ymm8,%ymm14,%ymm14
DB 197,116,88,249 ; vaddps %ymm1,%ymm1,%ymm15
- DB 196,98,125,24,5,120,182,2,0 ; vbroadcastss 0x2b678(%rip),%ymm8 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,98,125,24,5,180,181,2,0 ; vbroadcastss 0x2b5b4(%rip),%ymm8 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 196,65,60,92,237 ; vsubps %ymm13,%ymm8,%ymm13
DB 197,132,92,195 ; vsubps %ymm3,%ymm15,%ymm0
DB 196,98,125,168,235 ; vfmadd213ps %ymm3,%ymm0,%ymm13
@@ -821,11 +821,11 @@ _sk_hue_hsw LABEL PROC
DB 196,65,28,89,210 ; vmulps %ymm10,%ymm12,%ymm10
DB 196,65,44,94,214 ; vdivps %ymm14,%ymm10,%ymm10
DB 196,67,45,74,224,240 ; vblendvps %ymm15,%ymm8,%ymm10,%ymm12
- DB 196,98,125,24,53,139,180,2,0 ; vbroadcastss 0x2b48b(%rip),%ymm14 # 2c104 <_sk_overlay_sse2_8bit+0x48f>
- DB 196,98,125,24,61,134,180,2,0 ; vbroadcastss 0x2b486(%rip),%ymm15 # 2c108 <_sk_overlay_sse2_8bit+0x493>
+ DB 196,98,125,24,53,199,179,2,0 ; vbroadcastss 0x2b3c7(%rip),%ymm14 # 2c040 <_sk_overlay_sse2_8bit+0x490>
+ DB 196,98,125,24,61,194,179,2,0 ; vbroadcastss 0x2b3c2(%rip),%ymm15 # 2c044 <_sk_overlay_sse2_8bit+0x494>
DB 196,65,84,89,239 ; vmulps %ymm15,%ymm5,%ymm13
DB 196,66,93,184,238 ; vfmadd231ps %ymm14,%ymm4,%ymm13
- DB 196,226,125,24,5,119,180,2,0 ; vbroadcastss 0x2b477(%rip),%ymm0 # 2c10c <_sk_overlay_sse2_8bit+0x497>
+ DB 196,226,125,24,5,179,179,2,0 ; vbroadcastss 0x2b3b3(%rip),%ymm0 # 2c048 <_sk_overlay_sse2_8bit+0x498>
DB 196,98,77,184,232 ; vfmadd231ps %ymm0,%ymm6,%ymm13
DB 196,65,116,89,215 ; vmulps %ymm15,%ymm1,%ymm10
DB 196,66,53,184,214 ; vfmadd231ps %ymm14,%ymm9,%ymm10
@@ -880,7 +880,7 @@ _sk_hue_hsw LABEL PROC
DB 196,193,124,95,192 ; vmaxps %ymm8,%ymm0,%ymm0
DB 196,65,36,95,200 ; vmaxps %ymm8,%ymm11,%ymm9
DB 196,65,116,95,192 ; vmaxps %ymm8,%ymm1,%ymm8
- DB 196,226,125,24,13,56,179,2,0 ; vbroadcastss 0x2b338(%rip),%ymm1 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,226,125,24,13,116,178,2,0 ; vbroadcastss 0x2b274(%rip),%ymm1 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 197,116,92,215 ; vsubps %ymm7,%ymm1,%ymm10
DB 197,172,89,210 ; vmulps %ymm2,%ymm10,%ymm2
DB 197,116,92,219 ; vsubps %ymm3,%ymm1,%ymm11
@@ -934,11 +934,11 @@ _sk_saturation_hsw LABEL PROC
DB 196,65,28,89,210 ; vmulps %ymm10,%ymm12,%ymm10
DB 196,65,44,94,214 ; vdivps %ymm14,%ymm10,%ymm10
DB 196,67,45,74,224,240 ; vblendvps %ymm15,%ymm8,%ymm10,%ymm12
- DB 196,98,125,24,53,101,178,2,0 ; vbroadcastss 0x2b265(%rip),%ymm14 # 2c104 <_sk_overlay_sse2_8bit+0x48f>
- DB 196,98,125,24,61,96,178,2,0 ; vbroadcastss 0x2b260(%rip),%ymm15 # 2c108 <_sk_overlay_sse2_8bit+0x493>
+ DB 196,98,125,24,53,161,177,2,0 ; vbroadcastss 0x2b1a1(%rip),%ymm14 # 2c040 <_sk_overlay_sse2_8bit+0x490>
+ DB 196,98,125,24,61,156,177,2,0 ; vbroadcastss 0x2b19c(%rip),%ymm15 # 2c044 <_sk_overlay_sse2_8bit+0x494>
DB 196,65,84,89,239 ; vmulps %ymm15,%ymm5,%ymm13
DB 196,66,93,184,238 ; vfmadd231ps %ymm14,%ymm4,%ymm13
- DB 196,226,125,24,5,81,178,2,0 ; vbroadcastss 0x2b251(%rip),%ymm0 # 2c10c <_sk_overlay_sse2_8bit+0x497>
+ DB 196,226,125,24,5,141,177,2,0 ; vbroadcastss 0x2b18d(%rip),%ymm0 # 2c048 <_sk_overlay_sse2_8bit+0x498>
DB 196,98,77,184,232 ; vfmadd231ps %ymm0,%ymm6,%ymm13
DB 196,65,116,89,215 ; vmulps %ymm15,%ymm1,%ymm10
DB 196,66,53,184,214 ; vfmadd231ps %ymm14,%ymm9,%ymm10
@@ -993,7 +993,7 @@ _sk_saturation_hsw LABEL PROC
DB 196,193,124,95,192 ; vmaxps %ymm8,%ymm0,%ymm0
DB 196,65,36,95,200 ; vmaxps %ymm8,%ymm11,%ymm9
DB 196,65,116,95,192 ; vmaxps %ymm8,%ymm1,%ymm8
- DB 196,226,125,24,13,18,177,2,0 ; vbroadcastss 0x2b112(%rip),%ymm1 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,226,125,24,13,78,176,2,0 ; vbroadcastss 0x2b04e(%rip),%ymm1 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 197,116,92,215 ; vsubps %ymm7,%ymm1,%ymm10
DB 197,172,89,210 ; vmulps %ymm2,%ymm10,%ymm2
DB 197,116,92,219 ; vsubps %ymm3,%ymm1,%ymm11
@@ -1021,11 +1021,11 @@ _sk_color_hsw LABEL PROC
DB 197,108,89,199 ; vmulps %ymm7,%ymm2,%ymm8
DB 197,116,89,215 ; vmulps %ymm7,%ymm1,%ymm10
DB 197,52,89,223 ; vmulps %ymm7,%ymm9,%ymm11
- DB 196,98,125,24,45,193,176,2,0 ; vbroadcastss 0x2b0c1(%rip),%ymm13 # 2c104 <_sk_overlay_sse2_8bit+0x48f>
- DB 196,98,125,24,53,188,176,2,0 ; vbroadcastss 0x2b0bc(%rip),%ymm14 # 2c108 <_sk_overlay_sse2_8bit+0x493>
+ DB 196,98,125,24,45,253,175,2,0 ; vbroadcastss 0x2affd(%rip),%ymm13 # 2c040 <_sk_overlay_sse2_8bit+0x490>
+ DB 196,98,125,24,53,248,175,2,0 ; vbroadcastss 0x2aff8(%rip),%ymm14 # 2c044 <_sk_overlay_sse2_8bit+0x494>
DB 196,65,84,89,230 ; vmulps %ymm14,%ymm5,%ymm12
DB 196,66,93,184,229 ; vfmadd231ps %ymm13,%ymm4,%ymm12
- DB 196,98,125,24,61,173,176,2,0 ; vbroadcastss 0x2b0ad(%rip),%ymm15 # 2c10c <_sk_overlay_sse2_8bit+0x497>
+ DB 196,98,125,24,61,233,175,2,0 ; vbroadcastss 0x2afe9(%rip),%ymm15 # 2c048 <_sk_overlay_sse2_8bit+0x498>
DB 196,66,77,184,231 ; vfmadd231ps %ymm15,%ymm6,%ymm12
DB 196,65,44,89,206 ; vmulps %ymm14,%ymm10,%ymm9
DB 196,66,61,184,205 ; vfmadd231ps %ymm13,%ymm8,%ymm9
@@ -1081,7 +1081,7 @@ _sk_color_hsw LABEL PROC
DB 196,193,116,95,206 ; vmaxps %ymm14,%ymm1,%ymm1
DB 196,65,44,95,198 ; vmaxps %ymm14,%ymm10,%ymm8
DB 196,65,124,95,206 ; vmaxps %ymm14,%ymm0,%ymm9
- DB 196,226,125,24,5,99,175,2,0 ; vbroadcastss 0x2af63(%rip),%ymm0 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,226,125,24,5,159,174,2,0 ; vbroadcastss 0x2ae9f(%rip),%ymm0 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 197,124,92,215 ; vsubps %ymm7,%ymm0,%ymm10
DB 197,172,89,210 ; vmulps %ymm2,%ymm10,%ymm2
DB 197,124,92,219 ; vsubps %ymm3,%ymm0,%ymm11
@@ -1109,11 +1109,11 @@ _sk_luminosity_hsw LABEL PROC
DB 197,100,89,196 ; vmulps %ymm4,%ymm3,%ymm8
DB 197,100,89,213 ; vmulps %ymm5,%ymm3,%ymm10
DB 197,100,89,222 ; vmulps %ymm6,%ymm3,%ymm11
- DB 196,98,125,24,45,18,175,2,0 ; vbroadcastss 0x2af12(%rip),%ymm13 # 2c104 <_sk_overlay_sse2_8bit+0x48f>
- DB 196,98,125,24,53,13,175,2,0 ; vbroadcastss 0x2af0d(%rip),%ymm14 # 2c108 <_sk_overlay_sse2_8bit+0x493>
+ DB 196,98,125,24,45,78,174,2,0 ; vbroadcastss 0x2ae4e(%rip),%ymm13 # 2c040 <_sk_overlay_sse2_8bit+0x490>
+ DB 196,98,125,24,53,73,174,2,0 ; vbroadcastss 0x2ae49(%rip),%ymm14 # 2c044 <_sk_overlay_sse2_8bit+0x494>
DB 196,65,116,89,230 ; vmulps %ymm14,%ymm1,%ymm12
DB 196,66,109,184,229 ; vfmadd231ps %ymm13,%ymm2,%ymm12
- DB 196,98,125,24,61,254,174,2,0 ; vbroadcastss 0x2aefe(%rip),%ymm15 # 2c10c <_sk_overlay_sse2_8bit+0x497>
+ DB 196,98,125,24,61,58,174,2,0 ; vbroadcastss 0x2ae3a(%rip),%ymm15 # 2c048 <_sk_overlay_sse2_8bit+0x498>
DB 196,66,53,184,231 ; vfmadd231ps %ymm15,%ymm9,%ymm12
DB 196,65,44,89,206 ; vmulps %ymm14,%ymm10,%ymm9
DB 196,66,61,184,205 ; vfmadd231ps %ymm13,%ymm8,%ymm9
@@ -1169,7 +1169,7 @@ _sk_luminosity_hsw LABEL PROC
DB 196,193,116,95,206 ; vmaxps %ymm14,%ymm1,%ymm1
DB 196,65,44,95,198 ; vmaxps %ymm14,%ymm10,%ymm8
DB 196,65,124,95,206 ; vmaxps %ymm14,%ymm0,%ymm9
- DB 196,226,125,24,5,180,173,2,0 ; vbroadcastss 0x2adb4(%rip),%ymm0 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,226,125,24,5,240,172,2,0 ; vbroadcastss 0x2acf0(%rip),%ymm0 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 197,124,92,215 ; vsubps %ymm7,%ymm0,%ymm10
DB 197,172,89,210 ; vmulps %ymm2,%ymm10,%ymm2
DB 197,124,92,219 ; vsubps %ymm3,%ymm0,%ymm11
@@ -1199,17 +1199,17 @@ _sk_srcover_rgba_8888_hsw LABEL PROC
DB 72,133,255 ; test %rdi,%rdi
DB 15,133,179,0,0,0 ; jne 1448 <_sk_srcover_rgba_8888_hsw+0xd3>
DB 196,129,126,111,60,152 ; vmovdqu (%r8,%r11,4),%ymm7
- DB 197,197,219,37,29,175,2,0 ; vpand 0x2af1d(%rip),%ymm7,%ymm4 # 2c2c0 <_sk_overlay_sse2_8bit+0x64b>
+ DB 197,197,219,37,93,174,2,0 ; vpand 0x2ae5d(%rip),%ymm7,%ymm4 # 2c200 <_sk_overlay_sse2_8bit+0x650>
DB 197,252,91,228 ; vcvtdq2ps %ymm4,%ymm4
- DB 196,226,69,0,45,48,175,2,0 ; vpshufb 0x2af30(%rip),%ymm7,%ymm5 # 2c2e0 <_sk_overlay_sse2_8bit+0x66b>
+ DB 196,226,69,0,45,112,174,2,0 ; vpshufb 0x2ae70(%rip),%ymm7,%ymm5 # 2c220 <_sk_overlay_sse2_8bit+0x670>
DB 197,252,91,237 ; vcvtdq2ps %ymm5,%ymm5
- DB 196,226,69,0,53,67,175,2,0 ; vpshufb 0x2af43(%rip),%ymm7,%ymm6 # 2c300 <_sk_overlay_sse2_8bit+0x68b>
+ DB 196,226,69,0,53,131,174,2,0 ; vpshufb 0x2ae83(%rip),%ymm7,%ymm6 # 2c240 <_sk_overlay_sse2_8bit+0x690>
DB 197,252,91,246 ; vcvtdq2ps %ymm6,%ymm6
DB 197,197,114,215,24 ; vpsrld $0x18,%ymm7,%ymm7
DB 197,252,91,255 ; vcvtdq2ps %ymm7,%ymm7
- DB 196,98,125,24,5,17,173,2,0 ; vbroadcastss 0x2ad11(%rip),%ymm8 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,98,125,24,5,77,172,2,0 ; vbroadcastss 0x2ac4d(%rip),%ymm8 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 197,60,92,195 ; vsubps %ymm3,%ymm8,%ymm8
- DB 196,98,125,24,13,48,173,2,0 ; vbroadcastss 0x2ad30(%rip),%ymm9 # 2c110 <_sk_overlay_sse2_8bit+0x49b>
+ DB 196,98,125,24,13,108,172,2,0 ; vbroadcastss 0x2ac6c(%rip),%ymm9 # 2c04c <_sk_overlay_sse2_8bit+0x49c>
DB 196,193,124,89,193 ; vmulps %ymm9,%ymm0,%ymm0
DB 196,194,93,184,192 ; vfmadd231ps %ymm8,%ymm4,%ymm0
DB 196,193,116,89,201 ; vmulps %ymm9,%ymm1,%ymm1
@@ -1331,7 +1331,7 @@ _sk_clamp_0_hsw LABEL PROC
PUBLIC _sk_clamp_1_hsw
_sk_clamp_1_hsw LABEL PROC
- DB 196,98,125,24,5,30,171,2,0 ; vbroadcastss 0x2ab1e(%rip),%ymm8 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,98,125,24,5,90,170,2,0 ; vbroadcastss 0x2aa5a(%rip),%ymm8 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 196,193,124,93,192 ; vminps %ymm8,%ymm0,%ymm0
DB 196,193,116,93,200 ; vminps %ymm8,%ymm1,%ymm1
DB 196,193,108,93,208 ; vminps %ymm8,%ymm2,%ymm2
@@ -1341,7 +1341,7 @@ _sk_clamp_1_hsw LABEL PROC
PUBLIC _sk_clamp_a_hsw
_sk_clamp_a_hsw LABEL PROC
- DB 196,98,125,24,5,253,170,2,0 ; vbroadcastss 0x2aafd(%rip),%ymm8 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,98,125,24,5,57,170,2,0 ; vbroadcastss 0x2aa39(%rip),%ymm8 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 196,193,100,93,216 ; vminps %ymm8,%ymm3,%ymm3
DB 197,252,93,195 ; vminps %ymm3,%ymm0,%ymm0
DB 197,244,93,203 ; vminps %ymm3,%ymm1,%ymm1
@@ -1351,7 +1351,7 @@ _sk_clamp_a_hsw LABEL PROC
PUBLIC _sk_clamp_a_dst_hsw
_sk_clamp_a_dst_hsw LABEL PROC
- DB 196,98,125,24,5,223,170,2,0 ; vbroadcastss 0x2aadf(%rip),%ymm8 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,98,125,24,5,27,170,2,0 ; vbroadcastss 0x2aa1b(%rip),%ymm8 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 196,193,68,93,248 ; vminps %ymm8,%ymm7,%ymm7
DB 197,220,93,231 ; vminps %ymm7,%ymm4,%ymm4
DB 197,212,93,239 ; vminps %ymm7,%ymm5,%ymm5
@@ -1378,7 +1378,7 @@ _sk_swap_rb_hsw LABEL PROC
PUBLIC _sk_invert_hsw
_sk_invert_hsw LABEL PROC
- DB 196,98,125,24,5,154,170,2,0 ; vbroadcastss 0x2aa9a(%rip),%ymm8 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,98,125,24,5,214,169,2,0 ; vbroadcastss 0x2a9d6(%rip),%ymm8 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 197,188,92,192 ; vsubps %ymm0,%ymm8,%ymm0
DB 197,188,92,201 ; vsubps %ymm1,%ymm8,%ymm1
DB 197,188,92,210 ; vsubps %ymm2,%ymm8,%ymm2
@@ -1424,7 +1424,7 @@ PUBLIC _sk_unpremul_hsw
_sk_unpremul_hsw LABEL PROC
DB 196,65,60,87,192 ; vxorps %ymm8,%ymm8,%ymm8
DB 196,65,100,194,200,0 ; vcmpeqps %ymm8,%ymm3,%ymm9
- DB 196,98,125,24,21,42,170,2,0 ; vbroadcastss 0x2aa2a(%rip),%ymm10 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,98,125,24,21,102,169,2,0 ; vbroadcastss 0x2a966(%rip),%ymm10 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 197,44,94,211 ; vdivps %ymm3,%ymm10,%ymm10
DB 196,67,45,74,192,144 ; vblendvps %ymm9,%ymm8,%ymm10,%ymm8
DB 197,188,89,192 ; vmulps %ymm0,%ymm8,%ymm0
@@ -1435,16 +1435,16 @@ _sk_unpremul_hsw LABEL PROC
PUBLIC _sk_from_srgb_hsw
_sk_from_srgb_hsw LABEL PROC
- DB 196,98,125,24,5,55,170,2,0 ; vbroadcastss 0x2aa37(%rip),%ymm8 # 2c114 <_sk_overlay_sse2_8bit+0x49f>
+ DB 196,98,125,24,5,115,169,2,0 ; vbroadcastss 0x2a973(%rip),%ymm8 # 2c050 <_sk_overlay_sse2_8bit+0x4a0>
DB 196,65,124,89,200 ; vmulps %ymm8,%ymm0,%ymm9
DB 197,124,89,208 ; vmulps %ymm0,%ymm0,%ymm10
- DB 196,98,125,24,29,41,170,2,0 ; vbroadcastss 0x2aa29(%rip),%ymm11 # 2c118 <_sk_overlay_sse2_8bit+0x4a3>
- DB 196,98,125,24,37,12,170,2,0 ; vbroadcastss 0x2aa0c(%rip),%ymm12 # 2c104 <_sk_overlay_sse2_8bit+0x48f>
+ DB 196,98,125,24,29,101,169,2,0 ; vbroadcastss 0x2a965(%rip),%ymm11 # 2c054 <_sk_overlay_sse2_8bit+0x4a4>
+ DB 196,98,125,24,37,72,169,2,0 ; vbroadcastss 0x2a948(%rip),%ymm12 # 2c040 <_sk_overlay_sse2_8bit+0x490>
DB 196,65,124,40,236 ; vmovaps %ymm12,%ymm13
DB 196,66,125,168,235 ; vfmadd213ps %ymm11,%ymm0,%ymm13
- DB 196,98,125,24,53,17,170,2,0 ; vbroadcastss 0x2aa11(%rip),%ymm14 # 2c11c <_sk_overlay_sse2_8bit+0x4a7>
+ DB 196,98,125,24,53,77,169,2,0 ; vbroadcastss 0x2a94d(%rip),%ymm14 # 2c058 <_sk_overlay_sse2_8bit+0x4a8>
DB 196,66,45,168,238 ; vfmadd213ps %ymm14,%ymm10,%ymm13
- DB 196,98,125,24,21,7,170,2,0 ; vbroadcastss 0x2aa07(%rip),%ymm10 # 2c120 <_sk_overlay_sse2_8bit+0x4ab>
+ DB 196,98,125,24,21,67,169,2,0 ; vbroadcastss 0x2a943(%rip),%ymm10 # 2c05c <_sk_overlay_sse2_8bit+0x4ac>
DB 196,193,124,194,194,1 ; vcmpltps %ymm10,%ymm0,%ymm0
DB 196,195,21,74,193,0 ; vblendvps %ymm0,%ymm9,%ymm13,%ymm0
DB 196,65,116,89,200 ; vmulps %ymm8,%ymm1,%ymm9
@@ -1465,16 +1465,16 @@ _sk_from_srgb_hsw LABEL PROC
PUBLIC _sk_from_srgb_dst_hsw
_sk_from_srgb_dst_hsw LABEL PROC
- DB 196,98,125,24,5,159,169,2,0 ; vbroadcastss 0x2a99f(%rip),%ymm8 # 2c114 <_sk_overlay_sse2_8bit+0x49f>
+ DB 196,98,125,24,5,219,168,2,0 ; vbroadcastss 0x2a8db(%rip),%ymm8 # 2c050 <_sk_overlay_sse2_8bit+0x4a0>
DB 196,65,92,89,200 ; vmulps %ymm8,%ymm4,%ymm9
DB 197,92,89,212 ; vmulps %ymm4,%ymm4,%ymm10
- DB 196,98,125,24,29,145,169,2,0 ; vbroadcastss 0x2a991(%rip),%ymm11 # 2c118 <_sk_overlay_sse2_8bit+0x4a3>
- DB 196,98,125,24,37,116,169,2,0 ; vbroadcastss 0x2a974(%rip),%ymm12 # 2c104 <_sk_overlay_sse2_8bit+0x48f>
+ DB 196,98,125,24,29,205,168,2,0 ; vbroadcastss 0x2a8cd(%rip),%ymm11 # 2c054 <_sk_overlay_sse2_8bit+0x4a4>
+ DB 196,98,125,24,37,176,168,2,0 ; vbroadcastss 0x2a8b0(%rip),%ymm12 # 2c040 <_sk_overlay_sse2_8bit+0x490>
DB 196,65,124,40,236 ; vmovaps %ymm12,%ymm13
DB 196,66,93,168,235 ; vfmadd213ps %ymm11,%ymm4,%ymm13
- DB 196,98,125,24,53,121,169,2,0 ; vbroadcastss 0x2a979(%rip),%ymm14 # 2c11c <_sk_overlay_sse2_8bit+0x4a7>
+ DB 196,98,125,24,53,181,168,2,0 ; vbroadcastss 0x2a8b5(%rip),%ymm14 # 2c058 <_sk_overlay_sse2_8bit+0x4a8>
DB 196,66,45,168,238 ; vfmadd213ps %ymm14,%ymm10,%ymm13
- DB 196,98,125,24,21,111,169,2,0 ; vbroadcastss 0x2a96f(%rip),%ymm10 # 2c120 <_sk_overlay_sse2_8bit+0x4ab>
+ DB 196,98,125,24,21,171,168,2,0 ; vbroadcastss 0x2a8ab(%rip),%ymm10 # 2c05c <_sk_overlay_sse2_8bit+0x4ac>
DB 196,193,92,194,226,1 ; vcmpltps %ymm10,%ymm4,%ymm4
DB 196,195,21,74,225,64 ; vblendvps %ymm4,%ymm9,%ymm13,%ymm4
DB 196,65,84,89,200 ; vmulps %ymm8,%ymm5,%ymm9
@@ -1496,19 +1496,19 @@ _sk_from_srgb_dst_hsw LABEL PROC
PUBLIC _sk_to_srgb_hsw
_sk_to_srgb_hsw LABEL PROC
DB 197,124,82,200 ; vrsqrtps %ymm0,%ymm9
- DB 196,98,125,24,5,19,169,2,0 ; vbroadcastss 0x2a913(%rip),%ymm8 # 2c124 <_sk_overlay_sse2_8bit+0x4af>
+ DB 196,98,125,24,5,79,168,2,0 ; vbroadcastss 0x2a84f(%rip),%ymm8 # 2c060 <_sk_overlay_sse2_8bit+0x4b0>
DB 196,65,124,89,208 ; vmulps %ymm8,%ymm0,%ymm10
- DB 196,98,125,24,29,9,169,2,0 ; vbroadcastss 0x2a909(%rip),%ymm11 # 2c128 <_sk_overlay_sse2_8bit+0x4b3>
- DB 196,98,125,24,37,4,169,2,0 ; vbroadcastss 0x2a904(%rip),%ymm12 # 2c12c <_sk_overlay_sse2_8bit+0x4b7>
+ DB 196,98,125,24,29,69,168,2,0 ; vbroadcastss 0x2a845(%rip),%ymm11 # 2c064 <_sk_overlay_sse2_8bit+0x4b4>
+ DB 196,98,125,24,37,64,168,2,0 ; vbroadcastss 0x2a840(%rip),%ymm12 # 2c068 <_sk_overlay_sse2_8bit+0x4b8>
DB 196,65,124,40,236 ; vmovaps %ymm12,%ymm13
DB 196,66,53,168,235 ; vfmadd213ps %ymm11,%ymm9,%ymm13
- DB 196,98,125,24,53,245,168,2,0 ; vbroadcastss 0x2a8f5(%rip),%ymm14 # 2c130 <_sk_overlay_sse2_8bit+0x4bb>
+ DB 196,98,125,24,53,49,168,2,0 ; vbroadcastss 0x2a831(%rip),%ymm14 # 2c06c <_sk_overlay_sse2_8bit+0x4bc>
DB 196,66,53,168,238 ; vfmadd213ps %ymm14,%ymm9,%ymm13
- DB 196,98,125,24,61,235,168,2,0 ; vbroadcastss 0x2a8eb(%rip),%ymm15 # 2c134 <_sk_overlay_sse2_8bit+0x4bf>
+ DB 196,98,125,24,61,39,168,2,0 ; vbroadcastss 0x2a827(%rip),%ymm15 # 2c070 <_sk_overlay_sse2_8bit+0x4c0>
DB 196,65,52,88,207 ; vaddps %ymm15,%ymm9,%ymm9
DB 196,65,124,83,201 ; vrcpps %ymm9,%ymm9
DB 196,65,20,89,201 ; vmulps %ymm9,%ymm13,%ymm9
- DB 196,98,125,24,45,215,168,2,0 ; vbroadcastss 0x2a8d7(%rip),%ymm13 # 2c138 <_sk_overlay_sse2_8bit+0x4c3>
+ DB 196,98,125,24,45,19,168,2,0 ; vbroadcastss 0x2a813(%rip),%ymm13 # 2c074 <_sk_overlay_sse2_8bit+0x4c4>
DB 196,193,124,194,197,1 ; vcmpltps %ymm13,%ymm0,%ymm0
DB 196,195,53,74,194,0 ; vblendvps %ymm0,%ymm10,%ymm9,%ymm0
DB 197,124,82,201 ; vrsqrtps %ymm1,%ymm9
@@ -1540,26 +1540,26 @@ _sk_rgb_to_hsl_hsw LABEL PROC
DB 197,116,93,202 ; vminps %ymm2,%ymm1,%ymm9
DB 196,65,124,93,201 ; vminps %ymm9,%ymm0,%ymm9
DB 196,65,60,92,209 ; vsubps %ymm9,%ymm8,%ymm10
- DB 196,98,125,24,29,242,167,2,0 ; vbroadcastss 0x2a7f2(%rip),%ymm11 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,98,125,24,29,46,167,2,0 ; vbroadcastss 0x2a72e(%rip),%ymm11 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 196,65,36,94,218 ; vdivps %ymm10,%ymm11,%ymm11
DB 197,116,92,226 ; vsubps %ymm2,%ymm1,%ymm12
DB 197,116,194,234,1 ; vcmpltps %ymm2,%ymm1,%ymm13
- DB 196,98,125,24,53,51,168,2,0 ; vbroadcastss 0x2a833(%rip),%ymm14 # 2c13c <_sk_overlay_sse2_8bit+0x4c7>
+ DB 196,98,125,24,53,111,167,2,0 ; vbroadcastss 0x2a76f(%rip),%ymm14 # 2c078 <_sk_overlay_sse2_8bit+0x4c8>
DB 196,65,4,87,255 ; vxorps %ymm15,%ymm15,%ymm15
DB 196,67,5,74,238,208 ; vblendvps %ymm13,%ymm14,%ymm15,%ymm13
DB 196,66,37,168,229 ; vfmadd213ps %ymm13,%ymm11,%ymm12
DB 197,236,92,208 ; vsubps %ymm0,%ymm2,%ymm2
DB 197,124,92,233 ; vsubps %ymm1,%ymm0,%ymm13
- DB 196,98,125,24,53,26,168,2,0 ; vbroadcastss 0x2a81a(%rip),%ymm14 # 2c144 <_sk_overlay_sse2_8bit+0x4cf>
+ DB 196,98,125,24,53,86,167,2,0 ; vbroadcastss 0x2a756(%rip),%ymm14 # 2c080 <_sk_overlay_sse2_8bit+0x4d0>
DB 196,66,37,168,238 ; vfmadd213ps %ymm14,%ymm11,%ymm13
- DB 196,98,125,24,53,8,168,2,0 ; vbroadcastss 0x2a808(%rip),%ymm14 # 2c140 <_sk_overlay_sse2_8bit+0x4cb>
+ DB 196,98,125,24,53,68,167,2,0 ; vbroadcastss 0x2a744(%rip),%ymm14 # 2c07c <_sk_overlay_sse2_8bit+0x4cc>
DB 196,194,37,168,214 ; vfmadd213ps %ymm14,%ymm11,%ymm2
DB 197,188,194,201,0 ; vcmpeqps %ymm1,%ymm8,%ymm1
DB 196,227,21,74,202,16 ; vblendvps %ymm1,%ymm2,%ymm13,%ymm1
DB 197,188,194,192,0 ; vcmpeqps %ymm0,%ymm8,%ymm0
DB 196,195,117,74,196,0 ; vblendvps %ymm0,%ymm12,%ymm1,%ymm0
DB 196,193,60,88,201 ; vaddps %ymm9,%ymm8,%ymm1
- DB 196,98,125,24,29,127,167,2,0 ; vbroadcastss 0x2a77f(%rip),%ymm11 # 2c0e0 <_sk_overlay_sse2_8bit+0x46b>
+ DB 196,98,125,24,29,187,166,2,0 ; vbroadcastss 0x2a6bb(%rip),%ymm11 # 2c01c <_sk_overlay_sse2_8bit+0x46c>
DB 196,193,116,89,211 ; vmulps %ymm11,%ymm1,%ymm2
DB 197,36,194,218,1 ; vcmpltps %ymm2,%ymm11,%ymm11
DB 196,65,12,92,224 ; vsubps %ymm8,%ymm14,%ymm12
@@ -1569,7 +1569,7 @@ _sk_rgb_to_hsl_hsw LABEL PROC
DB 197,172,94,201 ; vdivps %ymm1,%ymm10,%ymm1
DB 196,195,125,74,199,128 ; vblendvps %ymm8,%ymm15,%ymm0,%ymm0
DB 196,195,117,74,207,128 ; vblendvps %ymm8,%ymm15,%ymm1,%ymm1
- DB 196,98,125,24,5,174,167,2,0 ; vbroadcastss 0x2a7ae(%rip),%ymm8 # 2c148 <_sk_overlay_sse2_8bit+0x4d3>
+ DB 196,98,125,24,5,234,166,2,0 ; vbroadcastss 0x2a6ea(%rip),%ymm8 # 2c084 <_sk_overlay_sse2_8bit+0x4d4>
DB 196,193,124,89,192 ; vmulps %ymm8,%ymm0,%ymm0
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
@@ -1584,30 +1584,30 @@ _sk_hsl_to_rgb_hsw LABEL PROC
DB 197,252,17,28,36 ; vmovups %ymm3,(%rsp)
DB 197,252,40,233 ; vmovaps %ymm1,%ymm5
DB 197,252,40,224 ; vmovaps %ymm0,%ymm4
- DB 196,98,125,24,5,5,167,2,0 ; vbroadcastss 0x2a705(%rip),%ymm8 # 2c0e0 <_sk_overlay_sse2_8bit+0x46b>
+ DB 196,98,125,24,5,65,166,2,0 ; vbroadcastss 0x2a641(%rip),%ymm8 # 2c01c <_sk_overlay_sse2_8bit+0x46c>
DB 197,60,194,202,2 ; vcmpleps %ymm2,%ymm8,%ymm9
DB 197,84,89,210 ; vmulps %ymm2,%ymm5,%ymm10
DB 196,65,84,92,218 ; vsubps %ymm10,%ymm5,%ymm11
DB 196,67,45,74,203,144 ; vblendvps %ymm9,%ymm11,%ymm10,%ymm9
DB 197,52,88,210 ; vaddps %ymm2,%ymm9,%ymm10
- DB 196,98,125,24,13,68,167,2,0 ; vbroadcastss 0x2a744(%rip),%ymm9 # 2c140 <_sk_overlay_sse2_8bit+0x4cb>
+ DB 196,98,125,24,13,128,166,2,0 ; vbroadcastss 0x2a680(%rip),%ymm9 # 2c07c <_sk_overlay_sse2_8bit+0x4cc>
DB 196,66,109,170,202 ; vfmsub213ps %ymm10,%ymm2,%ymm9
- DB 196,98,125,24,29,66,167,2,0 ; vbroadcastss 0x2a742(%rip),%ymm11 # 2c14c <_sk_overlay_sse2_8bit+0x4d7>
+ DB 196,98,125,24,29,126,166,2,0 ; vbroadcastss 0x2a67e(%rip),%ymm11 # 2c088 <_sk_overlay_sse2_8bit+0x4d8>
DB 196,65,92,88,219 ; vaddps %ymm11,%ymm4,%ymm11
DB 196,67,125,8,227,1 ; vroundps $0x1,%ymm11,%ymm12
DB 196,65,36,92,252 ; vsubps %ymm12,%ymm11,%ymm15
DB 196,65,44,92,217 ; vsubps %ymm9,%ymm10,%ymm11
- DB 196,98,125,24,45,20,167,2,0 ; vbroadcastss 0x2a714(%rip),%ymm13 # 2c13c <_sk_overlay_sse2_8bit+0x4c7>
+ DB 196,98,125,24,45,80,166,2,0 ; vbroadcastss 0x2a650(%rip),%ymm13 # 2c078 <_sk_overlay_sse2_8bit+0x4c8>
DB 196,193,4,89,197 ; vmulps %ymm13,%ymm15,%ymm0
- DB 196,98,125,24,53,14,167,2,0 ; vbroadcastss 0x2a70e(%rip),%ymm14 # 2c144 <_sk_overlay_sse2_8bit+0x4cf>
+ DB 196,98,125,24,53,74,166,2,0 ; vbroadcastss 0x2a64a(%rip),%ymm14 # 2c080 <_sk_overlay_sse2_8bit+0x4d0>
DB 197,12,92,224 ; vsubps %ymm0,%ymm14,%ymm12
DB 196,66,37,168,225 ; vfmadd213ps %ymm9,%ymm11,%ymm12
- DB 196,226,125,24,29,8,167,2,0 ; vbroadcastss 0x2a708(%rip),%ymm3 # 2c150 <_sk_overlay_sse2_8bit+0x4db>
+ DB 196,226,125,24,29,68,166,2,0 ; vbroadcastss 0x2a644(%rip),%ymm3 # 2c08c <_sk_overlay_sse2_8bit+0x4dc>
DB 196,193,100,194,255,2 ; vcmpleps %ymm15,%ymm3,%ymm7
DB 196,195,29,74,249,112 ; vblendvps %ymm7,%ymm9,%ymm12,%ymm7
DB 196,65,60,194,231,2 ; vcmpleps %ymm15,%ymm8,%ymm12
DB 196,227,45,74,255,192 ; vblendvps %ymm12,%ymm7,%ymm10,%ymm7
- DB 196,98,125,24,37,223,166,2,0 ; vbroadcastss 0x2a6df(%rip),%ymm12 # 2c148 <_sk_overlay_sse2_8bit+0x4d3>
+ DB 196,98,125,24,37,27,166,2,0 ; vbroadcastss 0x2a61b(%rip),%ymm12 # 2c084 <_sk_overlay_sse2_8bit+0x4d4>
DB 196,65,28,194,255,2 ; vcmpleps %ymm15,%ymm12,%ymm15
DB 196,194,37,168,193 ; vfmadd213ps %ymm9,%ymm11,%ymm0
DB 196,99,125,74,255,240 ; vblendvps %ymm15,%ymm7,%ymm0,%ymm15
@@ -1623,7 +1623,7 @@ _sk_hsl_to_rgb_hsw LABEL PROC
DB 197,156,194,192,2 ; vcmpleps %ymm0,%ymm12,%ymm0
DB 196,194,37,168,249 ; vfmadd213ps %ymm9,%ymm11,%ymm7
DB 196,227,69,74,201,0 ; vblendvps %ymm0,%ymm1,%ymm7,%ymm1
- DB 196,226,125,24,5,147,166,2,0 ; vbroadcastss 0x2a693(%rip),%ymm0 # 2c154 <_sk_overlay_sse2_8bit+0x4df>
+ DB 196,226,125,24,5,207,165,2,0 ; vbroadcastss 0x2a5cf(%rip),%ymm0 # 2c090 <_sk_overlay_sse2_8bit+0x4e0>
DB 197,220,88,192 ; vaddps %ymm0,%ymm4,%ymm0
DB 196,227,125,8,224,1 ; vroundps $0x1,%ymm0,%ymm4
DB 197,252,92,196 ; vsubps %ymm4,%ymm0,%ymm0
@@ -1673,10 +1673,10 @@ _sk_scale_u8_hsw LABEL PROC
DB 72,133,255 ; test %rdi,%rdi
DB 117,58 ; jne 1bb6 <_sk_scale_u8_hsw+0x52>
DB 196,2,121,48,4,24 ; vpmovzxbw (%r8,%r11,1),%xmm8
- DB 197,57,219,5,70,175,2,0 ; vpand 0x2af46(%rip),%xmm8,%xmm8 # 2cad0 <_sk_overlay_sse2_8bit+0xe5b>
+ DB 197,57,219,5,134,174,2,0 ; vpand 0x2ae86(%rip),%xmm8,%xmm8 # 2ca10 <_sk_overlay_sse2_8bit+0xe60>
DB 196,66,125,51,192 ; vpmovzxwd %xmm8,%ymm8
DB 196,65,124,91,192 ; vcvtdq2ps %ymm8,%ymm8
- DB 196,98,125,24,13,187,165,2,0 ; vbroadcastss 0x2a5bb(%rip),%ymm9 # 2c158 <_sk_overlay_sse2_8bit+0x4e3>
+ DB 196,98,125,24,13,247,164,2,0 ; vbroadcastss 0x2a4f7(%rip),%ymm9 # 2c094 <_sk_overlay_sse2_8bit+0x4e4>
DB 196,65,60,89,193 ; vmulps %ymm9,%ymm8,%ymm8
DB 197,188,89,192 ; vmulps %ymm0,%ymm8,%ymm0
DB 197,188,89,201 ; vmulps %ymm1,%ymm8,%ymm1
@@ -1725,7 +1725,7 @@ _sk_scale_u8_hsw LABEL PROC
DB 255 ; (bad)
DB 255 ; (bad)
DB 255 ; (bad)
- DB 233,255,255,255,222 ; jmpq ffffffffdf001c60 <_sk_overlay_sse2_8bit+0xffffffffdefd5feb>
+ DB 233,255,255,255,222 ; jmpq ffffffffdf001c60 <_sk_overlay_sse2_8bit+0xffffffffdefd60b0>
DB 255 ; (bad)
DB 255 ; (bad)
DB 255,211 ; callq *%rbx
@@ -1749,20 +1749,20 @@ _sk_scale_565_hsw LABEL PROC
DB 15,133,161,0,0,0 ; jne 1d2c <_sk_scale_565_hsw+0xc0>
DB 196,1,122,111,4,88 ; vmovdqu (%r8,%r11,2),%xmm8
DB 196,66,125,51,192 ; vpmovzxwd %xmm8,%ymm8
- DB 196,98,125,88,13,189,164,2,0 ; vpbroadcastd 0x2a4bd(%rip),%ymm9 # 2c15c <_sk_overlay_sse2_8bit+0x4e7>
+ DB 196,98,125,88,13,249,163,2,0 ; vpbroadcastd 0x2a3f9(%rip),%ymm9 # 2c098 <_sk_overlay_sse2_8bit+0x4e8>
DB 196,65,61,219,201 ; vpand %ymm9,%ymm8,%ymm9
DB 196,65,124,91,201 ; vcvtdq2ps %ymm9,%ymm9
- DB 196,98,125,24,21,174,164,2,0 ; vbroadcastss 0x2a4ae(%rip),%ymm10 # 2c160 <_sk_overlay_sse2_8bit+0x4eb>
+ DB 196,98,125,24,21,234,163,2,0 ; vbroadcastss 0x2a3ea(%rip),%ymm10 # 2c09c <_sk_overlay_sse2_8bit+0x4ec>
DB 196,65,52,89,202 ; vmulps %ymm10,%ymm9,%ymm9
- DB 196,98,125,88,21,164,164,2,0 ; vpbroadcastd 0x2a4a4(%rip),%ymm10 # 2c164 <_sk_overlay_sse2_8bit+0x4ef>
+ DB 196,98,125,88,21,224,163,2,0 ; vpbroadcastd 0x2a3e0(%rip),%ymm10 # 2c0a0 <_sk_overlay_sse2_8bit+0x4f0>
DB 196,65,61,219,210 ; vpand %ymm10,%ymm8,%ymm10
DB 196,65,124,91,210 ; vcvtdq2ps %ymm10,%ymm10
- DB 196,98,125,24,29,149,164,2,0 ; vbroadcastss 0x2a495(%rip),%ymm11 # 2c168 <_sk_overlay_sse2_8bit+0x4f3>
+ DB 196,98,125,24,29,209,163,2,0 ; vbroadcastss 0x2a3d1(%rip),%ymm11 # 2c0a4 <_sk_overlay_sse2_8bit+0x4f4>
DB 196,65,44,89,211 ; vmulps %ymm11,%ymm10,%ymm10
- DB 196,98,125,88,29,139,164,2,0 ; vpbroadcastd 0x2a48b(%rip),%ymm11 # 2c16c <_sk_overlay_sse2_8bit+0x4f7>
+ DB 196,98,125,88,29,199,163,2,0 ; vpbroadcastd 0x2a3c7(%rip),%ymm11 # 2c0a8 <_sk_overlay_sse2_8bit+0x4f8>
DB 196,65,61,219,195 ; vpand %ymm11,%ymm8,%ymm8
DB 196,65,124,91,192 ; vcvtdq2ps %ymm8,%ymm8
- DB 196,98,125,24,29,124,164,2,0 ; vbroadcastss 0x2a47c(%rip),%ymm11 # 2c170 <_sk_overlay_sse2_8bit+0x4fb>
+ DB 196,98,125,24,29,184,163,2,0 ; vbroadcastss 0x2a3b8(%rip),%ymm11 # 2c0ac <_sk_overlay_sse2_8bit+0x4fc>
DB 196,65,60,89,195 ; vmulps %ymm11,%ymm8,%ymm8
DB 197,100,194,223,1 ; vcmpltps %ymm7,%ymm3,%ymm11
DB 196,65,44,93,224 ; vminps %ymm8,%ymm10,%ymm12
@@ -1849,10 +1849,10 @@ _sk_lerp_u8_hsw LABEL PROC
DB 72,133,255 ; test %rdi,%rdi
DB 117,78 ; jne 1e65 <_sk_lerp_u8_hsw+0x66>
DB 196,2,121,48,4,24 ; vpmovzxbw (%r8,%r11,1),%xmm8
- DB 197,57,219,5,171,172,2,0 ; vpand 0x2acab(%rip),%xmm8,%xmm8 # 2cad0 <_sk_overlay_sse2_8bit+0xe5b>
+ DB 197,57,219,5,235,171,2,0 ; vpand 0x2abeb(%rip),%xmm8,%xmm8 # 2ca10 <_sk_overlay_sse2_8bit+0xe60>
DB 196,66,125,51,192 ; vpmovzxwd %xmm8,%ymm8
DB 196,65,124,91,192 ; vcvtdq2ps %ymm8,%ymm8
- DB 196,98,125,24,13,32,163,2,0 ; vbroadcastss 0x2a320(%rip),%ymm9 # 2c158 <_sk_overlay_sse2_8bit+0x4e3>
+ DB 196,98,125,24,13,92,162,2,0 ; vbroadcastss 0x2a25c(%rip),%ymm9 # 2c094 <_sk_overlay_sse2_8bit+0x4e4>
DB 196,65,60,89,193 ; vmulps %ymm9,%ymm8,%ymm8
DB 197,252,92,196 ; vsubps %ymm4,%ymm0,%ymm0
DB 196,226,61,168,196 ; vfmadd213ps %ymm4,%ymm8,%ymm0
@@ -1904,7 +1904,7 @@ _sk_lerp_u8_hsw LABEL PROC
DB 255 ; (bad)
DB 255 ; (bad)
DB 255 ; (bad)
- DB 232,255,255,255,221 ; callq ffffffffde001f10 <_sk_overlay_sse2_8bit+0xffffffffddfd629b>
+ DB 232,255,255,255,221 ; callq ffffffffde001f10 <_sk_overlay_sse2_8bit+0xffffffffddfd6360>
DB 255 ; (bad)
DB 255 ; (bad)
DB 255,210 ; callq *%rdx
@@ -1928,20 +1928,20 @@ _sk_lerp_565_hsw LABEL PROC
DB 15,133,181,0,0,0 ; jne 1ff0 <_sk_lerp_565_hsw+0xd4>
DB 196,1,122,111,4,88 ; vmovdqu (%r8,%r11,2),%xmm8
DB 196,66,125,51,192 ; vpmovzxwd %xmm8,%ymm8
- DB 196,98,125,88,13,13,162,2,0 ; vpbroadcastd 0x2a20d(%rip),%ymm9 # 2c15c <_sk_overlay_sse2_8bit+0x4e7>
+ DB 196,98,125,88,13,73,161,2,0 ; vpbroadcastd 0x2a149(%rip),%ymm9 # 2c098 <_sk_overlay_sse2_8bit+0x4e8>
DB 196,65,61,219,201 ; vpand %ymm9,%ymm8,%ymm9
DB 196,65,124,91,201 ; vcvtdq2ps %ymm9,%ymm9
- DB 196,98,125,24,21,254,161,2,0 ; vbroadcastss 0x2a1fe(%rip),%ymm10 # 2c160 <_sk_overlay_sse2_8bit+0x4eb>
+ DB 196,98,125,24,21,58,161,2,0 ; vbroadcastss 0x2a13a(%rip),%ymm10 # 2c09c <_sk_overlay_sse2_8bit+0x4ec>
DB 196,65,52,89,202 ; vmulps %ymm10,%ymm9,%ymm9
- DB 196,98,125,88,21,244,161,2,0 ; vpbroadcastd 0x2a1f4(%rip),%ymm10 # 2c164 <_sk_overlay_sse2_8bit+0x4ef>
+ DB 196,98,125,88,21,48,161,2,0 ; vpbroadcastd 0x2a130(%rip),%ymm10 # 2c0a0 <_sk_overlay_sse2_8bit+0x4f0>
DB 196,65,61,219,210 ; vpand %ymm10,%ymm8,%ymm10
DB 196,65,124,91,210 ; vcvtdq2ps %ymm10,%ymm10
- DB 196,98,125,24,29,229,161,2,0 ; vbroadcastss 0x2a1e5(%rip),%ymm11 # 2c168 <_sk_overlay_sse2_8bit+0x4f3>
+ DB 196,98,125,24,29,33,161,2,0 ; vbroadcastss 0x2a121(%rip),%ymm11 # 2c0a4 <_sk_overlay_sse2_8bit+0x4f4>
DB 196,65,44,89,211 ; vmulps %ymm11,%ymm10,%ymm10
- DB 196,98,125,88,29,219,161,2,0 ; vpbroadcastd 0x2a1db(%rip),%ymm11 # 2c16c <_sk_overlay_sse2_8bit+0x4f7>
+ DB 196,98,125,88,29,23,161,2,0 ; vpbroadcastd 0x2a117(%rip),%ymm11 # 2c0a8 <_sk_overlay_sse2_8bit+0x4f8>
DB 196,65,61,219,195 ; vpand %ymm11,%ymm8,%ymm8
DB 196,65,124,91,192 ; vcvtdq2ps %ymm8,%ymm8
- DB 196,98,125,24,29,204,161,2,0 ; vbroadcastss 0x2a1cc(%rip),%ymm11 # 2c170 <_sk_overlay_sse2_8bit+0x4fb>
+ DB 196,98,125,24,29,8,161,2,0 ; vbroadcastss 0x2a108(%rip),%ymm11 # 2c0ac <_sk_overlay_sse2_8bit+0x4fc>
DB 196,65,60,89,195 ; vmulps %ymm11,%ymm8,%ymm8
DB 197,100,194,223,1 ; vcmpltps %ymm7,%ymm3,%ymm11
DB 196,65,44,93,224 ; vminps %ymm8,%ymm10,%ymm12
@@ -2013,21 +2013,21 @@ _sk_load_tables_hsw LABEL PROC
DB 72,133,255 ; test %rdi,%rdi
DB 117,103 ; jne 2105 <_sk_load_tables_hsw+0x71>
DB 196,193,126,111,28,144 ; vmovdqu (%r8,%rdx,4),%ymm3
- DB 197,229,219,13,116,162,2,0 ; vpand 0x2a274(%rip),%ymm3,%ymm1 # 2c320 <_sk_overlay_sse2_8bit+0x6ab>
+ DB 197,229,219,13,180,161,2,0 ; vpand 0x2a1b4(%rip),%ymm3,%ymm1 # 2c260 <_sk_overlay_sse2_8bit+0x6b0>
DB 196,65,61,118,192 ; vpcmpeqd %ymm8,%ymm8,%ymm8
DB 76,139,64,8 ; mov 0x8(%rax),%r8
DB 76,139,72,16 ; mov 0x10(%rax),%r9
DB 197,237,118,210 ; vpcmpeqd %ymm2,%ymm2,%ymm2
DB 196,194,109,146,4,136 ; vgatherdps %ymm2,(%r8,%ymm1,4),%ymm0
- DB 196,226,101,0,21,116,162,2,0 ; vpshufb 0x2a274(%rip),%ymm3,%ymm2 # 2c340 <_sk_overlay_sse2_8bit+0x6cb>
+ DB 196,226,101,0,21,180,161,2,0 ; vpshufb 0x2a1b4(%rip),%ymm3,%ymm2 # 2c280 <_sk_overlay_sse2_8bit+0x6d0>
DB 196,65,53,118,201 ; vpcmpeqd %ymm9,%ymm9,%ymm9
DB 196,194,53,146,12,145 ; vgatherdps %ymm9,(%r9,%ymm2,4),%ymm1
DB 72,139,64,24 ; mov 0x18(%rax),%rax
- DB 196,98,101,0,13,124,162,2,0 ; vpshufb 0x2a27c(%rip),%ymm3,%ymm9 # 2c360 <_sk_overlay_sse2_8bit+0x6eb>
+ DB 196,98,101,0,13,188,161,2,0 ; vpshufb 0x2a1bc(%rip),%ymm3,%ymm9 # 2c2a0 <_sk_overlay_sse2_8bit+0x6f0>
DB 196,162,61,146,20,136 ; vgatherdps %ymm8,(%rax,%ymm9,4),%ymm2
DB 197,229,114,211,24 ; vpsrld $0x18,%ymm3,%ymm3
DB 197,252,91,219 ; vcvtdq2ps %ymm3,%ymm3
- DB 196,98,125,24,5,92,160,2,0 ; vbroadcastss 0x2a05c(%rip),%ymm8 # 2c158 <_sk_overlay_sse2_8bit+0x4e3>
+ DB 196,98,125,24,5,152,159,2,0 ; vbroadcastss 0x29f98(%rip),%ymm8 # 2c094 <_sk_overlay_sse2_8bit+0x4e4>
DB 196,193,100,89,216 ; vmulps %ymm8,%ymm3,%ymm3
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
@@ -2107,7 +2107,7 @@ _sk_load_tables_u16_be_hsw LABEL PROC
DB 197,185,108,200 ; vpunpcklqdq %xmm0,%xmm8,%xmm1
DB 197,185,109,208 ; vpunpckhqdq %xmm0,%xmm8,%xmm2
DB 197,49,108,195 ; vpunpcklqdq %xmm3,%xmm9,%xmm8
- DB 197,121,111,21,157,168,2,0 ; vmovdqa 0x2a89d(%rip),%xmm10 # 2cad0 <_sk_overlay_sse2_8bit+0xe5b>
+ DB 197,121,111,21,221,167,2,0 ; vmovdqa 0x2a7dd(%rip),%xmm10 # 2ca10 <_sk_overlay_sse2_8bit+0xe60>
DB 196,193,113,219,194 ; vpand %xmm10,%xmm1,%xmm0
DB 196,226,125,51,200 ; vpmovzxwd %xmm0,%ymm1
DB 196,65,37,118,219 ; vpcmpeqd %ymm11,%ymm11,%ymm11
@@ -2129,7 +2129,7 @@ _sk_load_tables_u16_be_hsw LABEL PROC
DB 197,185,235,219 ; vpor %xmm3,%xmm8,%xmm3
DB 196,226,125,51,219 ; vpmovzxwd %xmm3,%ymm3
DB 197,252,91,219 ; vcvtdq2ps %ymm3,%ymm3
- DB 196,98,125,24,5,210,158,2,0 ; vbroadcastss 0x29ed2(%rip),%ymm8 # 2c174 <_sk_overlay_sse2_8bit+0x4ff>
+ DB 196,98,125,24,5,14,158,2,0 ; vbroadcastss 0x29e0e(%rip),%ymm8 # 2c0b0 <_sk_overlay_sse2_8bit+0x500>
DB 196,193,100,89,216 ; vmulps %ymm8,%ymm3,%ymm3
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
@@ -2187,7 +2187,7 @@ _sk_load_tables_rgb_u16_be_hsw LABEL PROC
DB 197,185,108,211 ; vpunpcklqdq %xmm3,%xmm8,%xmm2
DB 197,185,109,219 ; vpunpckhqdq %xmm3,%xmm8,%xmm3
DB 197,113,108,192 ; vpunpcklqdq %xmm0,%xmm1,%xmm8
- DB 197,121,111,13,44,167,2,0 ; vmovdqa 0x2a72c(%rip),%xmm9 # 2cad0 <_sk_overlay_sse2_8bit+0xe5b>
+ DB 197,121,111,13,108,166,2,0 ; vmovdqa 0x2a66c(%rip),%xmm9 # 2ca10 <_sk_overlay_sse2_8bit+0xe60>
DB 196,193,105,219,193 ; vpand %xmm9,%xmm2,%xmm0
DB 196,226,125,51,200 ; vpmovzxwd %xmm0,%ymm1
DB 196,65,45,118,210 ; vpcmpeqd %ymm10,%ymm10,%ymm10
@@ -2204,7 +2204,7 @@ _sk_load_tables_rgb_u16_be_hsw LABEL PROC
DB 196,226,125,51,218 ; vpmovzxwd %xmm2,%ymm3
DB 196,226,45,146,20,152 ; vgatherdps %ymm10,(%rax,%ymm3,4),%ymm2
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,29,236,156,2,0 ; vbroadcastss 0x29cec(%rip),%ymm3 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,226,125,24,29,40,156,2,0 ; vbroadcastss 0x29c28(%rip),%ymm3 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 255,224 ; jmpq *%rax
DB 196,129,121,110,4,72 ; vmovd (%r8,%r9,2),%xmm0
DB 196,1,121,196,92,72,4,2 ; vpinsrw $0x2,0x4(%r8,%r9,2),%xmm0,%xmm11
@@ -2271,7 +2271,7 @@ _sk_load_tables_rgb_u16_be_hsw LABEL PROC
PUBLIC _sk_byte_tables_hsw
_sk_byte_tables_hsw LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,98,125,24,5,220,155,2,0 ; vbroadcastss 0x29bdc(%rip),%ymm8 # 2c110 <_sk_overlay_sse2_8bit+0x49b>
+ DB 196,98,125,24,5,24,155,2,0 ; vbroadcastss 0x29b18(%rip),%ymm8 # 2c04c <_sk_overlay_sse2_8bit+0x49c>
DB 196,193,124,89,192 ; vmulps %ymm8,%ymm0,%ymm0
DB 197,125,91,200 ; vcvtps2dq %ymm0,%ymm9
DB 196,65,249,126,200 ; vmovq %xmm9,%r8
@@ -2393,7 +2393,7 @@ _sk_byte_tables_hsw LABEL PROC
DB 67,15,182,4,17 ; movzbl (%r9,%r10,1),%eax
DB 196,194,125,49,193 ; vpmovzxbd %xmm9,%ymm0
DB 197,252,91,192 ; vcvtdq2ps %ymm0,%ymm0
- DB 196,98,125,24,5,197,153,2,0 ; vbroadcastss 0x299c5(%rip),%ymm8 # 2c158 <_sk_overlay_sse2_8bit+0x4e3>
+ DB 196,98,125,24,5,1,153,2,0 ; vbroadcastss 0x29901(%rip),%ymm8 # 2c094 <_sk_overlay_sse2_8bit+0x4e4>
DB 196,193,124,89,192 ; vmulps %ymm8,%ymm0,%ymm0
DB 196,226,125,49,201 ; vpmovzxbd %xmm1,%ymm1
DB 197,252,91,201 ; vcvtdq2ps %ymm1,%ymm1
@@ -2507,7 +2507,7 @@ _sk_byte_tables_rgb_hsw LABEL PROC
DB 67,15,182,4,17 ; movzbl (%r9,%r10,1),%eax
DB 196,194,125,49,193 ; vpmovzxbd %xmm9,%ymm0
DB 197,252,91,192 ; vcvtdq2ps %ymm0,%ymm0
- DB 196,98,125,24,5,173,151,2,0 ; vbroadcastss 0x297ad(%rip),%ymm8 # 2c158 <_sk_overlay_sse2_8bit+0x4e3>
+ DB 196,98,125,24,5,233,150,2,0 ; vbroadcastss 0x296e9(%rip),%ymm8 # 2c094 <_sk_overlay_sse2_8bit+0x4e4>
DB 196,193,124,89,192 ; vmulps %ymm8,%ymm0,%ymm0
DB 196,226,125,49,201 ; vpmovzxbd %xmm1,%ymm1
DB 197,252,91,201 ; vcvtdq2ps %ymm1,%ymm1
@@ -2596,33 +2596,33 @@ _sk_parametric_r_hsw LABEL PROC
DB 196,66,125,168,211 ; vfmadd213ps %ymm11,%ymm0,%ymm10
DB 196,226,125,24,0 ; vbroadcastss (%rax),%ymm0
DB 196,65,124,91,218 ; vcvtdq2ps %ymm10,%ymm11
- DB 196,98,125,24,37,163,150,2,0 ; vbroadcastss 0x296a3(%rip),%ymm12 # 2c178 <_sk_overlay_sse2_8bit+0x503>
- DB 196,98,125,24,45,158,150,2,0 ; vbroadcastss 0x2969e(%rip),%ymm13 # 2c17c <_sk_overlay_sse2_8bit+0x507>
+ DB 196,98,125,24,37,223,149,2,0 ; vbroadcastss 0x295df(%rip),%ymm12 # 2c0b4 <_sk_overlay_sse2_8bit+0x504>
+ DB 196,98,125,24,45,218,149,2,0 ; vbroadcastss 0x295da(%rip),%ymm13 # 2c0b8 <_sk_overlay_sse2_8bit+0x508>
DB 196,65,44,84,213 ; vandps %ymm13,%ymm10,%ymm10
- DB 196,98,125,24,45,244,149,2,0 ; vbroadcastss 0x295f4(%rip),%ymm13 # 2c0e0 <_sk_overlay_sse2_8bit+0x46b>
+ DB 196,98,125,24,45,48,149,2,0 ; vbroadcastss 0x29530(%rip),%ymm13 # 2c01c <_sk_overlay_sse2_8bit+0x46c>
DB 196,65,44,86,213 ; vorps %ymm13,%ymm10,%ymm10
- DB 196,98,125,24,45,134,150,2,0 ; vbroadcastss 0x29686(%rip),%ymm13 # 2c180 <_sk_overlay_sse2_8bit+0x50b>
+ DB 196,98,125,24,45,194,149,2,0 ; vbroadcastss 0x295c2(%rip),%ymm13 # 2c0bc <_sk_overlay_sse2_8bit+0x50c>
DB 196,66,37,184,236 ; vfmadd231ps %ymm12,%ymm11,%ymm13
- DB 196,98,125,24,29,124,150,2,0 ; vbroadcastss 0x2967c(%rip),%ymm11 # 2c184 <_sk_overlay_sse2_8bit+0x50f>
+ DB 196,98,125,24,29,184,149,2,0 ; vbroadcastss 0x295b8(%rip),%ymm11 # 2c0c0 <_sk_overlay_sse2_8bit+0x510>
DB 196,66,45,172,221 ; vfnmadd213ps %ymm13,%ymm10,%ymm11
- DB 196,98,125,24,37,114,150,2,0 ; vbroadcastss 0x29672(%rip),%ymm12 # 2c188 <_sk_overlay_sse2_8bit+0x513>
+ DB 196,98,125,24,37,174,149,2,0 ; vbroadcastss 0x295ae(%rip),%ymm12 # 2c0c4 <_sk_overlay_sse2_8bit+0x514>
DB 196,65,44,88,212 ; vaddps %ymm12,%ymm10,%ymm10
- DB 196,98,125,24,37,104,150,2,0 ; vbroadcastss 0x29668(%rip),%ymm12 # 2c18c <_sk_overlay_sse2_8bit+0x517>
+ DB 196,98,125,24,37,164,149,2,0 ; vbroadcastss 0x295a4(%rip),%ymm12 # 2c0c8 <_sk_overlay_sse2_8bit+0x518>
DB 196,65,28,94,210 ; vdivps %ymm10,%ymm12,%ymm10
DB 196,65,36,92,210 ; vsubps %ymm10,%ymm11,%ymm10
DB 196,193,124,89,194 ; vmulps %ymm10,%ymm0,%ymm0
DB 196,99,125,8,208,1 ; vroundps $0x1,%ymm0,%ymm10
DB 196,65,124,92,210 ; vsubps %ymm10,%ymm0,%ymm10
- DB 196,98,125,24,29,73,150,2,0 ; vbroadcastss 0x29649(%rip),%ymm11 # 2c190 <_sk_overlay_sse2_8bit+0x51b>
+ DB 196,98,125,24,29,133,149,2,0 ; vbroadcastss 0x29585(%rip),%ymm11 # 2c0cc <_sk_overlay_sse2_8bit+0x51c>
DB 196,193,124,88,195 ; vaddps %ymm11,%ymm0,%ymm0
- DB 196,98,125,24,29,63,150,2,0 ; vbroadcastss 0x2963f(%rip),%ymm11 # 2c194 <_sk_overlay_sse2_8bit+0x51f>
+ DB 196,98,125,24,29,123,149,2,0 ; vbroadcastss 0x2957b(%rip),%ymm11 # 2c0d0 <_sk_overlay_sse2_8bit+0x520>
DB 196,98,45,172,216 ; vfnmadd213ps %ymm0,%ymm10,%ymm11
- DB 196,226,125,24,5,53,150,2,0 ; vbroadcastss 0x29635(%rip),%ymm0 # 2c198 <_sk_overlay_sse2_8bit+0x523>
+ DB 196,226,125,24,5,113,149,2,0 ; vbroadcastss 0x29571(%rip),%ymm0 # 2c0d4 <_sk_overlay_sse2_8bit+0x524>
DB 196,193,124,92,194 ; vsubps %ymm10,%ymm0,%ymm0
- DB 196,98,125,24,21,43,150,2,0 ; vbroadcastss 0x2962b(%rip),%ymm10 # 2c19c <_sk_overlay_sse2_8bit+0x527>
+ DB 196,98,125,24,21,103,149,2,0 ; vbroadcastss 0x29567(%rip),%ymm10 # 2c0d8 <_sk_overlay_sse2_8bit+0x528>
DB 197,172,94,192 ; vdivps %ymm0,%ymm10,%ymm0
DB 197,164,88,192 ; vaddps %ymm0,%ymm11,%ymm0
- DB 196,98,125,24,21,30,150,2,0 ; vbroadcastss 0x2961e(%rip),%ymm10 # 2c1a0 <_sk_overlay_sse2_8bit+0x52b>
+ DB 196,98,125,24,21,90,149,2,0 ; vbroadcastss 0x2955a(%rip),%ymm10 # 2c0dc <_sk_overlay_sse2_8bit+0x52c>
DB 196,193,124,89,194 ; vmulps %ymm10,%ymm0,%ymm0
DB 197,253,91,192 ; vcvtps2dq %ymm0,%ymm0
DB 196,98,125,24,80,20 ; vbroadcastss 0x14(%rax),%ymm10
@@ -2630,7 +2630,7 @@ _sk_parametric_r_hsw LABEL PROC
DB 196,195,125,74,193,128 ; vblendvps %ymm8,%ymm9,%ymm0,%ymm0
DB 196,65,60,87,192 ; vxorps %ymm8,%ymm8,%ymm8
DB 196,193,124,95,192 ; vmaxps %ymm8,%ymm0,%ymm0
- DB 196,98,125,24,5,53,149,2,0 ; vbroadcastss 0x29535(%rip),%ymm8 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,98,125,24,5,113,148,2,0 ; vbroadcastss 0x29471(%rip),%ymm8 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 196,193,124,93,192 ; vminps %ymm8,%ymm0,%ymm0
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
@@ -2648,33 +2648,33 @@ _sk_parametric_g_hsw LABEL PROC
DB 196,66,117,168,211 ; vfmadd213ps %ymm11,%ymm1,%ymm10
DB 196,226,125,24,8 ; vbroadcastss (%rax),%ymm1
DB 196,65,124,91,218 ; vcvtdq2ps %ymm10,%ymm11
- DB 196,98,125,24,37,125,149,2,0 ; vbroadcastss 0x2957d(%rip),%ymm12 # 2c178 <_sk_overlay_sse2_8bit+0x503>
- DB 196,98,125,24,45,120,149,2,0 ; vbroadcastss 0x29578(%rip),%ymm13 # 2c17c <_sk_overlay_sse2_8bit+0x507>
+ DB 196,98,125,24,37,185,148,2,0 ; vbroadcastss 0x294b9(%rip),%ymm12 # 2c0b4 <_sk_overlay_sse2_8bit+0x504>
+ DB 196,98,125,24,45,180,148,2,0 ; vbroadcastss 0x294b4(%rip),%ymm13 # 2c0b8 <_sk_overlay_sse2_8bit+0x508>
DB 196,65,44,84,213 ; vandps %ymm13,%ymm10,%ymm10
- DB 196,98,125,24,45,206,148,2,0 ; vbroadcastss 0x294ce(%rip),%ymm13 # 2c0e0 <_sk_overlay_sse2_8bit+0x46b>
+ DB 196,98,125,24,45,10,148,2,0 ; vbroadcastss 0x2940a(%rip),%ymm13 # 2c01c <_sk_overlay_sse2_8bit+0x46c>
DB 196,65,44,86,213 ; vorps %ymm13,%ymm10,%ymm10
- DB 196,98,125,24,45,96,149,2,0 ; vbroadcastss 0x29560(%rip),%ymm13 # 2c180 <_sk_overlay_sse2_8bit+0x50b>
+ DB 196,98,125,24,45,156,148,2,0 ; vbroadcastss 0x2949c(%rip),%ymm13 # 2c0bc <_sk_overlay_sse2_8bit+0x50c>
DB 196,66,37,184,236 ; vfmadd231ps %ymm12,%ymm11,%ymm13
- DB 196,98,125,24,29,86,149,2,0 ; vbroadcastss 0x29556(%rip),%ymm11 # 2c184 <_sk_overlay_sse2_8bit+0x50f>
+ DB 196,98,125,24,29,146,148,2,0 ; vbroadcastss 0x29492(%rip),%ymm11 # 2c0c0 <_sk_overlay_sse2_8bit+0x510>
DB 196,66,45,172,221 ; vfnmadd213ps %ymm13,%ymm10,%ymm11
- DB 196,98,125,24,37,76,149,2,0 ; vbroadcastss 0x2954c(%rip),%ymm12 # 2c188 <_sk_overlay_sse2_8bit+0x513>
+ DB 196,98,125,24,37,136,148,2,0 ; vbroadcastss 0x29488(%rip),%ymm12 # 2c0c4 <_sk_overlay_sse2_8bit+0x514>
DB 196,65,44,88,212 ; vaddps %ymm12,%ymm10,%ymm10
- DB 196,98,125,24,37,66,149,2,0 ; vbroadcastss 0x29542(%rip),%ymm12 # 2c18c <_sk_overlay_sse2_8bit+0x517>
+ DB 196,98,125,24,37,126,148,2,0 ; vbroadcastss 0x2947e(%rip),%ymm12 # 2c0c8 <_sk_overlay_sse2_8bit+0x518>
DB 196,65,28,94,210 ; vdivps %ymm10,%ymm12,%ymm10
DB 196,65,36,92,210 ; vsubps %ymm10,%ymm11,%ymm10
DB 196,193,116,89,202 ; vmulps %ymm10,%ymm1,%ymm1
DB 196,99,125,8,209,1 ; vroundps $0x1,%ymm1,%ymm10
DB 196,65,116,92,210 ; vsubps %ymm10,%ymm1,%ymm10
- DB 196,98,125,24,29,35,149,2,0 ; vbroadcastss 0x29523(%rip),%ymm11 # 2c190 <_sk_overlay_sse2_8bit+0x51b>
+ DB 196,98,125,24,29,95,148,2,0 ; vbroadcastss 0x2945f(%rip),%ymm11 # 2c0cc <_sk_overlay_sse2_8bit+0x51c>
DB 196,193,116,88,203 ; vaddps %ymm11,%ymm1,%ymm1
- DB 196,98,125,24,29,25,149,2,0 ; vbroadcastss 0x29519(%rip),%ymm11 # 2c194 <_sk_overlay_sse2_8bit+0x51f>
+ DB 196,98,125,24,29,85,148,2,0 ; vbroadcastss 0x29455(%rip),%ymm11 # 2c0d0 <_sk_overlay_sse2_8bit+0x520>
DB 196,98,45,172,217 ; vfnmadd213ps %ymm1,%ymm10,%ymm11
- DB 196,226,125,24,13,15,149,2,0 ; vbroadcastss 0x2950f(%rip),%ymm1 # 2c198 <_sk_overlay_sse2_8bit+0x523>
+ DB 196,226,125,24,13,75,148,2,0 ; vbroadcastss 0x2944b(%rip),%ymm1 # 2c0d4 <_sk_overlay_sse2_8bit+0x524>
DB 196,193,116,92,202 ; vsubps %ymm10,%ymm1,%ymm1
- DB 196,98,125,24,21,5,149,2,0 ; vbroadcastss 0x29505(%rip),%ymm10 # 2c19c <_sk_overlay_sse2_8bit+0x527>
+ DB 196,98,125,24,21,65,148,2,0 ; vbroadcastss 0x29441(%rip),%ymm10 # 2c0d8 <_sk_overlay_sse2_8bit+0x528>
DB 197,172,94,201 ; vdivps %ymm1,%ymm10,%ymm1
DB 197,164,88,201 ; vaddps %ymm1,%ymm11,%ymm1
- DB 196,98,125,24,21,248,148,2,0 ; vbroadcastss 0x294f8(%rip),%ymm10 # 2c1a0 <_sk_overlay_sse2_8bit+0x52b>
+ DB 196,98,125,24,21,52,148,2,0 ; vbroadcastss 0x29434(%rip),%ymm10 # 2c0dc <_sk_overlay_sse2_8bit+0x52c>
DB 196,193,116,89,202 ; vmulps %ymm10,%ymm1,%ymm1
DB 197,253,91,201 ; vcvtps2dq %ymm1,%ymm1
DB 196,98,125,24,80,20 ; vbroadcastss 0x14(%rax),%ymm10
@@ -2682,7 +2682,7 @@ _sk_parametric_g_hsw LABEL PROC
DB 196,195,117,74,201,128 ; vblendvps %ymm8,%ymm9,%ymm1,%ymm1
DB 196,65,60,87,192 ; vxorps %ymm8,%ymm8,%ymm8
DB 196,193,116,95,200 ; vmaxps %ymm8,%ymm1,%ymm1
- DB 196,98,125,24,5,15,148,2,0 ; vbroadcastss 0x2940f(%rip),%ymm8 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,98,125,24,5,75,147,2,0 ; vbroadcastss 0x2934b(%rip),%ymm8 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 196,193,116,93,200 ; vminps %ymm8,%ymm1,%ymm1
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
@@ -2700,33 +2700,33 @@ _sk_parametric_b_hsw LABEL PROC
DB 196,66,109,168,211 ; vfmadd213ps %ymm11,%ymm2,%ymm10
DB 196,226,125,24,16 ; vbroadcastss (%rax),%ymm2
DB 196,65,124,91,218 ; vcvtdq2ps %ymm10,%ymm11
- DB 196,98,125,24,37,87,148,2,0 ; vbroadcastss 0x29457(%rip),%ymm12 # 2c178 <_sk_overlay_sse2_8bit+0x503>
- DB 196,98,125,24,45,82,148,2,0 ; vbroadcastss 0x29452(%rip),%ymm13 # 2c17c <_sk_overlay_sse2_8bit+0x507>
+ DB 196,98,125,24,37,147,147,2,0 ; vbroadcastss 0x29393(%rip),%ymm12 # 2c0b4 <_sk_overlay_sse2_8bit+0x504>
+ DB 196,98,125,24,45,142,147,2,0 ; vbroadcastss 0x2938e(%rip),%ymm13 # 2c0b8 <_sk_overlay_sse2_8bit+0x508>
DB 196,65,44,84,213 ; vandps %ymm13,%ymm10,%ymm10
- DB 196,98,125,24,45,168,147,2,0 ; vbroadcastss 0x293a8(%rip),%ymm13 # 2c0e0 <_sk_overlay_sse2_8bit+0x46b>
+ DB 196,98,125,24,45,228,146,2,0 ; vbroadcastss 0x292e4(%rip),%ymm13 # 2c01c <_sk_overlay_sse2_8bit+0x46c>
DB 196,65,44,86,213 ; vorps %ymm13,%ymm10,%ymm10
- DB 196,98,125,24,45,58,148,2,0 ; vbroadcastss 0x2943a(%rip),%ymm13 # 2c180 <_sk_overlay_sse2_8bit+0x50b>
+ DB 196,98,125,24,45,118,147,2,0 ; vbroadcastss 0x29376(%rip),%ymm13 # 2c0bc <_sk_overlay_sse2_8bit+0x50c>
DB 196,66,37,184,236 ; vfmadd231ps %ymm12,%ymm11,%ymm13
- DB 196,98,125,24,29,48,148,2,0 ; vbroadcastss 0x29430(%rip),%ymm11 # 2c184 <_sk_overlay_sse2_8bit+0x50f>
+ DB 196,98,125,24,29,108,147,2,0 ; vbroadcastss 0x2936c(%rip),%ymm11 # 2c0c0 <_sk_overlay_sse2_8bit+0x510>
DB 196,66,45,172,221 ; vfnmadd213ps %ymm13,%ymm10,%ymm11
- DB 196,98,125,24,37,38,148,2,0 ; vbroadcastss 0x29426(%rip),%ymm12 # 2c188 <_sk_overlay_sse2_8bit+0x513>
+ DB 196,98,125,24,37,98,147,2,0 ; vbroadcastss 0x29362(%rip),%ymm12 # 2c0c4 <_sk_overlay_sse2_8bit+0x514>
DB 196,65,44,88,212 ; vaddps %ymm12,%ymm10,%ymm10
- DB 196,98,125,24,37,28,148,2,0 ; vbroadcastss 0x2941c(%rip),%ymm12 # 2c18c <_sk_overlay_sse2_8bit+0x517>
+ DB 196,98,125,24,37,88,147,2,0 ; vbroadcastss 0x29358(%rip),%ymm12 # 2c0c8 <_sk_overlay_sse2_8bit+0x518>
DB 196,65,28,94,210 ; vdivps %ymm10,%ymm12,%ymm10
DB 196,65,36,92,210 ; vsubps %ymm10,%ymm11,%ymm10
DB 196,193,108,89,210 ; vmulps %ymm10,%ymm2,%ymm2
DB 196,99,125,8,210,1 ; vroundps $0x1,%ymm2,%ymm10
DB 196,65,108,92,210 ; vsubps %ymm10,%ymm2,%ymm10
- DB 196,98,125,24,29,253,147,2,0 ; vbroadcastss 0x293fd(%rip),%ymm11 # 2c190 <_sk_overlay_sse2_8bit+0x51b>
+ DB 196,98,125,24,29,57,147,2,0 ; vbroadcastss 0x29339(%rip),%ymm11 # 2c0cc <_sk_overlay_sse2_8bit+0x51c>
DB 196,193,108,88,211 ; vaddps %ymm11,%ymm2,%ymm2
- DB 196,98,125,24,29,243,147,2,0 ; vbroadcastss 0x293f3(%rip),%ymm11 # 2c194 <_sk_overlay_sse2_8bit+0x51f>
+ DB 196,98,125,24,29,47,147,2,0 ; vbroadcastss 0x2932f(%rip),%ymm11 # 2c0d0 <_sk_overlay_sse2_8bit+0x520>
DB 196,98,45,172,218 ; vfnmadd213ps %ymm2,%ymm10,%ymm11
- DB 196,226,125,24,21,233,147,2,0 ; vbroadcastss 0x293e9(%rip),%ymm2 # 2c198 <_sk_overlay_sse2_8bit+0x523>
+ DB 196,226,125,24,21,37,147,2,0 ; vbroadcastss 0x29325(%rip),%ymm2 # 2c0d4 <_sk_overlay_sse2_8bit+0x524>
DB 196,193,108,92,210 ; vsubps %ymm10,%ymm2,%ymm2
- DB 196,98,125,24,21,223,147,2,0 ; vbroadcastss 0x293df(%rip),%ymm10 # 2c19c <_sk_overlay_sse2_8bit+0x527>
+ DB 196,98,125,24,21,27,147,2,0 ; vbroadcastss 0x2931b(%rip),%ymm10 # 2c0d8 <_sk_overlay_sse2_8bit+0x528>
DB 197,172,94,210 ; vdivps %ymm2,%ymm10,%ymm2
DB 197,164,88,210 ; vaddps %ymm2,%ymm11,%ymm2
- DB 196,98,125,24,21,210,147,2,0 ; vbroadcastss 0x293d2(%rip),%ymm10 # 2c1a0 <_sk_overlay_sse2_8bit+0x52b>
+ DB 196,98,125,24,21,14,147,2,0 ; vbroadcastss 0x2930e(%rip),%ymm10 # 2c0dc <_sk_overlay_sse2_8bit+0x52c>
DB 196,193,108,89,210 ; vmulps %ymm10,%ymm2,%ymm2
DB 197,253,91,210 ; vcvtps2dq %ymm2,%ymm2
DB 196,98,125,24,80,20 ; vbroadcastss 0x14(%rax),%ymm10
@@ -2734,7 +2734,7 @@ _sk_parametric_b_hsw LABEL PROC
DB 196,195,109,74,209,128 ; vblendvps %ymm8,%ymm9,%ymm2,%ymm2
DB 196,65,60,87,192 ; vxorps %ymm8,%ymm8,%ymm8
DB 196,193,108,95,208 ; vmaxps %ymm8,%ymm2,%ymm2
- DB 196,98,125,24,5,233,146,2,0 ; vbroadcastss 0x292e9(%rip),%ymm8 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,98,125,24,5,37,146,2,0 ; vbroadcastss 0x29225(%rip),%ymm8 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 196,193,108,93,208 ; vminps %ymm8,%ymm2,%ymm2
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
@@ -2752,33 +2752,33 @@ _sk_parametric_a_hsw LABEL PROC
DB 196,66,101,168,211 ; vfmadd213ps %ymm11,%ymm3,%ymm10
DB 196,226,125,24,24 ; vbroadcastss (%rax),%ymm3
DB 196,65,124,91,218 ; vcvtdq2ps %ymm10,%ymm11
- DB 196,98,125,24,37,49,147,2,0 ; vbroadcastss 0x29331(%rip),%ymm12 # 2c178 <_sk_overlay_sse2_8bit+0x503>
- DB 196,98,125,24,45,44,147,2,0 ; vbroadcastss 0x2932c(%rip),%ymm13 # 2c17c <_sk_overlay_sse2_8bit+0x507>
+ DB 196,98,125,24,37,109,146,2,0 ; vbroadcastss 0x2926d(%rip),%ymm12 # 2c0b4 <_sk_overlay_sse2_8bit+0x504>
+ DB 196,98,125,24,45,104,146,2,0 ; vbroadcastss 0x29268(%rip),%ymm13 # 2c0b8 <_sk_overlay_sse2_8bit+0x508>
DB 196,65,44,84,213 ; vandps %ymm13,%ymm10,%ymm10
- DB 196,98,125,24,45,130,146,2,0 ; vbroadcastss 0x29282(%rip),%ymm13 # 2c0e0 <_sk_overlay_sse2_8bit+0x46b>
+ DB 196,98,125,24,45,190,145,2,0 ; vbroadcastss 0x291be(%rip),%ymm13 # 2c01c <_sk_overlay_sse2_8bit+0x46c>
DB 196,65,44,86,213 ; vorps %ymm13,%ymm10,%ymm10
- DB 196,98,125,24,45,20,147,2,0 ; vbroadcastss 0x29314(%rip),%ymm13 # 2c180 <_sk_overlay_sse2_8bit+0x50b>
+ DB 196,98,125,24,45,80,146,2,0 ; vbroadcastss 0x29250(%rip),%ymm13 # 2c0bc <_sk_overlay_sse2_8bit+0x50c>
DB 196,66,37,184,236 ; vfmadd231ps %ymm12,%ymm11,%ymm13
- DB 196,98,125,24,29,10,147,2,0 ; vbroadcastss 0x2930a(%rip),%ymm11 # 2c184 <_sk_overlay_sse2_8bit+0x50f>
+ DB 196,98,125,24,29,70,146,2,0 ; vbroadcastss 0x29246(%rip),%ymm11 # 2c0c0 <_sk_overlay_sse2_8bit+0x510>
DB 196,66,45,172,221 ; vfnmadd213ps %ymm13,%ymm10,%ymm11
- DB 196,98,125,24,37,0,147,2,0 ; vbroadcastss 0x29300(%rip),%ymm12 # 2c188 <_sk_overlay_sse2_8bit+0x513>
+ DB 196,98,125,24,37,60,146,2,0 ; vbroadcastss 0x2923c(%rip),%ymm12 # 2c0c4 <_sk_overlay_sse2_8bit+0x514>
DB 196,65,44,88,212 ; vaddps %ymm12,%ymm10,%ymm10
- DB 196,98,125,24,37,246,146,2,0 ; vbroadcastss 0x292f6(%rip),%ymm12 # 2c18c <_sk_overlay_sse2_8bit+0x517>
+ DB 196,98,125,24,37,50,146,2,0 ; vbroadcastss 0x29232(%rip),%ymm12 # 2c0c8 <_sk_overlay_sse2_8bit+0x518>
DB 196,65,28,94,210 ; vdivps %ymm10,%ymm12,%ymm10
DB 196,65,36,92,210 ; vsubps %ymm10,%ymm11,%ymm10
DB 196,193,100,89,218 ; vmulps %ymm10,%ymm3,%ymm3
DB 196,99,125,8,211,1 ; vroundps $0x1,%ymm3,%ymm10
DB 196,65,100,92,210 ; vsubps %ymm10,%ymm3,%ymm10
- DB 196,98,125,24,29,215,146,2,0 ; vbroadcastss 0x292d7(%rip),%ymm11 # 2c190 <_sk_overlay_sse2_8bit+0x51b>
+ DB 196,98,125,24,29,19,146,2,0 ; vbroadcastss 0x29213(%rip),%ymm11 # 2c0cc <_sk_overlay_sse2_8bit+0x51c>
DB 196,193,100,88,219 ; vaddps %ymm11,%ymm3,%ymm3
- DB 196,98,125,24,29,205,146,2,0 ; vbroadcastss 0x292cd(%rip),%ymm11 # 2c194 <_sk_overlay_sse2_8bit+0x51f>
+ DB 196,98,125,24,29,9,146,2,0 ; vbroadcastss 0x29209(%rip),%ymm11 # 2c0d0 <_sk_overlay_sse2_8bit+0x520>
DB 196,98,45,172,219 ; vfnmadd213ps %ymm3,%ymm10,%ymm11
- DB 196,226,125,24,29,195,146,2,0 ; vbroadcastss 0x292c3(%rip),%ymm3 # 2c198 <_sk_overlay_sse2_8bit+0x523>
+ DB 196,226,125,24,29,255,145,2,0 ; vbroadcastss 0x291ff(%rip),%ymm3 # 2c0d4 <_sk_overlay_sse2_8bit+0x524>
DB 196,193,100,92,218 ; vsubps %ymm10,%ymm3,%ymm3
- DB 196,98,125,24,21,185,146,2,0 ; vbroadcastss 0x292b9(%rip),%ymm10 # 2c19c <_sk_overlay_sse2_8bit+0x527>
+ DB 196,98,125,24,21,245,145,2,0 ; vbroadcastss 0x291f5(%rip),%ymm10 # 2c0d8 <_sk_overlay_sse2_8bit+0x528>
DB 197,172,94,219 ; vdivps %ymm3,%ymm10,%ymm3
DB 197,164,88,219 ; vaddps %ymm3,%ymm11,%ymm3
- DB 196,98,125,24,21,172,146,2,0 ; vbroadcastss 0x292ac(%rip),%ymm10 # 2c1a0 <_sk_overlay_sse2_8bit+0x52b>
+ DB 196,98,125,24,21,232,145,2,0 ; vbroadcastss 0x291e8(%rip),%ymm10 # 2c0dc <_sk_overlay_sse2_8bit+0x52c>
DB 196,193,100,89,218 ; vmulps %ymm10,%ymm3,%ymm3
DB 197,253,91,219 ; vcvtps2dq %ymm3,%ymm3
DB 196,98,125,24,80,20 ; vbroadcastss 0x14(%rax),%ymm10
@@ -2786,7 +2786,7 @@ _sk_parametric_a_hsw LABEL PROC
DB 196,195,101,74,217,128 ; vblendvps %ymm8,%ymm9,%ymm3,%ymm3
DB 196,65,60,87,192 ; vxorps %ymm8,%ymm8,%ymm8
DB 196,193,100,95,216 ; vmaxps %ymm8,%ymm3,%ymm3
- DB 196,98,125,24,5,195,145,2,0 ; vbroadcastss 0x291c3(%rip),%ymm8 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,98,125,24,5,255,144,2,0 ; vbroadcastss 0x290ff(%rip),%ymm8 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 196,193,100,93,216 ; vminps %ymm8,%ymm3,%ymm3
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
@@ -2803,35 +2803,35 @@ _sk_gamma_hsw LABEL PROC
DB 197,252,40,241 ; vmovaps %ymm1,%ymm6
DB 72,173 ; lods %ds:(%rsi),%rax
DB 197,124,91,208 ; vcvtdq2ps %ymm0,%ymm10
- DB 196,98,125,24,29,16,146,2,0 ; vbroadcastss 0x29210(%rip),%ymm11 # 2c178 <_sk_overlay_sse2_8bit+0x503>
- DB 196,226,125,24,45,11,146,2,0 ; vbroadcastss 0x2920b(%rip),%ymm5 # 2c17c <_sk_overlay_sse2_8bit+0x507>
+ DB 196,98,125,24,29,76,145,2,0 ; vbroadcastss 0x2914c(%rip),%ymm11 # 2c0b4 <_sk_overlay_sse2_8bit+0x504>
+ DB 196,226,125,24,45,71,145,2,0 ; vbroadcastss 0x29147(%rip),%ymm5 # 2c0b8 <_sk_overlay_sse2_8bit+0x508>
DB 197,124,84,205 ; vandps %ymm5,%ymm0,%ymm9
- DB 196,226,125,24,37,98,145,2,0 ; vbroadcastss 0x29162(%rip),%ymm4 # 2c0e0 <_sk_overlay_sse2_8bit+0x46b>
+ DB 196,226,125,24,37,158,144,2,0 ; vbroadcastss 0x2909e(%rip),%ymm4 # 2c01c <_sk_overlay_sse2_8bit+0x46c>
DB 197,52,86,228 ; vorps %ymm4,%ymm9,%ymm12
- DB 196,98,125,24,45,245,145,2,0 ; vbroadcastss 0x291f5(%rip),%ymm13 # 2c180 <_sk_overlay_sse2_8bit+0x50b>
+ DB 196,98,125,24,45,49,145,2,0 ; vbroadcastss 0x29131(%rip),%ymm13 # 2c0bc <_sk_overlay_sse2_8bit+0x50c>
DB 196,66,37,168,213 ; vfmadd213ps %ymm13,%ymm11,%ymm10
- DB 196,98,125,24,13,235,145,2,0 ; vbroadcastss 0x291eb(%rip),%ymm9 # 2c184 <_sk_overlay_sse2_8bit+0x50f>
+ DB 196,98,125,24,13,39,145,2,0 ; vbroadcastss 0x29127(%rip),%ymm9 # 2c0c0 <_sk_overlay_sse2_8bit+0x510>
DB 196,66,29,188,209 ; vfnmadd231ps %ymm9,%ymm12,%ymm10
DB 197,124,91,246 ; vcvtdq2ps %ymm6,%ymm14
DB 196,66,37,168,245 ; vfmadd213ps %ymm13,%ymm11,%ymm14
DB 197,124,91,255 ; vcvtdq2ps %ymm7,%ymm15
DB 196,66,37,168,253 ; vfmadd213ps %ymm13,%ymm11,%ymm15
- DB 196,98,125,24,29,207,145,2,0 ; vbroadcastss 0x291cf(%rip),%ymm11 # 2c188 <_sk_overlay_sse2_8bit+0x513>
+ DB 196,98,125,24,29,11,145,2,0 ; vbroadcastss 0x2910b(%rip),%ymm11 # 2c0c4 <_sk_overlay_sse2_8bit+0x514>
DB 196,65,28,88,227 ; vaddps %ymm11,%ymm12,%ymm12
- DB 196,98,125,24,45,197,145,2,0 ; vbroadcastss 0x291c5(%rip),%ymm13 # 2c18c <_sk_overlay_sse2_8bit+0x517>
+ DB 196,98,125,24,45,1,145,2,0 ; vbroadcastss 0x29101(%rip),%ymm13 # 2c0c8 <_sk_overlay_sse2_8bit+0x518>
DB 196,65,20,94,228 ; vdivps %ymm12,%ymm13,%ymm12
DB 196,65,44,92,212 ; vsubps %ymm12,%ymm10,%ymm10
DB 196,98,125,24,32 ; vbroadcastss (%rax),%ymm12
DB 196,65,44,89,212 ; vmulps %ymm12,%ymm10,%ymm10
DB 196,67,125,8,194,1 ; vroundps $0x1,%ymm10,%ymm8
DB 196,65,44,92,192 ; vsubps %ymm8,%ymm10,%ymm8
- DB 196,226,125,24,21,161,145,2,0 ; vbroadcastss 0x291a1(%rip),%ymm2 # 2c190 <_sk_overlay_sse2_8bit+0x51b>
+ DB 196,226,125,24,21,221,144,2,0 ; vbroadcastss 0x290dd(%rip),%ymm2 # 2c0cc <_sk_overlay_sse2_8bit+0x51c>
DB 197,44,88,210 ; vaddps %ymm2,%ymm10,%ymm10
- DB 196,226,125,24,29,152,145,2,0 ; vbroadcastss 0x29198(%rip),%ymm3 # 2c194 <_sk_overlay_sse2_8bit+0x51f>
+ DB 196,226,125,24,29,212,144,2,0 ; vbroadcastss 0x290d4(%rip),%ymm3 # 2c0d0 <_sk_overlay_sse2_8bit+0x520>
DB 196,98,61,188,211 ; vfnmadd231ps %ymm3,%ymm8,%ymm10
- DB 196,226,125,24,13,142,145,2,0 ; vbroadcastss 0x2918e(%rip),%ymm1 # 2c198 <_sk_overlay_sse2_8bit+0x523>
+ DB 196,226,125,24,13,202,144,2,0 ; vbroadcastss 0x290ca(%rip),%ymm1 # 2c0d4 <_sk_overlay_sse2_8bit+0x524>
DB 196,65,116,92,192 ; vsubps %ymm8,%ymm1,%ymm8
- DB 196,226,125,24,5,132,145,2,0 ; vbroadcastss 0x29184(%rip),%ymm0 # 2c19c <_sk_overlay_sse2_8bit+0x527>
+ DB 196,226,125,24,5,192,144,2,0 ; vbroadcastss 0x290c0(%rip),%ymm0 # 2c0d8 <_sk_overlay_sse2_8bit+0x528>
DB 196,65,124,94,192 ; vdivps %ymm8,%ymm0,%ymm8
DB 196,65,44,88,192 ; vaddps %ymm8,%ymm10,%ymm8
DB 197,204,84,245 ; vandps %ymm5,%ymm6,%ymm6
@@ -2862,7 +2862,7 @@ _sk_gamma_hsw LABEL PROC
DB 197,244,92,205 ; vsubps %ymm5,%ymm1,%ymm1
DB 197,252,94,193 ; vdivps %ymm1,%ymm0,%ymm0
DB 197,236,88,192 ; vaddps %ymm0,%ymm2,%ymm0
- DB 196,226,125,24,13,245,144,2,0 ; vbroadcastss 0x290f5(%rip),%ymm1 # 2c1a0 <_sk_overlay_sse2_8bit+0x52b>
+ DB 196,226,125,24,13,49,144,2,0 ; vbroadcastss 0x29031(%rip),%ymm1 # 2c0dc <_sk_overlay_sse2_8bit+0x52c>
DB 197,188,89,209 ; vmulps %ymm1,%ymm8,%ymm2
DB 197,204,89,217 ; vmulps %ymm1,%ymm6,%ymm3
DB 197,252,89,225 ; vmulps %ymm1,%ymm0,%ymm4
@@ -2880,26 +2880,26 @@ _sk_gamma_hsw LABEL PROC
PUBLIC _sk_lab_to_xyz_hsw
_sk_lab_to_xyz_hsw LABEL PROC
- DB 196,98,125,24,5,173,144,2,0 ; vbroadcastss 0x290ad(%rip),%ymm8 # 2c1a4 <_sk_overlay_sse2_8bit+0x52f>
- DB 196,98,125,24,13,16,144,2,0 ; vbroadcastss 0x29010(%rip),%ymm9 # 2c110 <_sk_overlay_sse2_8bit+0x49b>
- DB 196,98,125,24,21,159,144,2,0 ; vbroadcastss 0x2909f(%rip),%ymm10 # 2c1a8 <_sk_overlay_sse2_8bit+0x533>
+ DB 196,98,125,24,5,233,143,2,0 ; vbroadcastss 0x28fe9(%rip),%ymm8 # 2c0e0 <_sk_overlay_sse2_8bit+0x530>
+ DB 196,98,125,24,13,76,143,2,0 ; vbroadcastss 0x28f4c(%rip),%ymm9 # 2c04c <_sk_overlay_sse2_8bit+0x49c>
+ DB 196,98,125,24,21,219,143,2,0 ; vbroadcastss 0x28fdb(%rip),%ymm10 # 2c0e4 <_sk_overlay_sse2_8bit+0x534>
DB 196,194,53,168,202 ; vfmadd213ps %ymm10,%ymm9,%ymm1
DB 196,194,53,168,210 ; vfmadd213ps %ymm10,%ymm9,%ymm2
- DB 196,98,125,24,13,144,144,2,0 ; vbroadcastss 0x29090(%rip),%ymm9 # 2c1ac <_sk_overlay_sse2_8bit+0x537>
+ DB 196,98,125,24,13,204,143,2,0 ; vbroadcastss 0x28fcc(%rip),%ymm9 # 2c0e8 <_sk_overlay_sse2_8bit+0x538>
DB 196,66,125,184,200 ; vfmadd231ps %ymm8,%ymm0,%ymm9
- DB 196,226,125,24,5,134,144,2,0 ; vbroadcastss 0x29086(%rip),%ymm0 # 2c1b0 <_sk_overlay_sse2_8bit+0x53b>
+ DB 196,226,125,24,5,194,143,2,0 ; vbroadcastss 0x28fc2(%rip),%ymm0 # 2c0ec <_sk_overlay_sse2_8bit+0x53c>
DB 197,180,89,192 ; vmulps %ymm0,%ymm9,%ymm0
- DB 196,98,125,24,5,125,144,2,0 ; vbroadcastss 0x2907d(%rip),%ymm8 # 2c1b4 <_sk_overlay_sse2_8bit+0x53f>
+ DB 196,98,125,24,5,185,143,2,0 ; vbroadcastss 0x28fb9(%rip),%ymm8 # 2c0f0 <_sk_overlay_sse2_8bit+0x540>
DB 196,98,117,168,192 ; vfmadd213ps %ymm0,%ymm1,%ymm8
- DB 196,98,125,24,13,115,144,2,0 ; vbroadcastss 0x29073(%rip),%ymm9 # 2c1b8 <_sk_overlay_sse2_8bit+0x543>
+ DB 196,98,125,24,13,175,143,2,0 ; vbroadcastss 0x28faf(%rip),%ymm9 # 2c0f4 <_sk_overlay_sse2_8bit+0x544>
DB 196,98,109,172,200 ; vfnmadd213ps %ymm0,%ymm2,%ymm9
DB 196,193,60,89,200 ; vmulps %ymm8,%ymm8,%ymm1
DB 197,188,89,201 ; vmulps %ymm1,%ymm8,%ymm1
- DB 196,226,125,24,21,96,144,2,0 ; vbroadcastss 0x29060(%rip),%ymm2 # 2c1bc <_sk_overlay_sse2_8bit+0x547>
+ DB 196,226,125,24,21,156,143,2,0 ; vbroadcastss 0x28f9c(%rip),%ymm2 # 2c0f8 <_sk_overlay_sse2_8bit+0x548>
DB 197,108,194,209,1 ; vcmpltps %ymm1,%ymm2,%ymm10
- DB 196,98,125,24,29,86,144,2,0 ; vbroadcastss 0x29056(%rip),%ymm11 # 2c1c0 <_sk_overlay_sse2_8bit+0x54b>
+ DB 196,98,125,24,29,146,143,2,0 ; vbroadcastss 0x28f92(%rip),%ymm11 # 2c0fc <_sk_overlay_sse2_8bit+0x54c>
DB 196,65,60,88,195 ; vaddps %ymm11,%ymm8,%ymm8
- DB 196,98,125,24,37,76,144,2,0 ; vbroadcastss 0x2904c(%rip),%ymm12 # 2c1c4 <_sk_overlay_sse2_8bit+0x54f>
+ DB 196,98,125,24,37,136,143,2,0 ; vbroadcastss 0x28f88(%rip),%ymm12 # 2c100 <_sk_overlay_sse2_8bit+0x550>
DB 196,65,60,89,196 ; vmulps %ymm12,%ymm8,%ymm8
DB 196,99,61,74,193,160 ; vblendvps %ymm10,%ymm1,%ymm8,%ymm8
DB 197,252,89,200 ; vmulps %ymm0,%ymm0,%ymm1
@@ -2914,9 +2914,9 @@ _sk_lab_to_xyz_hsw LABEL PROC
DB 196,65,52,88,203 ; vaddps %ymm11,%ymm9,%ymm9
DB 196,65,52,89,204 ; vmulps %ymm12,%ymm9,%ymm9
DB 196,227,53,74,208,32 ; vblendvps %ymm2,%ymm0,%ymm9,%ymm2
- DB 196,226,125,24,5,1,144,2,0 ; vbroadcastss 0x29001(%rip),%ymm0 # 2c1c8 <_sk_overlay_sse2_8bit+0x553>
+ DB 196,226,125,24,5,61,143,2,0 ; vbroadcastss 0x28f3d(%rip),%ymm0 # 2c104 <_sk_overlay_sse2_8bit+0x554>
DB 197,188,89,192 ; vmulps %ymm0,%ymm8,%ymm0
- DB 196,98,125,24,5,248,143,2,0 ; vbroadcastss 0x28ff8(%rip),%ymm8 # 2c1cc <_sk_overlay_sse2_8bit+0x557>
+ DB 196,98,125,24,5,52,143,2,0 ; vbroadcastss 0x28f34(%rip),%ymm8 # 2c108 <_sk_overlay_sse2_8bit+0x558>
DB 196,193,108,89,208 ; vmulps %ymm8,%ymm2,%ymm2
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
@@ -2932,10 +2932,10 @@ _sk_load_a8_hsw LABEL PROC
DB 72,133,255 ; test %rdi,%rdi
DB 117,52 ; jne 3229 <_sk_load_a8_hsw+0x4c>
DB 196,130,121,48,4,24 ; vpmovzxbw (%r8,%r11,1),%xmm0
- DB 197,249,219,5,205,152,2,0 ; vpand 0x298cd(%rip),%xmm0,%xmm0 # 2cad0 <_sk_overlay_sse2_8bit+0xe5b>
+ DB 197,249,219,5,13,152,2,0 ; vpand 0x2980d(%rip),%xmm0,%xmm0 # 2ca10 <_sk_overlay_sse2_8bit+0xe60>
DB 196,226,125,51,192 ; vpmovzxwd %xmm0,%ymm0
DB 197,252,91,192 ; vcvtdq2ps %ymm0,%ymm0
- DB 196,226,125,24,13,67,143,2,0 ; vbroadcastss 0x28f43(%rip),%ymm1 # 2c158 <_sk_overlay_sse2_8bit+0x4e3>
+ DB 196,226,125,24,13,127,142,2,0 ; vbroadcastss 0x28e7f(%rip),%ymm1 # 2c094 <_sk_overlay_sse2_8bit+0x4e4>
DB 197,252,89,217 ; vmulps %ymm1,%ymm0,%ymm3
DB 72,173 ; lods %ds:(%rsi),%rax
DB 197,252,87,192 ; vxorps %ymm0,%ymm0,%ymm0
@@ -2983,7 +2983,7 @@ _sk_load_a8_hsw LABEL PROC
DB 255 ; (bad)
DB 255 ; (bad)
DB 255 ; (bad)
- DB 233,255,255,255,222 ; jmpq ffffffffdf0032d0 <_sk_overlay_sse2_8bit+0xffffffffdefd765b>
+ DB 233,255,255,255,222 ; jmpq ffffffffdf0032d0 <_sk_overlay_sse2_8bit+0xffffffffdefd7720>
DB 255 ; (bad)
DB 255 ; (bad)
DB 255,211 ; callq *%rbx
@@ -3005,10 +3005,10 @@ _sk_load_a8_dst_hsw LABEL PROC
DB 72,133,255 ; test %rdi,%rdi
DB 117,52 ; jne 3328 <_sk_load_a8_dst_hsw+0x4c>
DB 196,130,121,48,36,24 ; vpmovzxbw (%r8,%r11,1),%xmm4
- DB 197,217,219,37,206,151,2,0 ; vpand 0x297ce(%rip),%xmm4,%xmm4 # 2cad0 <_sk_overlay_sse2_8bit+0xe5b>
+ DB 197,217,219,37,14,151,2,0 ; vpand 0x2970e(%rip),%xmm4,%xmm4 # 2ca10 <_sk_overlay_sse2_8bit+0xe60>
DB 196,226,125,51,228 ; vpmovzxwd %xmm4,%ymm4
DB 197,252,91,228 ; vcvtdq2ps %ymm4,%ymm4
- DB 196,226,125,24,45,68,142,2,0 ; vbroadcastss 0x28e44(%rip),%ymm5 # 2c158 <_sk_overlay_sse2_8bit+0x4e3>
+ DB 196,226,125,24,45,128,141,2,0 ; vbroadcastss 0x28d80(%rip),%ymm5 # 2c094 <_sk_overlay_sse2_8bit+0x4e4>
DB 197,220,89,253 ; vmulps %ymm5,%ymm4,%ymm7
DB 72,173 ; lods %ds:(%rsi),%rax
DB 197,220,87,228 ; vxorps %ymm4,%ymm4,%ymm4
@@ -3056,7 +3056,7 @@ _sk_load_a8_dst_hsw LABEL PROC
DB 255 ; (bad)
DB 255 ; (bad)
DB 255 ; (bad)
- DB 232,255,255,255,221 ; callq ffffffffde0033d0 <_sk_overlay_sse2_8bit+0xffffffffddfd775b>
+ DB 232,255,255,255,221 ; callq ffffffffde0033d0 <_sk_overlay_sse2_8bit+0xffffffffddfd7820>
DB 255 ; (bad)
DB 255 ; (bad)
DB 255,210 ; callq *%rdx
@@ -3109,7 +3109,7 @@ _sk_gather_a8_hsw LABEL PROC
DB 196,227,121,32,192,7 ; vpinsrb $0x7,%eax,%xmm0,%xmm0
DB 196,226,125,49,192 ; vpmovzxbd %xmm0,%ymm0
DB 197,252,91,192 ; vcvtdq2ps %ymm0,%ymm0
- DB 196,226,125,24,13,191,140,2,0 ; vbroadcastss 0x28cbf(%rip),%ymm1 # 2c158 <_sk_overlay_sse2_8bit+0x4e3>
+ DB 196,226,125,24,13,251,139,2,0 ; vbroadcastss 0x28bfb(%rip),%ymm1 # 2c094 <_sk_overlay_sse2_8bit+0x4e4>
DB 197,252,89,217 ; vmulps %ymm1,%ymm0,%ymm3
DB 72,173 ; lods %ds:(%rsi),%rax
DB 197,252,87,192 ; vxorps %ymm0,%ymm0,%ymm0
@@ -3129,7 +3129,7 @@ _sk_store_a8_hsw LABEL PROC
DB 77,15,175,193 ; imul %r9,%r8
DB 76,3,0 ; add (%rax),%r8
DB 76,99,218 ; movslq %edx,%r11
- DB 196,98,125,24,5,64,140,2,0 ; vbroadcastss 0x28c40(%rip),%ymm8 # 2c110 <_sk_overlay_sse2_8bit+0x49b>
+ DB 196,98,125,24,5,124,139,2,0 ; vbroadcastss 0x28b7c(%rip),%ymm8 # 2c04c <_sk_overlay_sse2_8bit+0x49c>
DB 196,65,100,89,192 ; vmulps %ymm8,%ymm3,%ymm8
DB 196,65,125,91,192 ; vcvtps2dq %ymm8,%ymm8
DB 196,67,125,25,193,1 ; vextractf128 $0x1,%ymm8,%xmm9
@@ -3154,13 +3154,13 @@ _sk_store_a8_hsw LABEL PROC
DB 196,3,121,20,4,24,0 ; vpextrb $0x0,%xmm8,(%r8,%r11,1)
DB 235,202 ; jmp 34f5 <_sk_store_a8_hsw+0x41>
DB 196,3,121,20,68,24,2,4 ; vpextrb $0x4,%xmm8,0x2(%r8,%r11,1)
- DB 196,98,57,0,5,164,149,2,0 ; vpshufb 0x295a4(%rip),%xmm8,%xmm8 # 2cae0 <_sk_overlay_sse2_8bit+0xe6b>
+ DB 196,98,57,0,5,228,148,2,0 ; vpshufb 0x294e4(%rip),%xmm8,%xmm8 # 2ca20 <_sk_overlay_sse2_8bit+0xe70>
DB 196,3,121,21,4,24,0 ; vpextrw $0x0,%xmm8,(%r8,%r11,1)
DB 235,176 ; jmp 34f5 <_sk_store_a8_hsw+0x41>
DB 196,3,121,20,68,24,6,12 ; vpextrb $0xc,%xmm8,0x6(%r8,%r11,1)
DB 196,3,121,20,68,24,5,10 ; vpextrb $0xa,%xmm8,0x5(%r8,%r11,1)
DB 196,3,121,20,68,24,4,8 ; vpextrb $0x8,%xmm8,0x4(%r8,%r11,1)
- DB 196,98,57,0,5,138,149,2,0 ; vpshufb 0x2958a(%rip),%xmm8,%xmm8 # 2caf0 <_sk_overlay_sse2_8bit+0xe7b>
+ DB 196,98,57,0,5,202,148,2,0 ; vpshufb 0x294ca(%rip),%xmm8,%xmm8 # 2ca30 <_sk_overlay_sse2_8bit+0xe80>
DB 196,1,121,126,4,24 ; vmovd %xmm8,(%r8,%r11,1)
DB 235,135 ; jmp 34f5 <_sk_store_a8_hsw+0x41>
DB 102,144 ; xchg %ax,%ax
@@ -3195,13 +3195,13 @@ _sk_load_g8_hsw LABEL PROC
DB 72,133,255 ; test %rdi,%rdi
DB 117,57 ; jne 35dd <_sk_load_g8_hsw+0x51>
DB 196,130,121,48,4,24 ; vpmovzxbw (%r8,%r11,1),%xmm0
- DB 197,249,219,5,30,149,2,0 ; vpand 0x2951e(%rip),%xmm0,%xmm0 # 2cad0 <_sk_overlay_sse2_8bit+0xe5b>
+ DB 197,249,219,5,94,148,2,0 ; vpand 0x2945e(%rip),%xmm0,%xmm0 # 2ca10 <_sk_overlay_sse2_8bit+0xe60>
DB 196,226,125,51,192 ; vpmovzxwd %xmm0,%ymm0
DB 197,252,91,192 ; vcvtdq2ps %ymm0,%ymm0
- DB 196,226,125,24,13,148,139,2,0 ; vbroadcastss 0x28b94(%rip),%ymm1 # 2c158 <_sk_overlay_sse2_8bit+0x4e3>
+ DB 196,226,125,24,13,208,138,2,0 ; vbroadcastss 0x28ad0(%rip),%ymm1 # 2c094 <_sk_overlay_sse2_8bit+0x4e4>
DB 197,252,89,193 ; vmulps %ymm1,%ymm0,%ymm0
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,29,17,139,2,0 ; vbroadcastss 0x28b11(%rip),%ymm3 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,226,125,24,29,77,138,2,0 ; vbroadcastss 0x28a4d(%rip),%ymm3 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 197,252,40,200 ; vmovaps %ymm0,%ymm1
DB 197,252,40,208 ; vmovaps %ymm0,%ymm2
DB 255,224 ; jmpq *%rax
@@ -3246,7 +3246,7 @@ _sk_load_g8_hsw LABEL PROC
DB 255 ; (bad)
DB 255 ; (bad)
DB 255 ; (bad)
- DB 233,255,255,255,222 ; jmpq ffffffffdf003684 <_sk_overlay_sse2_8bit+0xffffffffdefd7a0f>
+ DB 233,255,255,255,222 ; jmpq ffffffffdf003684 <_sk_overlay_sse2_8bit+0xffffffffdefd7ad4>
DB 255 ; (bad)
DB 255 ; (bad)
DB 255,211 ; callq *%rbx
@@ -3268,13 +3268,13 @@ _sk_load_g8_dst_hsw LABEL PROC
DB 72,133,255 ; test %rdi,%rdi
DB 117,57 ; jne 36e1 <_sk_load_g8_dst_hsw+0x51>
DB 196,130,121,48,36,24 ; vpmovzxbw (%r8,%r11,1),%xmm4
- DB 197,217,219,37,26,148,2,0 ; vpand 0x2941a(%rip),%xmm4,%xmm4 # 2cad0 <_sk_overlay_sse2_8bit+0xe5b>
+ DB 197,217,219,37,90,147,2,0 ; vpand 0x2935a(%rip),%xmm4,%xmm4 # 2ca10 <_sk_overlay_sse2_8bit+0xe60>
DB 196,226,125,51,228 ; vpmovzxwd %xmm4,%ymm4
DB 197,252,91,228 ; vcvtdq2ps %ymm4,%ymm4
- DB 196,226,125,24,45,144,138,2,0 ; vbroadcastss 0x28a90(%rip),%ymm5 # 2c158 <_sk_overlay_sse2_8bit+0x4e3>
+ DB 196,226,125,24,45,204,137,2,0 ; vbroadcastss 0x289cc(%rip),%ymm5 # 2c094 <_sk_overlay_sse2_8bit+0x4e4>
DB 197,220,89,229 ; vmulps %ymm5,%ymm4,%ymm4
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,61,13,138,2,0 ; vbroadcastss 0x28a0d(%rip),%ymm7 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,226,125,24,61,73,137,2,0 ; vbroadcastss 0x28949(%rip),%ymm7 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 197,252,40,236 ; vmovaps %ymm4,%ymm5
DB 197,252,40,244 ; vmovaps %ymm4,%ymm6
DB 255,224 ; jmpq *%rax
@@ -3319,7 +3319,7 @@ _sk_load_g8_dst_hsw LABEL PROC
DB 255 ; (bad)
DB 255 ; (bad)
DB 255 ; (bad)
- DB 233,255,255,255,222 ; jmpq ffffffffdf003788 <_sk_overlay_sse2_8bit+0xffffffffdefd7b13>
+ DB 233,255,255,255,222 ; jmpq ffffffffdf003788 <_sk_overlay_sse2_8bit+0xffffffffdefd7bd8>
DB 255 ; (bad)
DB 255 ; (bad)
DB 255,211 ; callq *%rbx
@@ -3372,10 +3372,10 @@ _sk_gather_g8_hsw LABEL PROC
DB 196,227,121,32,192,7 ; vpinsrb $0x7,%eax,%xmm0,%xmm0
DB 196,226,125,49,192 ; vpmovzxbd %xmm0,%ymm0
DB 197,252,91,192 ; vcvtdq2ps %ymm0,%ymm0
- DB 196,226,125,24,13,7,137,2,0 ; vbroadcastss 0x28907(%rip),%ymm1 # 2c158 <_sk_overlay_sse2_8bit+0x4e3>
+ DB 196,226,125,24,13,67,136,2,0 ; vbroadcastss 0x28843(%rip),%ymm1 # 2c094 <_sk_overlay_sse2_8bit+0x4e4>
DB 197,252,89,193 ; vmulps %ymm1,%ymm0,%ymm0
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,29,132,136,2,0 ; vbroadcastss 0x28884(%rip),%ymm3 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,226,125,24,29,192,135,2,0 ; vbroadcastss 0x287c0(%rip),%ymm3 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 197,252,40,200 ; vmovaps %ymm0,%ymm1
DB 197,252,40,208 ; vmovaps %ymm0,%ymm2
DB 91 ; pop %rbx
@@ -3397,23 +3397,23 @@ _sk_load_565_hsw LABEL PROC
DB 117,114 ; jne 38fe <_sk_load_565_hsw+0x8d>
DB 196,129,122,111,4,88 ; vmovdqu (%r8,%r11,2),%xmm0
DB 196,226,125,51,208 ; vpmovzxwd %xmm0,%ymm2
- DB 196,226,125,88,5,188,136,2,0 ; vpbroadcastd 0x288bc(%rip),%ymm0 # 2c15c <_sk_overlay_sse2_8bit+0x4e7>
+ DB 196,226,125,88,5,248,135,2,0 ; vpbroadcastd 0x287f8(%rip),%ymm0 # 2c098 <_sk_overlay_sse2_8bit+0x4e8>
DB 197,237,219,192 ; vpand %ymm0,%ymm2,%ymm0
DB 197,252,91,192 ; vcvtdq2ps %ymm0,%ymm0
- DB 196,226,125,24,13,175,136,2,0 ; vbroadcastss 0x288af(%rip),%ymm1 # 2c160 <_sk_overlay_sse2_8bit+0x4eb>
+ DB 196,226,125,24,13,235,135,2,0 ; vbroadcastss 0x287eb(%rip),%ymm1 # 2c09c <_sk_overlay_sse2_8bit+0x4ec>
DB 197,252,89,193 ; vmulps %ymm1,%ymm0,%ymm0
- DB 196,226,125,88,13,166,136,2,0 ; vpbroadcastd 0x288a6(%rip),%ymm1 # 2c164 <_sk_overlay_sse2_8bit+0x4ef>
+ DB 196,226,125,88,13,226,135,2,0 ; vpbroadcastd 0x287e2(%rip),%ymm1 # 2c0a0 <_sk_overlay_sse2_8bit+0x4f0>
DB 197,237,219,201 ; vpand %ymm1,%ymm2,%ymm1
DB 197,252,91,201 ; vcvtdq2ps %ymm1,%ymm1
- DB 196,226,125,24,29,153,136,2,0 ; vbroadcastss 0x28899(%rip),%ymm3 # 2c168 <_sk_overlay_sse2_8bit+0x4f3>
+ DB 196,226,125,24,29,213,135,2,0 ; vbroadcastss 0x287d5(%rip),%ymm3 # 2c0a4 <_sk_overlay_sse2_8bit+0x4f4>
DB 197,244,89,203 ; vmulps %ymm3,%ymm1,%ymm1
- DB 196,226,125,88,29,144,136,2,0 ; vpbroadcastd 0x28890(%rip),%ymm3 # 2c16c <_sk_overlay_sse2_8bit+0x4f7>
+ DB 196,226,125,88,29,204,135,2,0 ; vpbroadcastd 0x287cc(%rip),%ymm3 # 2c0a8 <_sk_overlay_sse2_8bit+0x4f8>
DB 197,237,219,211 ; vpand %ymm3,%ymm2,%ymm2
DB 197,252,91,210 ; vcvtdq2ps %ymm2,%ymm2
- DB 196,226,125,24,29,131,136,2,0 ; vbroadcastss 0x28883(%rip),%ymm3 # 2c170 <_sk_overlay_sse2_8bit+0x4fb>
+ DB 196,226,125,24,29,191,135,2,0 ; vbroadcastss 0x287bf(%rip),%ymm3 # 2c0ac <_sk_overlay_sse2_8bit+0x4fc>
DB 197,236,89,211 ; vmulps %ymm3,%ymm2,%ymm2
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,29,232,135,2,0 ; vbroadcastss 0x287e8(%rip),%ymm3 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,226,125,24,29,36,135,2,0 ; vbroadcastss 0x28724(%rip),%ymm3 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 255,224 ; jmpq *%rax
DB 65,137,249 ; mov %edi,%r9d
DB 65,128,225,7 ; and $0x7,%r9b
@@ -3474,23 +3474,23 @@ _sk_load_565_dst_hsw LABEL PROC
DB 117,114 ; jne 3a29 <_sk_load_565_dst_hsw+0x8d>
DB 196,129,122,111,36,88 ; vmovdqu (%r8,%r11,2),%xmm4
DB 196,226,125,51,244 ; vpmovzxwd %xmm4,%ymm6
- DB 196,226,125,88,37,145,135,2,0 ; vpbroadcastd 0x28791(%rip),%ymm4 # 2c15c <_sk_overlay_sse2_8bit+0x4e7>
+ DB 196,226,125,88,37,205,134,2,0 ; vpbroadcastd 0x286cd(%rip),%ymm4 # 2c098 <_sk_overlay_sse2_8bit+0x4e8>
DB 197,205,219,228 ; vpand %ymm4,%ymm6,%ymm4
DB 197,252,91,228 ; vcvtdq2ps %ymm4,%ymm4
- DB 196,226,125,24,45,132,135,2,0 ; vbroadcastss 0x28784(%rip),%ymm5 # 2c160 <_sk_overlay_sse2_8bit+0x4eb>
+ DB 196,226,125,24,45,192,134,2,0 ; vbroadcastss 0x286c0(%rip),%ymm5 # 2c09c <_sk_overlay_sse2_8bit+0x4ec>
DB 197,220,89,229 ; vmulps %ymm5,%ymm4,%ymm4
- DB 196,226,125,88,45,123,135,2,0 ; vpbroadcastd 0x2877b(%rip),%ymm5 # 2c164 <_sk_overlay_sse2_8bit+0x4ef>
+ DB 196,226,125,88,45,183,134,2,0 ; vpbroadcastd 0x286b7(%rip),%ymm5 # 2c0a0 <_sk_overlay_sse2_8bit+0x4f0>
DB 197,205,219,237 ; vpand %ymm5,%ymm6,%ymm5
DB 197,252,91,237 ; vcvtdq2ps %ymm5,%ymm5
- DB 196,226,125,24,61,110,135,2,0 ; vbroadcastss 0x2876e(%rip),%ymm7 # 2c168 <_sk_overlay_sse2_8bit+0x4f3>
+ DB 196,226,125,24,61,170,134,2,0 ; vbroadcastss 0x286aa(%rip),%ymm7 # 2c0a4 <_sk_overlay_sse2_8bit+0x4f4>
DB 197,212,89,239 ; vmulps %ymm7,%ymm5,%ymm5
- DB 196,226,125,88,61,101,135,2,0 ; vpbroadcastd 0x28765(%rip),%ymm7 # 2c16c <_sk_overlay_sse2_8bit+0x4f7>
+ DB 196,226,125,88,61,161,134,2,0 ; vpbroadcastd 0x286a1(%rip),%ymm7 # 2c0a8 <_sk_overlay_sse2_8bit+0x4f8>
DB 197,205,219,247 ; vpand %ymm7,%ymm6,%ymm6
DB 197,252,91,246 ; vcvtdq2ps %ymm6,%ymm6
- DB 196,226,125,24,61,88,135,2,0 ; vbroadcastss 0x28758(%rip),%ymm7 # 2c170 <_sk_overlay_sse2_8bit+0x4fb>
+ DB 196,226,125,24,61,148,134,2,0 ; vbroadcastss 0x28694(%rip),%ymm7 # 2c0ac <_sk_overlay_sse2_8bit+0x4fc>
DB 197,204,89,247 ; vmulps %ymm7,%ymm6,%ymm6
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,61,189,134,2,0 ; vbroadcastss 0x286bd(%rip),%ymm7 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,226,125,24,61,249,133,2,0 ; vbroadcastss 0x285f9(%rip),%ymm7 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 255,224 ; jmpq *%rax
DB 65,137,249 ; mov %edi,%r9d
DB 65,128,225,7 ; and $0x7,%r9b
@@ -3584,23 +3584,23 @@ _sk_gather_565_hsw LABEL PROC
DB 65,15,183,4,88 ; movzwl (%r8,%rbx,2),%eax
DB 197,249,196,192,7 ; vpinsrw $0x7,%eax,%xmm0,%xmm0
DB 196,226,125,51,208 ; vpmovzxwd %xmm0,%ymm2
- DB 196,226,125,88,5,217,133,2,0 ; vpbroadcastd 0x285d9(%rip),%ymm0 # 2c15c <_sk_overlay_sse2_8bit+0x4e7>
+ DB 196,226,125,88,5,21,133,2,0 ; vpbroadcastd 0x28515(%rip),%ymm0 # 2c098 <_sk_overlay_sse2_8bit+0x4e8>
DB 197,237,219,192 ; vpand %ymm0,%ymm2,%ymm0
DB 197,252,91,192 ; vcvtdq2ps %ymm0,%ymm0
- DB 196,226,125,24,13,204,133,2,0 ; vbroadcastss 0x285cc(%rip),%ymm1 # 2c160 <_sk_overlay_sse2_8bit+0x4eb>
+ DB 196,226,125,24,13,8,133,2,0 ; vbroadcastss 0x28508(%rip),%ymm1 # 2c09c <_sk_overlay_sse2_8bit+0x4ec>
DB 197,252,89,193 ; vmulps %ymm1,%ymm0,%ymm0
- DB 196,226,125,88,13,195,133,2,0 ; vpbroadcastd 0x285c3(%rip),%ymm1 # 2c164 <_sk_overlay_sse2_8bit+0x4ef>
+ DB 196,226,125,88,13,255,132,2,0 ; vpbroadcastd 0x284ff(%rip),%ymm1 # 2c0a0 <_sk_overlay_sse2_8bit+0x4f0>
DB 197,237,219,201 ; vpand %ymm1,%ymm2,%ymm1
DB 197,252,91,201 ; vcvtdq2ps %ymm1,%ymm1
- DB 196,226,125,24,29,182,133,2,0 ; vbroadcastss 0x285b6(%rip),%ymm3 # 2c168 <_sk_overlay_sse2_8bit+0x4f3>
+ DB 196,226,125,24,29,242,132,2,0 ; vbroadcastss 0x284f2(%rip),%ymm3 # 2c0a4 <_sk_overlay_sse2_8bit+0x4f4>
DB 197,244,89,203 ; vmulps %ymm3,%ymm1,%ymm1
- DB 196,226,125,88,29,173,133,2,0 ; vpbroadcastd 0x285ad(%rip),%ymm3 # 2c16c <_sk_overlay_sse2_8bit+0x4f7>
+ DB 196,226,125,88,29,233,132,2,0 ; vpbroadcastd 0x284e9(%rip),%ymm3 # 2c0a8 <_sk_overlay_sse2_8bit+0x4f8>
DB 197,237,219,211 ; vpand %ymm3,%ymm2,%ymm2
DB 197,252,91,210 ; vcvtdq2ps %ymm2,%ymm2
- DB 196,226,125,24,29,160,133,2,0 ; vbroadcastss 0x285a0(%rip),%ymm3 # 2c170 <_sk_overlay_sse2_8bit+0x4fb>
+ DB 196,226,125,24,29,220,132,2,0 ; vbroadcastss 0x284dc(%rip),%ymm3 # 2c0ac <_sk_overlay_sse2_8bit+0x4fc>
DB 197,236,89,211 ; vmulps %ymm3,%ymm2,%ymm2
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,29,5,133,2,0 ; vbroadcastss 0x28505(%rip),%ymm3 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,226,125,24,29,65,132,2,0 ; vbroadcastss 0x28441(%rip),%ymm3 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 91 ; pop %rbx
DB 65,92 ; pop %r12
DB 65,94 ; pop %r14
@@ -3616,11 +3616,11 @@ _sk_store_565_hsw LABEL PROC
DB 77,1,192 ; add %r8,%r8
DB 76,3,0 ; add (%rax),%r8
DB 76,99,218 ; movslq %edx,%r11
- DB 196,98,125,24,5,201,133,2,0 ; vbroadcastss 0x285c9(%rip),%ymm8 # 2c1d0 <_sk_overlay_sse2_8bit+0x55b>
+ DB 196,98,125,24,5,5,133,2,0 ; vbroadcastss 0x28505(%rip),%ymm8 # 2c10c <_sk_overlay_sse2_8bit+0x55c>
DB 196,65,124,89,200 ; vmulps %ymm8,%ymm0,%ymm9
DB 196,65,125,91,201 ; vcvtps2dq %ymm9,%ymm9
DB 196,193,53,114,241,11 ; vpslld $0xb,%ymm9,%ymm9
- DB 196,98,125,24,21,180,133,2,0 ; vbroadcastss 0x285b4(%rip),%ymm10 # 2c1d4 <_sk_overlay_sse2_8bit+0x55f>
+ DB 196,98,125,24,21,240,132,2,0 ; vbroadcastss 0x284f0(%rip),%ymm10 # 2c110 <_sk_overlay_sse2_8bit+0x560>
DB 196,65,116,89,210 ; vmulps %ymm10,%ymm1,%ymm10
DB 196,65,125,91,210 ; vcvtps2dq %ymm10,%ymm10
DB 196,193,45,114,242,5 ; vpslld $0x5,%ymm10,%ymm10
@@ -3693,25 +3693,25 @@ _sk_load_4444_hsw LABEL PROC
DB 15,133,138,0,0,0 ; jne 3d81 <_sk_load_4444_hsw+0xa9>
DB 196,129,122,111,4,88 ; vmovdqu (%r8,%r11,2),%xmm0
DB 196,226,125,51,216 ; vpmovzxwd %xmm0,%ymm3
- DB 196,226,125,88,5,205,132,2,0 ; vpbroadcastd 0x284cd(%rip),%ymm0 # 2c1d8 <_sk_overlay_sse2_8bit+0x563>
+ DB 196,226,125,88,5,9,132,2,0 ; vpbroadcastd 0x28409(%rip),%ymm0 # 2c114 <_sk_overlay_sse2_8bit+0x564>
DB 197,229,219,192 ; vpand %ymm0,%ymm3,%ymm0
DB 197,252,91,192 ; vcvtdq2ps %ymm0,%ymm0
- DB 196,226,125,24,13,192,132,2,0 ; vbroadcastss 0x284c0(%rip),%ymm1 # 2c1dc <_sk_overlay_sse2_8bit+0x567>
+ DB 196,226,125,24,13,252,131,2,0 ; vbroadcastss 0x283fc(%rip),%ymm1 # 2c118 <_sk_overlay_sse2_8bit+0x568>
DB 197,252,89,193 ; vmulps %ymm1,%ymm0,%ymm0
- DB 196,226,125,88,13,183,132,2,0 ; vpbroadcastd 0x284b7(%rip),%ymm1 # 2c1e0 <_sk_overlay_sse2_8bit+0x56b>
+ DB 196,226,125,88,13,243,131,2,0 ; vpbroadcastd 0x283f3(%rip),%ymm1 # 2c11c <_sk_overlay_sse2_8bit+0x56c>
DB 197,229,219,201 ; vpand %ymm1,%ymm3,%ymm1
DB 197,252,91,201 ; vcvtdq2ps %ymm1,%ymm1
- DB 196,226,125,24,21,170,132,2,0 ; vbroadcastss 0x284aa(%rip),%ymm2 # 2c1e4 <_sk_overlay_sse2_8bit+0x56f>
+ DB 196,226,125,24,21,230,131,2,0 ; vbroadcastss 0x283e6(%rip),%ymm2 # 2c120 <_sk_overlay_sse2_8bit+0x570>
DB 197,244,89,202 ; vmulps %ymm2,%ymm1,%ymm1
- DB 196,226,125,88,21,161,132,2,0 ; vpbroadcastd 0x284a1(%rip),%ymm2 # 2c1e8 <_sk_overlay_sse2_8bit+0x573>
+ DB 196,226,125,88,21,221,131,2,0 ; vpbroadcastd 0x283dd(%rip),%ymm2 # 2c124 <_sk_overlay_sse2_8bit+0x574>
DB 197,229,219,210 ; vpand %ymm2,%ymm3,%ymm2
DB 197,252,91,210 ; vcvtdq2ps %ymm2,%ymm2
- DB 196,98,125,24,5,148,132,2,0 ; vbroadcastss 0x28494(%rip),%ymm8 # 2c1ec <_sk_overlay_sse2_8bit+0x577>
+ DB 196,98,125,24,5,208,131,2,0 ; vbroadcastss 0x283d0(%rip),%ymm8 # 2c128 <_sk_overlay_sse2_8bit+0x578>
DB 196,193,108,89,208 ; vmulps %ymm8,%ymm2,%ymm2
- DB 196,98,125,88,5,138,132,2,0 ; vpbroadcastd 0x2848a(%rip),%ymm8 # 2c1f0 <_sk_overlay_sse2_8bit+0x57b>
+ DB 196,98,125,88,5,198,131,2,0 ; vpbroadcastd 0x283c6(%rip),%ymm8 # 2c12c <_sk_overlay_sse2_8bit+0x57c>
DB 196,193,101,219,216 ; vpand %ymm8,%ymm3,%ymm3
DB 197,252,91,219 ; vcvtdq2ps %ymm3,%ymm3
- DB 196,98,125,24,5,124,132,2,0 ; vbroadcastss 0x2847c(%rip),%ymm8 # 2c1f4 <_sk_overlay_sse2_8bit+0x57f>
+ DB 196,98,125,24,5,184,131,2,0 ; vbroadcastss 0x283b8(%rip),%ymm8 # 2c130 <_sk_overlay_sse2_8bit+0x580>
DB 196,193,100,89,216 ; vmulps %ymm8,%ymm3,%ymm3
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
@@ -3777,25 +3777,25 @@ _sk_load_4444_dst_hsw LABEL PROC
DB 15,133,138,0,0,0 ; jne 3ecd <_sk_load_4444_dst_hsw+0xa9>
DB 196,129,122,111,36,88 ; vmovdqu (%r8,%r11,2),%xmm4
DB 196,226,125,51,252 ; vpmovzxwd %xmm4,%ymm7
- DB 196,226,125,88,37,129,131,2,0 ; vpbroadcastd 0x28381(%rip),%ymm4 # 2c1d8 <_sk_overlay_sse2_8bit+0x563>
+ DB 196,226,125,88,37,189,130,2,0 ; vpbroadcastd 0x282bd(%rip),%ymm4 # 2c114 <_sk_overlay_sse2_8bit+0x564>
DB 197,197,219,228 ; vpand %ymm4,%ymm7,%ymm4
DB 197,252,91,228 ; vcvtdq2ps %ymm4,%ymm4
- DB 196,226,125,24,45,116,131,2,0 ; vbroadcastss 0x28374(%rip),%ymm5 # 2c1dc <_sk_overlay_sse2_8bit+0x567>
+ DB 196,226,125,24,45,176,130,2,0 ; vbroadcastss 0x282b0(%rip),%ymm5 # 2c118 <_sk_overlay_sse2_8bit+0x568>
DB 197,220,89,229 ; vmulps %ymm5,%ymm4,%ymm4
- DB 196,226,125,88,45,107,131,2,0 ; vpbroadcastd 0x2836b(%rip),%ymm5 # 2c1e0 <_sk_overlay_sse2_8bit+0x56b>
+ DB 196,226,125,88,45,167,130,2,0 ; vpbroadcastd 0x282a7(%rip),%ymm5 # 2c11c <_sk_overlay_sse2_8bit+0x56c>
DB 197,197,219,237 ; vpand %ymm5,%ymm7,%ymm5
DB 197,252,91,237 ; vcvtdq2ps %ymm5,%ymm5
- DB 196,226,125,24,53,94,131,2,0 ; vbroadcastss 0x2835e(%rip),%ymm6 # 2c1e4 <_sk_overlay_sse2_8bit+0x56f>
+ DB 196,226,125,24,53,154,130,2,0 ; vbroadcastss 0x2829a(%rip),%ymm6 # 2c120 <_sk_overlay_sse2_8bit+0x570>
DB 197,212,89,238 ; vmulps %ymm6,%ymm5,%ymm5
- DB 196,226,125,88,53,85,131,2,0 ; vpbroadcastd 0x28355(%rip),%ymm6 # 2c1e8 <_sk_overlay_sse2_8bit+0x573>
+ DB 196,226,125,88,53,145,130,2,0 ; vpbroadcastd 0x28291(%rip),%ymm6 # 2c124 <_sk_overlay_sse2_8bit+0x574>
DB 197,197,219,246 ; vpand %ymm6,%ymm7,%ymm6
DB 197,252,91,246 ; vcvtdq2ps %ymm6,%ymm6
- DB 196,98,125,24,5,72,131,2,0 ; vbroadcastss 0x28348(%rip),%ymm8 # 2c1ec <_sk_overlay_sse2_8bit+0x577>
+ DB 196,98,125,24,5,132,130,2,0 ; vbroadcastss 0x28284(%rip),%ymm8 # 2c128 <_sk_overlay_sse2_8bit+0x578>
DB 196,193,76,89,240 ; vmulps %ymm8,%ymm6,%ymm6
- DB 196,98,125,88,5,62,131,2,0 ; vpbroadcastd 0x2833e(%rip),%ymm8 # 2c1f0 <_sk_overlay_sse2_8bit+0x57b>
+ DB 196,98,125,88,5,122,130,2,0 ; vpbroadcastd 0x2827a(%rip),%ymm8 # 2c12c <_sk_overlay_sse2_8bit+0x57c>
DB 196,193,69,219,248 ; vpand %ymm8,%ymm7,%ymm7
DB 197,252,91,255 ; vcvtdq2ps %ymm7,%ymm7
- DB 196,98,125,24,5,48,131,2,0 ; vbroadcastss 0x28330(%rip),%ymm8 # 2c1f4 <_sk_overlay_sse2_8bit+0x57f>
+ DB 196,98,125,24,5,108,130,2,0 ; vbroadcastss 0x2826c(%rip),%ymm8 # 2c130 <_sk_overlay_sse2_8bit+0x580>
DB 196,193,68,89,248 ; vmulps %ymm8,%ymm7,%ymm7
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
@@ -3891,25 +3891,25 @@ _sk_gather_4444_hsw LABEL PROC
DB 65,15,183,4,88 ; movzwl (%r8,%rbx,2),%eax
DB 197,249,196,192,7 ; vpinsrw $0x7,%eax,%xmm0,%xmm0
DB 196,226,125,51,216 ; vpmovzxwd %xmm0,%ymm3
- DB 196,226,125,88,5,173,129,2,0 ; vpbroadcastd 0x281ad(%rip),%ymm0 # 2c1d8 <_sk_overlay_sse2_8bit+0x563>
+ DB 196,226,125,88,5,233,128,2,0 ; vpbroadcastd 0x280e9(%rip),%ymm0 # 2c114 <_sk_overlay_sse2_8bit+0x564>
DB 197,229,219,192 ; vpand %ymm0,%ymm3,%ymm0
DB 197,252,91,192 ; vcvtdq2ps %ymm0,%ymm0
- DB 196,226,125,24,13,160,129,2,0 ; vbroadcastss 0x281a0(%rip),%ymm1 # 2c1dc <_sk_overlay_sse2_8bit+0x567>
+ DB 196,226,125,24,13,220,128,2,0 ; vbroadcastss 0x280dc(%rip),%ymm1 # 2c118 <_sk_overlay_sse2_8bit+0x568>
DB 197,252,89,193 ; vmulps %ymm1,%ymm0,%ymm0
- DB 196,226,125,88,13,151,129,2,0 ; vpbroadcastd 0x28197(%rip),%ymm1 # 2c1e0 <_sk_overlay_sse2_8bit+0x56b>
+ DB 196,226,125,88,13,211,128,2,0 ; vpbroadcastd 0x280d3(%rip),%ymm1 # 2c11c <_sk_overlay_sse2_8bit+0x56c>
DB 197,229,219,201 ; vpand %ymm1,%ymm3,%ymm1
DB 197,252,91,201 ; vcvtdq2ps %ymm1,%ymm1
- DB 196,226,125,24,21,138,129,2,0 ; vbroadcastss 0x2818a(%rip),%ymm2 # 2c1e4 <_sk_overlay_sse2_8bit+0x56f>
+ DB 196,226,125,24,21,198,128,2,0 ; vbroadcastss 0x280c6(%rip),%ymm2 # 2c120 <_sk_overlay_sse2_8bit+0x570>
DB 197,244,89,202 ; vmulps %ymm2,%ymm1,%ymm1
- DB 196,226,125,88,21,129,129,2,0 ; vpbroadcastd 0x28181(%rip),%ymm2 # 2c1e8 <_sk_overlay_sse2_8bit+0x573>
+ DB 196,226,125,88,21,189,128,2,0 ; vpbroadcastd 0x280bd(%rip),%ymm2 # 2c124 <_sk_overlay_sse2_8bit+0x574>
DB 197,229,219,210 ; vpand %ymm2,%ymm3,%ymm2
DB 197,252,91,210 ; vcvtdq2ps %ymm2,%ymm2
- DB 196,98,125,24,5,116,129,2,0 ; vbroadcastss 0x28174(%rip),%ymm8 # 2c1ec <_sk_overlay_sse2_8bit+0x577>
+ DB 196,98,125,24,5,176,128,2,0 ; vbroadcastss 0x280b0(%rip),%ymm8 # 2c128 <_sk_overlay_sse2_8bit+0x578>
DB 196,193,108,89,208 ; vmulps %ymm8,%ymm2,%ymm2
- DB 196,98,125,88,5,106,129,2,0 ; vpbroadcastd 0x2816a(%rip),%ymm8 # 2c1f0 <_sk_overlay_sse2_8bit+0x57b>
+ DB 196,98,125,88,5,166,128,2,0 ; vpbroadcastd 0x280a6(%rip),%ymm8 # 2c12c <_sk_overlay_sse2_8bit+0x57c>
DB 196,193,101,219,216 ; vpand %ymm8,%ymm3,%ymm3
DB 197,252,91,219 ; vcvtdq2ps %ymm3,%ymm3
- DB 196,98,125,24,5,92,129,2,0 ; vbroadcastss 0x2815c(%rip),%ymm8 # 2c1f4 <_sk_overlay_sse2_8bit+0x57f>
+ DB 196,98,125,24,5,152,128,2,0 ; vbroadcastss 0x28098(%rip),%ymm8 # 2c130 <_sk_overlay_sse2_8bit+0x580>
DB 196,193,100,89,216 ; vmulps %ymm8,%ymm3,%ymm3
DB 72,173 ; lods %ds:(%rsi),%rax
DB 91 ; pop %rbx
@@ -3927,7 +3927,7 @@ _sk_store_4444_hsw LABEL PROC
DB 77,1,192 ; add %r8,%r8
DB 76,3,0 ; add (%rax),%r8
DB 76,99,218 ; movslq %edx,%r11
- DB 196,98,125,24,5,49,129,2,0 ; vbroadcastss 0x28131(%rip),%ymm8 # 2c1f8 <_sk_overlay_sse2_8bit+0x583>
+ DB 196,98,125,24,5,109,128,2,0 ; vbroadcastss 0x2806d(%rip),%ymm8 # 2c134 <_sk_overlay_sse2_8bit+0x584>
DB 196,65,124,89,200 ; vmulps %ymm8,%ymm0,%ymm9
DB 196,65,125,91,201 ; vcvtps2dq %ymm9,%ymm9
DB 196,193,53,114,241,12 ; vpslld $0xc,%ymm9,%ymm9
@@ -4006,14 +4006,14 @@ _sk_load_8888_hsw LABEL PROC
DB 72,133,255 ; test %rdi,%rdi
DB 117,86 ; jne 4216 <_sk_load_8888_hsw+0x72>
DB 196,129,126,111,28,152 ; vmovdqu (%r8,%r11,4),%ymm3
- DB 197,229,219,5,178,129,2,0 ; vpand 0x281b2(%rip),%ymm3,%ymm0 # 2c380 <_sk_overlay_sse2_8bit+0x70b>
+ DB 197,229,219,5,242,128,2,0 ; vpand 0x280f2(%rip),%ymm3,%ymm0 # 2c2c0 <_sk_overlay_sse2_8bit+0x710>
DB 197,252,91,192 ; vcvtdq2ps %ymm0,%ymm0
- DB 196,98,125,24,5,125,127,2,0 ; vbroadcastss 0x27f7d(%rip),%ymm8 # 2c158 <_sk_overlay_sse2_8bit+0x4e3>
+ DB 196,98,125,24,5,185,126,2,0 ; vbroadcastss 0x27eb9(%rip),%ymm8 # 2c094 <_sk_overlay_sse2_8bit+0x4e4>
DB 196,193,124,89,192 ; vmulps %ymm8,%ymm0,%ymm0
- DB 196,226,101,0,13,183,129,2,0 ; vpshufb 0x281b7(%rip),%ymm3,%ymm1 # 2c3a0 <_sk_overlay_sse2_8bit+0x72b>
+ DB 196,226,101,0,13,247,128,2,0 ; vpshufb 0x280f7(%rip),%ymm3,%ymm1 # 2c2e0 <_sk_overlay_sse2_8bit+0x730>
DB 197,252,91,201 ; vcvtdq2ps %ymm1,%ymm1
DB 196,193,116,89,200 ; vmulps %ymm8,%ymm1,%ymm1
- DB 196,226,101,0,21,197,129,2,0 ; vpshufb 0x281c5(%rip),%ymm3,%ymm2 # 2c3c0 <_sk_overlay_sse2_8bit+0x74b>
+ DB 196,226,101,0,21,5,129,2,0 ; vpshufb 0x28105(%rip),%ymm3,%ymm2 # 2c300 <_sk_overlay_sse2_8bit+0x750>
DB 197,252,91,210 ; vcvtdq2ps %ymm2,%ymm2
DB 196,193,108,89,208 ; vmulps %ymm8,%ymm2,%ymm2
DB 197,229,114,211,24 ; vpsrld $0x18,%ymm3,%ymm3
@@ -4087,14 +4087,14 @@ _sk_load_8888_dst_hsw LABEL PROC
DB 72,133,255 ; test %rdi,%rdi
DB 117,86 ; jne 434a <_sk_load_8888_dst_hsw+0x72>
DB 196,129,126,111,60,152 ; vmovdqu (%r8,%r11,4),%ymm7
- DB 197,197,219,37,222,128,2,0 ; vpand 0x280de(%rip),%ymm7,%ymm4 # 2c3e0 <_sk_overlay_sse2_8bit+0x76b>
+ DB 197,197,219,37,30,128,2,0 ; vpand 0x2801e(%rip),%ymm7,%ymm4 # 2c320 <_sk_overlay_sse2_8bit+0x770>
DB 197,252,91,228 ; vcvtdq2ps %ymm4,%ymm4
- DB 196,98,125,24,5,73,126,2,0 ; vbroadcastss 0x27e49(%rip),%ymm8 # 2c158 <_sk_overlay_sse2_8bit+0x4e3>
+ DB 196,98,125,24,5,133,125,2,0 ; vbroadcastss 0x27d85(%rip),%ymm8 # 2c094 <_sk_overlay_sse2_8bit+0x4e4>
DB 196,193,92,89,224 ; vmulps %ymm8,%ymm4,%ymm4
- DB 196,226,69,0,45,227,128,2,0 ; vpshufb 0x280e3(%rip),%ymm7,%ymm5 # 2c400 <_sk_overlay_sse2_8bit+0x78b>
+ DB 196,226,69,0,45,35,128,2,0 ; vpshufb 0x28023(%rip),%ymm7,%ymm5 # 2c340 <_sk_overlay_sse2_8bit+0x790>
DB 197,252,91,237 ; vcvtdq2ps %ymm5,%ymm5
DB 196,193,84,89,232 ; vmulps %ymm8,%ymm5,%ymm5
- DB 196,226,69,0,53,241,128,2,0 ; vpshufb 0x280f1(%rip),%ymm7,%ymm6 # 2c420 <_sk_overlay_sse2_8bit+0x7ab>
+ DB 196,226,69,0,53,49,128,2,0 ; vpshufb 0x28031(%rip),%ymm7,%ymm6 # 2c360 <_sk_overlay_sse2_8bit+0x7b0>
DB 197,252,91,246 ; vcvtdq2ps %ymm6,%ymm6
DB 196,193,76,89,240 ; vmulps %ymm8,%ymm6,%ymm6
DB 197,197,114,215,24 ; vpsrld $0x18,%ymm7,%ymm7
@@ -4167,14 +4167,14 @@ _sk_gather_8888_hsw LABEL PROC
DB 197,245,254,192 ; vpaddd %ymm0,%ymm1,%ymm0
DB 197,245,118,201 ; vpcmpeqd %ymm1,%ymm1,%ymm1
DB 196,194,117,144,28,128 ; vpgatherdd %ymm1,(%r8,%ymm0,4),%ymm3
- DB 197,229,219,5,6,128,2,0 ; vpand 0x28006(%rip),%ymm3,%ymm0 # 2c440 <_sk_overlay_sse2_8bit+0x7cb>
+ DB 197,229,219,5,70,127,2,0 ; vpand 0x27f46(%rip),%ymm3,%ymm0 # 2c380 <_sk_overlay_sse2_8bit+0x7d0>
DB 197,252,91,192 ; vcvtdq2ps %ymm0,%ymm0
- DB 196,98,125,24,5,17,125,2,0 ; vbroadcastss 0x27d11(%rip),%ymm8 # 2c158 <_sk_overlay_sse2_8bit+0x4e3>
+ DB 196,98,125,24,5,77,124,2,0 ; vbroadcastss 0x27c4d(%rip),%ymm8 # 2c094 <_sk_overlay_sse2_8bit+0x4e4>
DB 196,193,124,89,192 ; vmulps %ymm8,%ymm0,%ymm0
- DB 196,226,101,0,13,11,128,2,0 ; vpshufb 0x2800b(%rip),%ymm3,%ymm1 # 2c460 <_sk_overlay_sse2_8bit+0x7eb>
+ DB 196,226,101,0,13,75,127,2,0 ; vpshufb 0x27f4b(%rip),%ymm3,%ymm1 # 2c3a0 <_sk_overlay_sse2_8bit+0x7f0>
DB 197,252,91,201 ; vcvtdq2ps %ymm1,%ymm1
DB 196,193,116,89,200 ; vmulps %ymm8,%ymm1,%ymm1
- DB 196,226,101,0,21,25,128,2,0 ; vpshufb 0x28019(%rip),%ymm3,%ymm2 # 2c480 <_sk_overlay_sse2_8bit+0x80b>
+ DB 196,226,101,0,21,89,127,2,0 ; vpshufb 0x27f59(%rip),%ymm3,%ymm2 # 2c3c0 <_sk_overlay_sse2_8bit+0x810>
DB 197,252,91,210 ; vcvtdq2ps %ymm2,%ymm2
DB 196,193,108,89,208 ; vmulps %ymm8,%ymm2,%ymm2
DB 197,229,114,211,24 ; vpsrld $0x18,%ymm3,%ymm3
@@ -4192,7 +4192,7 @@ _sk_store_8888_hsw LABEL PROC
DB 73,193,224,2 ; shl $0x2,%r8
DB 76,3,0 ; add (%rax),%r8
DB 76,99,218 ; movslq %edx,%r11
- DB 196,98,125,24,5,110,124,2,0 ; vbroadcastss 0x27c6e(%rip),%ymm8 # 2c110 <_sk_overlay_sse2_8bit+0x49b>
+ DB 196,98,125,24,5,170,123,2,0 ; vbroadcastss 0x27baa(%rip),%ymm8 # 2c04c <_sk_overlay_sse2_8bit+0x49c>
DB 196,65,124,89,200 ; vmulps %ymm8,%ymm0,%ymm9
DB 196,65,125,91,201 ; vcvtps2dq %ymm9,%ymm9
DB 196,65,116,89,208 ; vmulps %ymm8,%ymm1,%ymm10
@@ -4269,14 +4269,14 @@ _sk_load_bgra_hsw LABEL PROC
DB 72,133,255 ; test %rdi,%rdi
DB 117,86 ; jne 45f6 <_sk_load_bgra_hsw+0x72>
DB 196,129,126,111,28,152 ; vmovdqu (%r8,%r11,4),%ymm3
- DB 197,229,219,5,242,126,2,0 ; vpand 0x27ef2(%rip),%ymm3,%ymm0 # 2c4a0 <_sk_overlay_sse2_8bit+0x82b>
+ DB 197,229,219,5,50,126,2,0 ; vpand 0x27e32(%rip),%ymm3,%ymm0 # 2c3e0 <_sk_overlay_sse2_8bit+0x830>
DB 197,252,91,192 ; vcvtdq2ps %ymm0,%ymm0
- DB 196,98,125,24,5,157,123,2,0 ; vbroadcastss 0x27b9d(%rip),%ymm8 # 2c158 <_sk_overlay_sse2_8bit+0x4e3>
+ DB 196,98,125,24,5,217,122,2,0 ; vbroadcastss 0x27ad9(%rip),%ymm8 # 2c094 <_sk_overlay_sse2_8bit+0x4e4>
DB 196,193,124,89,208 ; vmulps %ymm8,%ymm0,%ymm2
- DB 196,226,101,0,5,247,126,2,0 ; vpshufb 0x27ef7(%rip),%ymm3,%ymm0 # 2c4c0 <_sk_overlay_sse2_8bit+0x84b>
+ DB 196,226,101,0,5,55,126,2,0 ; vpshufb 0x27e37(%rip),%ymm3,%ymm0 # 2c400 <_sk_overlay_sse2_8bit+0x850>
DB 197,252,91,192 ; vcvtdq2ps %ymm0,%ymm0
DB 196,193,124,89,200 ; vmulps %ymm8,%ymm0,%ymm1
- DB 196,226,101,0,5,5,127,2,0 ; vpshufb 0x27f05(%rip),%ymm3,%ymm0 # 2c4e0 <_sk_overlay_sse2_8bit+0x86b>
+ DB 196,226,101,0,5,69,126,2,0 ; vpshufb 0x27e45(%rip),%ymm3,%ymm0 # 2c420 <_sk_overlay_sse2_8bit+0x870>
DB 197,252,91,192 ; vcvtdq2ps %ymm0,%ymm0
DB 196,193,124,89,192 ; vmulps %ymm8,%ymm0,%ymm0
DB 197,229,114,211,24 ; vpsrld $0x18,%ymm3,%ymm3
@@ -4350,14 +4350,14 @@ _sk_load_bgra_dst_hsw LABEL PROC
DB 72,133,255 ; test %rdi,%rdi
DB 117,86 ; jne 472a <_sk_load_bgra_dst_hsw+0x72>
DB 196,129,126,111,60,152 ; vmovdqu (%r8,%r11,4),%ymm7
- DB 197,197,219,37,30,126,2,0 ; vpand 0x27e1e(%rip),%ymm7,%ymm4 # 2c500 <_sk_overlay_sse2_8bit+0x88b>
+ DB 197,197,219,37,94,125,2,0 ; vpand 0x27d5e(%rip),%ymm7,%ymm4 # 2c440 <_sk_overlay_sse2_8bit+0x890>
DB 197,252,91,228 ; vcvtdq2ps %ymm4,%ymm4
- DB 196,98,125,24,5,105,122,2,0 ; vbroadcastss 0x27a69(%rip),%ymm8 # 2c158 <_sk_overlay_sse2_8bit+0x4e3>
+ DB 196,98,125,24,5,165,121,2,0 ; vbroadcastss 0x279a5(%rip),%ymm8 # 2c094 <_sk_overlay_sse2_8bit+0x4e4>
DB 196,193,92,89,240 ; vmulps %ymm8,%ymm4,%ymm6
- DB 196,226,69,0,37,35,126,2,0 ; vpshufb 0x27e23(%rip),%ymm7,%ymm4 # 2c520 <_sk_overlay_sse2_8bit+0x8ab>
+ DB 196,226,69,0,37,99,125,2,0 ; vpshufb 0x27d63(%rip),%ymm7,%ymm4 # 2c460 <_sk_overlay_sse2_8bit+0x8b0>
DB 197,252,91,228 ; vcvtdq2ps %ymm4,%ymm4
DB 196,193,92,89,232 ; vmulps %ymm8,%ymm4,%ymm5
- DB 196,226,69,0,37,49,126,2,0 ; vpshufb 0x27e31(%rip),%ymm7,%ymm4 # 2c540 <_sk_overlay_sse2_8bit+0x8cb>
+ DB 196,226,69,0,37,113,125,2,0 ; vpshufb 0x27d71(%rip),%ymm7,%ymm4 # 2c480 <_sk_overlay_sse2_8bit+0x8d0>
DB 197,252,91,228 ; vcvtdq2ps %ymm4,%ymm4
DB 196,193,92,89,224 ; vmulps %ymm8,%ymm4,%ymm4
DB 197,197,114,215,24 ; vpsrld $0x18,%ymm7,%ymm7
@@ -4430,14 +4430,14 @@ _sk_gather_bgra_hsw LABEL PROC
DB 197,245,254,192 ; vpaddd %ymm0,%ymm1,%ymm0
DB 197,245,118,201 ; vpcmpeqd %ymm1,%ymm1,%ymm1
DB 196,194,117,144,28,128 ; vpgatherdd %ymm1,(%r8,%ymm0,4),%ymm3
- DB 197,229,219,5,70,125,2,0 ; vpand 0x27d46(%rip),%ymm3,%ymm0 # 2c560 <_sk_overlay_sse2_8bit+0x8eb>
+ DB 197,229,219,5,134,124,2,0 ; vpand 0x27c86(%rip),%ymm3,%ymm0 # 2c4a0 <_sk_overlay_sse2_8bit+0x8f0>
DB 197,252,91,192 ; vcvtdq2ps %ymm0,%ymm0
- DB 196,98,125,24,5,49,121,2,0 ; vbroadcastss 0x27931(%rip),%ymm8 # 2c158 <_sk_overlay_sse2_8bit+0x4e3>
+ DB 196,98,125,24,5,109,120,2,0 ; vbroadcastss 0x2786d(%rip),%ymm8 # 2c094 <_sk_overlay_sse2_8bit+0x4e4>
DB 196,193,124,89,208 ; vmulps %ymm8,%ymm0,%ymm2
- DB 196,226,101,0,5,75,125,2,0 ; vpshufb 0x27d4b(%rip),%ymm3,%ymm0 # 2c580 <_sk_overlay_sse2_8bit+0x90b>
+ DB 196,226,101,0,5,139,124,2,0 ; vpshufb 0x27c8b(%rip),%ymm3,%ymm0 # 2c4c0 <_sk_overlay_sse2_8bit+0x910>
DB 197,252,91,192 ; vcvtdq2ps %ymm0,%ymm0
DB 196,193,124,89,200 ; vmulps %ymm8,%ymm0,%ymm1
- DB 196,226,101,0,5,89,125,2,0 ; vpshufb 0x27d59(%rip),%ymm3,%ymm0 # 2c5a0 <_sk_overlay_sse2_8bit+0x92b>
+ DB 196,226,101,0,5,153,124,2,0 ; vpshufb 0x27c99(%rip),%ymm3,%ymm0 # 2c4e0 <_sk_overlay_sse2_8bit+0x930>
DB 197,252,91,192 ; vcvtdq2ps %ymm0,%ymm0
DB 196,193,124,89,192 ; vmulps %ymm8,%ymm0,%ymm0
DB 197,229,114,211,24 ; vpsrld $0x18,%ymm3,%ymm3
@@ -4455,7 +4455,7 @@ _sk_store_bgra_hsw LABEL PROC
DB 73,193,224,2 ; shl $0x2,%r8
DB 76,3,0 ; add (%rax),%r8
DB 76,99,218 ; movslq %edx,%r11
- DB 196,98,125,24,5,142,120,2,0 ; vbroadcastss 0x2788e(%rip),%ymm8 # 2c110 <_sk_overlay_sse2_8bit+0x49b>
+ DB 196,98,125,24,5,202,119,2,0 ; vbroadcastss 0x277ca(%rip),%ymm8 # 2c04c <_sk_overlay_sse2_8bit+0x49c>
DB 196,65,108,89,200 ; vmulps %ymm8,%ymm2,%ymm9
DB 196,65,125,91,201 ; vcvtps2dq %ymm9,%ymm9
DB 196,65,116,89,208 ; vmulps %ymm8,%ymm1,%ymm10
@@ -4753,7 +4753,7 @@ _sk_load_u16_be_hsw LABEL PROC
DB 197,241,235,192 ; vpor %xmm0,%xmm1,%xmm0
DB 196,226,125,51,192 ; vpmovzxwd %xmm0,%ymm0
DB 197,252,91,192 ; vcvtdq2ps %ymm0,%ymm0
- DB 196,98,125,24,21,59,116,2,0 ; vbroadcastss 0x2743b(%rip),%ymm10 # 2c174 <_sk_overlay_sse2_8bit+0x4ff>
+ DB 196,98,125,24,21,119,115,2,0 ; vbroadcastss 0x27377(%rip),%ymm10 # 2c0b0 <_sk_overlay_sse2_8bit+0x500>
DB 196,193,124,89,194 ; vmulps %ymm10,%ymm0,%ymm0
DB 197,185,109,202 ; vpunpckhqdq %xmm2,%xmm8,%xmm1
DB 197,233,113,241,8 ; vpsllw $0x8,%xmm1,%xmm2
@@ -4842,7 +4842,7 @@ _sk_load_rgb_u16_be_hsw LABEL PROC
DB 197,225,235,192 ; vpor %xmm0,%xmm3,%xmm0
DB 196,226,125,51,192 ; vpmovzxwd %xmm0,%ymm0
DB 197,252,91,192 ; vcvtdq2ps %ymm0,%ymm0
- DB 196,226,125,24,29,174,114,2,0 ; vbroadcastss 0x272ae(%rip),%ymm3 # 2c174 <_sk_overlay_sse2_8bit+0x4ff>
+ DB 196,226,125,24,29,234,113,2,0 ; vbroadcastss 0x271ea(%rip),%ymm3 # 2c0b0 <_sk_overlay_sse2_8bit+0x500>
DB 197,252,89,195 ; vmulps %ymm3,%ymm0,%ymm0
DB 197,185,109,201 ; vpunpckhqdq %xmm1,%xmm8,%xmm1
DB 197,233,113,241,8 ; vpsllw $0x8,%xmm1,%xmm2
@@ -4859,7 +4859,7 @@ _sk_load_rgb_u16_be_hsw LABEL PROC
DB 197,252,91,210 ; vcvtdq2ps %ymm2,%ymm2
DB 197,236,89,211 ; vmulps %ymm3,%ymm2,%ymm2
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,29,208,113,2,0 ; vbroadcastss 0x271d0(%rip),%ymm3 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,226,125,24,29,12,113,2,0 ; vbroadcastss 0x2710c(%rip),%ymm3 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 255,224 ; jmpq *%rax
DB 196,193,121,110,4,64 ; vmovd (%r8,%rax,2),%xmm0
DB 196,65,121,196,92,64,4,2 ; vpinsrw $0x2,0x4(%r8,%rax,2),%xmm0,%xmm11
@@ -4933,7 +4933,7 @@ _sk_store_u16_be_hsw LABEL PROC
DB 77,1,192 ; add %r8,%r8
DB 76,3,0 ; add (%rax),%r8
DB 73,99,193 ; movslq %r9d,%rax
- DB 196,98,125,24,5,144,113,2,0 ; vbroadcastss 0x27190(%rip),%ymm8 # 2c1fc <_sk_overlay_sse2_8bit+0x587>
+ DB 196,98,125,24,5,204,112,2,0 ; vbroadcastss 0x270cc(%rip),%ymm8 # 2c138 <_sk_overlay_sse2_8bit+0x588>
DB 196,65,124,89,200 ; vmulps %ymm8,%ymm0,%ymm9
DB 196,65,125,91,201 ; vcvtps2dq %ymm9,%ymm9
DB 196,67,125,25,202,1 ; vextractf128 $0x1,%ymm9,%xmm10
@@ -5190,7 +5190,7 @@ _sk_load_f32_dst_hsw LABEL PROC
DB 255,92,255,255 ; lcall *-0x1(%rdi,%rdi,8)
DB 255,70,255 ; incl -0x1(%rsi)
DB 255 ; (bad)
- DB 255,53,255,255,255,40 ; pushq 0x28ffffff(%rip) # 290054e4 <_sk_overlay_sse2_8bit+0x28fd986f>
+ DB 255,53,255,255,255,40 ; pushq 0x28ffffff(%rip) # 290054e4 <_sk_overlay_sse2_8bit+0x28fd9934>
DB 255 ; (bad)
DB 255 ; (bad)
DB 255 ; .byte 0xff
@@ -5309,7 +5309,7 @@ _sk_mirror_x_hsw LABEL PROC
DB 196,65,124,92,218 ; vsubps %ymm10,%ymm0,%ymm11
DB 196,193,58,88,192 ; vaddss %xmm8,%xmm8,%xmm0
DB 196,98,125,24,192 ; vbroadcastss %xmm0,%ymm8
- DB 197,178,89,5,75,106,2,0 ; vmulss 0x26a4b(%rip),%xmm9,%xmm0 # 2c0e0 <_sk_overlay_sse2_8bit+0x46b>
+ DB 197,178,89,5,135,105,2,0 ; vmulss 0x26987(%rip),%xmm9,%xmm0 # 2c01c <_sk_overlay_sse2_8bit+0x46c>
DB 196,226,125,24,192 ; vbroadcastss %xmm0,%ymm0
DB 197,164,89,192 ; vmulps %ymm0,%ymm11,%ymm0
DB 196,227,125,8,192,1 ; vroundps $0x1,%ymm0,%ymm0
@@ -5334,7 +5334,7 @@ _sk_mirror_y_hsw LABEL PROC
DB 196,65,116,92,218 ; vsubps %ymm10,%ymm1,%ymm11
DB 196,193,58,88,200 ; vaddss %xmm8,%xmm8,%xmm1
DB 196,98,125,24,193 ; vbroadcastss %xmm1,%ymm8
- DB 197,178,89,13,231,105,2,0 ; vmulss 0x269e7(%rip),%xmm9,%xmm1 # 2c0e0 <_sk_overlay_sse2_8bit+0x46b>
+ DB 197,178,89,13,35,105,2,0 ; vmulss 0x26923(%rip),%xmm9,%xmm1 # 2c01c <_sk_overlay_sse2_8bit+0x46c>
DB 196,226,125,24,201 ; vbroadcastss %xmm1,%ymm1
DB 197,164,89,201 ; vmulps %ymm1,%ymm11,%ymm1
DB 196,227,125,8,201,1 ; vroundps $0x1,%ymm1,%ymm1
@@ -5354,7 +5354,7 @@ PUBLIC _sk_clamp_x_1_hsw
_sk_clamp_x_1_hsw LABEL PROC
DB 196,65,60,87,192 ; vxorps %ymm8,%ymm8,%ymm8
DB 197,188,95,192 ; vmaxps %ymm0,%ymm8,%ymm0
- DB 196,98,125,24,5,156,105,2,0 ; vbroadcastss 0x2699c(%rip),%ymm8 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,98,125,24,5,216,104,2,0 ; vbroadcastss 0x268d8(%rip),%ymm8 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 196,193,124,93,192 ; vminps %ymm8,%ymm0,%ymm0
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
@@ -5368,9 +5368,9 @@ _sk_repeat_x_1_hsw LABEL PROC
PUBLIC _sk_mirror_x_1_hsw
_sk_mirror_x_1_hsw LABEL PROC
- DB 196,98,125,24,5,147,105,2,0 ; vbroadcastss 0x26993(%rip),%ymm8 # 2c0fc <_sk_overlay_sse2_8bit+0x487>
+ DB 196,98,125,24,5,207,104,2,0 ; vbroadcastss 0x268cf(%rip),%ymm8 # 2c038 <_sk_overlay_sse2_8bit+0x488>
DB 196,193,124,88,192 ; vaddps %ymm8,%ymm0,%ymm0
- DB 196,98,125,24,13,105,105,2,0 ; vbroadcastss 0x26969(%rip),%ymm9 # 2c0e0 <_sk_overlay_sse2_8bit+0x46b>
+ DB 196,98,125,24,13,165,104,2,0 ; vbroadcastss 0x268a5(%rip),%ymm9 # 2c01c <_sk_overlay_sse2_8bit+0x46c>
DB 196,65,124,89,201 ; vmulps %ymm9,%ymm0,%ymm9
DB 196,67,125,8,201,1 ; vroundps $0x1,%ymm9,%ymm9
DB 196,65,52,88,201 ; vaddps %ymm9,%ymm9,%ymm9
@@ -5384,11 +5384,11 @@ _sk_mirror_x_1_hsw LABEL PROC
PUBLIC _sk_luminance_to_alpha_hsw
_sk_luminance_to_alpha_hsw LABEL PROC
- DB 196,226,125,24,29,85,106,2,0 ; vbroadcastss 0x26a55(%rip),%ymm3 # 2c200 <_sk_overlay_sse2_8bit+0x58b>
- DB 196,98,125,24,5,80,106,2,0 ; vbroadcastss 0x26a50(%rip),%ymm8 # 2c204 <_sk_overlay_sse2_8bit+0x58f>
+ DB 196,226,125,24,29,145,105,2,0 ; vbroadcastss 0x26991(%rip),%ymm3 # 2c13c <_sk_overlay_sse2_8bit+0x58c>
+ DB 196,98,125,24,5,140,105,2,0 ; vbroadcastss 0x2698c(%rip),%ymm8 # 2c140 <_sk_overlay_sse2_8bit+0x590>
DB 196,193,116,89,200 ; vmulps %ymm8,%ymm1,%ymm1
DB 196,226,125,184,203 ; vfmadd231ps %ymm3,%ymm0,%ymm1
- DB 196,226,125,24,29,65,106,2,0 ; vbroadcastss 0x26a41(%rip),%ymm3 # 2c208 <_sk_overlay_sse2_8bit+0x593>
+ DB 196,226,125,24,29,125,105,2,0 ; vbroadcastss 0x2697d(%rip),%ymm3 # 2c144 <_sk_overlay_sse2_8bit+0x594>
DB 196,226,109,168,217 ; vfmadd213ps %ymm1,%ymm2,%ymm3
DB 72,173 ; lods %ds:(%rsi),%rax
DB 197,252,87,192 ; vxorps %ymm0,%ymm0,%ymm0
@@ -5634,14 +5634,14 @@ _sk_evenly_spaced_gradient_hsw LABEL PROC
PUBLIC _sk_gauss_a_to_rgba_hsw
_sk_gauss_a_to_rgba_hsw LABEL PROC
- DB 196,226,125,24,5,75,102,2,0 ; vbroadcastss 0x2664b(%rip),%ymm0 # 2c20c <_sk_overlay_sse2_8bit+0x597>
- DB 196,226,125,24,13,70,102,2,0 ; vbroadcastss 0x26646(%rip),%ymm1 # 2c210 <_sk_overlay_sse2_8bit+0x59b>
+ DB 196,226,125,24,5,135,101,2,0 ; vbroadcastss 0x26587(%rip),%ymm0 # 2c148 <_sk_overlay_sse2_8bit+0x598>
+ DB 196,226,125,24,13,130,101,2,0 ; vbroadcastss 0x26582(%rip),%ymm1 # 2c14c <_sk_overlay_sse2_8bit+0x59c>
DB 196,226,101,168,200 ; vfmadd213ps %ymm0,%ymm3,%ymm1
- DB 196,226,125,24,5,60,102,2,0 ; vbroadcastss 0x2663c(%rip),%ymm0 # 2c214 <_sk_overlay_sse2_8bit+0x59f>
+ DB 196,226,125,24,5,120,101,2,0 ; vbroadcastss 0x26578(%rip),%ymm0 # 2c150 <_sk_overlay_sse2_8bit+0x5a0>
DB 196,226,101,184,193 ; vfmadd231ps %ymm1,%ymm3,%ymm0
- DB 196,226,125,24,13,50,102,2,0 ; vbroadcastss 0x26632(%rip),%ymm1 # 2c218 <_sk_overlay_sse2_8bit+0x5a3>
+ DB 196,226,125,24,13,110,101,2,0 ; vbroadcastss 0x2656e(%rip),%ymm1 # 2c154 <_sk_overlay_sse2_8bit+0x5a4>
DB 196,226,101,184,200 ; vfmadd231ps %ymm0,%ymm3,%ymm1
- DB 196,226,125,24,5,40,102,2,0 ; vbroadcastss 0x26628(%rip),%ymm0 # 2c21c <_sk_overlay_sse2_8bit+0x5a7>
+ DB 196,226,125,24,5,100,101,2,0 ; vbroadcastss 0x26564(%rip),%ymm0 # 2c158 <_sk_overlay_sse2_8bit+0x5a8>
DB 196,226,101,184,193 ; vfmadd231ps %ymm1,%ymm3,%ymm0
DB 72,173 ; lods %ds:(%rsi),%rax
DB 197,252,40,200 ; vmovaps %ymm0,%ymm1
@@ -5658,7 +5658,7 @@ _sk_gradient_hsw LABEL PROC
DB 76,139,72,72 ; mov 0x48(%rax),%r9
DB 197,244,87,201 ; vxorps %ymm1,%ymm1,%ymm1
DB 65,186,1,0,0,0 ; mov $0x1,%r10d
- DB 196,226,125,24,21,185,100,2,0 ; vbroadcastss 0x264b9(%rip),%ymm2 # 2c0e8 <_sk_overlay_sse2_8bit+0x473>
+ DB 196,226,125,24,21,245,99,2,0 ; vbroadcastss 0x263f5(%rip),%ymm2 # 2c024 <_sk_overlay_sse2_8bit+0x474>
DB 196,65,53,239,201 ; vpxor %ymm9,%ymm9,%ymm9
DB 196,130,125,24,28,145 ; vbroadcastss (%r9,%r10,4),%ymm3
DB 197,228,194,216,2 ; vcmpleps %ymm0,%ymm3,%ymm3
@@ -5749,24 +5749,24 @@ _sk_xy_to_unit_angle_hsw LABEL PROC
DB 196,65,52,95,226 ; vmaxps %ymm10,%ymm9,%ymm12
DB 196,65,36,94,220 ; vdivps %ymm12,%ymm11,%ymm11
DB 196,65,36,89,227 ; vmulps %ymm11,%ymm11,%ymm12
- DB 196,98,125,24,45,108,100,2,0 ; vbroadcastss 0x2646c(%rip),%ymm13 # 2c220 <_sk_overlay_sse2_8bit+0x5ab>
- DB 196,98,125,24,53,103,100,2,0 ; vbroadcastss 0x26467(%rip),%ymm14 # 2c224 <_sk_overlay_sse2_8bit+0x5af>
+ DB 196,98,125,24,45,168,99,2,0 ; vbroadcastss 0x263a8(%rip),%ymm13 # 2c15c <_sk_overlay_sse2_8bit+0x5ac>
+ DB 196,98,125,24,53,163,99,2,0 ; vbroadcastss 0x263a3(%rip),%ymm14 # 2c160 <_sk_overlay_sse2_8bit+0x5b0>
DB 196,66,29,184,245 ; vfmadd231ps %ymm13,%ymm12,%ymm14
- DB 196,98,125,24,45,93,100,2,0 ; vbroadcastss 0x2645d(%rip),%ymm13 # 2c228 <_sk_overlay_sse2_8bit+0x5b3>
+ DB 196,98,125,24,45,153,99,2,0 ; vbroadcastss 0x26399(%rip),%ymm13 # 2c164 <_sk_overlay_sse2_8bit+0x5b4>
DB 196,66,29,184,238 ; vfmadd231ps %ymm14,%ymm12,%ymm13
- DB 196,98,125,24,53,83,100,2,0 ; vbroadcastss 0x26453(%rip),%ymm14 # 2c22c <_sk_overlay_sse2_8bit+0x5b7>
+ DB 196,98,125,24,53,143,99,2,0 ; vbroadcastss 0x2638f(%rip),%ymm14 # 2c168 <_sk_overlay_sse2_8bit+0x5b8>
DB 196,66,29,184,245 ; vfmadd231ps %ymm13,%ymm12,%ymm14
DB 196,65,36,89,222 ; vmulps %ymm14,%ymm11,%ymm11
DB 196,65,52,194,202,1 ; vcmpltps %ymm10,%ymm9,%ymm9
- DB 196,98,125,24,21,62,100,2,0 ; vbroadcastss 0x2643e(%rip),%ymm10 # 2c230 <_sk_overlay_sse2_8bit+0x5bb>
+ DB 196,98,125,24,21,122,99,2,0 ; vbroadcastss 0x2637a(%rip),%ymm10 # 2c16c <_sk_overlay_sse2_8bit+0x5bc>
DB 196,65,44,92,211 ; vsubps %ymm11,%ymm10,%ymm10
DB 196,67,37,74,202,144 ; vblendvps %ymm9,%ymm10,%ymm11,%ymm9
DB 196,193,124,194,192,1 ; vcmpltps %ymm8,%ymm0,%ymm0
- DB 196,98,125,24,21,212,98,2,0 ; vbroadcastss 0x262d4(%rip),%ymm10 # 2c0e0 <_sk_overlay_sse2_8bit+0x46b>
+ DB 196,98,125,24,21,16,98,2,0 ; vbroadcastss 0x26210(%rip),%ymm10 # 2c01c <_sk_overlay_sse2_8bit+0x46c>
DB 196,65,44,92,209 ; vsubps %ymm9,%ymm10,%ymm10
DB 196,195,53,74,194,0 ; vblendvps %ymm0,%ymm10,%ymm9,%ymm0
DB 196,65,116,194,200,1 ; vcmpltps %ymm8,%ymm1,%ymm9
- DB 196,98,125,24,21,190,98,2,0 ; vbroadcastss 0x262be(%rip),%ymm10 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,98,125,24,21,250,97,2,0 ; vbroadcastss 0x261fa(%rip),%ymm10 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 197,44,92,208 ; vsubps %ymm0,%ymm10,%ymm10
DB 196,195,125,74,194,144 ; vblendvps %ymm9,%ymm10,%ymm0,%ymm0
DB 196,65,124,194,200,3 ; vcmpunordps %ymm8,%ymm0,%ymm9
@@ -5790,23 +5790,23 @@ _sk_xy_to_2pt_conical_quadratic_max_hsw LABEL PROC
DB 197,50,89,80,44 ; vmulss 0x2c(%rax),%xmm9,%xmm10
DB 196,66,125,24,210 ; vbroadcastss %xmm10,%ymm10
DB 197,44,88,208 ; vaddps %ymm0,%ymm10,%ymm10
- DB 196,98,125,24,29,190,99,2,0 ; vbroadcastss 0x263be(%rip),%ymm11 # 2c234 <_sk_overlay_sse2_8bit+0x5bf>
+ DB 196,98,125,24,29,250,98,2,0 ; vbroadcastss 0x262fa(%rip),%ymm11 # 2c170 <_sk_overlay_sse2_8bit+0x5c0>
DB 196,65,44,89,211 ; vmulps %ymm11,%ymm10,%ymm10
DB 197,116,89,217 ; vmulps %ymm1,%ymm1,%ymm11
DB 196,98,125,184,216 ; vfmadd231ps %ymm0,%ymm0,%ymm11
DB 196,193,50,89,193 ; vmulss %xmm9,%xmm9,%xmm0
DB 196,226,125,24,192 ; vbroadcastss %xmm0,%ymm0
DB 197,164,92,192 ; vsubps %ymm0,%ymm11,%ymm0
- DB 196,98,125,24,13,157,99,2,0 ; vbroadcastss 0x2639d(%rip),%ymm9 # 2c238 <_sk_overlay_sse2_8bit+0x5c3>
+ DB 196,98,125,24,13,217,98,2,0 ; vbroadcastss 0x262d9(%rip),%ymm9 # 2c174 <_sk_overlay_sse2_8bit+0x5c4>
DB 196,65,60,89,193 ; vmulps %ymm9,%ymm8,%ymm8
DB 197,188,89,192 ; vmulps %ymm0,%ymm8,%ymm0
DB 196,194,45,184,194 ; vfmadd231ps %ymm10,%ymm10,%ymm0
DB 197,252,81,192 ; vsqrtps %ymm0,%ymm0
DB 196,98,125,24,64,36 ; vbroadcastss 0x24(%rax),%ymm8
- DB 196,98,125,24,13,128,99,2,0 ; vbroadcastss 0x26380(%rip),%ymm9 # 2c23c <_sk_overlay_sse2_8bit+0x5c7>
+ DB 196,98,125,24,13,188,98,2,0 ; vbroadcastss 0x262bc(%rip),%ymm9 # 2c178 <_sk_overlay_sse2_8bit+0x5c8>
DB 196,65,44,87,201 ; vxorps %ymm9,%ymm10,%ymm9
DB 196,65,124,92,210 ; vsubps %ymm10,%ymm0,%ymm10
- DB 196,98,125,24,29,17,98,2,0 ; vbroadcastss 0x26211(%rip),%ymm11 # 2c0e0 <_sk_overlay_sse2_8bit+0x46b>
+ DB 196,98,125,24,29,77,97,2,0 ; vbroadcastss 0x2614d(%rip),%ymm11 # 2c01c <_sk_overlay_sse2_8bit+0x46c>
DB 196,65,60,89,195 ; vmulps %ymm11,%ymm8,%ymm8
DB 196,65,44,89,208 ; vmulps %ymm8,%ymm10,%ymm10
DB 197,180,92,192 ; vsubps %ymm0,%ymm9,%ymm0
@@ -5823,23 +5823,23 @@ _sk_xy_to_2pt_conical_quadratic_min_hsw LABEL PROC
DB 197,50,89,80,44 ; vmulss 0x2c(%rax),%xmm9,%xmm10
DB 196,66,125,24,210 ; vbroadcastss %xmm10,%ymm10
DB 197,44,88,208 ; vaddps %ymm0,%ymm10,%ymm10
- DB 196,98,125,24,29,38,99,2,0 ; vbroadcastss 0x26326(%rip),%ymm11 # 2c234 <_sk_overlay_sse2_8bit+0x5bf>
+ DB 196,98,125,24,29,98,98,2,0 ; vbroadcastss 0x26262(%rip),%ymm11 # 2c170 <_sk_overlay_sse2_8bit+0x5c0>
DB 196,65,44,89,211 ; vmulps %ymm11,%ymm10,%ymm10
DB 197,116,89,217 ; vmulps %ymm1,%ymm1,%ymm11
DB 196,98,125,184,216 ; vfmadd231ps %ymm0,%ymm0,%ymm11
DB 196,193,50,89,193 ; vmulss %xmm9,%xmm9,%xmm0
DB 196,226,125,24,192 ; vbroadcastss %xmm0,%ymm0
DB 197,164,92,192 ; vsubps %ymm0,%ymm11,%ymm0
- DB 196,98,125,24,13,5,99,2,0 ; vbroadcastss 0x26305(%rip),%ymm9 # 2c238 <_sk_overlay_sse2_8bit+0x5c3>
+ DB 196,98,125,24,13,65,98,2,0 ; vbroadcastss 0x26241(%rip),%ymm9 # 2c174 <_sk_overlay_sse2_8bit+0x5c4>
DB 196,65,60,89,193 ; vmulps %ymm9,%ymm8,%ymm8
DB 197,188,89,192 ; vmulps %ymm0,%ymm8,%ymm0
DB 196,194,45,184,194 ; vfmadd231ps %ymm10,%ymm10,%ymm0
DB 197,252,81,192 ; vsqrtps %ymm0,%ymm0
DB 196,98,125,24,64,36 ; vbroadcastss 0x24(%rax),%ymm8
- DB 196,98,125,24,13,232,98,2,0 ; vbroadcastss 0x262e8(%rip),%ymm9 # 2c23c <_sk_overlay_sse2_8bit+0x5c7>
+ DB 196,98,125,24,13,36,98,2,0 ; vbroadcastss 0x26224(%rip),%ymm9 # 2c178 <_sk_overlay_sse2_8bit+0x5c8>
DB 196,65,44,87,201 ; vxorps %ymm9,%ymm10,%ymm9
DB 196,65,124,92,210 ; vsubps %ymm10,%ymm0,%ymm10
- DB 196,98,125,24,29,121,97,2,0 ; vbroadcastss 0x26179(%rip),%ymm11 # 2c0e0 <_sk_overlay_sse2_8bit+0x46b>
+ DB 196,98,125,24,29,181,96,2,0 ; vbroadcastss 0x260b5(%rip),%ymm11 # 2c01c <_sk_overlay_sse2_8bit+0x46c>
DB 196,65,60,89,195 ; vmulps %ymm11,%ymm8,%ymm8
DB 196,65,44,89,208 ; vmulps %ymm8,%ymm10,%ymm10
DB 197,180,92,192 ; vsubps %ymm0,%ymm9,%ymm0
@@ -5855,14 +5855,14 @@ _sk_xy_to_2pt_conical_linear_hsw LABEL PROC
DB 197,58,89,72,44 ; vmulss 0x2c(%rax),%xmm8,%xmm9
DB 196,66,125,24,201 ; vbroadcastss %xmm9,%ymm9
DB 197,52,88,200 ; vaddps %ymm0,%ymm9,%ymm9
- DB 196,98,125,24,21,148,98,2,0 ; vbroadcastss 0x26294(%rip),%ymm10 # 2c234 <_sk_overlay_sse2_8bit+0x5bf>
+ DB 196,98,125,24,21,208,97,2,0 ; vbroadcastss 0x261d0(%rip),%ymm10 # 2c170 <_sk_overlay_sse2_8bit+0x5c0>
DB 196,65,52,89,202 ; vmulps %ymm10,%ymm9,%ymm9
DB 197,116,89,209 ; vmulps %ymm1,%ymm1,%ymm10
DB 196,98,125,184,208 ; vfmadd231ps %ymm0,%ymm0,%ymm10
DB 196,193,58,89,192 ; vmulss %xmm8,%xmm8,%xmm0
DB 196,226,125,24,192 ; vbroadcastss %xmm0,%ymm0
DB 197,172,92,192 ; vsubps %ymm0,%ymm10,%ymm0
- DB 196,98,125,24,5,119,98,2,0 ; vbroadcastss 0x26277(%rip),%ymm8 # 2c23c <_sk_overlay_sse2_8bit+0x5c7>
+ DB 196,98,125,24,5,179,97,2,0 ; vbroadcastss 0x261b3(%rip),%ymm8 # 2c178 <_sk_overlay_sse2_8bit+0x5c8>
DB 196,193,124,87,192 ; vxorps %ymm8,%ymm0,%ymm0
DB 196,193,124,94,193 ; vdivps %ymm9,%ymm0,%ymm0
DB 72,173 ; lods %ds:(%rsi),%rax
@@ -5896,7 +5896,7 @@ _sk_apply_vector_mask_hsw LABEL PROC
PUBLIC _sk_save_xy_hsw
_sk_save_xy_hsw LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,98,125,24,5,183,96,2,0 ; vbroadcastss 0x260b7(%rip),%ymm8 # 2c0e0 <_sk_overlay_sse2_8bit+0x46b>
+ DB 196,98,125,24,5,243,95,2,0 ; vbroadcastss 0x25ff3(%rip),%ymm8 # 2c01c <_sk_overlay_sse2_8bit+0x46c>
DB 196,65,124,88,200 ; vaddps %ymm8,%ymm0,%ymm9
DB 196,67,125,8,209,1 ; vroundps $0x1,%ymm9,%ymm10
DB 196,65,52,92,202 ; vsubps %ymm10,%ymm9,%ymm9
@@ -5926,9 +5926,9 @@ _sk_accumulate_hsw LABEL PROC
PUBLIC _sk_bilinear_nx_hsw
_sk_bilinear_nx_hsw LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,5,167,97,2,0 ; vbroadcastss 0x261a7(%rip),%ymm0 # 2c240 <_sk_overlay_sse2_8bit+0x5cb>
+ DB 196,226,125,24,5,227,96,2,0 ; vbroadcastss 0x260e3(%rip),%ymm0 # 2c17c <_sk_overlay_sse2_8bit+0x5cc>
DB 197,252,88,0 ; vaddps (%rax),%ymm0,%ymm0
- DB 196,98,125,24,5,62,96,2,0 ; vbroadcastss 0x2603e(%rip),%ymm8 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,98,125,24,5,122,95,2,0 ; vbroadcastss 0x25f7a(%rip),%ymm8 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 197,60,92,64,64 ; vsubps 0x40(%rax),%ymm8,%ymm8
DB 197,124,17,128,128,0,0,0 ; vmovups %ymm8,0x80(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
@@ -5937,7 +5937,7 @@ _sk_bilinear_nx_hsw LABEL PROC
PUBLIC _sk_bilinear_px_hsw
_sk_bilinear_px_hsw LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,5,30,96,2,0 ; vbroadcastss 0x2601e(%rip),%ymm0 # 2c0e0 <_sk_overlay_sse2_8bit+0x46b>
+ DB 196,226,125,24,5,90,95,2,0 ; vbroadcastss 0x25f5a(%rip),%ymm0 # 2c01c <_sk_overlay_sse2_8bit+0x46c>
DB 197,252,88,0 ; vaddps (%rax),%ymm0,%ymm0
DB 197,124,16,64,64 ; vmovups 0x40(%rax),%ymm8
DB 197,124,17,128,128,0,0,0 ; vmovups %ymm8,0x80(%rax)
@@ -5947,9 +5947,9 @@ _sk_bilinear_px_hsw LABEL PROC
PUBLIC _sk_bilinear_ny_hsw
_sk_bilinear_ny_hsw LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,13,94,97,2,0 ; vbroadcastss 0x2615e(%rip),%ymm1 # 2c240 <_sk_overlay_sse2_8bit+0x5cb>
+ DB 196,226,125,24,13,154,96,2,0 ; vbroadcastss 0x2609a(%rip),%ymm1 # 2c17c <_sk_overlay_sse2_8bit+0x5cc>
DB 197,244,88,72,32 ; vaddps 0x20(%rax),%ymm1,%ymm1
- DB 196,98,125,24,5,244,95,2,0 ; vbroadcastss 0x25ff4(%rip),%ymm8 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,98,125,24,5,48,95,2,0 ; vbroadcastss 0x25f30(%rip),%ymm8 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 197,60,92,64,96 ; vsubps 0x60(%rax),%ymm8,%ymm8
DB 197,124,17,128,160,0,0,0 ; vmovups %ymm8,0xa0(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
@@ -5958,7 +5958,7 @@ _sk_bilinear_ny_hsw LABEL PROC
PUBLIC _sk_bilinear_py_hsw
_sk_bilinear_py_hsw LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,13,212,95,2,0 ; vbroadcastss 0x25fd4(%rip),%ymm1 # 2c0e0 <_sk_overlay_sse2_8bit+0x46b>
+ DB 196,226,125,24,13,16,95,2,0 ; vbroadcastss 0x25f10(%rip),%ymm1 # 2c01c <_sk_overlay_sse2_8bit+0x46c>
DB 197,244,88,72,32 ; vaddps 0x20(%rax),%ymm1,%ymm1
DB 197,124,16,64,96 ; vmovups 0x60(%rax),%ymm8
DB 197,124,17,128,160,0,0,0 ; vmovups %ymm8,0xa0(%rax)
@@ -5968,13 +5968,13 @@ _sk_bilinear_py_hsw LABEL PROC
PUBLIC _sk_bicubic_n3x_hsw
_sk_bicubic_n3x_hsw LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,5,23,97,2,0 ; vbroadcastss 0x26117(%rip),%ymm0 # 2c244 <_sk_overlay_sse2_8bit+0x5cf>
+ DB 196,226,125,24,5,83,96,2,0 ; vbroadcastss 0x26053(%rip),%ymm0 # 2c180 <_sk_overlay_sse2_8bit+0x5d0>
DB 197,252,88,0 ; vaddps (%rax),%ymm0,%ymm0
- DB 196,98,125,24,5,170,95,2,0 ; vbroadcastss 0x25faa(%rip),%ymm8 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,98,125,24,5,230,94,2,0 ; vbroadcastss 0x25ee6(%rip),%ymm8 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 197,60,92,64,64 ; vsubps 0x40(%rax),%ymm8,%ymm8
DB 196,65,60,89,200 ; vmulps %ymm8,%ymm8,%ymm9
- DB 196,98,125,24,21,7,96,2,0 ; vbroadcastss 0x26007(%rip),%ymm10 # 2c154 <_sk_overlay_sse2_8bit+0x4df>
- DB 196,98,125,24,29,242,96,2,0 ; vbroadcastss 0x260f2(%rip),%ymm11 # 2c248 <_sk_overlay_sse2_8bit+0x5d3>
+ DB 196,98,125,24,21,67,95,2,0 ; vbroadcastss 0x25f43(%rip),%ymm10 # 2c090 <_sk_overlay_sse2_8bit+0x4e0>
+ DB 196,98,125,24,29,46,96,2,0 ; vbroadcastss 0x2602e(%rip),%ymm11 # 2c184 <_sk_overlay_sse2_8bit+0x5d4>
DB 196,66,61,168,218 ; vfmadd213ps %ymm10,%ymm8,%ymm11
DB 196,65,36,89,193 ; vmulps %ymm9,%ymm11,%ymm8
DB 197,124,17,128,128,0,0,0 ; vmovups %ymm8,0x80(%rax)
@@ -5984,16 +5984,16 @@ _sk_bicubic_n3x_hsw LABEL PROC
PUBLIC _sk_bicubic_n1x_hsw
_sk_bicubic_n1x_hsw LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,5,201,96,2,0 ; vbroadcastss 0x260c9(%rip),%ymm0 # 2c240 <_sk_overlay_sse2_8bit+0x5cb>
+ DB 196,226,125,24,5,5,96,2,0 ; vbroadcastss 0x26005(%rip),%ymm0 # 2c17c <_sk_overlay_sse2_8bit+0x5cc>
DB 197,252,88,0 ; vaddps (%rax),%ymm0,%ymm0
- DB 196,98,125,24,5,96,95,2,0 ; vbroadcastss 0x25f60(%rip),%ymm8 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,98,125,24,5,156,94,2,0 ; vbroadcastss 0x25e9c(%rip),%ymm8 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 197,60,92,64,64 ; vsubps 0x40(%rax),%ymm8,%ymm8
- DB 196,98,125,24,13,186,96,2,0 ; vbroadcastss 0x260ba(%rip),%ymm9 # 2c24c <_sk_overlay_sse2_8bit+0x5d7>
- DB 196,98,125,24,21,181,96,2,0 ; vbroadcastss 0x260b5(%rip),%ymm10 # 2c250 <_sk_overlay_sse2_8bit+0x5db>
+ DB 196,98,125,24,13,246,95,2,0 ; vbroadcastss 0x25ff6(%rip),%ymm9 # 2c188 <_sk_overlay_sse2_8bit+0x5d8>
+ DB 196,98,125,24,21,241,95,2,0 ; vbroadcastss 0x25ff1(%rip),%ymm10 # 2c18c <_sk_overlay_sse2_8bit+0x5dc>
DB 196,66,61,168,209 ; vfmadd213ps %ymm9,%ymm8,%ymm10
- DB 196,98,125,24,13,55,95,2,0 ; vbroadcastss 0x25f37(%rip),%ymm9 # 2c0e0 <_sk_overlay_sse2_8bit+0x46b>
+ DB 196,98,125,24,13,115,94,2,0 ; vbroadcastss 0x25e73(%rip),%ymm9 # 2c01c <_sk_overlay_sse2_8bit+0x46c>
DB 196,66,61,184,202 ; vfmadd231ps %ymm10,%ymm8,%ymm9
- DB 196,98,125,24,21,157,96,2,0 ; vbroadcastss 0x2609d(%rip),%ymm10 # 2c254 <_sk_overlay_sse2_8bit+0x5df>
+ DB 196,98,125,24,21,217,95,2,0 ; vbroadcastss 0x25fd9(%rip),%ymm10 # 2c190 <_sk_overlay_sse2_8bit+0x5e0>
DB 196,66,61,184,209 ; vfmadd231ps %ymm9,%ymm8,%ymm10
DB 197,124,17,144,128,0,0,0 ; vmovups %ymm10,0x80(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
@@ -6002,14 +6002,14 @@ _sk_bicubic_n1x_hsw LABEL PROC
PUBLIC _sk_bicubic_p1x_hsw
_sk_bicubic_p1x_hsw LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,98,125,24,5,13,95,2,0 ; vbroadcastss 0x25f0d(%rip),%ymm8 # 2c0e0 <_sk_overlay_sse2_8bit+0x46b>
+ DB 196,98,125,24,5,73,94,2,0 ; vbroadcastss 0x25e49(%rip),%ymm8 # 2c01c <_sk_overlay_sse2_8bit+0x46c>
DB 197,188,88,0 ; vaddps (%rax),%ymm8,%ymm0
DB 197,124,16,72,64 ; vmovups 0x40(%rax),%ymm9
- DB 196,98,125,24,21,103,96,2,0 ; vbroadcastss 0x26067(%rip),%ymm10 # 2c24c <_sk_overlay_sse2_8bit+0x5d7>
- DB 196,98,125,24,29,98,96,2,0 ; vbroadcastss 0x26062(%rip),%ymm11 # 2c250 <_sk_overlay_sse2_8bit+0x5db>
+ DB 196,98,125,24,21,163,95,2,0 ; vbroadcastss 0x25fa3(%rip),%ymm10 # 2c188 <_sk_overlay_sse2_8bit+0x5d8>
+ DB 196,98,125,24,29,158,95,2,0 ; vbroadcastss 0x25f9e(%rip),%ymm11 # 2c18c <_sk_overlay_sse2_8bit+0x5dc>
DB 196,66,53,168,218 ; vfmadd213ps %ymm10,%ymm9,%ymm11
DB 196,66,53,168,216 ; vfmadd213ps %ymm8,%ymm9,%ymm11
- DB 196,98,125,24,5,83,96,2,0 ; vbroadcastss 0x26053(%rip),%ymm8 # 2c254 <_sk_overlay_sse2_8bit+0x5df>
+ DB 196,98,125,24,5,143,95,2,0 ; vbroadcastss 0x25f8f(%rip),%ymm8 # 2c190 <_sk_overlay_sse2_8bit+0x5e0>
DB 196,66,53,184,195 ; vfmadd231ps %ymm11,%ymm9,%ymm8
DB 197,124,17,128,128,0,0,0 ; vmovups %ymm8,0x80(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
@@ -6018,12 +6018,12 @@ _sk_bicubic_p1x_hsw LABEL PROC
PUBLIC _sk_bicubic_p3x_hsw
_sk_bicubic_p3x_hsw LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,5,47,96,2,0 ; vbroadcastss 0x2602f(%rip),%ymm0 # 2c24c <_sk_overlay_sse2_8bit+0x5d7>
+ DB 196,226,125,24,5,107,95,2,0 ; vbroadcastss 0x25f6b(%rip),%ymm0 # 2c188 <_sk_overlay_sse2_8bit+0x5d8>
DB 197,252,88,0 ; vaddps (%rax),%ymm0,%ymm0
DB 197,124,16,64,64 ; vmovups 0x40(%rax),%ymm8
DB 196,65,60,89,200 ; vmulps %ymm8,%ymm8,%ymm9
- DB 196,98,125,24,21,32,95,2,0 ; vbroadcastss 0x25f20(%rip),%ymm10 # 2c154 <_sk_overlay_sse2_8bit+0x4df>
- DB 196,98,125,24,29,11,96,2,0 ; vbroadcastss 0x2600b(%rip),%ymm11 # 2c248 <_sk_overlay_sse2_8bit+0x5d3>
+ DB 196,98,125,24,21,92,94,2,0 ; vbroadcastss 0x25e5c(%rip),%ymm10 # 2c090 <_sk_overlay_sse2_8bit+0x4e0>
+ DB 196,98,125,24,29,71,95,2,0 ; vbroadcastss 0x25f47(%rip),%ymm11 # 2c184 <_sk_overlay_sse2_8bit+0x5d4>
DB 196,66,61,168,218 ; vfmadd213ps %ymm10,%ymm8,%ymm11
DB 196,65,52,89,195 ; vmulps %ymm11,%ymm9,%ymm8
DB 197,124,17,128,128,0,0,0 ; vmovups %ymm8,0x80(%rax)
@@ -6033,13 +6033,13 @@ _sk_bicubic_p3x_hsw LABEL PROC
PUBLIC _sk_bicubic_n3y_hsw
_sk_bicubic_n3y_hsw LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,13,230,95,2,0 ; vbroadcastss 0x25fe6(%rip),%ymm1 # 2c244 <_sk_overlay_sse2_8bit+0x5cf>
+ DB 196,226,125,24,13,34,95,2,0 ; vbroadcastss 0x25f22(%rip),%ymm1 # 2c180 <_sk_overlay_sse2_8bit+0x5d0>
DB 197,244,88,72,32 ; vaddps 0x20(%rax),%ymm1,%ymm1
- DB 196,98,125,24,5,120,94,2,0 ; vbroadcastss 0x25e78(%rip),%ymm8 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,98,125,24,5,180,93,2,0 ; vbroadcastss 0x25db4(%rip),%ymm8 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 197,60,92,64,96 ; vsubps 0x60(%rax),%ymm8,%ymm8
DB 196,65,60,89,200 ; vmulps %ymm8,%ymm8,%ymm9
- DB 196,98,125,24,21,213,94,2,0 ; vbroadcastss 0x25ed5(%rip),%ymm10 # 2c154 <_sk_overlay_sse2_8bit+0x4df>
- DB 196,98,125,24,29,192,95,2,0 ; vbroadcastss 0x25fc0(%rip),%ymm11 # 2c248 <_sk_overlay_sse2_8bit+0x5d3>
+ DB 196,98,125,24,21,17,94,2,0 ; vbroadcastss 0x25e11(%rip),%ymm10 # 2c090 <_sk_overlay_sse2_8bit+0x4e0>
+ DB 196,98,125,24,29,252,94,2,0 ; vbroadcastss 0x25efc(%rip),%ymm11 # 2c184 <_sk_overlay_sse2_8bit+0x5d4>
DB 196,66,61,168,218 ; vfmadd213ps %ymm10,%ymm8,%ymm11
DB 196,65,36,89,193 ; vmulps %ymm9,%ymm11,%ymm8
DB 197,124,17,128,160,0,0,0 ; vmovups %ymm8,0xa0(%rax)
@@ -6049,16 +6049,16 @@ _sk_bicubic_n3y_hsw LABEL PROC
PUBLIC _sk_bicubic_n1y_hsw
_sk_bicubic_n1y_hsw LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,13,151,95,2,0 ; vbroadcastss 0x25f97(%rip),%ymm1 # 2c240 <_sk_overlay_sse2_8bit+0x5cb>
+ DB 196,226,125,24,13,211,94,2,0 ; vbroadcastss 0x25ed3(%rip),%ymm1 # 2c17c <_sk_overlay_sse2_8bit+0x5cc>
DB 197,244,88,72,32 ; vaddps 0x20(%rax),%ymm1,%ymm1
- DB 196,98,125,24,5,45,94,2,0 ; vbroadcastss 0x25e2d(%rip),%ymm8 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,98,125,24,5,105,93,2,0 ; vbroadcastss 0x25d69(%rip),%ymm8 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 197,60,92,64,96 ; vsubps 0x60(%rax),%ymm8,%ymm8
- DB 196,98,125,24,13,135,95,2,0 ; vbroadcastss 0x25f87(%rip),%ymm9 # 2c24c <_sk_overlay_sse2_8bit+0x5d7>
- DB 196,98,125,24,21,130,95,2,0 ; vbroadcastss 0x25f82(%rip),%ymm10 # 2c250 <_sk_overlay_sse2_8bit+0x5db>
+ DB 196,98,125,24,13,195,94,2,0 ; vbroadcastss 0x25ec3(%rip),%ymm9 # 2c188 <_sk_overlay_sse2_8bit+0x5d8>
+ DB 196,98,125,24,21,190,94,2,0 ; vbroadcastss 0x25ebe(%rip),%ymm10 # 2c18c <_sk_overlay_sse2_8bit+0x5dc>
DB 196,66,61,168,209 ; vfmadd213ps %ymm9,%ymm8,%ymm10
- DB 196,98,125,24,13,4,94,2,0 ; vbroadcastss 0x25e04(%rip),%ymm9 # 2c0e0 <_sk_overlay_sse2_8bit+0x46b>
+ DB 196,98,125,24,13,64,93,2,0 ; vbroadcastss 0x25d40(%rip),%ymm9 # 2c01c <_sk_overlay_sse2_8bit+0x46c>
DB 196,66,61,184,202 ; vfmadd231ps %ymm10,%ymm8,%ymm9
- DB 196,98,125,24,21,106,95,2,0 ; vbroadcastss 0x25f6a(%rip),%ymm10 # 2c254 <_sk_overlay_sse2_8bit+0x5df>
+ DB 196,98,125,24,21,166,94,2,0 ; vbroadcastss 0x25ea6(%rip),%ymm10 # 2c190 <_sk_overlay_sse2_8bit+0x5e0>
DB 196,66,61,184,209 ; vfmadd231ps %ymm9,%ymm8,%ymm10
DB 197,124,17,144,160,0,0,0 ; vmovups %ymm10,0xa0(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
@@ -6067,14 +6067,14 @@ _sk_bicubic_n1y_hsw LABEL PROC
PUBLIC _sk_bicubic_p1y_hsw
_sk_bicubic_p1y_hsw LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,98,125,24,5,218,93,2,0 ; vbroadcastss 0x25dda(%rip),%ymm8 # 2c0e0 <_sk_overlay_sse2_8bit+0x46b>
+ DB 196,98,125,24,5,22,93,2,0 ; vbroadcastss 0x25d16(%rip),%ymm8 # 2c01c <_sk_overlay_sse2_8bit+0x46c>
DB 197,188,88,72,32 ; vaddps 0x20(%rax),%ymm8,%ymm1
DB 197,124,16,72,96 ; vmovups 0x60(%rax),%ymm9
- DB 196,98,125,24,21,51,95,2,0 ; vbroadcastss 0x25f33(%rip),%ymm10 # 2c24c <_sk_overlay_sse2_8bit+0x5d7>
- DB 196,98,125,24,29,46,95,2,0 ; vbroadcastss 0x25f2e(%rip),%ymm11 # 2c250 <_sk_overlay_sse2_8bit+0x5db>
+ DB 196,98,125,24,21,111,94,2,0 ; vbroadcastss 0x25e6f(%rip),%ymm10 # 2c188 <_sk_overlay_sse2_8bit+0x5d8>
+ DB 196,98,125,24,29,106,94,2,0 ; vbroadcastss 0x25e6a(%rip),%ymm11 # 2c18c <_sk_overlay_sse2_8bit+0x5dc>
DB 196,66,53,168,218 ; vfmadd213ps %ymm10,%ymm9,%ymm11
DB 196,66,53,168,216 ; vfmadd213ps %ymm8,%ymm9,%ymm11
- DB 196,98,125,24,5,31,95,2,0 ; vbroadcastss 0x25f1f(%rip),%ymm8 # 2c254 <_sk_overlay_sse2_8bit+0x5df>
+ DB 196,98,125,24,5,91,94,2,0 ; vbroadcastss 0x25e5b(%rip),%ymm8 # 2c190 <_sk_overlay_sse2_8bit+0x5e0>
DB 196,66,53,184,195 ; vfmadd231ps %ymm11,%ymm9,%ymm8
DB 197,124,17,128,160,0,0,0 ; vmovups %ymm8,0xa0(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
@@ -6083,12 +6083,12 @@ _sk_bicubic_p1y_hsw LABEL PROC
PUBLIC _sk_bicubic_p3y_hsw
_sk_bicubic_p3y_hsw LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,13,251,94,2,0 ; vbroadcastss 0x25efb(%rip),%ymm1 # 2c24c <_sk_overlay_sse2_8bit+0x5d7>
+ DB 196,226,125,24,13,55,94,2,0 ; vbroadcastss 0x25e37(%rip),%ymm1 # 2c188 <_sk_overlay_sse2_8bit+0x5d8>
DB 197,244,88,72,32 ; vaddps 0x20(%rax),%ymm1,%ymm1
DB 197,124,16,64,96 ; vmovups 0x60(%rax),%ymm8
DB 196,65,60,89,200 ; vmulps %ymm8,%ymm8,%ymm9
- DB 196,98,125,24,21,235,93,2,0 ; vbroadcastss 0x25deb(%rip),%ymm10 # 2c154 <_sk_overlay_sse2_8bit+0x4df>
- DB 196,98,125,24,29,214,94,2,0 ; vbroadcastss 0x25ed6(%rip),%ymm11 # 2c248 <_sk_overlay_sse2_8bit+0x5d3>
+ DB 196,98,125,24,21,39,93,2,0 ; vbroadcastss 0x25d27(%rip),%ymm10 # 2c090 <_sk_overlay_sse2_8bit+0x4e0>
+ DB 196,98,125,24,29,18,94,2,0 ; vbroadcastss 0x25e12(%rip),%ymm11 # 2c184 <_sk_overlay_sse2_8bit+0x5d4>
DB 196,66,61,168,218 ; vfmadd213ps %ymm10,%ymm8,%ymm11
DB 196,65,52,89,195 ; vmulps %ymm11,%ymm9,%ymm8
DB 197,124,17,128,160,0,0,0 ; vmovups %ymm8,0xa0(%rax)
@@ -6214,19 +6214,19 @@ _sk_clut_3D_hsw LABEL PROC
DB 197,254,127,76,36,32 ; vmovdqu %ymm1,0x20(%rsp)
DB 72,139,0 ; mov (%rax),%rax
DB 196,193,117,254,204 ; vpaddd %ymm12,%ymm1,%ymm1
- DB 196,226,125,88,61,180,92,2,0 ; vpbroadcastd 0x25cb4(%rip),%ymm7 # 2c25c <_sk_overlay_sse2_8bit+0x5e7>
+ DB 196,226,125,88,61,240,91,2,0 ; vpbroadcastd 0x25bf0(%rip),%ymm7 # 2c198 <_sk_overlay_sse2_8bit+0x5e8>
DB 196,226,117,64,207 ; vpmulld %ymm7,%ymm1,%ymm1
DB 197,205,118,246 ; vpcmpeqd %ymm6,%ymm6,%ymm6
DB 196,98,77,146,4,136 ; vgatherdps %ymm6,(%rax,%ymm1,4),%ymm8
- DB 196,98,125,88,21,40,91,2,0 ; vpbroadcastd 0x25b28(%rip),%ymm10 # 2c0e8 <_sk_overlay_sse2_8bit+0x473>
+ DB 196,98,125,88,21,100,90,2,0 ; vpbroadcastd 0x25a64(%rip),%ymm10 # 2c024 <_sk_overlay_sse2_8bit+0x474>
DB 196,193,117,254,242 ; vpaddd %ymm10,%ymm1,%ymm6
DB 196,65,37,118,219 ; vpcmpeqd %ymm11,%ymm11,%ymm11
DB 196,226,37,146,28,176 ; vgatherdps %ymm11,(%rax,%ymm6,4),%ymm3
- DB 196,98,125,88,29,23,91,2,0 ; vpbroadcastd 0x25b17(%rip),%ymm11 # 2c0f0 <_sk_overlay_sse2_8bit+0x47b>
+ DB 196,98,125,88,29,83,90,2,0 ; vpbroadcastd 0x25a53(%rip),%ymm11 # 2c02c <_sk_overlay_sse2_8bit+0x47c>
DB 196,193,117,254,203 ; vpaddd %ymm11,%ymm1,%ymm1
DB 197,205,118,246 ; vpcmpeqd %ymm6,%ymm6,%ymm6
DB 196,226,77,146,36,136 ; vgatherdps %ymm6,(%rax,%ymm1,4),%ymm4
- DB 196,98,125,24,45,103,92,2,0 ; vbroadcastss 0x25c67(%rip),%ymm13 # 2c258 <_sk_overlay_sse2_8bit+0x5e3>
+ DB 196,98,125,24,45,163,91,2,0 ; vbroadcastss 0x25ba3(%rip),%ymm13 # 2c194 <_sk_overlay_sse2_8bit+0x5e4>
DB 196,193,124,88,245 ; vaddps %ymm13,%ymm0,%ymm6
DB 197,254,91,246 ; vcvttps2dq %ymm6,%ymm6
DB 196,226,77,64,205 ; vpmulld %ymm5,%ymm6,%ymm1
@@ -6444,19 +6444,19 @@ _sk_clut_4D_hsw LABEL PROC
DB 197,126,91,245 ; vcvttps2dq %ymm5,%ymm14
DB 196,98,13,64,233 ; vpmulld %ymm1,%ymm14,%ymm13
DB 197,149,254,198 ; vpaddd %ymm6,%ymm13,%ymm0
- DB 196,98,125,88,21,224,87,2,0 ; vpbroadcastd 0x257e0(%rip),%ymm10 # 2c25c <_sk_overlay_sse2_8bit+0x5e7>
+ DB 196,98,125,88,21,28,87,2,0 ; vpbroadcastd 0x2571c(%rip),%ymm10 # 2c198 <_sk_overlay_sse2_8bit+0x5e8>
DB 196,194,125,64,194 ; vpmulld %ymm10,%ymm0,%ymm0
DB 196,65,61,118,192 ; vpcmpeqd %ymm8,%ymm8,%ymm8
DB 196,98,61,146,60,128 ; vgatherdps %ymm8,(%rax,%ymm0,4),%ymm15
- DB 196,98,125,88,29,83,86,2,0 ; vpbroadcastd 0x25653(%rip),%ymm11 # 2c0e8 <_sk_overlay_sse2_8bit+0x473>
+ DB 196,98,125,88,29,143,85,2,0 ; vpbroadcastd 0x2558f(%rip),%ymm11 # 2c024 <_sk_overlay_sse2_8bit+0x474>
DB 196,65,125,254,195 ; vpaddd %ymm11,%ymm0,%ymm8
DB 196,65,53,118,201 ; vpcmpeqd %ymm9,%ymm9,%ymm9
DB 196,162,53,146,20,128 ; vgatherdps %ymm9,(%rax,%ymm8,4),%ymm2
- DB 196,98,125,88,37,66,86,2,0 ; vpbroadcastd 0x25642(%rip),%ymm12 # 2c0f0 <_sk_overlay_sse2_8bit+0x47b>
+ DB 196,98,125,88,37,126,85,2,0 ; vpbroadcastd 0x2557e(%rip),%ymm12 # 2c02c <_sk_overlay_sse2_8bit+0x47c>
DB 196,193,125,254,196 ; vpaddd %ymm12,%ymm0,%ymm0
DB 196,65,61,118,192 ; vpcmpeqd %ymm8,%ymm8,%ymm8
DB 196,226,61,146,60,128 ; vgatherdps %ymm8,(%rax,%ymm0,4),%ymm7
- DB 196,98,125,24,13,145,87,2,0 ; vbroadcastss 0x25791(%rip),%ymm9 # 2c258 <_sk_overlay_sse2_8bit+0x5e3>
+ DB 196,98,125,24,13,205,86,2,0 ; vbroadcastss 0x256cd(%rip),%ymm9 # 2c194 <_sk_overlay_sse2_8bit+0x5e4>
DB 196,65,84,88,193 ; vaddps %ymm9,%ymm5,%ymm8
DB 196,65,126,91,192 ; vcvttps2dq %ymm8,%ymm8
DB 196,226,61,64,193 ; vpmulld %ymm1,%ymm8,%ymm0
@@ -6781,7 +6781,7 @@ _sk_clut_4D_hsw LABEL PROC
DB 197,196,92,214 ; vsubps %ymm6,%ymm7,%ymm2
DB 196,226,61,168,214 ; vfmadd213ps %ymm6,%ymm8,%ymm2
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,29,32,79,2,0 ; vbroadcastss 0x24f20(%rip),%ymm3 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,226,125,24,29,92,78,2,0 ; vbroadcastss 0x24e5c(%rip),%ymm3 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 197,252,16,164,36,160,3,0,0 ; vmovups 0x3a0(%rsp),%ymm4
DB 197,252,16,172,36,192,3,0,0 ; vmovups 0x3c0(%rsp),%ymm5
DB 197,252,16,180,36,224,3,0,0 ; vmovups 0x3e0(%rsp),%ymm6
@@ -6882,16 +6882,16 @@ _sk_seed_shader_avx LABEL PROC
DB 197,249,112,192,0 ; vpshufd $0x0,%xmm0,%xmm0
DB 196,227,125,24,192,1 ; vinsertf128 $0x1,%xmm0,%ymm0,%ymm0
DB 197,252,91,192 ; vcvtdq2ps %ymm0,%ymm0
- DB 196,226,125,24,13,144,77,2,0 ; vbroadcastss 0x24d90(%rip),%ymm1 # 2c0e0 <_sk_overlay_sse2_8bit+0x46b>
+ DB 196,226,125,24,13,204,76,2,0 ; vbroadcastss 0x24ccc(%rip),%ymm1 # 2c01c <_sk_overlay_sse2_8bit+0x46c>
DB 197,252,88,193 ; vaddps %ymm1,%ymm0,%ymm0
- DB 197,252,88,5,100,82,2,0 ; vaddps 0x25264(%rip),%ymm0,%ymm0 # 2c5c0 <_sk_overlay_sse2_8bit+0x94b>
+ DB 197,252,88,5,164,81,2,0 ; vaddps 0x251a4(%rip),%ymm0,%ymm0 # 2c500 <_sk_overlay_sse2_8bit+0x950>
DB 197,249,110,209 ; vmovd %ecx,%xmm2
DB 197,249,112,210,0 ; vpshufd $0x0,%xmm2,%xmm2
DB 196,227,109,24,210,1 ; vinsertf128 $0x1,%xmm2,%ymm2,%ymm2
DB 197,252,91,210 ; vcvtdq2ps %ymm2,%ymm2
DB 197,236,88,201 ; vaddps %ymm1,%ymm2,%ymm1
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,21,102,77,2,0 ; vbroadcastss 0x24d66(%rip),%ymm2 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,226,125,24,21,162,76,2,0 ; vbroadcastss 0x24ca2(%rip),%ymm2 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 197,228,87,219 ; vxorps %ymm3,%ymm3,%ymm3
DB 197,220,87,228 ; vxorps %ymm4,%ymm4,%ymm4
DB 197,212,87,237 ; vxorps %ymm5,%ymm5,%ymm5
@@ -6904,14 +6904,14 @@ _sk_dither_avx LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 197,121,110,194 ; vmovd %edx,%xmm8
DB 196,65,121,112,192,0 ; vpshufd $0x0,%xmm8,%xmm8
- DB 197,57,254,13,88,87,2,0 ; vpaddd 0x25758(%rip),%xmm8,%xmm9 # 2cb00 <_sk_overlay_sse2_8bit+0xe8b>
- DB 197,57,254,5,96,87,2,0 ; vpaddd 0x25760(%rip),%xmm8,%xmm8 # 2cb10 <_sk_overlay_sse2_8bit+0xe9b>
+ DB 197,57,254,13,152,86,2,0 ; vpaddd 0x25698(%rip),%xmm8,%xmm9 # 2ca40 <_sk_overlay_sse2_8bit+0xe90>
+ DB 197,57,254,5,160,86,2,0 ; vpaddd 0x256a0(%rip),%xmm8,%xmm8 # 2ca50 <_sk_overlay_sse2_8bit+0xea0>
DB 196,67,53,24,192,1 ; vinsertf128 $0x1,%xmm8,%ymm9,%ymm8
DB 197,121,110,201 ; vmovd %ecx,%xmm9
DB 196,65,121,112,201,0 ; vpshufd $0x0,%xmm9,%xmm9
DB 196,67,53,24,201,1 ; vinsertf128 $0x1,%xmm9,%ymm9,%ymm9
DB 196,65,52,87,208 ; vxorps %ymm8,%ymm9,%ymm10
- DB 196,98,125,24,29,20,77,2,0 ; vbroadcastss 0x24d14(%rip),%ymm11 # 2c0e8 <_sk_overlay_sse2_8bit+0x473>
+ DB 196,98,125,24,29,80,76,2,0 ; vbroadcastss 0x24c50(%rip),%ymm11 # 2c024 <_sk_overlay_sse2_8bit+0x474>
DB 196,65,44,84,203 ; vandps %ymm11,%ymm10,%ymm9
DB 196,193,25,114,241,5 ; vpslld $0x5,%xmm9,%xmm12
DB 196,67,125,25,201,1 ; vextractf128 $0x1,%ymm9,%xmm9
@@ -6922,8 +6922,8 @@ _sk_dither_avx LABEL PROC
DB 196,67,125,25,219,1 ; vextractf128 $0x1,%ymm11,%xmm11
DB 196,193,33,114,243,4 ; vpslld $0x4,%xmm11,%xmm11
DB 196,67,29,24,219,1 ; vinsertf128 $0x1,%xmm11,%ymm12,%ymm11
- DB 196,98,125,24,37,213,76,2,0 ; vbroadcastss 0x24cd5(%rip),%ymm12 # 2c0ec <_sk_overlay_sse2_8bit+0x477>
- DB 196,98,125,24,45,208,76,2,0 ; vbroadcastss 0x24cd0(%rip),%ymm13 # 2c0f0 <_sk_overlay_sse2_8bit+0x47b>
+ DB 196,98,125,24,37,17,76,2,0 ; vbroadcastss 0x24c11(%rip),%ymm12 # 2c028 <_sk_overlay_sse2_8bit+0x478>
+ DB 196,98,125,24,45,12,76,2,0 ; vbroadcastss 0x24c0c(%rip),%ymm13 # 2c02c <_sk_overlay_sse2_8bit+0x47c>
DB 196,65,44,84,245 ; vandps %ymm13,%ymm10,%ymm14
DB 196,193,1,114,246,2 ; vpslld $0x2,%xmm14,%xmm15
DB 196,67,125,25,246,1 ; vextractf128 $0x1,%ymm14,%xmm14
@@ -6950,9 +6950,9 @@ _sk_dither_avx LABEL PROC
DB 196,65,60,86,193 ; vorps %ymm9,%ymm8,%ymm8
DB 196,65,60,86,194 ; vorps %ymm10,%ymm8,%ymm8
DB 196,65,124,91,192 ; vcvtdq2ps %ymm8,%ymm8
- DB 196,98,125,24,13,59,76,2,0 ; vbroadcastss 0x24c3b(%rip),%ymm9 # 2c0f4 <_sk_overlay_sse2_8bit+0x47f>
+ DB 196,98,125,24,13,119,75,2,0 ; vbroadcastss 0x24b77(%rip),%ymm9 # 2c030 <_sk_overlay_sse2_8bit+0x480>
DB 196,65,60,89,193 ; vmulps %ymm9,%ymm8,%ymm8
- DB 196,98,125,24,13,49,76,2,0 ; vbroadcastss 0x24c31(%rip),%ymm9 # 2c0f8 <_sk_overlay_sse2_8bit+0x483>
+ DB 196,98,125,24,13,109,75,2,0 ; vbroadcastss 0x24b6d(%rip),%ymm9 # 2c034 <_sk_overlay_sse2_8bit+0x484>
DB 196,65,60,88,193 ; vaddps %ymm9,%ymm8,%ymm8
DB 196,98,125,24,8 ; vbroadcastss (%rax),%ymm9
DB 196,65,60,89,193 ; vmulps %ymm9,%ymm8,%ymm8
@@ -6982,7 +6982,7 @@ _sk_uniform_color_avx LABEL PROC
PUBLIC _sk_black_color_avx
_sk_black_color_avx LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,29,185,75,2,0 ; vbroadcastss 0x24bb9(%rip),%ymm3 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,226,125,24,29,245,74,2,0 ; vbroadcastss 0x24af5(%rip),%ymm3 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 197,252,87,192 ; vxorps %ymm0,%ymm0,%ymm0
DB 197,244,87,201 ; vxorps %ymm1,%ymm1,%ymm1
DB 197,236,87,210 ; vxorps %ymm2,%ymm2,%ymm2
@@ -6991,7 +6991,7 @@ _sk_black_color_avx LABEL PROC
PUBLIC _sk_white_color_avx
_sk_white_color_avx LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,5,160,75,2,0 ; vbroadcastss 0x24ba0(%rip),%ymm0 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,226,125,24,5,220,74,2,0 ; vbroadcastss 0x24adc(%rip),%ymm0 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 197,252,40,200 ; vmovaps %ymm0,%ymm1
DB 197,252,40,208 ; vmovaps %ymm0,%ymm2
DB 197,252,40,216 ; vmovaps %ymm0,%ymm3
@@ -7029,7 +7029,7 @@ _sk_clear_avx LABEL PROC
PUBLIC _sk_srcatop_avx
_sk_srcatop_avx LABEL PROC
DB 197,252,89,199 ; vmulps %ymm7,%ymm0,%ymm0
- DB 196,98,125,24,5,63,75,2,0 ; vbroadcastss 0x24b3f(%rip),%ymm8 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,98,125,24,5,123,74,2,0 ; vbroadcastss 0x24a7b(%rip),%ymm8 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 197,60,92,195 ; vsubps %ymm3,%ymm8,%ymm8
DB 197,60,89,204 ; vmulps %ymm4,%ymm8,%ymm9
DB 197,180,88,192 ; vaddps %ymm0,%ymm9,%ymm0
@@ -7048,7 +7048,7 @@ _sk_srcatop_avx LABEL PROC
PUBLIC _sk_dstatop_avx
_sk_dstatop_avx LABEL PROC
DB 197,100,89,196 ; vmulps %ymm4,%ymm3,%ymm8
- DB 196,98,125,24,13,253,74,2,0 ; vbroadcastss 0x24afd(%rip),%ymm9 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,98,125,24,13,57,74,2,0 ; vbroadcastss 0x24a39(%rip),%ymm9 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 197,52,92,207 ; vsubps %ymm7,%ymm9,%ymm9
DB 197,180,89,192 ; vmulps %ymm0,%ymm9,%ymm0
DB 197,188,88,192 ; vaddps %ymm0,%ymm8,%ymm0
@@ -7084,7 +7084,7 @@ _sk_dstin_avx LABEL PROC
PUBLIC _sk_srcout_avx
_sk_srcout_avx LABEL PROC
- DB 196,98,125,24,5,152,74,2,0 ; vbroadcastss 0x24a98(%rip),%ymm8 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,98,125,24,5,212,73,2,0 ; vbroadcastss 0x249d4(%rip),%ymm8 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 197,60,92,199 ; vsubps %ymm7,%ymm8,%ymm8
DB 197,188,89,192 ; vmulps %ymm0,%ymm8,%ymm0
DB 197,188,89,201 ; vmulps %ymm1,%ymm8,%ymm1
@@ -7095,7 +7095,7 @@ _sk_srcout_avx LABEL PROC
PUBLIC _sk_dstout_avx
_sk_dstout_avx LABEL PROC
- DB 196,226,125,24,5,119,74,2,0 ; vbroadcastss 0x24a77(%rip),%ymm0 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,226,125,24,5,179,73,2,0 ; vbroadcastss 0x249b3(%rip),%ymm0 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 197,252,92,219 ; vsubps %ymm3,%ymm0,%ymm3
DB 197,228,89,196 ; vmulps %ymm4,%ymm3,%ymm0
DB 197,228,89,205 ; vmulps %ymm5,%ymm3,%ymm1
@@ -7106,7 +7106,7 @@ _sk_dstout_avx LABEL PROC
PUBLIC _sk_srcover_avx
_sk_srcover_avx LABEL PROC
- DB 196,98,125,24,5,86,74,2,0 ; vbroadcastss 0x24a56(%rip),%ymm8 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,98,125,24,5,146,73,2,0 ; vbroadcastss 0x24992(%rip),%ymm8 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 197,60,92,195 ; vsubps %ymm3,%ymm8,%ymm8
DB 197,60,89,204 ; vmulps %ymm4,%ymm8,%ymm9
DB 197,180,88,192 ; vaddps %ymm0,%ymm9,%ymm0
@@ -7121,7 +7121,7 @@ _sk_srcover_avx LABEL PROC
PUBLIC _sk_dstover_avx
_sk_dstover_avx LABEL PROC
- DB 196,98,125,24,5,37,74,2,0 ; vbroadcastss 0x24a25(%rip),%ymm8 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,98,125,24,5,97,73,2,0 ; vbroadcastss 0x24961(%rip),%ymm8 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 197,60,92,199 ; vsubps %ymm7,%ymm8,%ymm8
DB 197,188,89,192 ; vmulps %ymm0,%ymm8,%ymm0
DB 197,252,88,196 ; vaddps %ymm4,%ymm0,%ymm0
@@ -7145,7 +7145,7 @@ _sk_modulate_avx LABEL PROC
PUBLIC _sk_multiply_avx
_sk_multiply_avx LABEL PROC
- DB 196,98,125,24,5,224,73,2,0 ; vbroadcastss 0x249e0(%rip),%ymm8 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,98,125,24,5,28,73,2,0 ; vbroadcastss 0x2491c(%rip),%ymm8 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 197,60,92,207 ; vsubps %ymm7,%ymm8,%ymm9
DB 197,52,89,208 ; vmulps %ymm0,%ymm9,%ymm10
DB 197,60,92,195 ; vsubps %ymm3,%ymm8,%ymm8
@@ -7174,7 +7174,7 @@ _sk_multiply_avx LABEL PROC
PUBLIC _sk_plus__avx
_sk_plus__avx LABEL PROC
DB 197,252,88,196 ; vaddps %ymm4,%ymm0,%ymm0
- DB 196,98,125,24,5,111,73,2,0 ; vbroadcastss 0x2496f(%rip),%ymm8 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,98,125,24,5,171,72,2,0 ; vbroadcastss 0x248ab(%rip),%ymm8 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 196,193,124,93,192 ; vminps %ymm8,%ymm0,%ymm0
DB 197,244,88,205 ; vaddps %ymm5,%ymm1,%ymm1
DB 196,193,116,93,200 ; vminps %ymm8,%ymm1,%ymm1
@@ -7204,7 +7204,7 @@ _sk_screen_avx LABEL PROC
PUBLIC _sk_xor__avx
_sk_xor__avx LABEL PROC
- DB 196,98,125,24,5,14,73,2,0 ; vbroadcastss 0x2490e(%rip),%ymm8 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,98,125,24,5,74,72,2,0 ; vbroadcastss 0x2484a(%rip),%ymm8 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 197,60,92,207 ; vsubps %ymm7,%ymm8,%ymm9
DB 197,180,89,192 ; vmulps %ymm0,%ymm9,%ymm0
DB 197,60,92,195 ; vsubps %ymm3,%ymm8,%ymm8
@@ -7239,7 +7239,7 @@ _sk_darken_avx LABEL PROC
DB 197,100,89,206 ; vmulps %ymm6,%ymm3,%ymm9
DB 196,193,108,95,209 ; vmaxps %ymm9,%ymm2,%ymm2
DB 197,188,92,210 ; vsubps %ymm2,%ymm8,%ymm2
- DB 196,98,125,24,5,138,72,2,0 ; vbroadcastss 0x2488a(%rip),%ymm8 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,98,125,24,5,198,71,2,0 ; vbroadcastss 0x247c6(%rip),%ymm8 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 197,60,92,195 ; vsubps %ymm3,%ymm8,%ymm8
DB 197,60,89,199 ; vmulps %ymm7,%ymm8,%ymm8
DB 197,188,88,219 ; vaddps %ymm3,%ymm8,%ymm3
@@ -7263,7 +7263,7 @@ _sk_lighten_avx LABEL PROC
DB 197,100,89,206 ; vmulps %ymm6,%ymm3,%ymm9
DB 196,193,108,93,209 ; vminps %ymm9,%ymm2,%ymm2
DB 197,188,92,210 ; vsubps %ymm2,%ymm8,%ymm2
- DB 196,98,125,24,5,50,72,2,0 ; vbroadcastss 0x24832(%rip),%ymm8 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,98,125,24,5,110,71,2,0 ; vbroadcastss 0x2476e(%rip),%ymm8 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 197,60,92,195 ; vsubps %ymm3,%ymm8,%ymm8
DB 197,60,89,199 ; vmulps %ymm7,%ymm8,%ymm8
DB 197,188,88,219 ; vaddps %ymm3,%ymm8,%ymm3
@@ -7290,7 +7290,7 @@ _sk_difference_avx LABEL PROC
DB 196,193,108,93,209 ; vminps %ymm9,%ymm2,%ymm2
DB 197,236,88,210 ; vaddps %ymm2,%ymm2,%ymm2
DB 197,188,92,210 ; vsubps %ymm2,%ymm8,%ymm2
- DB 196,98,125,24,5,206,71,2,0 ; vbroadcastss 0x247ce(%rip),%ymm8 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,98,125,24,5,10,71,2,0 ; vbroadcastss 0x2470a(%rip),%ymm8 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 197,60,92,195 ; vsubps %ymm3,%ymm8,%ymm8
DB 197,60,89,199 ; vmulps %ymm7,%ymm8,%ymm8
DB 197,188,88,219 ; vaddps %ymm3,%ymm8,%ymm3
@@ -7311,7 +7311,7 @@ _sk_exclusion_avx LABEL PROC
DB 197,236,89,214 ; vmulps %ymm6,%ymm2,%ymm2
DB 197,236,88,210 ; vaddps %ymm2,%ymm2,%ymm2
DB 197,188,92,210 ; vsubps %ymm2,%ymm8,%ymm2
- DB 196,98,125,24,5,133,71,2,0 ; vbroadcastss 0x24785(%rip),%ymm8 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,98,125,24,5,193,70,2,0 ; vbroadcastss 0x246c1(%rip),%ymm8 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 197,60,92,195 ; vsubps %ymm3,%ymm8,%ymm8
DB 197,60,89,199 ; vmulps %ymm7,%ymm8,%ymm8
DB 197,188,88,219 ; vaddps %ymm3,%ymm8,%ymm3
@@ -7320,7 +7320,7 @@ _sk_exclusion_avx LABEL PROC
PUBLIC _sk_colorburn_avx
_sk_colorburn_avx LABEL PROC
- DB 196,98,125,24,5,108,71,2,0 ; vbroadcastss 0x2476c(%rip),%ymm8 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,98,125,24,5,168,70,2,0 ; vbroadcastss 0x246a8(%rip),%ymm8 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 197,60,92,207 ; vsubps %ymm7,%ymm8,%ymm9
DB 197,52,89,216 ; vmulps %ymm0,%ymm9,%ymm11
DB 196,65,44,87,210 ; vxorps %ymm10,%ymm10,%ymm10
@@ -7380,7 +7380,7 @@ _sk_colorburn_avx LABEL PROC
PUBLIC _sk_colordodge_avx
_sk_colordodge_avx LABEL PROC
DB 196,65,60,87,192 ; vxorps %ymm8,%ymm8,%ymm8
- DB 196,98,125,24,13,112,70,2,0 ; vbroadcastss 0x24670(%rip),%ymm9 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,98,125,24,13,172,69,2,0 ; vbroadcastss 0x245ac(%rip),%ymm9 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 197,52,92,215 ; vsubps %ymm7,%ymm9,%ymm10
DB 197,44,89,216 ; vmulps %ymm0,%ymm10,%ymm11
DB 197,52,92,203 ; vsubps %ymm3,%ymm9,%ymm9
@@ -7435,7 +7435,7 @@ _sk_colordodge_avx LABEL PROC
PUBLIC _sk_hardlight_avx
_sk_hardlight_avx LABEL PROC
- DB 196,98,125,24,5,123,69,2,0 ; vbroadcastss 0x2457b(%rip),%ymm8 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,98,125,24,5,183,68,2,0 ; vbroadcastss 0x244b7(%rip),%ymm8 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 197,60,92,215 ; vsubps %ymm7,%ymm8,%ymm10
DB 197,44,89,200 ; vmulps %ymm0,%ymm10,%ymm9
DB 197,60,92,195 ; vsubps %ymm3,%ymm8,%ymm8
@@ -7488,7 +7488,7 @@ _sk_hardlight_avx LABEL PROC
PUBLIC _sk_overlay_avx
_sk_overlay_avx LABEL PROC
- DB 196,98,125,24,5,160,68,2,0 ; vbroadcastss 0x244a0(%rip),%ymm8 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,98,125,24,5,220,67,2,0 ; vbroadcastss 0x243dc(%rip),%ymm8 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 197,60,92,215 ; vsubps %ymm7,%ymm8,%ymm10
DB 197,44,89,200 ; vmulps %ymm0,%ymm10,%ymm9
DB 197,60,92,195 ; vsubps %ymm3,%ymm8,%ymm8
@@ -7553,10 +7553,10 @@ _sk_softlight_avx LABEL PROC
DB 196,65,60,88,192 ; vaddps %ymm8,%ymm8,%ymm8
DB 196,65,60,89,216 ; vmulps %ymm8,%ymm8,%ymm11
DB 196,65,60,88,195 ; vaddps %ymm11,%ymm8,%ymm8
- DB 196,98,125,24,29,163,67,2,0 ; vbroadcastss 0x243a3(%rip),%ymm11 # 2c0fc <_sk_overlay_sse2_8bit+0x487>
+ DB 196,98,125,24,29,223,66,2,0 ; vbroadcastss 0x242df(%rip),%ymm11 # 2c038 <_sk_overlay_sse2_8bit+0x488>
DB 196,65,28,88,235 ; vaddps %ymm11,%ymm12,%ymm13
DB 196,65,20,89,192 ; vmulps %ymm8,%ymm13,%ymm8
- DB 196,98,125,24,45,148,67,2,0 ; vbroadcastss 0x24394(%rip),%ymm13 # 2c100 <_sk_overlay_sse2_8bit+0x48b>
+ DB 196,98,125,24,45,208,66,2,0 ; vbroadcastss 0x242d0(%rip),%ymm13 # 2c03c <_sk_overlay_sse2_8bit+0x48c>
DB 196,65,28,89,245 ; vmulps %ymm13,%ymm12,%ymm14
DB 196,65,12,88,192 ; vaddps %ymm8,%ymm14,%ymm8
DB 196,65,124,82,244 ; vrsqrtps %ymm12,%ymm14
@@ -7567,7 +7567,7 @@ _sk_softlight_avx LABEL PROC
DB 197,4,194,255,2 ; vcmpleps %ymm7,%ymm15,%ymm15
DB 196,67,13,74,240,240 ; vblendvps %ymm15,%ymm8,%ymm14,%ymm14
DB 197,116,88,249 ; vaddps %ymm1,%ymm1,%ymm15
- DB 196,98,125,24,5,62,67,2,0 ; vbroadcastss 0x2433e(%rip),%ymm8 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,98,125,24,5,122,66,2,0 ; vbroadcastss 0x2427a(%rip),%ymm8 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 196,65,60,92,228 ; vsubps %ymm12,%ymm8,%ymm12
DB 197,132,92,195 ; vsubps %ymm3,%ymm15,%ymm0
DB 196,65,124,89,228 ; vmulps %ymm12,%ymm0,%ymm12
@@ -7694,12 +7694,12 @@ _sk_hue_avx LABEL PROC
DB 196,65,28,89,219 ; vmulps %ymm11,%ymm12,%ymm11
DB 196,65,36,94,222 ; vdivps %ymm14,%ymm11,%ymm11
DB 196,67,37,74,224,240 ; vblendvps %ymm15,%ymm8,%ymm11,%ymm12
- DB 196,98,125,24,53,28,65,2,0 ; vbroadcastss 0x2411c(%rip),%ymm14 # 2c104 <_sk_overlay_sse2_8bit+0x48f>
+ DB 196,98,125,24,53,88,64,2,0 ; vbroadcastss 0x24058(%rip),%ymm14 # 2c040 <_sk_overlay_sse2_8bit+0x490>
DB 196,65,92,89,222 ; vmulps %ymm14,%ymm4,%ymm11
- DB 196,98,125,24,61,18,65,2,0 ; vbroadcastss 0x24112(%rip),%ymm15 # 2c108 <_sk_overlay_sse2_8bit+0x493>
+ DB 196,98,125,24,61,78,64,2,0 ; vbroadcastss 0x2404e(%rip),%ymm15 # 2c044 <_sk_overlay_sse2_8bit+0x494>
DB 196,65,84,89,239 ; vmulps %ymm15,%ymm5,%ymm13
DB 196,65,36,88,221 ; vaddps %ymm13,%ymm11,%ymm11
- DB 196,226,125,24,5,3,65,2,0 ; vbroadcastss 0x24103(%rip),%ymm0 # 2c10c <_sk_overlay_sse2_8bit+0x497>
+ DB 196,226,125,24,5,63,64,2,0 ; vbroadcastss 0x2403f(%rip),%ymm0 # 2c048 <_sk_overlay_sse2_8bit+0x498>
DB 197,76,89,232 ; vmulps %ymm0,%ymm6,%ymm13
DB 196,65,36,88,221 ; vaddps %ymm13,%ymm11,%ymm11
DB 196,65,52,89,238 ; vmulps %ymm14,%ymm9,%ymm13
@@ -7760,7 +7760,7 @@ _sk_hue_avx LABEL PROC
DB 196,65,36,95,208 ; vmaxps %ymm8,%ymm11,%ymm10
DB 196,195,109,74,209,240 ; vblendvps %ymm15,%ymm9,%ymm2,%ymm2
DB 196,193,108,95,208 ; vmaxps %ymm8,%ymm2,%ymm2
- DB 196,98,125,24,5,176,63,2,0 ; vbroadcastss 0x23fb0(%rip),%ymm8 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,98,125,24,5,236,62,2,0 ; vbroadcastss 0x23eec(%rip),%ymm8 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 197,60,92,207 ; vsubps %ymm7,%ymm8,%ymm9
DB 197,180,89,201 ; vmulps %ymm1,%ymm9,%ymm1
DB 197,60,92,195 ; vsubps %ymm3,%ymm8,%ymm8
@@ -7817,12 +7817,12 @@ _sk_saturation_avx LABEL PROC
DB 196,65,28,89,219 ; vmulps %ymm11,%ymm12,%ymm11
DB 196,65,36,94,222 ; vdivps %ymm14,%ymm11,%ymm11
DB 196,67,37,74,224,240 ; vblendvps %ymm15,%ymm8,%ymm11,%ymm12
- DB 196,98,125,24,53,212,62,2,0 ; vbroadcastss 0x23ed4(%rip),%ymm14 # 2c104 <_sk_overlay_sse2_8bit+0x48f>
+ DB 196,98,125,24,53,16,62,2,0 ; vbroadcastss 0x23e10(%rip),%ymm14 # 2c040 <_sk_overlay_sse2_8bit+0x490>
DB 196,65,92,89,222 ; vmulps %ymm14,%ymm4,%ymm11
- DB 196,98,125,24,61,202,62,2,0 ; vbroadcastss 0x23eca(%rip),%ymm15 # 2c108 <_sk_overlay_sse2_8bit+0x493>
+ DB 196,98,125,24,61,6,62,2,0 ; vbroadcastss 0x23e06(%rip),%ymm15 # 2c044 <_sk_overlay_sse2_8bit+0x494>
DB 196,65,84,89,239 ; vmulps %ymm15,%ymm5,%ymm13
DB 196,65,36,88,221 ; vaddps %ymm13,%ymm11,%ymm11
- DB 196,226,125,24,5,187,62,2,0 ; vbroadcastss 0x23ebb(%rip),%ymm0 # 2c10c <_sk_overlay_sse2_8bit+0x497>
+ DB 196,226,125,24,5,247,61,2,0 ; vbroadcastss 0x23df7(%rip),%ymm0 # 2c048 <_sk_overlay_sse2_8bit+0x498>
DB 197,76,89,232 ; vmulps %ymm0,%ymm6,%ymm13
DB 196,65,36,88,221 ; vaddps %ymm13,%ymm11,%ymm11
DB 196,65,52,89,238 ; vmulps %ymm14,%ymm9,%ymm13
@@ -7883,7 +7883,7 @@ _sk_saturation_avx LABEL PROC
DB 196,65,36,95,208 ; vmaxps %ymm8,%ymm11,%ymm10
DB 196,195,109,74,209,240 ; vblendvps %ymm15,%ymm9,%ymm2,%ymm2
DB 196,193,108,95,208 ; vmaxps %ymm8,%ymm2,%ymm2
- DB 196,98,125,24,5,104,61,2,0 ; vbroadcastss 0x23d68(%rip),%ymm8 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,98,125,24,5,164,60,2,0 ; vbroadcastss 0x23ca4(%rip),%ymm8 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 197,60,92,207 ; vsubps %ymm7,%ymm8,%ymm9
DB 197,180,89,201 ; vmulps %ymm1,%ymm9,%ymm1
DB 197,60,92,195 ; vsubps %ymm3,%ymm8,%ymm8
@@ -7912,12 +7912,12 @@ _sk_color_avx LABEL PROC
DB 197,252,17,68,36,32 ; vmovups %ymm0,0x20(%rsp)
DB 197,124,89,199 ; vmulps %ymm7,%ymm0,%ymm8
DB 197,116,89,207 ; vmulps %ymm7,%ymm1,%ymm9
- DB 196,98,125,24,45,20,61,2,0 ; vbroadcastss 0x23d14(%rip),%ymm13 # 2c104 <_sk_overlay_sse2_8bit+0x48f>
+ DB 196,98,125,24,45,80,60,2,0 ; vbroadcastss 0x23c50(%rip),%ymm13 # 2c040 <_sk_overlay_sse2_8bit+0x490>
DB 196,65,92,89,213 ; vmulps %ymm13,%ymm4,%ymm10
- DB 196,98,125,24,53,10,61,2,0 ; vbroadcastss 0x23d0a(%rip),%ymm14 # 2c108 <_sk_overlay_sse2_8bit+0x493>
+ DB 196,98,125,24,53,70,60,2,0 ; vbroadcastss 0x23c46(%rip),%ymm14 # 2c044 <_sk_overlay_sse2_8bit+0x494>
DB 196,65,84,89,222 ; vmulps %ymm14,%ymm5,%ymm11
DB 196,65,44,88,211 ; vaddps %ymm11,%ymm10,%ymm10
- DB 196,98,125,24,61,251,60,2,0 ; vbroadcastss 0x23cfb(%rip),%ymm15 # 2c10c <_sk_overlay_sse2_8bit+0x497>
+ DB 196,98,125,24,61,55,60,2,0 ; vbroadcastss 0x23c37(%rip),%ymm15 # 2c048 <_sk_overlay_sse2_8bit+0x498>
DB 196,65,76,89,223 ; vmulps %ymm15,%ymm6,%ymm11
DB 196,193,44,88,195 ; vaddps %ymm11,%ymm10,%ymm0
DB 196,65,60,89,221 ; vmulps %ymm13,%ymm8,%ymm11
@@ -7980,7 +7980,7 @@ _sk_color_avx LABEL PROC
DB 196,65,44,95,207 ; vmaxps %ymm15,%ymm10,%ymm9
DB 196,195,37,74,192,0 ; vblendvps %ymm0,%ymm8,%ymm11,%ymm0
DB 196,65,124,95,199 ; vmaxps %ymm15,%ymm0,%ymm8
- DB 196,226,125,24,5,150,59,2,0 ; vbroadcastss 0x23b96(%rip),%ymm0 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,226,125,24,5,210,58,2,0 ; vbroadcastss 0x23ad2(%rip),%ymm0 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 197,124,92,215 ; vsubps %ymm7,%ymm0,%ymm10
DB 197,172,89,84,36,32 ; vmulps 0x20(%rsp),%ymm10,%ymm2
DB 197,124,92,219 ; vsubps %ymm3,%ymm0,%ymm11
@@ -8010,12 +8010,12 @@ _sk_luminosity_avx LABEL PROC
DB 197,252,40,208 ; vmovaps %ymm0,%ymm2
DB 197,100,89,196 ; vmulps %ymm4,%ymm3,%ymm8
DB 197,100,89,205 ; vmulps %ymm5,%ymm3,%ymm9
- DB 196,98,125,24,45,62,59,2,0 ; vbroadcastss 0x23b3e(%rip),%ymm13 # 2c104 <_sk_overlay_sse2_8bit+0x48f>
+ DB 196,98,125,24,45,122,58,2,0 ; vbroadcastss 0x23a7a(%rip),%ymm13 # 2c040 <_sk_overlay_sse2_8bit+0x490>
DB 196,65,108,89,213 ; vmulps %ymm13,%ymm2,%ymm10
- DB 196,98,125,24,53,52,59,2,0 ; vbroadcastss 0x23b34(%rip),%ymm14 # 2c108 <_sk_overlay_sse2_8bit+0x493>
+ DB 196,98,125,24,53,112,58,2,0 ; vbroadcastss 0x23a70(%rip),%ymm14 # 2c044 <_sk_overlay_sse2_8bit+0x494>
DB 196,65,116,89,222 ; vmulps %ymm14,%ymm1,%ymm11
DB 196,65,44,88,211 ; vaddps %ymm11,%ymm10,%ymm10
- DB 196,98,125,24,61,37,59,2,0 ; vbroadcastss 0x23b25(%rip),%ymm15 # 2c10c <_sk_overlay_sse2_8bit+0x497>
+ DB 196,98,125,24,61,97,58,2,0 ; vbroadcastss 0x23a61(%rip),%ymm15 # 2c048 <_sk_overlay_sse2_8bit+0x498>
DB 196,65,28,89,223 ; vmulps %ymm15,%ymm12,%ymm11
DB 196,193,44,88,195 ; vaddps %ymm11,%ymm10,%ymm0
DB 196,65,60,89,221 ; vmulps %ymm13,%ymm8,%ymm11
@@ -8078,7 +8078,7 @@ _sk_luminosity_avx LABEL PROC
DB 196,65,44,95,207 ; vmaxps %ymm15,%ymm10,%ymm9
DB 196,195,37,74,192,0 ; vblendvps %ymm0,%ymm8,%ymm11,%ymm0
DB 196,65,124,95,199 ; vmaxps %ymm15,%ymm0,%ymm8
- DB 196,226,125,24,5,192,57,2,0 ; vbroadcastss 0x239c0(%rip),%ymm0 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,226,125,24,5,252,56,2,0 ; vbroadcastss 0x238fc(%rip),%ymm0 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 197,124,92,215 ; vsubps %ymm7,%ymm0,%ymm10
DB 197,172,89,210 ; vmulps %ymm2,%ymm10,%ymm2
DB 197,124,92,219 ; vsubps %ymm3,%ymm0,%ymm11
@@ -8111,7 +8111,7 @@ _sk_srcover_rgba_8888_avx LABEL PROC
DB 72,133,255 ; test %rdi,%rdi
DB 15,133,42,1,0,0 ; jne 88bc <_sk_srcover_rgba_8888_avx+0x14a>
DB 196,1,125,16,4,152 ; vmovupd (%r8,%r11,4),%ymm8
- DB 197,125,40,13,64,62,2,0 ; vmovapd 0x23e40(%rip),%ymm9 # 2c5e0 <_sk_overlay_sse2_8bit+0x96b>
+ DB 197,125,40,13,128,61,2,0 ; vmovapd 0x23d80(%rip),%ymm9 # 2c520 <_sk_overlay_sse2_8bit+0x970>
DB 196,193,61,84,225 ; vandpd %ymm9,%ymm8,%ymm4
DB 197,252,91,228 ; vcvtdq2ps %ymm4,%ymm4
DB 196,193,81,114,208,8 ; vpsrld $0x8,%xmm8,%xmm5
@@ -8129,9 +8129,9 @@ _sk_srcover_rgba_8888_avx LABEL PROC
DB 197,193,114,215,24 ; vpsrld $0x18,%xmm7,%xmm7
DB 196,227,61,24,255,1 ; vinsertf128 $0x1,%xmm7,%ymm8,%ymm7
DB 197,252,91,255 ; vcvtdq2ps %ymm7,%ymm7
- DB 196,98,125,24,5,227,56,2,0 ; vbroadcastss 0x238e3(%rip),%ymm8 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,98,125,24,5,31,56,2,0 ; vbroadcastss 0x2381f(%rip),%ymm8 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 197,60,92,195 ; vsubps %ymm3,%ymm8,%ymm8
- DB 196,98,125,24,13,2,57,2,0 ; vbroadcastss 0x23902(%rip),%ymm9 # 2c110 <_sk_overlay_sse2_8bit+0x49b>
+ DB 196,98,125,24,13,62,56,2,0 ; vbroadcastss 0x2383e(%rip),%ymm9 # 2c04c <_sk_overlay_sse2_8bit+0x49c>
DB 196,193,124,89,193 ; vmulps %ymm9,%ymm0,%ymm0
DB 197,60,89,212 ; vmulps %ymm4,%ymm8,%ymm10
DB 196,193,124,88,194 ; vaddps %ymm10,%ymm0,%ymm0
@@ -8269,7 +8269,7 @@ _sk_clamp_0_avx LABEL PROC
PUBLIC _sk_clamp_1_avx
_sk_clamp_1_avx LABEL PROC
- DB 196,98,125,24,5,162,54,2,0 ; vbroadcastss 0x236a2(%rip),%ymm8 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,98,125,24,5,222,53,2,0 ; vbroadcastss 0x235de(%rip),%ymm8 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 196,193,124,93,192 ; vminps %ymm8,%ymm0,%ymm0
DB 196,193,116,93,200 ; vminps %ymm8,%ymm1,%ymm1
DB 196,193,108,93,208 ; vminps %ymm8,%ymm2,%ymm2
@@ -8279,7 +8279,7 @@ _sk_clamp_1_avx LABEL PROC
PUBLIC _sk_clamp_a_avx
_sk_clamp_a_avx LABEL PROC
- DB 196,98,125,24,5,129,54,2,0 ; vbroadcastss 0x23681(%rip),%ymm8 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,98,125,24,5,189,53,2,0 ; vbroadcastss 0x235bd(%rip),%ymm8 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 196,193,100,93,216 ; vminps %ymm8,%ymm3,%ymm3
DB 197,252,93,195 ; vminps %ymm3,%ymm0,%ymm0
DB 197,244,93,203 ; vminps %ymm3,%ymm1,%ymm1
@@ -8289,7 +8289,7 @@ _sk_clamp_a_avx LABEL PROC
PUBLIC _sk_clamp_a_dst_avx
_sk_clamp_a_dst_avx LABEL PROC
- DB 196,98,125,24,5,99,54,2,0 ; vbroadcastss 0x23663(%rip),%ymm8 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,98,125,24,5,159,53,2,0 ; vbroadcastss 0x2359f(%rip),%ymm8 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 196,193,68,93,248 ; vminps %ymm8,%ymm7,%ymm7
DB 197,220,93,231 ; vminps %ymm7,%ymm4,%ymm4
DB 197,212,93,239 ; vminps %ymm7,%ymm5,%ymm5
@@ -8316,7 +8316,7 @@ _sk_swap_rb_avx LABEL PROC
PUBLIC _sk_invert_avx
_sk_invert_avx LABEL PROC
- DB 196,98,125,24,5,30,54,2,0 ; vbroadcastss 0x2361e(%rip),%ymm8 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,98,125,24,5,90,53,2,0 ; vbroadcastss 0x2355a(%rip),%ymm8 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 197,188,92,192 ; vsubps %ymm0,%ymm8,%ymm0
DB 197,188,92,201 ; vsubps %ymm1,%ymm8,%ymm1
DB 197,188,92,210 ; vsubps %ymm2,%ymm8,%ymm2
@@ -8362,7 +8362,7 @@ PUBLIC _sk_unpremul_avx
_sk_unpremul_avx LABEL PROC
DB 196,65,60,87,192 ; vxorps %ymm8,%ymm8,%ymm8
DB 196,65,100,194,200,0 ; vcmpeqps %ymm8,%ymm3,%ymm9
- DB 196,98,125,24,21,174,53,2,0 ; vbroadcastss 0x235ae(%rip),%ymm10 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,98,125,24,21,234,52,2,0 ; vbroadcastss 0x234ea(%rip),%ymm10 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 197,44,94,211 ; vdivps %ymm3,%ymm10,%ymm10
DB 196,67,45,74,192,144 ; vblendvps %ymm9,%ymm8,%ymm10,%ymm8
DB 197,188,89,192 ; vmulps %ymm0,%ymm8,%ymm0
@@ -8373,17 +8373,17 @@ _sk_unpremul_avx LABEL PROC
PUBLIC _sk_from_srgb_avx
_sk_from_srgb_avx LABEL PROC
- DB 196,98,125,24,5,187,53,2,0 ; vbroadcastss 0x235bb(%rip),%ymm8 # 2c114 <_sk_overlay_sse2_8bit+0x49f>
+ DB 196,98,125,24,5,247,52,2,0 ; vbroadcastss 0x234f7(%rip),%ymm8 # 2c050 <_sk_overlay_sse2_8bit+0x4a0>
DB 196,65,124,89,200 ; vmulps %ymm8,%ymm0,%ymm9
DB 197,124,89,208 ; vmulps %ymm0,%ymm0,%ymm10
- DB 196,98,125,24,29,153,53,2,0 ; vbroadcastss 0x23599(%rip),%ymm11 # 2c104 <_sk_overlay_sse2_8bit+0x48f>
+ DB 196,98,125,24,29,213,52,2,0 ; vbroadcastss 0x234d5(%rip),%ymm11 # 2c040 <_sk_overlay_sse2_8bit+0x490>
DB 196,65,124,89,227 ; vmulps %ymm11,%ymm0,%ymm12
- DB 196,98,125,24,45,159,53,2,0 ; vbroadcastss 0x2359f(%rip),%ymm13 # 2c118 <_sk_overlay_sse2_8bit+0x4a3>
+ DB 196,98,125,24,45,219,52,2,0 ; vbroadcastss 0x234db(%rip),%ymm13 # 2c054 <_sk_overlay_sse2_8bit+0x4a4>
DB 196,65,28,88,229 ; vaddps %ymm13,%ymm12,%ymm12
DB 196,65,44,89,212 ; vmulps %ymm12,%ymm10,%ymm10
- DB 196,98,125,24,37,144,53,2,0 ; vbroadcastss 0x23590(%rip),%ymm12 # 2c11c <_sk_overlay_sse2_8bit+0x4a7>
+ DB 196,98,125,24,37,204,52,2,0 ; vbroadcastss 0x234cc(%rip),%ymm12 # 2c058 <_sk_overlay_sse2_8bit+0x4a8>
DB 196,65,44,88,212 ; vaddps %ymm12,%ymm10,%ymm10
- DB 196,98,125,24,53,134,53,2,0 ; vbroadcastss 0x23586(%rip),%ymm14 # 2c120 <_sk_overlay_sse2_8bit+0x4ab>
+ DB 196,98,125,24,53,194,52,2,0 ; vbroadcastss 0x234c2(%rip),%ymm14 # 2c05c <_sk_overlay_sse2_8bit+0x4ac>
DB 196,193,124,194,198,1 ; vcmpltps %ymm14,%ymm0,%ymm0
DB 196,195,45,74,193,0 ; vblendvps %ymm0,%ymm9,%ymm10,%ymm0
DB 196,65,116,89,200 ; vmulps %ymm8,%ymm1,%ymm9
@@ -8407,17 +8407,17 @@ _sk_from_srgb_avx LABEL PROC
PUBLIC _sk_from_srgb_dst_avx
_sk_from_srgb_dst_avx LABEL PROC
- DB 196,98,125,24,5,15,53,2,0 ; vbroadcastss 0x2350f(%rip),%ymm8 # 2c114 <_sk_overlay_sse2_8bit+0x49f>
+ DB 196,98,125,24,5,75,52,2,0 ; vbroadcastss 0x2344b(%rip),%ymm8 # 2c050 <_sk_overlay_sse2_8bit+0x4a0>
DB 196,65,92,89,200 ; vmulps %ymm8,%ymm4,%ymm9
DB 197,92,89,212 ; vmulps %ymm4,%ymm4,%ymm10
- DB 196,98,125,24,29,237,52,2,0 ; vbroadcastss 0x234ed(%rip),%ymm11 # 2c104 <_sk_overlay_sse2_8bit+0x48f>
+ DB 196,98,125,24,29,41,52,2,0 ; vbroadcastss 0x23429(%rip),%ymm11 # 2c040 <_sk_overlay_sse2_8bit+0x490>
DB 196,65,92,89,227 ; vmulps %ymm11,%ymm4,%ymm12
- DB 196,98,125,24,45,243,52,2,0 ; vbroadcastss 0x234f3(%rip),%ymm13 # 2c118 <_sk_overlay_sse2_8bit+0x4a3>
+ DB 196,98,125,24,45,47,52,2,0 ; vbroadcastss 0x2342f(%rip),%ymm13 # 2c054 <_sk_overlay_sse2_8bit+0x4a4>
DB 196,65,28,88,229 ; vaddps %ymm13,%ymm12,%ymm12
DB 196,65,44,89,212 ; vmulps %ymm12,%ymm10,%ymm10
- DB 196,98,125,24,37,228,52,2,0 ; vbroadcastss 0x234e4(%rip),%ymm12 # 2c11c <_sk_overlay_sse2_8bit+0x4a7>
+ DB 196,98,125,24,37,32,52,2,0 ; vbroadcastss 0x23420(%rip),%ymm12 # 2c058 <_sk_overlay_sse2_8bit+0x4a8>
DB 196,65,44,88,212 ; vaddps %ymm12,%ymm10,%ymm10
- DB 196,98,125,24,53,218,52,2,0 ; vbroadcastss 0x234da(%rip),%ymm14 # 2c120 <_sk_overlay_sse2_8bit+0x4ab>
+ DB 196,98,125,24,53,22,52,2,0 ; vbroadcastss 0x23416(%rip),%ymm14 # 2c05c <_sk_overlay_sse2_8bit+0x4ac>
DB 196,193,92,194,230,1 ; vcmpltps %ymm14,%ymm4,%ymm4
DB 196,195,45,74,225,64 ; vblendvps %ymm4,%ymm9,%ymm10,%ymm4
DB 196,65,84,89,200 ; vmulps %ymm8,%ymm5,%ymm9
@@ -8442,20 +8442,20 @@ _sk_from_srgb_dst_avx LABEL PROC
PUBLIC _sk_to_srgb_avx
_sk_to_srgb_avx LABEL PROC
DB 197,124,82,200 ; vrsqrtps %ymm0,%ymm9
- DB 196,98,125,24,5,111,52,2,0 ; vbroadcastss 0x2346f(%rip),%ymm8 # 2c124 <_sk_overlay_sse2_8bit+0x4af>
+ DB 196,98,125,24,5,171,51,2,0 ; vbroadcastss 0x233ab(%rip),%ymm8 # 2c060 <_sk_overlay_sse2_8bit+0x4b0>
DB 196,65,124,89,208 ; vmulps %ymm8,%ymm0,%ymm10
- DB 196,98,125,24,29,105,52,2,0 ; vbroadcastss 0x23469(%rip),%ymm11 # 2c12c <_sk_overlay_sse2_8bit+0x4b7>
+ DB 196,98,125,24,29,165,51,2,0 ; vbroadcastss 0x233a5(%rip),%ymm11 # 2c068 <_sk_overlay_sse2_8bit+0x4b8>
DB 196,65,52,89,227 ; vmulps %ymm11,%ymm9,%ymm12
- DB 196,98,125,24,45,87,52,2,0 ; vbroadcastss 0x23457(%rip),%ymm13 # 2c128 <_sk_overlay_sse2_8bit+0x4b3>
+ DB 196,98,125,24,45,147,51,2,0 ; vbroadcastss 0x23393(%rip),%ymm13 # 2c064 <_sk_overlay_sse2_8bit+0x4b4>
DB 196,65,28,88,229 ; vaddps %ymm13,%ymm12,%ymm12
DB 196,65,52,89,228 ; vmulps %ymm12,%ymm9,%ymm12
- DB 196,98,125,24,53,76,52,2,0 ; vbroadcastss 0x2344c(%rip),%ymm14 # 2c130 <_sk_overlay_sse2_8bit+0x4bb>
+ DB 196,98,125,24,53,136,51,2,0 ; vbroadcastss 0x23388(%rip),%ymm14 # 2c06c <_sk_overlay_sse2_8bit+0x4bc>
DB 196,65,28,88,230 ; vaddps %ymm14,%ymm12,%ymm12
- DB 196,98,125,24,61,66,52,2,0 ; vbroadcastss 0x23442(%rip),%ymm15 # 2c134 <_sk_overlay_sse2_8bit+0x4bf>
+ DB 196,98,125,24,61,126,51,2,0 ; vbroadcastss 0x2337e(%rip),%ymm15 # 2c070 <_sk_overlay_sse2_8bit+0x4c0>
DB 196,65,52,88,207 ; vaddps %ymm15,%ymm9,%ymm9
DB 196,65,124,83,201 ; vrcpps %ymm9,%ymm9
DB 196,65,52,89,204 ; vmulps %ymm12,%ymm9,%ymm9
- DB 196,98,125,24,37,46,52,2,0 ; vbroadcastss 0x2342e(%rip),%ymm12 # 2c138 <_sk_overlay_sse2_8bit+0x4c3>
+ DB 196,98,125,24,37,106,51,2,0 ; vbroadcastss 0x2336a(%rip),%ymm12 # 2c074 <_sk_overlay_sse2_8bit+0x4c4>
DB 196,193,124,194,196,1 ; vcmpltps %ymm12,%ymm0,%ymm0
DB 196,195,53,74,194,0 ; vblendvps %ymm0,%ymm10,%ymm9,%ymm0
DB 197,124,82,201 ; vrsqrtps %ymm1,%ymm9
@@ -8490,7 +8490,7 @@ _sk_rgb_to_hsl_avx LABEL PROC
DB 197,116,93,202 ; vminps %ymm2,%ymm1,%ymm9
DB 196,65,124,93,201 ; vminps %ymm9,%ymm0,%ymm9
DB 196,65,60,92,209 ; vsubps %ymm9,%ymm8,%ymm10
- DB 196,98,125,24,29,58,51,2,0 ; vbroadcastss 0x2333a(%rip),%ymm11 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,98,125,24,29,118,50,2,0 ; vbroadcastss 0x23276(%rip),%ymm11 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 196,65,36,94,218 ; vdivps %ymm10,%ymm11,%ymm11
DB 197,116,92,226 ; vsubps %ymm2,%ymm1,%ymm12
DB 196,65,28,89,227 ; vmulps %ymm11,%ymm12,%ymm12
@@ -8500,19 +8500,19 @@ _sk_rgb_to_hsl_avx LABEL PROC
DB 196,193,108,89,211 ; vmulps %ymm11,%ymm2,%ymm2
DB 197,252,92,201 ; vsubps %ymm1,%ymm0,%ymm1
DB 196,193,116,89,203 ; vmulps %ymm11,%ymm1,%ymm1
- DB 196,98,125,24,29,103,51,2,0 ; vbroadcastss 0x23367(%rip),%ymm11 # 2c144 <_sk_overlay_sse2_8bit+0x4cf>
+ DB 196,98,125,24,29,163,50,2,0 ; vbroadcastss 0x232a3(%rip),%ymm11 # 2c080 <_sk_overlay_sse2_8bit+0x4d0>
DB 196,193,116,88,203 ; vaddps %ymm11,%ymm1,%ymm1
- DB 196,98,125,24,29,85,51,2,0 ; vbroadcastss 0x23355(%rip),%ymm11 # 2c140 <_sk_overlay_sse2_8bit+0x4cb>
+ DB 196,98,125,24,29,145,50,2,0 ; vbroadcastss 0x23291(%rip),%ymm11 # 2c07c <_sk_overlay_sse2_8bit+0x4cc>
DB 196,193,108,88,211 ; vaddps %ymm11,%ymm2,%ymm2
DB 196,227,117,74,202,224 ; vblendvps %ymm14,%ymm2,%ymm1,%ymm1
- DB 196,226,125,24,21,61,51,2,0 ; vbroadcastss 0x2333d(%rip),%ymm2 # 2c13c <_sk_overlay_sse2_8bit+0x4c7>
+ DB 196,226,125,24,21,121,50,2,0 ; vbroadcastss 0x23279(%rip),%ymm2 # 2c078 <_sk_overlay_sse2_8bit+0x4c8>
DB 196,65,12,87,246 ; vxorps %ymm14,%ymm14,%ymm14
DB 196,227,13,74,210,208 ; vblendvps %ymm13,%ymm2,%ymm14,%ymm2
DB 197,188,194,192,0 ; vcmpeqps %ymm0,%ymm8,%ymm0
DB 196,193,108,88,212 ; vaddps %ymm12,%ymm2,%ymm2
DB 196,227,117,74,194,0 ; vblendvps %ymm0,%ymm2,%ymm1,%ymm0
DB 196,193,60,88,201 ; vaddps %ymm9,%ymm8,%ymm1
- DB 196,98,125,24,37,184,50,2,0 ; vbroadcastss 0x232b8(%rip),%ymm12 # 2c0e0 <_sk_overlay_sse2_8bit+0x46b>
+ DB 196,98,125,24,37,244,49,2,0 ; vbroadcastss 0x231f4(%rip),%ymm12 # 2c01c <_sk_overlay_sse2_8bit+0x46c>
DB 196,193,116,89,212 ; vmulps %ymm12,%ymm1,%ymm2
DB 197,28,194,226,1 ; vcmpltps %ymm2,%ymm12,%ymm12
DB 196,65,36,92,216 ; vsubps %ymm8,%ymm11,%ymm11
@@ -8522,7 +8522,7 @@ _sk_rgb_to_hsl_avx LABEL PROC
DB 197,172,94,201 ; vdivps %ymm1,%ymm10,%ymm1
DB 196,195,125,74,198,128 ; vblendvps %ymm8,%ymm14,%ymm0,%ymm0
DB 196,195,117,74,206,128 ; vblendvps %ymm8,%ymm14,%ymm1,%ymm1
- DB 196,98,125,24,5,231,50,2,0 ; vbroadcastss 0x232e7(%rip),%ymm8 # 2c148 <_sk_overlay_sse2_8bit+0x4d3>
+ DB 196,98,125,24,5,35,50,2,0 ; vbroadcastss 0x23223(%rip),%ymm8 # 2c084 <_sk_overlay_sse2_8bit+0x4d4>
DB 196,193,124,89,192 ; vmulps %ymm8,%ymm0,%ymm0
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
@@ -8537,7 +8537,7 @@ _sk_hsl_to_rgb_avx LABEL PROC
DB 197,252,17,28,36 ; vmovups %ymm3,(%rsp)
DB 197,252,40,225 ; vmovaps %ymm1,%ymm4
DB 197,252,40,216 ; vmovaps %ymm0,%ymm3
- DB 196,98,125,24,5,62,50,2,0 ; vbroadcastss 0x2323e(%rip),%ymm8 # 2c0e0 <_sk_overlay_sse2_8bit+0x46b>
+ DB 196,98,125,24,5,122,49,2,0 ; vbroadcastss 0x2317a(%rip),%ymm8 # 2c01c <_sk_overlay_sse2_8bit+0x46c>
DB 197,60,194,202,2 ; vcmpleps %ymm2,%ymm8,%ymm9
DB 197,92,89,210 ; vmulps %ymm2,%ymm4,%ymm10
DB 196,65,92,92,218 ; vsubps %ymm10,%ymm4,%ymm11
@@ -8545,23 +8545,23 @@ _sk_hsl_to_rgb_avx LABEL PROC
DB 197,52,88,210 ; vaddps %ymm2,%ymm9,%ymm10
DB 197,108,88,202 ; vaddps %ymm2,%ymm2,%ymm9
DB 196,65,52,92,202 ; vsubps %ymm10,%ymm9,%ymm9
- DB 196,98,125,24,29,128,50,2,0 ; vbroadcastss 0x23280(%rip),%ymm11 # 2c14c <_sk_overlay_sse2_8bit+0x4d7>
+ DB 196,98,125,24,29,188,49,2,0 ; vbroadcastss 0x231bc(%rip),%ymm11 # 2c088 <_sk_overlay_sse2_8bit+0x4d8>
DB 196,65,100,88,219 ; vaddps %ymm11,%ymm3,%ymm11
DB 196,67,125,8,227,1 ; vroundps $0x1,%ymm11,%ymm12
DB 196,65,36,92,252 ; vsubps %ymm12,%ymm11,%ymm15
DB 196,65,44,92,217 ; vsubps %ymm9,%ymm10,%ymm11
- DB 196,98,125,24,37,82,50,2,0 ; vbroadcastss 0x23252(%rip),%ymm12 # 2c13c <_sk_overlay_sse2_8bit+0x4c7>
+ DB 196,98,125,24,37,142,49,2,0 ; vbroadcastss 0x2318e(%rip),%ymm12 # 2c078 <_sk_overlay_sse2_8bit+0x4c8>
DB 196,193,4,89,196 ; vmulps %ymm12,%ymm15,%ymm0
- DB 196,98,125,24,45,76,50,2,0 ; vbroadcastss 0x2324c(%rip),%ymm13 # 2c144 <_sk_overlay_sse2_8bit+0x4cf>
+ DB 196,98,125,24,45,136,49,2,0 ; vbroadcastss 0x23188(%rip),%ymm13 # 2c080 <_sk_overlay_sse2_8bit+0x4d0>
DB 197,20,92,240 ; vsubps %ymm0,%ymm13,%ymm14
DB 196,65,36,89,246 ; vmulps %ymm14,%ymm11,%ymm14
DB 196,65,52,88,246 ; vaddps %ymm14,%ymm9,%ymm14
- DB 196,226,125,24,13,65,50,2,0 ; vbroadcastss 0x23241(%rip),%ymm1 # 2c150 <_sk_overlay_sse2_8bit+0x4db>
+ DB 196,226,125,24,13,125,49,2,0 ; vbroadcastss 0x2317d(%rip),%ymm1 # 2c08c <_sk_overlay_sse2_8bit+0x4dc>
DB 196,193,116,194,255,2 ; vcmpleps %ymm15,%ymm1,%ymm7
DB 196,195,13,74,249,112 ; vblendvps %ymm7,%ymm9,%ymm14,%ymm7
DB 196,65,60,194,247,2 ; vcmpleps %ymm15,%ymm8,%ymm14
DB 196,227,45,74,255,224 ; vblendvps %ymm14,%ymm7,%ymm10,%ymm7
- DB 196,98,125,24,53,24,50,2,0 ; vbroadcastss 0x23218(%rip),%ymm14 # 2c148 <_sk_overlay_sse2_8bit+0x4d3>
+ DB 196,98,125,24,53,84,49,2,0 ; vbroadcastss 0x23154(%rip),%ymm14 # 2c084 <_sk_overlay_sse2_8bit+0x4d4>
DB 196,65,12,194,255,2 ; vcmpleps %ymm15,%ymm14,%ymm15
DB 196,193,124,89,195 ; vmulps %ymm11,%ymm0,%ymm0
DB 197,180,88,192 ; vaddps %ymm0,%ymm9,%ymm0
@@ -8580,7 +8580,7 @@ _sk_hsl_to_rgb_avx LABEL PROC
DB 197,164,89,247 ; vmulps %ymm7,%ymm11,%ymm6
DB 197,180,88,246 ; vaddps %ymm6,%ymm9,%ymm6
DB 196,227,77,74,237,0 ; vblendvps %ymm0,%ymm5,%ymm6,%ymm5
- DB 196,226,125,24,5,194,49,2,0 ; vbroadcastss 0x231c2(%rip),%ymm0 # 2c154 <_sk_overlay_sse2_8bit+0x4df>
+ DB 196,226,125,24,5,254,48,2,0 ; vbroadcastss 0x230fe(%rip),%ymm0 # 2c090 <_sk_overlay_sse2_8bit+0x4e0>
DB 197,228,88,192 ; vaddps %ymm0,%ymm3,%ymm0
DB 196,227,125,8,216,1 ; vroundps $0x1,%ymm0,%ymm3
DB 197,252,92,195 ; vsubps %ymm3,%ymm0,%ymm0
@@ -8632,13 +8632,13 @@ _sk_scale_u8_avx LABEL PROC
DB 72,133,255 ; test %rdi,%rdi
DB 117,74 ; jne 909d <_sk_scale_u8_avx+0x62>
DB 196,2,121,48,4,24 ; vpmovzxbw (%r8,%r11,1),%xmm8
- DB 197,57,219,5,111,58,2,0 ; vpand 0x23a6f(%rip),%xmm8,%xmm8 # 2cad0 <_sk_overlay_sse2_8bit+0xe5b>
+ DB 197,57,219,5,175,57,2,0 ; vpand 0x239af(%rip),%xmm8,%xmm8 # 2ca10 <_sk_overlay_sse2_8bit+0xe60>
DB 196,65,49,239,201 ; vpxor %xmm9,%xmm9,%xmm9
DB 196,65,57,105,201 ; vpunpckhwd %xmm9,%xmm8,%xmm9
DB 196,66,121,51,192 ; vpmovzxwd %xmm8,%xmm8
DB 196,67,61,24,193,1 ; vinsertf128 $0x1,%xmm9,%ymm8,%ymm8
DB 196,65,124,91,192 ; vcvtdq2ps %ymm8,%ymm8
- DB 196,98,125,24,13,212,48,2,0 ; vbroadcastss 0x230d4(%rip),%ymm9 # 2c158 <_sk_overlay_sse2_8bit+0x4e3>
+ DB 196,98,125,24,13,16,48,2,0 ; vbroadcastss 0x23010(%rip),%ymm9 # 2c094 <_sk_overlay_sse2_8bit+0x4e4>
DB 196,65,60,89,193 ; vmulps %ymm9,%ymm8,%ymm8
DB 197,188,89,192 ; vmulps %ymm0,%ymm8,%ymm0
DB 197,188,89,201 ; vmulps %ymm1,%ymm8,%ymm1
@@ -8686,7 +8686,7 @@ _sk_scale_u8_avx LABEL PROC
DB 255 ; (bad)
DB 255 ; (bad)
DB 255 ; (bad)
- DB 232,255,255,255,221 ; callq ffffffffde009148 <_sk_overlay_sse2_8bit+0xffffffffddfdd4d3>
+ DB 232,255,255,255,221 ; callq ffffffffde009148 <_sk_overlay_sse2_8bit+0xffffffffddfdd598>
DB 255 ; (bad)
DB 255 ; (bad)
DB 255,210 ; callq *%rdx
@@ -8713,20 +8713,20 @@ _sk_scale_565_avx LABEL PROC
DB 196,65,57,105,201 ; vpunpckhwd %xmm9,%xmm8,%xmm9
DB 196,66,121,51,192 ; vpmovzxwd %xmm8,%xmm8
DB 196,67,61,24,193,1 ; vinsertf128 $0x1,%xmm9,%ymm8,%ymm8
- DB 196,98,125,24,13,197,47,2,0 ; vbroadcastss 0x22fc5(%rip),%ymm9 # 2c15c <_sk_overlay_sse2_8bit+0x4e7>
+ DB 196,98,125,24,13,1,47,2,0 ; vbroadcastss 0x22f01(%rip),%ymm9 # 2c098 <_sk_overlay_sse2_8bit+0x4e8>
DB 196,65,60,84,201 ; vandps %ymm9,%ymm8,%ymm9
DB 196,65,124,91,201 ; vcvtdq2ps %ymm9,%ymm9
- DB 196,98,125,24,21,182,47,2,0 ; vbroadcastss 0x22fb6(%rip),%ymm10 # 2c160 <_sk_overlay_sse2_8bit+0x4eb>
+ DB 196,98,125,24,21,242,46,2,0 ; vbroadcastss 0x22ef2(%rip),%ymm10 # 2c09c <_sk_overlay_sse2_8bit+0x4ec>
DB 196,65,52,89,202 ; vmulps %ymm10,%ymm9,%ymm9
- DB 196,98,125,24,21,172,47,2,0 ; vbroadcastss 0x22fac(%rip),%ymm10 # 2c164 <_sk_overlay_sse2_8bit+0x4ef>
+ DB 196,98,125,24,21,232,46,2,0 ; vbroadcastss 0x22ee8(%rip),%ymm10 # 2c0a0 <_sk_overlay_sse2_8bit+0x4f0>
DB 196,65,60,84,210 ; vandps %ymm10,%ymm8,%ymm10
DB 196,65,124,91,210 ; vcvtdq2ps %ymm10,%ymm10
- DB 196,98,125,24,29,157,47,2,0 ; vbroadcastss 0x22f9d(%rip),%ymm11 # 2c168 <_sk_overlay_sse2_8bit+0x4f3>
+ DB 196,98,125,24,29,217,46,2,0 ; vbroadcastss 0x22ed9(%rip),%ymm11 # 2c0a4 <_sk_overlay_sse2_8bit+0x4f4>
DB 196,65,44,89,211 ; vmulps %ymm11,%ymm10,%ymm10
- DB 196,98,125,24,29,147,47,2,0 ; vbroadcastss 0x22f93(%rip),%ymm11 # 2c16c <_sk_overlay_sse2_8bit+0x4f7>
+ DB 196,98,125,24,29,207,46,2,0 ; vbroadcastss 0x22ecf(%rip),%ymm11 # 2c0a8 <_sk_overlay_sse2_8bit+0x4f8>
DB 196,65,60,84,195 ; vandps %ymm11,%ymm8,%ymm8
DB 196,65,124,91,192 ; vcvtdq2ps %ymm8,%ymm8
- DB 196,98,125,24,29,132,47,2,0 ; vbroadcastss 0x22f84(%rip),%ymm11 # 2c170 <_sk_overlay_sse2_8bit+0x4fb>
+ DB 196,98,125,24,29,192,46,2,0 ; vbroadcastss 0x22ec0(%rip),%ymm11 # 2c0ac <_sk_overlay_sse2_8bit+0x4fc>
DB 196,65,60,89,195 ; vmulps %ymm11,%ymm8,%ymm8
DB 197,100,194,223,1 ; vcmpltps %ymm7,%ymm3,%ymm11
DB 196,65,44,93,224 ; vminps %ymm8,%ymm10,%ymm12
@@ -8817,13 +8817,13 @@ _sk_lerp_u8_avx LABEL PROC
DB 72,133,255 ; test %rdi,%rdi
DB 117,110 ; jne 938d <_sk_lerp_u8_avx+0x86>
DB 196,2,121,48,4,24 ; vpmovzxbw (%r8,%r11,1),%xmm8
- DB 197,57,219,5,163,55,2,0 ; vpand 0x237a3(%rip),%xmm8,%xmm8 # 2cad0 <_sk_overlay_sse2_8bit+0xe5b>
+ DB 197,57,219,5,227,54,2,0 ; vpand 0x236e3(%rip),%xmm8,%xmm8 # 2ca10 <_sk_overlay_sse2_8bit+0xe60>
DB 196,65,49,239,201 ; vpxor %xmm9,%xmm9,%xmm9
DB 196,65,57,105,201 ; vpunpckhwd %xmm9,%xmm8,%xmm9
DB 196,66,121,51,192 ; vpmovzxwd %xmm8,%xmm8
DB 196,67,61,24,193,1 ; vinsertf128 $0x1,%xmm9,%ymm8,%ymm8
DB 196,65,124,91,192 ; vcvtdq2ps %ymm8,%ymm8
- DB 196,98,125,24,13,8,46,2,0 ; vbroadcastss 0x22e08(%rip),%ymm9 # 2c158 <_sk_overlay_sse2_8bit+0x4e3>
+ DB 196,98,125,24,13,68,45,2,0 ; vbroadcastss 0x22d44(%rip),%ymm9 # 2c094 <_sk_overlay_sse2_8bit+0x4e4>
DB 196,65,60,89,193 ; vmulps %ymm9,%ymm8,%ymm8
DB 197,252,92,196 ; vsubps %ymm4,%ymm0,%ymm0
DB 196,193,124,89,192 ; vmulps %ymm8,%ymm0,%ymm0
@@ -8908,20 +8908,20 @@ _sk_lerp_565_avx LABEL PROC
DB 196,65,57,105,201 ; vpunpckhwd %xmm9,%xmm8,%xmm9
DB 196,66,121,51,192 ; vpmovzxwd %xmm8,%xmm8
DB 196,67,61,24,193,1 ; vinsertf128 $0x1,%xmm9,%ymm8,%ymm8
- DB 196,98,125,24,13,209,44,2,0 ; vbroadcastss 0x22cd1(%rip),%ymm9 # 2c15c <_sk_overlay_sse2_8bit+0x4e7>
+ DB 196,98,125,24,13,13,44,2,0 ; vbroadcastss 0x22c0d(%rip),%ymm9 # 2c098 <_sk_overlay_sse2_8bit+0x4e8>
DB 196,65,60,84,201 ; vandps %ymm9,%ymm8,%ymm9
DB 196,65,124,91,201 ; vcvtdq2ps %ymm9,%ymm9
- DB 196,98,125,24,21,194,44,2,0 ; vbroadcastss 0x22cc2(%rip),%ymm10 # 2c160 <_sk_overlay_sse2_8bit+0x4eb>
+ DB 196,98,125,24,21,254,43,2,0 ; vbroadcastss 0x22bfe(%rip),%ymm10 # 2c09c <_sk_overlay_sse2_8bit+0x4ec>
DB 196,65,52,89,202 ; vmulps %ymm10,%ymm9,%ymm9
- DB 196,98,125,24,21,184,44,2,0 ; vbroadcastss 0x22cb8(%rip),%ymm10 # 2c164 <_sk_overlay_sse2_8bit+0x4ef>
+ DB 196,98,125,24,21,244,43,2,0 ; vbroadcastss 0x22bf4(%rip),%ymm10 # 2c0a0 <_sk_overlay_sse2_8bit+0x4f0>
DB 196,65,60,84,210 ; vandps %ymm10,%ymm8,%ymm10
DB 196,65,124,91,210 ; vcvtdq2ps %ymm10,%ymm10
- DB 196,98,125,24,29,169,44,2,0 ; vbroadcastss 0x22ca9(%rip),%ymm11 # 2c168 <_sk_overlay_sse2_8bit+0x4f3>
+ DB 196,98,125,24,29,229,43,2,0 ; vbroadcastss 0x22be5(%rip),%ymm11 # 2c0a4 <_sk_overlay_sse2_8bit+0x4f4>
DB 196,65,44,89,211 ; vmulps %ymm11,%ymm10,%ymm10
- DB 196,98,125,24,29,159,44,2,0 ; vbroadcastss 0x22c9f(%rip),%ymm11 # 2c16c <_sk_overlay_sse2_8bit+0x4f7>
+ DB 196,98,125,24,29,219,43,2,0 ; vbroadcastss 0x22bdb(%rip),%ymm11 # 2c0a8 <_sk_overlay_sse2_8bit+0x4f8>
DB 196,65,60,84,195 ; vandps %ymm11,%ymm8,%ymm8
DB 196,65,124,91,192 ; vcvtdq2ps %ymm8,%ymm8
- DB 196,98,125,24,29,144,44,2,0 ; vbroadcastss 0x22c90(%rip),%ymm11 # 2c170 <_sk_overlay_sse2_8bit+0x4fb>
+ DB 196,98,125,24,29,204,43,2,0 ; vbroadcastss 0x22bcc(%rip),%ymm11 # 2c0ac <_sk_overlay_sse2_8bit+0x4fc>
DB 196,65,60,89,195 ; vmulps %ymm11,%ymm8,%ymm8
DB 197,100,194,223,1 ; vcmpltps %ymm7,%ymm3,%ymm11
DB 196,65,44,93,224 ; vminps %ymm8,%ymm10,%ymm12
@@ -8999,7 +8999,7 @@ _sk_load_tables_avx LABEL PROC
DB 72,133,255 ; test %rdi,%rdi
DB 15,133,7,2,0,0 ; jne 97fe <_sk_load_tables_avx+0x21e>
DB 196,65,125,16,20,144 ; vmovupd (%r8,%rdx,4),%ymm10
- DB 197,125,40,13,251,47,2,0 ; vmovapd 0x22ffb(%rip),%ymm9 # 2c600 <_sk_overlay_sse2_8bit+0x98b>
+ DB 197,125,40,13,59,47,2,0 ; vmovapd 0x22f3b(%rip),%ymm9 # 2c540 <_sk_overlay_sse2_8bit+0x990>
DB 196,193,45,84,201 ; vandpd %ymm9,%ymm10,%ymm1
DB 196,227,125,25,200,1 ; vextractf128 $0x1,%ymm1,%xmm0
DB 196,193,249,126,192 ; vmovq %xmm0,%r8
@@ -9091,7 +9091,7 @@ _sk_load_tables_avx LABEL PROC
DB 196,193,65,114,213,24 ; vpsrld $0x18,%xmm13,%xmm7
DB 196,227,101,24,223,1 ; vinsertf128 $0x1,%xmm7,%ymm3,%ymm3
DB 197,252,91,219 ; vcvtdq2ps %ymm3,%ymm3
- DB 196,226,125,24,61,107,41,2,0 ; vbroadcastss 0x2296b(%rip),%ymm7 # 2c158 <_sk_overlay_sse2_8bit+0x4e3>
+ DB 196,226,125,24,61,167,40,2,0 ; vbroadcastss 0x228a7(%rip),%ymm7 # 2c094 <_sk_overlay_sse2_8bit+0x4e4>
DB 197,228,89,223 ; vmulps %ymm7,%ymm3,%ymm3
DB 72,173 ; lods %ds:(%rsi),%rax
DB 197,252,16,60,36 ; vmovups (%rsp),%ymm7
@@ -9176,7 +9176,7 @@ _sk_load_tables_u16_be_avx LABEL PROC
DB 197,113,105,219 ; vpunpckhwd %xmm3,%xmm1,%xmm11
DB 197,177,108,200 ; vpunpcklqdq %xmm0,%xmm9,%xmm1
DB 197,49,109,224 ; vpunpckhqdq %xmm0,%xmm9,%xmm12
- DB 197,121,111,21,148,49,2,0 ; vmovdqa 0x23194(%rip),%xmm10 # 2cad0 <_sk_overlay_sse2_8bit+0xe5b>
+ DB 197,121,111,21,212,48,2,0 ; vmovdqa 0x230d4(%rip),%xmm10 # 2ca10 <_sk_overlay_sse2_8bit+0xe60>
DB 196,193,113,219,202 ; vpand %xmm10,%xmm1,%xmm1
DB 196,65,49,239,201 ; vpxor %xmm9,%xmm9,%xmm9
DB 196,193,113,105,209 ; vpunpckhwd %xmm9,%xmm1,%xmm2
@@ -9274,7 +9274,7 @@ _sk_load_tables_u16_be_avx LABEL PROC
DB 196,226,121,51,219 ; vpmovzxwd %xmm3,%xmm3
DB 196,227,101,24,223,1 ; vinsertf128 $0x1,%xmm7,%ymm3,%ymm3
DB 197,252,91,219 ; vcvtdq2ps %ymm3,%ymm3
- DB 196,226,125,24,61,63,38,2,0 ; vbroadcastss 0x2263f(%rip),%ymm7 # 2c174 <_sk_overlay_sse2_8bit+0x4ff>
+ DB 196,226,125,24,61,123,37,2,0 ; vbroadcastss 0x2257b(%rip),%ymm7 # 2c0b0 <_sk_overlay_sse2_8bit+0x500>
DB 197,228,89,223 ; vmulps %ymm7,%ymm3,%ymm3
DB 72,173 ; lods %ds:(%rsi),%rax
DB 197,252,16,60,36 ; vmovups (%rsp),%ymm7
@@ -9337,7 +9337,7 @@ _sk_load_tables_rgb_u16_be_avx LABEL PROC
DB 197,185,108,211 ; vpunpcklqdq %xmm3,%xmm8,%xmm2
DB 197,57,109,219 ; vpunpckhqdq %xmm3,%xmm8,%xmm11
DB 197,113,108,192 ; vpunpcklqdq %xmm0,%xmm1,%xmm8
- DB 197,121,111,13,130,46,2,0 ; vmovdqa 0x22e82(%rip),%xmm9 # 2cad0 <_sk_overlay_sse2_8bit+0xe5b>
+ DB 197,121,111,13,194,45,2,0 ; vmovdqa 0x22dc2(%rip),%xmm9 # 2ca10 <_sk_overlay_sse2_8bit+0xe60>
DB 196,193,105,219,193 ; vpand %xmm9,%xmm2,%xmm0
DB 196,65,41,239,210 ; vpxor %xmm10,%xmm10,%xmm10
DB 196,193,121,105,202 ; vpunpckhwd %xmm10,%xmm0,%xmm1
@@ -9427,7 +9427,7 @@ _sk_load_tables_rgb_u16_be_avx LABEL PROC
DB 196,195,105,33,211,48 ; vinsertps $0x30,%xmm11,%xmm2,%xmm2
DB 196,227,109,24,211,1 ; vinsertf128 $0x1,%xmm3,%ymm2,%ymm2
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,29,199,34,2,0 ; vbroadcastss 0x222c7(%rip),%ymm3 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,226,125,24,29,3,34,2,0 ; vbroadcastss 0x22203(%rip),%ymm3 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 197,252,16,52,36 ; vmovups (%rsp),%ymm6
DB 197,252,16,124,36,32 ; vmovups 0x20(%rsp),%ymm7
DB 72,131,196,88 ; add $0x58,%rsp
@@ -9497,7 +9497,7 @@ _sk_load_tables_rgb_u16_be_avx LABEL PROC
PUBLIC _sk_byte_tables_avx
_sk_byte_tables_avx LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,98,125,24,5,168,33,2,0 ; vbroadcastss 0x221a8(%rip),%ymm8 # 2c110 <_sk_overlay_sse2_8bit+0x49b>
+ DB 196,98,125,24,5,228,32,2,0 ; vbroadcastss 0x220e4(%rip),%ymm8 # 2c04c <_sk_overlay_sse2_8bit+0x49c>
DB 196,193,124,89,192 ; vmulps %ymm8,%ymm0,%ymm0
DB 197,125,91,200 ; vcvtps2dq %ymm0,%ymm9
DB 196,65,249,126,200 ; vmovq %xmm9,%r8
@@ -9616,7 +9616,7 @@ _sk_byte_tables_avx LABEL PROC
DB 196,194,121,49,204 ; vpmovzxbd %xmm12,%xmm1
DB 196,194,121,49,213 ; vpmovzxbd %xmm13,%xmm2
DB 196,227,117,24,202,1 ; vinsertf128 $0x1,%xmm2,%ymm1,%ymm1
- DB 196,98,125,24,13,150,31,2,0 ; vbroadcastss 0x21f96(%rip),%ymm9 # 2c158 <_sk_overlay_sse2_8bit+0x4e3>
+ DB 196,98,125,24,13,210,30,2,0 ; vbroadcastss 0x21ed2(%rip),%ymm9 # 2c094 <_sk_overlay_sse2_8bit+0x4e4>
DB 196,193,124,89,193 ; vmulps %ymm9,%ymm0,%ymm0
DB 197,252,91,201 ; vcvtdq2ps %ymm1,%ymm1
DB 196,193,116,89,201 ; vmulps %ymm9,%ymm1,%ymm1
@@ -9730,7 +9730,7 @@ _sk_byte_tables_rgb_avx LABEL PROC
DB 196,194,121,49,203 ; vpmovzxbd %xmm11,%xmm1
DB 196,227,125,24,193,1 ; vinsertf128 $0x1,%xmm1,%ymm0,%ymm0
DB 197,252,91,192 ; vcvtdq2ps %ymm0,%ymm0
- DB 196,98,125,24,13,115,29,2,0 ; vbroadcastss 0x21d73(%rip),%ymm9 # 2c158 <_sk_overlay_sse2_8bit+0x4e3>
+ DB 196,98,125,24,13,175,28,2,0 ; vbroadcastss 0x21caf(%rip),%ymm9 # 2c094 <_sk_overlay_sse2_8bit+0x4e4>
DB 196,193,124,89,193 ; vmulps %ymm9,%ymm0,%ymm0
DB 196,194,121,49,202 ; vpmovzxbd %xmm10,%xmm1
DB 196,194,121,49,212 ; vpmovzxbd %xmm12,%xmm2
@@ -9957,36 +9957,36 @@ _sk_parametric_r_avx LABEL PROC
DB 196,193,124,88,195 ; vaddps %ymm11,%ymm0,%ymm0
DB 196,98,125,24,16 ; vbroadcastss (%rax),%ymm10
DB 197,124,91,216 ; vcvtdq2ps %ymm0,%ymm11
- DB 196,98,125,24,37,4,26,2,0 ; vbroadcastss 0x21a04(%rip),%ymm12 # 2c178 <_sk_overlay_sse2_8bit+0x503>
+ DB 196,98,125,24,37,64,25,2,0 ; vbroadcastss 0x21940(%rip),%ymm12 # 2c0b4 <_sk_overlay_sse2_8bit+0x504>
DB 196,65,36,89,220 ; vmulps %ymm12,%ymm11,%ymm11
- DB 196,98,125,24,37,250,25,2,0 ; vbroadcastss 0x219fa(%rip),%ymm12 # 2c17c <_sk_overlay_sse2_8bit+0x507>
+ DB 196,98,125,24,37,54,25,2,0 ; vbroadcastss 0x21936(%rip),%ymm12 # 2c0b8 <_sk_overlay_sse2_8bit+0x508>
DB 196,193,124,84,196 ; vandps %ymm12,%ymm0,%ymm0
- DB 196,98,125,24,37,80,25,2,0 ; vbroadcastss 0x21950(%rip),%ymm12 # 2c0e0 <_sk_overlay_sse2_8bit+0x46b>
+ DB 196,98,125,24,37,140,24,2,0 ; vbroadcastss 0x2188c(%rip),%ymm12 # 2c01c <_sk_overlay_sse2_8bit+0x46c>
DB 196,193,124,86,196 ; vorps %ymm12,%ymm0,%ymm0
- DB 196,98,125,24,37,226,25,2,0 ; vbroadcastss 0x219e2(%rip),%ymm12 # 2c180 <_sk_overlay_sse2_8bit+0x50b>
+ DB 196,98,125,24,37,30,25,2,0 ; vbroadcastss 0x2191e(%rip),%ymm12 # 2c0bc <_sk_overlay_sse2_8bit+0x50c>
DB 196,65,36,88,220 ; vaddps %ymm12,%ymm11,%ymm11
- DB 196,98,125,24,37,216,25,2,0 ; vbroadcastss 0x219d8(%rip),%ymm12 # 2c184 <_sk_overlay_sse2_8bit+0x50f>
+ DB 196,98,125,24,37,20,25,2,0 ; vbroadcastss 0x21914(%rip),%ymm12 # 2c0c0 <_sk_overlay_sse2_8bit+0x510>
DB 196,65,124,89,228 ; vmulps %ymm12,%ymm0,%ymm12
DB 196,65,36,92,220 ; vsubps %ymm12,%ymm11,%ymm11
- DB 196,98,125,24,37,201,25,2,0 ; vbroadcastss 0x219c9(%rip),%ymm12 # 2c188 <_sk_overlay_sse2_8bit+0x513>
+ DB 196,98,125,24,37,5,25,2,0 ; vbroadcastss 0x21905(%rip),%ymm12 # 2c0c4 <_sk_overlay_sse2_8bit+0x514>
DB 196,193,124,88,196 ; vaddps %ymm12,%ymm0,%ymm0
- DB 196,98,125,24,37,191,25,2,0 ; vbroadcastss 0x219bf(%rip),%ymm12 # 2c18c <_sk_overlay_sse2_8bit+0x517>
+ DB 196,98,125,24,37,251,24,2,0 ; vbroadcastss 0x218fb(%rip),%ymm12 # 2c0c8 <_sk_overlay_sse2_8bit+0x518>
DB 197,156,94,192 ; vdivps %ymm0,%ymm12,%ymm0
DB 197,164,92,192 ; vsubps %ymm0,%ymm11,%ymm0
DB 197,172,89,192 ; vmulps %ymm0,%ymm10,%ymm0
DB 196,99,125,8,208,1 ; vroundps $0x1,%ymm0,%ymm10
DB 196,65,124,92,210 ; vsubps %ymm10,%ymm0,%ymm10
- DB 196,98,125,24,29,163,25,2,0 ; vbroadcastss 0x219a3(%rip),%ymm11 # 2c190 <_sk_overlay_sse2_8bit+0x51b>
+ DB 196,98,125,24,29,223,24,2,0 ; vbroadcastss 0x218df(%rip),%ymm11 # 2c0cc <_sk_overlay_sse2_8bit+0x51c>
DB 196,193,124,88,195 ; vaddps %ymm11,%ymm0,%ymm0
- DB 196,98,125,24,29,153,25,2,0 ; vbroadcastss 0x21999(%rip),%ymm11 # 2c194 <_sk_overlay_sse2_8bit+0x51f>
+ DB 196,98,125,24,29,213,24,2,0 ; vbroadcastss 0x218d5(%rip),%ymm11 # 2c0d0 <_sk_overlay_sse2_8bit+0x520>
DB 196,65,44,89,219 ; vmulps %ymm11,%ymm10,%ymm11
DB 196,193,124,92,195 ; vsubps %ymm11,%ymm0,%ymm0
- DB 196,98,125,24,29,138,25,2,0 ; vbroadcastss 0x2198a(%rip),%ymm11 # 2c198 <_sk_overlay_sse2_8bit+0x523>
+ DB 196,98,125,24,29,198,24,2,0 ; vbroadcastss 0x218c6(%rip),%ymm11 # 2c0d4 <_sk_overlay_sse2_8bit+0x524>
DB 196,65,36,92,210 ; vsubps %ymm10,%ymm11,%ymm10
- DB 196,98,125,24,29,128,25,2,0 ; vbroadcastss 0x21980(%rip),%ymm11 # 2c19c <_sk_overlay_sse2_8bit+0x527>
+ DB 196,98,125,24,29,188,24,2,0 ; vbroadcastss 0x218bc(%rip),%ymm11 # 2c0d8 <_sk_overlay_sse2_8bit+0x528>
DB 196,65,36,94,210 ; vdivps %ymm10,%ymm11,%ymm10
DB 196,193,124,88,194 ; vaddps %ymm10,%ymm0,%ymm0
- DB 196,98,125,24,21,113,25,2,0 ; vbroadcastss 0x21971(%rip),%ymm10 # 2c1a0 <_sk_overlay_sse2_8bit+0x52b>
+ DB 196,98,125,24,21,173,24,2,0 ; vbroadcastss 0x218ad(%rip),%ymm10 # 2c0dc <_sk_overlay_sse2_8bit+0x52c>
DB 196,193,124,89,194 ; vmulps %ymm10,%ymm0,%ymm0
DB 197,253,91,192 ; vcvtps2dq %ymm0,%ymm0
DB 196,98,125,24,80,20 ; vbroadcastss 0x14(%rax),%ymm10
@@ -9994,7 +9994,7 @@ _sk_parametric_r_avx LABEL PROC
DB 196,195,125,74,193,128 ; vblendvps %ymm8,%ymm9,%ymm0,%ymm0
DB 196,65,60,87,192 ; vxorps %ymm8,%ymm8,%ymm8
DB 196,193,124,95,192 ; vmaxps %ymm8,%ymm0,%ymm0
- DB 196,98,125,24,5,136,24,2,0 ; vbroadcastss 0x21888(%rip),%ymm8 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,98,125,24,5,196,23,2,0 ; vbroadcastss 0x217c4(%rip),%ymm8 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 196,193,124,93,192 ; vminps %ymm8,%ymm0,%ymm0
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
@@ -10014,36 +10014,36 @@ _sk_parametric_g_avx LABEL PROC
DB 196,193,116,88,203 ; vaddps %ymm11,%ymm1,%ymm1
DB 196,98,125,24,16 ; vbroadcastss (%rax),%ymm10
DB 197,124,91,217 ; vcvtdq2ps %ymm1,%ymm11
- DB 196,98,125,24,37,201,24,2,0 ; vbroadcastss 0x218c9(%rip),%ymm12 # 2c178 <_sk_overlay_sse2_8bit+0x503>
+ DB 196,98,125,24,37,5,24,2,0 ; vbroadcastss 0x21805(%rip),%ymm12 # 2c0b4 <_sk_overlay_sse2_8bit+0x504>
DB 196,65,36,89,220 ; vmulps %ymm12,%ymm11,%ymm11
- DB 196,98,125,24,37,191,24,2,0 ; vbroadcastss 0x218bf(%rip),%ymm12 # 2c17c <_sk_overlay_sse2_8bit+0x507>
+ DB 196,98,125,24,37,251,23,2,0 ; vbroadcastss 0x217fb(%rip),%ymm12 # 2c0b8 <_sk_overlay_sse2_8bit+0x508>
DB 196,193,116,84,204 ; vandps %ymm12,%ymm1,%ymm1
- DB 196,98,125,24,37,21,24,2,0 ; vbroadcastss 0x21815(%rip),%ymm12 # 2c0e0 <_sk_overlay_sse2_8bit+0x46b>
+ DB 196,98,125,24,37,81,23,2,0 ; vbroadcastss 0x21751(%rip),%ymm12 # 2c01c <_sk_overlay_sse2_8bit+0x46c>
DB 196,193,116,86,204 ; vorps %ymm12,%ymm1,%ymm1
- DB 196,98,125,24,37,167,24,2,0 ; vbroadcastss 0x218a7(%rip),%ymm12 # 2c180 <_sk_overlay_sse2_8bit+0x50b>
+ DB 196,98,125,24,37,227,23,2,0 ; vbroadcastss 0x217e3(%rip),%ymm12 # 2c0bc <_sk_overlay_sse2_8bit+0x50c>
DB 196,65,36,88,220 ; vaddps %ymm12,%ymm11,%ymm11
- DB 196,98,125,24,37,157,24,2,0 ; vbroadcastss 0x2189d(%rip),%ymm12 # 2c184 <_sk_overlay_sse2_8bit+0x50f>
+ DB 196,98,125,24,37,217,23,2,0 ; vbroadcastss 0x217d9(%rip),%ymm12 # 2c0c0 <_sk_overlay_sse2_8bit+0x510>
DB 196,65,116,89,228 ; vmulps %ymm12,%ymm1,%ymm12
DB 196,65,36,92,220 ; vsubps %ymm12,%ymm11,%ymm11
- DB 196,98,125,24,37,142,24,2,0 ; vbroadcastss 0x2188e(%rip),%ymm12 # 2c188 <_sk_overlay_sse2_8bit+0x513>
+ DB 196,98,125,24,37,202,23,2,0 ; vbroadcastss 0x217ca(%rip),%ymm12 # 2c0c4 <_sk_overlay_sse2_8bit+0x514>
DB 196,193,116,88,204 ; vaddps %ymm12,%ymm1,%ymm1
- DB 196,98,125,24,37,132,24,2,0 ; vbroadcastss 0x21884(%rip),%ymm12 # 2c18c <_sk_overlay_sse2_8bit+0x517>
+ DB 196,98,125,24,37,192,23,2,0 ; vbroadcastss 0x217c0(%rip),%ymm12 # 2c0c8 <_sk_overlay_sse2_8bit+0x518>
DB 197,156,94,201 ; vdivps %ymm1,%ymm12,%ymm1
DB 197,164,92,201 ; vsubps %ymm1,%ymm11,%ymm1
DB 197,172,89,201 ; vmulps %ymm1,%ymm10,%ymm1
DB 196,99,125,8,209,1 ; vroundps $0x1,%ymm1,%ymm10
DB 196,65,116,92,210 ; vsubps %ymm10,%ymm1,%ymm10
- DB 196,98,125,24,29,104,24,2,0 ; vbroadcastss 0x21868(%rip),%ymm11 # 2c190 <_sk_overlay_sse2_8bit+0x51b>
+ DB 196,98,125,24,29,164,23,2,0 ; vbroadcastss 0x217a4(%rip),%ymm11 # 2c0cc <_sk_overlay_sse2_8bit+0x51c>
DB 196,193,116,88,203 ; vaddps %ymm11,%ymm1,%ymm1
- DB 196,98,125,24,29,94,24,2,0 ; vbroadcastss 0x2185e(%rip),%ymm11 # 2c194 <_sk_overlay_sse2_8bit+0x51f>
+ DB 196,98,125,24,29,154,23,2,0 ; vbroadcastss 0x2179a(%rip),%ymm11 # 2c0d0 <_sk_overlay_sse2_8bit+0x520>
DB 196,65,44,89,219 ; vmulps %ymm11,%ymm10,%ymm11
DB 196,193,116,92,203 ; vsubps %ymm11,%ymm1,%ymm1
- DB 196,98,125,24,29,79,24,2,0 ; vbroadcastss 0x2184f(%rip),%ymm11 # 2c198 <_sk_overlay_sse2_8bit+0x523>
+ DB 196,98,125,24,29,139,23,2,0 ; vbroadcastss 0x2178b(%rip),%ymm11 # 2c0d4 <_sk_overlay_sse2_8bit+0x524>
DB 196,65,36,92,210 ; vsubps %ymm10,%ymm11,%ymm10
- DB 196,98,125,24,29,69,24,2,0 ; vbroadcastss 0x21845(%rip),%ymm11 # 2c19c <_sk_overlay_sse2_8bit+0x527>
+ DB 196,98,125,24,29,129,23,2,0 ; vbroadcastss 0x21781(%rip),%ymm11 # 2c0d8 <_sk_overlay_sse2_8bit+0x528>
DB 196,65,36,94,210 ; vdivps %ymm10,%ymm11,%ymm10
DB 196,193,116,88,202 ; vaddps %ymm10,%ymm1,%ymm1
- DB 196,98,125,24,21,54,24,2,0 ; vbroadcastss 0x21836(%rip),%ymm10 # 2c1a0 <_sk_overlay_sse2_8bit+0x52b>
+ DB 196,98,125,24,21,114,23,2,0 ; vbroadcastss 0x21772(%rip),%ymm10 # 2c0dc <_sk_overlay_sse2_8bit+0x52c>
DB 196,193,116,89,202 ; vmulps %ymm10,%ymm1,%ymm1
DB 197,253,91,201 ; vcvtps2dq %ymm1,%ymm1
DB 196,98,125,24,80,20 ; vbroadcastss 0x14(%rax),%ymm10
@@ -10051,7 +10051,7 @@ _sk_parametric_g_avx LABEL PROC
DB 196,195,117,74,201,128 ; vblendvps %ymm8,%ymm9,%ymm1,%ymm1
DB 196,65,60,87,192 ; vxorps %ymm8,%ymm8,%ymm8
DB 196,193,116,95,200 ; vmaxps %ymm8,%ymm1,%ymm1
- DB 196,98,125,24,5,77,23,2,0 ; vbroadcastss 0x2174d(%rip),%ymm8 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,98,125,24,5,137,22,2,0 ; vbroadcastss 0x21689(%rip),%ymm8 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 196,193,116,93,200 ; vminps %ymm8,%ymm1,%ymm1
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
@@ -10071,36 +10071,36 @@ _sk_parametric_b_avx LABEL PROC
DB 196,193,108,88,211 ; vaddps %ymm11,%ymm2,%ymm2
DB 196,98,125,24,16 ; vbroadcastss (%rax),%ymm10
DB 197,124,91,218 ; vcvtdq2ps %ymm2,%ymm11
- DB 196,98,125,24,37,142,23,2,0 ; vbroadcastss 0x2178e(%rip),%ymm12 # 2c178 <_sk_overlay_sse2_8bit+0x503>
+ DB 196,98,125,24,37,202,22,2,0 ; vbroadcastss 0x216ca(%rip),%ymm12 # 2c0b4 <_sk_overlay_sse2_8bit+0x504>
DB 196,65,36,89,220 ; vmulps %ymm12,%ymm11,%ymm11
- DB 196,98,125,24,37,132,23,2,0 ; vbroadcastss 0x21784(%rip),%ymm12 # 2c17c <_sk_overlay_sse2_8bit+0x507>
+ DB 196,98,125,24,37,192,22,2,0 ; vbroadcastss 0x216c0(%rip),%ymm12 # 2c0b8 <_sk_overlay_sse2_8bit+0x508>
DB 196,193,108,84,212 ; vandps %ymm12,%ymm2,%ymm2
- DB 196,98,125,24,37,218,22,2,0 ; vbroadcastss 0x216da(%rip),%ymm12 # 2c0e0 <_sk_overlay_sse2_8bit+0x46b>
+ DB 196,98,125,24,37,22,22,2,0 ; vbroadcastss 0x21616(%rip),%ymm12 # 2c01c <_sk_overlay_sse2_8bit+0x46c>
DB 196,193,108,86,212 ; vorps %ymm12,%ymm2,%ymm2
- DB 196,98,125,24,37,108,23,2,0 ; vbroadcastss 0x2176c(%rip),%ymm12 # 2c180 <_sk_overlay_sse2_8bit+0x50b>
+ DB 196,98,125,24,37,168,22,2,0 ; vbroadcastss 0x216a8(%rip),%ymm12 # 2c0bc <_sk_overlay_sse2_8bit+0x50c>
DB 196,65,36,88,220 ; vaddps %ymm12,%ymm11,%ymm11
- DB 196,98,125,24,37,98,23,2,0 ; vbroadcastss 0x21762(%rip),%ymm12 # 2c184 <_sk_overlay_sse2_8bit+0x50f>
+ DB 196,98,125,24,37,158,22,2,0 ; vbroadcastss 0x2169e(%rip),%ymm12 # 2c0c0 <_sk_overlay_sse2_8bit+0x510>
DB 196,65,108,89,228 ; vmulps %ymm12,%ymm2,%ymm12
DB 196,65,36,92,220 ; vsubps %ymm12,%ymm11,%ymm11
- DB 196,98,125,24,37,83,23,2,0 ; vbroadcastss 0x21753(%rip),%ymm12 # 2c188 <_sk_overlay_sse2_8bit+0x513>
+ DB 196,98,125,24,37,143,22,2,0 ; vbroadcastss 0x2168f(%rip),%ymm12 # 2c0c4 <_sk_overlay_sse2_8bit+0x514>
DB 196,193,108,88,212 ; vaddps %ymm12,%ymm2,%ymm2
- DB 196,98,125,24,37,73,23,2,0 ; vbroadcastss 0x21749(%rip),%ymm12 # 2c18c <_sk_overlay_sse2_8bit+0x517>
+ DB 196,98,125,24,37,133,22,2,0 ; vbroadcastss 0x21685(%rip),%ymm12 # 2c0c8 <_sk_overlay_sse2_8bit+0x518>
DB 197,156,94,210 ; vdivps %ymm2,%ymm12,%ymm2
DB 197,164,92,210 ; vsubps %ymm2,%ymm11,%ymm2
DB 197,172,89,210 ; vmulps %ymm2,%ymm10,%ymm2
DB 196,99,125,8,210,1 ; vroundps $0x1,%ymm2,%ymm10
DB 196,65,108,92,210 ; vsubps %ymm10,%ymm2,%ymm10
- DB 196,98,125,24,29,45,23,2,0 ; vbroadcastss 0x2172d(%rip),%ymm11 # 2c190 <_sk_overlay_sse2_8bit+0x51b>
+ DB 196,98,125,24,29,105,22,2,0 ; vbroadcastss 0x21669(%rip),%ymm11 # 2c0cc <_sk_overlay_sse2_8bit+0x51c>
DB 196,193,108,88,211 ; vaddps %ymm11,%ymm2,%ymm2
- DB 196,98,125,24,29,35,23,2,0 ; vbroadcastss 0x21723(%rip),%ymm11 # 2c194 <_sk_overlay_sse2_8bit+0x51f>
+ DB 196,98,125,24,29,95,22,2,0 ; vbroadcastss 0x2165f(%rip),%ymm11 # 2c0d0 <_sk_overlay_sse2_8bit+0x520>
DB 196,65,44,89,219 ; vmulps %ymm11,%ymm10,%ymm11
DB 196,193,108,92,211 ; vsubps %ymm11,%ymm2,%ymm2
- DB 196,98,125,24,29,20,23,2,0 ; vbroadcastss 0x21714(%rip),%ymm11 # 2c198 <_sk_overlay_sse2_8bit+0x523>
+ DB 196,98,125,24,29,80,22,2,0 ; vbroadcastss 0x21650(%rip),%ymm11 # 2c0d4 <_sk_overlay_sse2_8bit+0x524>
DB 196,65,36,92,210 ; vsubps %ymm10,%ymm11,%ymm10
- DB 196,98,125,24,29,10,23,2,0 ; vbroadcastss 0x2170a(%rip),%ymm11 # 2c19c <_sk_overlay_sse2_8bit+0x527>
+ DB 196,98,125,24,29,70,22,2,0 ; vbroadcastss 0x21646(%rip),%ymm11 # 2c0d8 <_sk_overlay_sse2_8bit+0x528>
DB 196,65,36,94,210 ; vdivps %ymm10,%ymm11,%ymm10
DB 196,193,108,88,210 ; vaddps %ymm10,%ymm2,%ymm2
- DB 196,98,125,24,21,251,22,2,0 ; vbroadcastss 0x216fb(%rip),%ymm10 # 2c1a0 <_sk_overlay_sse2_8bit+0x52b>
+ DB 196,98,125,24,21,55,22,2,0 ; vbroadcastss 0x21637(%rip),%ymm10 # 2c0dc <_sk_overlay_sse2_8bit+0x52c>
DB 196,193,108,89,210 ; vmulps %ymm10,%ymm2,%ymm2
DB 197,253,91,210 ; vcvtps2dq %ymm2,%ymm2
DB 196,98,125,24,80,20 ; vbroadcastss 0x14(%rax),%ymm10
@@ -10108,7 +10108,7 @@ _sk_parametric_b_avx LABEL PROC
DB 196,195,109,74,209,128 ; vblendvps %ymm8,%ymm9,%ymm2,%ymm2
DB 196,65,60,87,192 ; vxorps %ymm8,%ymm8,%ymm8
DB 196,193,108,95,208 ; vmaxps %ymm8,%ymm2,%ymm2
- DB 196,98,125,24,5,18,22,2,0 ; vbroadcastss 0x21612(%rip),%ymm8 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,98,125,24,5,78,21,2,0 ; vbroadcastss 0x2154e(%rip),%ymm8 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 196,193,108,93,208 ; vminps %ymm8,%ymm2,%ymm2
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
@@ -10128,36 +10128,36 @@ _sk_parametric_a_avx LABEL PROC
DB 196,193,100,88,219 ; vaddps %ymm11,%ymm3,%ymm3
DB 196,98,125,24,16 ; vbroadcastss (%rax),%ymm10
DB 197,124,91,219 ; vcvtdq2ps %ymm3,%ymm11
- DB 196,98,125,24,37,83,22,2,0 ; vbroadcastss 0x21653(%rip),%ymm12 # 2c178 <_sk_overlay_sse2_8bit+0x503>
+ DB 196,98,125,24,37,143,21,2,0 ; vbroadcastss 0x2158f(%rip),%ymm12 # 2c0b4 <_sk_overlay_sse2_8bit+0x504>
DB 196,65,36,89,220 ; vmulps %ymm12,%ymm11,%ymm11
- DB 196,98,125,24,37,73,22,2,0 ; vbroadcastss 0x21649(%rip),%ymm12 # 2c17c <_sk_overlay_sse2_8bit+0x507>
+ DB 196,98,125,24,37,133,21,2,0 ; vbroadcastss 0x21585(%rip),%ymm12 # 2c0b8 <_sk_overlay_sse2_8bit+0x508>
DB 196,193,100,84,220 ; vandps %ymm12,%ymm3,%ymm3
- DB 196,98,125,24,37,159,21,2,0 ; vbroadcastss 0x2159f(%rip),%ymm12 # 2c0e0 <_sk_overlay_sse2_8bit+0x46b>
+ DB 196,98,125,24,37,219,20,2,0 ; vbroadcastss 0x214db(%rip),%ymm12 # 2c01c <_sk_overlay_sse2_8bit+0x46c>
DB 196,193,100,86,220 ; vorps %ymm12,%ymm3,%ymm3
- DB 196,98,125,24,37,49,22,2,0 ; vbroadcastss 0x21631(%rip),%ymm12 # 2c180 <_sk_overlay_sse2_8bit+0x50b>
+ DB 196,98,125,24,37,109,21,2,0 ; vbroadcastss 0x2156d(%rip),%ymm12 # 2c0bc <_sk_overlay_sse2_8bit+0x50c>
DB 196,65,36,88,220 ; vaddps %ymm12,%ymm11,%ymm11
- DB 196,98,125,24,37,39,22,2,0 ; vbroadcastss 0x21627(%rip),%ymm12 # 2c184 <_sk_overlay_sse2_8bit+0x50f>
+ DB 196,98,125,24,37,99,21,2,0 ; vbroadcastss 0x21563(%rip),%ymm12 # 2c0c0 <_sk_overlay_sse2_8bit+0x510>
DB 196,65,100,89,228 ; vmulps %ymm12,%ymm3,%ymm12
DB 196,65,36,92,220 ; vsubps %ymm12,%ymm11,%ymm11
- DB 196,98,125,24,37,24,22,2,0 ; vbroadcastss 0x21618(%rip),%ymm12 # 2c188 <_sk_overlay_sse2_8bit+0x513>
+ DB 196,98,125,24,37,84,21,2,0 ; vbroadcastss 0x21554(%rip),%ymm12 # 2c0c4 <_sk_overlay_sse2_8bit+0x514>
DB 196,193,100,88,220 ; vaddps %ymm12,%ymm3,%ymm3
- DB 196,98,125,24,37,14,22,2,0 ; vbroadcastss 0x2160e(%rip),%ymm12 # 2c18c <_sk_overlay_sse2_8bit+0x517>
+ DB 196,98,125,24,37,74,21,2,0 ; vbroadcastss 0x2154a(%rip),%ymm12 # 2c0c8 <_sk_overlay_sse2_8bit+0x518>
DB 197,156,94,219 ; vdivps %ymm3,%ymm12,%ymm3
DB 197,164,92,219 ; vsubps %ymm3,%ymm11,%ymm3
DB 197,172,89,219 ; vmulps %ymm3,%ymm10,%ymm3
DB 196,99,125,8,211,1 ; vroundps $0x1,%ymm3,%ymm10
DB 196,65,100,92,210 ; vsubps %ymm10,%ymm3,%ymm10
- DB 196,98,125,24,29,242,21,2,0 ; vbroadcastss 0x215f2(%rip),%ymm11 # 2c190 <_sk_overlay_sse2_8bit+0x51b>
+ DB 196,98,125,24,29,46,21,2,0 ; vbroadcastss 0x2152e(%rip),%ymm11 # 2c0cc <_sk_overlay_sse2_8bit+0x51c>
DB 196,193,100,88,219 ; vaddps %ymm11,%ymm3,%ymm3
- DB 196,98,125,24,29,232,21,2,0 ; vbroadcastss 0x215e8(%rip),%ymm11 # 2c194 <_sk_overlay_sse2_8bit+0x51f>
+ DB 196,98,125,24,29,36,21,2,0 ; vbroadcastss 0x21524(%rip),%ymm11 # 2c0d0 <_sk_overlay_sse2_8bit+0x520>
DB 196,65,44,89,219 ; vmulps %ymm11,%ymm10,%ymm11
DB 196,193,100,92,219 ; vsubps %ymm11,%ymm3,%ymm3
- DB 196,98,125,24,29,217,21,2,0 ; vbroadcastss 0x215d9(%rip),%ymm11 # 2c198 <_sk_overlay_sse2_8bit+0x523>
+ DB 196,98,125,24,29,21,21,2,0 ; vbroadcastss 0x21515(%rip),%ymm11 # 2c0d4 <_sk_overlay_sse2_8bit+0x524>
DB 196,65,36,92,210 ; vsubps %ymm10,%ymm11,%ymm10
- DB 196,98,125,24,29,207,21,2,0 ; vbroadcastss 0x215cf(%rip),%ymm11 # 2c19c <_sk_overlay_sse2_8bit+0x527>
+ DB 196,98,125,24,29,11,21,2,0 ; vbroadcastss 0x2150b(%rip),%ymm11 # 2c0d8 <_sk_overlay_sse2_8bit+0x528>
DB 196,65,36,94,210 ; vdivps %ymm10,%ymm11,%ymm10
DB 196,193,100,88,218 ; vaddps %ymm10,%ymm3,%ymm3
- DB 196,98,125,24,21,192,21,2,0 ; vbroadcastss 0x215c0(%rip),%ymm10 # 2c1a0 <_sk_overlay_sse2_8bit+0x52b>
+ DB 196,98,125,24,21,252,20,2,0 ; vbroadcastss 0x214fc(%rip),%ymm10 # 2c0dc <_sk_overlay_sse2_8bit+0x52c>
DB 196,193,100,89,218 ; vmulps %ymm10,%ymm3,%ymm3
DB 197,253,91,219 ; vcvtps2dq %ymm3,%ymm3
DB 196,98,125,24,80,20 ; vbroadcastss 0x14(%rax),%ymm10
@@ -10165,7 +10165,7 @@ _sk_parametric_a_avx LABEL PROC
DB 196,195,101,74,217,128 ; vblendvps %ymm8,%ymm9,%ymm3,%ymm3
DB 196,65,60,87,192 ; vxorps %ymm8,%ymm8,%ymm8
DB 196,193,100,95,216 ; vmaxps %ymm8,%ymm3,%ymm3
- DB 196,98,125,24,5,215,20,2,0 ; vbroadcastss 0x214d7(%rip),%ymm8 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,98,125,24,5,19,20,2,0 ; vbroadcastss 0x21413(%rip),%ymm8 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 196,193,100,93,216 ; vminps %ymm8,%ymm3,%ymm3
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
@@ -10182,34 +10182,34 @@ _sk_gamma_avx LABEL PROC
DB 197,252,40,233 ; vmovaps %ymm1,%ymm5
DB 72,173 ; lods %ds:(%rsi),%rax
DB 197,252,91,200 ; vcvtdq2ps %ymm0,%ymm1
- DB 196,98,125,24,5,32,21,2,0 ; vbroadcastss 0x21520(%rip),%ymm8 # 2c178 <_sk_overlay_sse2_8bit+0x503>
+ DB 196,98,125,24,5,92,20,2,0 ; vbroadcastss 0x2145c(%rip),%ymm8 # 2c0b4 <_sk_overlay_sse2_8bit+0x504>
DB 196,193,116,89,200 ; vmulps %ymm8,%ymm1,%ymm1
- DB 196,98,125,24,13,22,21,2,0 ; vbroadcastss 0x21516(%rip),%ymm9 # 2c17c <_sk_overlay_sse2_8bit+0x507>
+ DB 196,98,125,24,13,82,20,2,0 ; vbroadcastss 0x21452(%rip),%ymm9 # 2c0b8 <_sk_overlay_sse2_8bit+0x508>
DB 196,193,124,84,193 ; vandps %ymm9,%ymm0,%ymm0
- DB 196,226,125,24,37,108,20,2,0 ; vbroadcastss 0x2146c(%rip),%ymm4 # 2c0e0 <_sk_overlay_sse2_8bit+0x46b>
+ DB 196,226,125,24,37,168,19,2,0 ; vbroadcastss 0x213a8(%rip),%ymm4 # 2c01c <_sk_overlay_sse2_8bit+0x46c>
DB 197,252,86,196 ; vorps %ymm4,%ymm0,%ymm0
- DB 196,98,125,24,21,255,20,2,0 ; vbroadcastss 0x214ff(%rip),%ymm10 # 2c180 <_sk_overlay_sse2_8bit+0x50b>
+ DB 196,98,125,24,21,59,20,2,0 ; vbroadcastss 0x2143b(%rip),%ymm10 # 2c0bc <_sk_overlay_sse2_8bit+0x50c>
DB 196,193,116,88,202 ; vaddps %ymm10,%ymm1,%ymm1
- DB 196,98,125,24,29,245,20,2,0 ; vbroadcastss 0x214f5(%rip),%ymm11 # 2c184 <_sk_overlay_sse2_8bit+0x50f>
+ DB 196,98,125,24,29,49,20,2,0 ; vbroadcastss 0x21431(%rip),%ymm11 # 2c0c0 <_sk_overlay_sse2_8bit+0x510>
DB 196,193,124,89,211 ; vmulps %ymm11,%ymm0,%ymm2
DB 197,244,92,202 ; vsubps %ymm2,%ymm1,%ymm1
- DB 196,98,125,24,37,231,20,2,0 ; vbroadcastss 0x214e7(%rip),%ymm12 # 2c188 <_sk_overlay_sse2_8bit+0x513>
+ DB 196,98,125,24,37,35,20,2,0 ; vbroadcastss 0x21423(%rip),%ymm12 # 2c0c4 <_sk_overlay_sse2_8bit+0x514>
DB 196,193,124,88,196 ; vaddps %ymm12,%ymm0,%ymm0
- DB 196,98,125,24,45,221,20,2,0 ; vbroadcastss 0x214dd(%rip),%ymm13 # 2c18c <_sk_overlay_sse2_8bit+0x517>
+ DB 196,98,125,24,45,25,20,2,0 ; vbroadcastss 0x21419(%rip),%ymm13 # 2c0c8 <_sk_overlay_sse2_8bit+0x518>
DB 197,148,94,192 ; vdivps %ymm0,%ymm13,%ymm0
DB 197,244,92,192 ; vsubps %ymm0,%ymm1,%ymm0
DB 196,98,125,24,48 ; vbroadcastss (%rax),%ymm14
DB 196,193,124,89,198 ; vmulps %ymm14,%ymm0,%ymm0
DB 196,227,125,8,200,1 ; vroundps $0x1,%ymm0,%ymm1
DB 197,252,92,241 ; vsubps %ymm1,%ymm0,%ymm6
- DB 196,98,125,24,61,188,20,2,0 ; vbroadcastss 0x214bc(%rip),%ymm15 # 2c190 <_sk_overlay_sse2_8bit+0x51b>
+ DB 196,98,125,24,61,248,19,2,0 ; vbroadcastss 0x213f8(%rip),%ymm15 # 2c0cc <_sk_overlay_sse2_8bit+0x51c>
DB 196,193,124,88,199 ; vaddps %ymm15,%ymm0,%ymm0
- DB 196,226,125,24,29,178,20,2,0 ; vbroadcastss 0x214b2(%rip),%ymm3 # 2c194 <_sk_overlay_sse2_8bit+0x51f>
+ DB 196,226,125,24,29,238,19,2,0 ; vbroadcastss 0x213ee(%rip),%ymm3 # 2c0d0 <_sk_overlay_sse2_8bit+0x520>
DB 197,204,89,203 ; vmulps %ymm3,%ymm6,%ymm1
DB 197,252,92,201 ; vsubps %ymm1,%ymm0,%ymm1
- DB 196,226,125,24,21,165,20,2,0 ; vbroadcastss 0x214a5(%rip),%ymm2 # 2c198 <_sk_overlay_sse2_8bit+0x523>
+ DB 196,226,125,24,21,225,19,2,0 ; vbroadcastss 0x213e1(%rip),%ymm2 # 2c0d4 <_sk_overlay_sse2_8bit+0x524>
DB 197,236,92,198 ; vsubps %ymm6,%ymm2,%ymm0
- DB 196,226,125,24,53,156,20,2,0 ; vbroadcastss 0x2149c(%rip),%ymm6 # 2c19c <_sk_overlay_sse2_8bit+0x527>
+ DB 196,226,125,24,53,216,19,2,0 ; vbroadcastss 0x213d8(%rip),%ymm6 # 2c0d8 <_sk_overlay_sse2_8bit+0x528>
DB 197,204,94,192 ; vdivps %ymm0,%ymm6,%ymm0
DB 197,244,88,192 ; vaddps %ymm0,%ymm1,%ymm0
DB 197,252,17,4,36 ; vmovups %ymm0,(%rsp)
@@ -10251,7 +10251,7 @@ _sk_gamma_avx LABEL PROC
DB 197,236,92,212 ; vsubps %ymm4,%ymm2,%ymm2
DB 197,204,94,210 ; vdivps %ymm2,%ymm6,%ymm2
DB 197,244,88,202 ; vaddps %ymm2,%ymm1,%ymm1
- DB 196,226,125,24,21,224,19,2,0 ; vbroadcastss 0x213e0(%rip),%ymm2 # 2c1a0 <_sk_overlay_sse2_8bit+0x52b>
+ DB 196,226,125,24,21,28,19,2,0 ; vbroadcastss 0x2131c(%rip),%ymm2 # 2c0dc <_sk_overlay_sse2_8bit+0x52c>
DB 197,236,89,28,36 ; vmulps (%rsp),%ymm2,%ymm3
DB 197,252,89,226 ; vmulps %ymm2,%ymm0,%ymm4
DB 197,244,89,210 ; vmulps %ymm2,%ymm1,%ymm2
@@ -10269,31 +10269,31 @@ _sk_gamma_avx LABEL PROC
PUBLIC _sk_lab_to_xyz_avx
_sk_lab_to_xyz_avx LABEL PROC
- DB 196,98,125,24,5,147,19,2,0 ; vbroadcastss 0x21393(%rip),%ymm8 # 2c1a4 <_sk_overlay_sse2_8bit+0x52f>
+ DB 196,98,125,24,5,207,18,2,0 ; vbroadcastss 0x212cf(%rip),%ymm8 # 2c0e0 <_sk_overlay_sse2_8bit+0x530>
DB 196,193,124,89,192 ; vmulps %ymm8,%ymm0,%ymm0
- DB 196,98,125,24,5,241,18,2,0 ; vbroadcastss 0x212f1(%rip),%ymm8 # 2c110 <_sk_overlay_sse2_8bit+0x49b>
+ DB 196,98,125,24,5,45,18,2,0 ; vbroadcastss 0x2122d(%rip),%ymm8 # 2c04c <_sk_overlay_sse2_8bit+0x49c>
DB 196,193,116,89,200 ; vmulps %ymm8,%ymm1,%ymm1
- DB 196,98,125,24,13,123,19,2,0 ; vbroadcastss 0x2137b(%rip),%ymm9 # 2c1a8 <_sk_overlay_sse2_8bit+0x533>
+ DB 196,98,125,24,13,183,18,2,0 ; vbroadcastss 0x212b7(%rip),%ymm9 # 2c0e4 <_sk_overlay_sse2_8bit+0x534>
DB 196,193,116,88,201 ; vaddps %ymm9,%ymm1,%ymm1
DB 196,193,108,89,208 ; vmulps %ymm8,%ymm2,%ymm2
DB 196,193,108,88,209 ; vaddps %ymm9,%ymm2,%ymm2
- DB 196,98,125,24,5,103,19,2,0 ; vbroadcastss 0x21367(%rip),%ymm8 # 2c1ac <_sk_overlay_sse2_8bit+0x537>
+ DB 196,98,125,24,5,163,18,2,0 ; vbroadcastss 0x212a3(%rip),%ymm8 # 2c0e8 <_sk_overlay_sse2_8bit+0x538>
DB 196,193,124,88,192 ; vaddps %ymm8,%ymm0,%ymm0
- DB 196,98,125,24,5,93,19,2,0 ; vbroadcastss 0x2135d(%rip),%ymm8 # 2c1b0 <_sk_overlay_sse2_8bit+0x53b>
+ DB 196,98,125,24,5,153,18,2,0 ; vbroadcastss 0x21299(%rip),%ymm8 # 2c0ec <_sk_overlay_sse2_8bit+0x53c>
DB 196,193,124,89,192 ; vmulps %ymm8,%ymm0,%ymm0
- DB 196,98,125,24,5,83,19,2,0 ; vbroadcastss 0x21353(%rip),%ymm8 # 2c1b4 <_sk_overlay_sse2_8bit+0x53f>
+ DB 196,98,125,24,5,143,18,2,0 ; vbroadcastss 0x2128f(%rip),%ymm8 # 2c0f0 <_sk_overlay_sse2_8bit+0x540>
DB 196,193,116,89,200 ; vmulps %ymm8,%ymm1,%ymm1
DB 197,252,88,201 ; vaddps %ymm1,%ymm0,%ymm1
- DB 196,98,125,24,5,69,19,2,0 ; vbroadcastss 0x21345(%rip),%ymm8 # 2c1b8 <_sk_overlay_sse2_8bit+0x543>
+ DB 196,98,125,24,5,129,18,2,0 ; vbroadcastss 0x21281(%rip),%ymm8 # 2c0f4 <_sk_overlay_sse2_8bit+0x544>
DB 196,193,108,89,208 ; vmulps %ymm8,%ymm2,%ymm2
DB 197,252,92,210 ; vsubps %ymm2,%ymm0,%ymm2
DB 197,116,89,193 ; vmulps %ymm1,%ymm1,%ymm8
DB 196,65,116,89,192 ; vmulps %ymm8,%ymm1,%ymm8
- DB 196,98,125,24,13,46,19,2,0 ; vbroadcastss 0x2132e(%rip),%ymm9 # 2c1bc <_sk_overlay_sse2_8bit+0x547>
+ DB 196,98,125,24,13,106,18,2,0 ; vbroadcastss 0x2126a(%rip),%ymm9 # 2c0f8 <_sk_overlay_sse2_8bit+0x548>
DB 196,65,52,194,208,1 ; vcmpltps %ymm8,%ymm9,%ymm10
- DB 196,98,125,24,29,35,19,2,0 ; vbroadcastss 0x21323(%rip),%ymm11 # 2c1c0 <_sk_overlay_sse2_8bit+0x54b>
+ DB 196,98,125,24,29,95,18,2,0 ; vbroadcastss 0x2125f(%rip),%ymm11 # 2c0fc <_sk_overlay_sse2_8bit+0x54c>
DB 196,193,116,88,203 ; vaddps %ymm11,%ymm1,%ymm1
- DB 196,98,125,24,37,25,19,2,0 ; vbroadcastss 0x21319(%rip),%ymm12 # 2c1c4 <_sk_overlay_sse2_8bit+0x54f>
+ DB 196,98,125,24,37,85,18,2,0 ; vbroadcastss 0x21255(%rip),%ymm12 # 2c100 <_sk_overlay_sse2_8bit+0x550>
DB 196,193,116,89,204 ; vmulps %ymm12,%ymm1,%ymm1
DB 196,67,117,74,192,160 ; vblendvps %ymm10,%ymm8,%ymm1,%ymm8
DB 197,252,89,200 ; vmulps %ymm0,%ymm0,%ymm1
@@ -10308,9 +10308,9 @@ _sk_lab_to_xyz_avx LABEL PROC
DB 196,193,108,88,211 ; vaddps %ymm11,%ymm2,%ymm2
DB 196,193,108,89,212 ; vmulps %ymm12,%ymm2,%ymm2
DB 196,227,109,74,208,144 ; vblendvps %ymm9,%ymm0,%ymm2,%ymm2
- DB 196,226,125,24,5,207,18,2,0 ; vbroadcastss 0x212cf(%rip),%ymm0 # 2c1c8 <_sk_overlay_sse2_8bit+0x553>
+ DB 196,226,125,24,5,11,18,2,0 ; vbroadcastss 0x2120b(%rip),%ymm0 # 2c104 <_sk_overlay_sse2_8bit+0x554>
DB 197,188,89,192 ; vmulps %ymm0,%ymm8,%ymm0
- DB 196,98,125,24,5,198,18,2,0 ; vbroadcastss 0x212c6(%rip),%ymm8 # 2c1cc <_sk_overlay_sse2_8bit+0x557>
+ DB 196,98,125,24,5,2,18,2,0 ; vbroadcastss 0x21202(%rip),%ymm8 # 2c108 <_sk_overlay_sse2_8bit+0x558>
DB 196,193,108,89,208 ; vmulps %ymm8,%ymm2,%ymm2
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
@@ -10326,13 +10326,13 @@ _sk_load_a8_avx LABEL PROC
DB 72,133,255 ; test %rdi,%rdi
DB 117,66 ; jne af69 <_sk_load_a8_avx+0x5a>
DB 196,130,121,48,4,24 ; vpmovzxbw (%r8,%r11,1),%xmm0
- DB 197,249,219,5,155,27,2,0 ; vpand 0x21b9b(%rip),%xmm0,%xmm0 # 2cad0 <_sk_overlay_sse2_8bit+0xe5b>
+ DB 197,249,219,5,219,26,2,0 ; vpand 0x21adb(%rip),%xmm0,%xmm0 # 2ca10 <_sk_overlay_sse2_8bit+0xe60>
DB 197,241,239,201 ; vpxor %xmm1,%xmm1,%xmm1
DB 197,249,105,201 ; vpunpckhwd %xmm1,%xmm0,%xmm1
DB 196,226,121,51,192 ; vpmovzxwd %xmm0,%xmm0
DB 196,227,125,24,193,1 ; vinsertf128 $0x1,%xmm1,%ymm0,%ymm0
DB 197,252,91,192 ; vcvtdq2ps %ymm0,%ymm0
- DB 196,226,125,24,13,3,18,2,0 ; vbroadcastss 0x21203(%rip),%ymm1 # 2c158 <_sk_overlay_sse2_8bit+0x4e3>
+ DB 196,226,125,24,13,63,17,2,0 ; vbroadcastss 0x2113f(%rip),%ymm1 # 2c094 <_sk_overlay_sse2_8bit+0x4e4>
DB 197,252,89,217 ; vmulps %ymm1,%ymm0,%ymm3
DB 72,173 ; lods %ds:(%rsi),%rax
DB 197,252,87,192 ; vxorps %ymm0,%ymm0,%ymm0
@@ -10380,7 +10380,7 @@ _sk_load_a8_avx LABEL PROC
DB 255 ; (bad)
DB 255 ; (bad)
DB 255 ; (bad)
- DB 233,255,255,255,222 ; jmpq ffffffffdf00b010 <_sk_overlay_sse2_8bit+0xffffffffdefdf39b>
+ DB 233,255,255,255,222 ; jmpq ffffffffdf00b010 <_sk_overlay_sse2_8bit+0xffffffffdefdf460>
DB 255 ; (bad)
DB 255 ; (bad)
DB 255,211 ; callq *%rbx
@@ -10402,13 +10402,13 @@ _sk_load_a8_dst_avx LABEL PROC
DB 72,133,255 ; test %rdi,%rdi
DB 117,66 ; jne b076 <_sk_load_a8_dst_avx+0x5a>
DB 196,130,121,48,36,24 ; vpmovzxbw (%r8,%r11,1),%xmm4
- DB 197,217,219,37,142,26,2,0 ; vpand 0x21a8e(%rip),%xmm4,%xmm4 # 2cad0 <_sk_overlay_sse2_8bit+0xe5b>
+ DB 197,217,219,37,206,25,2,0 ; vpand 0x219ce(%rip),%xmm4,%xmm4 # 2ca10 <_sk_overlay_sse2_8bit+0xe60>
DB 197,209,239,237 ; vpxor %xmm5,%xmm5,%xmm5
DB 197,217,105,237 ; vpunpckhwd %xmm5,%xmm4,%xmm5
DB 196,226,121,51,228 ; vpmovzxwd %xmm4,%xmm4
DB 196,227,93,24,229,1 ; vinsertf128 $0x1,%xmm5,%ymm4,%ymm4
DB 197,252,91,228 ; vcvtdq2ps %ymm4,%ymm4
- DB 196,226,125,24,45,246,16,2,0 ; vbroadcastss 0x210f6(%rip),%ymm5 # 2c158 <_sk_overlay_sse2_8bit+0x4e3>
+ DB 196,226,125,24,45,50,16,2,0 ; vbroadcastss 0x21032(%rip),%ymm5 # 2c094 <_sk_overlay_sse2_8bit+0x4e4>
DB 197,220,89,253 ; vmulps %ymm5,%ymm4,%ymm7
DB 72,173 ; lods %ds:(%rsi),%rax
DB 197,220,87,228 ; vxorps %ymm4,%ymm4,%ymm4
@@ -10514,7 +10514,7 @@ _sk_gather_a8_avx LABEL PROC
DB 196,226,121,49,201 ; vpmovzxbd %xmm1,%xmm1
DB 196,227,125,24,193,1 ; vinsertf128 $0x1,%xmm1,%ymm0,%ymm0
DB 197,252,91,192 ; vcvtdq2ps %ymm0,%ymm0
- DB 196,226,125,24,13,93,15,2,0 ; vbroadcastss 0x20f5d(%rip),%ymm1 # 2c158 <_sk_overlay_sse2_8bit+0x4e3>
+ DB 196,226,125,24,13,153,14,2,0 ; vbroadcastss 0x20e99(%rip),%ymm1 # 2c094 <_sk_overlay_sse2_8bit+0x4e4>
DB 197,252,89,217 ; vmulps %ymm1,%ymm0,%ymm3
DB 72,173 ; lods %ds:(%rsi),%rax
DB 197,252,87,192 ; vxorps %ymm0,%ymm0,%ymm0
@@ -10534,7 +10534,7 @@ _sk_store_a8_avx LABEL PROC
DB 77,15,175,193 ; imul %r9,%r8
DB 76,3,0 ; add (%rax),%r8
DB 76,99,218 ; movslq %edx,%r11
- DB 196,98,125,24,5,222,14,2,0 ; vbroadcastss 0x20ede(%rip),%ymm8 # 2c110 <_sk_overlay_sse2_8bit+0x49b>
+ DB 196,98,125,24,5,26,14,2,0 ; vbroadcastss 0x20e1a(%rip),%ymm8 # 2c04c <_sk_overlay_sse2_8bit+0x49c>
DB 196,65,100,89,192 ; vmulps %ymm8,%ymm3,%ymm8
DB 196,65,125,91,192 ; vcvtps2dq %ymm8,%ymm8
DB 196,67,125,25,193,1 ; vextractf128 $0x1,%ymm8,%xmm9
@@ -10559,13 +10559,13 @@ _sk_store_a8_avx LABEL PROC
DB 196,3,121,20,4,24,0 ; vpextrb $0x0,%xmm8,(%r8,%r11,1)
DB 235,202 ; jmp b257 <_sk_store_a8_avx+0x41>
DB 196,3,121,20,68,24,2,4 ; vpextrb $0x4,%xmm8,0x2(%r8,%r11,1)
- DB 196,98,57,0,5,66,24,2,0 ; vpshufb 0x21842(%rip),%xmm8,%xmm8 # 2cae0 <_sk_overlay_sse2_8bit+0xe6b>
+ DB 196,98,57,0,5,130,23,2,0 ; vpshufb 0x21782(%rip),%xmm8,%xmm8 # 2ca20 <_sk_overlay_sse2_8bit+0xe70>
DB 196,3,121,21,4,24,0 ; vpextrw $0x0,%xmm8,(%r8,%r11,1)
DB 235,176 ; jmp b257 <_sk_store_a8_avx+0x41>
DB 196,3,121,20,68,24,6,12 ; vpextrb $0xc,%xmm8,0x6(%r8,%r11,1)
DB 196,3,121,20,68,24,5,10 ; vpextrb $0xa,%xmm8,0x5(%r8,%r11,1)
DB 196,3,121,20,68,24,4,8 ; vpextrb $0x8,%xmm8,0x4(%r8,%r11,1)
- DB 196,98,57,0,5,40,24,2,0 ; vpshufb 0x21828(%rip),%xmm8,%xmm8 # 2caf0 <_sk_overlay_sse2_8bit+0xe7b>
+ DB 196,98,57,0,5,104,23,2,0 ; vpshufb 0x21768(%rip),%xmm8,%xmm8 # 2ca30 <_sk_overlay_sse2_8bit+0xe80>
DB 196,1,121,126,4,24 ; vmovd %xmm8,(%r8,%r11,1)
DB 235,135 ; jmp b257 <_sk_store_a8_avx+0x41>
DB 180,255 ; mov $0xff,%ah
@@ -10599,16 +10599,16 @@ _sk_load_g8_avx LABEL PROC
DB 72,133,255 ; test %rdi,%rdi
DB 117,71 ; jne b34b <_sk_load_g8_avx+0x5f>
DB 196,130,121,48,4,24 ; vpmovzxbw (%r8,%r11,1),%xmm0
- DB 197,249,219,5,190,23,2,0 ; vpand 0x217be(%rip),%xmm0,%xmm0 # 2cad0 <_sk_overlay_sse2_8bit+0xe5b>
+ DB 197,249,219,5,254,22,2,0 ; vpand 0x216fe(%rip),%xmm0,%xmm0 # 2ca10 <_sk_overlay_sse2_8bit+0xe60>
DB 197,241,239,201 ; vpxor %xmm1,%xmm1,%xmm1
DB 197,249,105,201 ; vpunpckhwd %xmm1,%xmm0,%xmm1
DB 196,226,121,51,192 ; vpmovzxwd %xmm0,%xmm0
DB 196,227,125,24,193,1 ; vinsertf128 $0x1,%xmm1,%ymm0,%ymm0
DB 197,252,91,192 ; vcvtdq2ps %ymm0,%ymm0
- DB 196,226,125,24,13,38,14,2,0 ; vbroadcastss 0x20e26(%rip),%ymm1 # 2c158 <_sk_overlay_sse2_8bit+0x4e3>
+ DB 196,226,125,24,13,98,13,2,0 ; vbroadcastss 0x20d62(%rip),%ymm1 # 2c094 <_sk_overlay_sse2_8bit+0x4e4>
DB 197,252,89,193 ; vmulps %ymm1,%ymm0,%ymm0
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,29,163,13,2,0 ; vbroadcastss 0x20da3(%rip),%ymm3 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,226,125,24,29,223,12,2,0 ; vbroadcastss 0x20cdf(%rip),%ymm3 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 197,252,40,200 ; vmovaps %ymm0,%ymm1
DB 197,252,40,208 ; vmovaps %ymm0,%ymm2
DB 255,224 ; jmpq *%rax
@@ -10677,16 +10677,16 @@ _sk_load_g8_dst_avx LABEL PROC
DB 72,133,255 ; test %rdi,%rdi
DB 117,71 ; jne b45f <_sk_load_g8_dst_avx+0x5f>
DB 196,130,121,48,36,24 ; vpmovzxbw (%r8,%r11,1),%xmm4
- DB 197,217,219,37,170,22,2,0 ; vpand 0x216aa(%rip),%xmm4,%xmm4 # 2cad0 <_sk_overlay_sse2_8bit+0xe5b>
+ DB 197,217,219,37,234,21,2,0 ; vpand 0x215ea(%rip),%xmm4,%xmm4 # 2ca10 <_sk_overlay_sse2_8bit+0xe60>
DB 197,209,239,237 ; vpxor %xmm5,%xmm5,%xmm5
DB 197,217,105,237 ; vpunpckhwd %xmm5,%xmm4,%xmm5
DB 196,226,121,51,228 ; vpmovzxwd %xmm4,%xmm4
DB 196,227,93,24,229,1 ; vinsertf128 $0x1,%xmm5,%ymm4,%ymm4
DB 197,252,91,228 ; vcvtdq2ps %ymm4,%ymm4
- DB 196,226,125,24,45,18,13,2,0 ; vbroadcastss 0x20d12(%rip),%ymm5 # 2c158 <_sk_overlay_sse2_8bit+0x4e3>
+ DB 196,226,125,24,45,78,12,2,0 ; vbroadcastss 0x20c4e(%rip),%ymm5 # 2c094 <_sk_overlay_sse2_8bit+0x4e4>
DB 197,220,89,229 ; vmulps %ymm5,%ymm4,%ymm4
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,61,143,12,2,0 ; vbroadcastss 0x20c8f(%rip),%ymm7 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,226,125,24,61,203,11,2,0 ; vbroadcastss 0x20bcb(%rip),%ymm7 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 197,252,40,236 ; vmovaps %ymm4,%ymm5
DB 197,252,40,244 ; vmovaps %ymm4,%ymm6
DB 255,224 ; jmpq *%rax
@@ -10790,10 +10790,10 @@ _sk_gather_g8_avx LABEL PROC
DB 196,226,121,49,201 ; vpmovzxbd %xmm1,%xmm1
DB 196,227,125,24,193,1 ; vinsertf128 $0x1,%xmm1,%ymm0,%ymm0
DB 197,252,91,192 ; vcvtdq2ps %ymm0,%ymm0
- DB 196,226,125,24,13,113,11,2,0 ; vbroadcastss 0x20b71(%rip),%ymm1 # 2c158 <_sk_overlay_sse2_8bit+0x4e3>
+ DB 196,226,125,24,13,173,10,2,0 ; vbroadcastss 0x20aad(%rip),%ymm1 # 2c094 <_sk_overlay_sse2_8bit+0x4e4>
DB 197,252,89,193 ; vmulps %ymm1,%ymm0,%ymm0
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,29,238,10,2,0 ; vbroadcastss 0x20aee(%rip),%ymm3 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,226,125,24,29,42,10,2,0 ; vbroadcastss 0x20a2a(%rip),%ymm3 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 197,252,40,200 ; vmovaps %ymm0,%ymm1
DB 197,252,40,208 ; vmovaps %ymm0,%ymm2
DB 91 ; pop %rbx
@@ -10818,23 +10818,23 @@ _sk_load_565_avx LABEL PROC
DB 197,249,105,201 ; vpunpckhwd %xmm1,%xmm0,%xmm1
DB 196,226,121,51,192 ; vpmovzxwd %xmm0,%xmm0
DB 196,227,125,24,209,1 ; vinsertf128 $0x1,%xmm1,%ymm0,%ymm2
- DB 196,226,125,24,5,20,11,2,0 ; vbroadcastss 0x20b14(%rip),%ymm0 # 2c15c <_sk_overlay_sse2_8bit+0x4e7>
+ DB 196,226,125,24,5,80,10,2,0 ; vbroadcastss 0x20a50(%rip),%ymm0 # 2c098 <_sk_overlay_sse2_8bit+0x4e8>
DB 197,236,84,192 ; vandps %ymm0,%ymm2,%ymm0
DB 197,252,91,192 ; vcvtdq2ps %ymm0,%ymm0
- DB 196,226,125,24,13,7,11,2,0 ; vbroadcastss 0x20b07(%rip),%ymm1 # 2c160 <_sk_overlay_sse2_8bit+0x4eb>
+ DB 196,226,125,24,13,67,10,2,0 ; vbroadcastss 0x20a43(%rip),%ymm1 # 2c09c <_sk_overlay_sse2_8bit+0x4ec>
DB 197,252,89,193 ; vmulps %ymm1,%ymm0,%ymm0
- DB 196,226,125,24,13,254,10,2,0 ; vbroadcastss 0x20afe(%rip),%ymm1 # 2c164 <_sk_overlay_sse2_8bit+0x4ef>
+ DB 196,226,125,24,13,58,10,2,0 ; vbroadcastss 0x20a3a(%rip),%ymm1 # 2c0a0 <_sk_overlay_sse2_8bit+0x4f0>
DB 197,236,84,201 ; vandps %ymm1,%ymm2,%ymm1
DB 197,252,91,201 ; vcvtdq2ps %ymm1,%ymm1
- DB 196,226,125,24,29,241,10,2,0 ; vbroadcastss 0x20af1(%rip),%ymm3 # 2c168 <_sk_overlay_sse2_8bit+0x4f3>
+ DB 196,226,125,24,29,45,10,2,0 ; vbroadcastss 0x20a2d(%rip),%ymm3 # 2c0a4 <_sk_overlay_sse2_8bit+0x4f4>
DB 197,244,89,203 ; vmulps %ymm3,%ymm1,%ymm1
- DB 196,226,125,24,29,232,10,2,0 ; vbroadcastss 0x20ae8(%rip),%ymm3 # 2c16c <_sk_overlay_sse2_8bit+0x4f7>
+ DB 196,226,125,24,29,36,10,2,0 ; vbroadcastss 0x20a24(%rip),%ymm3 # 2c0a8 <_sk_overlay_sse2_8bit+0x4f8>
DB 197,236,84,211 ; vandps %ymm3,%ymm2,%ymm2
DB 197,252,91,210 ; vcvtdq2ps %ymm2,%ymm2
- DB 196,226,125,24,29,219,10,2,0 ; vbroadcastss 0x20adb(%rip),%ymm3 # 2c170 <_sk_overlay_sse2_8bit+0x4fb>
+ DB 196,226,125,24,29,23,10,2,0 ; vbroadcastss 0x20a17(%rip),%ymm3 # 2c0ac <_sk_overlay_sse2_8bit+0x4fc>
DB 197,236,89,211 ; vmulps %ymm3,%ymm2,%ymm2
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,29,64,10,2,0 ; vbroadcastss 0x20a40(%rip),%ymm3 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,226,125,24,29,124,9,2,0 ; vbroadcastss 0x2097c(%rip),%ymm3 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 255,224 ; jmpq *%rax
DB 65,137,249 ; mov %edi,%r9d
DB 65,128,225,7 ; and $0x7,%r9b
@@ -10898,23 +10898,23 @@ _sk_load_565_dst_avx LABEL PROC
DB 197,217,105,237 ; vpunpckhwd %xmm5,%xmm4,%xmm5
DB 196,226,121,51,228 ; vpmovzxwd %xmm4,%xmm4
DB 196,227,93,24,245,1 ; vinsertf128 $0x1,%xmm5,%ymm4,%ymm6
- DB 196,226,125,24,37,211,9,2,0 ; vbroadcastss 0x209d3(%rip),%ymm4 # 2c15c <_sk_overlay_sse2_8bit+0x4e7>
+ DB 196,226,125,24,37,15,9,2,0 ; vbroadcastss 0x2090f(%rip),%ymm4 # 2c098 <_sk_overlay_sse2_8bit+0x4e8>
DB 197,204,84,228 ; vandps %ymm4,%ymm6,%ymm4
DB 197,252,91,228 ; vcvtdq2ps %ymm4,%ymm4
- DB 196,226,125,24,45,198,9,2,0 ; vbroadcastss 0x209c6(%rip),%ymm5 # 2c160 <_sk_overlay_sse2_8bit+0x4eb>
+ DB 196,226,125,24,45,2,9,2,0 ; vbroadcastss 0x20902(%rip),%ymm5 # 2c09c <_sk_overlay_sse2_8bit+0x4ec>
DB 197,220,89,229 ; vmulps %ymm5,%ymm4,%ymm4
- DB 196,226,125,24,45,189,9,2,0 ; vbroadcastss 0x209bd(%rip),%ymm5 # 2c164 <_sk_overlay_sse2_8bit+0x4ef>
+ DB 196,226,125,24,45,249,8,2,0 ; vbroadcastss 0x208f9(%rip),%ymm5 # 2c0a0 <_sk_overlay_sse2_8bit+0x4f0>
DB 197,204,84,237 ; vandps %ymm5,%ymm6,%ymm5
DB 197,252,91,237 ; vcvtdq2ps %ymm5,%ymm5
- DB 196,226,125,24,61,176,9,2,0 ; vbroadcastss 0x209b0(%rip),%ymm7 # 2c168 <_sk_overlay_sse2_8bit+0x4f3>
+ DB 196,226,125,24,61,236,8,2,0 ; vbroadcastss 0x208ec(%rip),%ymm7 # 2c0a4 <_sk_overlay_sse2_8bit+0x4f4>
DB 197,212,89,239 ; vmulps %ymm7,%ymm5,%ymm5
- DB 196,226,125,24,61,167,9,2,0 ; vbroadcastss 0x209a7(%rip),%ymm7 # 2c16c <_sk_overlay_sse2_8bit+0x4f7>
+ DB 196,226,125,24,61,227,8,2,0 ; vbroadcastss 0x208e3(%rip),%ymm7 # 2c0a8 <_sk_overlay_sse2_8bit+0x4f8>
DB 197,204,84,247 ; vandps %ymm7,%ymm6,%ymm6
DB 197,252,91,246 ; vcvtdq2ps %ymm6,%ymm6
- DB 196,226,125,24,61,154,9,2,0 ; vbroadcastss 0x2099a(%rip),%ymm7 # 2c170 <_sk_overlay_sse2_8bit+0x4fb>
+ DB 196,226,125,24,61,214,8,2,0 ; vbroadcastss 0x208d6(%rip),%ymm7 # 2c0ac <_sk_overlay_sse2_8bit+0x4fc>
DB 197,204,89,247 ; vmulps %ymm7,%ymm6,%ymm6
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,61,255,8,2,0 ; vbroadcastss 0x208ff(%rip),%ymm7 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,226,125,24,61,59,8,2,0 ; vbroadcastss 0x2083b(%rip),%ymm7 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 255,224 ; jmpq *%rax
DB 65,137,249 ; mov %edi,%r9d
DB 65,128,225,7 ; and $0x7,%r9b
@@ -11014,23 +11014,23 @@ _sk_gather_565_avx LABEL PROC
DB 197,249,105,201 ; vpunpckhwd %xmm1,%xmm0,%xmm1
DB 196,226,121,51,192 ; vpmovzxwd %xmm0,%xmm0
DB 196,227,125,24,209,1 ; vinsertf128 $0x1,%xmm1,%ymm0,%ymm2
- DB 196,226,125,24,5,250,7,2,0 ; vbroadcastss 0x207fa(%rip),%ymm0 # 2c15c <_sk_overlay_sse2_8bit+0x4e7>
+ DB 196,226,125,24,5,54,7,2,0 ; vbroadcastss 0x20736(%rip),%ymm0 # 2c098 <_sk_overlay_sse2_8bit+0x4e8>
DB 197,236,84,192 ; vandps %ymm0,%ymm2,%ymm0
DB 197,252,91,192 ; vcvtdq2ps %ymm0,%ymm0
- DB 196,226,125,24,13,237,7,2,0 ; vbroadcastss 0x207ed(%rip),%ymm1 # 2c160 <_sk_overlay_sse2_8bit+0x4eb>
+ DB 196,226,125,24,13,41,7,2,0 ; vbroadcastss 0x20729(%rip),%ymm1 # 2c09c <_sk_overlay_sse2_8bit+0x4ec>
DB 197,252,89,193 ; vmulps %ymm1,%ymm0,%ymm0
- DB 196,226,125,24,13,228,7,2,0 ; vbroadcastss 0x207e4(%rip),%ymm1 # 2c164 <_sk_overlay_sse2_8bit+0x4ef>
+ DB 196,226,125,24,13,32,7,2,0 ; vbroadcastss 0x20720(%rip),%ymm1 # 2c0a0 <_sk_overlay_sse2_8bit+0x4f0>
DB 197,236,84,201 ; vandps %ymm1,%ymm2,%ymm1
DB 197,252,91,201 ; vcvtdq2ps %ymm1,%ymm1
- DB 196,226,125,24,29,215,7,2,0 ; vbroadcastss 0x207d7(%rip),%ymm3 # 2c168 <_sk_overlay_sse2_8bit+0x4f3>
+ DB 196,226,125,24,29,19,7,2,0 ; vbroadcastss 0x20713(%rip),%ymm3 # 2c0a4 <_sk_overlay_sse2_8bit+0x4f4>
DB 197,244,89,203 ; vmulps %ymm3,%ymm1,%ymm1
- DB 196,226,125,24,29,206,7,2,0 ; vbroadcastss 0x207ce(%rip),%ymm3 # 2c16c <_sk_overlay_sse2_8bit+0x4f7>
+ DB 196,226,125,24,29,10,7,2,0 ; vbroadcastss 0x2070a(%rip),%ymm3 # 2c0a8 <_sk_overlay_sse2_8bit+0x4f8>
DB 197,236,84,211 ; vandps %ymm3,%ymm2,%ymm2
DB 197,252,91,210 ; vcvtdq2ps %ymm2,%ymm2
- DB 196,226,125,24,29,193,7,2,0 ; vbroadcastss 0x207c1(%rip),%ymm3 # 2c170 <_sk_overlay_sse2_8bit+0x4fb>
+ DB 196,226,125,24,29,253,6,2,0 ; vbroadcastss 0x206fd(%rip),%ymm3 # 2c0ac <_sk_overlay_sse2_8bit+0x4fc>
DB 197,236,89,211 ; vmulps %ymm3,%ymm2,%ymm2
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,29,38,7,2,0 ; vbroadcastss 0x20726(%rip),%ymm3 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,226,125,24,29,98,6,2,0 ; vbroadcastss 0x20662(%rip),%ymm3 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 91 ; pop %rbx
DB 65,92 ; pop %r12
DB 65,94 ; pop %r14
@@ -11047,14 +11047,14 @@ _sk_store_565_avx LABEL PROC
DB 77,1,192 ; add %r8,%r8
DB 76,3,0 ; add (%rax),%r8
DB 76,99,218 ; movslq %edx,%r11
- DB 196,98,125,24,5,233,7,2,0 ; vbroadcastss 0x207e9(%rip),%ymm8 # 2c1d0 <_sk_overlay_sse2_8bit+0x55b>
+ DB 196,98,125,24,5,37,7,2,0 ; vbroadcastss 0x20725(%rip),%ymm8 # 2c10c <_sk_overlay_sse2_8bit+0x55c>
DB 196,65,124,89,200 ; vmulps %ymm8,%ymm0,%ymm9
DB 196,65,125,91,201 ; vcvtps2dq %ymm9,%ymm9
DB 196,193,41,114,241,11 ; vpslld $0xb,%xmm9,%xmm10
DB 196,67,125,25,201,1 ; vextractf128 $0x1,%ymm9,%xmm9
DB 196,193,49,114,241,11 ; vpslld $0xb,%xmm9,%xmm9
DB 196,67,45,24,201,1 ; vinsertf128 $0x1,%xmm9,%ymm10,%ymm9
- DB 196,98,125,24,21,194,7,2,0 ; vbroadcastss 0x207c2(%rip),%ymm10 # 2c1d4 <_sk_overlay_sse2_8bit+0x55f>
+ DB 196,98,125,24,21,254,6,2,0 ; vbroadcastss 0x206fe(%rip),%ymm10 # 2c110 <_sk_overlay_sse2_8bit+0x560>
DB 196,65,116,89,210 ; vmulps %ymm10,%ymm1,%ymm10
DB 196,65,125,91,210 ; vcvtps2dq %ymm10,%ymm10
DB 196,193,33,114,242,5 ; vpslld $0x5,%xmm10,%xmm11
@@ -11133,25 +11133,25 @@ _sk_load_4444_avx LABEL PROC
DB 197,249,105,201 ; vpunpckhwd %xmm1,%xmm0,%xmm1
DB 196,226,121,51,192 ; vpmovzxwd %xmm0,%xmm0
DB 196,227,125,24,217,1 ; vinsertf128 $0x1,%xmm1,%ymm0,%ymm3
- DB 196,226,125,24,5,187,6,2,0 ; vbroadcastss 0x206bb(%rip),%ymm0 # 2c1d8 <_sk_overlay_sse2_8bit+0x563>
+ DB 196,226,125,24,5,247,5,2,0 ; vbroadcastss 0x205f7(%rip),%ymm0 # 2c114 <_sk_overlay_sse2_8bit+0x564>
DB 197,228,84,192 ; vandps %ymm0,%ymm3,%ymm0
DB 197,252,91,192 ; vcvtdq2ps %ymm0,%ymm0
- DB 196,226,125,24,13,174,6,2,0 ; vbroadcastss 0x206ae(%rip),%ymm1 # 2c1dc <_sk_overlay_sse2_8bit+0x567>
+ DB 196,226,125,24,13,234,5,2,0 ; vbroadcastss 0x205ea(%rip),%ymm1 # 2c118 <_sk_overlay_sse2_8bit+0x568>
DB 197,252,89,193 ; vmulps %ymm1,%ymm0,%ymm0
- DB 196,226,125,24,13,165,6,2,0 ; vbroadcastss 0x206a5(%rip),%ymm1 # 2c1e0 <_sk_overlay_sse2_8bit+0x56b>
+ DB 196,226,125,24,13,225,5,2,0 ; vbroadcastss 0x205e1(%rip),%ymm1 # 2c11c <_sk_overlay_sse2_8bit+0x56c>
DB 197,228,84,201 ; vandps %ymm1,%ymm3,%ymm1
DB 197,252,91,201 ; vcvtdq2ps %ymm1,%ymm1
- DB 196,226,125,24,21,152,6,2,0 ; vbroadcastss 0x20698(%rip),%ymm2 # 2c1e4 <_sk_overlay_sse2_8bit+0x56f>
+ DB 196,226,125,24,21,212,5,2,0 ; vbroadcastss 0x205d4(%rip),%ymm2 # 2c120 <_sk_overlay_sse2_8bit+0x570>
DB 197,244,89,202 ; vmulps %ymm2,%ymm1,%ymm1
- DB 196,226,125,24,21,143,6,2,0 ; vbroadcastss 0x2068f(%rip),%ymm2 # 2c1e8 <_sk_overlay_sse2_8bit+0x573>
+ DB 196,226,125,24,21,203,5,2,0 ; vbroadcastss 0x205cb(%rip),%ymm2 # 2c124 <_sk_overlay_sse2_8bit+0x574>
DB 197,228,84,210 ; vandps %ymm2,%ymm3,%ymm2
DB 197,252,91,210 ; vcvtdq2ps %ymm2,%ymm2
- DB 196,98,125,24,5,130,6,2,0 ; vbroadcastss 0x20682(%rip),%ymm8 # 2c1ec <_sk_overlay_sse2_8bit+0x577>
+ DB 196,98,125,24,5,190,5,2,0 ; vbroadcastss 0x205be(%rip),%ymm8 # 2c128 <_sk_overlay_sse2_8bit+0x578>
DB 196,193,108,89,208 ; vmulps %ymm8,%ymm2,%ymm2
- DB 196,98,125,24,5,120,6,2,0 ; vbroadcastss 0x20678(%rip),%ymm8 # 2c1f0 <_sk_overlay_sse2_8bit+0x57b>
+ DB 196,98,125,24,5,180,5,2,0 ; vbroadcastss 0x205b4(%rip),%ymm8 # 2c12c <_sk_overlay_sse2_8bit+0x57c>
DB 196,193,100,84,216 ; vandps %ymm8,%ymm3,%ymm3
DB 197,252,91,219 ; vcvtdq2ps %ymm3,%ymm3
- DB 196,98,125,24,5,106,6,2,0 ; vbroadcastss 0x2066a(%rip),%ymm8 # 2c1f4 <_sk_overlay_sse2_8bit+0x57f>
+ DB 196,98,125,24,5,166,5,2,0 ; vbroadcastss 0x205a6(%rip),%ymm8 # 2c130 <_sk_overlay_sse2_8bit+0x580>
DB 196,193,100,89,216 ; vmulps %ymm8,%ymm3,%ymm3
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
@@ -11218,25 +11218,25 @@ _sk_load_4444_dst_avx LABEL PROC
DB 197,217,105,237 ; vpunpckhwd %xmm5,%xmm4,%xmm5
DB 196,226,121,51,228 ; vpmovzxwd %xmm4,%xmm4
DB 196,227,93,24,253,1 ; vinsertf128 $0x1,%xmm5,%ymm4,%ymm7
- DB 196,226,125,24,37,99,5,2,0 ; vbroadcastss 0x20563(%rip),%ymm4 # 2c1d8 <_sk_overlay_sse2_8bit+0x563>
+ DB 196,226,125,24,37,159,4,2,0 ; vbroadcastss 0x2049f(%rip),%ymm4 # 2c114 <_sk_overlay_sse2_8bit+0x564>
DB 197,196,84,228 ; vandps %ymm4,%ymm7,%ymm4
DB 197,252,91,228 ; vcvtdq2ps %ymm4,%ymm4
- DB 196,226,125,24,45,86,5,2,0 ; vbroadcastss 0x20556(%rip),%ymm5 # 2c1dc <_sk_overlay_sse2_8bit+0x567>
+ DB 196,226,125,24,45,146,4,2,0 ; vbroadcastss 0x20492(%rip),%ymm5 # 2c118 <_sk_overlay_sse2_8bit+0x568>
DB 197,220,89,229 ; vmulps %ymm5,%ymm4,%ymm4
- DB 196,226,125,24,45,77,5,2,0 ; vbroadcastss 0x2054d(%rip),%ymm5 # 2c1e0 <_sk_overlay_sse2_8bit+0x56b>
+ DB 196,226,125,24,45,137,4,2,0 ; vbroadcastss 0x20489(%rip),%ymm5 # 2c11c <_sk_overlay_sse2_8bit+0x56c>
DB 197,196,84,237 ; vandps %ymm5,%ymm7,%ymm5
DB 197,252,91,237 ; vcvtdq2ps %ymm5,%ymm5
- DB 196,226,125,24,53,64,5,2,0 ; vbroadcastss 0x20540(%rip),%ymm6 # 2c1e4 <_sk_overlay_sse2_8bit+0x56f>
+ DB 196,226,125,24,53,124,4,2,0 ; vbroadcastss 0x2047c(%rip),%ymm6 # 2c120 <_sk_overlay_sse2_8bit+0x570>
DB 197,212,89,238 ; vmulps %ymm6,%ymm5,%ymm5
- DB 196,226,125,24,53,55,5,2,0 ; vbroadcastss 0x20537(%rip),%ymm6 # 2c1e8 <_sk_overlay_sse2_8bit+0x573>
+ DB 196,226,125,24,53,115,4,2,0 ; vbroadcastss 0x20473(%rip),%ymm6 # 2c124 <_sk_overlay_sse2_8bit+0x574>
DB 197,196,84,246 ; vandps %ymm6,%ymm7,%ymm6
DB 197,252,91,246 ; vcvtdq2ps %ymm6,%ymm6
- DB 196,98,125,24,5,42,5,2,0 ; vbroadcastss 0x2052a(%rip),%ymm8 # 2c1ec <_sk_overlay_sse2_8bit+0x577>
+ DB 196,98,125,24,5,102,4,2,0 ; vbroadcastss 0x20466(%rip),%ymm8 # 2c128 <_sk_overlay_sse2_8bit+0x578>
DB 196,193,76,89,240 ; vmulps %ymm8,%ymm6,%ymm6
- DB 196,98,125,24,5,32,5,2,0 ; vbroadcastss 0x20520(%rip),%ymm8 # 2c1f0 <_sk_overlay_sse2_8bit+0x57b>
+ DB 196,98,125,24,5,92,4,2,0 ; vbroadcastss 0x2045c(%rip),%ymm8 # 2c12c <_sk_overlay_sse2_8bit+0x57c>
DB 196,193,68,84,248 ; vandps %ymm8,%ymm7,%ymm7
DB 197,252,91,255 ; vcvtdq2ps %ymm7,%ymm7
- DB 196,98,125,24,5,18,5,2,0 ; vbroadcastss 0x20512(%rip),%ymm8 # 2c1f4 <_sk_overlay_sse2_8bit+0x57f>
+ DB 196,98,125,24,5,78,4,2,0 ; vbroadcastss 0x2044e(%rip),%ymm8 # 2c130 <_sk_overlay_sse2_8bit+0x580>
DB 196,193,68,89,248 ; vmulps %ymm8,%ymm7,%ymm7
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
@@ -11338,25 +11338,25 @@ _sk_gather_4444_avx LABEL PROC
DB 197,249,105,201 ; vpunpckhwd %xmm1,%xmm0,%xmm1
DB 196,226,121,51,192 ; vpmovzxwd %xmm0,%xmm0
DB 196,227,125,24,217,1 ; vinsertf128 $0x1,%xmm1,%ymm0,%ymm3
- DB 196,226,125,24,5,114,3,2,0 ; vbroadcastss 0x20372(%rip),%ymm0 # 2c1d8 <_sk_overlay_sse2_8bit+0x563>
+ DB 196,226,125,24,5,174,2,2,0 ; vbroadcastss 0x202ae(%rip),%ymm0 # 2c114 <_sk_overlay_sse2_8bit+0x564>
DB 197,228,84,192 ; vandps %ymm0,%ymm3,%ymm0
DB 197,252,91,192 ; vcvtdq2ps %ymm0,%ymm0
- DB 196,226,125,24,13,101,3,2,0 ; vbroadcastss 0x20365(%rip),%ymm1 # 2c1dc <_sk_overlay_sse2_8bit+0x567>
+ DB 196,226,125,24,13,161,2,2,0 ; vbroadcastss 0x202a1(%rip),%ymm1 # 2c118 <_sk_overlay_sse2_8bit+0x568>
DB 197,252,89,193 ; vmulps %ymm1,%ymm0,%ymm0
- DB 196,226,125,24,13,92,3,2,0 ; vbroadcastss 0x2035c(%rip),%ymm1 # 2c1e0 <_sk_overlay_sse2_8bit+0x56b>
+ DB 196,226,125,24,13,152,2,2,0 ; vbroadcastss 0x20298(%rip),%ymm1 # 2c11c <_sk_overlay_sse2_8bit+0x56c>
DB 197,228,84,201 ; vandps %ymm1,%ymm3,%ymm1
DB 197,252,91,201 ; vcvtdq2ps %ymm1,%ymm1
- DB 196,226,125,24,21,79,3,2,0 ; vbroadcastss 0x2034f(%rip),%ymm2 # 2c1e4 <_sk_overlay_sse2_8bit+0x56f>
+ DB 196,226,125,24,21,139,2,2,0 ; vbroadcastss 0x2028b(%rip),%ymm2 # 2c120 <_sk_overlay_sse2_8bit+0x570>
DB 197,244,89,202 ; vmulps %ymm2,%ymm1,%ymm1
- DB 196,226,125,24,21,70,3,2,0 ; vbroadcastss 0x20346(%rip),%ymm2 # 2c1e8 <_sk_overlay_sse2_8bit+0x573>
+ DB 196,226,125,24,21,130,2,2,0 ; vbroadcastss 0x20282(%rip),%ymm2 # 2c124 <_sk_overlay_sse2_8bit+0x574>
DB 197,228,84,210 ; vandps %ymm2,%ymm3,%ymm2
DB 197,252,91,210 ; vcvtdq2ps %ymm2,%ymm2
- DB 196,98,125,24,5,57,3,2,0 ; vbroadcastss 0x20339(%rip),%ymm8 # 2c1ec <_sk_overlay_sse2_8bit+0x577>
+ DB 196,98,125,24,5,117,2,2,0 ; vbroadcastss 0x20275(%rip),%ymm8 # 2c128 <_sk_overlay_sse2_8bit+0x578>
DB 196,193,108,89,208 ; vmulps %ymm8,%ymm2,%ymm2
- DB 196,98,125,24,5,47,3,2,0 ; vbroadcastss 0x2032f(%rip),%ymm8 # 2c1f0 <_sk_overlay_sse2_8bit+0x57b>
+ DB 196,98,125,24,5,107,2,2,0 ; vbroadcastss 0x2026b(%rip),%ymm8 # 2c12c <_sk_overlay_sse2_8bit+0x57c>
DB 196,193,100,84,216 ; vandps %ymm8,%ymm3,%ymm3
DB 197,252,91,219 ; vcvtdq2ps %ymm3,%ymm3
- DB 196,98,125,24,5,33,3,2,0 ; vbroadcastss 0x20321(%rip),%ymm8 # 2c1f4 <_sk_overlay_sse2_8bit+0x57f>
+ DB 196,98,125,24,5,93,2,2,0 ; vbroadcastss 0x2025d(%rip),%ymm8 # 2c130 <_sk_overlay_sse2_8bit+0x580>
DB 196,193,100,89,216 ; vmulps %ymm8,%ymm3,%ymm3
DB 72,173 ; lods %ds:(%rsi),%rax
DB 91 ; pop %rbx
@@ -11375,7 +11375,7 @@ _sk_store_4444_avx LABEL PROC
DB 77,1,192 ; add %r8,%r8
DB 76,3,0 ; add (%rax),%r8
DB 76,99,218 ; movslq %edx,%r11
- DB 196,98,125,24,5,245,2,2,0 ; vbroadcastss 0x202f5(%rip),%ymm8 # 2c1f8 <_sk_overlay_sse2_8bit+0x583>
+ DB 196,98,125,24,5,49,2,2,0 ; vbroadcastss 0x20231(%rip),%ymm8 # 2c134 <_sk_overlay_sse2_8bit+0x584>
DB 196,65,124,89,200 ; vmulps %ymm8,%ymm0,%ymm9
DB 196,65,125,91,201 ; vcvtps2dq %ymm9,%ymm9
DB 196,193,41,114,241,12 ; vpslld $0xc,%xmm9,%xmm10
@@ -11463,10 +11463,10 @@ _sk_load_8888_avx LABEL PROC
DB 72,133,255 ; test %rdi,%rdi
DB 15,133,135,0,0,0 ; jne c0bf <_sk_load_8888_avx+0xa7>
DB 196,1,125,16,12,152 ; vmovupd (%r8,%r11,4),%ymm9
- DB 197,125,40,21,218,5,2,0 ; vmovapd 0x205da(%rip),%ymm10 # 2c620 <_sk_overlay_sse2_8bit+0x9ab>
+ DB 197,125,40,21,26,5,2,0 ; vmovapd 0x2051a(%rip),%ymm10 # 2c560 <_sk_overlay_sse2_8bit+0x9b0>
DB 196,193,53,84,194 ; vandpd %ymm10,%ymm9,%ymm0
DB 197,252,91,192 ; vcvtdq2ps %ymm0,%ymm0
- DB 196,98,125,24,5,0,1,2,0 ; vbroadcastss 0x20100(%rip),%ymm8 # 2c158 <_sk_overlay_sse2_8bit+0x4e3>
+ DB 196,98,125,24,5,60,0,2,0 ; vbroadcastss 0x2003c(%rip),%ymm8 # 2c094 <_sk_overlay_sse2_8bit+0x4e4>
DB 196,193,124,89,192 ; vmulps %ymm8,%ymm0,%ymm0
DB 196,193,113,114,209,8 ; vpsrld $0x8,%xmm9,%xmm1
DB 196,99,125,25,203,1 ; vextractf128 $0x1,%ymm9,%xmm3
@@ -11556,10 +11556,10 @@ _sk_load_8888_dst_avx LABEL PROC
DB 72,133,255 ; test %rdi,%rdi
DB 15,133,135,0,0,0 ; jne c237 <_sk_load_8888_dst_avx+0xa7>
DB 196,1,125,16,12,152 ; vmovupd (%r8,%r11,4),%ymm9
- DB 197,125,40,21,130,4,2,0 ; vmovapd 0x20482(%rip),%ymm10 # 2c640 <_sk_overlay_sse2_8bit+0x9cb>
+ DB 197,125,40,21,194,3,2,0 ; vmovapd 0x203c2(%rip),%ymm10 # 2c580 <_sk_overlay_sse2_8bit+0x9d0>
DB 196,193,53,84,226 ; vandpd %ymm10,%ymm9,%ymm4
DB 197,252,91,228 ; vcvtdq2ps %ymm4,%ymm4
- DB 196,98,125,24,5,136,255,1,0 ; vbroadcastss 0x1ff88(%rip),%ymm8 # 2c158 <_sk_overlay_sse2_8bit+0x4e3>
+ DB 196,98,125,24,5,196,254,1,0 ; vbroadcastss 0x1fec4(%rip),%ymm8 # 2c094 <_sk_overlay_sse2_8bit+0x4e4>
DB 196,193,92,89,224 ; vmulps %ymm8,%ymm4,%ymm4
DB 196,193,81,114,209,8 ; vpsrld $0x8,%xmm9,%xmm5
DB 196,99,125,25,207,1 ; vextractf128 $0x1,%ymm9,%xmm7
@@ -11676,10 +11676,10 @@ _sk_gather_8888_avx LABEL PROC
DB 196,131,121,34,4,152,2 ; vpinsrd $0x2,(%r8,%r11,4),%xmm0,%xmm0
DB 196,131,121,34,28,144,3 ; vpinsrd $0x3,(%r8,%r10,4),%xmm0,%xmm3
DB 196,227,61,24,195,1 ; vinsertf128 $0x1,%xmm3,%ymm8,%ymm0
- DB 197,124,40,21,166,2,2,0 ; vmovaps 0x202a6(%rip),%ymm10 # 2c660 <_sk_overlay_sse2_8bit+0x9eb>
+ DB 197,124,40,21,230,1,2,0 ; vmovaps 0x201e6(%rip),%ymm10 # 2c5a0 <_sk_overlay_sse2_8bit+0x9f0>
DB 196,193,124,84,194 ; vandps %ymm10,%ymm0,%ymm0
DB 197,252,91,192 ; vcvtdq2ps %ymm0,%ymm0
- DB 196,98,125,24,13,140,253,1,0 ; vbroadcastss 0x1fd8c(%rip),%ymm9 # 2c158 <_sk_overlay_sse2_8bit+0x4e3>
+ DB 196,98,125,24,13,200,252,1,0 ; vbroadcastss 0x1fcc8(%rip),%ymm9 # 2c094 <_sk_overlay_sse2_8bit+0x4e4>
DB 196,193,124,89,193 ; vmulps %ymm9,%ymm0,%ymm0
DB 196,193,113,114,208,8 ; vpsrld $0x8,%xmm8,%xmm1
DB 197,233,114,211,8 ; vpsrld $0x8,%xmm3,%xmm2
@@ -11714,7 +11714,7 @@ _sk_store_8888_avx LABEL PROC
DB 73,193,224,2 ; shl $0x2,%r8
DB 76,3,0 ; add (%rax),%r8
DB 76,99,218 ; movslq %edx,%r11
- DB 196,98,125,24,5,188,252,1,0 ; vbroadcastss 0x1fcbc(%rip),%ymm8 # 2c110 <_sk_overlay_sse2_8bit+0x49b>
+ DB 196,98,125,24,5,248,251,1,0 ; vbroadcastss 0x1fbf8(%rip),%ymm8 # 2c04c <_sk_overlay_sse2_8bit+0x49c>
DB 196,65,124,89,200 ; vmulps %ymm8,%ymm0,%ymm9
DB 196,65,125,91,201 ; vcvtps2dq %ymm9,%ymm9
DB 196,65,116,89,208 ; vmulps %ymm8,%ymm1,%ymm10
@@ -11800,10 +11800,10 @@ _sk_load_bgra_avx LABEL PROC
DB 72,133,255 ; test %rdi,%rdi
DB 15,133,135,0,0,0 ; jne c613 <_sk_load_bgra_avx+0xa7>
DB 196,1,125,16,12,152 ; vmovupd (%r8,%r11,4),%ymm9
- DB 197,125,40,21,230,0,2,0 ; vmovapd 0x200e6(%rip),%ymm10 # 2c680 <_sk_overlay_sse2_8bit+0xa0b>
+ DB 197,125,40,21,38,0,2,0 ; vmovapd 0x20026(%rip),%ymm10 # 2c5c0 <_sk_overlay_sse2_8bit+0xa10>
DB 196,193,53,84,202 ; vandpd %ymm10,%ymm9,%ymm1
DB 197,252,91,201 ; vcvtdq2ps %ymm1,%ymm1
- DB 196,98,125,24,5,172,251,1,0 ; vbroadcastss 0x1fbac(%rip),%ymm8 # 2c158 <_sk_overlay_sse2_8bit+0x4e3>
+ DB 196,98,125,24,5,232,250,1,0 ; vbroadcastss 0x1fae8(%rip),%ymm8 # 2c094 <_sk_overlay_sse2_8bit+0x4e4>
DB 196,193,116,89,208 ; vmulps %ymm8,%ymm1,%ymm2
DB 196,193,113,114,209,8 ; vpsrld $0x8,%xmm9,%xmm1
DB 196,99,125,25,203,1 ; vextractf128 $0x1,%ymm9,%xmm3
@@ -11893,10 +11893,10 @@ _sk_load_bgra_dst_avx LABEL PROC
DB 72,133,255 ; test %rdi,%rdi
DB 15,133,135,0,0,0 ; jne c78b <_sk_load_bgra_dst_avx+0xa7>
DB 196,1,125,16,12,152 ; vmovupd (%r8,%r11,4),%ymm9
- DB 197,125,40,21,142,255,1,0 ; vmovapd 0x1ff8e(%rip),%ymm10 # 2c6a0 <_sk_overlay_sse2_8bit+0xa2b>
+ DB 197,125,40,21,206,254,1,0 ; vmovapd 0x1fece(%rip),%ymm10 # 2c5e0 <_sk_overlay_sse2_8bit+0xa30>
DB 196,193,53,84,234 ; vandpd %ymm10,%ymm9,%ymm5
DB 197,252,91,237 ; vcvtdq2ps %ymm5,%ymm5
- DB 196,98,125,24,5,52,250,1,0 ; vbroadcastss 0x1fa34(%rip),%ymm8 # 2c158 <_sk_overlay_sse2_8bit+0x4e3>
+ DB 196,98,125,24,5,112,249,1,0 ; vbroadcastss 0x1f970(%rip),%ymm8 # 2c094 <_sk_overlay_sse2_8bit+0x4e4>
DB 196,193,84,89,240 ; vmulps %ymm8,%ymm5,%ymm6
DB 196,193,81,114,209,8 ; vpsrld $0x8,%xmm9,%xmm5
DB 196,99,125,25,207,1 ; vextractf128 $0x1,%ymm9,%xmm7
@@ -12013,10 +12013,10 @@ _sk_gather_bgra_avx LABEL PROC
DB 196,131,121,34,4,152,2 ; vpinsrd $0x2,(%r8,%r11,4),%xmm0,%xmm0
DB 196,131,121,34,28,144,3 ; vpinsrd $0x3,(%r8,%r10,4),%xmm0,%xmm3
DB 196,227,61,24,195,1 ; vinsertf128 $0x1,%xmm3,%ymm8,%ymm0
- DB 197,124,40,13,178,253,1,0 ; vmovaps 0x1fdb2(%rip),%ymm9 # 2c6c0 <_sk_overlay_sse2_8bit+0xa4b>
+ DB 197,124,40,13,242,252,1,0 ; vmovaps 0x1fcf2(%rip),%ymm9 # 2c600 <_sk_overlay_sse2_8bit+0xa50>
DB 196,193,124,84,193 ; vandps %ymm9,%ymm0,%ymm0
DB 197,252,91,192 ; vcvtdq2ps %ymm0,%ymm0
- DB 196,98,125,24,21,56,248,1,0 ; vbroadcastss 0x1f838(%rip),%ymm10 # 2c158 <_sk_overlay_sse2_8bit+0x4e3>
+ DB 196,98,125,24,21,116,247,1,0 ; vbroadcastss 0x1f774(%rip),%ymm10 # 2c094 <_sk_overlay_sse2_8bit+0x4e4>
DB 196,193,124,89,210 ; vmulps %ymm10,%ymm0,%ymm2
DB 196,193,121,114,208,8 ; vpsrld $0x8,%xmm8,%xmm0
DB 197,241,114,211,8 ; vpsrld $0x8,%xmm3,%xmm1
@@ -12051,7 +12051,7 @@ _sk_store_bgra_avx LABEL PROC
DB 73,193,224,2 ; shl $0x2,%r8
DB 76,3,0 ; add (%rax),%r8
DB 76,99,218 ; movslq %edx,%r11
- DB 196,98,125,24,5,104,247,1,0 ; vbroadcastss 0x1f768(%rip),%ymm8 # 2c110 <_sk_overlay_sse2_8bit+0x49b>
+ DB 196,98,125,24,5,164,246,1,0 ; vbroadcastss 0x1f6a4(%rip),%ymm8 # 2c04c <_sk_overlay_sse2_8bit+0x49c>
DB 196,65,108,89,200 ; vmulps %ymm8,%ymm2,%ymm9
DB 196,65,125,91,201 ; vcvtps2dq %ymm9,%ymm9
DB 196,65,116,89,208 ; vmulps %ymm8,%ymm1,%ymm10
@@ -12158,13 +12158,13 @@ _sk_load_f16_avx LABEL PROC
DB 197,249,105,201 ; vpunpckhwd %xmm1,%xmm0,%xmm1
DB 196,226,121,51,192 ; vpmovzxwd %xmm0,%xmm0
DB 196,227,125,24,193,1 ; vinsertf128 $0x1,%xmm1,%ymm0,%ymm0
- DB 196,98,125,24,37,5,247,1,0 ; vbroadcastss 0x1f705(%rip),%ymm12 # 2c260 <_sk_overlay_sse2_8bit+0x5eb>
+ DB 196,98,125,24,37,65,246,1,0 ; vbroadcastss 0x1f641(%rip),%ymm12 # 2c19c <_sk_overlay_sse2_8bit+0x5ec>
DB 196,193,124,84,204 ; vandps %ymm12,%ymm0,%ymm1
DB 197,252,87,193 ; vxorps %ymm1,%ymm0,%ymm0
DB 196,195,125,25,198,1 ; vextractf128 $0x1,%ymm0,%xmm14
- DB 196,98,121,24,29,201,246,1,0 ; vbroadcastss 0x1f6c9(%rip),%xmm11 # 2c23c <_sk_overlay_sse2_8bit+0x5c7>
+ DB 196,98,121,24,29,5,246,1,0 ; vbroadcastss 0x1f605(%rip),%xmm11 # 2c178 <_sk_overlay_sse2_8bit+0x5c8>
DB 196,193,8,87,219 ; vxorps %xmm11,%xmm14,%xmm3
- DB 196,98,121,24,45,227,246,1,0 ; vbroadcastss 0x1f6e3(%rip),%xmm13 # 2c264 <_sk_overlay_sse2_8bit+0x5ef>
+ DB 196,98,121,24,45,31,246,1,0 ; vbroadcastss 0x1f61f(%rip),%xmm13 # 2c1a0 <_sk_overlay_sse2_8bit+0x5f0>
DB 197,145,102,219 ; vpcmpgtd %xmm3,%xmm13,%xmm3
DB 196,65,120,87,211 ; vxorps %xmm11,%xmm0,%xmm10
DB 196,65,17,102,210 ; vpcmpgtd %xmm10,%xmm13,%xmm10
@@ -12178,7 +12178,7 @@ _sk_load_f16_avx LABEL PROC
DB 196,227,125,24,195,1 ; vinsertf128 $0x1,%xmm3,%ymm0,%ymm0
DB 197,252,86,193 ; vorps %ymm1,%ymm0,%ymm0
DB 196,227,125,25,193,1 ; vextractf128 $0x1,%ymm0,%xmm1
- DB 196,226,121,24,29,153,246,1,0 ; vbroadcastss 0x1f699(%rip),%xmm3 # 2c268 <_sk_overlay_sse2_8bit+0x5f3>
+ DB 196,226,121,24,29,213,245,1,0 ; vbroadcastss 0x1f5d5(%rip),%xmm3 # 2c1a4 <_sk_overlay_sse2_8bit+0x5f4>
DB 197,241,254,203 ; vpaddd %xmm3,%xmm1,%xmm1
DB 197,249,254,195 ; vpaddd %xmm3,%xmm0,%xmm0
DB 196,227,125,24,193,1 ; vinsertf128 $0x1,%xmm1,%ymm0,%ymm0
@@ -12328,13 +12328,13 @@ _sk_load_f16_dst_avx LABEL PROC
DB 197,217,105,232 ; vpunpckhwd %xmm0,%xmm4,%xmm5
DB 196,226,121,51,228 ; vpmovzxwd %xmm4,%xmm4
DB 196,227,93,24,229,1 ; vinsertf128 $0x1,%xmm5,%ymm4,%ymm4
- DB 196,98,125,24,37,184,243,1,0 ; vbroadcastss 0x1f3b8(%rip),%ymm12 # 2c260 <_sk_overlay_sse2_8bit+0x5eb>
+ DB 196,98,125,24,37,244,242,1,0 ; vbroadcastss 0x1f2f4(%rip),%ymm12 # 2c19c <_sk_overlay_sse2_8bit+0x5ec>
DB 196,193,92,84,236 ; vandps %ymm12,%ymm4,%ymm5
DB 197,220,87,229 ; vxorps %ymm5,%ymm4,%ymm4
DB 196,195,125,25,230,1 ; vextractf128 $0x1,%ymm4,%xmm14
- DB 196,98,121,24,29,124,243,1,0 ; vbroadcastss 0x1f37c(%rip),%xmm11 # 2c23c <_sk_overlay_sse2_8bit+0x5c7>
+ DB 196,98,121,24,29,184,242,1,0 ; vbroadcastss 0x1f2b8(%rip),%xmm11 # 2c178 <_sk_overlay_sse2_8bit+0x5c8>
DB 196,193,8,87,251 ; vxorps %xmm11,%xmm14,%xmm7
- DB 196,98,121,24,45,150,243,1,0 ; vbroadcastss 0x1f396(%rip),%xmm13 # 2c264 <_sk_overlay_sse2_8bit+0x5ef>
+ DB 196,98,121,24,45,210,242,1,0 ; vbroadcastss 0x1f2d2(%rip),%xmm13 # 2c1a0 <_sk_overlay_sse2_8bit+0x5f0>
DB 197,145,102,255 ; vpcmpgtd %xmm7,%xmm13,%xmm7
DB 196,65,88,87,211 ; vxorps %xmm11,%xmm4,%xmm10
DB 196,65,17,102,210 ; vpcmpgtd %xmm10,%xmm13,%xmm10
@@ -12348,7 +12348,7 @@ _sk_load_f16_dst_avx LABEL PROC
DB 196,227,93,24,231,1 ; vinsertf128 $0x1,%xmm7,%ymm4,%ymm4
DB 197,220,86,229 ; vorps %ymm5,%ymm4,%ymm4
DB 196,227,125,25,229,1 ; vextractf128 $0x1,%ymm4,%xmm5
- DB 196,226,121,24,61,76,243,1,0 ; vbroadcastss 0x1f34c(%rip),%xmm7 # 2c268 <_sk_overlay_sse2_8bit+0x5f3>
+ DB 196,226,121,24,61,136,242,1,0 ; vbroadcastss 0x1f288(%rip),%xmm7 # 2c1a4 <_sk_overlay_sse2_8bit+0x5f4>
DB 197,209,254,239 ; vpaddd %xmm7,%xmm5,%xmm5
DB 197,217,254,231 ; vpaddd %xmm7,%xmm4,%xmm4
DB 196,227,93,24,229,1 ; vinsertf128 $0x1,%xmm5,%ymm4,%ymm4
@@ -12525,13 +12525,13 @@ _sk_gather_f16_avx LABEL PROC
DB 197,249,105,210 ; vpunpckhwd %xmm2,%xmm0,%xmm2
DB 196,226,121,51,192 ; vpmovzxwd %xmm0,%xmm0
DB 196,227,125,24,194,1 ; vinsertf128 $0x1,%xmm2,%ymm0,%ymm0
- DB 196,98,125,24,37,249,239,1,0 ; vbroadcastss 0x1eff9(%rip),%ymm12 # 2c260 <_sk_overlay_sse2_8bit+0x5eb>
+ DB 196,98,125,24,37,53,239,1,0 ; vbroadcastss 0x1ef35(%rip),%ymm12 # 2c19c <_sk_overlay_sse2_8bit+0x5ec>
DB 196,193,124,84,212 ; vandps %ymm12,%ymm0,%ymm2
DB 197,252,87,194 ; vxorps %ymm2,%ymm0,%ymm0
DB 196,195,125,25,198,1 ; vextractf128 $0x1,%ymm0,%xmm14
- DB 196,98,121,24,29,189,239,1,0 ; vbroadcastss 0x1efbd(%rip),%xmm11 # 2c23c <_sk_overlay_sse2_8bit+0x5c7>
+ DB 196,98,121,24,29,249,238,1,0 ; vbroadcastss 0x1eef9(%rip),%xmm11 # 2c178 <_sk_overlay_sse2_8bit+0x5c8>
DB 196,193,8,87,219 ; vxorps %xmm11,%xmm14,%xmm3
- DB 196,98,121,24,45,215,239,1,0 ; vbroadcastss 0x1efd7(%rip),%xmm13 # 2c264 <_sk_overlay_sse2_8bit+0x5ef>
+ DB 196,98,121,24,45,19,239,1,0 ; vbroadcastss 0x1ef13(%rip),%xmm13 # 2c1a0 <_sk_overlay_sse2_8bit+0x5f0>
DB 197,145,102,219 ; vpcmpgtd %xmm3,%xmm13,%xmm3
DB 196,65,120,87,211 ; vxorps %xmm11,%xmm0,%xmm10
DB 196,65,17,102,210 ; vpcmpgtd %xmm10,%xmm13,%xmm10
@@ -12545,7 +12545,7 @@ _sk_gather_f16_avx LABEL PROC
DB 196,227,125,24,195,1 ; vinsertf128 $0x1,%xmm3,%ymm0,%ymm0
DB 197,252,86,194 ; vorps %ymm2,%ymm0,%ymm0
DB 196,227,125,25,194,1 ; vextractf128 $0x1,%ymm0,%xmm2
- DB 196,226,121,24,29,141,239,1,0 ; vbroadcastss 0x1ef8d(%rip),%xmm3 # 2c268 <_sk_overlay_sse2_8bit+0x5f3>
+ DB 196,226,121,24,29,201,238,1,0 ; vbroadcastss 0x1eec9(%rip),%xmm3 # 2c1a4 <_sk_overlay_sse2_8bit+0x5f4>
DB 197,233,254,211 ; vpaddd %xmm3,%xmm2,%xmm2
DB 197,249,254,195 ; vpaddd %xmm3,%xmm0,%xmm0
DB 196,227,125,24,194,1 ; vinsertf128 $0x1,%xmm2,%ymm0,%ymm0
@@ -12647,12 +12647,12 @@ _sk_store_f16_avx LABEL PROC
DB 197,252,17,180,36,128,0,0,0 ; vmovups %ymm6,0x80(%rsp)
DB 197,252,17,108,36,96 ; vmovups %ymm5,0x60(%rsp)
DB 197,252,17,100,36,64 ; vmovups %ymm4,0x40(%rsp)
- DB 196,98,125,24,13,106,237,1,0 ; vbroadcastss 0x1ed6a(%rip),%ymm9 # 2c23c <_sk_overlay_sse2_8bit+0x5c7>
+ DB 196,98,125,24,13,166,236,1,0 ; vbroadcastss 0x1eca6(%rip),%ymm9 # 2c178 <_sk_overlay_sse2_8bit+0x5c8>
DB 196,65,124,84,209 ; vandps %ymm9,%ymm0,%ymm10
DB 197,252,17,4,36 ; vmovups %ymm0,(%rsp)
DB 196,65,124,87,218 ; vxorps %ymm10,%ymm0,%ymm11
DB 196,67,125,25,220,1 ; vextractf128 $0x1,%ymm11,%xmm12
- DB 196,98,121,24,5,124,237,1,0 ; vbroadcastss 0x1ed7c(%rip),%xmm8 # 2c26c <_sk_overlay_sse2_8bit+0x5f7>
+ DB 196,98,121,24,5,184,236,1,0 ; vbroadcastss 0x1ecb8(%rip),%xmm8 # 2c1a8 <_sk_overlay_sse2_8bit+0x5f8>
DB 196,65,57,102,236 ; vpcmpgtd %xmm12,%xmm8,%xmm13
DB 196,65,57,102,243 ; vpcmpgtd %xmm11,%xmm8,%xmm14
DB 196,67,13,24,237,1 ; vinsertf128 $0x1,%xmm13,%ymm14,%ymm13
@@ -12662,7 +12662,7 @@ _sk_store_f16_avx LABEL PROC
DB 196,67,13,24,242,1 ; vinsertf128 $0x1,%xmm10,%ymm14,%ymm14
DB 196,193,33,114,211,13 ; vpsrld $0xd,%xmm11,%xmm11
DB 196,193,25,114,212,13 ; vpsrld $0xd,%xmm12,%xmm12
- DB 196,98,125,24,21,67,237,1,0 ; vbroadcastss 0x1ed43(%rip),%ymm10 # 2c270 <_sk_overlay_sse2_8bit+0x5fb>
+ DB 196,98,125,24,21,127,236,1,0 ; vbroadcastss 0x1ec7f(%rip),%ymm10 # 2c1ac <_sk_overlay_sse2_8bit+0x5fc>
DB 196,65,12,86,242 ; vorps %ymm10,%ymm14,%ymm14
DB 196,67,125,25,247,1 ; vextractf128 $0x1,%ymm14,%xmm15
DB 196,65,1,254,228 ; vpaddd %xmm12,%xmm15,%xmm12
@@ -12815,7 +12815,7 @@ _sk_load_u16_be_avx LABEL PROC
DB 196,226,121,51,192 ; vpmovzxwd %xmm0,%xmm0
DB 196,227,125,24,193,1 ; vinsertf128 $0x1,%xmm1,%ymm0,%ymm0
DB 197,252,91,192 ; vcvtdq2ps %ymm0,%ymm0
- DB 196,98,125,24,29,97,233,1,0 ; vbroadcastss 0x1e961(%rip),%ymm11 # 2c174 <_sk_overlay_sse2_8bit+0x4ff>
+ DB 196,98,125,24,29,157,232,1,0 ; vbroadcastss 0x1e89d(%rip),%ymm11 # 2c0b0 <_sk_overlay_sse2_8bit+0x500>
DB 196,193,124,89,195 ; vmulps %ymm11,%ymm0,%ymm0
DB 197,177,109,202 ; vpunpckhqdq %xmm2,%xmm9,%xmm1
DB 197,233,113,241,8 ; vpsllw $0x8,%xmm1,%xmm2
@@ -12913,7 +12913,7 @@ _sk_load_rgb_u16_be_avx LABEL PROC
DB 196,226,121,51,192 ; vpmovzxwd %xmm0,%xmm0
DB 196,227,125,24,194,1 ; vinsertf128 $0x1,%xmm2,%ymm0,%ymm0
DB 197,252,91,192 ; vcvtdq2ps %ymm0,%ymm0
- DB 196,226,125,24,21,163,231,1,0 ; vbroadcastss 0x1e7a3(%rip),%ymm2 # 2c174 <_sk_overlay_sse2_8bit+0x4ff>
+ DB 196,226,125,24,21,223,230,1,0 ; vbroadcastss 0x1e6df(%rip),%ymm2 # 2c0b0 <_sk_overlay_sse2_8bit+0x500>
DB 197,252,89,194 ; vmulps %ymm2,%ymm0,%ymm0
DB 197,185,109,201 ; vpunpckhqdq %xmm1,%xmm8,%xmm1
DB 197,225,113,241,8 ; vpsllw $0x8,%xmm1,%xmm3
@@ -12934,7 +12934,7 @@ _sk_load_rgb_u16_be_avx LABEL PROC
DB 197,252,91,219 ; vcvtdq2ps %ymm3,%ymm3
DB 197,228,89,210 ; vmulps %ymm2,%ymm3,%ymm2
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,29,175,230,1,0 ; vbroadcastss 0x1e6af(%rip),%ymm3 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,226,125,24,29,235,229,1,0 ; vbroadcastss 0x1e5eb(%rip),%ymm3 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 255,224 ; jmpq *%rax
DB 196,193,121,110,4,64 ; vmovd (%r8,%rax,2),%xmm0
DB 196,65,121,196,92,64,4,2 ; vpinsrw $0x2,0x4(%r8,%rax,2),%xmm0,%xmm11
@@ -13008,7 +13008,7 @@ _sk_store_u16_be_avx LABEL PROC
DB 77,1,192 ; add %r8,%r8
DB 76,3,0 ; add (%rax),%r8
DB 73,99,193 ; movslq %r9d,%rax
- DB 196,98,125,24,5,111,230,1,0 ; vbroadcastss 0x1e66f(%rip),%ymm8 # 2c1fc <_sk_overlay_sse2_8bit+0x587>
+ DB 196,98,125,24,5,171,229,1,0 ; vbroadcastss 0x1e5ab(%rip),%ymm8 # 2c138 <_sk_overlay_sse2_8bit+0x588>
DB 196,65,124,89,200 ; vmulps %ymm8,%ymm0,%ymm9
DB 196,65,125,91,201 ; vcvtps2dq %ymm9,%ymm9
DB 196,67,125,25,202,1 ; vextractf128 $0x1,%ymm9,%xmm10
@@ -13265,7 +13265,7 @@ _sk_load_f32_dst_avx LABEL PROC
DB 255,92,255,255 ; lcall *-0x1(%rdi,%rdi,8)
DB 255,70,255 ; incl -0x1(%rsi)
DB 255 ; (bad)
- DB 255,53,255,255,255,40 ; pushq 0x28ffffff(%rip) # 2900e004 <_sk_overlay_sse2_8bit+0x28fe238f>
+ DB 255,53,255,255,255,40 ; pushq 0x28ffffff(%rip) # 2900e004 <_sk_overlay_sse2_8bit+0x28fe2454>
DB 255 ; (bad)
DB 255 ; (bad)
DB 255 ; .byte 0xff
@@ -13400,7 +13400,7 @@ _sk_mirror_x_avx LABEL PROC
DB 196,193,58,88,192 ; vaddss %xmm8,%xmm8,%xmm0
DB 196,227,121,4,192,0 ; vpermilps $0x0,%xmm0,%xmm0
DB 196,99,125,24,192,1 ; vinsertf128 $0x1,%xmm0,%ymm0,%ymm8
- DB 197,178,89,5,211,222,1,0 ; vmulss 0x1ded3(%rip),%xmm9,%xmm0 # 2c0e0 <_sk_overlay_sse2_8bit+0x46b>
+ DB 197,178,89,5,15,222,1,0 ; vmulss 0x1de0f(%rip),%xmm9,%xmm0 # 2c01c <_sk_overlay_sse2_8bit+0x46c>
DB 196,227,121,4,192,0 ; vpermilps $0x0,%xmm0,%xmm0
DB 196,227,125,24,192,1 ; vinsertf128 $0x1,%xmm0,%ymm0,%ymm0
DB 197,164,89,192 ; vmulps %ymm0,%ymm11,%ymm0
@@ -13432,7 +13432,7 @@ _sk_mirror_y_avx LABEL PROC
DB 196,193,58,88,200 ; vaddss %xmm8,%xmm8,%xmm1
DB 196,227,121,4,201,0 ; vpermilps $0x0,%xmm1,%xmm1
DB 196,99,117,24,193,1 ; vinsertf128 $0x1,%xmm1,%ymm1,%ymm8
- DB 197,178,89,13,70,222,1,0 ; vmulss 0x1de46(%rip),%xmm9,%xmm1 # 2c0e0 <_sk_overlay_sse2_8bit+0x46b>
+ DB 197,178,89,13,130,221,1,0 ; vmulss 0x1dd82(%rip),%xmm9,%xmm1 # 2c01c <_sk_overlay_sse2_8bit+0x46c>
DB 196,227,121,4,201,0 ; vpermilps $0x0,%xmm1,%xmm1
DB 196,227,117,24,201,1 ; vinsertf128 $0x1,%xmm1,%ymm1,%ymm1
DB 197,164,89,201 ; vmulps %ymm1,%ymm11,%ymm1
@@ -13457,7 +13457,7 @@ PUBLIC _sk_clamp_x_1_avx
_sk_clamp_x_1_avx LABEL PROC
DB 196,65,60,87,192 ; vxorps %ymm8,%ymm8,%ymm8
DB 197,188,95,192 ; vmaxps %ymm0,%ymm8,%ymm0
- DB 196,98,125,24,5,224,221,1,0 ; vbroadcastss 0x1dde0(%rip),%ymm8 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,98,125,24,5,28,221,1,0 ; vbroadcastss 0x1dd1c(%rip),%ymm8 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 196,193,124,93,192 ; vminps %ymm8,%ymm0,%ymm0
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
@@ -13471,9 +13471,9 @@ _sk_repeat_x_1_avx LABEL PROC
PUBLIC _sk_mirror_x_1_avx
_sk_mirror_x_1_avx LABEL PROC
- DB 196,98,125,24,5,215,221,1,0 ; vbroadcastss 0x1ddd7(%rip),%ymm8 # 2c0fc <_sk_overlay_sse2_8bit+0x487>
+ DB 196,98,125,24,5,19,221,1,0 ; vbroadcastss 0x1dd13(%rip),%ymm8 # 2c038 <_sk_overlay_sse2_8bit+0x488>
DB 196,193,124,88,192 ; vaddps %ymm8,%ymm0,%ymm0
- DB 196,98,125,24,13,173,221,1,0 ; vbroadcastss 0x1ddad(%rip),%ymm9 # 2c0e0 <_sk_overlay_sse2_8bit+0x46b>
+ DB 196,98,125,24,13,233,220,1,0 ; vbroadcastss 0x1dce9(%rip),%ymm9 # 2c01c <_sk_overlay_sse2_8bit+0x46c>
DB 196,65,124,89,201 ; vmulps %ymm9,%ymm0,%ymm9
DB 196,67,125,8,201,1 ; vroundps $0x1,%ymm9,%ymm9
DB 196,65,52,88,201 ; vaddps %ymm9,%ymm9,%ymm9
@@ -13487,12 +13487,12 @@ _sk_mirror_x_1_avx LABEL PROC
PUBLIC _sk_luminance_to_alpha_avx
_sk_luminance_to_alpha_avx LABEL PROC
- DB 196,226,125,24,29,153,222,1,0 ; vbroadcastss 0x1de99(%rip),%ymm3 # 2c200 <_sk_overlay_sse2_8bit+0x58b>
+ DB 196,226,125,24,29,213,221,1,0 ; vbroadcastss 0x1ddd5(%rip),%ymm3 # 2c13c <_sk_overlay_sse2_8bit+0x58c>
DB 197,252,89,195 ; vmulps %ymm3,%ymm0,%ymm0
- DB 196,226,125,24,29,144,222,1,0 ; vbroadcastss 0x1de90(%rip),%ymm3 # 2c204 <_sk_overlay_sse2_8bit+0x58f>
+ DB 196,226,125,24,29,204,221,1,0 ; vbroadcastss 0x1ddcc(%rip),%ymm3 # 2c140 <_sk_overlay_sse2_8bit+0x590>
DB 197,244,89,203 ; vmulps %ymm3,%ymm1,%ymm1
DB 197,252,88,193 ; vaddps %ymm1,%ymm0,%ymm0
- DB 196,226,125,24,13,131,222,1,0 ; vbroadcastss 0x1de83(%rip),%ymm1 # 2c208 <_sk_overlay_sse2_8bit+0x593>
+ DB 196,226,125,24,13,191,221,1,0 ; vbroadcastss 0x1ddbf(%rip),%ymm1 # 2c144 <_sk_overlay_sse2_8bit+0x594>
DB 197,236,89,201 ; vmulps %ymm1,%ymm2,%ymm1
DB 197,252,88,217 ; vaddps %ymm1,%ymm0,%ymm3
DB 72,173 ; lods %ds:(%rsi),%rax
@@ -13884,18 +13884,18 @@ _sk_evenly_spaced_gradient_avx LABEL PROC
PUBLIC _sk_gauss_a_to_rgba_avx
_sk_gauss_a_to_rgba_avx LABEL PROC
- DB 196,226,125,24,5,152,215,1,0 ; vbroadcastss 0x1d798(%rip),%ymm0 # 2c210 <_sk_overlay_sse2_8bit+0x59b>
+ DB 196,226,125,24,5,212,214,1,0 ; vbroadcastss 0x1d6d4(%rip),%ymm0 # 2c14c <_sk_overlay_sse2_8bit+0x59c>
DB 197,228,89,192 ; vmulps %ymm0,%ymm3,%ymm0
- DB 196,226,125,24,13,135,215,1,0 ; vbroadcastss 0x1d787(%rip),%ymm1 # 2c20c <_sk_overlay_sse2_8bit+0x597>
+ DB 196,226,125,24,13,195,214,1,0 ; vbroadcastss 0x1d6c3(%rip),%ymm1 # 2c148 <_sk_overlay_sse2_8bit+0x598>
DB 197,252,88,193 ; vaddps %ymm1,%ymm0,%ymm0
DB 197,252,89,195 ; vmulps %ymm3,%ymm0,%ymm0
- DB 196,226,125,24,13,126,215,1,0 ; vbroadcastss 0x1d77e(%rip),%ymm1 # 2c214 <_sk_overlay_sse2_8bit+0x59f>
+ DB 196,226,125,24,13,186,214,1,0 ; vbroadcastss 0x1d6ba(%rip),%ymm1 # 2c150 <_sk_overlay_sse2_8bit+0x5a0>
DB 197,252,88,193 ; vaddps %ymm1,%ymm0,%ymm0
DB 197,252,89,195 ; vmulps %ymm3,%ymm0,%ymm0
- DB 196,226,125,24,13,113,215,1,0 ; vbroadcastss 0x1d771(%rip),%ymm1 # 2c218 <_sk_overlay_sse2_8bit+0x5a3>
+ DB 196,226,125,24,13,173,214,1,0 ; vbroadcastss 0x1d6ad(%rip),%ymm1 # 2c154 <_sk_overlay_sse2_8bit+0x5a4>
DB 197,252,88,193 ; vaddps %ymm1,%ymm0,%ymm0
DB 197,252,89,195 ; vmulps %ymm3,%ymm0,%ymm0
- DB 196,226,125,24,13,100,215,1,0 ; vbroadcastss 0x1d764(%rip),%ymm1 # 2c21c <_sk_overlay_sse2_8bit+0x5a7>
+ DB 196,226,125,24,13,160,214,1,0 ; vbroadcastss 0x1d6a0(%rip),%ymm1 # 2c158 <_sk_overlay_sse2_8bit+0x5a8>
DB 197,252,88,193 ; vaddps %ymm1,%ymm0,%ymm0
DB 72,173 ; lods %ds:(%rsi),%rax
DB 197,252,40,200 ; vmovaps %ymm0,%ymm1
@@ -13921,7 +13921,7 @@ _sk_gradient_avx LABEL PROC
DB 73,255,200 ; dec %r8
DB 72,131,195,4 ; add $0x4,%rbx
DB 196,65,52,87,201 ; vxorps %ymm9,%ymm9,%ymm9
- DB 196,98,125,24,21,226,213,1,0 ; vbroadcastss 0x1d5e2(%rip),%ymm10 # 2c0e8 <_sk_overlay_sse2_8bit+0x473>
+ DB 196,98,125,24,21,30,213,1,0 ; vbroadcastss 0x1d51e(%rip),%ymm10 # 2c024 <_sk_overlay_sse2_8bit+0x474>
DB 197,244,87,201 ; vxorps %ymm1,%ymm1,%ymm1
DB 196,98,125,24,3 ; vbroadcastss (%rbx),%ymm8
DB 197,60,194,192,2 ; vcmpleps %ymm0,%ymm8,%ymm8
@@ -14112,27 +14112,27 @@ _sk_xy_to_unit_angle_avx LABEL PROC
DB 196,65,52,95,226 ; vmaxps %ymm10,%ymm9,%ymm12
DB 196,65,36,94,220 ; vdivps %ymm12,%ymm11,%ymm11
DB 196,65,36,89,227 ; vmulps %ymm11,%ymm11,%ymm12
- DB 196,98,125,24,45,10,211,1,0 ; vbroadcastss 0x1d30a(%rip),%ymm13 # 2c220 <_sk_overlay_sse2_8bit+0x5ab>
+ DB 196,98,125,24,45,70,210,1,0 ; vbroadcastss 0x1d246(%rip),%ymm13 # 2c15c <_sk_overlay_sse2_8bit+0x5ac>
DB 196,65,28,89,237 ; vmulps %ymm13,%ymm12,%ymm13
- DB 196,98,125,24,53,0,211,1,0 ; vbroadcastss 0x1d300(%rip),%ymm14 # 2c224 <_sk_overlay_sse2_8bit+0x5af>
+ DB 196,98,125,24,53,60,210,1,0 ; vbroadcastss 0x1d23c(%rip),%ymm14 # 2c160 <_sk_overlay_sse2_8bit+0x5b0>
DB 196,65,20,88,238 ; vaddps %ymm14,%ymm13,%ymm13
DB 196,65,28,89,237 ; vmulps %ymm13,%ymm12,%ymm13
- DB 196,98,125,24,53,241,210,1,0 ; vbroadcastss 0x1d2f1(%rip),%ymm14 # 2c228 <_sk_overlay_sse2_8bit+0x5b3>
+ DB 196,98,125,24,53,45,210,1,0 ; vbroadcastss 0x1d22d(%rip),%ymm14 # 2c164 <_sk_overlay_sse2_8bit+0x5b4>
DB 196,65,20,88,238 ; vaddps %ymm14,%ymm13,%ymm13
DB 196,65,28,89,229 ; vmulps %ymm13,%ymm12,%ymm12
- DB 196,98,125,24,45,226,210,1,0 ; vbroadcastss 0x1d2e2(%rip),%ymm13 # 2c22c <_sk_overlay_sse2_8bit+0x5b7>
+ DB 196,98,125,24,45,30,210,1,0 ; vbroadcastss 0x1d21e(%rip),%ymm13 # 2c168 <_sk_overlay_sse2_8bit+0x5b8>
DB 196,65,28,88,229 ; vaddps %ymm13,%ymm12,%ymm12
DB 196,65,36,89,220 ; vmulps %ymm12,%ymm11,%ymm11
DB 196,65,52,194,202,1 ; vcmpltps %ymm10,%ymm9,%ymm9
- DB 196,98,125,24,21,205,210,1,0 ; vbroadcastss 0x1d2cd(%rip),%ymm10 # 2c230 <_sk_overlay_sse2_8bit+0x5bb>
+ DB 196,98,125,24,21,9,210,1,0 ; vbroadcastss 0x1d209(%rip),%ymm10 # 2c16c <_sk_overlay_sse2_8bit+0x5bc>
DB 196,65,44,92,211 ; vsubps %ymm11,%ymm10,%ymm10
DB 196,67,37,74,202,144 ; vblendvps %ymm9,%ymm10,%ymm11,%ymm9
DB 196,193,124,194,192,1 ; vcmpltps %ymm8,%ymm0,%ymm0
- DB 196,98,125,24,21,99,209,1,0 ; vbroadcastss 0x1d163(%rip),%ymm10 # 2c0e0 <_sk_overlay_sse2_8bit+0x46b>
+ DB 196,98,125,24,21,159,208,1,0 ; vbroadcastss 0x1d09f(%rip),%ymm10 # 2c01c <_sk_overlay_sse2_8bit+0x46c>
DB 196,65,44,92,209 ; vsubps %ymm9,%ymm10,%ymm10
DB 196,195,53,74,194,0 ; vblendvps %ymm0,%ymm10,%ymm9,%ymm0
DB 196,65,116,194,200,1 ; vcmpltps %ymm8,%ymm1,%ymm9
- DB 196,98,125,24,21,77,209,1,0 ; vbroadcastss 0x1d14d(%rip),%ymm10 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,98,125,24,21,137,208,1,0 ; vbroadcastss 0x1d089(%rip),%ymm10 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 197,44,92,208 ; vsubps %ymm0,%ymm10,%ymm10
DB 196,195,125,74,194,144 ; vblendvps %ymm9,%ymm10,%ymm0,%ymm0
DB 196,65,124,194,200,3 ; vcmpunordps %ymm8,%ymm0,%ymm9
@@ -14158,7 +14158,7 @@ _sk_xy_to_2pt_conical_quadratic_max_avx LABEL PROC
DB 196,67,121,4,210,0 ; vpermilps $0x0,%xmm10,%xmm10
DB 196,67,45,24,210,1 ; vinsertf128 $0x1,%xmm10,%ymm10,%ymm10
DB 197,44,88,208 ; vaddps %ymm0,%ymm10,%ymm10
- DB 196,98,125,24,29,67,210,1,0 ; vbroadcastss 0x1d243(%rip),%ymm11 # 2c234 <_sk_overlay_sse2_8bit+0x5bf>
+ DB 196,98,125,24,29,127,209,1,0 ; vbroadcastss 0x1d17f(%rip),%ymm11 # 2c170 <_sk_overlay_sse2_8bit+0x5c0>
DB 196,65,44,89,211 ; vmulps %ymm11,%ymm10,%ymm10
DB 197,252,89,192 ; vmulps %ymm0,%ymm0,%ymm0
DB 197,116,89,217 ; vmulps %ymm1,%ymm1,%ymm11
@@ -14167,17 +14167,17 @@ _sk_xy_to_2pt_conical_quadratic_max_avx LABEL PROC
DB 196,227,121,4,192,0 ; vpermilps $0x0,%xmm0,%xmm0
DB 196,227,125,24,192,1 ; vinsertf128 $0x1,%xmm0,%ymm0,%ymm0
DB 197,164,92,192 ; vsubps %ymm0,%ymm11,%ymm0
- DB 196,98,125,24,13,23,210,1,0 ; vbroadcastss 0x1d217(%rip),%ymm9 # 2c238 <_sk_overlay_sse2_8bit+0x5c3>
+ DB 196,98,125,24,13,83,209,1,0 ; vbroadcastss 0x1d153(%rip),%ymm9 # 2c174 <_sk_overlay_sse2_8bit+0x5c4>
DB 196,65,60,89,193 ; vmulps %ymm9,%ymm8,%ymm8
DB 197,188,89,192 ; vmulps %ymm0,%ymm8,%ymm0
DB 196,65,44,89,194 ; vmulps %ymm10,%ymm10,%ymm8
DB 196,193,124,88,192 ; vaddps %ymm8,%ymm0,%ymm0
DB 197,252,81,192 ; vsqrtps %ymm0,%ymm0
DB 196,98,125,24,64,36 ; vbroadcastss 0x24(%rax),%ymm8
- DB 196,98,125,24,13,245,209,1,0 ; vbroadcastss 0x1d1f5(%rip),%ymm9 # 2c23c <_sk_overlay_sse2_8bit+0x5c7>
+ DB 196,98,125,24,13,49,209,1,0 ; vbroadcastss 0x1d131(%rip),%ymm9 # 2c178 <_sk_overlay_sse2_8bit+0x5c8>
DB 196,65,44,87,201 ; vxorps %ymm9,%ymm10,%ymm9
DB 196,65,124,92,210 ; vsubps %ymm10,%ymm0,%ymm10
- DB 196,98,125,24,29,134,208,1,0 ; vbroadcastss 0x1d086(%rip),%ymm11 # 2c0e0 <_sk_overlay_sse2_8bit+0x46b>
+ DB 196,98,125,24,29,194,207,1,0 ; vbroadcastss 0x1cfc2(%rip),%ymm11 # 2c01c <_sk_overlay_sse2_8bit+0x46c>
DB 196,65,60,89,195 ; vmulps %ymm11,%ymm8,%ymm8
DB 196,65,60,89,210 ; vmulps %ymm10,%ymm8,%ymm10
DB 197,180,92,192 ; vsubps %ymm0,%ymm9,%ymm0
@@ -14195,7 +14195,7 @@ _sk_xy_to_2pt_conical_quadratic_min_avx LABEL PROC
DB 196,67,121,4,210,0 ; vpermilps $0x0,%xmm10,%xmm10
DB 196,67,45,24,210,1 ; vinsertf128 $0x1,%xmm10,%ymm10,%ymm10
DB 197,44,88,208 ; vaddps %ymm0,%ymm10,%ymm10
- DB 196,98,125,24,29,149,209,1,0 ; vbroadcastss 0x1d195(%rip),%ymm11 # 2c234 <_sk_overlay_sse2_8bit+0x5bf>
+ DB 196,98,125,24,29,209,208,1,0 ; vbroadcastss 0x1d0d1(%rip),%ymm11 # 2c170 <_sk_overlay_sse2_8bit+0x5c0>
DB 196,65,44,89,211 ; vmulps %ymm11,%ymm10,%ymm10
DB 197,252,89,192 ; vmulps %ymm0,%ymm0,%ymm0
DB 197,116,89,217 ; vmulps %ymm1,%ymm1,%ymm11
@@ -14204,17 +14204,17 @@ _sk_xy_to_2pt_conical_quadratic_min_avx LABEL PROC
DB 196,227,121,4,192,0 ; vpermilps $0x0,%xmm0,%xmm0
DB 196,227,125,24,192,1 ; vinsertf128 $0x1,%xmm0,%ymm0,%ymm0
DB 197,164,92,192 ; vsubps %ymm0,%ymm11,%ymm0
- DB 196,98,125,24,13,105,209,1,0 ; vbroadcastss 0x1d169(%rip),%ymm9 # 2c238 <_sk_overlay_sse2_8bit+0x5c3>
+ DB 196,98,125,24,13,165,208,1,0 ; vbroadcastss 0x1d0a5(%rip),%ymm9 # 2c174 <_sk_overlay_sse2_8bit+0x5c4>
DB 196,65,60,89,193 ; vmulps %ymm9,%ymm8,%ymm8
DB 197,188,89,192 ; vmulps %ymm0,%ymm8,%ymm0
DB 196,65,44,89,194 ; vmulps %ymm10,%ymm10,%ymm8
DB 196,193,124,88,192 ; vaddps %ymm8,%ymm0,%ymm0
DB 197,252,81,192 ; vsqrtps %ymm0,%ymm0
DB 196,98,125,24,64,36 ; vbroadcastss 0x24(%rax),%ymm8
- DB 196,98,125,24,13,71,209,1,0 ; vbroadcastss 0x1d147(%rip),%ymm9 # 2c23c <_sk_overlay_sse2_8bit+0x5c7>
+ DB 196,98,125,24,13,131,208,1,0 ; vbroadcastss 0x1d083(%rip),%ymm9 # 2c178 <_sk_overlay_sse2_8bit+0x5c8>
DB 196,65,44,87,201 ; vxorps %ymm9,%ymm10,%ymm9
DB 196,65,124,92,210 ; vsubps %ymm10,%ymm0,%ymm10
- DB 196,98,125,24,29,216,207,1,0 ; vbroadcastss 0x1cfd8(%rip),%ymm11 # 2c0e0 <_sk_overlay_sse2_8bit+0x46b>
+ DB 196,98,125,24,29,20,207,1,0 ; vbroadcastss 0x1cf14(%rip),%ymm11 # 2c01c <_sk_overlay_sse2_8bit+0x46c>
DB 196,65,60,89,195 ; vmulps %ymm11,%ymm8,%ymm8
DB 196,65,60,89,210 ; vmulps %ymm10,%ymm8,%ymm10
DB 197,180,92,192 ; vsubps %ymm0,%ymm9,%ymm0
@@ -14231,7 +14231,7 @@ _sk_xy_to_2pt_conical_linear_avx LABEL PROC
DB 196,67,121,4,201,0 ; vpermilps $0x0,%xmm9,%xmm9
DB 196,67,53,24,201,1 ; vinsertf128 $0x1,%xmm9,%ymm9,%ymm9
DB 197,52,88,200 ; vaddps %ymm0,%ymm9,%ymm9
- DB 196,98,125,24,21,237,208,1,0 ; vbroadcastss 0x1d0ed(%rip),%ymm10 # 2c234 <_sk_overlay_sse2_8bit+0x5bf>
+ DB 196,98,125,24,21,41,208,1,0 ; vbroadcastss 0x1d029(%rip),%ymm10 # 2c170 <_sk_overlay_sse2_8bit+0x5c0>
DB 196,65,52,89,202 ; vmulps %ymm10,%ymm9,%ymm9
DB 197,252,89,192 ; vmulps %ymm0,%ymm0,%ymm0
DB 197,116,89,209 ; vmulps %ymm1,%ymm1,%ymm10
@@ -14240,7 +14240,7 @@ _sk_xy_to_2pt_conical_linear_avx LABEL PROC
DB 196,227,121,4,192,0 ; vpermilps $0x0,%xmm0,%xmm0
DB 196,227,125,24,192,1 ; vinsertf128 $0x1,%xmm0,%ymm0,%ymm0
DB 197,172,92,192 ; vsubps %ymm0,%ymm10,%ymm0
- DB 196,98,125,24,5,197,208,1,0 ; vbroadcastss 0x1d0c5(%rip),%ymm8 # 2c23c <_sk_overlay_sse2_8bit+0x5c7>
+ DB 196,98,125,24,5,1,208,1,0 ; vbroadcastss 0x1d001(%rip),%ymm8 # 2c178 <_sk_overlay_sse2_8bit+0x5c8>
DB 196,193,124,87,192 ; vxorps %ymm8,%ymm0,%ymm0
DB 196,193,124,94,193 ; vdivps %ymm9,%ymm0,%ymm0
DB 72,173 ; lods %ds:(%rsi),%rax
@@ -14275,7 +14275,7 @@ _sk_apply_vector_mask_avx LABEL PROC
PUBLIC _sk_save_xy_avx
_sk_save_xy_avx LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,98,125,24,5,1,207,1,0 ; vbroadcastss 0x1cf01(%rip),%ymm8 # 2c0e0 <_sk_overlay_sse2_8bit+0x46b>
+ DB 196,98,125,24,5,61,206,1,0 ; vbroadcastss 0x1ce3d(%rip),%ymm8 # 2c01c <_sk_overlay_sse2_8bit+0x46c>
DB 196,65,124,88,200 ; vaddps %ymm8,%ymm0,%ymm9
DB 196,67,125,8,209,1 ; vroundps $0x1,%ymm9,%ymm10
DB 196,65,52,92,202 ; vsubps %ymm10,%ymm9,%ymm9
@@ -14308,9 +14308,9 @@ _sk_accumulate_avx LABEL PROC
PUBLIC _sk_bilinear_nx_avx
_sk_bilinear_nx_avx LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,5,233,207,1,0 ; vbroadcastss 0x1cfe9(%rip),%ymm0 # 2c240 <_sk_overlay_sse2_8bit+0x5cb>
+ DB 196,226,125,24,5,37,207,1,0 ; vbroadcastss 0x1cf25(%rip),%ymm0 # 2c17c <_sk_overlay_sse2_8bit+0x5cc>
DB 197,252,88,0 ; vaddps (%rax),%ymm0,%ymm0
- DB 196,98,125,24,5,128,206,1,0 ; vbroadcastss 0x1ce80(%rip),%ymm8 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,98,125,24,5,188,205,1,0 ; vbroadcastss 0x1cdbc(%rip),%ymm8 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 197,60,92,64,64 ; vsubps 0x40(%rax),%ymm8,%ymm8
DB 197,124,17,128,128,0,0,0 ; vmovups %ymm8,0x80(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
@@ -14319,7 +14319,7 @@ _sk_bilinear_nx_avx LABEL PROC
PUBLIC _sk_bilinear_px_avx
_sk_bilinear_px_avx LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,5,96,206,1,0 ; vbroadcastss 0x1ce60(%rip),%ymm0 # 2c0e0 <_sk_overlay_sse2_8bit+0x46b>
+ DB 196,226,125,24,5,156,205,1,0 ; vbroadcastss 0x1cd9c(%rip),%ymm0 # 2c01c <_sk_overlay_sse2_8bit+0x46c>
DB 197,252,88,0 ; vaddps (%rax),%ymm0,%ymm0
DB 197,124,16,64,64 ; vmovups 0x40(%rax),%ymm8
DB 197,124,17,128,128,0,0,0 ; vmovups %ymm8,0x80(%rax)
@@ -14329,9 +14329,9 @@ _sk_bilinear_px_avx LABEL PROC
PUBLIC _sk_bilinear_ny_avx
_sk_bilinear_ny_avx LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,13,160,207,1,0 ; vbroadcastss 0x1cfa0(%rip),%ymm1 # 2c240 <_sk_overlay_sse2_8bit+0x5cb>
+ DB 196,226,125,24,13,220,206,1,0 ; vbroadcastss 0x1cedc(%rip),%ymm1 # 2c17c <_sk_overlay_sse2_8bit+0x5cc>
DB 197,244,88,72,32 ; vaddps 0x20(%rax),%ymm1,%ymm1
- DB 196,98,125,24,5,54,206,1,0 ; vbroadcastss 0x1ce36(%rip),%ymm8 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,98,125,24,5,114,205,1,0 ; vbroadcastss 0x1cd72(%rip),%ymm8 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 197,60,92,64,96 ; vsubps 0x60(%rax),%ymm8,%ymm8
DB 197,124,17,128,160,0,0,0 ; vmovups %ymm8,0xa0(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
@@ -14340,7 +14340,7 @@ _sk_bilinear_ny_avx LABEL PROC
PUBLIC _sk_bilinear_py_avx
_sk_bilinear_py_avx LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,13,22,206,1,0 ; vbroadcastss 0x1ce16(%rip),%ymm1 # 2c0e0 <_sk_overlay_sse2_8bit+0x46b>
+ DB 196,226,125,24,13,82,205,1,0 ; vbroadcastss 0x1cd52(%rip),%ymm1 # 2c01c <_sk_overlay_sse2_8bit+0x46c>
DB 197,244,88,72,32 ; vaddps 0x20(%rax),%ymm1,%ymm1
DB 197,124,16,64,96 ; vmovups 0x60(%rax),%ymm8
DB 197,124,17,128,160,0,0,0 ; vmovups %ymm8,0xa0(%rax)
@@ -14350,14 +14350,14 @@ _sk_bilinear_py_avx LABEL PROC
PUBLIC _sk_bicubic_n3x_avx
_sk_bicubic_n3x_avx LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,5,89,207,1,0 ; vbroadcastss 0x1cf59(%rip),%ymm0 # 2c244 <_sk_overlay_sse2_8bit+0x5cf>
+ DB 196,226,125,24,5,149,206,1,0 ; vbroadcastss 0x1ce95(%rip),%ymm0 # 2c180 <_sk_overlay_sse2_8bit+0x5d0>
DB 197,252,88,0 ; vaddps (%rax),%ymm0,%ymm0
- DB 196,98,125,24,5,236,205,1,0 ; vbroadcastss 0x1cdec(%rip),%ymm8 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,98,125,24,5,40,205,1,0 ; vbroadcastss 0x1cd28(%rip),%ymm8 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 197,60,92,64,64 ; vsubps 0x40(%rax),%ymm8,%ymm8
DB 196,65,60,89,200 ; vmulps %ymm8,%ymm8,%ymm9
- DB 196,98,125,24,21,61,207,1,0 ; vbroadcastss 0x1cf3d(%rip),%ymm10 # 2c248 <_sk_overlay_sse2_8bit+0x5d3>
+ DB 196,98,125,24,21,121,206,1,0 ; vbroadcastss 0x1ce79(%rip),%ymm10 # 2c184 <_sk_overlay_sse2_8bit+0x5d4>
DB 196,65,60,89,194 ; vmulps %ymm10,%ymm8,%ymm8
- DB 196,98,125,24,21,59,206,1,0 ; vbroadcastss 0x1ce3b(%rip),%ymm10 # 2c154 <_sk_overlay_sse2_8bit+0x4df>
+ DB 196,98,125,24,21,119,205,1,0 ; vbroadcastss 0x1cd77(%rip),%ymm10 # 2c090 <_sk_overlay_sse2_8bit+0x4e0>
DB 196,65,60,88,194 ; vaddps %ymm10,%ymm8,%ymm8
DB 196,65,52,89,192 ; vmulps %ymm8,%ymm9,%ymm8
DB 197,124,17,128,128,0,0,0 ; vmovups %ymm8,0x80(%rax)
@@ -14367,19 +14367,19 @@ _sk_bicubic_n3x_avx LABEL PROC
PUBLIC _sk_bicubic_n1x_avx
_sk_bicubic_n1x_avx LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,5,6,207,1,0 ; vbroadcastss 0x1cf06(%rip),%ymm0 # 2c240 <_sk_overlay_sse2_8bit+0x5cb>
+ DB 196,226,125,24,5,66,206,1,0 ; vbroadcastss 0x1ce42(%rip),%ymm0 # 2c17c <_sk_overlay_sse2_8bit+0x5cc>
DB 197,252,88,0 ; vaddps (%rax),%ymm0,%ymm0
- DB 196,98,125,24,5,157,205,1,0 ; vbroadcastss 0x1cd9d(%rip),%ymm8 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,98,125,24,5,217,204,1,0 ; vbroadcastss 0x1ccd9(%rip),%ymm8 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 197,60,92,64,64 ; vsubps 0x40(%rax),%ymm8,%ymm8
- DB 196,98,125,24,13,251,206,1,0 ; vbroadcastss 0x1cefb(%rip),%ymm9 # 2c250 <_sk_overlay_sse2_8bit+0x5db>
+ DB 196,98,125,24,13,55,206,1,0 ; vbroadcastss 0x1ce37(%rip),%ymm9 # 2c18c <_sk_overlay_sse2_8bit+0x5dc>
DB 196,65,60,89,201 ; vmulps %ymm9,%ymm8,%ymm9
- DB 196,98,125,24,21,233,206,1,0 ; vbroadcastss 0x1cee9(%rip),%ymm10 # 2c24c <_sk_overlay_sse2_8bit+0x5d7>
+ DB 196,98,125,24,21,37,206,1,0 ; vbroadcastss 0x1ce25(%rip),%ymm10 # 2c188 <_sk_overlay_sse2_8bit+0x5d8>
DB 196,65,52,88,202 ; vaddps %ymm10,%ymm9,%ymm9
DB 196,65,60,89,201 ; vmulps %ymm9,%ymm8,%ymm9
- DB 196,98,125,24,21,106,205,1,0 ; vbroadcastss 0x1cd6a(%rip),%ymm10 # 2c0e0 <_sk_overlay_sse2_8bit+0x46b>
+ DB 196,98,125,24,21,166,204,1,0 ; vbroadcastss 0x1cca6(%rip),%ymm10 # 2c01c <_sk_overlay_sse2_8bit+0x46c>
DB 196,65,52,88,202 ; vaddps %ymm10,%ymm9,%ymm9
DB 196,65,60,89,193 ; vmulps %ymm9,%ymm8,%ymm8
- DB 196,98,125,24,13,203,206,1,0 ; vbroadcastss 0x1cecb(%rip),%ymm9 # 2c254 <_sk_overlay_sse2_8bit+0x5df>
+ DB 196,98,125,24,13,7,206,1,0 ; vbroadcastss 0x1ce07(%rip),%ymm9 # 2c190 <_sk_overlay_sse2_8bit+0x5e0>
DB 196,65,60,88,193 ; vaddps %ymm9,%ymm8,%ymm8
DB 197,124,17,128,128,0,0,0 ; vmovups %ymm8,0x80(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
@@ -14388,17 +14388,17 @@ _sk_bicubic_n1x_avx LABEL PROC
PUBLIC _sk_bicubic_p1x_avx
_sk_bicubic_p1x_avx LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,98,125,24,5,59,205,1,0 ; vbroadcastss 0x1cd3b(%rip),%ymm8 # 2c0e0 <_sk_overlay_sse2_8bit+0x46b>
+ DB 196,98,125,24,5,119,204,1,0 ; vbroadcastss 0x1cc77(%rip),%ymm8 # 2c01c <_sk_overlay_sse2_8bit+0x46c>
DB 197,188,88,0 ; vaddps (%rax),%ymm8,%ymm0
DB 197,124,16,72,64 ; vmovups 0x40(%rax),%ymm9
- DB 196,98,125,24,21,153,206,1,0 ; vbroadcastss 0x1ce99(%rip),%ymm10 # 2c250 <_sk_overlay_sse2_8bit+0x5db>
+ DB 196,98,125,24,21,213,205,1,0 ; vbroadcastss 0x1cdd5(%rip),%ymm10 # 2c18c <_sk_overlay_sse2_8bit+0x5dc>
DB 196,65,52,89,210 ; vmulps %ymm10,%ymm9,%ymm10
- DB 196,98,125,24,29,135,206,1,0 ; vbroadcastss 0x1ce87(%rip),%ymm11 # 2c24c <_sk_overlay_sse2_8bit+0x5d7>
+ DB 196,98,125,24,29,195,205,1,0 ; vbroadcastss 0x1cdc3(%rip),%ymm11 # 2c188 <_sk_overlay_sse2_8bit+0x5d8>
DB 196,65,44,88,211 ; vaddps %ymm11,%ymm10,%ymm10
DB 196,65,52,89,210 ; vmulps %ymm10,%ymm9,%ymm10
DB 196,65,44,88,192 ; vaddps %ymm8,%ymm10,%ymm8
DB 196,65,52,89,192 ; vmulps %ymm8,%ymm9,%ymm8
- DB 196,98,125,24,13,114,206,1,0 ; vbroadcastss 0x1ce72(%rip),%ymm9 # 2c254 <_sk_overlay_sse2_8bit+0x5df>
+ DB 196,98,125,24,13,174,205,1,0 ; vbroadcastss 0x1cdae(%rip),%ymm9 # 2c190 <_sk_overlay_sse2_8bit+0x5e0>
DB 196,65,60,88,193 ; vaddps %ymm9,%ymm8,%ymm8
DB 197,124,17,128,128,0,0,0 ; vmovups %ymm8,0x80(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
@@ -14407,13 +14407,13 @@ _sk_bicubic_p1x_avx LABEL PROC
PUBLIC _sk_bicubic_p3x_avx
_sk_bicubic_p3x_avx LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,5,78,206,1,0 ; vbroadcastss 0x1ce4e(%rip),%ymm0 # 2c24c <_sk_overlay_sse2_8bit+0x5d7>
+ DB 196,226,125,24,5,138,205,1,0 ; vbroadcastss 0x1cd8a(%rip),%ymm0 # 2c188 <_sk_overlay_sse2_8bit+0x5d8>
DB 197,252,88,0 ; vaddps (%rax),%ymm0,%ymm0
DB 197,124,16,64,64 ; vmovups 0x40(%rax),%ymm8
DB 196,65,60,89,200 ; vmulps %ymm8,%ymm8,%ymm9
- DB 196,98,125,24,21,51,206,1,0 ; vbroadcastss 0x1ce33(%rip),%ymm10 # 2c248 <_sk_overlay_sse2_8bit+0x5d3>
+ DB 196,98,125,24,21,111,205,1,0 ; vbroadcastss 0x1cd6f(%rip),%ymm10 # 2c184 <_sk_overlay_sse2_8bit+0x5d4>
DB 196,65,60,89,194 ; vmulps %ymm10,%ymm8,%ymm8
- DB 196,98,125,24,21,49,205,1,0 ; vbroadcastss 0x1cd31(%rip),%ymm10 # 2c154 <_sk_overlay_sse2_8bit+0x4df>
+ DB 196,98,125,24,21,109,204,1,0 ; vbroadcastss 0x1cc6d(%rip),%ymm10 # 2c090 <_sk_overlay_sse2_8bit+0x4e0>
DB 196,65,60,88,194 ; vaddps %ymm10,%ymm8,%ymm8
DB 196,65,52,89,192 ; vmulps %ymm8,%ymm9,%ymm8
DB 197,124,17,128,128,0,0,0 ; vmovups %ymm8,0x80(%rax)
@@ -14423,14 +14423,14 @@ _sk_bicubic_p3x_avx LABEL PROC
PUBLIC _sk_bicubic_n3y_avx
_sk_bicubic_n3y_avx LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,13,0,206,1,0 ; vbroadcastss 0x1ce00(%rip),%ymm1 # 2c244 <_sk_overlay_sse2_8bit+0x5cf>
+ DB 196,226,125,24,13,60,205,1,0 ; vbroadcastss 0x1cd3c(%rip),%ymm1 # 2c180 <_sk_overlay_sse2_8bit+0x5d0>
DB 197,244,88,72,32 ; vaddps 0x20(%rax),%ymm1,%ymm1
- DB 196,98,125,24,5,146,204,1,0 ; vbroadcastss 0x1cc92(%rip),%ymm8 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,98,125,24,5,206,203,1,0 ; vbroadcastss 0x1cbce(%rip),%ymm8 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 197,60,92,64,96 ; vsubps 0x60(%rax),%ymm8,%ymm8
DB 196,65,60,89,200 ; vmulps %ymm8,%ymm8,%ymm9
- DB 196,98,125,24,21,227,205,1,0 ; vbroadcastss 0x1cde3(%rip),%ymm10 # 2c248 <_sk_overlay_sse2_8bit+0x5d3>
+ DB 196,98,125,24,21,31,205,1,0 ; vbroadcastss 0x1cd1f(%rip),%ymm10 # 2c184 <_sk_overlay_sse2_8bit+0x5d4>
DB 196,65,60,89,194 ; vmulps %ymm10,%ymm8,%ymm8
- DB 196,98,125,24,21,225,204,1,0 ; vbroadcastss 0x1cce1(%rip),%ymm10 # 2c154 <_sk_overlay_sse2_8bit+0x4df>
+ DB 196,98,125,24,21,29,204,1,0 ; vbroadcastss 0x1cc1d(%rip),%ymm10 # 2c090 <_sk_overlay_sse2_8bit+0x4e0>
DB 196,65,60,88,194 ; vaddps %ymm10,%ymm8,%ymm8
DB 196,65,52,89,192 ; vmulps %ymm8,%ymm9,%ymm8
DB 197,124,17,128,160,0,0,0 ; vmovups %ymm8,0xa0(%rax)
@@ -14440,19 +14440,19 @@ _sk_bicubic_n3y_avx LABEL PROC
PUBLIC _sk_bicubic_n1y_avx
_sk_bicubic_n1y_avx LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,13,172,205,1,0 ; vbroadcastss 0x1cdac(%rip),%ymm1 # 2c240 <_sk_overlay_sse2_8bit+0x5cb>
+ DB 196,226,125,24,13,232,204,1,0 ; vbroadcastss 0x1cce8(%rip),%ymm1 # 2c17c <_sk_overlay_sse2_8bit+0x5cc>
DB 197,244,88,72,32 ; vaddps 0x20(%rax),%ymm1,%ymm1
- DB 196,98,125,24,5,66,204,1,0 ; vbroadcastss 0x1cc42(%rip),%ymm8 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,98,125,24,5,126,203,1,0 ; vbroadcastss 0x1cb7e(%rip),%ymm8 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 197,60,92,64,96 ; vsubps 0x60(%rax),%ymm8,%ymm8
- DB 196,98,125,24,13,160,205,1,0 ; vbroadcastss 0x1cda0(%rip),%ymm9 # 2c250 <_sk_overlay_sse2_8bit+0x5db>
+ DB 196,98,125,24,13,220,204,1,0 ; vbroadcastss 0x1ccdc(%rip),%ymm9 # 2c18c <_sk_overlay_sse2_8bit+0x5dc>
DB 196,65,60,89,201 ; vmulps %ymm9,%ymm8,%ymm9
- DB 196,98,125,24,21,142,205,1,0 ; vbroadcastss 0x1cd8e(%rip),%ymm10 # 2c24c <_sk_overlay_sse2_8bit+0x5d7>
+ DB 196,98,125,24,21,202,204,1,0 ; vbroadcastss 0x1ccca(%rip),%ymm10 # 2c188 <_sk_overlay_sse2_8bit+0x5d8>
DB 196,65,52,88,202 ; vaddps %ymm10,%ymm9,%ymm9
DB 196,65,60,89,201 ; vmulps %ymm9,%ymm8,%ymm9
- DB 196,98,125,24,21,15,204,1,0 ; vbroadcastss 0x1cc0f(%rip),%ymm10 # 2c0e0 <_sk_overlay_sse2_8bit+0x46b>
+ DB 196,98,125,24,21,75,203,1,0 ; vbroadcastss 0x1cb4b(%rip),%ymm10 # 2c01c <_sk_overlay_sse2_8bit+0x46c>
DB 196,65,52,88,202 ; vaddps %ymm10,%ymm9,%ymm9
DB 196,65,60,89,193 ; vmulps %ymm9,%ymm8,%ymm8
- DB 196,98,125,24,13,112,205,1,0 ; vbroadcastss 0x1cd70(%rip),%ymm9 # 2c254 <_sk_overlay_sse2_8bit+0x5df>
+ DB 196,98,125,24,13,172,204,1,0 ; vbroadcastss 0x1ccac(%rip),%ymm9 # 2c190 <_sk_overlay_sse2_8bit+0x5e0>
DB 196,65,60,88,193 ; vaddps %ymm9,%ymm8,%ymm8
DB 197,124,17,128,160,0,0,0 ; vmovups %ymm8,0xa0(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
@@ -14461,17 +14461,17 @@ _sk_bicubic_n1y_avx LABEL PROC
PUBLIC _sk_bicubic_p1y_avx
_sk_bicubic_p1y_avx LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,98,125,24,5,224,203,1,0 ; vbroadcastss 0x1cbe0(%rip),%ymm8 # 2c0e0 <_sk_overlay_sse2_8bit+0x46b>
+ DB 196,98,125,24,5,28,203,1,0 ; vbroadcastss 0x1cb1c(%rip),%ymm8 # 2c01c <_sk_overlay_sse2_8bit+0x46c>
DB 197,188,88,72,32 ; vaddps 0x20(%rax),%ymm8,%ymm1
DB 197,124,16,72,96 ; vmovups 0x60(%rax),%ymm9
- DB 196,98,125,24,21,61,205,1,0 ; vbroadcastss 0x1cd3d(%rip),%ymm10 # 2c250 <_sk_overlay_sse2_8bit+0x5db>
+ DB 196,98,125,24,21,121,204,1,0 ; vbroadcastss 0x1cc79(%rip),%ymm10 # 2c18c <_sk_overlay_sse2_8bit+0x5dc>
DB 196,65,52,89,210 ; vmulps %ymm10,%ymm9,%ymm10
- DB 196,98,125,24,29,43,205,1,0 ; vbroadcastss 0x1cd2b(%rip),%ymm11 # 2c24c <_sk_overlay_sse2_8bit+0x5d7>
+ DB 196,98,125,24,29,103,204,1,0 ; vbroadcastss 0x1cc67(%rip),%ymm11 # 2c188 <_sk_overlay_sse2_8bit+0x5d8>
DB 196,65,44,88,211 ; vaddps %ymm11,%ymm10,%ymm10
DB 196,65,52,89,210 ; vmulps %ymm10,%ymm9,%ymm10
DB 196,65,44,88,192 ; vaddps %ymm8,%ymm10,%ymm8
DB 196,65,52,89,192 ; vmulps %ymm8,%ymm9,%ymm8
- DB 196,98,125,24,13,22,205,1,0 ; vbroadcastss 0x1cd16(%rip),%ymm9 # 2c254 <_sk_overlay_sse2_8bit+0x5df>
+ DB 196,98,125,24,13,82,204,1,0 ; vbroadcastss 0x1cc52(%rip),%ymm9 # 2c190 <_sk_overlay_sse2_8bit+0x5e0>
DB 196,65,60,88,193 ; vaddps %ymm9,%ymm8,%ymm8
DB 197,124,17,128,160,0,0,0 ; vmovups %ymm8,0xa0(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
@@ -14480,13 +14480,13 @@ _sk_bicubic_p1y_avx LABEL PROC
PUBLIC _sk_bicubic_p3y_avx
_sk_bicubic_p3y_avx LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,13,242,204,1,0 ; vbroadcastss 0x1ccf2(%rip),%ymm1 # 2c24c <_sk_overlay_sse2_8bit+0x5d7>
+ DB 196,226,125,24,13,46,204,1,0 ; vbroadcastss 0x1cc2e(%rip),%ymm1 # 2c188 <_sk_overlay_sse2_8bit+0x5d8>
DB 197,244,88,72,32 ; vaddps 0x20(%rax),%ymm1,%ymm1
DB 197,124,16,64,96 ; vmovups 0x60(%rax),%ymm8
DB 196,65,60,89,200 ; vmulps %ymm8,%ymm8,%ymm9
- DB 196,98,125,24,21,214,204,1,0 ; vbroadcastss 0x1ccd6(%rip),%ymm10 # 2c248 <_sk_overlay_sse2_8bit+0x5d3>
+ DB 196,98,125,24,21,18,204,1,0 ; vbroadcastss 0x1cc12(%rip),%ymm10 # 2c184 <_sk_overlay_sse2_8bit+0x5d4>
DB 196,65,60,89,194 ; vmulps %ymm10,%ymm8,%ymm8
- DB 196,98,125,24,21,212,203,1,0 ; vbroadcastss 0x1cbd4(%rip),%ymm10 # 2c154 <_sk_overlay_sse2_8bit+0x4df>
+ DB 196,98,125,24,21,16,203,1,0 ; vbroadcastss 0x1cb10(%rip),%ymm10 # 2c090 <_sk_overlay_sse2_8bit+0x4e0>
DB 196,65,60,88,194 ; vaddps %ymm10,%ymm8,%ymm8
DB 196,65,52,89,192 ; vmulps %ymm8,%ymm9,%ymm8
DB 197,124,17,128,160,0,0,0 ; vmovups %ymm8,0xa0(%rax)
@@ -14617,7 +14617,7 @@ _sk_clut_3D_avx LABEL PROC
DB 197,249,127,68,36,96 ; vmovdqa %xmm0,0x60(%rsp)
DB 72,139,0 ; mov (%rax),%rax
DB 196,193,121,254,194 ; vpaddd %xmm10,%xmm0,%xmm0
- DB 196,98,121,24,29,138,202,1,0 ; vbroadcastss 0x1ca8a(%rip),%xmm11 # 2c25c <_sk_overlay_sse2_8bit+0x5e7>
+ DB 196,98,121,24,29,198,201,1,0 ; vbroadcastss 0x1c9c6(%rip),%xmm11 # 2c198 <_sk_overlay_sse2_8bit+0x5e8>
DB 196,194,121,64,203 ; vpmulld %xmm11,%xmm0,%xmm1
DB 196,193,249,126,200 ; vmovq %xmm1,%r8
DB 69,137,193 ; mov %r8d,%r9d
@@ -14651,7 +14651,7 @@ _sk_clut_3D_avx LABEL PROC
DB 196,163,65,33,60,152,48 ; vinsertps $0x30,(%rax,%r11,4),%xmm7,%xmm7
DB 196,227,93,24,223,1 ; vinsertf128 $0x1,%xmm7,%ymm4,%ymm3
DB 197,252,17,156,36,192,0,0,0 ; vmovups %ymm3,0xc0(%rsp)
- DB 196,98,121,24,13,81,200,1,0 ; vbroadcastss 0x1c851(%rip),%xmm9 # 2c0e8 <_sk_overlay_sse2_8bit+0x473>
+ DB 196,98,121,24,13,141,199,1,0 ; vbroadcastss 0x1c78d(%rip),%xmm9 # 2c024 <_sk_overlay_sse2_8bit+0x474>
DB 196,193,105,254,249 ; vpaddd %xmm9,%xmm2,%xmm7
DB 196,195,249,22,248,1 ; vpextrq $0x1,%xmm7,%r8
DB 196,193,249,126,249 ; vmovq %xmm7,%r9
@@ -14679,7 +14679,7 @@ _sk_clut_3D_avx LABEL PROC
DB 196,161,122,16,60,152 ; vmovss (%rax,%r11,4),%xmm7
DB 196,227,81,33,239,48 ; vinsertps $0x30,%xmm7,%xmm5,%xmm5
DB 196,99,85,24,254,1 ; vinsertf128 $0x1,%xmm6,%ymm5,%ymm15
- DB 196,98,121,24,37,198,199,1,0 ; vbroadcastss 0x1c7c6(%rip),%xmm12 # 2c0f0 <_sk_overlay_sse2_8bit+0x47b>
+ DB 196,98,121,24,37,2,199,1,0 ; vbroadcastss 0x1c702(%rip),%xmm12 # 2c02c <_sk_overlay_sse2_8bit+0x47c>
DB 196,193,105,254,212 ; vpaddd %xmm12,%xmm2,%xmm2
DB 196,195,249,22,208,1 ; vpextrq $0x1,%xmm2,%r8
DB 196,193,249,126,209 ; vmovq %xmm2,%r9
@@ -14707,7 +14707,7 @@ _sk_clut_3D_avx LABEL PROC
DB 197,250,16,44,152 ; vmovss (%rax,%rbx,4),%xmm5
DB 196,227,105,33,213,48 ; vinsertps $0x30,%xmm5,%xmm2,%xmm2
DB 196,227,109,24,225,1 ; vinsertf128 $0x1,%xmm1,%ymm2,%ymm4
- DB 196,226,125,24,13,154,200,1,0 ; vbroadcastss 0x1c89a(%rip),%ymm1 # 2c258 <_sk_overlay_sse2_8bit+0x5e3>
+ DB 196,226,125,24,13,214,199,1,0 ; vbroadcastss 0x1c7d6(%rip),%ymm1 # 2c194 <_sk_overlay_sse2_8bit+0x5e4>
DB 197,188,88,209 ; vaddps %ymm1,%ymm8,%ymm2
DB 197,252,17,140,36,160,0,0,0 ; vmovups %ymm1,0xa0(%rsp)
DB 197,254,91,210 ; vcvttps2dq %ymm2,%ymm2
@@ -15458,7 +15458,7 @@ _sk_clut_4D_avx LABEL PROC
DB 196,226,25,64,200 ; vpmulld %xmm0,%xmm12,%xmm1
DB 197,249,127,12,36 ; vmovdqa %xmm1,(%rsp)
DB 197,241,254,202 ; vpaddd %xmm2,%xmm1,%xmm1
- DB 196,98,121,24,61,31,185,1,0 ; vbroadcastss 0x1b91f(%rip),%xmm15 # 2c25c <_sk_overlay_sse2_8bit+0x5e7>
+ DB 196,98,121,24,61,91,184,1,0 ; vbroadcastss 0x1b85b(%rip),%xmm15 # 2c198 <_sk_overlay_sse2_8bit+0x5e8>
DB 196,194,113,64,247 ; vpmulld %xmm15,%xmm1,%xmm6
DB 196,193,249,126,240 ; vmovq %xmm6,%r8
DB 69,137,193 ; mov %r8d,%r9d
@@ -15496,7 +15496,7 @@ _sk_clut_4D_avx LABEL PROC
DB 196,163,65,33,60,144,32 ; vinsertps $0x20,(%rax,%r10,4),%xmm7,%xmm7
DB 196,163,65,33,60,152,48 ; vinsertps $0x30,(%rax,%r11,4),%xmm7,%xmm7
DB 196,99,53,24,247,1 ; vinsertf128 $0x1,%xmm7,%ymm9,%ymm14
- DB 196,98,121,24,21,205,182,1,0 ; vbroadcastss 0x1b6cd(%rip),%xmm10 # 2c0e8 <_sk_overlay_sse2_8bit+0x473>
+ DB 196,98,121,24,21,9,182,1,0 ; vbroadcastss 0x1b609(%rip),%xmm10 # 2c024 <_sk_overlay_sse2_8bit+0x474>
DB 196,65,97,254,202 ; vpaddd %xmm10,%xmm3,%xmm9
DB 196,67,249,22,200,1 ; vpextrq $0x1,%xmm9,%r8
DB 196,65,249,126,201 ; vmovq %xmm9,%r9
@@ -15524,7 +15524,7 @@ _sk_clut_4D_avx LABEL PROC
DB 196,161,122,16,60,152 ; vmovss (%rax,%r11,4),%xmm7
DB 196,227,81,33,239,48 ; vinsertps $0x30,%xmm7,%xmm5,%xmm5
DB 196,99,85,24,220,1 ; vinsertf128 $0x1,%xmm4,%ymm5,%ymm11
- DB 196,98,121,24,13,66,182,1,0 ; vbroadcastss 0x1b642(%rip),%xmm9 # 2c0f0 <_sk_overlay_sse2_8bit+0x47b>
+ DB 196,98,121,24,13,126,181,1,0 ; vbroadcastss 0x1b57e(%rip),%xmm9 # 2c02c <_sk_overlay_sse2_8bit+0x47c>
DB 196,193,97,254,217 ; vpaddd %xmm9,%xmm3,%xmm3
DB 196,195,249,22,216,1 ; vpextrq $0x1,%xmm3,%r8
DB 196,193,249,126,217 ; vmovq %xmm3,%r9
@@ -15552,7 +15552,7 @@ _sk_clut_4D_avx LABEL PROC
DB 197,250,16,44,152 ; vmovss (%rax,%rbx,4),%xmm5
DB 196,227,89,33,229,48 ; vinsertps $0x30,%xmm5,%xmm4,%xmm4
DB 196,227,93,24,243,1 ; vinsertf128 $0x1,%xmm3,%ymm4,%ymm6
- DB 196,226,125,24,37,22,183,1,0 ; vbroadcastss 0x1b716(%rip),%ymm4 # 2c258 <_sk_overlay_sse2_8bit+0x5e3>
+ DB 196,226,125,24,37,82,182,1,0 ; vbroadcastss 0x1b652(%rip),%ymm4 # 2c194 <_sk_overlay_sse2_8bit+0x5e4>
DB 197,148,88,220 ; vaddps %ymm4,%ymm13,%ymm3
DB 197,252,40,252 ; vmovaps %ymm4,%ymm7
DB 197,252,17,188,36,160,0,0,0 ; vmovups %ymm7,0xa0(%rsp)
@@ -16982,7 +16982,7 @@ _sk_clut_4D_avx LABEL PROC
DB 197,220,89,210 ; vmulps %ymm2,%ymm4,%ymm2
DB 197,212,88,210 ; vaddps %ymm2,%ymm5,%ymm2
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,29,219,151,1,0 ; vbroadcastss 0x197db(%rip),%ymm3 # 2c0e4 <_sk_overlay_sse2_8bit+0x46f>
+ DB 196,226,125,24,29,23,151,1,0 ; vbroadcastss 0x19717(%rip),%ymm3 # 2c020 <_sk_overlay_sse2_8bit+0x470>
DB 197,252,16,164,36,160,2,0,0 ; vmovups 0x2a0(%rsp),%ymm4
DB 197,252,16,172,36,192,2,0,0 ; vmovups 0x2c0(%rsp),%ymm5
DB 197,252,16,180,36,224,2,0,0 ; vmovups 0x2e0(%rsp),%ymm6
@@ -17080,15 +17080,15 @@ _sk_seed_shader_sse41 LABEL PROC
DB 102,15,110,194 ; movd %edx,%xmm0
DB 102,15,112,192,0 ; pshufd $0x0,%xmm0,%xmm0
DB 15,91,192 ; cvtdq2ps %xmm0,%xmm0
- DB 15,40,21,155,160,1,0 ; movaps 0x1a09b(%rip),%xmm2 # 2cb20 <_sk_overlay_sse2_8bit+0xeab>
+ DB 15,40,21,219,159,1,0 ; movaps 0x19fdb(%rip),%xmm2 # 2ca60 <_sk_overlay_sse2_8bit+0xeb0>
DB 15,88,194 ; addps %xmm2,%xmm0
- DB 15,88,5,161,160,1,0 ; addps 0x1a0a1(%rip),%xmm0 # 2cb30 <_sk_overlay_sse2_8bit+0xebb>
+ DB 15,88,5,225,159,1,0 ; addps 0x19fe1(%rip),%xmm0 # 2ca70 <_sk_overlay_sse2_8bit+0xec0>
DB 102,15,110,201 ; movd %ecx,%xmm1
DB 102,15,112,201,0 ; pshufd $0x0,%xmm1,%xmm1
DB 15,91,201 ; cvtdq2ps %xmm1,%xmm1
DB 15,88,202 ; addps %xmm2,%xmm1
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 15,40,21,153,160,1,0 ; movaps 0x1a099(%rip),%xmm2 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 15,40,21,217,159,1,0 ; movaps 0x19fd9(%rip),%xmm2 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 15,87,219 ; xorps %xmm3,%xmm3
DB 15,87,228 ; xorps %xmm4,%xmm4
DB 15,87,237 ; xorps %xmm5,%xmm5
@@ -17101,18 +17101,18 @@ _sk_dither_sse41 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 102,68,15,110,194 ; movd %edx,%xmm8
DB 102,69,15,112,200,0 ; pshufd $0x0,%xmm8,%xmm9
- DB 102,68,15,254,13,50,160,1,0 ; paddd 0x1a032(%rip),%xmm9 # 2cb00 <_sk_overlay_sse2_8bit+0xe8b>
+ DB 102,68,15,254,13,114,159,1,0 ; paddd 0x19f72(%rip),%xmm9 # 2ca40 <_sk_overlay_sse2_8bit+0xe90>
DB 102,68,15,110,193 ; movd %ecx,%xmm8
DB 102,69,15,112,192,0 ; pshufd $0x0,%xmm8,%xmm8
DB 102,69,15,239,193 ; pxor %xmm9,%xmm8
- DB 102,68,15,111,21,105,160,1,0 ; movdqa 0x1a069(%rip),%xmm10 # 2cb50 <_sk_overlay_sse2_8bit+0xedb>
+ DB 102,68,15,111,21,169,159,1,0 ; movdqa 0x19fa9(%rip),%xmm10 # 2ca90 <_sk_overlay_sse2_8bit+0xee0>
DB 102,69,15,111,216 ; movdqa %xmm8,%xmm11
DB 102,69,15,219,218 ; pand %xmm10,%xmm11
DB 102,65,15,114,243,5 ; pslld $0x5,%xmm11
DB 102,69,15,219,209 ; pand %xmm9,%xmm10
DB 102,65,15,114,242,4 ; pslld $0x4,%xmm10
- DB 102,68,15,111,37,85,160,1,0 ; movdqa 0x1a055(%rip),%xmm12 # 2cb60 <_sk_overlay_sse2_8bit+0xeeb>
- DB 102,68,15,111,45,92,160,1,0 ; movdqa 0x1a05c(%rip),%xmm13 # 2cb70 <_sk_overlay_sse2_8bit+0xefb>
+ DB 102,68,15,111,37,149,159,1,0 ; movdqa 0x19f95(%rip),%xmm12 # 2caa0 <_sk_overlay_sse2_8bit+0xef0>
+ DB 102,68,15,111,45,156,159,1,0 ; movdqa 0x19f9c(%rip),%xmm13 # 2cab0 <_sk_overlay_sse2_8bit+0xf00>
DB 102,69,15,111,240 ; movdqa %xmm8,%xmm14
DB 102,69,15,219,245 ; pand %xmm13,%xmm14
DB 102,65,15,114,246,2 ; pslld $0x2,%xmm14
@@ -17128,8 +17128,8 @@ _sk_dither_sse41 LABEL PROC
DB 102,69,15,235,245 ; por %xmm13,%xmm14
DB 102,69,15,235,240 ; por %xmm8,%xmm14
DB 69,15,91,198 ; cvtdq2ps %xmm14,%xmm8
- DB 68,15,89,5,23,160,1,0 ; mulps 0x1a017(%rip),%xmm8 # 2cb80 <_sk_overlay_sse2_8bit+0xf0b>
- DB 68,15,88,5,31,160,1,0 ; addps 0x1a01f(%rip),%xmm8 # 2cb90 <_sk_overlay_sse2_8bit+0xf1b>
+ DB 68,15,89,5,87,159,1,0 ; mulps 0x19f57(%rip),%xmm8 # 2cac0 <_sk_overlay_sse2_8bit+0xf10>
+ DB 68,15,88,5,95,159,1,0 ; addps 0x19f5f(%rip),%xmm8 # 2cad0 <_sk_overlay_sse2_8bit+0xf20>
DB 243,68,15,16,16 ; movss (%rax),%xmm10
DB 69,15,198,210,0 ; shufps $0x0,%xmm10,%xmm10
DB 69,15,89,208 ; mulps %xmm8,%xmm10
@@ -17167,7 +17167,7 @@ _sk_uniform_color_sse41 LABEL PROC
PUBLIC _sk_black_color_sse41
_sk_black_color_sse41 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 15,40,29,85,159,1,0 ; movaps 0x19f55(%rip),%xmm3 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 15,40,29,149,158,1,0 ; movaps 0x19e95(%rip),%xmm3 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 15,87,192 ; xorps %xmm0,%xmm0
DB 15,87,201 ; xorps %xmm1,%xmm1
DB 15,87,210 ; xorps %xmm2,%xmm2
@@ -17176,7 +17176,7 @@ _sk_black_color_sse41 LABEL PROC
PUBLIC _sk_white_color_sse41
_sk_white_color_sse41 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 15,40,5,65,159,1,0 ; movaps 0x19f41(%rip),%xmm0 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 15,40,5,129,158,1,0 ; movaps 0x19e81(%rip),%xmm0 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 15,40,200 ; movaps %xmm0,%xmm1
DB 15,40,208 ; movaps %xmm0,%xmm2
DB 15,40,216 ; movaps %xmm0,%xmm3
@@ -17214,7 +17214,7 @@ _sk_clear_sse41 LABEL PROC
PUBLIC _sk_srcatop_sse41
_sk_srcatop_sse41 LABEL PROC
DB 15,89,199 ; mulps %xmm7,%xmm0
- DB 68,15,40,5,241,158,1,0 ; movaps 0x19ef1(%rip),%xmm8 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 68,15,40,5,49,158,1,0 ; movaps 0x19e31(%rip),%xmm8 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 68,15,92,195 ; subps %xmm3,%xmm8
DB 69,15,40,200 ; movaps %xmm8,%xmm9
DB 68,15,89,204 ; mulps %xmm4,%xmm9
@@ -17237,7 +17237,7 @@ PUBLIC _sk_dstatop_sse41
_sk_dstatop_sse41 LABEL PROC
DB 68,15,40,195 ; movaps %xmm3,%xmm8
DB 68,15,89,196 ; mulps %xmm4,%xmm8
- DB 68,15,40,13,164,158,1,0 ; movaps 0x19ea4(%rip),%xmm9 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 68,15,40,13,228,157,1,0 ; movaps 0x19de4(%rip),%xmm9 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 68,15,92,207 ; subps %xmm7,%xmm9
DB 65,15,89,193 ; mulps %xmm9,%xmm0
DB 65,15,88,192 ; addps %xmm8,%xmm0
@@ -17278,7 +17278,7 @@ _sk_dstin_sse41 LABEL PROC
PUBLIC _sk_srcout_sse41
_sk_srcout_sse41 LABEL PROC
- DB 68,15,40,5,56,158,1,0 ; movaps 0x19e38(%rip),%xmm8 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 68,15,40,5,120,157,1,0 ; movaps 0x19d78(%rip),%xmm8 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 68,15,92,199 ; subps %xmm7,%xmm8
DB 65,15,89,192 ; mulps %xmm8,%xmm0
DB 65,15,89,200 ; mulps %xmm8,%xmm1
@@ -17289,7 +17289,7 @@ _sk_srcout_sse41 LABEL PROC
PUBLIC _sk_dstout_sse41
_sk_dstout_sse41 LABEL PROC
- DB 68,15,40,5,24,158,1,0 ; movaps 0x19e18(%rip),%xmm8 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 68,15,40,5,88,157,1,0 ; movaps 0x19d58(%rip),%xmm8 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 68,15,92,195 ; subps %xmm3,%xmm8
DB 65,15,40,192 ; movaps %xmm8,%xmm0
DB 15,89,196 ; mulps %xmm4,%xmm0
@@ -17304,7 +17304,7 @@ _sk_dstout_sse41 LABEL PROC
PUBLIC _sk_srcover_sse41
_sk_srcover_sse41 LABEL PROC
- DB 68,15,40,5,235,157,1,0 ; movaps 0x19deb(%rip),%xmm8 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 68,15,40,5,43,157,1,0 ; movaps 0x19d2b(%rip),%xmm8 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 68,15,92,195 ; subps %xmm3,%xmm8
DB 69,15,40,200 ; movaps %xmm8,%xmm9
DB 68,15,89,204 ; mulps %xmm4,%xmm9
@@ -17322,7 +17322,7 @@ _sk_srcover_sse41 LABEL PROC
PUBLIC _sk_dstover_sse41
_sk_dstover_sse41 LABEL PROC
- DB 68,15,40,5,175,157,1,0 ; movaps 0x19daf(%rip),%xmm8 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 68,15,40,5,239,156,1,0 ; movaps 0x19cef(%rip),%xmm8 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 68,15,92,199 ; subps %xmm7,%xmm8
DB 65,15,89,192 ; mulps %xmm8,%xmm0
DB 15,88,196 ; addps %xmm4,%xmm0
@@ -17346,7 +17346,7 @@ _sk_modulate_sse41 LABEL PROC
PUBLIC _sk_multiply_sse41
_sk_multiply_sse41 LABEL PROC
- DB 68,15,40,5,115,157,1,0 ; movaps 0x19d73(%rip),%xmm8 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 68,15,40,5,179,156,1,0 ; movaps 0x19cb3(%rip),%xmm8 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 69,15,40,200 ; movaps %xmm8,%xmm9
DB 68,15,92,207 ; subps %xmm7,%xmm9
DB 69,15,40,209 ; movaps %xmm9,%xmm10
@@ -17382,7 +17382,7 @@ _sk_multiply_sse41 LABEL PROC
PUBLIC _sk_plus__sse41
_sk_plus__sse41 LABEL PROC
DB 15,88,196 ; addps %xmm4,%xmm0
- DB 68,15,40,5,244,156,1,0 ; movaps 0x19cf4(%rip),%xmm8 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 68,15,40,5,52,156,1,0 ; movaps 0x19c34(%rip),%xmm8 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 65,15,93,192 ; minps %xmm8,%xmm0
DB 15,88,205 ; addps %xmm5,%xmm1
DB 65,15,93,200 ; minps %xmm8,%xmm1
@@ -17420,7 +17420,7 @@ _sk_screen_sse41 LABEL PROC
PUBLIC _sk_xor__sse41
_sk_xor__sse41 LABEL PROC
DB 68,15,40,195 ; movaps %xmm3,%xmm8
- DB 15,40,29,128,156,1,0 ; movaps 0x19c80(%rip),%xmm3 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 15,40,29,192,155,1,0 ; movaps 0x19bc0(%rip),%xmm3 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 68,15,40,203 ; movaps %xmm3,%xmm9
DB 68,15,92,207 ; subps %xmm7,%xmm9
DB 65,15,89,193 ; mulps %xmm9,%xmm0
@@ -17466,7 +17466,7 @@ _sk_darken_sse41 LABEL PROC
DB 68,15,89,206 ; mulps %xmm6,%xmm9
DB 65,15,95,209 ; maxps %xmm9,%xmm2
DB 68,15,92,194 ; subps %xmm2,%xmm8
- DB 15,40,21,219,155,1,0 ; movaps 0x19bdb(%rip),%xmm2 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 15,40,21,27,155,1,0 ; movaps 0x19b1b(%rip),%xmm2 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 15,92,211 ; subps %xmm3,%xmm2
DB 15,89,215 ; mulps %xmm7,%xmm2
DB 15,88,218 ; addps %xmm2,%xmm3
@@ -17498,7 +17498,7 @@ _sk_lighten_sse41 LABEL PROC
DB 68,15,89,206 ; mulps %xmm6,%xmm9
DB 65,15,93,209 ; minps %xmm9,%xmm2
DB 68,15,92,194 ; subps %xmm2,%xmm8
- DB 15,40,21,112,155,1,0 ; movaps 0x19b70(%rip),%xmm2 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 15,40,21,176,154,1,0 ; movaps 0x19ab0(%rip),%xmm2 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 15,92,211 ; subps %xmm3,%xmm2
DB 15,89,215 ; mulps %xmm7,%xmm2
DB 15,88,218 ; addps %xmm2,%xmm3
@@ -17533,7 +17533,7 @@ _sk_difference_sse41 LABEL PROC
DB 65,15,93,209 ; minps %xmm9,%xmm2
DB 15,88,210 ; addps %xmm2,%xmm2
DB 68,15,92,194 ; subps %xmm2,%xmm8
- DB 15,40,21,250,154,1,0 ; movaps 0x19afa(%rip),%xmm2 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 15,40,21,58,154,1,0 ; movaps 0x19a3a(%rip),%xmm2 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 15,92,211 ; subps %xmm3,%xmm2
DB 15,89,215 ; mulps %xmm7,%xmm2
DB 15,88,218 ; addps %xmm2,%xmm3
@@ -17559,7 +17559,7 @@ _sk_exclusion_sse41 LABEL PROC
DB 15,89,214 ; mulps %xmm6,%xmm2
DB 15,88,210 ; addps %xmm2,%xmm2
DB 68,15,92,194 ; subps %xmm2,%xmm8
- DB 15,40,21,170,154,1,0 ; movaps 0x19aaa(%rip),%xmm2 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 15,40,21,234,153,1,0 ; movaps 0x199ea(%rip),%xmm2 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 15,92,211 ; subps %xmm3,%xmm2
DB 15,89,215 ; mulps %xmm7,%xmm2
DB 15,88,218 ; addps %xmm2,%xmm3
@@ -17569,7 +17569,7 @@ _sk_exclusion_sse41 LABEL PROC
PUBLIC _sk_colorburn_sse41
_sk_colorburn_sse41 LABEL PROC
- DB 68,15,40,29,145,154,1,0 ; movaps 0x19a91(%rip),%xmm11 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 68,15,40,29,209,153,1,0 ; movaps 0x199d1(%rip),%xmm11 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 69,15,40,227 ; movaps %xmm11,%xmm12
DB 68,15,92,231 ; subps %xmm7,%xmm12
DB 69,15,40,204 ; movaps %xmm12,%xmm9
@@ -17651,7 +17651,7 @@ _sk_colorburn_sse41 LABEL PROC
PUBLIC _sk_colordodge_sse41
_sk_colordodge_sse41 LABEL PROC
DB 68,15,40,192 ; movaps %xmm0,%xmm8
- DB 68,15,40,21,91,153,1,0 ; movaps 0x1995b(%rip),%xmm10 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 68,15,40,21,155,152,1,0 ; movaps 0x1989b(%rip),%xmm10 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 69,15,40,218 ; movaps %xmm10,%xmm11
DB 68,15,92,223 ; subps %xmm7,%xmm11
DB 69,15,40,227 ; movaps %xmm11,%xmm12
@@ -17732,7 +17732,7 @@ _sk_hardlight_sse41 LABEL PROC
DB 15,40,244 ; movaps %xmm4,%xmm6
DB 15,40,227 ; movaps %xmm3,%xmm4
DB 68,15,40,200 ; movaps %xmm0,%xmm9
- DB 68,15,40,21,35,152,1,0 ; movaps 0x19823(%rip),%xmm10 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 68,15,40,21,99,151,1,0 ; movaps 0x19763(%rip),%xmm10 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 65,15,40,234 ; movaps %xmm10,%xmm5
DB 15,92,239 ; subps %xmm7,%xmm5
DB 15,40,197 ; movaps %xmm5,%xmm0
@@ -17814,7 +17814,7 @@ PUBLIC _sk_overlay_sse41
_sk_overlay_sse41 LABEL PROC
DB 68,15,40,201 ; movaps %xmm1,%xmm9
DB 68,15,40,240 ; movaps %xmm0,%xmm14
- DB 68,15,40,21,245,150,1,0 ; movaps 0x196f5(%rip),%xmm10 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 68,15,40,21,53,150,1,0 ; movaps 0x19635(%rip),%xmm10 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 69,15,40,218 ; movaps %xmm10,%xmm11
DB 68,15,92,223 ; subps %xmm7,%xmm11
DB 65,15,40,195 ; movaps %xmm11,%xmm0
@@ -17898,7 +17898,7 @@ _sk_softlight_sse41 LABEL PROC
DB 15,40,198 ; movaps %xmm6,%xmm0
DB 15,94,199 ; divps %xmm7,%xmm0
DB 65,15,84,193 ; andps %xmm9,%xmm0
- DB 15,40,13,184,149,1,0 ; movaps 0x195b8(%rip),%xmm1 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 15,40,13,248,148,1,0 ; movaps 0x194f8(%rip),%xmm1 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 68,15,40,209 ; movaps %xmm1,%xmm10
DB 68,15,92,208 ; subps %xmm0,%xmm10
DB 68,15,40,240 ; movaps %xmm0,%xmm14
@@ -17911,10 +17911,10 @@ _sk_softlight_sse41 LABEL PROC
DB 15,40,208 ; movaps %xmm0,%xmm2
DB 15,89,210 ; mulps %xmm2,%xmm2
DB 15,88,208 ; addps %xmm0,%xmm2
- DB 68,15,40,45,230,149,1,0 ; movaps 0x195e6(%rip),%xmm13 # 2cba0 <_sk_overlay_sse2_8bit+0xf2b>
+ DB 68,15,40,45,38,149,1,0 ; movaps 0x19526(%rip),%xmm13 # 2cae0 <_sk_overlay_sse2_8bit+0xf30>
DB 69,15,88,245 ; addps %xmm13,%xmm14
DB 68,15,89,242 ; mulps %xmm2,%xmm14
- DB 68,15,40,37,230,149,1,0 ; movaps 0x195e6(%rip),%xmm12 # 2cbb0 <_sk_overlay_sse2_8bit+0xf3b>
+ DB 68,15,40,37,38,149,1,0 ; movaps 0x19526(%rip),%xmm12 # 2caf0 <_sk_overlay_sse2_8bit+0xf40>
DB 69,15,89,252 ; mulps %xmm12,%xmm15
DB 69,15,88,254 ; addps %xmm14,%xmm15
DB 15,40,198 ; movaps %xmm6,%xmm0
@@ -18100,12 +18100,12 @@ _sk_hue_sse41 LABEL PROC
DB 68,15,84,208 ; andps %xmm0,%xmm10
DB 15,84,200 ; andps %xmm0,%xmm1
DB 68,15,84,232 ; andps %xmm0,%xmm13
- DB 15,40,5,76,147,1,0 ; movaps 0x1934c(%rip),%xmm0 # 2cbc0 <_sk_overlay_sse2_8bit+0xf4b>
+ DB 15,40,5,140,146,1,0 ; movaps 0x1928c(%rip),%xmm0 # 2cb00 <_sk_overlay_sse2_8bit+0xf50>
DB 68,15,89,224 ; mulps %xmm0,%xmm12
- DB 15,40,21,81,147,1,0 ; movaps 0x19351(%rip),%xmm2 # 2cbd0 <_sk_overlay_sse2_8bit+0xf5b>
+ DB 15,40,21,145,146,1,0 ; movaps 0x19291(%rip),%xmm2 # 2cb10 <_sk_overlay_sse2_8bit+0xf60>
DB 15,89,250 ; mulps %xmm2,%xmm7
DB 65,15,88,252 ; addps %xmm12,%xmm7
- DB 68,15,40,53,82,147,1,0 ; movaps 0x19352(%rip),%xmm14 # 2cbe0 <_sk_overlay_sse2_8bit+0xf6b>
+ DB 68,15,40,53,146,146,1,0 ; movaps 0x19292(%rip),%xmm14 # 2cb20 <_sk_overlay_sse2_8bit+0xf70>
DB 68,15,40,252 ; movaps %xmm4,%xmm15
DB 69,15,89,254 ; mulps %xmm14,%xmm15
DB 68,15,88,255 ; addps %xmm7,%xmm15
@@ -18188,7 +18188,7 @@ _sk_hue_sse41 LABEL PROC
DB 65,15,88,214 ; addps %xmm14,%xmm2
DB 15,40,196 ; movaps %xmm4,%xmm0
DB 102,15,56,20,202 ; blendvps %xmm0,%xmm2,%xmm1
- DB 68,15,40,13,103,145,1,0 ; movaps 0x19167(%rip),%xmm9 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 68,15,40,13,167,144,1,0 ; movaps 0x190a7(%rip),%xmm9 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 65,15,40,225 ; movaps %xmm9,%xmm4
DB 15,92,229 ; subps %xmm5,%xmm4
DB 15,40,68,36,48 ; movaps 0x30(%rsp),%xmm0
@@ -18282,14 +18282,14 @@ _sk_saturation_sse41 LABEL PROC
DB 68,15,84,215 ; andps %xmm7,%xmm10
DB 68,15,84,223 ; andps %xmm7,%xmm11
DB 68,15,84,199 ; andps %xmm7,%xmm8
- DB 15,40,21,138,144,1,0 ; movaps 0x1908a(%rip),%xmm2 # 2cbc0 <_sk_overlay_sse2_8bit+0xf4b>
+ DB 15,40,21,202,143,1,0 ; movaps 0x18fca(%rip),%xmm2 # 2cb00 <_sk_overlay_sse2_8bit+0xf50>
DB 15,40,221 ; movaps %xmm5,%xmm3
DB 15,89,218 ; mulps %xmm2,%xmm3
- DB 15,40,13,141,144,1,0 ; movaps 0x1908d(%rip),%xmm1 # 2cbd0 <_sk_overlay_sse2_8bit+0xf5b>
+ DB 15,40,13,205,143,1,0 ; movaps 0x18fcd(%rip),%xmm1 # 2cb10 <_sk_overlay_sse2_8bit+0xf60>
DB 15,40,254 ; movaps %xmm6,%xmm7
DB 15,89,249 ; mulps %xmm1,%xmm7
DB 15,88,251 ; addps %xmm3,%xmm7
- DB 68,15,40,45,140,144,1,0 ; movaps 0x1908c(%rip),%xmm13 # 2cbe0 <_sk_overlay_sse2_8bit+0xf6b>
+ DB 68,15,40,45,204,143,1,0 ; movaps 0x18fcc(%rip),%xmm13 # 2cb20 <_sk_overlay_sse2_8bit+0xf70>
DB 69,15,89,245 ; mulps %xmm13,%xmm14
DB 68,15,88,247 ; addps %xmm7,%xmm14
DB 65,15,40,218 ; movaps %xmm10,%xmm3
@@ -18370,7 +18370,7 @@ _sk_saturation_sse41 LABEL PROC
DB 65,15,88,253 ; addps %xmm13,%xmm7
DB 65,15,40,192 ; movaps %xmm8,%xmm0
DB 102,68,15,56,20,223 ; blendvps %xmm0,%xmm7,%xmm11
- DB 68,15,40,13,162,142,1,0 ; movaps 0x18ea2(%rip),%xmm9 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 68,15,40,13,226,141,1,0 ; movaps 0x18de2(%rip),%xmm9 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 69,15,40,193 ; movaps %xmm9,%xmm8
DB 68,15,92,204 ; subps %xmm4,%xmm9
DB 15,40,60,36 ; movaps (%rsp),%xmm7
@@ -18425,14 +18425,14 @@ _sk_color_sse41 LABEL PROC
DB 15,40,231 ; movaps %xmm7,%xmm4
DB 68,15,89,244 ; mulps %xmm4,%xmm14
DB 15,89,204 ; mulps %xmm4,%xmm1
- DB 68,15,40,13,87,142,1,0 ; movaps 0x18e57(%rip),%xmm9 # 2cbc0 <_sk_overlay_sse2_8bit+0xf4b>
+ DB 68,15,40,13,151,141,1,0 ; movaps 0x18d97(%rip),%xmm9 # 2cb00 <_sk_overlay_sse2_8bit+0xf50>
DB 65,15,40,250 ; movaps %xmm10,%xmm7
DB 65,15,89,249 ; mulps %xmm9,%xmm7
- DB 68,15,40,21,87,142,1,0 ; movaps 0x18e57(%rip),%xmm10 # 2cbd0 <_sk_overlay_sse2_8bit+0xf5b>
+ DB 68,15,40,21,151,141,1,0 ; movaps 0x18d97(%rip),%xmm10 # 2cb10 <_sk_overlay_sse2_8bit+0xf60>
DB 65,15,40,219 ; movaps %xmm11,%xmm3
DB 65,15,89,218 ; mulps %xmm10,%xmm3
DB 15,88,223 ; addps %xmm7,%xmm3
- DB 68,15,40,29,84,142,1,0 ; movaps 0x18e54(%rip),%xmm11 # 2cbe0 <_sk_overlay_sse2_8bit+0xf6b>
+ DB 68,15,40,29,148,141,1,0 ; movaps 0x18d94(%rip),%xmm11 # 2cb20 <_sk_overlay_sse2_8bit+0xf70>
DB 69,15,40,236 ; movaps %xmm12,%xmm13
DB 69,15,89,235 ; mulps %xmm11,%xmm13
DB 68,15,88,235 ; addps %xmm3,%xmm13
@@ -18517,7 +18517,7 @@ _sk_color_sse41 LABEL PROC
DB 65,15,88,251 ; addps %xmm11,%xmm7
DB 65,15,40,194 ; movaps %xmm10,%xmm0
DB 102,15,56,20,207 ; blendvps %xmm0,%xmm7,%xmm1
- DB 68,15,40,13,96,140,1,0 ; movaps 0x18c60(%rip),%xmm9 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 68,15,40,13,160,139,1,0 ; movaps 0x18ba0(%rip),%xmm9 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 65,15,40,193 ; movaps %xmm9,%xmm0
DB 15,92,196 ; subps %xmm4,%xmm0
DB 68,15,89,192 ; mulps %xmm0,%xmm8
@@ -18569,13 +18569,13 @@ _sk_luminosity_sse41 LABEL PROC
DB 69,15,89,216 ; mulps %xmm8,%xmm11
DB 68,15,40,203 ; movaps %xmm3,%xmm9
DB 68,15,89,205 ; mulps %xmm5,%xmm9
- DB 68,15,40,5,34,140,1,0 ; movaps 0x18c22(%rip),%xmm8 # 2cbc0 <_sk_overlay_sse2_8bit+0xf4b>
+ DB 68,15,40,5,98,139,1,0 ; movaps 0x18b62(%rip),%xmm8 # 2cb00 <_sk_overlay_sse2_8bit+0xf50>
DB 65,15,89,192 ; mulps %xmm8,%xmm0
- DB 68,15,40,21,38,140,1,0 ; movaps 0x18c26(%rip),%xmm10 # 2cbd0 <_sk_overlay_sse2_8bit+0xf5b>
+ DB 68,15,40,21,102,139,1,0 ; movaps 0x18b66(%rip),%xmm10 # 2cb10 <_sk_overlay_sse2_8bit+0xf60>
DB 15,40,233 ; movaps %xmm1,%xmm5
DB 65,15,89,234 ; mulps %xmm10,%xmm5
DB 15,88,232 ; addps %xmm0,%xmm5
- DB 68,15,40,37,36,140,1,0 ; movaps 0x18c24(%rip),%xmm12 # 2cbe0 <_sk_overlay_sse2_8bit+0xf6b>
+ DB 68,15,40,37,100,139,1,0 ; movaps 0x18b64(%rip),%xmm12 # 2cb20 <_sk_overlay_sse2_8bit+0xf70>
DB 68,15,40,242 ; movaps %xmm2,%xmm14
DB 69,15,89,244 ; mulps %xmm12,%xmm14
DB 68,15,88,245 ; addps %xmm5,%xmm14
@@ -18660,7 +18660,7 @@ _sk_luminosity_sse41 LABEL PROC
DB 65,15,88,244 ; addps %xmm12,%xmm6
DB 65,15,40,195 ; movaps %xmm11,%xmm0
DB 102,68,15,56,20,206 ; blendvps %xmm0,%xmm6,%xmm9
- DB 15,40,5,42,138,1,0 ; movaps 0x18a2a(%rip),%xmm0 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 15,40,5,106,137,1,0 ; movaps 0x1896a(%rip),%xmm0 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 15,40,208 ; movaps %xmm0,%xmm2
DB 15,92,215 ; subps %xmm7,%xmm2
DB 15,89,226 ; mulps %xmm2,%xmm4
@@ -18707,20 +18707,20 @@ _sk_srcover_rgba_8888_sse41 LABEL PROC
DB 15,133,219,0,0,0 ; jne 14281 <_sk_srcover_rgba_8888_sse41+0xfb>
DB 243,65,15,111,60,128 ; movdqu (%r8,%rax,4),%xmm7
DB 72,133,255 ; test %rdi,%rdi
- DB 102,15,111,37,57,138,1,0 ; movdqa 0x18a39(%rip),%xmm4 # 2cbf0 <_sk_overlay_sse2_8bit+0xf7b>
+ DB 102,15,111,37,121,137,1,0 ; movdqa 0x18979(%rip),%xmm4 # 2cb30 <_sk_overlay_sse2_8bit+0xf80>
DB 102,15,219,231 ; pand %xmm7,%xmm4
DB 15,91,228 ; cvtdq2ps %xmm4,%xmm4
DB 102,15,111,239 ; movdqa %xmm7,%xmm5
- DB 102,15,56,0,45,53,138,1,0 ; pshufb 0x18a35(%rip),%xmm5 # 2cc00 <_sk_overlay_sse2_8bit+0xf8b>
+ DB 102,15,56,0,45,117,137,1,0 ; pshufb 0x18975(%rip),%xmm5 # 2cb40 <_sk_overlay_sse2_8bit+0xf90>
DB 15,91,237 ; cvtdq2ps %xmm5,%xmm5
DB 102,15,111,247 ; movdqa %xmm7,%xmm6
- DB 102,15,56,0,53,53,138,1,0 ; pshufb 0x18a35(%rip),%xmm6 # 2cc10 <_sk_overlay_sse2_8bit+0xf9b>
+ DB 102,15,56,0,53,117,137,1,0 ; pshufb 0x18975(%rip),%xmm6 # 2cb50 <_sk_overlay_sse2_8bit+0xfa0>
DB 15,91,246 ; cvtdq2ps %xmm6,%xmm6
DB 102,15,114,215,24 ; psrld $0x18,%xmm7
DB 15,91,255 ; cvtdq2ps %xmm7,%xmm7
- DB 68,15,40,5,82,137,1,0 ; movaps 0x18952(%rip),%xmm8 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 68,15,40,5,146,136,1,0 ; movaps 0x18892(%rip),%xmm8 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 68,15,92,195 ; subps %xmm3,%xmm8
- DB 68,15,40,37,38,138,1,0 ; movaps 0x18a26(%rip),%xmm12 # 2cc20 <_sk_overlay_sse2_8bit+0xfab>
+ DB 68,15,40,37,102,137,1,0 ; movaps 0x18966(%rip),%xmm12 # 2cb60 <_sk_overlay_sse2_8bit+0xfb0>
DB 65,15,89,196 ; mulps %xmm12,%xmm0
DB 69,15,40,200 ; movaps %xmm8,%xmm9
DB 68,15,89,204 ; mulps %xmm4,%xmm9
@@ -18796,7 +18796,7 @@ _sk_clamp_0_sse41 LABEL PROC
PUBLIC _sk_clamp_1_sse41
_sk_clamp_1_sse41 LABEL PROC
- DB 68,15,40,5,33,136,1,0 ; movaps 0x18821(%rip),%xmm8 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 68,15,40,5,97,135,1,0 ; movaps 0x18761(%rip),%xmm8 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 65,15,93,192 ; minps %xmm8,%xmm0
DB 65,15,93,200 ; minps %xmm8,%xmm1
DB 65,15,93,208 ; minps %xmm8,%xmm2
@@ -18806,7 +18806,7 @@ _sk_clamp_1_sse41 LABEL PROC
PUBLIC _sk_clamp_a_sse41
_sk_clamp_a_sse41 LABEL PROC
- DB 15,93,29,6,136,1,0 ; minps 0x18806(%rip),%xmm3 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 15,93,29,70,135,1,0 ; minps 0x18746(%rip),%xmm3 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 15,93,195 ; minps %xmm3,%xmm0
DB 15,93,203 ; minps %xmm3,%xmm1
DB 15,93,211 ; minps %xmm3,%xmm2
@@ -18815,7 +18815,7 @@ _sk_clamp_a_sse41 LABEL PROC
PUBLIC _sk_clamp_a_dst_sse41
_sk_clamp_a_dst_sse41 LABEL PROC
- DB 15,93,61,242,135,1,0 ; minps 0x187f2(%rip),%xmm7 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 15,93,61,50,135,1,0 ; minps 0x18732(%rip),%xmm7 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 15,93,231 ; minps %xmm7,%xmm4
DB 15,93,239 ; minps %xmm7,%xmm5
DB 15,93,247 ; minps %xmm7,%xmm6
@@ -18844,7 +18844,7 @@ _sk_swap_rb_sse41 LABEL PROC
PUBLIC _sk_invert_sse41
_sk_invert_sse41 LABEL PROC
- DB 68,15,40,5,174,135,1,0 ; movaps 0x187ae(%rip),%xmm8 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 68,15,40,5,238,134,1,0 ; movaps 0x186ee(%rip),%xmm8 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 69,15,40,200 ; movaps %xmm8,%xmm9
DB 68,15,92,200 ; subps %xmm0,%xmm9
DB 69,15,40,208 ; movaps %xmm8,%xmm10
@@ -18896,7 +18896,7 @@ _sk_premul_dst_sse41 LABEL PROC
PUBLIC _sk_unpremul_sse41
_sk_unpremul_sse41 LABEL PROC
DB 69,15,87,192 ; xorps %xmm8,%xmm8
- DB 68,15,40,13,56,135,1,0 ; movaps 0x18738(%rip),%xmm9 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 68,15,40,13,120,134,1,0 ; movaps 0x18678(%rip),%xmm9 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 68,15,94,203 ; divps %xmm3,%xmm9
DB 68,15,194,195,4 ; cmpneqps %xmm3,%xmm8
DB 69,15,84,193 ; andps %xmm9,%xmm8
@@ -18908,20 +18908,20 @@ _sk_unpremul_sse41 LABEL PROC
PUBLIC _sk_from_srgb_sse41
_sk_from_srgb_sse41 LABEL PROC
- DB 68,15,40,29,3,136,1,0 ; movaps 0x18803(%rip),%xmm11 # 2cc30 <_sk_overlay_sse2_8bit+0xfbb>
+ DB 68,15,40,29,67,135,1,0 ; movaps 0x18743(%rip),%xmm11 # 2cb70 <_sk_overlay_sse2_8bit+0xfc0>
DB 68,15,40,200 ; movaps %xmm0,%xmm9
DB 69,15,89,203 ; mulps %xmm11,%xmm9
DB 68,15,40,208 ; movaps %xmm0,%xmm10
DB 69,15,89,210 ; mulps %xmm10,%xmm10
- DB 68,15,40,37,123,135,1,0 ; movaps 0x1877b(%rip),%xmm12 # 2cbc0 <_sk_overlay_sse2_8bit+0xf4b>
+ DB 68,15,40,37,187,134,1,0 ; movaps 0x186bb(%rip),%xmm12 # 2cb00 <_sk_overlay_sse2_8bit+0xf50>
DB 68,15,40,192 ; movaps %xmm0,%xmm8
DB 69,15,89,196 ; mulps %xmm12,%xmm8
- DB 68,15,40,45,235,135,1,0 ; movaps 0x187eb(%rip),%xmm13 # 2cc40 <_sk_overlay_sse2_8bit+0xfcb>
+ DB 68,15,40,45,43,135,1,0 ; movaps 0x1872b(%rip),%xmm13 # 2cb80 <_sk_overlay_sse2_8bit+0xfd0>
DB 69,15,88,197 ; addps %xmm13,%xmm8
DB 69,15,89,194 ; mulps %xmm10,%xmm8
- DB 68,15,40,53,235,135,1,0 ; movaps 0x187eb(%rip),%xmm14 # 2cc50 <_sk_overlay_sse2_8bit+0xfdb>
+ DB 68,15,40,53,43,135,1,0 ; movaps 0x1872b(%rip),%xmm14 # 2cb90 <_sk_overlay_sse2_8bit+0xfe0>
DB 69,15,88,198 ; addps %xmm14,%xmm8
- DB 68,15,40,61,239,135,1,0 ; movaps 0x187ef(%rip),%xmm15 # 2cc60 <_sk_overlay_sse2_8bit+0xfeb>
+ DB 68,15,40,61,47,135,1,0 ; movaps 0x1872f(%rip),%xmm15 # 2cba0 <_sk_overlay_sse2_8bit+0xff0>
DB 65,15,194,199,1 ; cmpltps %xmm15,%xmm0
DB 102,69,15,56,20,193 ; blendvps %xmm0,%xmm9,%xmm8
DB 68,15,40,209 ; movaps %xmm1,%xmm10
@@ -18956,19 +18956,19 @@ PUBLIC _sk_from_srgb_dst_sse41
_sk_from_srgb_dst_sse41 LABEL PROC
DB 68,15,40,204 ; movaps %xmm4,%xmm9
DB 68,15,40,192 ; movaps %xmm0,%xmm8
- DB 68,15,40,29,58,135,1,0 ; movaps 0x1873a(%rip),%xmm11 # 2cc30 <_sk_overlay_sse2_8bit+0xfbb>
+ DB 68,15,40,29,122,134,1,0 ; movaps 0x1867a(%rip),%xmm11 # 2cb70 <_sk_overlay_sse2_8bit+0xfc0>
DB 69,15,40,209 ; movaps %xmm9,%xmm10
DB 69,15,89,211 ; mulps %xmm11,%xmm10
DB 65,15,40,193 ; movaps %xmm9,%xmm0
DB 15,89,192 ; mulps %xmm0,%xmm0
- DB 68,15,40,37,179,134,1,0 ; movaps 0x186b3(%rip),%xmm12 # 2cbc0 <_sk_overlay_sse2_8bit+0xf4b>
+ DB 68,15,40,37,243,133,1,0 ; movaps 0x185f3(%rip),%xmm12 # 2cb00 <_sk_overlay_sse2_8bit+0xf50>
DB 65,15,89,228 ; mulps %xmm12,%xmm4
- DB 68,15,40,45,39,135,1,0 ; movaps 0x18727(%rip),%xmm13 # 2cc40 <_sk_overlay_sse2_8bit+0xfcb>
+ DB 68,15,40,45,103,134,1,0 ; movaps 0x18667(%rip),%xmm13 # 2cb80 <_sk_overlay_sse2_8bit+0xfd0>
DB 65,15,88,229 ; addps %xmm13,%xmm4
DB 15,89,224 ; mulps %xmm0,%xmm4
- DB 68,15,40,53,40,135,1,0 ; movaps 0x18728(%rip),%xmm14 # 2cc50 <_sk_overlay_sse2_8bit+0xfdb>
+ DB 68,15,40,53,104,134,1,0 ; movaps 0x18668(%rip),%xmm14 # 2cb90 <_sk_overlay_sse2_8bit+0xfe0>
DB 65,15,88,230 ; addps %xmm14,%xmm4
- DB 68,15,40,61,44,135,1,0 ; movaps 0x1872c(%rip),%xmm15 # 2cc60 <_sk_overlay_sse2_8bit+0xfeb>
+ DB 68,15,40,61,108,134,1,0 ; movaps 0x1866c(%rip),%xmm15 # 2cba0 <_sk_overlay_sse2_8bit+0xff0>
DB 69,15,194,207,1 ; cmpltps %xmm15,%xmm9
DB 65,15,40,193 ; movaps %xmm9,%xmm0
DB 102,65,15,56,20,226 ; blendvps %xmm0,%xmm10,%xmm4
@@ -19011,22 +19011,22 @@ _sk_to_srgb_sse41 LABEL PROC
DB 15,40,218 ; movaps %xmm2,%xmm3
DB 15,40,209 ; movaps %xmm1,%xmm2
DB 68,15,82,192 ; rsqrtps %xmm0,%xmm8
- DB 68,15,40,29,157,134,1,0 ; movaps 0x1869d(%rip),%xmm11 # 2cc70 <_sk_overlay_sse2_8bit+0xffb>
+ DB 68,15,40,29,221,133,1,0 ; movaps 0x185dd(%rip),%xmm11 # 2cbb0 <_sk_overlay_sse2_8bit+0x1000>
DB 68,15,40,200 ; movaps %xmm0,%xmm9
DB 69,15,89,203 ; mulps %xmm11,%xmm9
- DB 68,15,40,37,157,134,1,0 ; movaps 0x1869d(%rip),%xmm12 # 2cc80 <_sk_overlay_sse2_8bit+0x100b>
+ DB 68,15,40,37,221,133,1,0 ; movaps 0x185dd(%rip),%xmm12 # 2cbc0 <_sk_overlay_sse2_8bit+0x1010>
DB 69,15,40,248 ; movaps %xmm8,%xmm15
DB 69,15,89,252 ; mulps %xmm12,%xmm15
- DB 68,15,40,21,157,134,1,0 ; movaps 0x1869d(%rip),%xmm10 # 2cc90 <_sk_overlay_sse2_8bit+0x101b>
+ DB 68,15,40,21,221,133,1,0 ; movaps 0x185dd(%rip),%xmm10 # 2cbd0 <_sk_overlay_sse2_8bit+0x1020>
DB 69,15,88,250 ; addps %xmm10,%xmm15
DB 69,15,89,248 ; mulps %xmm8,%xmm15
- DB 68,15,40,45,157,134,1,0 ; movaps 0x1869d(%rip),%xmm13 # 2cca0 <_sk_overlay_sse2_8bit+0x102b>
+ DB 68,15,40,45,221,133,1,0 ; movaps 0x185dd(%rip),%xmm13 # 2cbe0 <_sk_overlay_sse2_8bit+0x1030>
DB 69,15,88,253 ; addps %xmm13,%xmm15
- DB 68,15,40,53,161,134,1,0 ; movaps 0x186a1(%rip),%xmm14 # 2ccb0 <_sk_overlay_sse2_8bit+0x103b>
+ DB 68,15,40,53,225,133,1,0 ; movaps 0x185e1(%rip),%xmm14 # 2cbf0 <_sk_overlay_sse2_8bit+0x1040>
DB 69,15,88,198 ; addps %xmm14,%xmm8
DB 69,15,83,192 ; rcpps %xmm8,%xmm8
DB 69,15,89,199 ; mulps %xmm15,%xmm8
- DB 68,15,40,61,157,134,1,0 ; movaps 0x1869d(%rip),%xmm15 # 2ccc0 <_sk_overlay_sse2_8bit+0x104b>
+ DB 68,15,40,61,221,133,1,0 ; movaps 0x185dd(%rip),%xmm15 # 2cc00 <_sk_overlay_sse2_8bit+0x1050>
DB 65,15,194,199,1 ; cmpltps %xmm15,%xmm0
DB 102,69,15,56,20,193 ; blendvps %xmm0,%xmm9,%xmm8
DB 68,15,82,202 ; rsqrtps %xmm2,%xmm9
@@ -19080,7 +19080,7 @@ _sk_rgb_to_hsl_sse41 LABEL PROC
DB 68,15,93,224 ; minps %xmm0,%xmm12
DB 65,15,40,203 ; movaps %xmm11,%xmm1
DB 65,15,92,204 ; subps %xmm12,%xmm1
- DB 68,15,40,53,81,132,1,0 ; movaps 0x18451(%rip),%xmm14 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 68,15,40,53,145,131,1,0 ; movaps 0x18391(%rip),%xmm14 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 68,15,94,241 ; divps %xmm1,%xmm14
DB 69,15,40,211 ; movaps %xmm11,%xmm10
DB 69,15,194,208,0 ; cmpeqps %xmm8,%xmm10
@@ -19089,27 +19089,27 @@ _sk_rgb_to_hsl_sse41 LABEL PROC
DB 65,15,89,198 ; mulps %xmm14,%xmm0
DB 69,15,40,249 ; movaps %xmm9,%xmm15
DB 68,15,194,250,1 ; cmpltps %xmm2,%xmm15
- DB 68,15,84,61,184,133,1,0 ; andps 0x185b8(%rip),%xmm15 # 2ccd0 <_sk_overlay_sse2_8bit+0x105b>
+ DB 68,15,84,61,248,132,1,0 ; andps 0x184f8(%rip),%xmm15 # 2cc10 <_sk_overlay_sse2_8bit+0x1060>
DB 68,15,88,248 ; addps %xmm0,%xmm15
DB 65,15,40,195 ; movaps %xmm11,%xmm0
DB 65,15,194,193,0 ; cmpeqps %xmm9,%xmm0
DB 65,15,92,208 ; subps %xmm8,%xmm2
DB 65,15,89,214 ; mulps %xmm14,%xmm2
- DB 68,15,40,45,171,133,1,0 ; movaps 0x185ab(%rip),%xmm13 # 2cce0 <_sk_overlay_sse2_8bit+0x106b>
+ DB 68,15,40,45,235,132,1,0 ; movaps 0x184eb(%rip),%xmm13 # 2cc20 <_sk_overlay_sse2_8bit+0x1070>
DB 65,15,88,213 ; addps %xmm13,%xmm2
DB 69,15,92,193 ; subps %xmm9,%xmm8
DB 69,15,89,198 ; mulps %xmm14,%xmm8
- DB 68,15,88,5,167,133,1,0 ; addps 0x185a7(%rip),%xmm8 # 2ccf0 <_sk_overlay_sse2_8bit+0x107b>
+ DB 68,15,88,5,231,132,1,0 ; addps 0x184e7(%rip),%xmm8 # 2cc30 <_sk_overlay_sse2_8bit+0x1080>
DB 102,68,15,56,20,194 ; blendvps %xmm0,%xmm2,%xmm8
DB 65,15,40,194 ; movaps %xmm10,%xmm0
DB 102,69,15,56,20,199 ; blendvps %xmm0,%xmm15,%xmm8
- DB 68,15,89,5,159,133,1,0 ; mulps 0x1859f(%rip),%xmm8 # 2cd00 <_sk_overlay_sse2_8bit+0x108b>
+ DB 68,15,89,5,223,132,1,0 ; mulps 0x184df(%rip),%xmm8 # 2cc40 <_sk_overlay_sse2_8bit+0x1090>
DB 69,15,40,203 ; movaps %xmm11,%xmm9
DB 69,15,194,204,4 ; cmpneqps %xmm12,%xmm9
DB 69,15,84,193 ; andps %xmm9,%xmm8
DB 69,15,92,235 ; subps %xmm11,%xmm13
DB 69,15,88,220 ; addps %xmm12,%xmm11
- DB 15,40,5,163,131,1,0 ; movaps 0x183a3(%rip),%xmm0 # 2cb20 <_sk_overlay_sse2_8bit+0xeab>
+ DB 15,40,5,227,130,1,0 ; movaps 0x182e3(%rip),%xmm0 # 2ca60 <_sk_overlay_sse2_8bit+0xeb0>
DB 65,15,40,211 ; movaps %xmm11,%xmm2
DB 15,89,208 ; mulps %xmm0,%xmm2
DB 15,194,194,1 ; cmpltps %xmm2,%xmm0
@@ -19130,7 +19130,7 @@ _sk_hsl_to_rgb_sse41 LABEL PROC
DB 15,41,100,36,32 ; movaps %xmm4,0x20(%rsp)
DB 15,41,92,36,16 ; movaps %xmm3,0x10(%rsp)
DB 68,15,40,208 ; movaps %xmm0,%xmm10
- DB 68,15,40,13,85,131,1,0 ; movaps 0x18355(%rip),%xmm9 # 2cb20 <_sk_overlay_sse2_8bit+0xeab>
+ DB 68,15,40,13,149,130,1,0 ; movaps 0x18295(%rip),%xmm9 # 2ca60 <_sk_overlay_sse2_8bit+0xeb0>
DB 65,15,40,193 ; movaps %xmm9,%xmm0
DB 15,194,194,2 ; cmpleps %xmm2,%xmm0
DB 15,40,217 ; movaps %xmm1,%xmm3
@@ -19143,19 +19143,19 @@ _sk_hsl_to_rgb_sse41 LABEL PROC
DB 15,41,20,36 ; movaps %xmm2,(%rsp)
DB 69,15,88,192 ; addps %xmm8,%xmm8
DB 68,15,92,197 ; subps %xmm5,%xmm8
- DB 68,15,40,53,17,133,1,0 ; movaps 0x18511(%rip),%xmm14 # 2cd10 <_sk_overlay_sse2_8bit+0x109b>
+ DB 68,15,40,53,81,132,1,0 ; movaps 0x18451(%rip),%xmm14 # 2cc50 <_sk_overlay_sse2_8bit+0x10a0>
DB 69,15,88,242 ; addps %xmm10,%xmm14
DB 102,65,15,58,8,198,1 ; roundps $0x1,%xmm14,%xmm0
DB 68,15,92,240 ; subps %xmm0,%xmm14
- DB 68,15,40,29,10,133,1,0 ; movaps 0x1850a(%rip),%xmm11 # 2cd20 <_sk_overlay_sse2_8bit+0x10ab>
+ DB 68,15,40,29,74,132,1,0 ; movaps 0x1844a(%rip),%xmm11 # 2cc60 <_sk_overlay_sse2_8bit+0x10b0>
DB 65,15,40,195 ; movaps %xmm11,%xmm0
DB 65,15,194,198,2 ; cmpleps %xmm14,%xmm0
DB 15,40,245 ; movaps %xmm5,%xmm6
DB 65,15,92,240 ; subps %xmm8,%xmm6
- DB 15,40,61,163,132,1,0 ; movaps 0x184a3(%rip),%xmm7 # 2ccd0 <_sk_overlay_sse2_8bit+0x105b>
+ DB 15,40,61,227,131,1,0 ; movaps 0x183e3(%rip),%xmm7 # 2cc10 <_sk_overlay_sse2_8bit+0x1060>
DB 69,15,40,238 ; movaps %xmm14,%xmm13
DB 68,15,89,239 ; mulps %xmm7,%xmm13
- DB 15,40,29,180,132,1,0 ; movaps 0x184b4(%rip),%xmm3 # 2ccf0 <_sk_overlay_sse2_8bit+0x107b>
+ DB 15,40,29,244,131,1,0 ; movaps 0x183f4(%rip),%xmm3 # 2cc30 <_sk_overlay_sse2_8bit+0x1080>
DB 68,15,40,227 ; movaps %xmm3,%xmm12
DB 69,15,92,229 ; subps %xmm13,%xmm12
DB 68,15,89,230 ; mulps %xmm6,%xmm12
@@ -19165,7 +19165,7 @@ _sk_hsl_to_rgb_sse41 LABEL PROC
DB 65,15,194,198,2 ; cmpleps %xmm14,%xmm0
DB 68,15,40,253 ; movaps %xmm5,%xmm15
DB 102,69,15,56,20,252 ; blendvps %xmm0,%xmm12,%xmm15
- DB 68,15,40,37,147,132,1,0 ; movaps 0x18493(%rip),%xmm12 # 2cd00 <_sk_overlay_sse2_8bit+0x108b>
+ DB 68,15,40,37,211,131,1,0 ; movaps 0x183d3(%rip),%xmm12 # 2cc40 <_sk_overlay_sse2_8bit+0x1090>
DB 65,15,40,196 ; movaps %xmm12,%xmm0
DB 65,15,194,198,2 ; cmpleps %xmm14,%xmm0
DB 68,15,89,238 ; mulps %xmm6,%xmm13
@@ -19199,7 +19199,7 @@ _sk_hsl_to_rgb_sse41 LABEL PROC
DB 65,15,40,198 ; movaps %xmm14,%xmm0
DB 15,40,20,36 ; movaps (%rsp),%xmm2
DB 102,15,56,20,202 ; blendvps %xmm0,%xmm2,%xmm1
- DB 68,15,88,21,44,132,1,0 ; addps 0x1842c(%rip),%xmm10 # 2cd30 <_sk_overlay_sse2_8bit+0x10bb>
+ DB 68,15,88,21,108,131,1,0 ; addps 0x1836c(%rip),%xmm10 # 2cc70 <_sk_overlay_sse2_8bit+0x10c0>
DB 102,65,15,58,8,194,1 ; roundps $0x1,%xmm10,%xmm0
DB 68,15,92,208 ; subps %xmm0,%xmm10
DB 69,15,194,218,2 ; cmpleps %xmm10,%xmm11
@@ -19253,9 +19253,9 @@ _sk_scale_u8_sse41 LABEL PROC
DB 72,133,255 ; test %rdi,%rdi
DB 117,52 ; jne 149ef <_sk_scale_u8_sse41+0x4c>
DB 102,71,15,56,49,4,16 ; pmovzxbd (%r8,%r10,1),%xmm8
- DB 102,68,15,219,5,37,130,1,0 ; pand 0x18225(%rip),%xmm8 # 2cbf0 <_sk_overlay_sse2_8bit+0xf7b>
+ DB 102,68,15,219,5,101,129,1,0 ; pand 0x18165(%rip),%xmm8 # 2cb30 <_sk_overlay_sse2_8bit+0xf80>
DB 69,15,91,192 ; cvtdq2ps %xmm8,%xmm8
- DB 68,15,89,5,105,131,1,0 ; mulps 0x18369(%rip),%xmm8 # 2cd40 <_sk_overlay_sse2_8bit+0x10cb>
+ DB 68,15,89,5,169,130,1,0 ; mulps 0x182a9(%rip),%xmm8 # 2cc80 <_sk_overlay_sse2_8bit+0x10d0>
DB 65,15,89,192 ; mulps %xmm8,%xmm0
DB 65,15,89,200 ; mulps %xmm8,%xmm1
DB 65,15,89,208 ; mulps %xmm8,%xmm2
@@ -19297,17 +19297,17 @@ _sk_scale_565_sse41 LABEL PROC
DB 72,133,255 ; test %rdi,%rdi
DB 15,133,159,0,0,0 ; jne 14b09 <_sk_scale_565_sse41+0xc3>
DB 102,71,15,56,51,28,80 ; pmovzxwd (%r8,%r10,2),%xmm11
- DB 102,15,111,5,215,130,1,0 ; movdqa 0x182d7(%rip),%xmm0 # 2cd50 <_sk_overlay_sse2_8bit+0x10db>
+ DB 102,15,111,5,23,130,1,0 ; movdqa 0x18217(%rip),%xmm0 # 2cc90 <_sk_overlay_sse2_8bit+0x10e0>
DB 102,65,15,219,195 ; pand %xmm11,%xmm0
DB 68,15,91,200 ; cvtdq2ps %xmm0,%xmm9
- DB 68,15,89,13,214,130,1,0 ; mulps 0x182d6(%rip),%xmm9 # 2cd60 <_sk_overlay_sse2_8bit+0x10eb>
- DB 102,15,111,5,222,130,1,0 ; movdqa 0x182de(%rip),%xmm0 # 2cd70 <_sk_overlay_sse2_8bit+0x10fb>
+ DB 68,15,89,13,22,130,1,0 ; mulps 0x18216(%rip),%xmm9 # 2cca0 <_sk_overlay_sse2_8bit+0x10f0>
+ DB 102,15,111,5,30,130,1,0 ; movdqa 0x1821e(%rip),%xmm0 # 2ccb0 <_sk_overlay_sse2_8bit+0x1100>
DB 102,65,15,219,195 ; pand %xmm11,%xmm0
DB 68,15,91,208 ; cvtdq2ps %xmm0,%xmm10
- DB 68,15,89,21,221,130,1,0 ; mulps 0x182dd(%rip),%xmm10 # 2cd80 <_sk_overlay_sse2_8bit+0x110b>
- DB 102,68,15,219,29,228,130,1,0 ; pand 0x182e4(%rip),%xmm11 # 2cd90 <_sk_overlay_sse2_8bit+0x111b>
+ DB 68,15,89,21,29,130,1,0 ; mulps 0x1821d(%rip),%xmm10 # 2ccc0 <_sk_overlay_sse2_8bit+0x1110>
+ DB 102,68,15,219,29,36,130,1,0 ; pand 0x18224(%rip),%xmm11 # 2ccd0 <_sk_overlay_sse2_8bit+0x1120>
DB 69,15,91,219 ; cvtdq2ps %xmm11,%xmm11
- DB 68,15,89,29,232,130,1,0 ; mulps 0x182e8(%rip),%xmm11 # 2cda0 <_sk_overlay_sse2_8bit+0x112b>
+ DB 68,15,89,29,40,130,1,0 ; mulps 0x18228(%rip),%xmm11 # 2cce0 <_sk_overlay_sse2_8bit+0x1130>
DB 15,40,195 ; movaps %xmm3,%xmm0
DB 15,194,199,1 ; cmpltps %xmm7,%xmm0
DB 69,15,40,226 ; movaps %xmm10,%xmm12
@@ -19380,9 +19380,9 @@ _sk_lerp_u8_sse41 LABEL PROC
DB 72,133,255 ; test %rdi,%rdi
DB 117,72 ; jne 14bf9 <_sk_lerp_u8_sse41+0x60>
DB 102,71,15,56,49,4,16 ; pmovzxbd (%r8,%r10,1),%xmm8
- DB 102,68,15,219,5,47,128,1,0 ; pand 0x1802f(%rip),%xmm8 # 2cbf0 <_sk_overlay_sse2_8bit+0xf7b>
+ DB 102,68,15,219,5,111,127,1,0 ; pand 0x17f6f(%rip),%xmm8 # 2cb30 <_sk_overlay_sse2_8bit+0xf80>
DB 69,15,91,192 ; cvtdq2ps %xmm8,%xmm8
- DB 68,15,89,5,115,129,1,0 ; mulps 0x18173(%rip),%xmm8 # 2cd40 <_sk_overlay_sse2_8bit+0x10cb>
+ DB 68,15,89,5,179,128,1,0 ; mulps 0x180b3(%rip),%xmm8 # 2cc80 <_sk_overlay_sse2_8bit+0x10d0>
DB 15,92,196 ; subps %xmm4,%xmm0
DB 65,15,89,192 ; mulps %xmm8,%xmm0
DB 15,88,196 ; addps %xmm4,%xmm0
@@ -19431,17 +19431,17 @@ _sk_lerp_565_sse41 LABEL PROC
DB 72,133,255 ; test %rdi,%rdi
DB 15,133,165,0,0,0 ; jne 14d1c <_sk_lerp_565_sse41+0xc9>
DB 102,71,15,56,51,20,80 ; pmovzxwd (%r8,%r10,2),%xmm10
- DB 102,15,111,5,202,128,1,0 ; movdqa 0x180ca(%rip),%xmm0 # 2cd50 <_sk_overlay_sse2_8bit+0x10db>
+ DB 102,15,111,5,10,128,1,0 ; movdqa 0x1800a(%rip),%xmm0 # 2cc90 <_sk_overlay_sse2_8bit+0x10e0>
DB 102,65,15,219,194 ; pand %xmm10,%xmm0
DB 68,15,91,200 ; cvtdq2ps %xmm0,%xmm9
- DB 68,15,89,13,201,128,1,0 ; mulps 0x180c9(%rip),%xmm9 # 2cd60 <_sk_overlay_sse2_8bit+0x10eb>
- DB 102,15,111,5,209,128,1,0 ; movdqa 0x180d1(%rip),%xmm0 # 2cd70 <_sk_overlay_sse2_8bit+0x10fb>
+ DB 68,15,89,13,9,128,1,0 ; mulps 0x18009(%rip),%xmm9 # 2cca0 <_sk_overlay_sse2_8bit+0x10f0>
+ DB 102,15,111,5,17,128,1,0 ; movdqa 0x18011(%rip),%xmm0 # 2ccb0 <_sk_overlay_sse2_8bit+0x1100>
DB 102,65,15,219,194 ; pand %xmm10,%xmm0
DB 68,15,91,216 ; cvtdq2ps %xmm0,%xmm11
- DB 68,15,89,29,208,128,1,0 ; mulps 0x180d0(%rip),%xmm11 # 2cd80 <_sk_overlay_sse2_8bit+0x110b>
- DB 102,68,15,219,21,215,128,1,0 ; pand 0x180d7(%rip),%xmm10 # 2cd90 <_sk_overlay_sse2_8bit+0x111b>
+ DB 68,15,89,29,16,128,1,0 ; mulps 0x18010(%rip),%xmm11 # 2ccc0 <_sk_overlay_sse2_8bit+0x1110>
+ DB 102,68,15,219,21,23,128,1,0 ; pand 0x18017(%rip),%xmm10 # 2ccd0 <_sk_overlay_sse2_8bit+0x1120>
DB 69,15,91,210 ; cvtdq2ps %xmm10,%xmm10
- DB 68,15,89,21,219,128,1,0 ; mulps 0x180db(%rip),%xmm10 # 2cda0 <_sk_overlay_sse2_8bit+0x112b>
+ DB 68,15,89,21,27,128,1,0 ; mulps 0x1801b(%rip),%xmm10 # 2cce0 <_sk_overlay_sse2_8bit+0x1130>
DB 15,40,195 ; movaps %xmm3,%xmm0
DB 15,194,199,1 ; cmpltps %xmm7,%xmm0
DB 69,15,40,227 ; movaps %xmm11,%xmm12
@@ -19495,7 +19495,7 @@ _sk_load_tables_sse41 LABEL PROC
DB 243,69,15,111,4,144 ; movdqu (%r8,%rdx,4),%xmm8
DB 65,86 ; push %r14
DB 83 ; push %rbx
- DB 102,15,111,5,93,126,1,0 ; movdqa 0x17e5d(%rip),%xmm0 # 2cbf0 <_sk_overlay_sse2_8bit+0xf7b>
+ DB 102,15,111,5,157,125,1,0 ; movdqa 0x17d9d(%rip),%xmm0 # 2cb30 <_sk_overlay_sse2_8bit+0xf80>
DB 102,65,15,219,192 ; pand %xmm8,%xmm0
DB 102,73,15,58,22,192,1 ; pextrq $0x1,%xmm0,%r8
DB 102,73,15,126,193 ; movq %xmm0,%r9
@@ -19510,7 +19510,7 @@ _sk_load_tables_sse41 LABEL PROC
DB 102,66,15,58,33,4,155,32 ; insertps $0x20,(%rbx,%r11,4),%xmm0
DB 102,66,15,58,33,4,3,48 ; insertps $0x30,(%rbx,%r8,1),%xmm0
DB 102,65,15,111,200 ; movdqa %xmm8,%xmm1
- DB 102,15,56,0,13,24,126,1,0 ; pshufb 0x17e18(%rip),%xmm1 # 2cc00 <_sk_overlay_sse2_8bit+0xf8b>
+ DB 102,15,56,0,13,88,125,1,0 ; pshufb 0x17d58(%rip),%xmm1 # 2cb40 <_sk_overlay_sse2_8bit+0xf90>
DB 102,73,15,58,22,200,1 ; pextrq $0x1,%xmm1,%r8
DB 102,72,15,126,203 ; movq %xmm1,%rbx
DB 68,15,182,203 ; movzbl %bl,%r9d
@@ -19525,7 +19525,7 @@ _sk_load_tables_sse41 LABEL PROC
DB 102,15,58,33,202,48 ; insertps $0x30,%xmm2,%xmm1
DB 76,139,64,24 ; mov 0x18(%rax),%r8
DB 102,65,15,111,208 ; movdqa %xmm8,%xmm2
- DB 102,15,56,0,21,212,125,1,0 ; pshufb 0x17dd4(%rip),%xmm2 # 2cc10 <_sk_overlay_sse2_8bit+0xf9b>
+ DB 102,15,56,0,21,20,125,1,0 ; pshufb 0x17d14(%rip),%xmm2 # 2cb50 <_sk_overlay_sse2_8bit+0xfa0>
DB 102,72,15,58,22,211,1 ; pextrq $0x1,%xmm2,%rbx
DB 102,72,15,126,208 ; movq %xmm2,%rax
DB 68,15,182,200 ; movzbl %al,%r9d
@@ -19540,7 +19540,7 @@ _sk_load_tables_sse41 LABEL PROC
DB 102,15,58,33,211,48 ; insertps $0x30,%xmm3,%xmm2
DB 102,65,15,114,208,24 ; psrld $0x18,%xmm8
DB 65,15,91,216 ; cvtdq2ps %xmm8,%xmm3
- DB 15,89,29,177,126,1,0 ; mulps 0x17eb1(%rip),%xmm3 # 2cd40 <_sk_overlay_sse2_8bit+0x10cb>
+ DB 15,89,29,241,125,1,0 ; mulps 0x17df1(%rip),%xmm3 # 2cc80 <_sk_overlay_sse2_8bit+0x10d0>
DB 72,173 ; lods %ds:(%rsi),%rax
DB 91 ; pop %rbx
DB 65,94 ; pop %r14
@@ -19579,7 +19579,7 @@ _sk_load_tables_u16_be_sse41 LABEL PROC
DB 102,65,15,111,201 ; movdqa %xmm9,%xmm1
DB 102,15,97,200 ; punpcklwd %xmm0,%xmm1
DB 102,68,15,105,200 ; punpckhwd %xmm0,%xmm9
- DB 102,68,15,111,5,131,126,1,0 ; movdqa 0x17e83(%rip),%xmm8 # 2cdb0 <_sk_overlay_sse2_8bit+0x113b>
+ DB 102,68,15,111,5,195,125,1,0 ; movdqa 0x17dc3(%rip),%xmm8 # 2ccf0 <_sk_overlay_sse2_8bit+0x1140>
DB 102,15,111,193 ; movdqa %xmm1,%xmm0
DB 102,65,15,219,192 ; pand %xmm8,%xmm0
DB 102,15,56,51,192 ; pmovzxwd %xmm0,%xmm0
@@ -19597,7 +19597,7 @@ _sk_load_tables_u16_be_sse41 LABEL PROC
DB 102,15,58,33,194,32 ; insertps $0x20,%xmm2,%xmm0
DB 243,66,15,16,20,3 ; movss (%rbx,%r8,1),%xmm2
DB 102,15,58,33,194,48 ; insertps $0x30,%xmm2,%xmm0
- DB 102,15,56,0,13,50,126,1,0 ; pshufb 0x17e32(%rip),%xmm1 # 2cdc0 <_sk_overlay_sse2_8bit+0x114b>
+ DB 102,15,56,0,13,114,125,1,0 ; pshufb 0x17d72(%rip),%xmm1 # 2cd00 <_sk_overlay_sse2_8bit+0x1150>
DB 102,15,56,51,201 ; pmovzxwd %xmm1,%xmm1
DB 102,73,15,58,22,200,1 ; pextrq $0x1,%xmm1,%r8
DB 102,72,15,126,203 ; movq %xmm1,%rbx
@@ -19633,7 +19633,7 @@ _sk_load_tables_u16_be_sse41 LABEL PROC
DB 102,65,15,235,216 ; por %xmm8,%xmm3
DB 102,15,56,51,219 ; pmovzxwd %xmm3,%xmm3
DB 15,91,219 ; cvtdq2ps %xmm3,%xmm3
- DB 15,89,29,128,125,1,0 ; mulps 0x17d80(%rip),%xmm3 # 2cdd0 <_sk_overlay_sse2_8bit+0x115b>
+ DB 15,89,29,192,124,1,0 ; mulps 0x17cc0(%rip),%xmm3 # 2cd10 <_sk_overlay_sse2_8bit+0x1160>
DB 72,173 ; lods %ds:(%rsi),%rax
DB 91 ; pop %rbx
DB 65,94 ; pop %r14
@@ -19671,7 +19671,7 @@ _sk_load_tables_rgb_u16_be_sse41 LABEL PROC
DB 102,68,15,97,200 ; punpcklwd %xmm0,%xmm9
DB 102,15,111,202 ; movdqa %xmm2,%xmm1
DB 102,65,15,97,201 ; punpcklwd %xmm9,%xmm1
- DB 102,68,15,111,5,201,124,1,0 ; movdqa 0x17cc9(%rip),%xmm8 # 2cdb0 <_sk_overlay_sse2_8bit+0x113b>
+ DB 102,68,15,111,5,9,124,1,0 ; movdqa 0x17c09(%rip),%xmm8 # 2ccf0 <_sk_overlay_sse2_8bit+0x1140>
DB 102,15,111,193 ; movdqa %xmm1,%xmm0
DB 102,65,15,219,192 ; pand %xmm8,%xmm0
DB 102,15,56,51,192 ; pmovzxwd %xmm0,%xmm0
@@ -19689,7 +19689,7 @@ _sk_load_tables_rgb_u16_be_sse41 LABEL PROC
DB 102,15,58,33,195,32 ; insertps $0x20,%xmm3,%xmm0
DB 243,66,15,16,28,3 ; movss (%rbx,%r8,1),%xmm3
DB 102,15,58,33,195,48 ; insertps $0x30,%xmm3,%xmm0
- DB 102,15,56,0,13,152,124,1,0 ; pshufb 0x17c98(%rip),%xmm1 # 2cde0 <_sk_overlay_sse2_8bit+0x116b>
+ DB 102,15,56,0,13,216,123,1,0 ; pshufb 0x17bd8(%rip),%xmm1 # 2cd20 <_sk_overlay_sse2_8bit+0x1170>
DB 102,15,56,51,201 ; pmovzxwd %xmm1,%xmm1
DB 102,73,15,58,22,200,1 ; pextrq $0x1,%xmm1,%r8
DB 102,72,15,126,203 ; movq %xmm1,%rbx
@@ -19720,7 +19720,7 @@ _sk_load_tables_rgb_u16_be_sse41 LABEL PROC
DB 243,65,15,16,28,24 ; movss (%r8,%rbx,1),%xmm3
DB 102,15,58,33,211,48 ; insertps $0x30,%xmm3,%xmm2
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 15,40,29,83,121,1,0 ; movaps 0x17953(%rip),%xmm3 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 15,40,29,147,120,1,0 ; movaps 0x17893(%rip),%xmm3 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 91 ; pop %rbx
DB 65,94 ; pop %r14
DB 255,224 ; jmpq *%rax
@@ -19750,7 +19750,7 @@ _sk_byte_tables_sse41 LABEL PROC
DB 65,86 ; push %r14
DB 83 ; push %rbx
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 68,15,40,5,191,121,1,0 ; movaps 0x179bf(%rip),%xmm8 # 2cc20 <_sk_overlay_sse2_8bit+0xfab>
+ DB 68,15,40,5,255,120,1,0 ; movaps 0x178ff(%rip),%xmm8 # 2cb60 <_sk_overlay_sse2_8bit+0xfb0>
DB 65,15,89,192 ; mulps %xmm8,%xmm0
DB 102,15,91,192 ; cvtps2dq %xmm0,%xmm0
DB 102,73,15,58,22,192,1 ; pextrq $0x1,%xmm0,%r8
@@ -19769,7 +19769,7 @@ _sk_byte_tables_sse41 LABEL PROC
DB 102,15,58,32,195,3 ; pinsrb $0x3,%ebx,%xmm0
DB 102,15,56,49,192 ; pmovzxbd %xmm0,%xmm0
DB 15,91,192 ; cvtdq2ps %xmm0,%xmm0
- DB 68,15,40,13,128,122,1,0 ; movaps 0x17a80(%rip),%xmm9 # 2cd40 <_sk_overlay_sse2_8bit+0x10cb>
+ DB 68,15,40,13,192,121,1,0 ; movaps 0x179c0(%rip),%xmm9 # 2cc80 <_sk_overlay_sse2_8bit+0x10d0>
DB 65,15,89,193 ; mulps %xmm9,%xmm0
DB 65,15,89,200 ; mulps %xmm8,%xmm1
DB 102,15,91,201 ; cvtps2dq %xmm1,%xmm1
@@ -19861,7 +19861,7 @@ _sk_byte_tables_rgb_sse41 LABEL PROC
DB 102,15,58,32,195,3 ; pinsrb $0x3,%ebx,%xmm0
DB 102,15,56,49,192 ; pmovzxbd %xmm0,%xmm0
DB 15,91,192 ; cvtdq2ps %xmm0,%xmm0
- DB 68,15,40,13,236,120,1,0 ; movaps 0x178ec(%rip),%xmm9 # 2cd40 <_sk_overlay_sse2_8bit+0x10cb>
+ DB 68,15,40,13,44,120,1,0 ; movaps 0x1782c(%rip),%xmm9 # 2cc80 <_sk_overlay_sse2_8bit+0x10d0>
DB 65,15,89,193 ; mulps %xmm9,%xmm0
DB 65,15,89,200 ; mulps %xmm8,%xmm1
DB 102,15,91,201 ; cvtps2dq %xmm1,%xmm1
@@ -20029,31 +20029,31 @@ _sk_parametric_r_sse41 LABEL PROC
DB 69,15,88,208 ; addps %xmm8,%xmm10
DB 69,15,198,219,0 ; shufps $0x0,%xmm11,%xmm11
DB 69,15,91,194 ; cvtdq2ps %xmm10,%xmm8
- DB 68,15,89,5,222,118,1,0 ; mulps 0x176de(%rip),%xmm8 # 2cdf0 <_sk_overlay_sse2_8bit+0x117b>
- DB 68,15,84,21,230,118,1,0 ; andps 0x176e6(%rip),%xmm10 # 2ce00 <_sk_overlay_sse2_8bit+0x118b>
- DB 68,15,86,21,254,115,1,0 ; orps 0x173fe(%rip),%xmm10 # 2cb20 <_sk_overlay_sse2_8bit+0xeab>
- DB 68,15,88,5,230,118,1,0 ; addps 0x176e6(%rip),%xmm8 # 2ce10 <_sk_overlay_sse2_8bit+0x119b>
- DB 68,15,40,37,238,118,1,0 ; movaps 0x176ee(%rip),%xmm12 # 2ce20 <_sk_overlay_sse2_8bit+0x11ab>
+ DB 68,15,89,5,30,118,1,0 ; mulps 0x1761e(%rip),%xmm8 # 2cd30 <_sk_overlay_sse2_8bit+0x1180>
+ DB 68,15,84,21,38,118,1,0 ; andps 0x17626(%rip),%xmm10 # 2cd40 <_sk_overlay_sse2_8bit+0x1190>
+ DB 68,15,86,21,62,115,1,0 ; orps 0x1733e(%rip),%xmm10 # 2ca60 <_sk_overlay_sse2_8bit+0xeb0>
+ DB 68,15,88,5,38,118,1,0 ; addps 0x17626(%rip),%xmm8 # 2cd50 <_sk_overlay_sse2_8bit+0x11a0>
+ DB 68,15,40,37,46,118,1,0 ; movaps 0x1762e(%rip),%xmm12 # 2cd60 <_sk_overlay_sse2_8bit+0x11b0>
DB 69,15,89,226 ; mulps %xmm10,%xmm12
DB 69,15,92,196 ; subps %xmm12,%xmm8
- DB 68,15,88,21,238,118,1,0 ; addps 0x176ee(%rip),%xmm10 # 2ce30 <_sk_overlay_sse2_8bit+0x11bb>
- DB 68,15,40,37,246,118,1,0 ; movaps 0x176f6(%rip),%xmm12 # 2ce40 <_sk_overlay_sse2_8bit+0x11cb>
+ DB 68,15,88,21,46,118,1,0 ; addps 0x1762e(%rip),%xmm10 # 2cd70 <_sk_overlay_sse2_8bit+0x11c0>
+ DB 68,15,40,37,54,118,1,0 ; movaps 0x17636(%rip),%xmm12 # 2cd80 <_sk_overlay_sse2_8bit+0x11d0>
DB 69,15,94,226 ; divps %xmm10,%xmm12
DB 69,15,92,196 ; subps %xmm12,%xmm8
DB 69,15,89,195 ; mulps %xmm11,%xmm8
DB 102,69,15,58,8,208,1 ; roundps $0x1,%xmm8,%xmm10
DB 69,15,40,216 ; movaps %xmm8,%xmm11
DB 69,15,92,218 ; subps %xmm10,%xmm11
- DB 68,15,88,5,227,118,1,0 ; addps 0x176e3(%rip),%xmm8 # 2ce50 <_sk_overlay_sse2_8bit+0x11db>
- DB 68,15,40,21,235,118,1,0 ; movaps 0x176eb(%rip),%xmm10 # 2ce60 <_sk_overlay_sse2_8bit+0x11eb>
+ DB 68,15,88,5,35,118,1,0 ; addps 0x17623(%rip),%xmm8 # 2cd90 <_sk_overlay_sse2_8bit+0x11e0>
+ DB 68,15,40,21,43,118,1,0 ; movaps 0x1762b(%rip),%xmm10 # 2cda0 <_sk_overlay_sse2_8bit+0x11f0>
DB 69,15,89,211 ; mulps %xmm11,%xmm10
DB 69,15,92,194 ; subps %xmm10,%xmm8
- DB 68,15,40,21,235,118,1,0 ; movaps 0x176eb(%rip),%xmm10 # 2ce70 <_sk_overlay_sse2_8bit+0x11fb>
+ DB 68,15,40,21,43,118,1,0 ; movaps 0x1762b(%rip),%xmm10 # 2cdb0 <_sk_overlay_sse2_8bit+0x1200>
DB 69,15,92,211 ; subps %xmm11,%xmm10
- DB 68,15,40,29,239,118,1,0 ; movaps 0x176ef(%rip),%xmm11 # 2ce80 <_sk_overlay_sse2_8bit+0x120b>
+ DB 68,15,40,29,47,118,1,0 ; movaps 0x1762f(%rip),%xmm11 # 2cdc0 <_sk_overlay_sse2_8bit+0x1210>
DB 69,15,94,218 ; divps %xmm10,%xmm11
DB 69,15,88,216 ; addps %xmm8,%xmm11
- DB 68,15,89,29,239,118,1,0 ; mulps 0x176ef(%rip),%xmm11 # 2ce90 <_sk_overlay_sse2_8bit+0x121b>
+ DB 68,15,89,29,47,118,1,0 ; mulps 0x1762f(%rip),%xmm11 # 2cdd0 <_sk_overlay_sse2_8bit+0x1220>
DB 102,69,15,91,211 ; cvtps2dq %xmm11,%xmm10
DB 243,68,15,16,64,20 ; movss 0x14(%rax),%xmm8
DB 69,15,198,192,0 ; shufps $0x0,%xmm8,%xmm8
@@ -20061,7 +20061,7 @@ _sk_parametric_r_sse41 LABEL PROC
DB 102,69,15,56,20,193 ; blendvps %xmm0,%xmm9,%xmm8
DB 15,87,192 ; xorps %xmm0,%xmm0
DB 68,15,95,192 ; maxps %xmm0,%xmm8
- DB 68,15,93,5,118,115,1,0 ; minps 0x17376(%rip),%xmm8 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 68,15,93,5,182,114,1,0 ; minps 0x172b6(%rip),%xmm8 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 72,173 ; lods %ds:(%rsi),%rax
DB 65,15,40,192 ; movaps %xmm8,%xmm0
DB 255,224 ; jmpq *%rax
@@ -20089,31 +20089,31 @@ _sk_parametric_g_sse41 LABEL PROC
DB 68,15,88,217 ; addps %xmm1,%xmm11
DB 69,15,198,210,0 ; shufps $0x0,%xmm10,%xmm10
DB 69,15,91,227 ; cvtdq2ps %xmm11,%xmm12
- DB 68,15,89,37,183,117,1,0 ; mulps 0x175b7(%rip),%xmm12 # 2cdf0 <_sk_overlay_sse2_8bit+0x117b>
- DB 68,15,84,29,191,117,1,0 ; andps 0x175bf(%rip),%xmm11 # 2ce00 <_sk_overlay_sse2_8bit+0x118b>
- DB 68,15,86,29,215,114,1,0 ; orps 0x172d7(%rip),%xmm11 # 2cb20 <_sk_overlay_sse2_8bit+0xeab>
- DB 68,15,88,37,191,117,1,0 ; addps 0x175bf(%rip),%xmm12 # 2ce10 <_sk_overlay_sse2_8bit+0x119b>
- DB 15,40,13,200,117,1,0 ; movaps 0x175c8(%rip),%xmm1 # 2ce20 <_sk_overlay_sse2_8bit+0x11ab>
+ DB 68,15,89,37,247,116,1,0 ; mulps 0x174f7(%rip),%xmm12 # 2cd30 <_sk_overlay_sse2_8bit+0x1180>
+ DB 68,15,84,29,255,116,1,0 ; andps 0x174ff(%rip),%xmm11 # 2cd40 <_sk_overlay_sse2_8bit+0x1190>
+ DB 68,15,86,29,23,114,1,0 ; orps 0x17217(%rip),%xmm11 # 2ca60 <_sk_overlay_sse2_8bit+0xeb0>
+ DB 68,15,88,37,255,116,1,0 ; addps 0x174ff(%rip),%xmm12 # 2cd50 <_sk_overlay_sse2_8bit+0x11a0>
+ DB 15,40,13,8,117,1,0 ; movaps 0x17508(%rip),%xmm1 # 2cd60 <_sk_overlay_sse2_8bit+0x11b0>
DB 65,15,89,203 ; mulps %xmm11,%xmm1
DB 68,15,92,225 ; subps %xmm1,%xmm12
- DB 68,15,88,29,200,117,1,0 ; addps 0x175c8(%rip),%xmm11 # 2ce30 <_sk_overlay_sse2_8bit+0x11bb>
- DB 15,40,13,209,117,1,0 ; movaps 0x175d1(%rip),%xmm1 # 2ce40 <_sk_overlay_sse2_8bit+0x11cb>
+ DB 68,15,88,29,8,117,1,0 ; addps 0x17508(%rip),%xmm11 # 2cd70 <_sk_overlay_sse2_8bit+0x11c0>
+ DB 15,40,13,17,117,1,0 ; movaps 0x17511(%rip),%xmm1 # 2cd80 <_sk_overlay_sse2_8bit+0x11d0>
DB 65,15,94,203 ; divps %xmm11,%xmm1
DB 68,15,92,225 ; subps %xmm1,%xmm12
DB 69,15,89,226 ; mulps %xmm10,%xmm12
DB 102,69,15,58,8,212,1 ; roundps $0x1,%xmm12,%xmm10
DB 69,15,40,220 ; movaps %xmm12,%xmm11
DB 69,15,92,218 ; subps %xmm10,%xmm11
- DB 68,15,88,37,190,117,1,0 ; addps 0x175be(%rip),%xmm12 # 2ce50 <_sk_overlay_sse2_8bit+0x11db>
- DB 15,40,13,199,117,1,0 ; movaps 0x175c7(%rip),%xmm1 # 2ce60 <_sk_overlay_sse2_8bit+0x11eb>
+ DB 68,15,88,37,254,116,1,0 ; addps 0x174fe(%rip),%xmm12 # 2cd90 <_sk_overlay_sse2_8bit+0x11e0>
+ DB 15,40,13,7,117,1,0 ; movaps 0x17507(%rip),%xmm1 # 2cda0 <_sk_overlay_sse2_8bit+0x11f0>
DB 65,15,89,203 ; mulps %xmm11,%xmm1
DB 68,15,92,225 ; subps %xmm1,%xmm12
- DB 68,15,40,21,199,117,1,0 ; movaps 0x175c7(%rip),%xmm10 # 2ce70 <_sk_overlay_sse2_8bit+0x11fb>
+ DB 68,15,40,21,7,117,1,0 ; movaps 0x17507(%rip),%xmm10 # 2cdb0 <_sk_overlay_sse2_8bit+0x1200>
DB 69,15,92,211 ; subps %xmm11,%xmm10
- DB 15,40,13,204,117,1,0 ; movaps 0x175cc(%rip),%xmm1 # 2ce80 <_sk_overlay_sse2_8bit+0x120b>
+ DB 15,40,13,12,117,1,0 ; movaps 0x1750c(%rip),%xmm1 # 2cdc0 <_sk_overlay_sse2_8bit+0x1210>
DB 65,15,94,202 ; divps %xmm10,%xmm1
DB 65,15,88,204 ; addps %xmm12,%xmm1
- DB 15,89,13,205,117,1,0 ; mulps 0x175cd(%rip),%xmm1 # 2ce90 <_sk_overlay_sse2_8bit+0x121b>
+ DB 15,89,13,13,117,1,0 ; mulps 0x1750d(%rip),%xmm1 # 2cdd0 <_sk_overlay_sse2_8bit+0x1220>
DB 102,68,15,91,209 ; cvtps2dq %xmm1,%xmm10
DB 243,15,16,72,20 ; movss 0x14(%rax),%xmm1
DB 15,198,201,0 ; shufps $0x0,%xmm1,%xmm1
@@ -20121,7 +20121,7 @@ _sk_parametric_g_sse41 LABEL PROC
DB 102,65,15,56,20,201 ; blendvps %xmm0,%xmm9,%xmm1
DB 15,87,192 ; xorps %xmm0,%xmm0
DB 15,95,200 ; maxps %xmm0,%xmm1
- DB 15,93,13,88,114,1,0 ; minps 0x17258(%rip),%xmm1 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 15,93,13,152,113,1,0 ; minps 0x17198(%rip),%xmm1 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 72,173 ; lods %ds:(%rsi),%rax
DB 65,15,40,192 ; movaps %xmm8,%xmm0
DB 255,224 ; jmpq *%rax
@@ -20149,31 +20149,31 @@ _sk_parametric_b_sse41 LABEL PROC
DB 68,15,88,218 ; addps %xmm2,%xmm11
DB 69,15,198,210,0 ; shufps $0x0,%xmm10,%xmm10
DB 69,15,91,227 ; cvtdq2ps %xmm11,%xmm12
- DB 68,15,89,37,153,116,1,0 ; mulps 0x17499(%rip),%xmm12 # 2cdf0 <_sk_overlay_sse2_8bit+0x117b>
- DB 68,15,84,29,161,116,1,0 ; andps 0x174a1(%rip),%xmm11 # 2ce00 <_sk_overlay_sse2_8bit+0x118b>
- DB 68,15,86,29,185,113,1,0 ; orps 0x171b9(%rip),%xmm11 # 2cb20 <_sk_overlay_sse2_8bit+0xeab>
- DB 68,15,88,37,161,116,1,0 ; addps 0x174a1(%rip),%xmm12 # 2ce10 <_sk_overlay_sse2_8bit+0x119b>
- DB 15,40,21,170,116,1,0 ; movaps 0x174aa(%rip),%xmm2 # 2ce20 <_sk_overlay_sse2_8bit+0x11ab>
+ DB 68,15,89,37,217,115,1,0 ; mulps 0x173d9(%rip),%xmm12 # 2cd30 <_sk_overlay_sse2_8bit+0x1180>
+ DB 68,15,84,29,225,115,1,0 ; andps 0x173e1(%rip),%xmm11 # 2cd40 <_sk_overlay_sse2_8bit+0x1190>
+ DB 68,15,86,29,249,112,1,0 ; orps 0x170f9(%rip),%xmm11 # 2ca60 <_sk_overlay_sse2_8bit+0xeb0>
+ DB 68,15,88,37,225,115,1,0 ; addps 0x173e1(%rip),%xmm12 # 2cd50 <_sk_overlay_sse2_8bit+0x11a0>
+ DB 15,40,21,234,115,1,0 ; movaps 0x173ea(%rip),%xmm2 # 2cd60 <_sk_overlay_sse2_8bit+0x11b0>
DB 65,15,89,211 ; mulps %xmm11,%xmm2
DB 68,15,92,226 ; subps %xmm2,%xmm12
- DB 68,15,88,29,170,116,1,0 ; addps 0x174aa(%rip),%xmm11 # 2ce30 <_sk_overlay_sse2_8bit+0x11bb>
- DB 15,40,21,179,116,1,0 ; movaps 0x174b3(%rip),%xmm2 # 2ce40 <_sk_overlay_sse2_8bit+0x11cb>
+ DB 68,15,88,29,234,115,1,0 ; addps 0x173ea(%rip),%xmm11 # 2cd70 <_sk_overlay_sse2_8bit+0x11c0>
+ DB 15,40,21,243,115,1,0 ; movaps 0x173f3(%rip),%xmm2 # 2cd80 <_sk_overlay_sse2_8bit+0x11d0>
DB 65,15,94,211 ; divps %xmm11,%xmm2
DB 68,15,92,226 ; subps %xmm2,%xmm12
DB 69,15,89,226 ; mulps %xmm10,%xmm12
DB 102,69,15,58,8,212,1 ; roundps $0x1,%xmm12,%xmm10
DB 69,15,40,220 ; movaps %xmm12,%xmm11
DB 69,15,92,218 ; subps %xmm10,%xmm11
- DB 68,15,88,37,160,116,1,0 ; addps 0x174a0(%rip),%xmm12 # 2ce50 <_sk_overlay_sse2_8bit+0x11db>
- DB 15,40,21,169,116,1,0 ; movaps 0x174a9(%rip),%xmm2 # 2ce60 <_sk_overlay_sse2_8bit+0x11eb>
+ DB 68,15,88,37,224,115,1,0 ; addps 0x173e0(%rip),%xmm12 # 2cd90 <_sk_overlay_sse2_8bit+0x11e0>
+ DB 15,40,21,233,115,1,0 ; movaps 0x173e9(%rip),%xmm2 # 2cda0 <_sk_overlay_sse2_8bit+0x11f0>
DB 65,15,89,211 ; mulps %xmm11,%xmm2
DB 68,15,92,226 ; subps %xmm2,%xmm12
- DB 68,15,40,21,169,116,1,0 ; movaps 0x174a9(%rip),%xmm10 # 2ce70 <_sk_overlay_sse2_8bit+0x11fb>
+ DB 68,15,40,21,233,115,1,0 ; movaps 0x173e9(%rip),%xmm10 # 2cdb0 <_sk_overlay_sse2_8bit+0x1200>
DB 69,15,92,211 ; subps %xmm11,%xmm10
- DB 15,40,21,174,116,1,0 ; movaps 0x174ae(%rip),%xmm2 # 2ce80 <_sk_overlay_sse2_8bit+0x120b>
+ DB 15,40,21,238,115,1,0 ; movaps 0x173ee(%rip),%xmm2 # 2cdc0 <_sk_overlay_sse2_8bit+0x1210>
DB 65,15,94,210 ; divps %xmm10,%xmm2
DB 65,15,88,212 ; addps %xmm12,%xmm2
- DB 15,89,21,175,116,1,0 ; mulps 0x174af(%rip),%xmm2 # 2ce90 <_sk_overlay_sse2_8bit+0x121b>
+ DB 15,89,21,239,115,1,0 ; mulps 0x173ef(%rip),%xmm2 # 2cdd0 <_sk_overlay_sse2_8bit+0x1220>
DB 102,68,15,91,210 ; cvtps2dq %xmm2,%xmm10
DB 243,15,16,80,20 ; movss 0x14(%rax),%xmm2
DB 15,198,210,0 ; shufps $0x0,%xmm2,%xmm2
@@ -20181,7 +20181,7 @@ _sk_parametric_b_sse41 LABEL PROC
DB 102,65,15,56,20,209 ; blendvps %xmm0,%xmm9,%xmm2
DB 15,87,192 ; xorps %xmm0,%xmm0
DB 15,95,208 ; maxps %xmm0,%xmm2
- DB 15,93,21,58,113,1,0 ; minps 0x1713a(%rip),%xmm2 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 15,93,21,122,112,1,0 ; minps 0x1707a(%rip),%xmm2 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 72,173 ; lods %ds:(%rsi),%rax
DB 65,15,40,192 ; movaps %xmm8,%xmm0
DB 255,224 ; jmpq *%rax
@@ -20209,31 +20209,31 @@ _sk_parametric_a_sse41 LABEL PROC
DB 68,15,88,219 ; addps %xmm3,%xmm11
DB 69,15,198,210,0 ; shufps $0x0,%xmm10,%xmm10
DB 69,15,91,227 ; cvtdq2ps %xmm11,%xmm12
- DB 68,15,89,37,123,115,1,0 ; mulps 0x1737b(%rip),%xmm12 # 2cdf0 <_sk_overlay_sse2_8bit+0x117b>
- DB 68,15,84,29,131,115,1,0 ; andps 0x17383(%rip),%xmm11 # 2ce00 <_sk_overlay_sse2_8bit+0x118b>
- DB 68,15,86,29,155,112,1,0 ; orps 0x1709b(%rip),%xmm11 # 2cb20 <_sk_overlay_sse2_8bit+0xeab>
- DB 68,15,88,37,131,115,1,0 ; addps 0x17383(%rip),%xmm12 # 2ce10 <_sk_overlay_sse2_8bit+0x119b>
- DB 15,40,29,140,115,1,0 ; movaps 0x1738c(%rip),%xmm3 # 2ce20 <_sk_overlay_sse2_8bit+0x11ab>
+ DB 68,15,89,37,187,114,1,0 ; mulps 0x172bb(%rip),%xmm12 # 2cd30 <_sk_overlay_sse2_8bit+0x1180>
+ DB 68,15,84,29,195,114,1,0 ; andps 0x172c3(%rip),%xmm11 # 2cd40 <_sk_overlay_sse2_8bit+0x1190>
+ DB 68,15,86,29,219,111,1,0 ; orps 0x16fdb(%rip),%xmm11 # 2ca60 <_sk_overlay_sse2_8bit+0xeb0>
+ DB 68,15,88,37,195,114,1,0 ; addps 0x172c3(%rip),%xmm12 # 2cd50 <_sk_overlay_sse2_8bit+0x11a0>
+ DB 15,40,29,204,114,1,0 ; movaps 0x172cc(%rip),%xmm3 # 2cd60 <_sk_overlay_sse2_8bit+0x11b0>
DB 65,15,89,219 ; mulps %xmm11,%xmm3
DB 68,15,92,227 ; subps %xmm3,%xmm12
- DB 68,15,88,29,140,115,1,0 ; addps 0x1738c(%rip),%xmm11 # 2ce30 <_sk_overlay_sse2_8bit+0x11bb>
- DB 15,40,29,149,115,1,0 ; movaps 0x17395(%rip),%xmm3 # 2ce40 <_sk_overlay_sse2_8bit+0x11cb>
+ DB 68,15,88,29,204,114,1,0 ; addps 0x172cc(%rip),%xmm11 # 2cd70 <_sk_overlay_sse2_8bit+0x11c0>
+ DB 15,40,29,213,114,1,0 ; movaps 0x172d5(%rip),%xmm3 # 2cd80 <_sk_overlay_sse2_8bit+0x11d0>
DB 65,15,94,219 ; divps %xmm11,%xmm3
DB 68,15,92,227 ; subps %xmm3,%xmm12
DB 69,15,89,226 ; mulps %xmm10,%xmm12
DB 102,69,15,58,8,212,1 ; roundps $0x1,%xmm12,%xmm10
DB 69,15,40,220 ; movaps %xmm12,%xmm11
DB 69,15,92,218 ; subps %xmm10,%xmm11
- DB 68,15,88,37,130,115,1,0 ; addps 0x17382(%rip),%xmm12 # 2ce50 <_sk_overlay_sse2_8bit+0x11db>
- DB 15,40,29,139,115,1,0 ; movaps 0x1738b(%rip),%xmm3 # 2ce60 <_sk_overlay_sse2_8bit+0x11eb>
+ DB 68,15,88,37,194,114,1,0 ; addps 0x172c2(%rip),%xmm12 # 2cd90 <_sk_overlay_sse2_8bit+0x11e0>
+ DB 15,40,29,203,114,1,0 ; movaps 0x172cb(%rip),%xmm3 # 2cda0 <_sk_overlay_sse2_8bit+0x11f0>
DB 65,15,89,219 ; mulps %xmm11,%xmm3
DB 68,15,92,227 ; subps %xmm3,%xmm12
- DB 68,15,40,21,139,115,1,0 ; movaps 0x1738b(%rip),%xmm10 # 2ce70 <_sk_overlay_sse2_8bit+0x11fb>
+ DB 68,15,40,21,203,114,1,0 ; movaps 0x172cb(%rip),%xmm10 # 2cdb0 <_sk_overlay_sse2_8bit+0x1200>
DB 69,15,92,211 ; subps %xmm11,%xmm10
- DB 15,40,29,144,115,1,0 ; movaps 0x17390(%rip),%xmm3 # 2ce80 <_sk_overlay_sse2_8bit+0x120b>
+ DB 15,40,29,208,114,1,0 ; movaps 0x172d0(%rip),%xmm3 # 2cdc0 <_sk_overlay_sse2_8bit+0x1210>
DB 65,15,94,218 ; divps %xmm10,%xmm3
DB 65,15,88,220 ; addps %xmm12,%xmm3
- DB 15,89,29,145,115,1,0 ; mulps 0x17391(%rip),%xmm3 # 2ce90 <_sk_overlay_sse2_8bit+0x121b>
+ DB 15,89,29,209,114,1,0 ; mulps 0x172d1(%rip),%xmm3 # 2cdd0 <_sk_overlay_sse2_8bit+0x1220>
DB 102,68,15,91,211 ; cvtps2dq %xmm3,%xmm10
DB 243,15,16,88,20 ; movss 0x14(%rax),%xmm3
DB 15,198,219,0 ; shufps $0x0,%xmm3,%xmm3
@@ -20241,7 +20241,7 @@ _sk_parametric_a_sse41 LABEL PROC
DB 102,65,15,56,20,217 ; blendvps %xmm0,%xmm9,%xmm3
DB 15,87,192 ; xorps %xmm0,%xmm0
DB 15,95,216 ; maxps %xmm0,%xmm3
- DB 15,93,29,28,112,1,0 ; minps 0x1701c(%rip),%xmm3 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 15,93,29,92,111,1,0 ; minps 0x16f5c(%rip),%xmm3 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 72,173 ; lods %ds:(%rsi),%rax
DB 65,15,40,192 ; movaps %xmm8,%xmm0
DB 255,224 ; jmpq *%rax
@@ -20257,20 +20257,20 @@ _sk_gamma_sse41 LABEL PROC
DB 15,40,218 ; movaps %xmm2,%xmm3
DB 15,40,208 ; movaps %xmm0,%xmm2
DB 15,91,194 ; cvtdq2ps %xmm2,%xmm0
- DB 15,89,5,152,114,1,0 ; mulps 0x17298(%rip),%xmm0 # 2cdf0 <_sk_overlay_sse2_8bit+0x117b>
- DB 68,15,40,53,160,114,1,0 ; movaps 0x172a0(%rip),%xmm14 # 2ce00 <_sk_overlay_sse2_8bit+0x118b>
+ DB 15,89,5,216,113,1,0 ; mulps 0x171d8(%rip),%xmm0 # 2cd30 <_sk_overlay_sse2_8bit+0x1180>
+ DB 68,15,40,53,224,113,1,0 ; movaps 0x171e0(%rip),%xmm14 # 2cd40 <_sk_overlay_sse2_8bit+0x1190>
DB 65,15,84,214 ; andps %xmm14,%xmm2
- DB 68,15,40,37,180,111,1,0 ; movaps 0x16fb4(%rip),%xmm12 # 2cb20 <_sk_overlay_sse2_8bit+0xeab>
+ DB 68,15,40,37,244,110,1,0 ; movaps 0x16ef4(%rip),%xmm12 # 2ca60 <_sk_overlay_sse2_8bit+0xeb0>
DB 65,15,86,212 ; orps %xmm12,%xmm2
- DB 68,15,40,21,152,114,1,0 ; movaps 0x17298(%rip),%xmm10 # 2ce10 <_sk_overlay_sse2_8bit+0x119b>
+ DB 68,15,40,21,216,113,1,0 ; movaps 0x171d8(%rip),%xmm10 # 2cd50 <_sk_overlay_sse2_8bit+0x11a0>
DB 65,15,88,194 ; addps %xmm10,%xmm0
- DB 68,15,40,29,156,114,1,0 ; movaps 0x1729c(%rip),%xmm11 # 2ce20 <_sk_overlay_sse2_8bit+0x11ab>
+ DB 68,15,40,29,220,113,1,0 ; movaps 0x171dc(%rip),%xmm11 # 2cd60 <_sk_overlay_sse2_8bit+0x11b0>
DB 15,40,226 ; movaps %xmm2,%xmm4
DB 65,15,89,227 ; mulps %xmm11,%xmm4
DB 15,92,196 ; subps %xmm4,%xmm0
- DB 68,15,40,13,154,114,1,0 ; movaps 0x1729a(%rip),%xmm9 # 2ce30 <_sk_overlay_sse2_8bit+0x11bb>
+ DB 68,15,40,13,218,113,1,0 ; movaps 0x171da(%rip),%xmm9 # 2cd70 <_sk_overlay_sse2_8bit+0x11c0>
DB 65,15,88,209 ; addps %xmm9,%xmm2
- DB 68,15,40,45,158,114,1,0 ; movaps 0x1729e(%rip),%xmm13 # 2ce40 <_sk_overlay_sse2_8bit+0x11cb>
+ DB 68,15,40,45,222,113,1,0 ; movaps 0x171de(%rip),%xmm13 # 2cd80 <_sk_overlay_sse2_8bit+0x11d0>
DB 65,15,40,229 ; movaps %xmm13,%xmm4
DB 15,94,226 ; divps %xmm2,%xmm4
DB 72,173 ; lods %ds:(%rsi),%rax
@@ -20281,21 +20281,21 @@ _sk_gamma_sse41 LABEL PROC
DB 102,15,58,8,208,1 ; roundps $0x1,%xmm0,%xmm2
DB 15,40,224 ; movaps %xmm0,%xmm4
DB 15,92,226 ; subps %xmm2,%xmm4
- DB 15,40,53,129,114,1,0 ; movaps 0x17281(%rip),%xmm6 # 2ce50 <_sk_overlay_sse2_8bit+0x11db>
+ DB 15,40,53,193,113,1,0 ; movaps 0x171c1(%rip),%xmm6 # 2cd90 <_sk_overlay_sse2_8bit+0x11e0>
DB 15,88,198 ; addps %xmm6,%xmm0
- DB 15,40,61,151,114,1,0 ; movaps 0x17297(%rip),%xmm7 # 2ce70 <_sk_overlay_sse2_8bit+0x11fb>
+ DB 15,40,61,215,113,1,0 ; movaps 0x171d7(%rip),%xmm7 # 2cdb0 <_sk_overlay_sse2_8bit+0x1200>
DB 15,40,239 ; movaps %xmm7,%xmm5
DB 15,92,236 ; subps %xmm4,%xmm5
DB 15,40,212 ; movaps %xmm4,%xmm2
- DB 15,40,37,119,114,1,0 ; movaps 0x17277(%rip),%xmm4 # 2ce60 <_sk_overlay_sse2_8bit+0x11eb>
+ DB 15,40,37,183,113,1,0 ; movaps 0x171b7(%rip),%xmm4 # 2cda0 <_sk_overlay_sse2_8bit+0x11f0>
DB 15,89,212 ; mulps %xmm4,%xmm2
DB 15,92,194 ; subps %xmm2,%xmm0
- DB 68,15,40,61,137,114,1,0 ; movaps 0x17289(%rip),%xmm15 # 2ce80 <_sk_overlay_sse2_8bit+0x120b>
+ DB 68,15,40,61,201,113,1,0 ; movaps 0x171c9(%rip),%xmm15 # 2cdc0 <_sk_overlay_sse2_8bit+0x1210>
DB 65,15,40,215 ; movaps %xmm15,%xmm2
DB 15,94,213 ; divps %xmm5,%xmm2
DB 15,88,208 ; addps %xmm0,%xmm2
DB 15,91,193 ; cvtdq2ps %xmm1,%xmm0
- DB 15,89,5,229,113,1,0 ; mulps 0x171e5(%rip),%xmm0 # 2cdf0 <_sk_overlay_sse2_8bit+0x117b>
+ DB 15,89,5,37,113,1,0 ; mulps 0x17125(%rip),%xmm0 # 2cd30 <_sk_overlay_sse2_8bit+0x1180>
DB 65,15,84,206 ; andps %xmm14,%xmm1
DB 65,15,86,204 ; orps %xmm12,%xmm1
DB 65,15,88,194 ; addps %xmm10,%xmm0
@@ -20321,8 +20321,8 @@ _sk_gamma_sse41 LABEL PROC
DB 15,94,206 ; divps %xmm6,%xmm1
DB 15,88,200 ; addps %xmm0,%xmm1
DB 15,91,195 ; cvtdq2ps %xmm3,%xmm0
- DB 15,89,5,134,113,1,0 ; mulps 0x17186(%rip),%xmm0 # 2cdf0 <_sk_overlay_sse2_8bit+0x117b>
- DB 15,84,29,143,113,1,0 ; andps 0x1718f(%rip),%xmm3 # 2ce00 <_sk_overlay_sse2_8bit+0x118b>
+ DB 15,89,5,198,112,1,0 ; mulps 0x170c6(%rip),%xmm0 # 2cd30 <_sk_overlay_sse2_8bit+0x1180>
+ DB 15,84,29,207,112,1,0 ; andps 0x170cf(%rip),%xmm3 # 2cd40 <_sk_overlay_sse2_8bit+0x1190>
DB 65,15,86,220 ; orps %xmm12,%xmm3
DB 65,15,88,194 ; addps %xmm10,%xmm0
DB 68,15,89,219 ; mulps %xmm3,%xmm11
@@ -20340,7 +20340,7 @@ _sk_gamma_sse41 LABEL PROC
DB 15,92,253 ; subps %xmm5,%xmm7
DB 68,15,94,255 ; divps %xmm7,%xmm15
DB 68,15,88,248 ; addps %xmm0,%xmm15
- DB 15,40,5,215,113,1,0 ; movaps 0x171d7(%rip),%xmm0 # 2ce90 <_sk_overlay_sse2_8bit+0x121b>
+ DB 15,40,5,23,113,1,0 ; movaps 0x17117(%rip),%xmm0 # 2cdd0 <_sk_overlay_sse2_8bit+0x1220>
DB 15,89,208 ; mulps %xmm0,%xmm2
DB 15,89,200 ; mulps %xmm0,%xmm1
DB 68,15,89,248 ; mulps %xmm0,%xmm15
@@ -20359,29 +20359,29 @@ _sk_gamma_sse41 LABEL PROC
PUBLIC _sk_lab_to_xyz_sse41
_sk_lab_to_xyz_sse41 LABEL PROC
DB 68,15,40,192 ; movaps %xmm0,%xmm8
- DB 68,15,89,5,164,113,1,0 ; mulps 0x171a4(%rip),%xmm8 # 2cea0 <_sk_overlay_sse2_8bit+0x122b>
- DB 68,15,40,13,28,111,1,0 ; movaps 0x16f1c(%rip),%xmm9 # 2cc20 <_sk_overlay_sse2_8bit+0xfab>
+ DB 68,15,89,5,228,112,1,0 ; mulps 0x170e4(%rip),%xmm8 # 2cde0 <_sk_overlay_sse2_8bit+0x1230>
+ DB 68,15,40,13,92,110,1,0 ; movaps 0x16e5c(%rip),%xmm9 # 2cb60 <_sk_overlay_sse2_8bit+0xfb0>
DB 65,15,89,201 ; mulps %xmm9,%xmm1
- DB 15,40,5,161,113,1,0 ; movaps 0x171a1(%rip),%xmm0 # 2ceb0 <_sk_overlay_sse2_8bit+0x123b>
+ DB 15,40,5,225,112,1,0 ; movaps 0x170e1(%rip),%xmm0 # 2cdf0 <_sk_overlay_sse2_8bit+0x1240>
DB 15,88,200 ; addps %xmm0,%xmm1
DB 65,15,89,209 ; mulps %xmm9,%xmm2
DB 15,88,208 ; addps %xmm0,%xmm2
- DB 68,15,88,5,159,113,1,0 ; addps 0x1719f(%rip),%xmm8 # 2cec0 <_sk_overlay_sse2_8bit+0x124b>
- DB 68,15,89,5,167,113,1,0 ; mulps 0x171a7(%rip),%xmm8 # 2ced0 <_sk_overlay_sse2_8bit+0x125b>
- DB 15,89,13,176,113,1,0 ; mulps 0x171b0(%rip),%xmm1 # 2cee0 <_sk_overlay_sse2_8bit+0x126b>
+ DB 68,15,88,5,223,112,1,0 ; addps 0x170df(%rip),%xmm8 # 2ce00 <_sk_overlay_sse2_8bit+0x1250>
+ DB 68,15,89,5,231,112,1,0 ; mulps 0x170e7(%rip),%xmm8 # 2ce10 <_sk_overlay_sse2_8bit+0x1260>
+ DB 15,89,13,240,112,1,0 ; mulps 0x170f0(%rip),%xmm1 # 2ce20 <_sk_overlay_sse2_8bit+0x1270>
DB 65,15,88,200 ; addps %xmm8,%xmm1
- DB 15,89,21,181,113,1,0 ; mulps 0x171b5(%rip),%xmm2 # 2cef0 <_sk_overlay_sse2_8bit+0x127b>
+ DB 15,89,21,245,112,1,0 ; mulps 0x170f5(%rip),%xmm2 # 2ce30 <_sk_overlay_sse2_8bit+0x1280>
DB 69,15,40,208 ; movaps %xmm8,%xmm10
DB 68,15,92,210 ; subps %xmm2,%xmm10
DB 68,15,40,217 ; movaps %xmm1,%xmm11
DB 69,15,89,219 ; mulps %xmm11,%xmm11
DB 68,15,89,217 ; mulps %xmm1,%xmm11
- DB 68,15,40,13,169,113,1,0 ; movaps 0x171a9(%rip),%xmm9 # 2cf00 <_sk_overlay_sse2_8bit+0x128b>
+ DB 68,15,40,13,233,112,1,0 ; movaps 0x170e9(%rip),%xmm9 # 2ce40 <_sk_overlay_sse2_8bit+0x1290>
DB 65,15,40,193 ; movaps %xmm9,%xmm0
DB 65,15,194,195,1 ; cmpltps %xmm11,%xmm0
- DB 15,40,21,169,113,1,0 ; movaps 0x171a9(%rip),%xmm2 # 2cf10 <_sk_overlay_sse2_8bit+0x129b>
+ DB 15,40,21,233,112,1,0 ; movaps 0x170e9(%rip),%xmm2 # 2ce50 <_sk_overlay_sse2_8bit+0x12a0>
DB 15,88,202 ; addps %xmm2,%xmm1
- DB 68,15,40,37,174,113,1,0 ; movaps 0x171ae(%rip),%xmm12 # 2cf20 <_sk_overlay_sse2_8bit+0x12ab>
+ DB 68,15,40,37,238,112,1,0 ; movaps 0x170ee(%rip),%xmm12 # 2ce60 <_sk_overlay_sse2_8bit+0x12b0>
DB 65,15,89,204 ; mulps %xmm12,%xmm1
DB 102,65,15,56,20,203 ; blendvps %xmm0,%xmm11,%xmm1
DB 69,15,40,216 ; movaps %xmm8,%xmm11
@@ -20400,8 +20400,8 @@ _sk_lab_to_xyz_sse41 LABEL PROC
DB 65,15,89,212 ; mulps %xmm12,%xmm2
DB 65,15,40,193 ; movaps %xmm9,%xmm0
DB 102,65,15,56,20,211 ; blendvps %xmm0,%xmm11,%xmm2
- DB 15,89,13,103,113,1,0 ; mulps 0x17167(%rip),%xmm1 # 2cf30 <_sk_overlay_sse2_8bit+0x12bb>
- DB 15,89,21,112,113,1,0 ; mulps 0x17170(%rip),%xmm2 # 2cf40 <_sk_overlay_sse2_8bit+0x12cb>
+ DB 15,89,13,167,112,1,0 ; mulps 0x170a7(%rip),%xmm1 # 2ce70 <_sk_overlay_sse2_8bit+0x12c0>
+ DB 15,89,21,176,112,1,0 ; mulps 0x170b0(%rip),%xmm2 # 2ce80 <_sk_overlay_sse2_8bit+0x12d0>
DB 72,173 ; lods %ds:(%rsi),%rax
DB 15,40,193 ; movaps %xmm1,%xmm0
DB 65,15,40,200 ; movaps %xmm8,%xmm1
@@ -20418,9 +20418,9 @@ _sk_load_a8_sse41 LABEL PROC
DB 72,133,255 ; test %rdi,%rdi
DB 117,39 ; jne 15e1a <_sk_load_a8_sse41+0x3f>
DB 102,67,15,56,49,4,16 ; pmovzxbd (%r8,%r10,1),%xmm0
- DB 102,15,219,5,238,109,1,0 ; pand 0x16dee(%rip),%xmm0 # 2cbf0 <_sk_overlay_sse2_8bit+0xf7b>
+ DB 102,15,219,5,46,109,1,0 ; pand 0x16d2e(%rip),%xmm0 # 2cb30 <_sk_overlay_sse2_8bit+0xf80>
DB 15,91,216 ; cvtdq2ps %xmm0,%xmm3
- DB 15,89,29,52,111,1,0 ; mulps 0x16f34(%rip),%xmm3 # 2cd40 <_sk_overlay_sse2_8bit+0x10cb>
+ DB 15,89,29,116,110,1,0 ; mulps 0x16e74(%rip),%xmm3 # 2cc80 <_sk_overlay_sse2_8bit+0x10d0>
DB 72,173 ; lods %ds:(%rsi),%rax
DB 15,87,192 ; xorps %xmm0,%xmm0
DB 102,15,239,201 ; pxor %xmm1,%xmm1
@@ -20458,9 +20458,9 @@ _sk_load_a8_dst_sse41 LABEL PROC
DB 72,133,255 ; test %rdi,%rdi
DB 117,39 ; jne 15ea6 <_sk_load_a8_dst_sse41+0x3f>
DB 102,67,15,56,49,36,16 ; pmovzxbd (%r8,%r10,1),%xmm4
- DB 102,15,219,37,98,109,1,0 ; pand 0x16d62(%rip),%xmm4 # 2cbf0 <_sk_overlay_sse2_8bit+0xf7b>
+ DB 102,15,219,37,162,108,1,0 ; pand 0x16ca2(%rip),%xmm4 # 2cb30 <_sk_overlay_sse2_8bit+0xf80>
DB 15,91,252 ; cvtdq2ps %xmm4,%xmm7
- DB 15,89,61,168,110,1,0 ; mulps 0x16ea8(%rip),%xmm7 # 2cd40 <_sk_overlay_sse2_8bit+0x10cb>
+ DB 15,89,61,232,109,1,0 ; mulps 0x16de8(%rip),%xmm7 # 2cc80 <_sk_overlay_sse2_8bit+0x10d0>
DB 72,173 ; lods %ds:(%rsi),%rax
DB 15,87,228 ; xorps %xmm4,%xmm4
DB 102,15,239,237 ; pxor %xmm5,%xmm5
@@ -20511,7 +20511,7 @@ _sk_gather_a8_sse41 LABEL PROC
DB 102,15,58,32,192,3 ; pinsrb $0x3,%eax,%xmm0
DB 102,15,56,49,192 ; pmovzxbd %xmm0,%xmm0
DB 15,91,216 ; cvtdq2ps %xmm0,%xmm3
- DB 15,89,29,221,109,1,0 ; mulps 0x16ddd(%rip),%xmm3 # 2cd40 <_sk_overlay_sse2_8bit+0x10cb>
+ DB 15,89,29,29,109,1,0 ; mulps 0x16d1d(%rip),%xmm3 # 2cc80 <_sk_overlay_sse2_8bit+0x10d0>
DB 72,173 ; lods %ds:(%rsi),%rax
DB 15,87,192 ; xorps %xmm0,%xmm0
DB 102,15,239,201 ; pxor %xmm1,%xmm1
@@ -20527,7 +20527,7 @@ _sk_store_a8_sse41 LABEL PROC
DB 77,15,175,193 ; imul %r9,%r8
DB 76,3,0 ; add (%rax),%r8
DB 76,99,210 ; movslq %edx,%r10
- DB 68,15,40,5,143,108,1,0 ; movaps 0x16c8f(%rip),%xmm8 # 2cc20 <_sk_overlay_sse2_8bit+0xfab>
+ DB 68,15,40,5,207,107,1,0 ; movaps 0x16bcf(%rip),%xmm8 # 2cb60 <_sk_overlay_sse2_8bit+0xfb0>
DB 68,15,89,195 ; mulps %xmm3,%xmm8
DB 102,69,15,91,192 ; cvtps2dq %xmm8,%xmm8
DB 102,69,15,56,43,192 ; packusdw %xmm8,%xmm8
@@ -20549,7 +20549,7 @@ _sk_store_a8_sse41 LABEL PROC
DB 65,128,249,3 ; cmp $0x3,%r9b
DB 117,217 ; jne 15fb3 <_sk_store_a8_sse41+0x41>
DB 102,71,15,58,20,68,16,2,8 ; pextrb $0x8,%xmm8,0x2(%r8,%r10,1)
- DB 102,68,15,56,0,5,99,111,1,0 ; pshufb 0x16f63(%rip),%xmm8 # 2cf50 <_sk_overlay_sse2_8bit+0x12db>
+ DB 102,68,15,56,0,5,163,110,1,0 ; pshufb 0x16ea3(%rip),%xmm8 # 2ce90 <_sk_overlay_sse2_8bit+0x12e0>
DB 102,71,15,58,21,4,16,0 ; pextrw $0x0,%xmm8,(%r8,%r10,1)
DB 235,188 ; jmp 15fb3 <_sk_store_a8_sse41+0x41>
DB 102,71,15,58,20,4,16,0 ; pextrb $0x0,%xmm8,(%r8,%r10,1)
@@ -20566,11 +20566,11 @@ _sk_load_g8_sse41 LABEL PROC
DB 72,133,255 ; test %rdi,%rdi
DB 117,42 ; jne 16043 <_sk_load_g8_sse41+0x42>
DB 102,67,15,56,49,4,16 ; pmovzxbd (%r8,%r10,1),%xmm0
- DB 102,15,219,5,200,107,1,0 ; pand 0x16bc8(%rip),%xmm0 # 2cbf0 <_sk_overlay_sse2_8bit+0xf7b>
+ DB 102,15,219,5,8,107,1,0 ; pand 0x16b08(%rip),%xmm0 # 2cb30 <_sk_overlay_sse2_8bit+0xf80>
DB 15,91,192 ; cvtdq2ps %xmm0,%xmm0
- DB 15,89,5,14,109,1,0 ; mulps 0x16d0e(%rip),%xmm0 # 2cd40 <_sk_overlay_sse2_8bit+0x10cb>
+ DB 15,89,5,78,108,1,0 ; mulps 0x16c4e(%rip),%xmm0 # 2cc80 <_sk_overlay_sse2_8bit+0x10d0>
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 15,40,29,5,107,1,0 ; movaps 0x16b05(%rip),%xmm3 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 15,40,29,69,106,1,0 ; movaps 0x16a45(%rip),%xmm3 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 15,40,200 ; movaps %xmm0,%xmm1
DB 15,40,208 ; movaps %xmm0,%xmm2
DB 255,224 ; jmpq *%rax
@@ -20606,11 +20606,11 @@ _sk_load_g8_dst_sse41 LABEL PROC
DB 72,133,255 ; test %rdi,%rdi
DB 117,42 ; jne 160d2 <_sk_load_g8_dst_sse41+0x42>
DB 102,67,15,56,49,36,16 ; pmovzxbd (%r8,%r10,1),%xmm4
- DB 102,15,219,37,57,107,1,0 ; pand 0x16b39(%rip),%xmm4 # 2cbf0 <_sk_overlay_sse2_8bit+0xf7b>
+ DB 102,15,219,37,121,106,1,0 ; pand 0x16a79(%rip),%xmm4 # 2cb30 <_sk_overlay_sse2_8bit+0xf80>
DB 15,91,228 ; cvtdq2ps %xmm4,%xmm4
- DB 15,89,37,127,108,1,0 ; mulps 0x16c7f(%rip),%xmm4 # 2cd40 <_sk_overlay_sse2_8bit+0x10cb>
+ DB 15,89,37,191,107,1,0 ; mulps 0x16bbf(%rip),%xmm4 # 2cc80 <_sk_overlay_sse2_8bit+0x10d0>
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 15,40,61,118,106,1,0 ; movaps 0x16a76(%rip),%xmm7 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 15,40,61,182,105,1,0 ; movaps 0x169b6(%rip),%xmm7 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 15,40,236 ; movaps %xmm4,%xmm5
DB 15,40,244 ; movaps %xmm4,%xmm6
DB 255,224 ; jmpq *%rax
@@ -20659,9 +20659,9 @@ _sk_gather_g8_sse41 LABEL PROC
DB 102,15,58,32,192,3 ; pinsrb $0x3,%eax,%xmm0
DB 102,15,56,49,192 ; pmovzxbd %xmm0,%xmm0
DB 15,91,192 ; cvtdq2ps %xmm0,%xmm0
- DB 15,89,5,177,107,1,0 ; mulps 0x16bb1(%rip),%xmm0 # 2cd40 <_sk_overlay_sse2_8bit+0x10cb>
+ DB 15,89,5,241,106,1,0 ; mulps 0x16af1(%rip),%xmm0 # 2cc80 <_sk_overlay_sse2_8bit+0x10d0>
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 15,40,29,168,105,1,0 ; movaps 0x169a8(%rip),%xmm3 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 15,40,29,232,104,1,0 ; movaps 0x168e8(%rip),%xmm3 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 15,40,200 ; movaps %xmm0,%xmm1
DB 15,40,208 ; movaps %xmm0,%xmm2
DB 255,224 ; jmpq *%rax
@@ -20678,19 +20678,19 @@ _sk_load_565_sse41 LABEL PROC
DB 72,133,255 ; test %rdi,%rdi
DB 117,80 ; jne 1620b <_sk_load_565_sse41+0x6b>
DB 102,67,15,56,51,20,80 ; pmovzxwd (%r8,%r10,2),%xmm2
- DB 102,15,111,5,134,107,1,0 ; movdqa 0x16b86(%rip),%xmm0 # 2cd50 <_sk_overlay_sse2_8bit+0x10db>
+ DB 102,15,111,5,198,106,1,0 ; movdqa 0x16ac6(%rip),%xmm0 # 2cc90 <_sk_overlay_sse2_8bit+0x10e0>
DB 102,15,219,194 ; pand %xmm2,%xmm0
DB 15,91,192 ; cvtdq2ps %xmm0,%xmm0
- DB 15,89,5,136,107,1,0 ; mulps 0x16b88(%rip),%xmm0 # 2cd60 <_sk_overlay_sse2_8bit+0x10eb>
- DB 102,15,111,13,144,107,1,0 ; movdqa 0x16b90(%rip),%xmm1 # 2cd70 <_sk_overlay_sse2_8bit+0x10fb>
+ DB 15,89,5,200,106,1,0 ; mulps 0x16ac8(%rip),%xmm0 # 2cca0 <_sk_overlay_sse2_8bit+0x10f0>
+ DB 102,15,111,13,208,106,1,0 ; movdqa 0x16ad0(%rip),%xmm1 # 2ccb0 <_sk_overlay_sse2_8bit+0x1100>
DB 102,15,219,202 ; pand %xmm2,%xmm1
DB 15,91,201 ; cvtdq2ps %xmm1,%xmm1
- DB 15,89,13,146,107,1,0 ; mulps 0x16b92(%rip),%xmm1 # 2cd80 <_sk_overlay_sse2_8bit+0x110b>
- DB 102,15,219,21,154,107,1,0 ; pand 0x16b9a(%rip),%xmm2 # 2cd90 <_sk_overlay_sse2_8bit+0x111b>
+ DB 15,89,13,210,106,1,0 ; mulps 0x16ad2(%rip),%xmm1 # 2ccc0 <_sk_overlay_sse2_8bit+0x1110>
+ DB 102,15,219,21,218,106,1,0 ; pand 0x16ada(%rip),%xmm2 # 2ccd0 <_sk_overlay_sse2_8bit+0x1120>
DB 15,91,210 ; cvtdq2ps %xmm2,%xmm2
- DB 15,89,21,160,107,1,0 ; mulps 0x16ba0(%rip),%xmm2 # 2cda0 <_sk_overlay_sse2_8bit+0x112b>
+ DB 15,89,21,224,106,1,0 ; mulps 0x16ae0(%rip),%xmm2 # 2cce0 <_sk_overlay_sse2_8bit+0x1130>
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 15,40,29,55,105,1,0 ; movaps 0x16937(%rip),%xmm3 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 15,40,29,119,104,1,0 ; movaps 0x16877(%rip),%xmm3 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 255,224 ; jmpq *%rax
DB 65,137,249 ; mov %edi,%r9d
DB 65,128,225,3 ; and $0x3,%r9b
@@ -20724,19 +20724,19 @@ _sk_load_565_dst_sse41 LABEL PROC
DB 72,133,255 ; test %rdi,%rdi
DB 117,80 ; jne 162c6 <_sk_load_565_dst_sse41+0x6b>
DB 102,67,15,56,51,52,80 ; pmovzxwd (%r8,%r10,2),%xmm6
- DB 102,15,111,37,203,106,1,0 ; movdqa 0x16acb(%rip),%xmm4 # 2cd50 <_sk_overlay_sse2_8bit+0x10db>
+ DB 102,15,111,37,11,106,1,0 ; movdqa 0x16a0b(%rip),%xmm4 # 2cc90 <_sk_overlay_sse2_8bit+0x10e0>
DB 102,15,219,230 ; pand %xmm6,%xmm4
DB 15,91,228 ; cvtdq2ps %xmm4,%xmm4
- DB 15,89,37,205,106,1,0 ; mulps 0x16acd(%rip),%xmm4 # 2cd60 <_sk_overlay_sse2_8bit+0x10eb>
- DB 102,15,111,45,213,106,1,0 ; movdqa 0x16ad5(%rip),%xmm5 # 2cd70 <_sk_overlay_sse2_8bit+0x10fb>
+ DB 15,89,37,13,106,1,0 ; mulps 0x16a0d(%rip),%xmm4 # 2cca0 <_sk_overlay_sse2_8bit+0x10f0>
+ DB 102,15,111,45,21,106,1,0 ; movdqa 0x16a15(%rip),%xmm5 # 2ccb0 <_sk_overlay_sse2_8bit+0x1100>
DB 102,15,219,238 ; pand %xmm6,%xmm5
DB 15,91,237 ; cvtdq2ps %xmm5,%xmm5
- DB 15,89,45,215,106,1,0 ; mulps 0x16ad7(%rip),%xmm5 # 2cd80 <_sk_overlay_sse2_8bit+0x110b>
- DB 102,15,219,53,223,106,1,0 ; pand 0x16adf(%rip),%xmm6 # 2cd90 <_sk_overlay_sse2_8bit+0x111b>
+ DB 15,89,45,23,106,1,0 ; mulps 0x16a17(%rip),%xmm5 # 2ccc0 <_sk_overlay_sse2_8bit+0x1110>
+ DB 102,15,219,53,31,106,1,0 ; pand 0x16a1f(%rip),%xmm6 # 2ccd0 <_sk_overlay_sse2_8bit+0x1120>
DB 15,91,246 ; cvtdq2ps %xmm6,%xmm6
- DB 15,89,53,229,106,1,0 ; mulps 0x16ae5(%rip),%xmm6 # 2cda0 <_sk_overlay_sse2_8bit+0x112b>
+ DB 15,89,53,37,106,1,0 ; mulps 0x16a25(%rip),%xmm6 # 2cce0 <_sk_overlay_sse2_8bit+0x1130>
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 15,40,61,124,104,1,0 ; movaps 0x1687c(%rip),%xmm7 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 15,40,61,188,103,1,0 ; movaps 0x167bc(%rip),%xmm7 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 255,224 ; jmpq *%rax
DB 65,137,249 ; mov %edi,%r9d
DB 65,128,225,3 ; and $0x3,%r9b
@@ -20781,19 +20781,19 @@ _sk_gather_565_sse41 LABEL PROC
DB 65,15,183,4,64 ; movzwl (%r8,%rax,2),%eax
DB 102,15,196,192,3 ; pinsrw $0x3,%eax,%xmm0
DB 102,15,56,51,208 ; pmovzxwd %xmm0,%xmm2
- DB 102,15,111,5,208,105,1,0 ; movdqa 0x169d0(%rip),%xmm0 # 2cd50 <_sk_overlay_sse2_8bit+0x10db>
+ DB 102,15,111,5,16,105,1,0 ; movdqa 0x16910(%rip),%xmm0 # 2cc90 <_sk_overlay_sse2_8bit+0x10e0>
DB 102,15,219,194 ; pand %xmm2,%xmm0
DB 15,91,192 ; cvtdq2ps %xmm0,%xmm0
- DB 15,89,5,210,105,1,0 ; mulps 0x169d2(%rip),%xmm0 # 2cd60 <_sk_overlay_sse2_8bit+0x10eb>
- DB 102,15,111,13,218,105,1,0 ; movdqa 0x169da(%rip),%xmm1 # 2cd70 <_sk_overlay_sse2_8bit+0x10fb>
+ DB 15,89,5,18,105,1,0 ; mulps 0x16912(%rip),%xmm0 # 2cca0 <_sk_overlay_sse2_8bit+0x10f0>
+ DB 102,15,111,13,26,105,1,0 ; movdqa 0x1691a(%rip),%xmm1 # 2ccb0 <_sk_overlay_sse2_8bit+0x1100>
DB 102,15,219,202 ; pand %xmm2,%xmm1
DB 15,91,201 ; cvtdq2ps %xmm1,%xmm1
- DB 15,89,13,220,105,1,0 ; mulps 0x169dc(%rip),%xmm1 # 2cd80 <_sk_overlay_sse2_8bit+0x110b>
- DB 102,15,219,21,228,105,1,0 ; pand 0x169e4(%rip),%xmm2 # 2cd90 <_sk_overlay_sse2_8bit+0x111b>
+ DB 15,89,13,28,105,1,0 ; mulps 0x1691c(%rip),%xmm1 # 2ccc0 <_sk_overlay_sse2_8bit+0x1110>
+ DB 102,15,219,21,36,105,1,0 ; pand 0x16924(%rip),%xmm2 # 2ccd0 <_sk_overlay_sse2_8bit+0x1120>
DB 15,91,210 ; cvtdq2ps %xmm2,%xmm2
- DB 15,89,21,234,105,1,0 ; mulps 0x169ea(%rip),%xmm2 # 2cda0 <_sk_overlay_sse2_8bit+0x112b>
+ DB 15,89,21,42,105,1,0 ; mulps 0x1692a(%rip),%xmm2 # 2cce0 <_sk_overlay_sse2_8bit+0x1130>
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 15,40,29,129,103,1,0 ; movaps 0x16781(%rip),%xmm3 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 15,40,29,193,102,1,0 ; movaps 0x166c1(%rip),%xmm3 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 255,224 ; jmpq *%rax
PUBLIC _sk_store_565_sse41
@@ -20805,12 +20805,12 @@ _sk_store_565_sse41 LABEL PROC
DB 77,1,192 ; add %r8,%r8
DB 76,3,0 ; add (%rax),%r8
DB 72,99,194 ; movslq %edx,%rax
- DB 68,15,40,5,129,107,1,0 ; movaps 0x16b81(%rip),%xmm8 # 2cf60 <_sk_overlay_sse2_8bit+0x12eb>
+ DB 68,15,40,5,193,106,1,0 ; movaps 0x16ac1(%rip),%xmm8 # 2cea0 <_sk_overlay_sse2_8bit+0x12f0>
DB 68,15,40,200 ; movaps %xmm0,%xmm9
DB 69,15,89,200 ; mulps %xmm8,%xmm9
DB 102,69,15,91,201 ; cvtps2dq %xmm9,%xmm9
DB 102,65,15,114,241,11 ; pslld $0xb,%xmm9
- DB 68,15,40,21,118,107,1,0 ; movaps 0x16b76(%rip),%xmm10 # 2cf70 <_sk_overlay_sse2_8bit+0x12fb>
+ DB 68,15,40,21,182,106,1,0 ; movaps 0x16ab6(%rip),%xmm10 # 2ceb0 <_sk_overlay_sse2_8bit+0x1300>
DB 68,15,89,209 ; mulps %xmm1,%xmm10
DB 102,69,15,91,210 ; cvtps2dq %xmm10,%xmm10
DB 102,65,15,114,242,5 ; pslld $0x5,%xmm10
@@ -20852,21 +20852,21 @@ _sk_load_4444_sse41 LABEL PROC
DB 72,133,255 ; test %rdi,%rdi
DB 117,95 ; jne 164eb <_sk_load_4444_sse41+0x7a>
DB 102,67,15,56,51,28,80 ; pmovzxwd (%r8,%r10,2),%xmm3
- DB 102,15,111,5,229,106,1,0 ; movdqa 0x16ae5(%rip),%xmm0 # 2cf80 <_sk_overlay_sse2_8bit+0x130b>
+ DB 102,15,111,5,37,106,1,0 ; movdqa 0x16a25(%rip),%xmm0 # 2cec0 <_sk_overlay_sse2_8bit+0x1310>
DB 102,15,219,195 ; pand %xmm3,%xmm0
DB 15,91,192 ; cvtdq2ps %xmm0,%xmm0
- DB 15,89,5,231,106,1,0 ; mulps 0x16ae7(%rip),%xmm0 # 2cf90 <_sk_overlay_sse2_8bit+0x131b>
- DB 102,15,111,13,239,106,1,0 ; movdqa 0x16aef(%rip),%xmm1 # 2cfa0 <_sk_overlay_sse2_8bit+0x132b>
+ DB 15,89,5,39,106,1,0 ; mulps 0x16a27(%rip),%xmm0 # 2ced0 <_sk_overlay_sse2_8bit+0x1320>
+ DB 102,15,111,13,47,106,1,0 ; movdqa 0x16a2f(%rip),%xmm1 # 2cee0 <_sk_overlay_sse2_8bit+0x1330>
DB 102,15,219,203 ; pand %xmm3,%xmm1
DB 15,91,201 ; cvtdq2ps %xmm1,%xmm1
- DB 15,89,13,241,106,1,0 ; mulps 0x16af1(%rip),%xmm1 # 2cfb0 <_sk_overlay_sse2_8bit+0x133b>
- DB 102,15,111,21,249,106,1,0 ; movdqa 0x16af9(%rip),%xmm2 # 2cfc0 <_sk_overlay_sse2_8bit+0x134b>
+ DB 15,89,13,49,106,1,0 ; mulps 0x16a31(%rip),%xmm1 # 2cef0 <_sk_overlay_sse2_8bit+0x1340>
+ DB 102,15,111,21,57,106,1,0 ; movdqa 0x16a39(%rip),%xmm2 # 2cf00 <_sk_overlay_sse2_8bit+0x1350>
DB 102,15,219,211 ; pand %xmm3,%xmm2
DB 15,91,210 ; cvtdq2ps %xmm2,%xmm2
- DB 15,89,21,251,106,1,0 ; mulps 0x16afb(%rip),%xmm2 # 2cfd0 <_sk_overlay_sse2_8bit+0x135b>
- DB 102,15,219,29,3,107,1,0 ; pand 0x16b03(%rip),%xmm3 # 2cfe0 <_sk_overlay_sse2_8bit+0x136b>
+ DB 15,89,21,59,106,1,0 ; mulps 0x16a3b(%rip),%xmm2 # 2cf10 <_sk_overlay_sse2_8bit+0x1360>
+ DB 102,15,219,29,67,106,1,0 ; pand 0x16a43(%rip),%xmm3 # 2cf20 <_sk_overlay_sse2_8bit+0x1370>
DB 15,91,219 ; cvtdq2ps %xmm3,%xmm3
- DB 15,89,29,9,107,1,0 ; mulps 0x16b09(%rip),%xmm3 # 2cff0 <_sk_overlay_sse2_8bit+0x137b>
+ DB 15,89,29,73,106,1,0 ; mulps 0x16a49(%rip),%xmm3 # 2cf30 <_sk_overlay_sse2_8bit+0x1380>
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
DB 65,137,249 ; mov %edi,%r9d
@@ -20901,21 +20901,21 @@ _sk_load_4444_dst_sse41 LABEL PROC
DB 72,133,255 ; test %rdi,%rdi
DB 117,95 ; jne 165b5 <_sk_load_4444_dst_sse41+0x7a>
DB 102,67,15,56,51,60,80 ; pmovzxwd (%r8,%r10,2),%xmm7
- DB 102,15,111,37,27,106,1,0 ; movdqa 0x16a1b(%rip),%xmm4 # 2cf80 <_sk_overlay_sse2_8bit+0x130b>
+ DB 102,15,111,37,91,105,1,0 ; movdqa 0x1695b(%rip),%xmm4 # 2cec0 <_sk_overlay_sse2_8bit+0x1310>
DB 102,15,219,231 ; pand %xmm7,%xmm4
DB 15,91,228 ; cvtdq2ps %xmm4,%xmm4
- DB 15,89,37,29,106,1,0 ; mulps 0x16a1d(%rip),%xmm4 # 2cf90 <_sk_overlay_sse2_8bit+0x131b>
- DB 102,15,111,45,37,106,1,0 ; movdqa 0x16a25(%rip),%xmm5 # 2cfa0 <_sk_overlay_sse2_8bit+0x132b>
+ DB 15,89,37,93,105,1,0 ; mulps 0x1695d(%rip),%xmm4 # 2ced0 <_sk_overlay_sse2_8bit+0x1320>
+ DB 102,15,111,45,101,105,1,0 ; movdqa 0x16965(%rip),%xmm5 # 2cee0 <_sk_overlay_sse2_8bit+0x1330>
DB 102,15,219,239 ; pand %xmm7,%xmm5
DB 15,91,237 ; cvtdq2ps %xmm5,%xmm5
- DB 15,89,45,39,106,1,0 ; mulps 0x16a27(%rip),%xmm5 # 2cfb0 <_sk_overlay_sse2_8bit+0x133b>
- DB 102,15,111,53,47,106,1,0 ; movdqa 0x16a2f(%rip),%xmm6 # 2cfc0 <_sk_overlay_sse2_8bit+0x134b>
+ DB 15,89,45,103,105,1,0 ; mulps 0x16967(%rip),%xmm5 # 2cef0 <_sk_overlay_sse2_8bit+0x1340>
+ DB 102,15,111,53,111,105,1,0 ; movdqa 0x1696f(%rip),%xmm6 # 2cf00 <_sk_overlay_sse2_8bit+0x1350>
DB 102,15,219,247 ; pand %xmm7,%xmm6
DB 15,91,246 ; cvtdq2ps %xmm6,%xmm6
- DB 15,89,53,49,106,1,0 ; mulps 0x16a31(%rip),%xmm6 # 2cfd0 <_sk_overlay_sse2_8bit+0x135b>
- DB 102,15,219,61,57,106,1,0 ; pand 0x16a39(%rip),%xmm7 # 2cfe0 <_sk_overlay_sse2_8bit+0x136b>
+ DB 15,89,53,113,105,1,0 ; mulps 0x16971(%rip),%xmm6 # 2cf10 <_sk_overlay_sse2_8bit+0x1360>
+ DB 102,15,219,61,121,105,1,0 ; pand 0x16979(%rip),%xmm7 # 2cf20 <_sk_overlay_sse2_8bit+0x1370>
DB 15,91,255 ; cvtdq2ps %xmm7,%xmm7
- DB 15,89,61,63,106,1,0 ; mulps 0x16a3f(%rip),%xmm7 # 2cff0 <_sk_overlay_sse2_8bit+0x137b>
+ DB 15,89,61,127,105,1,0 ; mulps 0x1697f(%rip),%xmm7 # 2cf30 <_sk_overlay_sse2_8bit+0x1380>
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
DB 65,137,249 ; mov %edi,%r9d
@@ -20961,21 +20961,21 @@ _sk_gather_4444_sse41 LABEL PROC
DB 65,15,183,4,64 ; movzwl (%r8,%rax,2),%eax
DB 102,15,196,192,3 ; pinsrw $0x3,%eax,%xmm0
DB 102,15,56,51,216 ; pmovzxwd %xmm0,%xmm3
- DB 102,15,111,5,17,105,1,0 ; movdqa 0x16911(%rip),%xmm0 # 2cf80 <_sk_overlay_sse2_8bit+0x130b>
+ DB 102,15,111,5,81,104,1,0 ; movdqa 0x16851(%rip),%xmm0 # 2cec0 <_sk_overlay_sse2_8bit+0x1310>
DB 102,15,219,195 ; pand %xmm3,%xmm0
DB 15,91,192 ; cvtdq2ps %xmm0,%xmm0
- DB 15,89,5,19,105,1,0 ; mulps 0x16913(%rip),%xmm0 # 2cf90 <_sk_overlay_sse2_8bit+0x131b>
- DB 102,15,111,13,27,105,1,0 ; movdqa 0x1691b(%rip),%xmm1 # 2cfa0 <_sk_overlay_sse2_8bit+0x132b>
+ DB 15,89,5,83,104,1,0 ; mulps 0x16853(%rip),%xmm0 # 2ced0 <_sk_overlay_sse2_8bit+0x1320>
+ DB 102,15,111,13,91,104,1,0 ; movdqa 0x1685b(%rip),%xmm1 # 2cee0 <_sk_overlay_sse2_8bit+0x1330>
DB 102,15,219,203 ; pand %xmm3,%xmm1
DB 15,91,201 ; cvtdq2ps %xmm1,%xmm1
- DB 15,89,13,29,105,1,0 ; mulps 0x1691d(%rip),%xmm1 # 2cfb0 <_sk_overlay_sse2_8bit+0x133b>
- DB 102,15,111,21,37,105,1,0 ; movdqa 0x16925(%rip),%xmm2 # 2cfc0 <_sk_overlay_sse2_8bit+0x134b>
+ DB 15,89,13,93,104,1,0 ; mulps 0x1685d(%rip),%xmm1 # 2cef0 <_sk_overlay_sse2_8bit+0x1340>
+ DB 102,15,111,21,101,104,1,0 ; movdqa 0x16865(%rip),%xmm2 # 2cf00 <_sk_overlay_sse2_8bit+0x1350>
DB 102,15,219,211 ; pand %xmm3,%xmm2
DB 15,91,210 ; cvtdq2ps %xmm2,%xmm2
- DB 15,89,21,39,105,1,0 ; mulps 0x16927(%rip),%xmm2 # 2cfd0 <_sk_overlay_sse2_8bit+0x135b>
- DB 102,15,219,29,47,105,1,0 ; pand 0x1692f(%rip),%xmm3 # 2cfe0 <_sk_overlay_sse2_8bit+0x136b>
+ DB 15,89,21,103,104,1,0 ; mulps 0x16867(%rip),%xmm2 # 2cf10 <_sk_overlay_sse2_8bit+0x1360>
+ DB 102,15,219,29,111,104,1,0 ; pand 0x1686f(%rip),%xmm3 # 2cf20 <_sk_overlay_sse2_8bit+0x1370>
DB 15,91,219 ; cvtdq2ps %xmm3,%xmm3
- DB 15,89,29,53,105,1,0 ; mulps 0x16935(%rip),%xmm3 # 2cff0 <_sk_overlay_sse2_8bit+0x137b>
+ DB 15,89,29,117,104,1,0 ; mulps 0x16875(%rip),%xmm3 # 2cf30 <_sk_overlay_sse2_8bit+0x1380>
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
@@ -20988,7 +20988,7 @@ _sk_store_4444_sse41 LABEL PROC
DB 77,1,192 ; add %r8,%r8
DB 76,3,0 ; add (%rax),%r8
DB 72,99,194 ; movslq %edx,%rax
- DB 68,15,40,5,35,105,1,0 ; movaps 0x16923(%rip),%xmm8 # 2d000 <_sk_overlay_sse2_8bit+0x138b>
+ DB 68,15,40,5,99,104,1,0 ; movaps 0x16863(%rip),%xmm8 # 2cf40 <_sk_overlay_sse2_8bit+0x1390>
DB 68,15,40,200 ; movaps %xmm0,%xmm9
DB 69,15,89,200 ; mulps %xmm8,%xmm9
DB 102,69,15,91,201 ; cvtps2dq %xmm9,%xmm9
@@ -21040,17 +21040,17 @@ _sk_load_8888_sse41 LABEL PROC
DB 72,133,255 ; test %rdi,%rdi
DB 117,89 ; jne 167f8 <_sk_load_8888_sse41+0x75>
DB 243,65,15,111,28,128 ; movdqu (%r8,%rax,4),%xmm3
- DB 102,15,111,5,67,100,1,0 ; movdqa 0x16443(%rip),%xmm0 # 2cbf0 <_sk_overlay_sse2_8bit+0xf7b>
+ DB 102,15,111,5,131,99,1,0 ; movdqa 0x16383(%rip),%xmm0 # 2cb30 <_sk_overlay_sse2_8bit+0xf80>
DB 102,15,219,195 ; pand %xmm3,%xmm0
DB 15,91,192 ; cvtdq2ps %xmm0,%xmm0
- DB 68,15,40,5,132,101,1,0 ; movaps 0x16584(%rip),%xmm8 # 2cd40 <_sk_overlay_sse2_8bit+0x10cb>
+ DB 68,15,40,5,196,100,1,0 ; movaps 0x164c4(%rip),%xmm8 # 2cc80 <_sk_overlay_sse2_8bit+0x10d0>
DB 65,15,89,192 ; mulps %xmm8,%xmm0
DB 102,15,111,203 ; movdqa %xmm3,%xmm1
- DB 102,15,56,0,13,51,100,1,0 ; pshufb 0x16433(%rip),%xmm1 # 2cc00 <_sk_overlay_sse2_8bit+0xf8b>
+ DB 102,15,56,0,13,115,99,1,0 ; pshufb 0x16373(%rip),%xmm1 # 2cb40 <_sk_overlay_sse2_8bit+0xf90>
DB 15,91,201 ; cvtdq2ps %xmm1,%xmm1
DB 65,15,89,200 ; mulps %xmm8,%xmm1
DB 102,15,111,211 ; movdqa %xmm3,%xmm2
- DB 102,15,56,0,21,47,100,1,0 ; pshufb 0x1642f(%rip),%xmm2 # 2cc10 <_sk_overlay_sse2_8bit+0xf9b>
+ DB 102,15,56,0,21,111,99,1,0 ; pshufb 0x1636f(%rip),%xmm2 # 2cb50 <_sk_overlay_sse2_8bit+0xfa0>
DB 15,91,210 ; cvtdq2ps %xmm2,%xmm2
DB 65,15,89,208 ; mulps %xmm8,%xmm2
DB 102,15,114,211,24 ; psrld $0x18,%xmm3
@@ -21087,17 +21087,17 @@ _sk_load_8888_dst_sse41 LABEL PROC
DB 72,133,255 ; test %rdi,%rdi
DB 117,89 ; jne 168b2 <_sk_load_8888_dst_sse41+0x75>
DB 243,65,15,111,60,128 ; movdqu (%r8,%rax,4),%xmm7
- DB 102,15,111,37,137,99,1,0 ; movdqa 0x16389(%rip),%xmm4 # 2cbf0 <_sk_overlay_sse2_8bit+0xf7b>
+ DB 102,15,111,37,201,98,1,0 ; movdqa 0x162c9(%rip),%xmm4 # 2cb30 <_sk_overlay_sse2_8bit+0xf80>
DB 102,15,219,231 ; pand %xmm7,%xmm4
DB 15,91,228 ; cvtdq2ps %xmm4,%xmm4
- DB 68,15,40,5,202,100,1,0 ; movaps 0x164ca(%rip),%xmm8 # 2cd40 <_sk_overlay_sse2_8bit+0x10cb>
+ DB 68,15,40,5,10,100,1,0 ; movaps 0x1640a(%rip),%xmm8 # 2cc80 <_sk_overlay_sse2_8bit+0x10d0>
DB 65,15,89,224 ; mulps %xmm8,%xmm4
DB 102,15,111,239 ; movdqa %xmm7,%xmm5
- DB 102,15,56,0,45,121,99,1,0 ; pshufb 0x16379(%rip),%xmm5 # 2cc00 <_sk_overlay_sse2_8bit+0xf8b>
+ DB 102,15,56,0,45,185,98,1,0 ; pshufb 0x162b9(%rip),%xmm5 # 2cb40 <_sk_overlay_sse2_8bit+0xf90>
DB 15,91,237 ; cvtdq2ps %xmm5,%xmm5
DB 65,15,89,232 ; mulps %xmm8,%xmm5
DB 102,15,111,247 ; movdqa %xmm7,%xmm6
- DB 102,15,56,0,53,117,99,1,0 ; pshufb 0x16375(%rip),%xmm6 # 2cc10 <_sk_overlay_sse2_8bit+0xf9b>
+ DB 102,15,56,0,53,181,98,1,0 ; pshufb 0x162b5(%rip),%xmm6 # 2cb50 <_sk_overlay_sse2_8bit+0xfa0>
DB 15,91,246 ; cvtdq2ps %xmm6,%xmm6
DB 65,15,89,240 ; mulps %xmm8,%xmm6
DB 102,15,114,215,24 ; psrld $0x18,%xmm7
@@ -21142,17 +21142,17 @@ _sk_gather_8888_sse41 LABEL PROC
DB 102,65,15,58,34,28,128,1 ; pinsrd $0x1,(%r8,%rax,4),%xmm3
DB 102,67,15,58,34,28,152,2 ; pinsrd $0x2,(%r8,%r11,4),%xmm3
DB 102,67,15,58,34,28,144,3 ; pinsrd $0x3,(%r8,%r10,4),%xmm3
- DB 102,15,111,5,153,98,1,0 ; movdqa 0x16299(%rip),%xmm0 # 2cbf0 <_sk_overlay_sse2_8bit+0xf7b>
+ DB 102,15,111,5,217,97,1,0 ; movdqa 0x161d9(%rip),%xmm0 # 2cb30 <_sk_overlay_sse2_8bit+0xf80>
DB 102,15,219,195 ; pand %xmm3,%xmm0
DB 15,91,192 ; cvtdq2ps %xmm0,%xmm0
- DB 68,15,40,5,218,99,1,0 ; movaps 0x163da(%rip),%xmm8 # 2cd40 <_sk_overlay_sse2_8bit+0x10cb>
+ DB 68,15,40,5,26,99,1,0 ; movaps 0x1631a(%rip),%xmm8 # 2cc80 <_sk_overlay_sse2_8bit+0x10d0>
DB 65,15,89,192 ; mulps %xmm8,%xmm0
DB 102,15,111,203 ; movdqa %xmm3,%xmm1
- DB 102,15,56,0,13,137,98,1,0 ; pshufb 0x16289(%rip),%xmm1 # 2cc00 <_sk_overlay_sse2_8bit+0xf8b>
+ DB 102,15,56,0,13,201,97,1,0 ; pshufb 0x161c9(%rip),%xmm1 # 2cb40 <_sk_overlay_sse2_8bit+0xf90>
DB 15,91,201 ; cvtdq2ps %xmm1,%xmm1
DB 65,15,89,200 ; mulps %xmm8,%xmm1
DB 102,15,111,211 ; movdqa %xmm3,%xmm2
- DB 102,15,56,0,21,133,98,1,0 ; pshufb 0x16285(%rip),%xmm2 # 2cc10 <_sk_overlay_sse2_8bit+0xf9b>
+ DB 102,15,56,0,21,197,97,1,0 ; pshufb 0x161c5(%rip),%xmm2 # 2cb50 <_sk_overlay_sse2_8bit+0xfa0>
DB 15,91,210 ; cvtdq2ps %xmm2,%xmm2
DB 65,15,89,208 ; mulps %xmm8,%xmm2
DB 102,15,114,211,24 ; psrld $0x18,%xmm3
@@ -21170,7 +21170,7 @@ _sk_store_8888_sse41 LABEL PROC
DB 73,193,224,2 ; shl $0x2,%r8
DB 76,3,0 ; add (%rax),%r8
DB 72,99,194 ; movslq %edx,%rax
- DB 68,15,40,5,95,98,1,0 ; movaps 0x1625f(%rip),%xmm8 # 2cc20 <_sk_overlay_sse2_8bit+0xfab>
+ DB 68,15,40,5,159,97,1,0 ; movaps 0x1619f(%rip),%xmm8 # 2cb60 <_sk_overlay_sse2_8bit+0xfb0>
DB 68,15,40,200 ; movaps %xmm0,%xmm9
DB 69,15,89,200 ; mulps %xmm8,%xmm9
DB 102,69,15,91,201 ; cvtps2dq %xmm9,%xmm9
@@ -21219,17 +21219,17 @@ _sk_load_bgra_sse41 LABEL PROC
DB 72,133,255 ; test %rdi,%rdi
DB 117,89 ; jne 16ac8 <_sk_load_bgra_sse41+0x75>
DB 243,65,15,111,28,128 ; movdqu (%r8,%rax,4),%xmm3
- DB 102,15,111,5,115,97,1,0 ; movdqa 0x16173(%rip),%xmm0 # 2cbf0 <_sk_overlay_sse2_8bit+0xf7b>
+ DB 102,15,111,5,179,96,1,0 ; movdqa 0x160b3(%rip),%xmm0 # 2cb30 <_sk_overlay_sse2_8bit+0xf80>
DB 102,15,219,195 ; pand %xmm3,%xmm0
DB 15,91,208 ; cvtdq2ps %xmm0,%xmm2
- DB 68,15,40,5,180,98,1,0 ; movaps 0x162b4(%rip),%xmm8 # 2cd40 <_sk_overlay_sse2_8bit+0x10cb>
+ DB 68,15,40,5,244,97,1,0 ; movaps 0x161f4(%rip),%xmm8 # 2cc80 <_sk_overlay_sse2_8bit+0x10d0>
DB 65,15,89,208 ; mulps %xmm8,%xmm2
DB 102,15,111,195 ; movdqa %xmm3,%xmm0
- DB 102,15,56,0,5,99,97,1,0 ; pshufb 0x16163(%rip),%xmm0 # 2cc00 <_sk_overlay_sse2_8bit+0xf8b>
+ DB 102,15,56,0,5,163,96,1,0 ; pshufb 0x160a3(%rip),%xmm0 # 2cb40 <_sk_overlay_sse2_8bit+0xf90>
DB 15,91,200 ; cvtdq2ps %xmm0,%xmm1
DB 65,15,89,200 ; mulps %xmm8,%xmm1
DB 102,15,111,195 ; movdqa %xmm3,%xmm0
- DB 102,15,56,0,5,95,97,1,0 ; pshufb 0x1615f(%rip),%xmm0 # 2cc10 <_sk_overlay_sse2_8bit+0xf9b>
+ DB 102,15,56,0,5,159,96,1,0 ; pshufb 0x1609f(%rip),%xmm0 # 2cb50 <_sk_overlay_sse2_8bit+0xfa0>
DB 15,91,192 ; cvtdq2ps %xmm0,%xmm0
DB 65,15,89,192 ; mulps %xmm8,%xmm0
DB 102,15,114,211,24 ; psrld $0x18,%xmm3
@@ -21266,17 +21266,17 @@ _sk_load_bgra_dst_sse41 LABEL PROC
DB 72,133,255 ; test %rdi,%rdi
DB 117,89 ; jne 16b82 <_sk_load_bgra_dst_sse41+0x75>
DB 243,65,15,111,60,128 ; movdqu (%r8,%rax,4),%xmm7
- DB 102,15,111,37,185,96,1,0 ; movdqa 0x160b9(%rip),%xmm4 # 2cbf0 <_sk_overlay_sse2_8bit+0xf7b>
+ DB 102,15,111,37,249,95,1,0 ; movdqa 0x15ff9(%rip),%xmm4 # 2cb30 <_sk_overlay_sse2_8bit+0xf80>
DB 102,15,219,231 ; pand %xmm7,%xmm4
DB 15,91,244 ; cvtdq2ps %xmm4,%xmm6
- DB 68,15,40,5,250,97,1,0 ; movaps 0x161fa(%rip),%xmm8 # 2cd40 <_sk_overlay_sse2_8bit+0x10cb>
+ DB 68,15,40,5,58,97,1,0 ; movaps 0x1613a(%rip),%xmm8 # 2cc80 <_sk_overlay_sse2_8bit+0x10d0>
DB 65,15,89,240 ; mulps %xmm8,%xmm6
DB 102,15,111,231 ; movdqa %xmm7,%xmm4
- DB 102,15,56,0,37,169,96,1,0 ; pshufb 0x160a9(%rip),%xmm4 # 2cc00 <_sk_overlay_sse2_8bit+0xf8b>
+ DB 102,15,56,0,37,233,95,1,0 ; pshufb 0x15fe9(%rip),%xmm4 # 2cb40 <_sk_overlay_sse2_8bit+0xf90>
DB 15,91,236 ; cvtdq2ps %xmm4,%xmm5
DB 65,15,89,232 ; mulps %xmm8,%xmm5
DB 102,15,111,231 ; movdqa %xmm7,%xmm4
- DB 102,15,56,0,37,165,96,1,0 ; pshufb 0x160a5(%rip),%xmm4 # 2cc10 <_sk_overlay_sse2_8bit+0xf9b>
+ DB 102,15,56,0,37,229,95,1,0 ; pshufb 0x15fe5(%rip),%xmm4 # 2cb50 <_sk_overlay_sse2_8bit+0xfa0>
DB 15,91,228 ; cvtdq2ps %xmm4,%xmm4
DB 65,15,89,224 ; mulps %xmm8,%xmm4
DB 102,15,114,215,24 ; psrld $0x18,%xmm7
@@ -21321,17 +21321,17 @@ _sk_gather_bgra_sse41 LABEL PROC
DB 102,65,15,58,34,28,128,1 ; pinsrd $0x1,(%r8,%rax,4),%xmm3
DB 102,67,15,58,34,28,152,2 ; pinsrd $0x2,(%r8,%r11,4),%xmm3
DB 102,67,15,58,34,28,144,3 ; pinsrd $0x3,(%r8,%r10,4),%xmm3
- DB 102,15,111,5,201,95,1,0 ; movdqa 0x15fc9(%rip),%xmm0 # 2cbf0 <_sk_overlay_sse2_8bit+0xf7b>
+ DB 102,15,111,5,9,95,1,0 ; movdqa 0x15f09(%rip),%xmm0 # 2cb30 <_sk_overlay_sse2_8bit+0xf80>
DB 102,15,219,195 ; pand %xmm3,%xmm0
DB 15,91,208 ; cvtdq2ps %xmm0,%xmm2
- DB 68,15,40,5,10,97,1,0 ; movaps 0x1610a(%rip),%xmm8 # 2cd40 <_sk_overlay_sse2_8bit+0x10cb>
+ DB 68,15,40,5,74,96,1,0 ; movaps 0x1604a(%rip),%xmm8 # 2cc80 <_sk_overlay_sse2_8bit+0x10d0>
DB 65,15,89,208 ; mulps %xmm8,%xmm2
DB 102,15,111,195 ; movdqa %xmm3,%xmm0
- DB 102,15,56,0,5,185,95,1,0 ; pshufb 0x15fb9(%rip),%xmm0 # 2cc00 <_sk_overlay_sse2_8bit+0xf8b>
+ DB 102,15,56,0,5,249,94,1,0 ; pshufb 0x15ef9(%rip),%xmm0 # 2cb40 <_sk_overlay_sse2_8bit+0xf90>
DB 15,91,200 ; cvtdq2ps %xmm0,%xmm1
DB 65,15,89,200 ; mulps %xmm8,%xmm1
DB 102,15,111,195 ; movdqa %xmm3,%xmm0
- DB 102,15,56,0,5,181,95,1,0 ; pshufb 0x15fb5(%rip),%xmm0 # 2cc10 <_sk_overlay_sse2_8bit+0xf9b>
+ DB 102,15,56,0,5,245,94,1,0 ; pshufb 0x15ef5(%rip),%xmm0 # 2cb50 <_sk_overlay_sse2_8bit+0xfa0>
DB 15,91,192 ; cvtdq2ps %xmm0,%xmm0
DB 65,15,89,192 ; mulps %xmm8,%xmm0
DB 102,15,114,211,24 ; psrld $0x18,%xmm3
@@ -21349,7 +21349,7 @@ _sk_store_bgra_sse41 LABEL PROC
DB 73,193,224,2 ; shl $0x2,%r8
DB 76,3,0 ; add (%rax),%r8
DB 72,99,194 ; movslq %edx,%rax
- DB 68,15,40,5,143,95,1,0 ; movaps 0x15f8f(%rip),%xmm8 # 2cc20 <_sk_overlay_sse2_8bit+0xfab>
+ DB 68,15,40,5,207,94,1,0 ; movaps 0x15ecf(%rip),%xmm8 # 2cb60 <_sk_overlay_sse2_8bit+0xfb0>
DB 68,15,40,202 ; movaps %xmm2,%xmm9
DB 69,15,89,200 ; mulps %xmm8,%xmm9
DB 102,69,15,91,201 ; cvtps2dq %xmm9,%xmm9
@@ -21406,18 +21406,18 @@ _sk_load_f16_sse41 LABEL PROC
DB 102,68,15,97,216 ; punpcklwd %xmm0,%xmm11
DB 102,68,15,105,200 ; punpckhwd %xmm0,%xmm9
DB 102,65,15,56,51,203 ; pmovzxwd %xmm11,%xmm1
- DB 102,68,15,111,5,148,98,1,0 ; movdqa 0x16294(%rip),%xmm8 # 2d010 <_sk_overlay_sse2_8bit+0x139b>
+ DB 102,68,15,111,5,212,97,1,0 ; movdqa 0x161d4(%rip),%xmm8 # 2cf50 <_sk_overlay_sse2_8bit+0x13a0>
DB 102,15,111,209 ; movdqa %xmm1,%xmm2
DB 102,65,15,219,208 ; pand %xmm8,%xmm2
DB 102,15,239,202 ; pxor %xmm2,%xmm1
- DB 102,15,111,29,143,98,1,0 ; movdqa 0x1628f(%rip),%xmm3 # 2d020 <_sk_overlay_sse2_8bit+0x13ab>
+ DB 102,15,111,29,207,97,1,0 ; movdqa 0x161cf(%rip),%xmm3 # 2cf60 <_sk_overlay_sse2_8bit+0x13b0>
DB 102,15,114,242,16 ; pslld $0x10,%xmm2
DB 102,15,111,193 ; movdqa %xmm1,%xmm0
DB 102,15,56,63,195 ; pmaxud %xmm3,%xmm0
DB 102,15,118,193 ; pcmpeqd %xmm1,%xmm0
DB 102,15,114,241,13 ; pslld $0xd,%xmm1
DB 102,15,235,202 ; por %xmm2,%xmm1
- DB 102,68,15,111,21,123,98,1,0 ; movdqa 0x1627b(%rip),%xmm10 # 2d030 <_sk_overlay_sse2_8bit+0x13bb>
+ DB 102,68,15,111,21,187,97,1,0 ; movdqa 0x161bb(%rip),%xmm10 # 2cf70 <_sk_overlay_sse2_8bit+0x13c0>
DB 102,65,15,254,202 ; paddd %xmm10,%xmm1
DB 102,15,219,193 ; pand %xmm1,%xmm0
DB 102,65,15,115,219,8 ; psrldq $0x8,%xmm11
@@ -21491,18 +21491,18 @@ _sk_load_f16_dst_sse41 LABEL PROC
DB 102,68,15,97,220 ; punpcklwd %xmm4,%xmm11
DB 102,68,15,105,204 ; punpckhwd %xmm4,%xmm9
DB 102,65,15,56,51,235 ; pmovzxwd %xmm11,%xmm5
- DB 102,68,15,111,5,252,96,1,0 ; movdqa 0x160fc(%rip),%xmm8 # 2d010 <_sk_overlay_sse2_8bit+0x139b>
+ DB 102,68,15,111,5,60,96,1,0 ; movdqa 0x1603c(%rip),%xmm8 # 2cf50 <_sk_overlay_sse2_8bit+0x13a0>
DB 102,15,111,245 ; movdqa %xmm5,%xmm6
DB 102,65,15,219,240 ; pand %xmm8,%xmm6
DB 102,15,239,238 ; pxor %xmm6,%xmm5
- DB 102,15,111,61,247,96,1,0 ; movdqa 0x160f7(%rip),%xmm7 # 2d020 <_sk_overlay_sse2_8bit+0x13ab>
+ DB 102,15,111,61,55,96,1,0 ; movdqa 0x16037(%rip),%xmm7 # 2cf60 <_sk_overlay_sse2_8bit+0x13b0>
DB 102,15,114,246,16 ; pslld $0x10,%xmm6
DB 102,15,111,229 ; movdqa %xmm5,%xmm4
DB 102,15,56,63,231 ; pmaxud %xmm7,%xmm4
DB 102,15,118,229 ; pcmpeqd %xmm5,%xmm4
DB 102,15,114,245,13 ; pslld $0xd,%xmm5
DB 102,15,235,238 ; por %xmm6,%xmm5
- DB 102,68,15,111,21,227,96,1,0 ; movdqa 0x160e3(%rip),%xmm10 # 2d030 <_sk_overlay_sse2_8bit+0x13bb>
+ DB 102,68,15,111,21,35,96,1,0 ; movdqa 0x16023(%rip),%xmm10 # 2cf70 <_sk_overlay_sse2_8bit+0x13c0>
DB 102,65,15,254,234 ; paddd %xmm10,%xmm5
DB 102,15,219,229 ; pand %xmm5,%xmm4
DB 102,65,15,115,219,8 ; psrldq $0x8,%xmm11
@@ -21585,18 +21585,18 @@ _sk_gather_f16_sse41 LABEL PROC
DB 102,68,15,97,218 ; punpcklwd %xmm2,%xmm11
DB 102,68,15,105,202 ; punpckhwd %xmm2,%xmm9
DB 102,65,15,56,51,203 ; pmovzxwd %xmm11,%xmm1
- DB 102,68,15,111,5,55,95,1,0 ; movdqa 0x15f37(%rip),%xmm8 # 2d010 <_sk_overlay_sse2_8bit+0x139b>
+ DB 102,68,15,111,5,119,94,1,0 ; movdqa 0x15e77(%rip),%xmm8 # 2cf50 <_sk_overlay_sse2_8bit+0x13a0>
DB 102,15,111,209 ; movdqa %xmm1,%xmm2
DB 102,65,15,219,208 ; pand %xmm8,%xmm2
DB 102,15,239,202 ; pxor %xmm2,%xmm1
- DB 102,15,111,29,50,95,1,0 ; movdqa 0x15f32(%rip),%xmm3 # 2d020 <_sk_overlay_sse2_8bit+0x13ab>
+ DB 102,15,111,29,114,94,1,0 ; movdqa 0x15e72(%rip),%xmm3 # 2cf60 <_sk_overlay_sse2_8bit+0x13b0>
DB 102,15,114,242,16 ; pslld $0x10,%xmm2
DB 102,15,111,193 ; movdqa %xmm1,%xmm0
DB 102,15,56,63,195 ; pmaxud %xmm3,%xmm0
DB 102,15,118,193 ; pcmpeqd %xmm1,%xmm0
DB 102,15,114,241,13 ; pslld $0xd,%xmm1
DB 102,15,235,202 ; por %xmm2,%xmm1
- DB 102,68,15,111,21,30,95,1,0 ; movdqa 0x15f1e(%rip),%xmm10 # 2d030 <_sk_overlay_sse2_8bit+0x13bb>
+ DB 102,68,15,111,21,94,94,1,0 ; movdqa 0x15e5e(%rip),%xmm10 # 2cf70 <_sk_overlay_sse2_8bit+0x13c0>
DB 102,65,15,254,202 ; paddd %xmm10,%xmm1
DB 102,15,219,193 ; pand %xmm1,%xmm0
DB 102,65,15,115,219,8 ; psrldq $0x8,%xmm11
@@ -21647,17 +21647,17 @@ _sk_store_f16_sse41 LABEL PROC
DB 73,193,224,3 ; shl $0x3,%r8
DB 76,3,0 ; add (%rax),%r8
DB 72,99,194 ; movslq %edx,%rax
- DB 102,68,15,111,21,66,94,1,0 ; movdqa 0x15e42(%rip),%xmm10 # 2d040 <_sk_overlay_sse2_8bit+0x13cb>
+ DB 102,68,15,111,21,130,93,1,0 ; movdqa 0x15d82(%rip),%xmm10 # 2cf80 <_sk_overlay_sse2_8bit+0x13d0>
DB 102,68,15,111,216 ; movdqa %xmm0,%xmm11
DB 102,69,15,219,218 ; pand %xmm10,%xmm11
DB 102,68,15,111,232 ; movdqa %xmm0,%xmm13
DB 102,69,15,239,235 ; pxor %xmm11,%xmm13
- DB 102,68,15,111,13,53,94,1,0 ; movdqa 0x15e35(%rip),%xmm9 # 2d050 <_sk_overlay_sse2_8bit+0x13db>
+ DB 102,68,15,111,13,117,93,1,0 ; movdqa 0x15d75(%rip),%xmm9 # 2cf90 <_sk_overlay_sse2_8bit+0x13e0>
DB 102,65,15,114,211,16 ; psrld $0x10,%xmm11
DB 102,69,15,111,193 ; movdqa %xmm9,%xmm8
DB 102,69,15,102,197 ; pcmpgtd %xmm13,%xmm8
DB 102,65,15,114,213,13 ; psrld $0xd,%xmm13
- DB 102,68,15,111,37,38,94,1,0 ; movdqa 0x15e26(%rip),%xmm12 # 2d060 <_sk_overlay_sse2_8bit+0x13eb>
+ DB 102,68,15,111,37,102,93,1,0 ; movdqa 0x15d66(%rip),%xmm12 # 2cfa0 <_sk_overlay_sse2_8bit+0x13f0>
DB 102,69,15,235,220 ; por %xmm12,%xmm11
DB 102,69,15,254,221 ; paddd %xmm13,%xmm11
DB 102,69,15,223,195 ; pandn %xmm11,%xmm8
@@ -21744,7 +21744,7 @@ _sk_load_u16_be_sse41 LABEL PROC
DB 102,15,235,200 ; por %xmm0,%xmm1
DB 102,15,56,51,193 ; pmovzxwd %xmm1,%xmm0
DB 15,91,192 ; cvtdq2ps %xmm0,%xmm0
- DB 68,15,40,5,6,90,1,0 ; movaps 0x15a06(%rip),%xmm8 # 2cdd0 <_sk_overlay_sse2_8bit+0x115b>
+ DB 68,15,40,5,70,89,1,0 ; movaps 0x15946(%rip),%xmm8 # 2cd10 <_sk_overlay_sse2_8bit+0x1160>
DB 65,15,89,192 ; mulps %xmm8,%xmm0
DB 102,15,111,203 ; movdqa %xmm3,%xmm1
DB 102,15,113,241,8 ; psllw $0x8,%xmm1
@@ -21816,7 +21816,7 @@ _sk_load_rgb_u16_be_sse41 LABEL PROC
DB 102,15,235,200 ; por %xmm0,%xmm1
DB 102,15,56,51,193 ; pmovzxwd %xmm1,%xmm0
DB 15,91,192 ; cvtdq2ps %xmm0,%xmm0
- DB 68,15,40,5,213,88,1,0 ; movaps 0x158d5(%rip),%xmm8 # 2cdd0 <_sk_overlay_sse2_8bit+0x115b>
+ DB 68,15,40,5,21,88,1,0 ; movaps 0x15815(%rip),%xmm8 # 2cd10 <_sk_overlay_sse2_8bit+0x1160>
DB 65,15,89,192 ; mulps %xmm8,%xmm0
DB 102,15,111,203 ; movdqa %xmm3,%xmm1
DB 102,15,113,241,8 ; psllw $0x8,%xmm1
@@ -21833,7 +21833,7 @@ _sk_load_rgb_u16_be_sse41 LABEL PROC
DB 15,91,210 ; cvtdq2ps %xmm2,%xmm2
DB 65,15,89,208 ; mulps %xmm8,%xmm2
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 15,40,29,252,85,1,0 ; movaps 0x155fc(%rip),%xmm3 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 15,40,29,60,85,1,0 ; movaps 0x1553c(%rip),%xmm3 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 255,224 ; jmpq *%rax
DB 102,65,15,110,20,64 ; movd (%r8,%rax,2),%xmm2
DB 102,65,15,196,84,64,4,2 ; pinsrw $0x2,0x4(%r8,%rax,2),%xmm2
@@ -21865,7 +21865,7 @@ _sk_store_u16_be_sse41 LABEL PROC
DB 77,1,192 ; add %r8,%r8
DB 76,3,0 ; add (%rax),%r8
DB 73,99,193 ; movslq %r9d,%rax
- DB 68,15,40,21,165,90,1,0 ; movaps 0x15aa5(%rip),%xmm10 # 2d070 <_sk_overlay_sse2_8bit+0x13fb>
+ DB 68,15,40,21,229,89,1,0 ; movaps 0x159e5(%rip),%xmm10 # 2cfb0 <_sk_overlay_sse2_8bit+0x1400>
DB 68,15,40,192 ; movaps %xmm0,%xmm8
DB 69,15,89,194 ; mulps %xmm10,%xmm8
DB 102,69,15,91,192 ; cvtps2dq %xmm8,%xmm8
@@ -22124,7 +22124,7 @@ _sk_mirror_x_sse41 LABEL PROC
DB 65,15,92,194 ; subps %xmm10,%xmm0
DB 243,69,15,88,192 ; addss %xmm8,%xmm8
DB 69,15,198,192,0 ; shufps $0x0,%xmm8,%xmm8
- DB 243,68,15,89,13,79,71,1,0 ; mulss 0x1474f(%rip),%xmm9 # 2c0e0 <_sk_overlay_sse2_8bit+0x46b>
+ DB 243,68,15,89,13,139,70,1,0 ; mulss 0x1468b(%rip),%xmm9 # 2c01c <_sk_overlay_sse2_8bit+0x46c>
DB 69,15,198,201,0 ; shufps $0x0,%xmm9,%xmm9
DB 68,15,89,200 ; mulps %xmm0,%xmm9
DB 102,69,15,58,8,201,1 ; roundps $0x1,%xmm9,%xmm9
@@ -22153,7 +22153,7 @@ _sk_mirror_y_sse41 LABEL PROC
DB 65,15,92,202 ; subps %xmm10,%xmm1
DB 243,69,15,88,192 ; addss %xmm8,%xmm8
DB 69,15,198,192,0 ; shufps $0x0,%xmm8,%xmm8
- DB 243,68,15,89,13,221,70,1,0 ; mulss 0x146dd(%rip),%xmm9 # 2c0e0 <_sk_overlay_sse2_8bit+0x46b>
+ DB 243,68,15,89,13,25,70,1,0 ; mulss 0x14619(%rip),%xmm9 # 2c01c <_sk_overlay_sse2_8bit+0x46c>
DB 69,15,198,201,0 ; shufps $0x0,%xmm9,%xmm9
DB 68,15,89,201 ; mulps %xmm1,%xmm9
DB 102,69,15,58,8,201,1 ; roundps $0x1,%xmm9,%xmm9
@@ -22176,7 +22176,7 @@ PUBLIC _sk_clamp_x_1_sse41
_sk_clamp_x_1_sse41 LABEL PROC
DB 69,15,87,192 ; xorps %xmm8,%xmm8
DB 68,15,95,192 ; maxps %xmm0,%xmm8
- DB 68,15,93,5,232,80,1,0 ; minps 0x150e8(%rip),%xmm8 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 68,15,93,5,40,80,1,0 ; minps 0x15028(%rip),%xmm8 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 72,173 ; lods %ds:(%rsi),%rax
DB 65,15,40,192 ; movaps %xmm8,%xmm0
DB 255,224 ; jmpq *%rax
@@ -22190,9 +22190,9 @@ _sk_repeat_x_1_sse41 LABEL PROC
PUBLIC _sk_mirror_x_1_sse41
_sk_mirror_x_1_sse41 LABEL PROC
- DB 68,15,40,5,41,81,1,0 ; movaps 0x15129(%rip),%xmm8 # 2cba0 <_sk_overlay_sse2_8bit+0xf2b>
+ DB 68,15,40,5,105,80,1,0 ; movaps 0x15069(%rip),%xmm8 # 2cae0 <_sk_overlay_sse2_8bit+0xf30>
DB 65,15,88,192 ; addps %xmm8,%xmm0
- DB 68,15,40,13,157,80,1,0 ; movaps 0x1509d(%rip),%xmm9 # 2cb20 <_sk_overlay_sse2_8bit+0xeab>
+ DB 68,15,40,13,221,79,1,0 ; movaps 0x14fdd(%rip),%xmm9 # 2ca60 <_sk_overlay_sse2_8bit+0xeb0>
DB 68,15,89,200 ; mulps %xmm0,%xmm9
DB 102,69,15,58,8,201,1 ; roundps $0x1,%xmm9,%xmm9
DB 69,15,88,201 ; addps %xmm9,%xmm9
@@ -22207,10 +22207,10 @@ _sk_mirror_x_1_sse41 LABEL PROC
PUBLIC _sk_luminance_to_alpha_sse41
_sk_luminance_to_alpha_sse41 LABEL PROC
DB 15,40,218 ; movaps %xmm2,%xmm3
- DB 15,89,5,204,85,1,0 ; mulps 0x155cc(%rip),%xmm0 # 2d080 <_sk_overlay_sse2_8bit+0x140b>
- DB 15,89,13,213,85,1,0 ; mulps 0x155d5(%rip),%xmm1 # 2d090 <_sk_overlay_sse2_8bit+0x141b>
+ DB 15,89,5,12,85,1,0 ; mulps 0x1550c(%rip),%xmm0 # 2cfc0 <_sk_overlay_sse2_8bit+0x1410>
+ DB 15,89,13,21,85,1,0 ; mulps 0x15515(%rip),%xmm1 # 2cfd0 <_sk_overlay_sse2_8bit+0x1420>
DB 15,88,200 ; addps %xmm0,%xmm1
- DB 15,89,29,219,85,1,0 ; mulps 0x155db(%rip),%xmm3 # 2d0a0 <_sk_overlay_sse2_8bit+0x142b>
+ DB 15,89,29,27,85,1,0 ; mulps 0x1551b(%rip),%xmm3 # 2cfe0 <_sk_overlay_sse2_8bit+0x1430>
DB 15,88,217 ; addps %xmm1,%xmm3
DB 72,173 ; lods %ds:(%rsi),%rax
DB 15,87,192 ; xorps %xmm0,%xmm0
@@ -22595,15 +22595,15 @@ _sk_evenly_spaced_gradient_sse41 LABEL PROC
PUBLIC _sk_gauss_a_to_rgba_sse41
_sk_gauss_a_to_rgba_sse41 LABEL PROC
- DB 15,40,5,138,79,1,0 ; movaps 0x14f8a(%rip),%xmm0 # 2d0b0 <_sk_overlay_sse2_8bit+0x143b>
+ DB 15,40,5,202,78,1,0 ; movaps 0x14eca(%rip),%xmm0 # 2cff0 <_sk_overlay_sse2_8bit+0x1440>
DB 15,89,195 ; mulps %xmm3,%xmm0
- DB 15,88,5,144,79,1,0 ; addps 0x14f90(%rip),%xmm0 # 2d0c0 <_sk_overlay_sse2_8bit+0x144b>
+ DB 15,88,5,208,78,1,0 ; addps 0x14ed0(%rip),%xmm0 # 2d000 <_sk_overlay_sse2_8bit+0x1450>
DB 15,89,195 ; mulps %xmm3,%xmm0
- DB 15,88,5,150,79,1,0 ; addps 0x14f96(%rip),%xmm0 # 2d0d0 <_sk_overlay_sse2_8bit+0x145b>
+ DB 15,88,5,214,78,1,0 ; addps 0x14ed6(%rip),%xmm0 # 2d010 <_sk_overlay_sse2_8bit+0x1460>
DB 15,89,195 ; mulps %xmm3,%xmm0
- DB 15,88,5,156,79,1,0 ; addps 0x14f9c(%rip),%xmm0 # 2d0e0 <_sk_overlay_sse2_8bit+0x146b>
+ DB 15,88,5,220,78,1,0 ; addps 0x14edc(%rip),%xmm0 # 2d020 <_sk_overlay_sse2_8bit+0x1470>
DB 15,89,195 ; mulps %xmm3,%xmm0
- DB 15,88,5,162,79,1,0 ; addps 0x14fa2(%rip),%xmm0 # 2d0f0 <_sk_overlay_sse2_8bit+0x147b>
+ DB 15,88,5,226,78,1,0 ; addps 0x14ee2(%rip),%xmm0 # 2d030 <_sk_overlay_sse2_8bit+0x1480>
DB 72,173 ; lods %ds:(%rsi),%rax
DB 15,40,200 ; movaps %xmm0,%xmm1
DB 15,40,208 ; movaps %xmm0,%xmm2
@@ -22621,7 +22621,7 @@ _sk_gradient_sse41 LABEL PROC
DB 73,255,200 ; dec %r8
DB 73,131,193,4 ; add $0x4,%r9
DB 102,15,239,201 ; pxor %xmm1,%xmm1
- DB 15,40,21,208,73,1,0 ; movaps 0x149d0(%rip),%xmm2 # 2cb50 <_sk_overlay_sse2_8bit+0xedb>
+ DB 15,40,21,16,73,1,0 ; movaps 0x14910(%rip),%xmm2 # 2ca90 <_sk_overlay_sse2_8bit+0xee0>
DB 243,65,15,16,25 ; movss (%r9),%xmm3
DB 15,198,219,0 ; shufps $0x0,%xmm3,%xmm3
DB 15,194,216,2 ; cmpleps %xmm0,%xmm3
@@ -22756,26 +22756,26 @@ _sk_xy_to_unit_angle_sse41 LABEL PROC
DB 69,15,94,226 ; divps %xmm10,%xmm12
DB 69,15,40,236 ; movaps %xmm12,%xmm13
DB 69,15,89,237 ; mulps %xmm13,%xmm13
- DB 68,15,40,21,15,77,1,0 ; movaps 0x14d0f(%rip),%xmm10 # 2d100 <_sk_overlay_sse2_8bit+0x148b>
+ DB 68,15,40,21,79,76,1,0 ; movaps 0x14c4f(%rip),%xmm10 # 2d040 <_sk_overlay_sse2_8bit+0x1490>
DB 69,15,89,213 ; mulps %xmm13,%xmm10
- DB 68,15,88,21,19,77,1,0 ; addps 0x14d13(%rip),%xmm10 # 2d110 <_sk_overlay_sse2_8bit+0x149b>
+ DB 68,15,88,21,83,76,1,0 ; addps 0x14c53(%rip),%xmm10 # 2d050 <_sk_overlay_sse2_8bit+0x14a0>
DB 69,15,89,213 ; mulps %xmm13,%xmm10
- DB 68,15,88,21,23,77,1,0 ; addps 0x14d17(%rip),%xmm10 # 2d120 <_sk_overlay_sse2_8bit+0x14ab>
+ DB 68,15,88,21,87,76,1,0 ; addps 0x14c57(%rip),%xmm10 # 2d060 <_sk_overlay_sse2_8bit+0x14b0>
DB 69,15,89,213 ; mulps %xmm13,%xmm10
- DB 68,15,88,21,27,77,1,0 ; addps 0x14d1b(%rip),%xmm10 # 2d130 <_sk_overlay_sse2_8bit+0x14bb>
+ DB 68,15,88,21,91,76,1,0 ; addps 0x14c5b(%rip),%xmm10 # 2d070 <_sk_overlay_sse2_8bit+0x14c0>
DB 69,15,89,212 ; mulps %xmm12,%xmm10
DB 65,15,194,195,1 ; cmpltps %xmm11,%xmm0
- DB 68,15,40,29,26,77,1,0 ; movaps 0x14d1a(%rip),%xmm11 # 2d140 <_sk_overlay_sse2_8bit+0x14cb>
+ DB 68,15,40,29,90,76,1,0 ; movaps 0x14c5a(%rip),%xmm11 # 2d080 <_sk_overlay_sse2_8bit+0x14d0>
DB 69,15,92,218 ; subps %xmm10,%xmm11
DB 102,69,15,56,20,211 ; blendvps %xmm0,%xmm11,%xmm10
DB 69,15,194,200,1 ; cmpltps %xmm8,%xmm9
- DB 68,15,40,29,227,70,1,0 ; movaps 0x146e3(%rip),%xmm11 # 2cb20 <_sk_overlay_sse2_8bit+0xeab>
+ DB 68,15,40,29,35,70,1,0 ; movaps 0x14623(%rip),%xmm11 # 2ca60 <_sk_overlay_sse2_8bit+0xeb0>
DB 69,15,92,218 ; subps %xmm10,%xmm11
DB 65,15,40,193 ; movaps %xmm9,%xmm0
DB 102,69,15,56,20,211 ; blendvps %xmm0,%xmm11,%xmm10
DB 15,40,193 ; movaps %xmm1,%xmm0
DB 65,15,194,192,1 ; cmpltps %xmm8,%xmm0
- DB 68,15,40,13,229,70,1,0 ; movaps 0x146e5(%rip),%xmm9 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 68,15,40,13,37,70,1,0 ; movaps 0x14625(%rip),%xmm9 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 69,15,92,202 ; subps %xmm10,%xmm9
DB 102,69,15,56,20,209 ; blendvps %xmm0,%xmm9,%xmm10
DB 69,15,194,194,7 ; cmpordps %xmm10,%xmm8
@@ -22805,7 +22805,7 @@ _sk_xy_to_2pt_conical_quadratic_max_sse41 LABEL PROC
DB 243,69,15,89,203 ; mulss %xmm11,%xmm9
DB 69,15,198,201,0 ; shufps $0x0,%xmm9,%xmm9
DB 68,15,88,200 ; addps %xmm0,%xmm9
- DB 68,15,89,13,142,76,1,0 ; mulps 0x14c8e(%rip),%xmm9 # 2d150 <_sk_overlay_sse2_8bit+0x14db>
+ DB 68,15,89,13,206,75,1,0 ; mulps 0x14bce(%rip),%xmm9 # 2d090 <_sk_overlay_sse2_8bit+0x14e0>
DB 15,89,192 ; mulps %xmm0,%xmm0
DB 68,15,40,225 ; movaps %xmm1,%xmm12
DB 69,15,89,228 ; mulps %xmm12,%xmm12
@@ -22813,7 +22813,7 @@ _sk_xy_to_2pt_conical_quadratic_max_sse41 LABEL PROC
DB 243,69,15,89,219 ; mulss %xmm11,%xmm11
DB 69,15,198,219,0 ; shufps $0x0,%xmm11,%xmm11
DB 69,15,92,227 ; subps %xmm11,%xmm12
- DB 68,15,89,21,121,76,1,0 ; mulps 0x14c79(%rip),%xmm10 # 2d160 <_sk_overlay_sse2_8bit+0x14eb>
+ DB 68,15,89,21,185,75,1,0 ; mulps 0x14bb9(%rip),%xmm10 # 2d0a0 <_sk_overlay_sse2_8bit+0x14f0>
DB 69,15,89,212 ; mulps %xmm12,%xmm10
DB 65,15,40,193 ; movaps %xmm9,%xmm0
DB 15,89,192 ; mulps %xmm0,%xmm0
@@ -22822,8 +22822,8 @@ _sk_xy_to_2pt_conical_quadratic_max_sse41 LABEL PROC
DB 69,15,198,192,0 ; shufps $0x0,%xmm8,%xmm8
DB 65,15,40,194 ; movaps %xmm10,%xmm0
DB 65,15,92,193 ; subps %xmm9,%xmm0
- DB 68,15,87,13,49,75,1,0 ; xorps 0x14b31(%rip),%xmm9 # 2d040 <_sk_overlay_sse2_8bit+0x13cb>
- DB 68,15,89,5,9,70,1,0 ; mulps 0x14609(%rip),%xmm8 # 2cb20 <_sk_overlay_sse2_8bit+0xeab>
+ DB 68,15,87,13,113,74,1,0 ; xorps 0x14a71(%rip),%xmm9 # 2cf80 <_sk_overlay_sse2_8bit+0x13d0>
+ DB 68,15,89,5,73,69,1,0 ; mulps 0x14549(%rip),%xmm8 # 2ca60 <_sk_overlay_sse2_8bit+0xeb0>
DB 65,15,89,192 ; mulps %xmm8,%xmm0
DB 69,15,92,202 ; subps %xmm10,%xmm9
DB 69,15,89,200 ; mulps %xmm8,%xmm9
@@ -22842,7 +22842,7 @@ _sk_xy_to_2pt_conical_quadratic_min_sse41 LABEL PROC
DB 243,69,15,89,203 ; mulss %xmm11,%xmm9
DB 69,15,198,201,0 ; shufps $0x0,%xmm9,%xmm9
DB 68,15,88,200 ; addps %xmm0,%xmm9
- DB 68,15,89,13,240,75,1,0 ; mulps 0x14bf0(%rip),%xmm9 # 2d150 <_sk_overlay_sse2_8bit+0x14db>
+ DB 68,15,89,13,48,75,1,0 ; mulps 0x14b30(%rip),%xmm9 # 2d090 <_sk_overlay_sse2_8bit+0x14e0>
DB 15,89,192 ; mulps %xmm0,%xmm0
DB 68,15,40,225 ; movaps %xmm1,%xmm12
DB 69,15,89,228 ; mulps %xmm12,%xmm12
@@ -22850,7 +22850,7 @@ _sk_xy_to_2pt_conical_quadratic_min_sse41 LABEL PROC
DB 243,69,15,89,219 ; mulss %xmm11,%xmm11
DB 69,15,198,219,0 ; shufps $0x0,%xmm11,%xmm11
DB 69,15,92,227 ; subps %xmm11,%xmm12
- DB 68,15,89,21,219,75,1,0 ; mulps 0x14bdb(%rip),%xmm10 # 2d160 <_sk_overlay_sse2_8bit+0x14eb>
+ DB 68,15,89,21,27,75,1,0 ; mulps 0x14b1b(%rip),%xmm10 # 2d0a0 <_sk_overlay_sse2_8bit+0x14f0>
DB 69,15,89,212 ; mulps %xmm12,%xmm10
DB 65,15,40,193 ; movaps %xmm9,%xmm0
DB 15,89,192 ; mulps %xmm0,%xmm0
@@ -22859,8 +22859,8 @@ _sk_xy_to_2pt_conical_quadratic_min_sse41 LABEL PROC
DB 69,15,198,192,0 ; shufps $0x0,%xmm8,%xmm8
DB 65,15,40,194 ; movaps %xmm10,%xmm0
DB 65,15,92,193 ; subps %xmm9,%xmm0
- DB 68,15,87,13,147,74,1,0 ; xorps 0x14a93(%rip),%xmm9 # 2d040 <_sk_overlay_sse2_8bit+0x13cb>
- DB 68,15,89,5,107,69,1,0 ; mulps 0x1456b(%rip),%xmm8 # 2cb20 <_sk_overlay_sse2_8bit+0xeab>
+ DB 68,15,87,13,211,73,1,0 ; xorps 0x149d3(%rip),%xmm9 # 2cf80 <_sk_overlay_sse2_8bit+0x13d0>
+ DB 68,15,89,5,171,68,1,0 ; mulps 0x144ab(%rip),%xmm8 # 2ca60 <_sk_overlay_sse2_8bit+0xeb0>
DB 65,15,89,192 ; mulps %xmm8,%xmm0
DB 69,15,92,202 ; subps %xmm10,%xmm9
DB 69,15,89,200 ; mulps %xmm8,%xmm9
@@ -22876,7 +22876,7 @@ _sk_xy_to_2pt_conical_linear_sse41 LABEL PROC
DB 243,69,15,89,200 ; mulss %xmm8,%xmm9
DB 69,15,198,201,0 ; shufps $0x0,%xmm9,%xmm9
DB 68,15,88,200 ; addps %xmm0,%xmm9
- DB 68,15,89,13,99,75,1,0 ; mulps 0x14b63(%rip),%xmm9 # 2d150 <_sk_overlay_sse2_8bit+0x14db>
+ DB 68,15,89,13,163,74,1,0 ; mulps 0x14aa3(%rip),%xmm9 # 2d090 <_sk_overlay_sse2_8bit+0x14e0>
DB 15,89,192 ; mulps %xmm0,%xmm0
DB 68,15,40,209 ; movaps %xmm1,%xmm10
DB 69,15,89,210 ; mulps %xmm10,%xmm10
@@ -22884,7 +22884,7 @@ _sk_xy_to_2pt_conical_linear_sse41 LABEL PROC
DB 243,69,15,89,192 ; mulss %xmm8,%xmm8
DB 69,15,198,192,0 ; shufps $0x0,%xmm8,%xmm8
DB 65,15,92,192 ; subps %xmm8,%xmm0
- DB 15,87,5,47,74,1,0 ; xorps 0x14a2f(%rip),%xmm0 # 2d040 <_sk_overlay_sse2_8bit+0x13cb>
+ DB 15,87,5,111,73,1,0 ; xorps 0x1496f(%rip),%xmm0 # 2cf80 <_sk_overlay_sse2_8bit+0x13d0>
DB 65,15,94,193 ; divps %xmm9,%xmm0
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
@@ -22921,7 +22921,7 @@ _sk_apply_vector_mask_sse41 LABEL PROC
PUBLIC _sk_save_xy_sse41
_sk_save_xy_sse41 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 68,15,40,5,165,68,1,0 ; movaps 0x144a5(%rip),%xmm8 # 2cb20 <_sk_overlay_sse2_8bit+0xeab>
+ DB 68,15,40,5,229,67,1,0 ; movaps 0x143e5(%rip),%xmm8 # 2ca60 <_sk_overlay_sse2_8bit+0xeb0>
DB 15,17,0 ; movups %xmm0,(%rax)
DB 68,15,40,200 ; movaps %xmm0,%xmm9
DB 69,15,88,200 ; addps %xmm8,%xmm9
@@ -22961,8 +22961,8 @@ _sk_bilinear_nx_sse41 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 15,16,0 ; movups (%rax),%xmm0
DB 68,15,16,64,64 ; movups 0x40(%rax),%xmm8
- DB 15,88,5,103,74,1,0 ; addps 0x14a67(%rip),%xmm0 # 2d170 <_sk_overlay_sse2_8bit+0x14fb>
- DB 68,15,40,13,47,68,1,0 ; movaps 0x1442f(%rip),%xmm9 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 15,88,5,167,73,1,0 ; addps 0x149a7(%rip),%xmm0 # 2d0b0 <_sk_overlay_sse2_8bit+0x1500>
+ DB 68,15,40,13,111,67,1,0 ; movaps 0x1436f(%rip),%xmm9 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 69,15,92,200 ; subps %xmm8,%xmm9
DB 68,15,17,136,128,0,0,0 ; movups %xmm9,0x80(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
@@ -22973,7 +22973,7 @@ _sk_bilinear_px_sse41 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 15,16,0 ; movups (%rax),%xmm0
DB 68,15,16,64,64 ; movups 0x40(%rax),%xmm8
- DB 15,88,5,238,67,1,0 ; addps 0x143ee(%rip),%xmm0 # 2cb20 <_sk_overlay_sse2_8bit+0xeab>
+ DB 15,88,5,46,67,1,0 ; addps 0x1432e(%rip),%xmm0 # 2ca60 <_sk_overlay_sse2_8bit+0xeb0>
DB 68,15,17,128,128,0,0,0 ; movups %xmm8,0x80(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
@@ -22983,8 +22983,8 @@ _sk_bilinear_ny_sse41 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 15,16,72,32 ; movups 0x20(%rax),%xmm1
DB 68,15,16,64,96 ; movups 0x60(%rax),%xmm8
- DB 15,88,13,32,74,1,0 ; addps 0x14a20(%rip),%xmm1 # 2d170 <_sk_overlay_sse2_8bit+0x14fb>
- DB 68,15,40,13,232,67,1,0 ; movaps 0x143e8(%rip),%xmm9 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 15,88,13,96,73,1,0 ; addps 0x14960(%rip),%xmm1 # 2d0b0 <_sk_overlay_sse2_8bit+0x1500>
+ DB 68,15,40,13,40,67,1,0 ; movaps 0x14328(%rip),%xmm9 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 69,15,92,200 ; subps %xmm8,%xmm9
DB 68,15,17,136,160,0,0,0 ; movups %xmm9,0xa0(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
@@ -22995,7 +22995,7 @@ _sk_bilinear_py_sse41 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 15,16,72,32 ; movups 0x20(%rax),%xmm1
DB 68,15,16,64,96 ; movups 0x60(%rax),%xmm8
- DB 15,88,13,166,67,1,0 ; addps 0x143a6(%rip),%xmm1 # 2cb20 <_sk_overlay_sse2_8bit+0xeab>
+ DB 15,88,13,230,66,1,0 ; addps 0x142e6(%rip),%xmm1 # 2ca60 <_sk_overlay_sse2_8bit+0xeb0>
DB 68,15,17,128,160,0,0,0 ; movups %xmm8,0xa0(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
@@ -23005,13 +23005,13 @@ _sk_bicubic_n3x_sse41 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 15,16,0 ; movups (%rax),%xmm0
DB 68,15,16,64,64 ; movups 0x40(%rax),%xmm8
- DB 15,88,5,233,73,1,0 ; addps 0x149e9(%rip),%xmm0 # 2d180 <_sk_overlay_sse2_8bit+0x150b>
- DB 68,15,40,13,161,67,1,0 ; movaps 0x143a1(%rip),%xmm9 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 15,88,5,41,73,1,0 ; addps 0x14929(%rip),%xmm0 # 2d0c0 <_sk_overlay_sse2_8bit+0x1510>
+ DB 68,15,40,13,225,66,1,0 ; movaps 0x142e1(%rip),%xmm9 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 69,15,92,200 ; subps %xmm8,%xmm9
DB 69,15,40,193 ; movaps %xmm9,%xmm8
DB 69,15,89,192 ; mulps %xmm8,%xmm8
- DB 68,15,89,13,221,73,1,0 ; mulps 0x149dd(%rip),%xmm9 # 2d190 <_sk_overlay_sse2_8bit+0x151b>
- DB 68,15,88,13,117,69,1,0 ; addps 0x14575(%rip),%xmm9 # 2cd30 <_sk_overlay_sse2_8bit+0x10bb>
+ DB 68,15,89,13,29,73,1,0 ; mulps 0x1491d(%rip),%xmm9 # 2d0d0 <_sk_overlay_sse2_8bit+0x1520>
+ DB 68,15,88,13,181,68,1,0 ; addps 0x144b5(%rip),%xmm9 # 2cc70 <_sk_overlay_sse2_8bit+0x10c0>
DB 69,15,89,200 ; mulps %xmm8,%xmm9
DB 68,15,17,136,128,0,0,0 ; movups %xmm9,0x80(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
@@ -23022,16 +23022,16 @@ _sk_bicubic_n1x_sse41 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 15,16,0 ; movups (%rax),%xmm0
DB 68,15,16,64,64 ; movups 0x40(%rax),%xmm8
- DB 15,88,5,148,73,1,0 ; addps 0x14994(%rip),%xmm0 # 2d170 <_sk_overlay_sse2_8bit+0x14fb>
- DB 68,15,40,13,92,67,1,0 ; movaps 0x1435c(%rip),%xmm9 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 15,88,5,212,72,1,0 ; addps 0x148d4(%rip),%xmm0 # 2d0b0 <_sk_overlay_sse2_8bit+0x1500>
+ DB 68,15,40,13,156,66,1,0 ; movaps 0x1429c(%rip),%xmm9 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 69,15,92,200 ; subps %xmm8,%xmm9
- DB 68,15,40,5,176,73,1,0 ; movaps 0x149b0(%rip),%xmm8 # 2d1a0 <_sk_overlay_sse2_8bit+0x152b>
+ DB 68,15,40,5,240,72,1,0 ; movaps 0x148f0(%rip),%xmm8 # 2d0e0 <_sk_overlay_sse2_8bit+0x1530>
DB 69,15,89,193 ; mulps %xmm9,%xmm8
- DB 68,15,88,5,180,73,1,0 ; addps 0x149b4(%rip),%xmm8 # 2d1b0 <_sk_overlay_sse2_8bit+0x153b>
+ DB 68,15,88,5,244,72,1,0 ; addps 0x148f4(%rip),%xmm8 # 2d0f0 <_sk_overlay_sse2_8bit+0x1540>
DB 69,15,89,193 ; mulps %xmm9,%xmm8
- DB 68,15,88,5,24,67,1,0 ; addps 0x14318(%rip),%xmm8 # 2cb20 <_sk_overlay_sse2_8bit+0xeab>
+ DB 68,15,88,5,88,66,1,0 ; addps 0x14258(%rip),%xmm8 # 2ca60 <_sk_overlay_sse2_8bit+0xeb0>
DB 69,15,89,193 ; mulps %xmm9,%xmm8
- DB 68,15,88,5,172,73,1,0 ; addps 0x149ac(%rip),%xmm8 # 2d1c0 <_sk_overlay_sse2_8bit+0x154b>
+ DB 68,15,88,5,236,72,1,0 ; addps 0x148ec(%rip),%xmm8 # 2d100 <_sk_overlay_sse2_8bit+0x1550>
DB 68,15,17,128,128,0,0,0 ; movups %xmm8,0x80(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
@@ -23039,17 +23039,17 @@ _sk_bicubic_n1x_sse41 LABEL PROC
PUBLIC _sk_bicubic_p1x_sse41
_sk_bicubic_p1x_sse41 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 68,15,40,5,246,66,1,0 ; movaps 0x142f6(%rip),%xmm8 # 2cb20 <_sk_overlay_sse2_8bit+0xeab>
+ DB 68,15,40,5,54,66,1,0 ; movaps 0x14236(%rip),%xmm8 # 2ca60 <_sk_overlay_sse2_8bit+0xeb0>
DB 15,16,0 ; movups (%rax),%xmm0
DB 68,15,16,72,64 ; movups 0x40(%rax),%xmm9
DB 65,15,88,192 ; addps %xmm8,%xmm0
- DB 68,15,40,21,98,73,1,0 ; movaps 0x14962(%rip),%xmm10 # 2d1a0 <_sk_overlay_sse2_8bit+0x152b>
+ DB 68,15,40,21,162,72,1,0 ; movaps 0x148a2(%rip),%xmm10 # 2d0e0 <_sk_overlay_sse2_8bit+0x1530>
DB 69,15,89,209 ; mulps %xmm9,%xmm10
- DB 68,15,88,21,102,73,1,0 ; addps 0x14966(%rip),%xmm10 # 2d1b0 <_sk_overlay_sse2_8bit+0x153b>
+ DB 68,15,88,21,166,72,1,0 ; addps 0x148a6(%rip),%xmm10 # 2d0f0 <_sk_overlay_sse2_8bit+0x1540>
DB 69,15,89,209 ; mulps %xmm9,%xmm10
DB 69,15,88,208 ; addps %xmm8,%xmm10
DB 69,15,89,209 ; mulps %xmm9,%xmm10
- DB 68,15,88,21,98,73,1,0 ; addps 0x14962(%rip),%xmm10 # 2d1c0 <_sk_overlay_sse2_8bit+0x154b>
+ DB 68,15,88,21,162,72,1,0 ; addps 0x148a2(%rip),%xmm10 # 2d100 <_sk_overlay_sse2_8bit+0x1550>
DB 68,15,17,144,128,0,0,0 ; movups %xmm10,0x80(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
@@ -23059,11 +23059,11 @@ _sk_bicubic_p3x_sse41 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 15,16,0 ; movups (%rax),%xmm0
DB 68,15,16,64,64 ; movups 0x40(%rax),%xmm8
- DB 15,88,5,53,73,1,0 ; addps 0x14935(%rip),%xmm0 # 2d1b0 <_sk_overlay_sse2_8bit+0x153b>
+ DB 15,88,5,117,72,1,0 ; addps 0x14875(%rip),%xmm0 # 2d0f0 <_sk_overlay_sse2_8bit+0x1540>
DB 69,15,40,200 ; movaps %xmm8,%xmm9
DB 69,15,89,201 ; mulps %xmm9,%xmm9
- DB 68,15,89,5,5,73,1,0 ; mulps 0x14905(%rip),%xmm8 # 2d190 <_sk_overlay_sse2_8bit+0x151b>
- DB 68,15,88,5,157,68,1,0 ; addps 0x1449d(%rip),%xmm8 # 2cd30 <_sk_overlay_sse2_8bit+0x10bb>
+ DB 68,15,89,5,69,72,1,0 ; mulps 0x14845(%rip),%xmm8 # 2d0d0 <_sk_overlay_sse2_8bit+0x1520>
+ DB 68,15,88,5,221,67,1,0 ; addps 0x143dd(%rip),%xmm8 # 2cc70 <_sk_overlay_sse2_8bit+0x10c0>
DB 69,15,89,193 ; mulps %xmm9,%xmm8
DB 68,15,17,128,128,0,0,0 ; movups %xmm8,0x80(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
@@ -23074,13 +23074,13 @@ _sk_bicubic_n3y_sse41 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 15,16,72,32 ; movups 0x20(%rax),%xmm1
DB 68,15,16,64,96 ; movups 0x60(%rax),%xmm8
- DB 15,88,13,203,72,1,0 ; addps 0x148cb(%rip),%xmm1 # 2d180 <_sk_overlay_sse2_8bit+0x150b>
- DB 68,15,40,13,131,66,1,0 ; movaps 0x14283(%rip),%xmm9 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 15,88,13,11,72,1,0 ; addps 0x1480b(%rip),%xmm1 # 2d0c0 <_sk_overlay_sse2_8bit+0x1510>
+ DB 68,15,40,13,195,65,1,0 ; movaps 0x141c3(%rip),%xmm9 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 69,15,92,200 ; subps %xmm8,%xmm9
DB 69,15,40,193 ; movaps %xmm9,%xmm8
DB 69,15,89,192 ; mulps %xmm8,%xmm8
- DB 68,15,89,13,191,72,1,0 ; mulps 0x148bf(%rip),%xmm9 # 2d190 <_sk_overlay_sse2_8bit+0x151b>
- DB 68,15,88,13,87,68,1,0 ; addps 0x14457(%rip),%xmm9 # 2cd30 <_sk_overlay_sse2_8bit+0x10bb>
+ DB 68,15,89,13,255,71,1,0 ; mulps 0x147ff(%rip),%xmm9 # 2d0d0 <_sk_overlay_sse2_8bit+0x1520>
+ DB 68,15,88,13,151,67,1,0 ; addps 0x14397(%rip),%xmm9 # 2cc70 <_sk_overlay_sse2_8bit+0x10c0>
DB 69,15,89,200 ; mulps %xmm8,%xmm9
DB 68,15,17,136,160,0,0,0 ; movups %xmm9,0xa0(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
@@ -23091,16 +23091,16 @@ _sk_bicubic_n1y_sse41 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 15,16,72,32 ; movups 0x20(%rax),%xmm1
DB 68,15,16,64,96 ; movups 0x60(%rax),%xmm8
- DB 15,88,13,117,72,1,0 ; addps 0x14875(%rip),%xmm1 # 2d170 <_sk_overlay_sse2_8bit+0x14fb>
- DB 68,15,40,13,61,66,1,0 ; movaps 0x1423d(%rip),%xmm9 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 15,88,13,181,71,1,0 ; addps 0x147b5(%rip),%xmm1 # 2d0b0 <_sk_overlay_sse2_8bit+0x1500>
+ DB 68,15,40,13,125,65,1,0 ; movaps 0x1417d(%rip),%xmm9 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 69,15,92,200 ; subps %xmm8,%xmm9
- DB 68,15,40,5,145,72,1,0 ; movaps 0x14891(%rip),%xmm8 # 2d1a0 <_sk_overlay_sse2_8bit+0x152b>
+ DB 68,15,40,5,209,71,1,0 ; movaps 0x147d1(%rip),%xmm8 # 2d0e0 <_sk_overlay_sse2_8bit+0x1530>
DB 69,15,89,193 ; mulps %xmm9,%xmm8
- DB 68,15,88,5,149,72,1,0 ; addps 0x14895(%rip),%xmm8 # 2d1b0 <_sk_overlay_sse2_8bit+0x153b>
+ DB 68,15,88,5,213,71,1,0 ; addps 0x147d5(%rip),%xmm8 # 2d0f0 <_sk_overlay_sse2_8bit+0x1540>
DB 69,15,89,193 ; mulps %xmm9,%xmm8
- DB 68,15,88,5,249,65,1,0 ; addps 0x141f9(%rip),%xmm8 # 2cb20 <_sk_overlay_sse2_8bit+0xeab>
+ DB 68,15,88,5,57,65,1,0 ; addps 0x14139(%rip),%xmm8 # 2ca60 <_sk_overlay_sse2_8bit+0xeb0>
DB 69,15,89,193 ; mulps %xmm9,%xmm8
- DB 68,15,88,5,141,72,1,0 ; addps 0x1488d(%rip),%xmm8 # 2d1c0 <_sk_overlay_sse2_8bit+0x154b>
+ DB 68,15,88,5,205,71,1,0 ; addps 0x147cd(%rip),%xmm8 # 2d100 <_sk_overlay_sse2_8bit+0x1550>
DB 68,15,17,128,160,0,0,0 ; movups %xmm8,0xa0(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
@@ -23108,17 +23108,17 @@ _sk_bicubic_n1y_sse41 LABEL PROC
PUBLIC _sk_bicubic_p1y_sse41
_sk_bicubic_p1y_sse41 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 68,15,40,5,215,65,1,0 ; movaps 0x141d7(%rip),%xmm8 # 2cb20 <_sk_overlay_sse2_8bit+0xeab>
+ DB 68,15,40,5,23,65,1,0 ; movaps 0x14117(%rip),%xmm8 # 2ca60 <_sk_overlay_sse2_8bit+0xeb0>
DB 15,16,72,32 ; movups 0x20(%rax),%xmm1
DB 68,15,16,72,96 ; movups 0x60(%rax),%xmm9
DB 65,15,88,200 ; addps %xmm8,%xmm1
- DB 68,15,40,21,66,72,1,0 ; movaps 0x14842(%rip),%xmm10 # 2d1a0 <_sk_overlay_sse2_8bit+0x152b>
+ DB 68,15,40,21,130,71,1,0 ; movaps 0x14782(%rip),%xmm10 # 2d0e0 <_sk_overlay_sse2_8bit+0x1530>
DB 69,15,89,209 ; mulps %xmm9,%xmm10
- DB 68,15,88,21,70,72,1,0 ; addps 0x14846(%rip),%xmm10 # 2d1b0 <_sk_overlay_sse2_8bit+0x153b>
+ DB 68,15,88,21,134,71,1,0 ; addps 0x14786(%rip),%xmm10 # 2d0f0 <_sk_overlay_sse2_8bit+0x1540>
DB 69,15,89,209 ; mulps %xmm9,%xmm10
DB 69,15,88,208 ; addps %xmm8,%xmm10
DB 69,15,89,209 ; mulps %xmm9,%xmm10
- DB 68,15,88,21,66,72,1,0 ; addps 0x14842(%rip),%xmm10 # 2d1c0 <_sk_overlay_sse2_8bit+0x154b>
+ DB 68,15,88,21,130,71,1,0 ; addps 0x14782(%rip),%xmm10 # 2d100 <_sk_overlay_sse2_8bit+0x1550>
DB 68,15,17,144,160,0,0,0 ; movups %xmm10,0xa0(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
@@ -23128,11 +23128,11 @@ _sk_bicubic_p3y_sse41 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 15,16,72,32 ; movups 0x20(%rax),%xmm1
DB 68,15,16,64,96 ; movups 0x60(%rax),%xmm8
- DB 15,88,13,20,72,1,0 ; addps 0x14814(%rip),%xmm1 # 2d1b0 <_sk_overlay_sse2_8bit+0x153b>
+ DB 15,88,13,84,71,1,0 ; addps 0x14754(%rip),%xmm1 # 2d0f0 <_sk_overlay_sse2_8bit+0x1540>
DB 69,15,40,200 ; movaps %xmm8,%xmm9
DB 69,15,89,201 ; mulps %xmm9,%xmm9
- DB 68,15,89,5,228,71,1,0 ; mulps 0x147e4(%rip),%xmm8 # 2d190 <_sk_overlay_sse2_8bit+0x151b>
- DB 68,15,88,5,124,67,1,0 ; addps 0x1437c(%rip),%xmm8 # 2cd30 <_sk_overlay_sse2_8bit+0x10bb>
+ DB 68,15,89,5,36,71,1,0 ; mulps 0x14724(%rip),%xmm8 # 2d0d0 <_sk_overlay_sse2_8bit+0x1520>
+ DB 68,15,88,5,188,66,1,0 ; addps 0x142bc(%rip),%xmm8 # 2cc70 <_sk_overlay_sse2_8bit+0x10c0>
DB 69,15,89,193 ; mulps %xmm9,%xmm8
DB 68,15,17,128,160,0,0,0 ; movups %xmm8,0xa0(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
@@ -23259,10 +23259,10 @@ _sk_clut_3D_sse41 LABEL PROC
DB 102,68,15,56,64,227 ; pmulld %xmm3,%xmm12
DB 102,65,15,111,212 ; movdqa %xmm12,%xmm2
DB 102,15,254,209 ; paddd %xmm1,%xmm2
- DB 102,15,111,37,90,70,1,0 ; movdqa 0x1465a(%rip),%xmm4 # 2d1e0 <_sk_overlay_sse2_8bit+0x156b>
+ DB 102,15,111,37,154,69,1,0 ; movdqa 0x1459a(%rip),%xmm4 # 2d120 <_sk_overlay_sse2_8bit+0x1570>
DB 102,15,56,64,212 ; pmulld %xmm4,%xmm2
DB 102,68,15,111,220 ; movdqa %xmm4,%xmm11
- DB 102,68,15,111,61,183,63,1,0 ; movdqa 0x13fb7(%rip),%xmm15 # 2cb50 <_sk_overlay_sse2_8bit+0xedb>
+ DB 102,68,15,111,61,247,62,1,0 ; movdqa 0x13ef7(%rip),%xmm15 # 2ca90 <_sk_overlay_sse2_8bit+0xee0>
DB 102,15,111,226 ; movdqa %xmm2,%xmm4
DB 102,65,15,254,231 ; paddd %xmm15,%xmm4
DB 102,73,15,58,22,224,1 ; pextrq $0x1,%xmm4,%r8
@@ -23282,7 +23282,7 @@ _sk_clut_3D_sse41 LABEL PROC
DB 102,65,15,58,22,209,1 ; pextrd $0x1,%xmm2,%r9d
DB 102,65,15,58,22,210,2 ; pextrd $0x2,%xmm2,%r10d
DB 102,65,15,58,22,211,3 ; pextrd $0x3,%xmm2,%r11d
- DB 102,68,15,111,13,104,63,1,0 ; movdqa 0x13f68(%rip),%xmm9 # 2cb70 <_sk_overlay_sse2_8bit+0xefb>
+ DB 102,68,15,111,13,168,62,1,0 ; movdqa 0x13ea8(%rip),%xmm9 # 2cab0 <_sk_overlay_sse2_8bit+0xf00>
DB 102,65,15,254,209 ; paddd %xmm9,%xmm2
DB 102,73,15,58,22,214,1 ; pextrq $0x1,%xmm2,%r14
DB 102,72,15,126,211 ; movq %xmm2,%rbx
@@ -23296,7 +23296,7 @@ _sk_clut_3D_sse41 LABEL PROC
DB 73,193,238,32 ; shr $0x20,%r14
DB 243,66,15,16,20,176 ; movss (%rax,%r14,4),%xmm2
DB 102,15,58,33,242,48 ; insertps $0x30,%xmm2,%xmm6
- DB 15,40,45,125,69,1,0 ; movaps 0x1457d(%rip),%xmm5 # 2d1d0 <_sk_overlay_sse2_8bit+0x155b>
+ DB 15,40,45,189,68,1,0 ; movaps 0x144bd(%rip),%xmm5 # 2d110 <_sk_overlay_sse2_8bit+0x1560>
DB 68,15,88,197 ; addps %xmm5,%xmm8
DB 68,15,41,68,36,48 ; movaps %xmm8,0x30(%rsp)
DB 15,40,215 ; movaps %xmm7,%xmm2
@@ -23465,7 +23465,7 @@ _sk_clut_3D_sse41 LABEL PROC
DB 102,68,15,254,232 ; paddd %xmm0,%xmm13
DB 102,65,15,111,212 ; movdqa %xmm12,%xmm2
DB 102,65,15,254,213 ; paddd %xmm13,%xmm2
- DB 102,15,111,45,50,66,1,0 ; movdqa 0x14232(%rip),%xmm5 # 2d1e0 <_sk_overlay_sse2_8bit+0x156b>
+ DB 102,15,111,45,114,65,1,0 ; movdqa 0x14172(%rip),%xmm5 # 2d120 <_sk_overlay_sse2_8bit+0x1570>
DB 102,15,56,64,213 ; pmulld %xmm5,%xmm2
DB 102,15,111,202 ; movdqa %xmm2,%xmm1
DB 102,65,15,254,207 ; paddd %xmm15,%xmm1
@@ -23571,7 +23571,7 @@ _sk_clut_3D_sse41 LABEL PROC
DB 102,69,15,58,22,225,1 ; pextrd $0x1,%xmm12,%r9d
DB 102,69,15,58,22,226,2 ; pextrd $0x2,%xmm12,%r10d
DB 102,69,15,58,22,227,3 ; pextrd $0x3,%xmm12,%r11d
- DB 102,15,111,21,141,57,1,0 ; movdqa 0x1398d(%rip),%xmm2 # 2cb70 <_sk_overlay_sse2_8bit+0xefb>
+ DB 102,15,111,21,205,56,1,0 ; movdqa 0x138cd(%rip),%xmm2 # 2cab0 <_sk_overlay_sse2_8bit+0xf00>
DB 102,68,15,254,226 ; paddd %xmm2,%xmm12
DB 102,76,15,58,22,225,1 ; pextrq $0x1,%xmm12,%rcx
DB 102,76,15,126,227 ; movq %xmm12,%rbx
@@ -23744,8 +23744,8 @@ _sk_clut_4D_sse41 LABEL PROC
DB 102,65,15,111,197 ; movdqa %xmm13,%xmm0
DB 102,68,15,127,108,36,48 ; movdqa %xmm13,0x30(%rsp)
DB 102,15,254,193 ; paddd %xmm1,%xmm0
- DB 102,15,56,64,5,218,60,1,0 ; pmulld 0x13cda(%rip),%xmm0 # 2d1e0 <_sk_overlay_sse2_8bit+0x156b>
- DB 102,68,15,111,29,65,54,1,0 ; movdqa 0x13641(%rip),%xmm11 # 2cb50 <_sk_overlay_sse2_8bit+0xedb>
+ DB 102,15,56,64,5,26,60,1,0 ; pmulld 0x13c1a(%rip),%xmm0 # 2d120 <_sk_overlay_sse2_8bit+0x1570>
+ DB 102,68,15,111,29,129,53,1,0 ; movdqa 0x13581(%rip),%xmm11 # 2ca90 <_sk_overlay_sse2_8bit+0xee0>
DB 102,15,111,208 ; movdqa %xmm0,%xmm2
DB 102,65,15,254,211 ; paddd %xmm11,%xmm2
DB 102,73,15,58,22,208,1 ; pextrq $0x1,%xmm2,%r8
@@ -23765,7 +23765,7 @@ _sk_clut_4D_sse41 LABEL PROC
DB 102,65,15,58,22,193,1 ; pextrd $0x1,%xmm0,%r9d
DB 102,65,15,58,22,194,2 ; pextrd $0x2,%xmm0,%r10d
DB 102,65,15,58,22,195,3 ; pextrd $0x3,%xmm0,%r11d
- DB 102,68,15,111,5,242,53,1,0 ; movdqa 0x135f2(%rip),%xmm8 # 2cb70 <_sk_overlay_sse2_8bit+0xefb>
+ DB 102,68,15,111,5,50,53,1,0 ; movdqa 0x13532(%rip),%xmm8 # 2cab0 <_sk_overlay_sse2_8bit+0xf00>
DB 102,65,15,254,192 ; paddd %xmm8,%xmm0
DB 102,73,15,58,22,198,1 ; pextrq $0x1,%xmm0,%r14
DB 102,72,15,126,195 ; movq %xmm0,%rbx
@@ -23779,7 +23779,7 @@ _sk_clut_4D_sse41 LABEL PROC
DB 73,193,238,32 ; shr $0x20,%r14
DB 243,66,15,16,4,176 ; movss (%rax,%r14,4),%xmm0
DB 102,15,58,33,232,48 ; insertps $0x30,%xmm0,%xmm5
- DB 15,40,53,7,60,1,0 ; movaps 0x13c07(%rip),%xmm6 # 2d1d0 <_sk_overlay_sse2_8bit+0x155b>
+ DB 15,40,53,71,59,1,0 ; movaps 0x13b47(%rip),%xmm6 # 2d110 <_sk_overlay_sse2_8bit+0x1560>
DB 68,15,88,214 ; addps %xmm6,%xmm10
DB 68,15,41,148,36,176,0,0,0 ; movaps %xmm10,0xb0(%rsp)
DB 15,88,254 ; addps %xmm6,%xmm7
@@ -23792,7 +23792,7 @@ _sk_clut_4D_sse41 LABEL PROC
DB 102,15,254,206 ; paddd %xmm6,%xmm1
DB 102,68,15,111,214 ; movdqa %xmm6,%xmm10
DB 102,68,15,127,84,36,32 ; movdqa %xmm10,0x20(%rsp)
- DB 102,15,56,64,13,210,59,1,0 ; pmulld 0x13bd2(%rip),%xmm1 # 2d1e0 <_sk_overlay_sse2_8bit+0x156b>
+ DB 102,15,56,64,13,18,59,1,0 ; pmulld 0x13b12(%rip),%xmm1 # 2d120 <_sk_overlay_sse2_8bit+0x1570>
DB 102,15,111,225 ; movdqa %xmm1,%xmm4
DB 102,65,15,254,227 ; paddd %xmm11,%xmm4
DB 102,73,15,58,22,230,1 ; pextrq $0x1,%xmm4,%r14
@@ -23850,11 +23850,11 @@ _sk_clut_4D_sse41 LABEL PROC
DB 102,15,254,216 ; paddd %xmm0,%xmm3
DB 102,15,111,203 ; movdqa %xmm3,%xmm1
DB 102,65,15,254,205 ; paddd %xmm13,%xmm1
- DB 102,15,111,5,164,58,1,0 ; movdqa 0x13aa4(%rip),%xmm0 # 2d1e0 <_sk_overlay_sse2_8bit+0x156b>
+ DB 102,15,111,5,228,57,1,0 ; movdqa 0x139e4(%rip),%xmm0 # 2d120 <_sk_overlay_sse2_8bit+0x1570>
DB 102,15,56,64,200 ; pmulld %xmm0,%xmm1
DB 102,68,15,111,200 ; movdqa %xmm0,%xmm9
DB 102,15,111,193 ; movdqa %xmm1,%xmm0
- DB 102,68,15,111,5,253,51,1,0 ; movdqa 0x133fd(%rip),%xmm8 # 2cb50 <_sk_overlay_sse2_8bit+0xedb>
+ DB 102,68,15,111,5,61,51,1,0 ; movdqa 0x1333d(%rip),%xmm8 # 2ca90 <_sk_overlay_sse2_8bit+0xee0>
DB 102,65,15,254,192 ; paddd %xmm8,%xmm0
DB 102,72,15,58,22,193,1 ; pextrq $0x1,%xmm0,%rcx
DB 102,72,15,126,197 ; movq %xmm0,%rbp
@@ -23956,7 +23956,7 @@ _sk_clut_4D_sse41 LABEL PROC
DB 102,15,111,200 ; movdqa %xmm0,%xmm1
DB 102,68,15,111,108,36,48 ; movdqa 0x30(%rsp),%xmm13
DB 102,65,15,254,205 ; paddd %xmm13,%xmm1
- DB 102,15,111,45,106,56,1,0 ; movdqa 0x1386a(%rip),%xmm5 # 2d1e0 <_sk_overlay_sse2_8bit+0x156b>
+ DB 102,15,111,45,170,55,1,0 ; movdqa 0x137aa(%rip),%xmm5 # 2d120 <_sk_overlay_sse2_8bit+0x1570>
DB 102,15,56,64,205 ; pmulld %xmm5,%xmm1
DB 102,15,126,201 ; movd %xmm1,%ecx
DB 102,15,58,22,205,1 ; pextrd $0x1,%xmm1,%ebp
@@ -23968,7 +23968,7 @@ _sk_clut_4D_sse41 LABEL PROC
DB 243,15,16,20,152 ; movss (%rax,%rbx,4),%xmm2
DB 102,15,58,33,242,48 ; insertps $0x30,%xmm2,%xmm6
DB 102,15,111,209 ; movdqa %xmm1,%xmm2
- DB 102,15,111,29,147,49,1,0 ; movdqa 0x13193(%rip),%xmm3 # 2cb50 <_sk_overlay_sse2_8bit+0xedb>
+ DB 102,15,111,29,211,48,1,0 ; movdqa 0x130d3(%rip),%xmm3 # 2ca90 <_sk_overlay_sse2_8bit+0xee0>
DB 102,15,254,211 ; paddd %xmm3,%xmm2
DB 102,72,15,58,22,209,1 ; pextrq $0x1,%xmm2,%rcx
DB 102,72,15,126,213 ; movq %xmm2,%rbp
@@ -24016,7 +24016,7 @@ _sk_clut_4D_sse41 LABEL PROC
DB 102,65,15,58,22,195,1 ; pextrd $0x1,%xmm0,%r11d
DB 102,65,15,58,22,194,2 ; pextrd $0x2,%xmm0,%r10d
DB 102,65,15,58,22,192,3 ; pextrd $0x3,%xmm0,%r8d
- DB 102,15,254,5,187,48,1,0 ; paddd 0x130bb(%rip),%xmm0 # 2cb70 <_sk_overlay_sse2_8bit+0xefb>
+ DB 102,15,254,5,251,47,1,0 ; paddd 0x12ffb(%rip),%xmm0 # 2cab0 <_sk_overlay_sse2_8bit+0xf00>
DB 102,72,15,58,22,193,1 ; pextrq $0x1,%xmm0,%rcx
DB 102,72,15,126,195 ; movq %xmm0,%rbx
DB 137,221 ; mov %ebx,%ebp
@@ -24045,10 +24045,10 @@ _sk_clut_4D_sse41 LABEL PROC
DB 102,15,254,100,36,16 ; paddd 0x10(%rsp),%xmm4
DB 102,15,111,196 ; movdqa %xmm4,%xmm0
DB 102,65,15,254,197 ; paddd %xmm13,%xmm0
- DB 102,68,15,111,45,155,54,1,0 ; movdqa 0x1369b(%rip),%xmm13 # 2d1e0 <_sk_overlay_sse2_8bit+0x156b>
+ DB 102,68,15,111,45,219,53,1,0 ; movdqa 0x135db(%rip),%xmm13 # 2d120 <_sk_overlay_sse2_8bit+0x1570>
DB 102,65,15,56,64,197 ; pmulld %xmm13,%xmm0
DB 102,15,111,200 ; movdqa %xmm0,%xmm1
- DB 102,15,111,53,249,47,1,0 ; movdqa 0x12ff9(%rip),%xmm6 # 2cb50 <_sk_overlay_sse2_8bit+0xedb>
+ DB 102,15,111,53,57,47,1,0 ; movdqa 0x12f39(%rip),%xmm6 # 2ca90 <_sk_overlay_sse2_8bit+0xee0>
DB 102,15,254,206 ; paddd %xmm6,%xmm1
DB 102,72,15,58,22,201,1 ; pextrq $0x1,%xmm1,%rcx
DB 102,72,15,126,205 ; movq %xmm1,%rbp
@@ -24066,7 +24066,7 @@ _sk_clut_4D_sse41 LABEL PROC
DB 102,65,15,58,22,193,1 ; pextrd $0x1,%xmm0,%r9d
DB 102,65,15,58,22,194,2 ; pextrd $0x2,%xmm0,%r10d
DB 102,65,15,58,22,195,3 ; pextrd $0x3,%xmm0,%r11d
- DB 102,15,111,61,183,47,1,0 ; movdqa 0x12fb7(%rip),%xmm7 # 2cb70 <_sk_overlay_sse2_8bit+0xefb>
+ DB 102,15,111,61,247,46,1,0 ; movdqa 0x12ef7(%rip),%xmm7 # 2cab0 <_sk_overlay_sse2_8bit+0xf00>
DB 102,15,254,199 ; paddd %xmm7,%xmm0
DB 102,72,15,58,22,193,1 ; pextrq $0x1,%xmm0,%rcx
DB 102,72,15,126,195 ; movq %xmm0,%rbx
@@ -24083,7 +24083,7 @@ _sk_clut_4D_sse41 LABEL PROC
DB 102,65,15,254,227 ; paddd %xmm11,%xmm4
DB 102,65,15,56,64,229 ; pmulld %xmm13,%xmm4
DB 102,15,111,244 ; movdqa %xmm4,%xmm6
- DB 102,68,15,111,45,63,47,1,0 ; movdqa 0x12f3f(%rip),%xmm13 # 2cb50 <_sk_overlay_sse2_8bit+0xedb>
+ DB 102,68,15,111,45,127,46,1,0 ; movdqa 0x12e7f(%rip),%xmm13 # 2ca90 <_sk_overlay_sse2_8bit+0xee0>
DB 102,65,15,254,245 ; paddd %xmm13,%xmm6
DB 102,72,15,58,22,241,1 ; pextrq $0x1,%xmm6,%rcx
DB 102,72,15,126,243 ; movq %xmm6,%rbx
@@ -24162,7 +24162,7 @@ _sk_clut_4D_sse41 LABEL PROC
DB 102,68,15,111,76,36,48 ; movdqa 0x30(%rsp),%xmm9
DB 102,65,15,111,193 ; movdqa %xmm9,%xmm0
DB 102,15,254,194 ; paddd %xmm2,%xmm0
- DB 102,15,111,29,73,52,1,0 ; movdqa 0x13449(%rip),%xmm3 # 2d1e0 <_sk_overlay_sse2_8bit+0x156b>
+ DB 102,15,111,29,137,51,1,0 ; movdqa 0x13389(%rip),%xmm3 # 2d120 <_sk_overlay_sse2_8bit+0x1570>
DB 102,15,56,64,195 ; pmulld %xmm3,%xmm0
DB 102,15,111,200 ; movdqa %xmm0,%xmm1
DB 102,69,15,111,213 ; movdqa %xmm13,%xmm10
@@ -24183,7 +24183,7 @@ _sk_clut_4D_sse41 LABEL PROC
DB 102,65,15,58,22,193,1 ; pextrd $0x1,%xmm0,%r9d
DB 102,65,15,58,22,194,2 ; pextrd $0x2,%xmm0,%r10d
DB 102,65,15,58,22,195,3 ; pextrd $0x3,%xmm0,%r11d
- DB 102,15,111,45,104,45,1,0 ; movdqa 0x12d68(%rip),%xmm5 # 2cb70 <_sk_overlay_sse2_8bit+0xefb>
+ DB 102,15,111,45,168,44,1,0 ; movdqa 0x12ca8(%rip),%xmm5 # 2cab0 <_sk_overlay_sse2_8bit+0xf00>
DB 102,15,254,197 ; paddd %xmm5,%xmm0
DB 102,72,15,58,22,193,1 ; pextrq $0x1,%xmm0,%rcx
DB 102,72,15,126,195 ; movq %xmm0,%rbx
@@ -24271,7 +24271,7 @@ _sk_clut_4D_sse41 LABEL PROC
DB 102,65,15,58,22,225,1 ; pextrd $0x1,%xmm4,%r9d
DB 102,65,15,58,22,226,2 ; pextrd $0x2,%xmm4,%r10d
DB 102,65,15,58,22,227,3 ; pextrd $0x3,%xmm4,%r11d
- DB 102,68,15,111,13,156,43,1,0 ; movdqa 0x12b9c(%rip),%xmm9 # 2cb70 <_sk_overlay_sse2_8bit+0xefb>
+ DB 102,68,15,111,13,220,42,1,0 ; movdqa 0x12adc(%rip),%xmm9 # 2cab0 <_sk_overlay_sse2_8bit+0xf00>
DB 102,65,15,254,225 ; paddd %xmm9,%xmm4
DB 102,72,15,58,22,225,1 ; pextrq $0x1,%xmm4,%rcx
DB 102,72,15,126,227 ; movq %xmm4,%rbx
@@ -24353,7 +24353,7 @@ _sk_clut_4D_sse41 LABEL PROC
DB 102,15,254,76,36,48 ; paddd 0x30(%rsp),%xmm1
DB 102,65,15,56,64,205 ; pmulld %xmm13,%xmm1
DB 102,15,111,193 ; movdqa %xmm1,%xmm0
- DB 102,68,15,111,37,209,41,1,0 ; movdqa 0x129d1(%rip),%xmm12 # 2cb50 <_sk_overlay_sse2_8bit+0xedb>
+ DB 102,68,15,111,37,17,41,1,0 ; movdqa 0x12911(%rip),%xmm12 # 2ca90 <_sk_overlay_sse2_8bit+0xee0>
DB 102,65,15,254,196 ; paddd %xmm12,%xmm0
DB 102,72,15,58,22,193,1 ; pextrq $0x1,%xmm0,%rcx
DB 102,72,15,126,197 ; movq %xmm0,%rbp
@@ -24371,7 +24371,7 @@ _sk_clut_4D_sse41 LABEL PROC
DB 102,65,15,58,22,201,1 ; pextrd $0x1,%xmm1,%r9d
DB 102,65,15,58,22,202,2 ; pextrd $0x2,%xmm1,%r10d
DB 102,65,15,58,22,203,3 ; pextrd $0x3,%xmm1,%r11d
- DB 102,15,111,29,142,41,1,0 ; movdqa 0x1298e(%rip),%xmm3 # 2cb70 <_sk_overlay_sse2_8bit+0xefb>
+ DB 102,15,111,29,206,40,1,0 ; movdqa 0x128ce(%rip),%xmm3 # 2cab0 <_sk_overlay_sse2_8bit+0xf00>
DB 102,15,254,203 ; paddd %xmm3,%xmm1
DB 102,72,15,58,22,201,1 ; pextrq $0x1,%xmm1,%rcx
DB 102,72,15,126,203 ; movq %xmm1,%rbx
@@ -24440,9 +24440,9 @@ _sk_clut_4D_sse41 LABEL PROC
DB 102,68,15,254,116,36,16 ; paddd 0x10(%rsp),%xmm14
DB 102,15,111,68,36,48 ; movdqa 0x30(%rsp),%xmm0
DB 102,65,15,254,198 ; paddd %xmm14,%xmm0
- DB 102,15,56,64,5,138,46,1,0 ; pmulld 0x12e8a(%rip),%xmm0 # 2d1e0 <_sk_overlay_sse2_8bit+0x156b>
+ DB 102,15,56,64,5,202,45,1,0 ; pmulld 0x12dca(%rip),%xmm0 # 2d120 <_sk_overlay_sse2_8bit+0x1570>
DB 102,15,111,200 ; movdqa %xmm0,%xmm1
- DB 102,15,254,5,238,39,1,0 ; paddd 0x127ee(%rip),%xmm0 # 2cb50 <_sk_overlay_sse2_8bit+0xedb>
+ DB 102,15,254,5,46,39,1,0 ; paddd 0x1272e(%rip),%xmm0 # 2ca90 <_sk_overlay_sse2_8bit+0xee0>
DB 102,72,15,58,22,193,1 ; pextrq $0x1,%xmm0,%rcx
DB 102,72,15,126,197 ; movq %xmm0,%rbp
DB 137,235 ; mov %ebp,%ebx
@@ -24475,8 +24475,8 @@ _sk_clut_4D_sse41 LABEL PROC
DB 243,15,16,4,136 ; movss (%rax,%rcx,4),%xmm0
DB 102,15,58,33,232,48 ; insertps $0x30,%xmm0,%xmm5
DB 102,68,15,254,116,36,32 ; paddd 0x20(%rsp),%xmm14
- DB 102,68,15,56,64,53,207,45,1,0 ; pmulld 0x12dcf(%rip),%xmm14 # 2d1e0 <_sk_overlay_sse2_8bit+0x156b>
- DB 102,15,111,5,55,39,1,0 ; movdqa 0x12737(%rip),%xmm0 # 2cb50 <_sk_overlay_sse2_8bit+0xedb>
+ DB 102,68,15,56,64,53,15,45,1,0 ; pmulld 0x12d0f(%rip),%xmm14 # 2d120 <_sk_overlay_sse2_8bit+0x1570>
+ DB 102,15,111,5,119,38,1,0 ; movdqa 0x12677(%rip),%xmm0 # 2ca90 <_sk_overlay_sse2_8bit+0xee0>
DB 102,65,15,254,198 ; paddd %xmm14,%xmm0
DB 102,72,15,58,22,193,1 ; pextrq $0x1,%xmm0,%rcx
DB 102,72,15,126,195 ; movq %xmm0,%rbx
@@ -24557,7 +24557,7 @@ _sk_clut_4D_sse41 LABEL PROC
DB 15,89,212 ; mulps %xmm4,%xmm2
DB 15,88,215 ; addps %xmm7,%xmm2
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 15,40,29,175,37,1,0 ; movaps 0x125af(%rip),%xmm3 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 15,40,29,239,36,1,0 ; movaps 0x124ef(%rip),%xmm3 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 72,139,76,36,120 ; mov 0x78(%rsp),%rcx
DB 15,40,164,36,208,0,0,0 ; movaps 0xd0(%rsp),%xmm4
DB 15,40,172,36,224,0,0,0 ; movaps 0xe0(%rsp),%xmm5
@@ -24660,15 +24660,15 @@ _sk_seed_shader_sse2 LABEL PROC
DB 102,15,110,194 ; movd %edx,%xmm0
DB 102,15,112,192,0 ; pshufd $0x0,%xmm0,%xmm0
DB 15,91,192 ; cvtdq2ps %xmm0,%xmm0
- DB 15,40,21,11,36,1,0 ; movaps 0x1240b(%rip),%xmm2 # 2cb20 <_sk_overlay_sse2_8bit+0xeab>
+ DB 15,40,21,75,35,1,0 ; movaps 0x1234b(%rip),%xmm2 # 2ca60 <_sk_overlay_sse2_8bit+0xeb0>
DB 15,88,194 ; addps %xmm2,%xmm0
- DB 15,88,5,17,36,1,0 ; addps 0x12411(%rip),%xmm0 # 2cb30 <_sk_overlay_sse2_8bit+0xebb>
+ DB 15,88,5,81,35,1,0 ; addps 0x12351(%rip),%xmm0 # 2ca70 <_sk_overlay_sse2_8bit+0xec0>
DB 102,15,110,201 ; movd %ecx,%xmm1
DB 102,15,112,201,0 ; pshufd $0x0,%xmm1,%xmm1
DB 15,91,201 ; cvtdq2ps %xmm1,%xmm1
DB 15,88,202 ; addps %xmm2,%xmm1
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 15,40,21,9,36,1,0 ; movaps 0x12409(%rip),%xmm2 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 15,40,21,73,35,1,0 ; movaps 0x12349(%rip),%xmm2 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 15,87,219 ; xorps %xmm3,%xmm3
DB 15,87,228 ; xorps %xmm4,%xmm4
DB 15,87,237 ; xorps %xmm5,%xmm5
@@ -24681,18 +24681,18 @@ _sk_dither_sse2 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 102,68,15,110,194 ; movd %edx,%xmm8
DB 102,69,15,112,200,0 ; pshufd $0x0,%xmm8,%xmm9
- DB 102,68,15,254,13,162,35,1,0 ; paddd 0x123a2(%rip),%xmm9 # 2cb00 <_sk_overlay_sse2_8bit+0xe8b>
+ DB 102,68,15,254,13,226,34,1,0 ; paddd 0x122e2(%rip),%xmm9 # 2ca40 <_sk_overlay_sse2_8bit+0xe90>
DB 102,68,15,110,193 ; movd %ecx,%xmm8
DB 102,69,15,112,192,0 ; pshufd $0x0,%xmm8,%xmm8
DB 102,69,15,239,193 ; pxor %xmm9,%xmm8
- DB 102,68,15,111,21,217,35,1,0 ; movdqa 0x123d9(%rip),%xmm10 # 2cb50 <_sk_overlay_sse2_8bit+0xedb>
+ DB 102,68,15,111,21,25,35,1,0 ; movdqa 0x12319(%rip),%xmm10 # 2ca90 <_sk_overlay_sse2_8bit+0xee0>
DB 102,69,15,111,216 ; movdqa %xmm8,%xmm11
DB 102,69,15,219,218 ; pand %xmm10,%xmm11
DB 102,65,15,114,243,5 ; pslld $0x5,%xmm11
DB 102,69,15,219,209 ; pand %xmm9,%xmm10
DB 102,65,15,114,242,4 ; pslld $0x4,%xmm10
- DB 102,68,15,111,37,197,35,1,0 ; movdqa 0x123c5(%rip),%xmm12 # 2cb60 <_sk_overlay_sse2_8bit+0xeeb>
- DB 102,68,15,111,45,204,35,1,0 ; movdqa 0x123cc(%rip),%xmm13 # 2cb70 <_sk_overlay_sse2_8bit+0xefb>
+ DB 102,68,15,111,37,5,35,1,0 ; movdqa 0x12305(%rip),%xmm12 # 2caa0 <_sk_overlay_sse2_8bit+0xef0>
+ DB 102,68,15,111,45,12,35,1,0 ; movdqa 0x1230c(%rip),%xmm13 # 2cab0 <_sk_overlay_sse2_8bit+0xf00>
DB 102,69,15,111,240 ; movdqa %xmm8,%xmm14
DB 102,69,15,219,245 ; pand %xmm13,%xmm14
DB 102,65,15,114,246,2 ; pslld $0x2,%xmm14
@@ -24708,8 +24708,8 @@ _sk_dither_sse2 LABEL PROC
DB 102,69,15,235,245 ; por %xmm13,%xmm14
DB 102,69,15,235,240 ; por %xmm8,%xmm14
DB 69,15,91,198 ; cvtdq2ps %xmm14,%xmm8
- DB 68,15,89,5,135,35,1,0 ; mulps 0x12387(%rip),%xmm8 # 2cb80 <_sk_overlay_sse2_8bit+0xf0b>
- DB 68,15,88,5,143,35,1,0 ; addps 0x1238f(%rip),%xmm8 # 2cb90 <_sk_overlay_sse2_8bit+0xf1b>
+ DB 68,15,89,5,199,34,1,0 ; mulps 0x122c7(%rip),%xmm8 # 2cac0 <_sk_overlay_sse2_8bit+0xf10>
+ DB 68,15,88,5,207,34,1,0 ; addps 0x122cf(%rip),%xmm8 # 2cad0 <_sk_overlay_sse2_8bit+0xf20>
DB 243,68,15,16,16 ; movss (%rax),%xmm10
DB 69,15,198,210,0 ; shufps $0x0,%xmm10,%xmm10
DB 69,15,89,208 ; mulps %xmm8,%xmm10
@@ -24747,7 +24747,7 @@ _sk_uniform_color_sse2 LABEL PROC
PUBLIC _sk_black_color_sse2
_sk_black_color_sse2 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 15,40,29,197,34,1,0 ; movaps 0x122c5(%rip),%xmm3 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 15,40,29,5,34,1,0 ; movaps 0x12205(%rip),%xmm3 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 15,87,192 ; xorps %xmm0,%xmm0
DB 15,87,201 ; xorps %xmm1,%xmm1
DB 15,87,210 ; xorps %xmm2,%xmm2
@@ -24756,7 +24756,7 @@ _sk_black_color_sse2 LABEL PROC
PUBLIC _sk_white_color_sse2
_sk_white_color_sse2 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 15,40,5,177,34,1,0 ; movaps 0x122b1(%rip),%xmm0 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 15,40,5,241,33,1,0 ; movaps 0x121f1(%rip),%xmm0 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 15,40,200 ; movaps %xmm0,%xmm1
DB 15,40,208 ; movaps %xmm0,%xmm2
DB 15,40,216 ; movaps %xmm0,%xmm3
@@ -24794,7 +24794,7 @@ _sk_clear_sse2 LABEL PROC
PUBLIC _sk_srcatop_sse2
_sk_srcatop_sse2 LABEL PROC
DB 15,89,199 ; mulps %xmm7,%xmm0
- DB 68,15,40,5,97,34,1,0 ; movaps 0x12261(%rip),%xmm8 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 68,15,40,5,161,33,1,0 ; movaps 0x121a1(%rip),%xmm8 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 68,15,92,195 ; subps %xmm3,%xmm8
DB 69,15,40,200 ; movaps %xmm8,%xmm9
DB 68,15,89,204 ; mulps %xmm4,%xmm9
@@ -24817,7 +24817,7 @@ PUBLIC _sk_dstatop_sse2
_sk_dstatop_sse2 LABEL PROC
DB 68,15,40,195 ; movaps %xmm3,%xmm8
DB 68,15,89,196 ; mulps %xmm4,%xmm8
- DB 68,15,40,13,20,34,1,0 ; movaps 0x12214(%rip),%xmm9 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 68,15,40,13,84,33,1,0 ; movaps 0x12154(%rip),%xmm9 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 68,15,92,207 ; subps %xmm7,%xmm9
DB 65,15,89,193 ; mulps %xmm9,%xmm0
DB 65,15,88,192 ; addps %xmm8,%xmm0
@@ -24858,7 +24858,7 @@ _sk_dstin_sse2 LABEL PROC
PUBLIC _sk_srcout_sse2
_sk_srcout_sse2 LABEL PROC
- DB 68,15,40,5,168,33,1,0 ; movaps 0x121a8(%rip),%xmm8 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 68,15,40,5,232,32,1,0 ; movaps 0x120e8(%rip),%xmm8 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 68,15,92,199 ; subps %xmm7,%xmm8
DB 65,15,89,192 ; mulps %xmm8,%xmm0
DB 65,15,89,200 ; mulps %xmm8,%xmm1
@@ -24869,7 +24869,7 @@ _sk_srcout_sse2 LABEL PROC
PUBLIC _sk_dstout_sse2
_sk_dstout_sse2 LABEL PROC
- DB 68,15,40,5,136,33,1,0 ; movaps 0x12188(%rip),%xmm8 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 68,15,40,5,200,32,1,0 ; movaps 0x120c8(%rip),%xmm8 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 68,15,92,195 ; subps %xmm3,%xmm8
DB 65,15,40,192 ; movaps %xmm8,%xmm0
DB 15,89,196 ; mulps %xmm4,%xmm0
@@ -24884,7 +24884,7 @@ _sk_dstout_sse2 LABEL PROC
PUBLIC _sk_srcover_sse2
_sk_srcover_sse2 LABEL PROC
- DB 68,15,40,5,91,33,1,0 ; movaps 0x1215b(%rip),%xmm8 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 68,15,40,5,155,32,1,0 ; movaps 0x1209b(%rip),%xmm8 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 68,15,92,195 ; subps %xmm3,%xmm8
DB 69,15,40,200 ; movaps %xmm8,%xmm9
DB 68,15,89,204 ; mulps %xmm4,%xmm9
@@ -24902,7 +24902,7 @@ _sk_srcover_sse2 LABEL PROC
PUBLIC _sk_dstover_sse2
_sk_dstover_sse2 LABEL PROC
- DB 68,15,40,5,31,33,1,0 ; movaps 0x1211f(%rip),%xmm8 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 68,15,40,5,95,32,1,0 ; movaps 0x1205f(%rip),%xmm8 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 68,15,92,199 ; subps %xmm7,%xmm8
DB 65,15,89,192 ; mulps %xmm8,%xmm0
DB 15,88,196 ; addps %xmm4,%xmm0
@@ -24926,7 +24926,7 @@ _sk_modulate_sse2 LABEL PROC
PUBLIC _sk_multiply_sse2
_sk_multiply_sse2 LABEL PROC
- DB 68,15,40,5,227,32,1,0 ; movaps 0x120e3(%rip),%xmm8 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 68,15,40,5,35,32,1,0 ; movaps 0x12023(%rip),%xmm8 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 69,15,40,200 ; movaps %xmm8,%xmm9
DB 68,15,92,207 ; subps %xmm7,%xmm9
DB 69,15,40,209 ; movaps %xmm9,%xmm10
@@ -24962,7 +24962,7 @@ _sk_multiply_sse2 LABEL PROC
PUBLIC _sk_plus__sse2
_sk_plus__sse2 LABEL PROC
DB 15,88,196 ; addps %xmm4,%xmm0
- DB 68,15,40,5,100,32,1,0 ; movaps 0x12064(%rip),%xmm8 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 68,15,40,5,164,31,1,0 ; movaps 0x11fa4(%rip),%xmm8 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 65,15,93,192 ; minps %xmm8,%xmm0
DB 15,88,205 ; addps %xmm5,%xmm1
DB 65,15,93,200 ; minps %xmm8,%xmm1
@@ -25000,7 +25000,7 @@ _sk_screen_sse2 LABEL PROC
PUBLIC _sk_xor__sse2
_sk_xor__sse2 LABEL PROC
DB 68,15,40,195 ; movaps %xmm3,%xmm8
- DB 15,40,29,240,31,1,0 ; movaps 0x11ff0(%rip),%xmm3 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 15,40,29,48,31,1,0 ; movaps 0x11f30(%rip),%xmm3 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 68,15,40,203 ; movaps %xmm3,%xmm9
DB 68,15,92,207 ; subps %xmm7,%xmm9
DB 65,15,89,193 ; mulps %xmm9,%xmm0
@@ -25046,7 +25046,7 @@ _sk_darken_sse2 LABEL PROC
DB 68,15,89,206 ; mulps %xmm6,%xmm9
DB 65,15,95,209 ; maxps %xmm9,%xmm2
DB 68,15,92,194 ; subps %xmm2,%xmm8
- DB 15,40,21,75,31,1,0 ; movaps 0x11f4b(%rip),%xmm2 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 15,40,21,139,30,1,0 ; movaps 0x11e8b(%rip),%xmm2 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 15,92,211 ; subps %xmm3,%xmm2
DB 15,89,215 ; mulps %xmm7,%xmm2
DB 15,88,218 ; addps %xmm2,%xmm3
@@ -25078,7 +25078,7 @@ _sk_lighten_sse2 LABEL PROC
DB 68,15,89,206 ; mulps %xmm6,%xmm9
DB 65,15,93,209 ; minps %xmm9,%xmm2
DB 68,15,92,194 ; subps %xmm2,%xmm8
- DB 15,40,21,224,30,1,0 ; movaps 0x11ee0(%rip),%xmm2 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 15,40,21,32,30,1,0 ; movaps 0x11e20(%rip),%xmm2 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 15,92,211 ; subps %xmm3,%xmm2
DB 15,89,215 ; mulps %xmm7,%xmm2
DB 15,88,218 ; addps %xmm2,%xmm3
@@ -25113,7 +25113,7 @@ _sk_difference_sse2 LABEL PROC
DB 65,15,93,209 ; minps %xmm9,%xmm2
DB 15,88,210 ; addps %xmm2,%xmm2
DB 68,15,92,194 ; subps %xmm2,%xmm8
- DB 15,40,21,106,30,1,0 ; movaps 0x11e6a(%rip),%xmm2 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 15,40,21,170,29,1,0 ; movaps 0x11daa(%rip),%xmm2 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 15,92,211 ; subps %xmm3,%xmm2
DB 15,89,215 ; mulps %xmm7,%xmm2
DB 15,88,218 ; addps %xmm2,%xmm3
@@ -25139,7 +25139,7 @@ _sk_exclusion_sse2 LABEL PROC
DB 15,89,214 ; mulps %xmm6,%xmm2
DB 15,88,210 ; addps %xmm2,%xmm2
DB 68,15,92,194 ; subps %xmm2,%xmm8
- DB 15,40,21,26,30,1,0 ; movaps 0x11e1a(%rip),%xmm2 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 15,40,21,90,29,1,0 ; movaps 0x11d5a(%rip),%xmm2 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 15,92,211 ; subps %xmm3,%xmm2
DB 15,89,215 ; mulps %xmm7,%xmm2
DB 15,88,218 ; addps %xmm2,%xmm3
@@ -25150,7 +25150,7 @@ _sk_exclusion_sse2 LABEL PROC
PUBLIC _sk_colorburn_sse2
_sk_colorburn_sse2 LABEL PROC
DB 68,15,40,192 ; movaps %xmm0,%xmm8
- DB 68,15,40,13,253,29,1,0 ; movaps 0x11dfd(%rip),%xmm9 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 68,15,40,13,61,29,1,0 ; movaps 0x11d3d(%rip),%xmm9 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 69,15,40,209 ; movaps %xmm9,%xmm10
DB 68,15,92,215 ; subps %xmm7,%xmm10
DB 69,15,40,218 ; movaps %xmm10,%xmm11
@@ -25243,7 +25243,7 @@ _sk_colorburn_sse2 LABEL PROC
PUBLIC _sk_colordodge_sse2
_sk_colordodge_sse2 LABEL PROC
DB 68,15,40,200 ; movaps %xmm0,%xmm9
- DB 68,15,40,21,165,28,1,0 ; movaps 0x11ca5(%rip),%xmm10 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 68,15,40,21,229,27,1,0 ; movaps 0x11be5(%rip),%xmm10 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 69,15,40,218 ; movaps %xmm10,%xmm11
DB 68,15,92,223 ; subps %xmm7,%xmm11
DB 65,15,40,195 ; movaps %xmm11,%xmm0
@@ -25334,7 +25334,7 @@ _sk_hardlight_sse2 LABEL PROC
DB 15,41,52,36 ; movaps %xmm6,(%rsp)
DB 15,40,245 ; movaps %xmm5,%xmm6
DB 15,40,236 ; movaps %xmm4,%xmm5
- DB 68,15,40,29,75,27,1,0 ; movaps 0x11b4b(%rip),%xmm11 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 68,15,40,29,139,26,1,0 ; movaps 0x11a8b(%rip),%xmm11 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 69,15,40,211 ; movaps %xmm11,%xmm10
DB 68,15,92,215 ; subps %xmm7,%xmm10
DB 69,15,40,194 ; movaps %xmm10,%xmm8
@@ -25421,7 +25421,7 @@ PUBLIC _sk_overlay_sse2
_sk_overlay_sse2 LABEL PROC
DB 68,15,40,193 ; movaps %xmm1,%xmm8
DB 68,15,40,232 ; movaps %xmm0,%xmm13
- DB 68,15,40,13,6,26,1,0 ; movaps 0x11a06(%rip),%xmm9 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 68,15,40,13,70,25,1,0 ; movaps 0x11946(%rip),%xmm9 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 69,15,40,209 ; movaps %xmm9,%xmm10
DB 68,15,92,215 ; subps %xmm7,%xmm10
DB 69,15,40,218 ; movaps %xmm10,%xmm11
@@ -25511,7 +25511,7 @@ _sk_softlight_sse2 LABEL PROC
DB 68,15,40,213 ; movaps %xmm5,%xmm10
DB 68,15,94,215 ; divps %xmm7,%xmm10
DB 69,15,84,212 ; andps %xmm12,%xmm10
- DB 68,15,40,13,176,24,1,0 ; movaps 0x118b0(%rip),%xmm9 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 68,15,40,13,240,23,1,0 ; movaps 0x117f0(%rip),%xmm9 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 69,15,40,249 ; movaps %xmm9,%xmm15
DB 69,15,92,250 ; subps %xmm10,%xmm15
DB 69,15,40,218 ; movaps %xmm10,%xmm11
@@ -25524,10 +25524,10 @@ _sk_softlight_sse2 LABEL PROC
DB 65,15,40,194 ; movaps %xmm10,%xmm0
DB 15,89,192 ; mulps %xmm0,%xmm0
DB 65,15,88,194 ; addps %xmm10,%xmm0
- DB 68,15,40,53,218,24,1,0 ; movaps 0x118da(%rip),%xmm14 # 2cba0 <_sk_overlay_sse2_8bit+0xf2b>
+ DB 68,15,40,53,26,24,1,0 ; movaps 0x1181a(%rip),%xmm14 # 2cae0 <_sk_overlay_sse2_8bit+0xf30>
DB 69,15,88,222 ; addps %xmm14,%xmm11
DB 68,15,89,216 ; mulps %xmm0,%xmm11
- DB 68,15,40,21,218,24,1,0 ; movaps 0x118da(%rip),%xmm10 # 2cbb0 <_sk_overlay_sse2_8bit+0xf3b>
+ DB 68,15,40,21,26,24,1,0 ; movaps 0x1181a(%rip),%xmm10 # 2caf0 <_sk_overlay_sse2_8bit+0xf40>
DB 69,15,89,234 ; mulps %xmm10,%xmm13
DB 69,15,88,235 ; addps %xmm11,%xmm13
DB 15,88,228 ; addps %xmm4,%xmm4
@@ -25672,7 +25672,7 @@ _sk_hue_sse2 LABEL PROC
DB 68,15,40,209 ; movaps %xmm1,%xmm10
DB 68,15,40,225 ; movaps %xmm1,%xmm12
DB 68,15,89,211 ; mulps %xmm3,%xmm10
- DB 68,15,40,5,102,22,1,0 ; movaps 0x11666(%rip),%xmm8 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 68,15,40,5,166,21,1,0 ; movaps 0x115a6(%rip),%xmm8 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 69,15,40,216 ; movaps %xmm8,%xmm11
DB 15,40,207 ; movaps %xmm7,%xmm1
DB 68,15,92,217 ; subps %xmm1,%xmm11
@@ -25720,12 +25720,12 @@ _sk_hue_sse2 LABEL PROC
DB 69,15,84,206 ; andps %xmm14,%xmm9
DB 69,15,84,214 ; andps %xmm14,%xmm10
DB 65,15,84,214 ; andps %xmm14,%xmm2
- DB 68,15,40,61,35,22,1,0 ; movaps 0x11623(%rip),%xmm15 # 2cbc0 <_sk_overlay_sse2_8bit+0xf4b>
+ DB 68,15,40,61,99,21,1,0 ; movaps 0x11563(%rip),%xmm15 # 2cb00 <_sk_overlay_sse2_8bit+0xf50>
DB 65,15,89,231 ; mulps %xmm15,%xmm4
- DB 15,40,5,40,22,1,0 ; movaps 0x11628(%rip),%xmm0 # 2cbd0 <_sk_overlay_sse2_8bit+0xf5b>
+ DB 15,40,5,104,21,1,0 ; movaps 0x11568(%rip),%xmm0 # 2cb10 <_sk_overlay_sse2_8bit+0xf60>
DB 15,89,240 ; mulps %xmm0,%xmm6
DB 15,88,244 ; addps %xmm4,%xmm6
- DB 68,15,40,53,42,22,1,0 ; movaps 0x1162a(%rip),%xmm14 # 2cbe0 <_sk_overlay_sse2_8bit+0xf6b>
+ DB 68,15,40,53,106,21,1,0 ; movaps 0x1156a(%rip),%xmm14 # 2cb20 <_sk_overlay_sse2_8bit+0xf70>
DB 68,15,40,239 ; movaps %xmm7,%xmm13
DB 69,15,89,238 ; mulps %xmm14,%xmm13
DB 68,15,88,238 ; addps %xmm6,%xmm13
@@ -25903,14 +25903,14 @@ _sk_saturation_sse2 LABEL PROC
DB 68,15,84,211 ; andps %xmm3,%xmm10
DB 68,15,84,203 ; andps %xmm3,%xmm9
DB 15,84,195 ; andps %xmm3,%xmm0
- DB 68,15,40,5,119,19,1,0 ; movaps 0x11377(%rip),%xmm8 # 2cbc0 <_sk_overlay_sse2_8bit+0xf4b>
+ DB 68,15,40,5,183,18,1,0 ; movaps 0x112b7(%rip),%xmm8 # 2cb00 <_sk_overlay_sse2_8bit+0xf50>
DB 15,40,214 ; movaps %xmm6,%xmm2
DB 65,15,89,208 ; mulps %xmm8,%xmm2
- DB 15,40,13,121,19,1,0 ; movaps 0x11379(%rip),%xmm1 # 2cbd0 <_sk_overlay_sse2_8bit+0xf5b>
+ DB 15,40,13,185,18,1,0 ; movaps 0x112b9(%rip),%xmm1 # 2cb10 <_sk_overlay_sse2_8bit+0xf60>
DB 15,40,221 ; movaps %xmm5,%xmm3
DB 15,89,217 ; mulps %xmm1,%xmm3
DB 15,88,218 ; addps %xmm2,%xmm3
- DB 68,15,40,37,120,19,1,0 ; movaps 0x11378(%rip),%xmm12 # 2cbe0 <_sk_overlay_sse2_8bit+0xf6b>
+ DB 68,15,40,37,184,18,1,0 ; movaps 0x112b8(%rip),%xmm12 # 2cb20 <_sk_overlay_sse2_8bit+0xf70>
DB 69,15,89,236 ; mulps %xmm12,%xmm13
DB 68,15,88,235 ; addps %xmm3,%xmm13
DB 65,15,40,210 ; movaps %xmm10,%xmm2
@@ -25955,7 +25955,7 @@ _sk_saturation_sse2 LABEL PROC
DB 15,40,223 ; movaps %xmm7,%xmm3
DB 15,40,236 ; movaps %xmm4,%xmm5
DB 15,89,221 ; mulps %xmm5,%xmm3
- DB 68,15,40,5,45,18,1,0 ; movaps 0x1122d(%rip),%xmm8 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 68,15,40,5,109,17,1,0 ; movaps 0x1116d(%rip),%xmm8 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 65,15,40,224 ; movaps %xmm8,%xmm4
DB 68,15,92,199 ; subps %xmm7,%xmm8
DB 15,88,253 ; addps %xmm5,%xmm7
@@ -26056,14 +26056,14 @@ _sk_color_sse2 LABEL PROC
DB 68,15,40,213 ; movaps %xmm5,%xmm10
DB 69,15,89,208 ; mulps %xmm8,%xmm10
DB 65,15,40,208 ; movaps %xmm8,%xmm2
- DB 68,15,40,45,53,17,1,0 ; movaps 0x11135(%rip),%xmm13 # 2cbc0 <_sk_overlay_sse2_8bit+0xf4b>
+ DB 68,15,40,45,117,16,1,0 ; movaps 0x11075(%rip),%xmm13 # 2cb00 <_sk_overlay_sse2_8bit+0xf50>
DB 68,15,40,198 ; movaps %xmm6,%xmm8
DB 69,15,89,197 ; mulps %xmm13,%xmm8
- DB 68,15,40,53,53,17,1,0 ; movaps 0x11135(%rip),%xmm14 # 2cbd0 <_sk_overlay_sse2_8bit+0xf5b>
+ DB 68,15,40,53,117,16,1,0 ; movaps 0x11075(%rip),%xmm14 # 2cb10 <_sk_overlay_sse2_8bit+0xf60>
DB 65,15,40,195 ; movaps %xmm11,%xmm0
DB 65,15,89,198 ; mulps %xmm14,%xmm0
DB 65,15,88,192 ; addps %xmm8,%xmm0
- DB 68,15,40,29,49,17,1,0 ; movaps 0x11131(%rip),%xmm11 # 2cbe0 <_sk_overlay_sse2_8bit+0xf6b>
+ DB 68,15,40,29,113,16,1,0 ; movaps 0x11071(%rip),%xmm11 # 2cb20 <_sk_overlay_sse2_8bit+0xf70>
DB 69,15,89,227 ; mulps %xmm11,%xmm12
DB 68,15,88,224 ; addps %xmm0,%xmm12
DB 65,15,40,193 ; movaps %xmm9,%xmm0
@@ -26071,7 +26071,7 @@ _sk_color_sse2 LABEL PROC
DB 69,15,40,250 ; movaps %xmm10,%xmm15
DB 69,15,89,254 ; mulps %xmm14,%xmm15
DB 68,15,88,248 ; addps %xmm0,%xmm15
- DB 68,15,40,5,109,16,1,0 ; movaps 0x1106d(%rip),%xmm8 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 68,15,40,5,173,15,1,0 ; movaps 0x10fad(%rip),%xmm8 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 65,15,40,224 ; movaps %xmm8,%xmm4
DB 15,92,226 ; subps %xmm2,%xmm4
DB 15,89,252 ; mulps %xmm4,%xmm7
@@ -26207,15 +26207,15 @@ _sk_luminosity_sse2 LABEL PROC
DB 68,15,40,205 ; movaps %xmm5,%xmm9
DB 68,15,89,204 ; mulps %xmm4,%xmm9
DB 15,89,222 ; mulps %xmm6,%xmm3
- DB 68,15,40,37,239,14,1,0 ; movaps 0x10eef(%rip),%xmm12 # 2cbc0 <_sk_overlay_sse2_8bit+0xf4b>
+ DB 68,15,40,37,47,14,1,0 ; movaps 0x10e2f(%rip),%xmm12 # 2cb00 <_sk_overlay_sse2_8bit+0xf50>
DB 68,15,40,199 ; movaps %xmm7,%xmm8
DB 69,15,89,196 ; mulps %xmm12,%xmm8
- DB 68,15,40,45,239,14,1,0 ; movaps 0x10eef(%rip),%xmm13 # 2cbd0 <_sk_overlay_sse2_8bit+0xf5b>
+ DB 68,15,40,45,47,14,1,0 ; movaps 0x10e2f(%rip),%xmm13 # 2cb10 <_sk_overlay_sse2_8bit+0xf60>
DB 68,15,40,241 ; movaps %xmm1,%xmm14
DB 69,15,89,245 ; mulps %xmm13,%xmm14
DB 69,15,88,240 ; addps %xmm8,%xmm14
- DB 68,15,40,29,235,14,1,0 ; movaps 0x10eeb(%rip),%xmm11 # 2cbe0 <_sk_overlay_sse2_8bit+0xf6b>
- DB 68,15,40,5,67,14,1,0 ; movaps 0x10e43(%rip),%xmm8 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 68,15,40,29,43,14,1,0 ; movaps 0x10e2b(%rip),%xmm11 # 2cb20 <_sk_overlay_sse2_8bit+0xf70>
+ DB 68,15,40,5,131,13,1,0 ; movaps 0x10d83(%rip),%xmm8 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 69,15,40,248 ; movaps %xmm8,%xmm15
DB 65,15,40,194 ; movaps %xmm10,%xmm0
DB 68,15,92,248 ; subps %xmm0,%xmm15
@@ -26358,7 +26358,7 @@ _sk_srcover_rgba_8888_sse2 LABEL PROC
DB 15,133,228,0,0,0 ; jne 1bfea <_sk_srcover_rgba_8888_sse2+0x104>
DB 243,69,15,111,4,128 ; movdqu (%r8,%rax,4),%xmm8
DB 72,133,255 ; test %rdi,%rdi
- DB 102,15,111,53,217,12,1,0 ; movdqa 0x10cd9(%rip),%xmm6 # 2cbf0 <_sk_overlay_sse2_8bit+0xf7b>
+ DB 102,15,111,53,25,12,1,0 ; movdqa 0x10c19(%rip),%xmm6 # 2cb30 <_sk_overlay_sse2_8bit+0xf80>
DB 102,65,15,111,224 ; movdqa %xmm8,%xmm4
DB 102,15,219,230 ; pand %xmm6,%xmm4
DB 15,91,228 ; cvtdq2ps %xmm4,%xmm4
@@ -26372,9 +26372,9 @@ _sk_srcover_rgba_8888_sse2 LABEL PROC
DB 15,91,247 ; cvtdq2ps %xmm7,%xmm6
DB 102,65,15,114,208,24 ; psrld $0x18,%xmm8
DB 65,15,91,248 ; cvtdq2ps %xmm8,%xmm7
- DB 68,15,40,5,233,11,1,0 ; movaps 0x10be9(%rip),%xmm8 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 68,15,40,5,41,11,1,0 ; movaps 0x10b29(%rip),%xmm8 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 68,15,92,195 ; subps %xmm3,%xmm8
- DB 68,15,40,37,189,12,1,0 ; movaps 0x10cbd(%rip),%xmm12 # 2cc20 <_sk_overlay_sse2_8bit+0xfab>
+ DB 68,15,40,37,253,11,1,0 ; movaps 0x10bfd(%rip),%xmm12 # 2cb60 <_sk_overlay_sse2_8bit+0xfb0>
DB 65,15,89,196 ; mulps %xmm12,%xmm0
DB 69,15,40,200 ; movaps %xmm8,%xmm9
DB 68,15,89,204 ; mulps %xmm4,%xmm9
@@ -26450,7 +26450,7 @@ _sk_clamp_0_sse2 LABEL PROC
PUBLIC _sk_clamp_1_sse2
_sk_clamp_1_sse2 LABEL PROC
- DB 68,15,40,5,185,10,1,0 ; movaps 0x10ab9(%rip),%xmm8 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 68,15,40,5,249,9,1,0 ; movaps 0x109f9(%rip),%xmm8 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 65,15,93,192 ; minps %xmm8,%xmm0
DB 65,15,93,200 ; minps %xmm8,%xmm1
DB 65,15,93,208 ; minps %xmm8,%xmm2
@@ -26460,7 +26460,7 @@ _sk_clamp_1_sse2 LABEL PROC
PUBLIC _sk_clamp_a_sse2
_sk_clamp_a_sse2 LABEL PROC
- DB 15,93,29,158,10,1,0 ; minps 0x10a9e(%rip),%xmm3 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 15,93,29,222,9,1,0 ; minps 0x109de(%rip),%xmm3 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 15,93,195 ; minps %xmm3,%xmm0
DB 15,93,203 ; minps %xmm3,%xmm1
DB 15,93,211 ; minps %xmm3,%xmm2
@@ -26469,7 +26469,7 @@ _sk_clamp_a_sse2 LABEL PROC
PUBLIC _sk_clamp_a_dst_sse2
_sk_clamp_a_dst_sse2 LABEL PROC
- DB 15,93,61,138,10,1,0 ; minps 0x10a8a(%rip),%xmm7 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 15,93,61,202,9,1,0 ; minps 0x109ca(%rip),%xmm7 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 15,93,231 ; minps %xmm7,%xmm4
DB 15,93,239 ; minps %xmm7,%xmm5
DB 15,93,247 ; minps %xmm7,%xmm6
@@ -26498,7 +26498,7 @@ _sk_swap_rb_sse2 LABEL PROC
PUBLIC _sk_invert_sse2
_sk_invert_sse2 LABEL PROC
- DB 68,15,40,5,70,10,1,0 ; movaps 0x10a46(%rip),%xmm8 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 68,15,40,5,134,9,1,0 ; movaps 0x10986(%rip),%xmm8 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 69,15,40,200 ; movaps %xmm8,%xmm9
DB 68,15,92,200 ; subps %xmm0,%xmm9
DB 69,15,40,208 ; movaps %xmm8,%xmm10
@@ -26550,7 +26550,7 @@ _sk_premul_dst_sse2 LABEL PROC
PUBLIC _sk_unpremul_sse2
_sk_unpremul_sse2 LABEL PROC
DB 69,15,87,192 ; xorps %xmm8,%xmm8
- DB 68,15,40,13,208,9,1,0 ; movaps 0x109d0(%rip),%xmm9 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 68,15,40,13,16,9,1,0 ; movaps 0x10910(%rip),%xmm9 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 68,15,94,203 ; divps %xmm3,%xmm9
DB 68,15,194,195,4 ; cmpneqps %xmm3,%xmm8
DB 69,15,84,193 ; andps %xmm9,%xmm8
@@ -26562,20 +26562,20 @@ _sk_unpremul_sse2 LABEL PROC
PUBLIC _sk_from_srgb_sse2
_sk_from_srgb_sse2 LABEL PROC
- DB 68,15,40,5,155,10,1,0 ; movaps 0x10a9b(%rip),%xmm8 # 2cc30 <_sk_overlay_sse2_8bit+0xfbb>
+ DB 68,15,40,5,219,9,1,0 ; movaps 0x109db(%rip),%xmm8 # 2cb70 <_sk_overlay_sse2_8bit+0xfc0>
DB 68,15,40,232 ; movaps %xmm0,%xmm13
DB 69,15,89,232 ; mulps %xmm8,%xmm13
DB 68,15,40,216 ; movaps %xmm0,%xmm11
DB 69,15,89,219 ; mulps %xmm11,%xmm11
- DB 68,15,40,13,19,10,1,0 ; movaps 0x10a13(%rip),%xmm9 # 2cbc0 <_sk_overlay_sse2_8bit+0xf4b>
+ DB 68,15,40,13,83,9,1,0 ; movaps 0x10953(%rip),%xmm9 # 2cb00 <_sk_overlay_sse2_8bit+0xf50>
DB 68,15,40,240 ; movaps %xmm0,%xmm14
DB 69,15,89,241 ; mulps %xmm9,%xmm14
- DB 68,15,40,21,131,10,1,0 ; movaps 0x10a83(%rip),%xmm10 # 2cc40 <_sk_overlay_sse2_8bit+0xfcb>
+ DB 68,15,40,21,195,9,1,0 ; movaps 0x109c3(%rip),%xmm10 # 2cb80 <_sk_overlay_sse2_8bit+0xfd0>
DB 69,15,88,242 ; addps %xmm10,%xmm14
DB 69,15,89,243 ; mulps %xmm11,%xmm14
- DB 68,15,40,29,131,10,1,0 ; movaps 0x10a83(%rip),%xmm11 # 2cc50 <_sk_overlay_sse2_8bit+0xfdb>
+ DB 68,15,40,29,195,9,1,0 ; movaps 0x109c3(%rip),%xmm11 # 2cb90 <_sk_overlay_sse2_8bit+0xfe0>
DB 69,15,88,243 ; addps %xmm11,%xmm14
- DB 68,15,40,37,135,10,1,0 ; movaps 0x10a87(%rip),%xmm12 # 2cc60 <_sk_overlay_sse2_8bit+0xfeb>
+ DB 68,15,40,37,199,9,1,0 ; movaps 0x109c7(%rip),%xmm12 # 2cba0 <_sk_overlay_sse2_8bit+0xff0>
DB 65,15,194,196,1 ; cmpltps %xmm12,%xmm0
DB 68,15,84,232 ; andps %xmm0,%xmm13
DB 65,15,85,198 ; andnps %xmm14,%xmm0
@@ -26609,20 +26609,20 @@ _sk_from_srgb_sse2 LABEL PROC
PUBLIC _sk_from_srgb_dst_sse2
_sk_from_srgb_dst_sse2 LABEL PROC
- DB 68,15,40,5,216,9,1,0 ; movaps 0x109d8(%rip),%xmm8 # 2cc30 <_sk_overlay_sse2_8bit+0xfbb>
+ DB 68,15,40,5,24,9,1,0 ; movaps 0x10918(%rip),%xmm8 # 2cb70 <_sk_overlay_sse2_8bit+0xfc0>
DB 68,15,40,236 ; movaps %xmm4,%xmm13
DB 69,15,89,232 ; mulps %xmm8,%xmm13
DB 68,15,40,220 ; movaps %xmm4,%xmm11
DB 69,15,89,219 ; mulps %xmm11,%xmm11
- DB 68,15,40,13,80,9,1,0 ; movaps 0x10950(%rip),%xmm9 # 2cbc0 <_sk_overlay_sse2_8bit+0xf4b>
+ DB 68,15,40,13,144,8,1,0 ; movaps 0x10890(%rip),%xmm9 # 2cb00 <_sk_overlay_sse2_8bit+0xf50>
DB 68,15,40,244 ; movaps %xmm4,%xmm14
DB 69,15,89,241 ; mulps %xmm9,%xmm14
- DB 68,15,40,21,192,9,1,0 ; movaps 0x109c0(%rip),%xmm10 # 2cc40 <_sk_overlay_sse2_8bit+0xfcb>
+ DB 68,15,40,21,0,9,1,0 ; movaps 0x10900(%rip),%xmm10 # 2cb80 <_sk_overlay_sse2_8bit+0xfd0>
DB 69,15,88,242 ; addps %xmm10,%xmm14
DB 69,15,89,243 ; mulps %xmm11,%xmm14
- DB 68,15,40,29,192,9,1,0 ; movaps 0x109c0(%rip),%xmm11 # 2cc50 <_sk_overlay_sse2_8bit+0xfdb>
+ DB 68,15,40,29,0,9,1,0 ; movaps 0x10900(%rip),%xmm11 # 2cb90 <_sk_overlay_sse2_8bit+0xfe0>
DB 69,15,88,243 ; addps %xmm11,%xmm14
- DB 68,15,40,37,196,9,1,0 ; movaps 0x109c4(%rip),%xmm12 # 2cc60 <_sk_overlay_sse2_8bit+0xfeb>
+ DB 68,15,40,37,4,9,1,0 ; movaps 0x10904(%rip),%xmm12 # 2cba0 <_sk_overlay_sse2_8bit+0xff0>
DB 65,15,194,228,1 ; cmpltps %xmm12,%xmm4
DB 68,15,84,236 ; andps %xmm4,%xmm13
DB 65,15,85,230 ; andnps %xmm14,%xmm4
@@ -26657,22 +26657,22 @@ _sk_from_srgb_dst_sse2 LABEL PROC
PUBLIC _sk_to_srgb_sse2
_sk_to_srgb_sse2 LABEL PROC
DB 68,15,82,232 ; rsqrtps %xmm0,%xmm13
- DB 68,15,40,5,81,9,1,0 ; movaps 0x10951(%rip),%xmm8 # 2cc70 <_sk_overlay_sse2_8bit+0xffb>
+ DB 68,15,40,5,145,8,1,0 ; movaps 0x10891(%rip),%xmm8 # 2cbb0 <_sk_overlay_sse2_8bit+0x1000>
DB 68,15,40,240 ; movaps %xmm0,%xmm14
DB 69,15,89,240 ; mulps %xmm8,%xmm14
- DB 68,15,40,13,81,9,1,0 ; movaps 0x10951(%rip),%xmm9 # 2cc80 <_sk_overlay_sse2_8bit+0x100b>
+ DB 68,15,40,13,145,8,1,0 ; movaps 0x10891(%rip),%xmm9 # 2cbc0 <_sk_overlay_sse2_8bit+0x1010>
DB 69,15,40,253 ; movaps %xmm13,%xmm15
DB 69,15,89,249 ; mulps %xmm9,%xmm15
- DB 68,15,40,21,81,9,1,0 ; movaps 0x10951(%rip),%xmm10 # 2cc90 <_sk_overlay_sse2_8bit+0x101b>
+ DB 68,15,40,21,145,8,1,0 ; movaps 0x10891(%rip),%xmm10 # 2cbd0 <_sk_overlay_sse2_8bit+0x1020>
DB 69,15,88,250 ; addps %xmm10,%xmm15
DB 69,15,89,253 ; mulps %xmm13,%xmm15
- DB 68,15,40,29,81,9,1,0 ; movaps 0x10951(%rip),%xmm11 # 2cca0 <_sk_overlay_sse2_8bit+0x102b>
+ DB 68,15,40,29,145,8,1,0 ; movaps 0x10891(%rip),%xmm11 # 2cbe0 <_sk_overlay_sse2_8bit+0x1030>
DB 69,15,88,251 ; addps %xmm11,%xmm15
- DB 68,15,40,37,85,9,1,0 ; movaps 0x10955(%rip),%xmm12 # 2ccb0 <_sk_overlay_sse2_8bit+0x103b>
+ DB 68,15,40,37,149,8,1,0 ; movaps 0x10895(%rip),%xmm12 # 2cbf0 <_sk_overlay_sse2_8bit+0x1040>
DB 69,15,88,236 ; addps %xmm12,%xmm13
DB 69,15,83,237 ; rcpps %xmm13,%xmm13
DB 69,15,89,239 ; mulps %xmm15,%xmm13
- DB 68,15,40,61,81,9,1,0 ; movaps 0x10951(%rip),%xmm15 # 2ccc0 <_sk_overlay_sse2_8bit+0x104b>
+ DB 68,15,40,61,145,8,1,0 ; movaps 0x10891(%rip),%xmm15 # 2cc00 <_sk_overlay_sse2_8bit+0x1050>
DB 65,15,194,199,1 ; cmpltps %xmm15,%xmm0
DB 68,15,84,240 ; andps %xmm0,%xmm14
DB 65,15,85,197 ; andnps %xmm13,%xmm0
@@ -26722,7 +26722,7 @@ _sk_rgb_to_hsl_sse2 LABEL PROC
DB 68,15,93,216 ; minps %xmm0,%xmm11
DB 65,15,40,202 ; movaps %xmm10,%xmm1
DB 65,15,92,203 ; subps %xmm11,%xmm1
- DB 68,15,40,45,20,7,1,0 ; movaps 0x10714(%rip),%xmm13 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 68,15,40,45,84,6,1,0 ; movaps 0x10654(%rip),%xmm13 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 68,15,94,233 ; divps %xmm1,%xmm13
DB 65,15,40,194 ; movaps %xmm10,%xmm0
DB 65,15,194,192,0 ; cmpeqps %xmm8,%xmm0
@@ -26731,30 +26731,30 @@ _sk_rgb_to_hsl_sse2 LABEL PROC
DB 69,15,89,229 ; mulps %xmm13,%xmm12
DB 69,15,40,241 ; movaps %xmm9,%xmm14
DB 68,15,194,242,1 ; cmpltps %xmm2,%xmm14
- DB 68,15,84,53,122,8,1,0 ; andps 0x1087a(%rip),%xmm14 # 2ccd0 <_sk_overlay_sse2_8bit+0x105b>
+ DB 68,15,84,53,186,7,1,0 ; andps 0x107ba(%rip),%xmm14 # 2cc10 <_sk_overlay_sse2_8bit+0x1060>
DB 69,15,88,244 ; addps %xmm12,%xmm14
DB 69,15,40,250 ; movaps %xmm10,%xmm15
DB 69,15,194,249,0 ; cmpeqps %xmm9,%xmm15
DB 65,15,92,208 ; subps %xmm8,%xmm2
DB 65,15,89,213 ; mulps %xmm13,%xmm2
- DB 68,15,40,37,109,8,1,0 ; movaps 0x1086d(%rip),%xmm12 # 2cce0 <_sk_overlay_sse2_8bit+0x106b>
+ DB 68,15,40,37,173,7,1,0 ; movaps 0x107ad(%rip),%xmm12 # 2cc20 <_sk_overlay_sse2_8bit+0x1070>
DB 65,15,88,212 ; addps %xmm12,%xmm2
DB 69,15,92,193 ; subps %xmm9,%xmm8
DB 69,15,89,197 ; mulps %xmm13,%xmm8
- DB 68,15,88,5,105,8,1,0 ; addps 0x10869(%rip),%xmm8 # 2ccf0 <_sk_overlay_sse2_8bit+0x107b>
+ DB 68,15,88,5,169,7,1,0 ; addps 0x107a9(%rip),%xmm8 # 2cc30 <_sk_overlay_sse2_8bit+0x1080>
DB 65,15,84,215 ; andps %xmm15,%xmm2
DB 69,15,85,248 ; andnps %xmm8,%xmm15
DB 68,15,86,250 ; orps %xmm2,%xmm15
DB 68,15,84,240 ; andps %xmm0,%xmm14
DB 65,15,85,199 ; andnps %xmm15,%xmm0
DB 65,15,86,198 ; orps %xmm14,%xmm0
- DB 15,89,5,90,8,1,0 ; mulps 0x1085a(%rip),%xmm0 # 2cd00 <_sk_overlay_sse2_8bit+0x108b>
+ DB 15,89,5,154,7,1,0 ; mulps 0x1079a(%rip),%xmm0 # 2cc40 <_sk_overlay_sse2_8bit+0x1090>
DB 69,15,40,194 ; movaps %xmm10,%xmm8
DB 69,15,194,195,4 ; cmpneqps %xmm11,%xmm8
DB 65,15,84,192 ; andps %xmm8,%xmm0
DB 69,15,92,226 ; subps %xmm10,%xmm12
DB 69,15,88,211 ; addps %xmm11,%xmm10
- DB 68,15,40,13,93,6,1,0 ; movaps 0x1065d(%rip),%xmm9 # 2cb20 <_sk_overlay_sse2_8bit+0xeab>
+ DB 68,15,40,13,157,5,1,0 ; movaps 0x1059d(%rip),%xmm9 # 2ca60 <_sk_overlay_sse2_8bit+0xeb0>
DB 65,15,40,210 ; movaps %xmm10,%xmm2
DB 65,15,89,209 ; mulps %xmm9,%xmm2
DB 68,15,194,202,1 ; cmpltps %xmm2,%xmm9
@@ -26777,7 +26777,7 @@ _sk_hsl_to_rgb_sse2 LABEL PROC
DB 15,41,92,36,32 ; movaps %xmm3,0x20(%rsp)
DB 68,15,40,218 ; movaps %xmm2,%xmm11
DB 15,40,240 ; movaps %xmm0,%xmm6
- DB 68,15,40,13,8,6,1,0 ; movaps 0x10608(%rip),%xmm9 # 2cb20 <_sk_overlay_sse2_8bit+0xeab>
+ DB 68,15,40,13,72,5,1,0 ; movaps 0x10548(%rip),%xmm9 # 2ca60 <_sk_overlay_sse2_8bit+0xeb0>
DB 69,15,40,209 ; movaps %xmm9,%xmm10
DB 69,15,194,211,2 ; cmpleps %xmm11,%xmm10
DB 15,40,193 ; movaps %xmm1,%xmm0
@@ -26794,28 +26794,28 @@ _sk_hsl_to_rgb_sse2 LABEL PROC
DB 69,15,88,211 ; addps %xmm11,%xmm10
DB 69,15,88,219 ; addps %xmm11,%xmm11
DB 69,15,92,218 ; subps %xmm10,%xmm11
- DB 15,40,5,178,7,1,0 ; movaps 0x107b2(%rip),%xmm0 # 2cd10 <_sk_overlay_sse2_8bit+0x109b>
+ DB 15,40,5,242,6,1,0 ; movaps 0x106f2(%rip),%xmm0 # 2cc50 <_sk_overlay_sse2_8bit+0x10a0>
DB 15,88,198 ; addps %xmm6,%xmm0
DB 243,15,91,200 ; cvttps2dq %xmm0,%xmm1
DB 15,91,201 ; cvtdq2ps %xmm1,%xmm1
DB 15,40,216 ; movaps %xmm0,%xmm3
DB 15,194,217,1 ; cmpltps %xmm1,%xmm3
- DB 15,84,29,202,5,1,0 ; andps 0x105ca(%rip),%xmm3 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 15,84,29,10,5,1,0 ; andps 0x1050a(%rip),%xmm3 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 15,92,203 ; subps %xmm3,%xmm1
DB 15,92,193 ; subps %xmm1,%xmm0
- DB 68,15,40,45,156,7,1,0 ; movaps 0x1079c(%rip),%xmm13 # 2cd20 <_sk_overlay_sse2_8bit+0x10ab>
+ DB 68,15,40,45,220,6,1,0 ; movaps 0x106dc(%rip),%xmm13 # 2cc60 <_sk_overlay_sse2_8bit+0x10b0>
DB 69,15,40,197 ; movaps %xmm13,%xmm8
DB 68,15,194,192,2 ; cmpleps %xmm0,%xmm8
DB 69,15,40,242 ; movaps %xmm10,%xmm14
DB 69,15,92,243 ; subps %xmm11,%xmm14
DB 65,15,40,217 ; movaps %xmm9,%xmm3
DB 15,194,216,2 ; cmpleps %xmm0,%xmm3
- DB 15,40,21,92,7,1,0 ; movaps 0x1075c(%rip),%xmm2 # 2cd00 <_sk_overlay_sse2_8bit+0x108b>
+ DB 15,40,21,156,6,1,0 ; movaps 0x1069c(%rip),%xmm2 # 2cc40 <_sk_overlay_sse2_8bit+0x1090>
DB 68,15,40,250 ; movaps %xmm2,%xmm15
DB 68,15,194,248,2 ; cmpleps %xmm0,%xmm15
- DB 15,40,13,28,7,1,0 ; movaps 0x1071c(%rip),%xmm1 # 2ccd0 <_sk_overlay_sse2_8bit+0x105b>
+ DB 15,40,13,92,6,1,0 ; movaps 0x1065c(%rip),%xmm1 # 2cc10 <_sk_overlay_sse2_8bit+0x1060>
DB 15,89,193 ; mulps %xmm1,%xmm0
- DB 15,40,45,50,7,1,0 ; movaps 0x10732(%rip),%xmm5 # 2ccf0 <_sk_overlay_sse2_8bit+0x107b>
+ DB 15,40,45,114,6,1,0 ; movaps 0x10672(%rip),%xmm5 # 2cc30 <_sk_overlay_sse2_8bit+0x1080>
DB 15,40,229 ; movaps %xmm5,%xmm4
DB 15,92,224 ; subps %xmm0,%xmm4
DB 65,15,89,230 ; mulps %xmm14,%xmm4
@@ -26838,7 +26838,7 @@ _sk_hsl_to_rgb_sse2 LABEL PROC
DB 15,91,192 ; cvtdq2ps %xmm0,%xmm0
DB 15,40,222 ; movaps %xmm6,%xmm3
DB 15,194,216,1 ; cmpltps %xmm0,%xmm3
- DB 15,84,29,39,5,1,0 ; andps 0x10527(%rip),%xmm3 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 15,84,29,103,4,1,0 ; andps 0x10467(%rip),%xmm3 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 15,92,195 ; subps %xmm3,%xmm0
DB 68,15,40,230 ; movaps %xmm6,%xmm12
DB 68,15,92,224 ; subps %xmm0,%xmm12
@@ -26868,12 +26868,12 @@ _sk_hsl_to_rgb_sse2 LABEL PROC
DB 15,40,60,36 ; movaps (%rsp),%xmm7
DB 15,40,231 ; movaps %xmm7,%xmm4
DB 15,85,227 ; andnps %xmm3,%xmm4
- DB 15,88,53,160,6,1,0 ; addps 0x106a0(%rip),%xmm6 # 2cd30 <_sk_overlay_sse2_8bit+0x10bb>
+ DB 15,88,53,224,5,1,0 ; addps 0x105e0(%rip),%xmm6 # 2cc70 <_sk_overlay_sse2_8bit+0x10c0>
DB 243,15,91,198 ; cvttps2dq %xmm6,%xmm0
DB 15,91,192 ; cvtdq2ps %xmm0,%xmm0
DB 15,40,222 ; movaps %xmm6,%xmm3
DB 15,194,216,1 ; cmpltps %xmm0,%xmm3
- DB 15,84,29,155,4,1,0 ; andps 0x1049b(%rip),%xmm3 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 15,84,29,219,3,1,0 ; andps 0x103db(%rip),%xmm3 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 15,92,195 ; subps %xmm3,%xmm0
DB 15,92,240 ; subps %xmm0,%xmm6
DB 15,89,206 ; mulps %xmm6,%xmm1
@@ -26938,9 +26938,9 @@ _sk_scale_u8_sse2 LABEL PROC
DB 102,71,15,110,4,16 ; movd (%r8,%r10,1),%xmm8
DB 102,68,15,96,192 ; punpcklbw %xmm0,%xmm8
DB 102,68,15,97,192 ; punpcklwd %xmm0,%xmm8
- DB 102,68,15,219,5,106,4,1,0 ; pand 0x1046a(%rip),%xmm8 # 2cbf0 <_sk_overlay_sse2_8bit+0xf7b>
+ DB 102,68,15,219,5,170,3,1,0 ; pand 0x103aa(%rip),%xmm8 # 2cb30 <_sk_overlay_sse2_8bit+0xf80>
DB 69,15,91,192 ; cvtdq2ps %xmm8,%xmm8
- DB 68,15,89,5,174,5,1,0 ; mulps 0x105ae(%rip),%xmm8 # 2cd40 <_sk_overlay_sse2_8bit+0x10cb>
+ DB 68,15,89,5,238,4,1,0 ; mulps 0x104ee(%rip),%xmm8 # 2cc80 <_sk_overlay_sse2_8bit+0x10d0>
DB 65,15,89,192 ; mulps %xmm8,%xmm0
DB 65,15,89,200 ; mulps %xmm8,%xmm1
DB 65,15,89,208 ; mulps %xmm8,%xmm2
@@ -26983,17 +26983,17 @@ _sk_scale_565_sse2 LABEL PROC
DB 15,133,173,0,0,0 ; jne 1c8cf <_sk_scale_565_sse2+0xcc>
DB 243,71,15,126,20,80 ; movq (%r8,%r10,2),%xmm10
DB 102,68,15,97,208 ; punpcklwd %xmm0,%xmm10
- DB 102,68,15,111,5,26,5,1,0 ; movdqa 0x1051a(%rip),%xmm8 # 2cd50 <_sk_overlay_sse2_8bit+0x10db>
+ DB 102,68,15,111,5,90,4,1,0 ; movdqa 0x1045a(%rip),%xmm8 # 2cc90 <_sk_overlay_sse2_8bit+0x10e0>
DB 102,69,15,219,194 ; pand %xmm10,%xmm8
DB 69,15,91,192 ; cvtdq2ps %xmm8,%xmm8
- DB 68,15,89,5,25,5,1,0 ; mulps 0x10519(%rip),%xmm8 # 2cd60 <_sk_overlay_sse2_8bit+0x10eb>
- DB 102,68,15,111,13,32,5,1,0 ; movdqa 0x10520(%rip),%xmm9 # 2cd70 <_sk_overlay_sse2_8bit+0x10fb>
+ DB 68,15,89,5,89,4,1,0 ; mulps 0x10459(%rip),%xmm8 # 2cca0 <_sk_overlay_sse2_8bit+0x10f0>
+ DB 102,68,15,111,13,96,4,1,0 ; movdqa 0x10460(%rip),%xmm9 # 2ccb0 <_sk_overlay_sse2_8bit+0x1100>
DB 102,69,15,219,202 ; pand %xmm10,%xmm9
DB 69,15,91,201 ; cvtdq2ps %xmm9,%xmm9
- DB 68,15,89,13,31,5,1,0 ; mulps 0x1051f(%rip),%xmm9 # 2cd80 <_sk_overlay_sse2_8bit+0x110b>
- DB 102,68,15,219,21,38,5,1,0 ; pand 0x10526(%rip),%xmm10 # 2cd90 <_sk_overlay_sse2_8bit+0x111b>
+ DB 68,15,89,13,95,4,1,0 ; mulps 0x1045f(%rip),%xmm9 # 2ccc0 <_sk_overlay_sse2_8bit+0x1110>
+ DB 102,68,15,219,21,102,4,1,0 ; pand 0x10466(%rip),%xmm10 # 2ccd0 <_sk_overlay_sse2_8bit+0x1120>
DB 69,15,91,210 ; cvtdq2ps %xmm10,%xmm10
- DB 68,15,89,21,42,5,1,0 ; mulps 0x1052a(%rip),%xmm10 # 2cda0 <_sk_overlay_sse2_8bit+0x112b>
+ DB 68,15,89,21,106,4,1,0 ; mulps 0x1046a(%rip),%xmm10 # 2cce0 <_sk_overlay_sse2_8bit+0x1130>
DB 68,15,40,219 ; movaps %xmm3,%xmm11
DB 68,15,194,223,1 ; cmpltps %xmm7,%xmm11
DB 69,15,40,225 ; movaps %xmm9,%xmm12
@@ -27070,9 +27070,9 @@ _sk_lerp_u8_sse2 LABEL PROC
DB 102,71,15,110,4,16 ; movd (%r8,%r10,1),%xmm8
DB 102,68,15,96,192 ; punpcklbw %xmm0,%xmm8
DB 102,68,15,97,192 ; punpcklwd %xmm0,%xmm8
- DB 102,68,15,219,5,97,2,1,0 ; pand 0x10261(%rip),%xmm8 # 2cbf0 <_sk_overlay_sse2_8bit+0xf7b>
+ DB 102,68,15,219,5,161,1,1,0 ; pand 0x101a1(%rip),%xmm8 # 2cb30 <_sk_overlay_sse2_8bit+0xf80>
DB 69,15,91,192 ; cvtdq2ps %xmm8,%xmm8
- DB 68,15,89,5,165,3,1,0 ; mulps 0x103a5(%rip),%xmm8 # 2cd40 <_sk_overlay_sse2_8bit+0x10cb>
+ DB 68,15,89,5,229,2,1,0 ; mulps 0x102e5(%rip),%xmm8 # 2cc80 <_sk_overlay_sse2_8bit+0x10d0>
DB 15,92,196 ; subps %xmm4,%xmm0
DB 65,15,89,192 ; mulps %xmm8,%xmm0
DB 15,88,196 ; addps %xmm4,%xmm0
@@ -27122,17 +27122,17 @@ _sk_lerp_565_sse2 LABEL PROC
DB 15,133,173,0,0,0 ; jne 1caef <_sk_lerp_565_sse2+0xcc>
DB 243,71,15,126,4,80 ; movq (%r8,%r10,2),%xmm8
DB 102,68,15,97,192 ; punpcklwd %xmm0,%xmm8
- DB 102,68,15,111,13,250,2,1,0 ; movdqa 0x102fa(%rip),%xmm9 # 2cd50 <_sk_overlay_sse2_8bit+0x10db>
+ DB 102,68,15,111,13,58,2,1,0 ; movdqa 0x1023a(%rip),%xmm9 # 2cc90 <_sk_overlay_sse2_8bit+0x10e0>
DB 102,69,15,219,200 ; pand %xmm8,%xmm9
DB 69,15,91,201 ; cvtdq2ps %xmm9,%xmm9
- DB 68,15,89,13,249,2,1,0 ; mulps 0x102f9(%rip),%xmm9 # 2cd60 <_sk_overlay_sse2_8bit+0x10eb>
- DB 102,68,15,111,21,0,3,1,0 ; movdqa 0x10300(%rip),%xmm10 # 2cd70 <_sk_overlay_sse2_8bit+0x10fb>
+ DB 68,15,89,13,57,2,1,0 ; mulps 0x10239(%rip),%xmm9 # 2cca0 <_sk_overlay_sse2_8bit+0x10f0>
+ DB 102,68,15,111,21,64,2,1,0 ; movdqa 0x10240(%rip),%xmm10 # 2ccb0 <_sk_overlay_sse2_8bit+0x1100>
DB 102,69,15,219,208 ; pand %xmm8,%xmm10
DB 69,15,91,218 ; cvtdq2ps %xmm10,%xmm11
- DB 68,15,89,29,255,2,1,0 ; mulps 0x102ff(%rip),%xmm11 # 2cd80 <_sk_overlay_sse2_8bit+0x110b>
- DB 102,68,15,219,5,6,3,1,0 ; pand 0x10306(%rip),%xmm8 # 2cd90 <_sk_overlay_sse2_8bit+0x111b>
+ DB 68,15,89,29,63,2,1,0 ; mulps 0x1023f(%rip),%xmm11 # 2ccc0 <_sk_overlay_sse2_8bit+0x1110>
+ DB 102,68,15,219,5,70,2,1,0 ; pand 0x10246(%rip),%xmm8 # 2ccd0 <_sk_overlay_sse2_8bit+0x1120>
DB 69,15,91,192 ; cvtdq2ps %xmm8,%xmm8
- DB 68,15,89,5,10,3,1,0 ; mulps 0x1030a(%rip),%xmm8 # 2cda0 <_sk_overlay_sse2_8bit+0x112b>
+ DB 68,15,89,5,74,2,1,0 ; mulps 0x1024a(%rip),%xmm8 # 2cce0 <_sk_overlay_sse2_8bit+0x1130>
DB 68,15,40,211 ; movaps %xmm3,%xmm10
DB 68,15,194,215,1 ; cmpltps %xmm7,%xmm10
DB 69,15,40,227 ; movaps %xmm11,%xmm12
@@ -27187,7 +27187,7 @@ _sk_load_tables_sse2 LABEL PROC
DB 243,69,15,111,12,144 ; movdqu (%r8,%rdx,4),%xmm9
DB 65,86 ; push %r14
DB 83 ; push %rbx
- DB 102,68,15,111,5,138,0,1,0 ; movdqa 0x1008a(%rip),%xmm8 # 2cbf0 <_sk_overlay_sse2_8bit+0xf7b>
+ DB 102,68,15,111,5,202,255,0,0 ; movdqa 0xffca(%rip),%xmm8 # 2cb30 <_sk_overlay_sse2_8bit+0xf80>
DB 102,65,15,111,193 ; movdqa %xmm9,%xmm0
DB 102,65,15,219,192 ; pand %xmm8,%xmm0
DB 102,15,112,200,78 ; pshufd $0x4e,%xmm0,%xmm1
@@ -27243,7 +27243,7 @@ _sk_load_tables_sse2 LABEL PROC
DB 65,15,20,208 ; unpcklps %xmm8,%xmm2
DB 102,65,15,114,209,24 ; psrld $0x18,%xmm9
DB 65,15,91,217 ; cvtdq2ps %xmm9,%xmm3
- DB 15,89,29,211,0,1,0 ; mulps 0x100d3(%rip),%xmm3 # 2cd40 <_sk_overlay_sse2_8bit+0x10cb>
+ DB 15,89,29,19,0,1,0 ; mulps 0x10013(%rip),%xmm3 # 2cc80 <_sk_overlay_sse2_8bit+0x10d0>
DB 72,173 ; lods %ds:(%rsi),%rax
DB 91 ; pop %rbx
DB 65,94 ; pop %r14
@@ -27281,7 +27281,7 @@ _sk_load_tables_u16_be_sse2 LABEL PROC
DB 102,65,15,111,201 ; movdqa %xmm9,%xmm1
DB 102,15,97,200 ; punpcklwd %xmm0,%xmm1
DB 102,68,15,105,200 ; punpckhwd %xmm0,%xmm9
- DB 102,68,15,111,21,172,0,1,0 ; movdqa 0x100ac(%rip),%xmm10 # 2cdb0 <_sk_overlay_sse2_8bit+0x113b>
+ DB 102,68,15,111,21,236,255,0,0 ; movdqa 0xffec(%rip),%xmm10 # 2ccf0 <_sk_overlay_sse2_8bit+0x1140>
DB 102,15,111,193 ; movdqa %xmm1,%xmm0
DB 102,65,15,219,194 ; pand %xmm10,%xmm0
DB 102,69,15,239,192 ; pxor %xmm8,%xmm8
@@ -27343,7 +27343,7 @@ _sk_load_tables_u16_be_sse2 LABEL PROC
DB 102,65,15,235,217 ; por %xmm9,%xmm3
DB 102,65,15,97,216 ; punpcklwd %xmm8,%xmm3
DB 15,91,219 ; cvtdq2ps %xmm3,%xmm3
- DB 15,89,29,167,255,0,0 ; mulps 0xffa7(%rip),%xmm3 # 2cdd0 <_sk_overlay_sse2_8bit+0x115b>
+ DB 15,89,29,231,254,0,0 ; mulps 0xfee7(%rip),%xmm3 # 2cd10 <_sk_overlay_sse2_8bit+0x1160>
DB 72,173 ; lods %ds:(%rsi),%rax
DB 91 ; pop %rbx
DB 65,94 ; pop %r14
@@ -27382,7 +27382,7 @@ _sk_load_tables_rgb_u16_be_sse2 LABEL PROC
DB 102,68,15,97,208 ; punpcklwd %xmm0,%xmm10
DB 102,65,15,111,195 ; movdqa %xmm11,%xmm0
DB 102,65,15,97,194 ; punpcklwd %xmm10,%xmm0
- DB 102,68,15,111,5,234,254,0,0 ; movdqa 0xfeea(%rip),%xmm8 # 2cdb0 <_sk_overlay_sse2_8bit+0x113b>
+ DB 102,68,15,111,5,42,254,0,0 ; movdqa 0xfe2a(%rip),%xmm8 # 2ccf0 <_sk_overlay_sse2_8bit+0x1140>
DB 102,15,112,200,78 ; pshufd $0x4e,%xmm0,%xmm1
DB 102,65,15,219,192 ; pand %xmm8,%xmm0
DB 102,69,15,239,201 ; pxor %xmm9,%xmm9
@@ -27438,7 +27438,7 @@ _sk_load_tables_rgb_u16_be_sse2 LABEL PROC
DB 15,20,211 ; unpcklps %xmm3,%xmm2
DB 65,15,20,208 ; unpcklps %xmm8,%xmm2
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 15,40,29,117,251,0,0 ; movaps 0xfb75(%rip),%xmm3 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 15,40,29,181,250,0,0 ; movaps 0xfab5(%rip),%xmm3 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 91 ; pop %rbx
DB 65,94 ; pop %r14
DB 255,224 ; jmpq *%rax
@@ -27468,7 +27468,7 @@ _sk_byte_tables_sse2 LABEL PROC
DB 65,86 ; push %r14
DB 83 ; push %rbx
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 68,15,40,5,226,251,0,0 ; movaps 0xfbe2(%rip),%xmm8 # 2cc20 <_sk_overlay_sse2_8bit+0xfab>
+ DB 68,15,40,5,34,251,0,0 ; movaps 0xfb22(%rip),%xmm8 # 2cb60 <_sk_overlay_sse2_8bit+0xfb0>
DB 65,15,89,192 ; mulps %xmm8,%xmm0
DB 102,15,91,192 ; cvtps2dq %xmm0,%xmm0
DB 102,73,15,126,192 ; movq %xmm0,%r8
@@ -27496,7 +27496,7 @@ _sk_byte_tables_sse2 LABEL PROC
DB 102,65,15,96,193 ; punpcklbw %xmm9,%xmm0
DB 102,65,15,97,193 ; punpcklwd %xmm9,%xmm0
DB 15,91,192 ; cvtdq2ps %xmm0,%xmm0
- DB 68,15,40,21,140,252,0,0 ; movaps 0xfc8c(%rip),%xmm10 # 2cd40 <_sk_overlay_sse2_8bit+0x10cb>
+ DB 68,15,40,21,204,251,0,0 ; movaps 0xfbcc(%rip),%xmm10 # 2cc80 <_sk_overlay_sse2_8bit+0x10d0>
DB 65,15,89,194 ; mulps %xmm10,%xmm0
DB 65,15,89,200 ; mulps %xmm8,%xmm1
DB 102,15,91,201 ; cvtps2dq %xmm1,%xmm1
@@ -27613,7 +27613,7 @@ _sk_byte_tables_rgb_sse2 LABEL PROC
DB 102,65,15,96,193 ; punpcklbw %xmm9,%xmm0
DB 102,65,15,97,193 ; punpcklwd %xmm9,%xmm0
DB 15,91,192 ; cvtdq2ps %xmm0,%xmm0
- DB 68,15,40,21,200,250,0,0 ; movaps 0xfac8(%rip),%xmm10 # 2cd40 <_sk_overlay_sse2_8bit+0x10cb>
+ DB 68,15,40,21,8,250,0,0 ; movaps 0xfa08(%rip),%xmm10 # 2cc80 <_sk_overlay_sse2_8bit+0x10d0>
DB 65,15,89,194 ; mulps %xmm10,%xmm0
DB 65,15,89,200 ; mulps %xmm8,%xmm1
DB 102,15,91,201 ; cvtps2dq %xmm1,%xmm1
@@ -27801,15 +27801,15 @@ _sk_parametric_r_sse2 LABEL PROC
DB 69,15,88,209 ; addps %xmm9,%xmm10
DB 69,15,198,219,0 ; shufps $0x0,%xmm11,%xmm11
DB 69,15,91,202 ; cvtdq2ps %xmm10,%xmm9
- DB 68,15,89,13,166,248,0,0 ; mulps 0xf8a6(%rip),%xmm9 # 2cdf0 <_sk_overlay_sse2_8bit+0x117b>
- DB 68,15,84,21,174,248,0,0 ; andps 0xf8ae(%rip),%xmm10 # 2ce00 <_sk_overlay_sse2_8bit+0x118b>
- DB 68,15,86,21,198,245,0,0 ; orps 0xf5c6(%rip),%xmm10 # 2cb20 <_sk_overlay_sse2_8bit+0xeab>
- DB 68,15,88,13,174,248,0,0 ; addps 0xf8ae(%rip),%xmm9 # 2ce10 <_sk_overlay_sse2_8bit+0x119b>
- DB 68,15,40,37,182,248,0,0 ; movaps 0xf8b6(%rip),%xmm12 # 2ce20 <_sk_overlay_sse2_8bit+0x11ab>
+ DB 68,15,89,13,230,247,0,0 ; mulps 0xf7e6(%rip),%xmm9 # 2cd30 <_sk_overlay_sse2_8bit+0x1180>
+ DB 68,15,84,21,238,247,0,0 ; andps 0xf7ee(%rip),%xmm10 # 2cd40 <_sk_overlay_sse2_8bit+0x1190>
+ DB 68,15,86,21,6,245,0,0 ; orps 0xf506(%rip),%xmm10 # 2ca60 <_sk_overlay_sse2_8bit+0xeb0>
+ DB 68,15,88,13,238,247,0,0 ; addps 0xf7ee(%rip),%xmm9 # 2cd50 <_sk_overlay_sse2_8bit+0x11a0>
+ DB 68,15,40,37,246,247,0,0 ; movaps 0xf7f6(%rip),%xmm12 # 2cd60 <_sk_overlay_sse2_8bit+0x11b0>
DB 69,15,89,226 ; mulps %xmm10,%xmm12
DB 69,15,92,204 ; subps %xmm12,%xmm9
- DB 68,15,88,21,182,248,0,0 ; addps 0xf8b6(%rip),%xmm10 # 2ce30 <_sk_overlay_sse2_8bit+0x11bb>
- DB 68,15,40,37,190,248,0,0 ; movaps 0xf8be(%rip),%xmm12 # 2ce40 <_sk_overlay_sse2_8bit+0x11cb>
+ DB 68,15,88,21,246,247,0,0 ; addps 0xf7f6(%rip),%xmm10 # 2cd70 <_sk_overlay_sse2_8bit+0x11c0>
+ DB 68,15,40,37,254,247,0,0 ; movaps 0xf7fe(%rip),%xmm12 # 2cd80 <_sk_overlay_sse2_8bit+0x11d0>
DB 69,15,94,226 ; divps %xmm10,%xmm12
DB 69,15,92,204 ; subps %xmm12,%xmm9
DB 69,15,89,203 ; mulps %xmm11,%xmm9
@@ -27817,22 +27817,22 @@ _sk_parametric_r_sse2 LABEL PROC
DB 69,15,91,226 ; cvtdq2ps %xmm10,%xmm12
DB 69,15,40,233 ; movaps %xmm9,%xmm13
DB 69,15,194,236,1 ; cmpltps %xmm12,%xmm13
- DB 68,15,40,21,152,245,0,0 ; movaps 0xf598(%rip),%xmm10 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 68,15,40,21,216,244,0,0 ; movaps 0xf4d8(%rip),%xmm10 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 69,15,84,234 ; andps %xmm10,%xmm13
DB 69,15,87,219 ; xorps %xmm11,%xmm11
DB 69,15,92,229 ; subps %xmm13,%xmm12
DB 69,15,40,233 ; movaps %xmm9,%xmm13
DB 69,15,92,236 ; subps %xmm12,%xmm13
- DB 68,15,88,13,140,248,0,0 ; addps 0xf88c(%rip),%xmm9 # 2ce50 <_sk_overlay_sse2_8bit+0x11db>
- DB 68,15,40,37,148,248,0,0 ; movaps 0xf894(%rip),%xmm12 # 2ce60 <_sk_overlay_sse2_8bit+0x11eb>
+ DB 68,15,88,13,204,247,0,0 ; addps 0xf7cc(%rip),%xmm9 # 2cd90 <_sk_overlay_sse2_8bit+0x11e0>
+ DB 68,15,40,37,212,247,0,0 ; movaps 0xf7d4(%rip),%xmm12 # 2cda0 <_sk_overlay_sse2_8bit+0x11f0>
DB 69,15,89,229 ; mulps %xmm13,%xmm12
DB 69,15,92,204 ; subps %xmm12,%xmm9
- DB 68,15,40,37,148,248,0,0 ; movaps 0xf894(%rip),%xmm12 # 2ce70 <_sk_overlay_sse2_8bit+0x11fb>
+ DB 68,15,40,37,212,247,0,0 ; movaps 0xf7d4(%rip),%xmm12 # 2cdb0 <_sk_overlay_sse2_8bit+0x1200>
DB 69,15,92,229 ; subps %xmm13,%xmm12
- DB 68,15,40,45,152,248,0,0 ; movaps 0xf898(%rip),%xmm13 # 2ce80 <_sk_overlay_sse2_8bit+0x120b>
+ DB 68,15,40,45,216,247,0,0 ; movaps 0xf7d8(%rip),%xmm13 # 2cdc0 <_sk_overlay_sse2_8bit+0x1210>
DB 69,15,94,236 ; divps %xmm12,%xmm13
DB 69,15,88,233 ; addps %xmm9,%xmm13
- DB 68,15,89,45,152,248,0,0 ; mulps 0xf898(%rip),%xmm13 # 2ce90 <_sk_overlay_sse2_8bit+0x121b>
+ DB 68,15,89,45,216,247,0,0 ; mulps 0xf7d8(%rip),%xmm13 # 2cdd0 <_sk_overlay_sse2_8bit+0x1220>
DB 102,69,15,91,205 ; cvtps2dq %xmm13,%xmm9
DB 243,68,15,16,96,20 ; movss 0x14(%rax),%xmm12
DB 69,15,198,228,0 ; shufps $0x0,%xmm12,%xmm12
@@ -27866,15 +27866,15 @@ _sk_parametric_g_sse2 LABEL PROC
DB 69,15,88,209 ; addps %xmm9,%xmm10
DB 69,15,198,219,0 ; shufps $0x0,%xmm11,%xmm11
DB 69,15,91,202 ; cvtdq2ps %xmm10,%xmm9
- DB 68,15,89,13,104,247,0,0 ; mulps 0xf768(%rip),%xmm9 # 2cdf0 <_sk_overlay_sse2_8bit+0x117b>
- DB 68,15,84,21,112,247,0,0 ; andps 0xf770(%rip),%xmm10 # 2ce00 <_sk_overlay_sse2_8bit+0x118b>
- DB 68,15,86,21,136,244,0,0 ; orps 0xf488(%rip),%xmm10 # 2cb20 <_sk_overlay_sse2_8bit+0xeab>
- DB 68,15,88,13,112,247,0,0 ; addps 0xf770(%rip),%xmm9 # 2ce10 <_sk_overlay_sse2_8bit+0x119b>
- DB 68,15,40,37,120,247,0,0 ; movaps 0xf778(%rip),%xmm12 # 2ce20 <_sk_overlay_sse2_8bit+0x11ab>
+ DB 68,15,89,13,168,246,0,0 ; mulps 0xf6a8(%rip),%xmm9 # 2cd30 <_sk_overlay_sse2_8bit+0x1180>
+ DB 68,15,84,21,176,246,0,0 ; andps 0xf6b0(%rip),%xmm10 # 2cd40 <_sk_overlay_sse2_8bit+0x1190>
+ DB 68,15,86,21,200,243,0,0 ; orps 0xf3c8(%rip),%xmm10 # 2ca60 <_sk_overlay_sse2_8bit+0xeb0>
+ DB 68,15,88,13,176,246,0,0 ; addps 0xf6b0(%rip),%xmm9 # 2cd50 <_sk_overlay_sse2_8bit+0x11a0>
+ DB 68,15,40,37,184,246,0,0 ; movaps 0xf6b8(%rip),%xmm12 # 2cd60 <_sk_overlay_sse2_8bit+0x11b0>
DB 69,15,89,226 ; mulps %xmm10,%xmm12
DB 69,15,92,204 ; subps %xmm12,%xmm9
- DB 68,15,88,21,120,247,0,0 ; addps 0xf778(%rip),%xmm10 # 2ce30 <_sk_overlay_sse2_8bit+0x11bb>
- DB 68,15,40,37,128,247,0,0 ; movaps 0xf780(%rip),%xmm12 # 2ce40 <_sk_overlay_sse2_8bit+0x11cb>
+ DB 68,15,88,21,184,246,0,0 ; addps 0xf6b8(%rip),%xmm10 # 2cd70 <_sk_overlay_sse2_8bit+0x11c0>
+ DB 68,15,40,37,192,246,0,0 ; movaps 0xf6c0(%rip),%xmm12 # 2cd80 <_sk_overlay_sse2_8bit+0x11d0>
DB 69,15,94,226 ; divps %xmm10,%xmm12
DB 69,15,92,204 ; subps %xmm12,%xmm9
DB 69,15,89,203 ; mulps %xmm11,%xmm9
@@ -27882,22 +27882,22 @@ _sk_parametric_g_sse2 LABEL PROC
DB 69,15,91,226 ; cvtdq2ps %xmm10,%xmm12
DB 69,15,40,233 ; movaps %xmm9,%xmm13
DB 69,15,194,236,1 ; cmpltps %xmm12,%xmm13
- DB 68,15,40,21,90,244,0,0 ; movaps 0xf45a(%rip),%xmm10 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 68,15,40,21,154,243,0,0 ; movaps 0xf39a(%rip),%xmm10 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 69,15,84,234 ; andps %xmm10,%xmm13
DB 69,15,87,219 ; xorps %xmm11,%xmm11
DB 69,15,92,229 ; subps %xmm13,%xmm12
DB 69,15,40,233 ; movaps %xmm9,%xmm13
DB 69,15,92,236 ; subps %xmm12,%xmm13
- DB 68,15,88,13,78,247,0,0 ; addps 0xf74e(%rip),%xmm9 # 2ce50 <_sk_overlay_sse2_8bit+0x11db>
- DB 68,15,40,37,86,247,0,0 ; movaps 0xf756(%rip),%xmm12 # 2ce60 <_sk_overlay_sse2_8bit+0x11eb>
+ DB 68,15,88,13,142,246,0,0 ; addps 0xf68e(%rip),%xmm9 # 2cd90 <_sk_overlay_sse2_8bit+0x11e0>
+ DB 68,15,40,37,150,246,0,0 ; movaps 0xf696(%rip),%xmm12 # 2cda0 <_sk_overlay_sse2_8bit+0x11f0>
DB 69,15,89,229 ; mulps %xmm13,%xmm12
DB 69,15,92,204 ; subps %xmm12,%xmm9
- DB 68,15,40,37,86,247,0,0 ; movaps 0xf756(%rip),%xmm12 # 2ce70 <_sk_overlay_sse2_8bit+0x11fb>
+ DB 68,15,40,37,150,246,0,0 ; movaps 0xf696(%rip),%xmm12 # 2cdb0 <_sk_overlay_sse2_8bit+0x1200>
DB 69,15,92,229 ; subps %xmm13,%xmm12
- DB 68,15,40,45,90,247,0,0 ; movaps 0xf75a(%rip),%xmm13 # 2ce80 <_sk_overlay_sse2_8bit+0x120b>
+ DB 68,15,40,45,154,246,0,0 ; movaps 0xf69a(%rip),%xmm13 # 2cdc0 <_sk_overlay_sse2_8bit+0x1210>
DB 69,15,94,236 ; divps %xmm12,%xmm13
DB 69,15,88,233 ; addps %xmm9,%xmm13
- DB 68,15,89,45,90,247,0,0 ; mulps 0xf75a(%rip),%xmm13 # 2ce90 <_sk_overlay_sse2_8bit+0x121b>
+ DB 68,15,89,45,154,246,0,0 ; mulps 0xf69a(%rip),%xmm13 # 2cdd0 <_sk_overlay_sse2_8bit+0x1220>
DB 102,69,15,91,205 ; cvtps2dq %xmm13,%xmm9
DB 243,68,15,16,96,20 ; movss 0x14(%rax),%xmm12
DB 69,15,198,228,0 ; shufps $0x0,%xmm12,%xmm12
@@ -27931,15 +27931,15 @@ _sk_parametric_b_sse2 LABEL PROC
DB 69,15,88,209 ; addps %xmm9,%xmm10
DB 69,15,198,219,0 ; shufps $0x0,%xmm11,%xmm11
DB 69,15,91,202 ; cvtdq2ps %xmm10,%xmm9
- DB 68,15,89,13,42,246,0,0 ; mulps 0xf62a(%rip),%xmm9 # 2cdf0 <_sk_overlay_sse2_8bit+0x117b>
- DB 68,15,84,21,50,246,0,0 ; andps 0xf632(%rip),%xmm10 # 2ce00 <_sk_overlay_sse2_8bit+0x118b>
- DB 68,15,86,21,74,243,0,0 ; orps 0xf34a(%rip),%xmm10 # 2cb20 <_sk_overlay_sse2_8bit+0xeab>
- DB 68,15,88,13,50,246,0,0 ; addps 0xf632(%rip),%xmm9 # 2ce10 <_sk_overlay_sse2_8bit+0x119b>
- DB 68,15,40,37,58,246,0,0 ; movaps 0xf63a(%rip),%xmm12 # 2ce20 <_sk_overlay_sse2_8bit+0x11ab>
+ DB 68,15,89,13,106,245,0,0 ; mulps 0xf56a(%rip),%xmm9 # 2cd30 <_sk_overlay_sse2_8bit+0x1180>
+ DB 68,15,84,21,114,245,0,0 ; andps 0xf572(%rip),%xmm10 # 2cd40 <_sk_overlay_sse2_8bit+0x1190>
+ DB 68,15,86,21,138,242,0,0 ; orps 0xf28a(%rip),%xmm10 # 2ca60 <_sk_overlay_sse2_8bit+0xeb0>
+ DB 68,15,88,13,114,245,0,0 ; addps 0xf572(%rip),%xmm9 # 2cd50 <_sk_overlay_sse2_8bit+0x11a0>
+ DB 68,15,40,37,122,245,0,0 ; movaps 0xf57a(%rip),%xmm12 # 2cd60 <_sk_overlay_sse2_8bit+0x11b0>
DB 69,15,89,226 ; mulps %xmm10,%xmm12
DB 69,15,92,204 ; subps %xmm12,%xmm9
- DB 68,15,88,21,58,246,0,0 ; addps 0xf63a(%rip),%xmm10 # 2ce30 <_sk_overlay_sse2_8bit+0x11bb>
- DB 68,15,40,37,66,246,0,0 ; movaps 0xf642(%rip),%xmm12 # 2ce40 <_sk_overlay_sse2_8bit+0x11cb>
+ DB 68,15,88,21,122,245,0,0 ; addps 0xf57a(%rip),%xmm10 # 2cd70 <_sk_overlay_sse2_8bit+0x11c0>
+ DB 68,15,40,37,130,245,0,0 ; movaps 0xf582(%rip),%xmm12 # 2cd80 <_sk_overlay_sse2_8bit+0x11d0>
DB 69,15,94,226 ; divps %xmm10,%xmm12
DB 69,15,92,204 ; subps %xmm12,%xmm9
DB 69,15,89,203 ; mulps %xmm11,%xmm9
@@ -27947,22 +27947,22 @@ _sk_parametric_b_sse2 LABEL PROC
DB 69,15,91,226 ; cvtdq2ps %xmm10,%xmm12
DB 69,15,40,233 ; movaps %xmm9,%xmm13
DB 69,15,194,236,1 ; cmpltps %xmm12,%xmm13
- DB 68,15,40,21,28,243,0,0 ; movaps 0xf31c(%rip),%xmm10 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 68,15,40,21,92,242,0,0 ; movaps 0xf25c(%rip),%xmm10 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 69,15,84,234 ; andps %xmm10,%xmm13
DB 69,15,87,219 ; xorps %xmm11,%xmm11
DB 69,15,92,229 ; subps %xmm13,%xmm12
DB 69,15,40,233 ; movaps %xmm9,%xmm13
DB 69,15,92,236 ; subps %xmm12,%xmm13
- DB 68,15,88,13,16,246,0,0 ; addps 0xf610(%rip),%xmm9 # 2ce50 <_sk_overlay_sse2_8bit+0x11db>
- DB 68,15,40,37,24,246,0,0 ; movaps 0xf618(%rip),%xmm12 # 2ce60 <_sk_overlay_sse2_8bit+0x11eb>
+ DB 68,15,88,13,80,245,0,0 ; addps 0xf550(%rip),%xmm9 # 2cd90 <_sk_overlay_sse2_8bit+0x11e0>
+ DB 68,15,40,37,88,245,0,0 ; movaps 0xf558(%rip),%xmm12 # 2cda0 <_sk_overlay_sse2_8bit+0x11f0>
DB 69,15,89,229 ; mulps %xmm13,%xmm12
DB 69,15,92,204 ; subps %xmm12,%xmm9
- DB 68,15,40,37,24,246,0,0 ; movaps 0xf618(%rip),%xmm12 # 2ce70 <_sk_overlay_sse2_8bit+0x11fb>
+ DB 68,15,40,37,88,245,0,0 ; movaps 0xf558(%rip),%xmm12 # 2cdb0 <_sk_overlay_sse2_8bit+0x1200>
DB 69,15,92,229 ; subps %xmm13,%xmm12
- DB 68,15,40,45,28,246,0,0 ; movaps 0xf61c(%rip),%xmm13 # 2ce80 <_sk_overlay_sse2_8bit+0x120b>
+ DB 68,15,40,45,92,245,0,0 ; movaps 0xf55c(%rip),%xmm13 # 2cdc0 <_sk_overlay_sse2_8bit+0x1210>
DB 69,15,94,236 ; divps %xmm12,%xmm13
DB 69,15,88,233 ; addps %xmm9,%xmm13
- DB 68,15,89,45,28,246,0,0 ; mulps 0xf61c(%rip),%xmm13 # 2ce90 <_sk_overlay_sse2_8bit+0x121b>
+ DB 68,15,89,45,92,245,0,0 ; mulps 0xf55c(%rip),%xmm13 # 2cdd0 <_sk_overlay_sse2_8bit+0x1220>
DB 102,69,15,91,205 ; cvtps2dq %xmm13,%xmm9
DB 243,68,15,16,96,20 ; movss 0x14(%rax),%xmm12
DB 69,15,198,228,0 ; shufps $0x0,%xmm12,%xmm12
@@ -27996,15 +27996,15 @@ _sk_parametric_a_sse2 LABEL PROC
DB 69,15,88,209 ; addps %xmm9,%xmm10
DB 69,15,198,219,0 ; shufps $0x0,%xmm11,%xmm11
DB 69,15,91,202 ; cvtdq2ps %xmm10,%xmm9
- DB 68,15,89,13,236,244,0,0 ; mulps 0xf4ec(%rip),%xmm9 # 2cdf0 <_sk_overlay_sse2_8bit+0x117b>
- DB 68,15,84,21,244,244,0,0 ; andps 0xf4f4(%rip),%xmm10 # 2ce00 <_sk_overlay_sse2_8bit+0x118b>
- DB 68,15,86,21,12,242,0,0 ; orps 0xf20c(%rip),%xmm10 # 2cb20 <_sk_overlay_sse2_8bit+0xeab>
- DB 68,15,88,13,244,244,0,0 ; addps 0xf4f4(%rip),%xmm9 # 2ce10 <_sk_overlay_sse2_8bit+0x119b>
- DB 68,15,40,37,252,244,0,0 ; movaps 0xf4fc(%rip),%xmm12 # 2ce20 <_sk_overlay_sse2_8bit+0x11ab>
+ DB 68,15,89,13,44,244,0,0 ; mulps 0xf42c(%rip),%xmm9 # 2cd30 <_sk_overlay_sse2_8bit+0x1180>
+ DB 68,15,84,21,52,244,0,0 ; andps 0xf434(%rip),%xmm10 # 2cd40 <_sk_overlay_sse2_8bit+0x1190>
+ DB 68,15,86,21,76,241,0,0 ; orps 0xf14c(%rip),%xmm10 # 2ca60 <_sk_overlay_sse2_8bit+0xeb0>
+ DB 68,15,88,13,52,244,0,0 ; addps 0xf434(%rip),%xmm9 # 2cd50 <_sk_overlay_sse2_8bit+0x11a0>
+ DB 68,15,40,37,60,244,0,0 ; movaps 0xf43c(%rip),%xmm12 # 2cd60 <_sk_overlay_sse2_8bit+0x11b0>
DB 69,15,89,226 ; mulps %xmm10,%xmm12
DB 69,15,92,204 ; subps %xmm12,%xmm9
- DB 68,15,88,21,252,244,0,0 ; addps 0xf4fc(%rip),%xmm10 # 2ce30 <_sk_overlay_sse2_8bit+0x11bb>
- DB 68,15,40,37,4,245,0,0 ; movaps 0xf504(%rip),%xmm12 # 2ce40 <_sk_overlay_sse2_8bit+0x11cb>
+ DB 68,15,88,21,60,244,0,0 ; addps 0xf43c(%rip),%xmm10 # 2cd70 <_sk_overlay_sse2_8bit+0x11c0>
+ DB 68,15,40,37,68,244,0,0 ; movaps 0xf444(%rip),%xmm12 # 2cd80 <_sk_overlay_sse2_8bit+0x11d0>
DB 69,15,94,226 ; divps %xmm10,%xmm12
DB 69,15,92,204 ; subps %xmm12,%xmm9
DB 69,15,89,203 ; mulps %xmm11,%xmm9
@@ -28012,22 +28012,22 @@ _sk_parametric_a_sse2 LABEL PROC
DB 69,15,91,226 ; cvtdq2ps %xmm10,%xmm12
DB 69,15,40,233 ; movaps %xmm9,%xmm13
DB 69,15,194,236,1 ; cmpltps %xmm12,%xmm13
- DB 68,15,40,21,222,241,0,0 ; movaps 0xf1de(%rip),%xmm10 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 68,15,40,21,30,241,0,0 ; movaps 0xf11e(%rip),%xmm10 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 69,15,84,234 ; andps %xmm10,%xmm13
DB 69,15,87,219 ; xorps %xmm11,%xmm11
DB 69,15,92,229 ; subps %xmm13,%xmm12
DB 69,15,40,233 ; movaps %xmm9,%xmm13
DB 69,15,92,236 ; subps %xmm12,%xmm13
- DB 68,15,88,13,210,244,0,0 ; addps 0xf4d2(%rip),%xmm9 # 2ce50 <_sk_overlay_sse2_8bit+0x11db>
- DB 68,15,40,37,218,244,0,0 ; movaps 0xf4da(%rip),%xmm12 # 2ce60 <_sk_overlay_sse2_8bit+0x11eb>
+ DB 68,15,88,13,18,244,0,0 ; addps 0xf412(%rip),%xmm9 # 2cd90 <_sk_overlay_sse2_8bit+0x11e0>
+ DB 68,15,40,37,26,244,0,0 ; movaps 0xf41a(%rip),%xmm12 # 2cda0 <_sk_overlay_sse2_8bit+0x11f0>
DB 69,15,89,229 ; mulps %xmm13,%xmm12
DB 69,15,92,204 ; subps %xmm12,%xmm9
- DB 68,15,40,37,218,244,0,0 ; movaps 0xf4da(%rip),%xmm12 # 2ce70 <_sk_overlay_sse2_8bit+0x11fb>
+ DB 68,15,40,37,26,244,0,0 ; movaps 0xf41a(%rip),%xmm12 # 2cdb0 <_sk_overlay_sse2_8bit+0x1200>
DB 69,15,92,229 ; subps %xmm13,%xmm12
- DB 68,15,40,45,222,244,0,0 ; movaps 0xf4de(%rip),%xmm13 # 2ce80 <_sk_overlay_sse2_8bit+0x120b>
+ DB 68,15,40,45,30,244,0,0 ; movaps 0xf41e(%rip),%xmm13 # 2cdc0 <_sk_overlay_sse2_8bit+0x1210>
DB 69,15,94,236 ; divps %xmm12,%xmm13
DB 69,15,88,233 ; addps %xmm9,%xmm13
- DB 68,15,89,45,222,244,0,0 ; mulps 0xf4de(%rip),%xmm13 # 2ce90 <_sk_overlay_sse2_8bit+0x121b>
+ DB 68,15,89,45,30,244,0,0 ; mulps 0xf41e(%rip),%xmm13 # 2cdd0 <_sk_overlay_sse2_8bit+0x1220>
DB 102,69,15,91,205 ; cvtps2dq %xmm13,%xmm9
DB 243,68,15,16,96,20 ; movss 0x14(%rax),%xmm12
DB 69,15,198,228,0 ; shufps $0x0,%xmm12,%xmm12
@@ -28051,19 +28051,19 @@ _sk_gamma_sse2 LABEL PROC
DB 15,40,218 ; movaps %xmm2,%xmm3
DB 15,40,208 ; movaps %xmm0,%xmm2
DB 15,91,194 ; cvtdq2ps %xmm2,%xmm0
- DB 15,89,5,230,243,0,0 ; mulps 0xf3e6(%rip),%xmm0 # 2cdf0 <_sk_overlay_sse2_8bit+0x117b>
- DB 15,84,21,239,243,0,0 ; andps 0xf3ef(%rip),%xmm2 # 2ce00 <_sk_overlay_sse2_8bit+0x118b>
- DB 68,15,40,53,7,241,0,0 ; movaps 0xf107(%rip),%xmm14 # 2cb20 <_sk_overlay_sse2_8bit+0xeab>
+ DB 15,89,5,38,243,0,0 ; mulps 0xf326(%rip),%xmm0 # 2cd30 <_sk_overlay_sse2_8bit+0x1180>
+ DB 15,84,21,47,243,0,0 ; andps 0xf32f(%rip),%xmm2 # 2cd40 <_sk_overlay_sse2_8bit+0x1190>
+ DB 68,15,40,53,71,240,0,0 ; movaps 0xf047(%rip),%xmm14 # 2ca60 <_sk_overlay_sse2_8bit+0xeb0>
DB 65,15,86,214 ; orps %xmm14,%xmm2
- DB 68,15,40,37,235,243,0,0 ; movaps 0xf3eb(%rip),%xmm12 # 2ce10 <_sk_overlay_sse2_8bit+0x119b>
+ DB 68,15,40,37,43,243,0,0 ; movaps 0xf32b(%rip),%xmm12 # 2cd50 <_sk_overlay_sse2_8bit+0x11a0>
DB 65,15,88,196 ; addps %xmm12,%xmm0
- DB 68,15,40,29,239,243,0,0 ; movaps 0xf3ef(%rip),%xmm11 # 2ce20 <_sk_overlay_sse2_8bit+0x11ab>
+ DB 68,15,40,29,47,243,0,0 ; movaps 0xf32f(%rip),%xmm11 # 2cd60 <_sk_overlay_sse2_8bit+0x11b0>
DB 15,40,226 ; movaps %xmm2,%xmm4
DB 65,15,89,227 ; mulps %xmm11,%xmm4
DB 15,92,196 ; subps %xmm4,%xmm0
- DB 68,15,40,21,237,243,0,0 ; movaps 0xf3ed(%rip),%xmm10 # 2ce30 <_sk_overlay_sse2_8bit+0x11bb>
+ DB 68,15,40,21,45,243,0,0 ; movaps 0xf32d(%rip),%xmm10 # 2cd70 <_sk_overlay_sse2_8bit+0x11c0>
DB 65,15,88,210 ; addps %xmm10,%xmm2
- DB 68,15,40,45,241,243,0,0 ; movaps 0xf3f1(%rip),%xmm13 # 2ce40 <_sk_overlay_sse2_8bit+0x11cb>
+ DB 68,15,40,45,49,243,0,0 ; movaps 0xf331(%rip),%xmm13 # 2cd80 <_sk_overlay_sse2_8bit+0x11d0>
DB 65,15,40,229 ; movaps %xmm13,%xmm4
DB 15,94,226 ; divps %xmm2,%xmm4
DB 72,173 ; lods %ds:(%rsi),%rax
@@ -28075,27 +28075,27 @@ _sk_gamma_sse2 LABEL PROC
DB 15,91,210 ; cvtdq2ps %xmm2,%xmm2
DB 15,40,224 ; movaps %xmm0,%xmm4
DB 15,194,226,1 ; cmpltps %xmm2,%xmm4
- DB 68,15,40,13,193,240,0,0 ; movaps 0xf0c1(%rip),%xmm9 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 68,15,40,13,1,240,0,0 ; movaps 0xf001(%rip),%xmm9 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 65,15,84,225 ; andps %xmm9,%xmm4
DB 15,92,212 ; subps %xmm4,%xmm2
DB 15,40,224 ; movaps %xmm0,%xmm4
DB 15,92,226 ; subps %xmm2,%xmm4
- DB 15,40,53,189,243,0,0 ; movaps 0xf3bd(%rip),%xmm6 # 2ce50 <_sk_overlay_sse2_8bit+0x11db>
+ DB 15,40,53,253,242,0,0 ; movaps 0xf2fd(%rip),%xmm6 # 2cd90 <_sk_overlay_sse2_8bit+0x11e0>
DB 15,88,198 ; addps %xmm6,%xmm0
- DB 15,40,61,211,243,0,0 ; movaps 0xf3d3(%rip),%xmm7 # 2ce70 <_sk_overlay_sse2_8bit+0x11fb>
+ DB 15,40,61,19,243,0,0 ; movaps 0xf313(%rip),%xmm7 # 2cdb0 <_sk_overlay_sse2_8bit+0x1200>
DB 15,40,239 ; movaps %xmm7,%xmm5
DB 15,92,236 ; subps %xmm4,%xmm5
DB 15,40,212 ; movaps %xmm4,%xmm2
- DB 15,40,37,179,243,0,0 ; movaps 0xf3b3(%rip),%xmm4 # 2ce60 <_sk_overlay_sse2_8bit+0x11eb>
+ DB 15,40,37,243,242,0,0 ; movaps 0xf2f3(%rip),%xmm4 # 2cda0 <_sk_overlay_sse2_8bit+0x11f0>
DB 15,89,212 ; mulps %xmm4,%xmm2
DB 15,92,194 ; subps %xmm2,%xmm0
- DB 68,15,40,61,197,243,0,0 ; movaps 0xf3c5(%rip),%xmm15 # 2ce80 <_sk_overlay_sse2_8bit+0x120b>
+ DB 68,15,40,61,5,243,0,0 ; movaps 0xf305(%rip),%xmm15 # 2cdc0 <_sk_overlay_sse2_8bit+0x1210>
DB 65,15,40,215 ; movaps %xmm15,%xmm2
DB 15,94,213 ; divps %xmm5,%xmm2
DB 15,88,208 ; addps %xmm0,%xmm2
DB 15,91,193 ; cvtdq2ps %xmm1,%xmm0
- DB 15,89,5,33,243,0,0 ; mulps 0xf321(%rip),%xmm0 # 2cdf0 <_sk_overlay_sse2_8bit+0x117b>
- DB 15,84,13,42,243,0,0 ; andps 0xf32a(%rip),%xmm1 # 2ce00 <_sk_overlay_sse2_8bit+0x118b>
+ DB 15,89,5,97,242,0,0 ; mulps 0xf261(%rip),%xmm0 # 2cd30 <_sk_overlay_sse2_8bit+0x1180>
+ DB 15,84,13,106,242,0,0 ; andps 0xf26a(%rip),%xmm1 # 2cd40 <_sk_overlay_sse2_8bit+0x1190>
DB 65,15,86,206 ; orps %xmm14,%xmm1
DB 65,15,88,196 ; addps %xmm12,%xmm0
DB 15,40,233 ; movaps %xmm1,%xmm5
@@ -28125,9 +28125,9 @@ _sk_gamma_sse2 LABEL PROC
DB 15,94,206 ; divps %xmm6,%xmm1
DB 15,88,200 ; addps %xmm0,%xmm1
DB 15,91,195 ; cvtdq2ps %xmm3,%xmm0
- DB 15,89,5,176,242,0,0 ; mulps 0xf2b0(%rip),%xmm0 # 2cdf0 <_sk_overlay_sse2_8bit+0x117b>
- DB 15,84,29,185,242,0,0 ; andps 0xf2b9(%rip),%xmm3 # 2ce00 <_sk_overlay_sse2_8bit+0x118b>
- DB 15,86,29,210,239,0,0 ; orps 0xefd2(%rip),%xmm3 # 2cb20 <_sk_overlay_sse2_8bit+0xeab>
+ DB 15,89,5,240,241,0,0 ; mulps 0xf1f0(%rip),%xmm0 # 2cd30 <_sk_overlay_sse2_8bit+0x1180>
+ DB 15,84,29,249,241,0,0 ; andps 0xf1f9(%rip),%xmm3 # 2cd40 <_sk_overlay_sse2_8bit+0x1190>
+ DB 15,86,29,18,239,0,0 ; orps 0xef12(%rip),%xmm3 # 2ca60 <_sk_overlay_sse2_8bit+0xeb0>
DB 65,15,88,196 ; addps %xmm12,%xmm0
DB 68,15,89,219 ; mulps %xmm3,%xmm11
DB 65,15,92,195 ; subps %xmm11,%xmm0
@@ -28149,7 +28149,7 @@ _sk_gamma_sse2 LABEL PROC
DB 15,92,253 ; subps %xmm5,%xmm7
DB 68,15,94,255 ; divps %xmm7,%xmm15
DB 68,15,88,248 ; addps %xmm0,%xmm15
- DB 15,40,5,239,242,0,0 ; movaps 0xf2ef(%rip),%xmm0 # 2ce90 <_sk_overlay_sse2_8bit+0x121b>
+ DB 15,40,5,47,242,0,0 ; movaps 0xf22f(%rip),%xmm0 # 2cdd0 <_sk_overlay_sse2_8bit+0x1220>
DB 15,89,208 ; mulps %xmm0,%xmm2
DB 15,89,200 ; mulps %xmm0,%xmm1
DB 68,15,89,248 ; mulps %xmm0,%xmm15
@@ -28167,29 +28167,29 @@ _sk_gamma_sse2 LABEL PROC
PUBLIC _sk_lab_to_xyz_sse2
_sk_lab_to_xyz_sse2 LABEL PROC
- DB 15,89,5,193,242,0,0 ; mulps 0xf2c1(%rip),%xmm0 # 2cea0 <_sk_overlay_sse2_8bit+0x122b>
- DB 68,15,40,5,57,240,0,0 ; movaps 0xf039(%rip),%xmm8 # 2cc20 <_sk_overlay_sse2_8bit+0xfab>
+ DB 15,89,5,1,242,0,0 ; mulps 0xf201(%rip),%xmm0 # 2cde0 <_sk_overlay_sse2_8bit+0x1230>
+ DB 68,15,40,5,121,239,0,0 ; movaps 0xef79(%rip),%xmm8 # 2cb60 <_sk_overlay_sse2_8bit+0xfb0>
DB 65,15,89,200 ; mulps %xmm8,%xmm1
- DB 68,15,40,13,189,242,0,0 ; movaps 0xf2bd(%rip),%xmm9 # 2ceb0 <_sk_overlay_sse2_8bit+0x123b>
+ DB 68,15,40,13,253,241,0,0 ; movaps 0xf1fd(%rip),%xmm9 # 2cdf0 <_sk_overlay_sse2_8bit+0x1240>
DB 65,15,88,201 ; addps %xmm9,%xmm1
DB 65,15,89,208 ; mulps %xmm8,%xmm2
DB 65,15,88,209 ; addps %xmm9,%xmm2
- DB 15,88,5,186,242,0,0 ; addps 0xf2ba(%rip),%xmm0 # 2cec0 <_sk_overlay_sse2_8bit+0x124b>
- DB 15,89,5,195,242,0,0 ; mulps 0xf2c3(%rip),%xmm0 # 2ced0 <_sk_overlay_sse2_8bit+0x125b>
- DB 15,89,13,204,242,0,0 ; mulps 0xf2cc(%rip),%xmm1 # 2cee0 <_sk_overlay_sse2_8bit+0x126b>
+ DB 15,88,5,250,241,0,0 ; addps 0xf1fa(%rip),%xmm0 # 2ce00 <_sk_overlay_sse2_8bit+0x1250>
+ DB 15,89,5,3,242,0,0 ; mulps 0xf203(%rip),%xmm0 # 2ce10 <_sk_overlay_sse2_8bit+0x1260>
+ DB 15,89,13,12,242,0,0 ; mulps 0xf20c(%rip),%xmm1 # 2ce20 <_sk_overlay_sse2_8bit+0x1270>
DB 15,88,200 ; addps %xmm0,%xmm1
- DB 15,89,21,210,242,0,0 ; mulps 0xf2d2(%rip),%xmm2 # 2cef0 <_sk_overlay_sse2_8bit+0x127b>
+ DB 15,89,21,18,242,0,0 ; mulps 0xf212(%rip),%xmm2 # 2ce30 <_sk_overlay_sse2_8bit+0x1280>
DB 68,15,40,200 ; movaps %xmm0,%xmm9
DB 68,15,92,202 ; subps %xmm2,%xmm9
DB 68,15,40,225 ; movaps %xmm1,%xmm12
DB 69,15,89,228 ; mulps %xmm12,%xmm12
DB 68,15,89,225 ; mulps %xmm1,%xmm12
- DB 15,40,21,199,242,0,0 ; movaps 0xf2c7(%rip),%xmm2 # 2cf00 <_sk_overlay_sse2_8bit+0x128b>
+ DB 15,40,21,7,242,0,0 ; movaps 0xf207(%rip),%xmm2 # 2ce40 <_sk_overlay_sse2_8bit+0x1290>
DB 68,15,40,194 ; movaps %xmm2,%xmm8
DB 69,15,194,196,1 ; cmpltps %xmm12,%xmm8
- DB 68,15,40,21,198,242,0,0 ; movaps 0xf2c6(%rip),%xmm10 # 2cf10 <_sk_overlay_sse2_8bit+0x129b>
+ DB 68,15,40,21,6,242,0,0 ; movaps 0xf206(%rip),%xmm10 # 2ce50 <_sk_overlay_sse2_8bit+0x12a0>
DB 65,15,88,202 ; addps %xmm10,%xmm1
- DB 68,15,40,29,202,242,0,0 ; movaps 0xf2ca(%rip),%xmm11 # 2cf20 <_sk_overlay_sse2_8bit+0x12ab>
+ DB 68,15,40,29,10,242,0,0 ; movaps 0xf20a(%rip),%xmm11 # 2ce60 <_sk_overlay_sse2_8bit+0x12b0>
DB 65,15,89,203 ; mulps %xmm11,%xmm1
DB 69,15,84,224 ; andps %xmm8,%xmm12
DB 68,15,85,193 ; andnps %xmm1,%xmm8
@@ -28213,8 +28213,8 @@ _sk_lab_to_xyz_sse2 LABEL PROC
DB 15,84,194 ; andps %xmm2,%xmm0
DB 65,15,85,209 ; andnps %xmm9,%xmm2
DB 15,86,208 ; orps %xmm0,%xmm2
- DB 68,15,89,5,122,242,0,0 ; mulps 0xf27a(%rip),%xmm8 # 2cf30 <_sk_overlay_sse2_8bit+0x12bb>
- DB 15,89,21,131,242,0,0 ; mulps 0xf283(%rip),%xmm2 # 2cf40 <_sk_overlay_sse2_8bit+0x12cb>
+ DB 68,15,89,5,186,241,0,0 ; mulps 0xf1ba(%rip),%xmm8 # 2ce70 <_sk_overlay_sse2_8bit+0x12c0>
+ DB 15,89,21,195,241,0,0 ; mulps 0xf1c3(%rip),%xmm2 # 2ce80 <_sk_overlay_sse2_8bit+0x12d0>
DB 72,173 ; lods %ds:(%rsi),%rax
DB 65,15,40,192 ; movaps %xmm8,%xmm0
DB 255,224 ; jmpq *%rax
@@ -28232,9 +28232,9 @@ _sk_load_a8_sse2 LABEL PROC
DB 102,67,15,110,4,16 ; movd (%r8,%r10,1),%xmm0
DB 102,15,96,192 ; punpcklbw %xmm0,%xmm0
DB 102,15,97,192 ; punpcklwd %xmm0,%xmm0
- DB 102,15,219,5,253,238,0,0 ; pand 0xeefd(%rip),%xmm0 # 2cbf0 <_sk_overlay_sse2_8bit+0xf7b>
+ DB 102,15,219,5,61,238,0,0 ; pand 0xee3d(%rip),%xmm0 # 2cb30 <_sk_overlay_sse2_8bit+0xf80>
DB 15,91,216 ; cvtdq2ps %xmm0,%xmm3
- DB 15,89,29,67,240,0,0 ; mulps 0xf043(%rip),%xmm3 # 2cd40 <_sk_overlay_sse2_8bit+0x10cb>
+ DB 15,89,29,131,239,0,0 ; mulps 0xef83(%rip),%xmm3 # 2cc80 <_sk_overlay_sse2_8bit+0x10d0>
DB 72,173 ; lods %ds:(%rsi),%rax
DB 15,87,192 ; xorps %xmm0,%xmm0
DB 102,15,87,201 ; xorpd %xmm1,%xmm1
@@ -28275,9 +28275,9 @@ _sk_load_a8_dst_sse2 LABEL PROC
DB 102,67,15,110,36,16 ; movd (%r8,%r10,1),%xmm4
DB 102,15,96,224 ; punpcklbw %xmm0,%xmm4
DB 102,15,97,224 ; punpcklwd %xmm0,%xmm4
- DB 102,15,219,37,105,238,0,0 ; pand 0xee69(%rip),%xmm4 # 2cbf0 <_sk_overlay_sse2_8bit+0xf7b>
+ DB 102,15,219,37,169,237,0,0 ; pand 0xeda9(%rip),%xmm4 # 2cb30 <_sk_overlay_sse2_8bit+0xf80>
DB 15,91,252 ; cvtdq2ps %xmm4,%xmm7
- DB 15,89,61,175,239,0,0 ; mulps 0xefaf(%rip),%xmm7 # 2cd40 <_sk_overlay_sse2_8bit+0x10cb>
+ DB 15,89,61,239,238,0,0 ; mulps 0xeeef(%rip),%xmm7 # 2cc80 <_sk_overlay_sse2_8bit+0x10d0>
DB 72,173 ; lods %ds:(%rsi),%rax
DB 15,87,228 ; xorps %xmm4,%xmm4
DB 102,15,87,237 ; xorpd %xmm5,%xmm5
@@ -28341,7 +28341,7 @@ _sk_gather_a8_sse2 LABEL PROC
DB 102,15,96,193 ; punpcklbw %xmm1,%xmm0
DB 102,15,97,193 ; punpcklwd %xmm1,%xmm0
DB 15,91,216 ; cvtdq2ps %xmm0,%xmm3
- DB 15,89,29,190,238,0,0 ; mulps 0xeebe(%rip),%xmm3 # 2cd40 <_sk_overlay_sse2_8bit+0x10cb>
+ DB 15,89,29,254,237,0,0 ; mulps 0xedfe(%rip),%xmm3 # 2cc80 <_sk_overlay_sse2_8bit+0x10d0>
DB 72,173 ; lods %ds:(%rsi),%rax
DB 15,87,192 ; xorps %xmm0,%xmm0
DB 102,15,239,201 ; pxor %xmm1,%xmm1
@@ -28357,7 +28357,7 @@ _sk_store_a8_sse2 LABEL PROC
DB 77,15,175,193 ; imul %r9,%r8
DB 76,3,0 ; add (%rax),%r8
DB 76,99,210 ; movslq %edx,%r10
- DB 68,15,40,5,112,237,0,0 ; movaps 0xed70(%rip),%xmm8 # 2cc20 <_sk_overlay_sse2_8bit+0xfab>
+ DB 68,15,40,5,176,236,0,0 ; movaps 0xecb0(%rip),%xmm8 # 2cb60 <_sk_overlay_sse2_8bit+0xfb0>
DB 68,15,89,195 ; mulps %xmm3,%xmm8
DB 102,69,15,91,192 ; cvtps2dq %xmm8,%xmm8
DB 102,65,15,114,240,16 ; pslld $0x10,%xmm8
@@ -28384,7 +28384,7 @@ _sk_store_a8_sse2 LABEL PROC
DB 102,68,15,127,68,36,16 ; movdqa %xmm8,0x10(%rsp)
DB 138,68,36,24 ; mov 0x18(%rsp),%al
DB 67,136,68,16,2 ; mov %al,0x2(%r8,%r10,1)
- DB 102,68,15,219,5,207,236,0,0 ; pand 0xeccf(%rip),%xmm8 # 2cbf0 <_sk_overlay_sse2_8bit+0xf7b>
+ DB 102,68,15,219,5,15,236,0,0 ; pand 0xec0f(%rip),%xmm8 # 2cb30 <_sk_overlay_sse2_8bit+0xf80>
DB 102,69,15,103,192 ; packuswb %xmm8,%xmm8
DB 102,69,15,103,192 ; packuswb %xmm8,%xmm8
DB 102,68,15,126,192 ; movd %xmm8,%eax
@@ -28408,11 +28408,11 @@ _sk_load_g8_sse2 LABEL PROC
DB 102,67,15,110,4,16 ; movd (%r8,%r10,1),%xmm0
DB 102,15,96,192 ; punpcklbw %xmm0,%xmm0
DB 102,15,97,192 ; punpcklwd %xmm0,%xmm0
- DB 102,15,219,5,124,236,0,0 ; pand 0xec7c(%rip),%xmm0 # 2cbf0 <_sk_overlay_sse2_8bit+0xf7b>
+ DB 102,15,219,5,188,235,0,0 ; pand 0xebbc(%rip),%xmm0 # 2cb30 <_sk_overlay_sse2_8bit+0xf80>
DB 15,91,192 ; cvtdq2ps %xmm0,%xmm0
- DB 15,89,5,194,237,0,0 ; mulps 0xedc2(%rip),%xmm0 # 2cd40 <_sk_overlay_sse2_8bit+0x10cb>
+ DB 15,89,5,2,237,0,0 ; mulps 0xed02(%rip),%xmm0 # 2cc80 <_sk_overlay_sse2_8bit+0x10d0>
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 15,40,29,185,235,0,0 ; movaps 0xebb9(%rip),%xmm3 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 15,40,29,249,234,0,0 ; movaps 0xeaf9(%rip),%xmm3 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 15,40,200 ; movaps %xmm0,%xmm1
DB 15,40,208 ; movaps %xmm0,%xmm2
DB 255,224 ; jmpq *%rax
@@ -28451,11 +28451,11 @@ _sk_load_g8_dst_sse2 LABEL PROC
DB 102,67,15,110,36,16 ; movd (%r8,%r10,1),%xmm4
DB 102,15,96,224 ; punpcklbw %xmm0,%xmm4
DB 102,15,97,224 ; punpcklwd %xmm0,%xmm4
- DB 102,15,219,37,229,235,0,0 ; pand 0xebe5(%rip),%xmm4 # 2cbf0 <_sk_overlay_sse2_8bit+0xf7b>
+ DB 102,15,219,37,37,235,0,0 ; pand 0xeb25(%rip),%xmm4 # 2cb30 <_sk_overlay_sse2_8bit+0xf80>
DB 15,91,228 ; cvtdq2ps %xmm4,%xmm4
- DB 15,89,37,43,237,0,0 ; mulps 0xed2b(%rip),%xmm4 # 2cd40 <_sk_overlay_sse2_8bit+0x10cb>
+ DB 15,89,37,107,236,0,0 ; mulps 0xec6b(%rip),%xmm4 # 2cc80 <_sk_overlay_sse2_8bit+0x10d0>
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 15,40,61,34,235,0,0 ; movaps 0xeb22(%rip),%xmm7 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 15,40,61,98,234,0,0 ; movaps 0xea62(%rip),%xmm7 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 15,40,236 ; movaps %xmm4,%xmm5
DB 15,40,244 ; movaps %xmm4,%xmm6
DB 255,224 ; jmpq *%rax
@@ -28517,9 +28517,9 @@ _sk_gather_g8_sse2 LABEL PROC
DB 102,15,96,193 ; punpcklbw %xmm1,%xmm0
DB 102,15,97,193 ; punpcklwd %xmm1,%xmm0
DB 15,91,192 ; cvtdq2ps %xmm0,%xmm0
- DB 15,89,5,55,236,0,0 ; mulps 0xec37(%rip),%xmm0 # 2cd40 <_sk_overlay_sse2_8bit+0x10cb>
+ DB 15,89,5,119,235,0,0 ; mulps 0xeb77(%rip),%xmm0 # 2cc80 <_sk_overlay_sse2_8bit+0x10d0>
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 15,40,29,46,234,0,0 ; movaps 0xea2e(%rip),%xmm3 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 15,40,29,110,233,0,0 ; movaps 0xe96e(%rip),%xmm3 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 15,40,200 ; movaps %xmm0,%xmm1
DB 15,40,208 ; movaps %xmm0,%xmm2
DB 255,224 ; jmpq *%rax
@@ -28537,19 +28537,19 @@ _sk_load_565_sse2 LABEL PROC
DB 117,83 ; jne 1e188 <_sk_load_565_sse2+0x6e>
DB 243,67,15,126,20,80 ; movq (%r8,%r10,2),%xmm2
DB 102,15,97,208 ; punpcklwd %xmm0,%xmm2
- DB 102,15,111,5,9,236,0,0 ; movdqa 0xec09(%rip),%xmm0 # 2cd50 <_sk_overlay_sse2_8bit+0x10db>
+ DB 102,15,111,5,73,235,0,0 ; movdqa 0xeb49(%rip),%xmm0 # 2cc90 <_sk_overlay_sse2_8bit+0x10e0>
DB 102,15,219,194 ; pand %xmm2,%xmm0
DB 15,91,192 ; cvtdq2ps %xmm0,%xmm0
- DB 15,89,5,11,236,0,0 ; mulps 0xec0b(%rip),%xmm0 # 2cd60 <_sk_overlay_sse2_8bit+0x10eb>
- DB 102,15,111,13,19,236,0,0 ; movdqa 0xec13(%rip),%xmm1 # 2cd70 <_sk_overlay_sse2_8bit+0x10fb>
+ DB 15,89,5,75,235,0,0 ; mulps 0xeb4b(%rip),%xmm0 # 2cca0 <_sk_overlay_sse2_8bit+0x10f0>
+ DB 102,15,111,13,83,235,0,0 ; movdqa 0xeb53(%rip),%xmm1 # 2ccb0 <_sk_overlay_sse2_8bit+0x1100>
DB 102,15,219,202 ; pand %xmm2,%xmm1
DB 15,91,201 ; cvtdq2ps %xmm1,%xmm1
- DB 15,89,13,21,236,0,0 ; mulps 0xec15(%rip),%xmm1 # 2cd80 <_sk_overlay_sse2_8bit+0x110b>
- DB 102,15,219,21,29,236,0,0 ; pand 0xec1d(%rip),%xmm2 # 2cd90 <_sk_overlay_sse2_8bit+0x111b>
+ DB 15,89,13,85,235,0,0 ; mulps 0xeb55(%rip),%xmm1 # 2ccc0 <_sk_overlay_sse2_8bit+0x1110>
+ DB 102,15,219,21,93,235,0,0 ; pand 0xeb5d(%rip),%xmm2 # 2ccd0 <_sk_overlay_sse2_8bit+0x1120>
DB 15,91,210 ; cvtdq2ps %xmm2,%xmm2
- DB 15,89,21,35,236,0,0 ; mulps 0xec23(%rip),%xmm2 # 2cda0 <_sk_overlay_sse2_8bit+0x112b>
+ DB 15,89,21,99,235,0,0 ; mulps 0xeb63(%rip),%xmm2 # 2cce0 <_sk_overlay_sse2_8bit+0x1130>
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 15,40,29,186,233,0,0 ; movaps 0xe9ba(%rip),%xmm3 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 15,40,29,250,232,0,0 ; movaps 0xe8fa(%rip),%xmm3 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 255,224 ; jmpq *%rax
DB 65,137,249 ; mov %edi,%r9d
DB 65,128,225,3 ; and $0x3,%r9b
@@ -28584,19 +28584,19 @@ _sk_load_565_dst_sse2 LABEL PROC
DB 117,83 ; jne 1e243 <_sk_load_565_dst_sse2+0x6e>
DB 243,67,15,126,52,80 ; movq (%r8,%r10,2),%xmm6
DB 102,15,97,240 ; punpcklwd %xmm0,%xmm6
- DB 102,15,111,37,78,235,0,0 ; movdqa 0xeb4e(%rip),%xmm4 # 2cd50 <_sk_overlay_sse2_8bit+0x10db>
+ DB 102,15,111,37,142,234,0,0 ; movdqa 0xea8e(%rip),%xmm4 # 2cc90 <_sk_overlay_sse2_8bit+0x10e0>
DB 102,15,219,230 ; pand %xmm6,%xmm4
DB 15,91,228 ; cvtdq2ps %xmm4,%xmm4
- DB 15,89,37,80,235,0,0 ; mulps 0xeb50(%rip),%xmm4 # 2cd60 <_sk_overlay_sse2_8bit+0x10eb>
- DB 102,15,111,45,88,235,0,0 ; movdqa 0xeb58(%rip),%xmm5 # 2cd70 <_sk_overlay_sse2_8bit+0x10fb>
+ DB 15,89,37,144,234,0,0 ; mulps 0xea90(%rip),%xmm4 # 2cca0 <_sk_overlay_sse2_8bit+0x10f0>
+ DB 102,15,111,45,152,234,0,0 ; movdqa 0xea98(%rip),%xmm5 # 2ccb0 <_sk_overlay_sse2_8bit+0x1100>
DB 102,15,219,238 ; pand %xmm6,%xmm5
DB 15,91,237 ; cvtdq2ps %xmm5,%xmm5
- DB 15,89,45,90,235,0,0 ; mulps 0xeb5a(%rip),%xmm5 # 2cd80 <_sk_overlay_sse2_8bit+0x110b>
- DB 102,15,219,53,98,235,0,0 ; pand 0xeb62(%rip),%xmm6 # 2cd90 <_sk_overlay_sse2_8bit+0x111b>
+ DB 15,89,45,154,234,0,0 ; mulps 0xea9a(%rip),%xmm5 # 2ccc0 <_sk_overlay_sse2_8bit+0x1110>
+ DB 102,15,219,53,162,234,0,0 ; pand 0xeaa2(%rip),%xmm6 # 2ccd0 <_sk_overlay_sse2_8bit+0x1120>
DB 15,91,246 ; cvtdq2ps %xmm6,%xmm6
- DB 15,89,53,104,235,0,0 ; mulps 0xeb68(%rip),%xmm6 # 2cda0 <_sk_overlay_sse2_8bit+0x112b>
+ DB 15,89,53,168,234,0,0 ; mulps 0xeaa8(%rip),%xmm6 # 2cce0 <_sk_overlay_sse2_8bit+0x1130>
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 15,40,61,255,232,0,0 ; movaps 0xe8ff(%rip),%xmm7 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 15,40,61,63,232,0,0 ; movaps 0xe83f(%rip),%xmm7 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 255,224 ; jmpq *%rax
DB 65,137,249 ; mov %edi,%r9d
DB 65,128,225,3 ; and $0x3,%r9b
@@ -28648,19 +28648,19 @@ _sk_gather_565_sse2 LABEL PROC
DB 102,15,196,208,3 ; pinsrw $0x3,%eax,%xmm2
DB 102,15,239,192 ; pxor %xmm0,%xmm0
DB 102,15,97,208 ; punpcklwd %xmm0,%xmm2
- DB 102,15,111,5,58,234,0,0 ; movdqa 0xea3a(%rip),%xmm0 # 2cd50 <_sk_overlay_sse2_8bit+0x10db>
+ DB 102,15,111,5,122,233,0,0 ; movdqa 0xe97a(%rip),%xmm0 # 2cc90 <_sk_overlay_sse2_8bit+0x10e0>
DB 102,15,219,194 ; pand %xmm2,%xmm0
DB 15,91,192 ; cvtdq2ps %xmm0,%xmm0
- DB 15,89,5,60,234,0,0 ; mulps 0xea3c(%rip),%xmm0 # 2cd60 <_sk_overlay_sse2_8bit+0x10eb>
- DB 102,15,111,13,68,234,0,0 ; movdqa 0xea44(%rip),%xmm1 # 2cd70 <_sk_overlay_sse2_8bit+0x10fb>
+ DB 15,89,5,124,233,0,0 ; mulps 0xe97c(%rip),%xmm0 # 2cca0 <_sk_overlay_sse2_8bit+0x10f0>
+ DB 102,15,111,13,132,233,0,0 ; movdqa 0xe984(%rip),%xmm1 # 2ccb0 <_sk_overlay_sse2_8bit+0x1100>
DB 102,15,219,202 ; pand %xmm2,%xmm1
DB 15,91,201 ; cvtdq2ps %xmm1,%xmm1
- DB 15,89,13,70,234,0,0 ; mulps 0xea46(%rip),%xmm1 # 2cd80 <_sk_overlay_sse2_8bit+0x110b>
- DB 102,15,219,21,78,234,0,0 ; pand 0xea4e(%rip),%xmm2 # 2cd90 <_sk_overlay_sse2_8bit+0x111b>
+ DB 15,89,13,134,233,0,0 ; mulps 0xe986(%rip),%xmm1 # 2ccc0 <_sk_overlay_sse2_8bit+0x1110>
+ DB 102,15,219,21,142,233,0,0 ; pand 0xe98e(%rip),%xmm2 # 2ccd0 <_sk_overlay_sse2_8bit+0x1120>
DB 15,91,210 ; cvtdq2ps %xmm2,%xmm2
- DB 15,89,21,84,234,0,0 ; mulps 0xea54(%rip),%xmm2 # 2cda0 <_sk_overlay_sse2_8bit+0x112b>
+ DB 15,89,21,148,233,0,0 ; mulps 0xe994(%rip),%xmm2 # 2cce0 <_sk_overlay_sse2_8bit+0x1130>
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 15,40,29,235,231,0,0 ; movaps 0xe7eb(%rip),%xmm3 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 15,40,29,43,231,0,0 ; movaps 0xe72b(%rip),%xmm3 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 255,224 ; jmpq *%rax
PUBLIC _sk_store_565_sse2
@@ -28672,12 +28672,12 @@ _sk_store_565_sse2 LABEL PROC
DB 77,1,192 ; add %r8,%r8
DB 76,3,0 ; add (%rax),%r8
DB 76,99,210 ; movslq %edx,%r10
- DB 68,15,40,5,235,235,0,0 ; movaps 0xebeb(%rip),%xmm8 # 2cf60 <_sk_overlay_sse2_8bit+0x12eb>
+ DB 68,15,40,5,43,235,0,0 ; movaps 0xeb2b(%rip),%xmm8 # 2cea0 <_sk_overlay_sse2_8bit+0x12f0>
DB 68,15,40,200 ; movaps %xmm0,%xmm9
DB 69,15,89,200 ; mulps %xmm8,%xmm9
DB 102,69,15,91,201 ; cvtps2dq %xmm9,%xmm9
DB 102,65,15,114,241,11 ; pslld $0xb,%xmm9
- DB 68,15,40,21,224,235,0,0 ; movaps 0xebe0(%rip),%xmm10 # 2cf70 <_sk_overlay_sse2_8bit+0x12fb>
+ DB 68,15,40,21,32,235,0,0 ; movaps 0xeb20(%rip),%xmm10 # 2ceb0 <_sk_overlay_sse2_8bit+0x1300>
DB 68,15,89,209 ; mulps %xmm1,%xmm10
DB 102,69,15,91,210 ; cvtps2dq %xmm10,%xmm10
DB 102,65,15,114,242,5 ; pslld $0x5,%xmm10
@@ -28724,21 +28724,21 @@ _sk_load_4444_sse2 LABEL PROC
DB 117,98 ; jne 1e493 <_sk_load_4444_sse2+0x7d>
DB 243,67,15,126,28,80 ; movq (%r8,%r10,2),%xmm3
DB 102,15,97,216 ; punpcklwd %xmm0,%xmm3
- DB 102,15,111,5,61,235,0,0 ; movdqa 0xeb3d(%rip),%xmm0 # 2cf80 <_sk_overlay_sse2_8bit+0x130b>
+ DB 102,15,111,5,125,234,0,0 ; movdqa 0xea7d(%rip),%xmm0 # 2cec0 <_sk_overlay_sse2_8bit+0x1310>
DB 102,15,219,195 ; pand %xmm3,%xmm0
DB 15,91,192 ; cvtdq2ps %xmm0,%xmm0
- DB 15,89,5,63,235,0,0 ; mulps 0xeb3f(%rip),%xmm0 # 2cf90 <_sk_overlay_sse2_8bit+0x131b>
- DB 102,15,111,13,71,235,0,0 ; movdqa 0xeb47(%rip),%xmm1 # 2cfa0 <_sk_overlay_sse2_8bit+0x132b>
+ DB 15,89,5,127,234,0,0 ; mulps 0xea7f(%rip),%xmm0 # 2ced0 <_sk_overlay_sse2_8bit+0x1320>
+ DB 102,15,111,13,135,234,0,0 ; movdqa 0xea87(%rip),%xmm1 # 2cee0 <_sk_overlay_sse2_8bit+0x1330>
DB 102,15,219,203 ; pand %xmm3,%xmm1
DB 15,91,201 ; cvtdq2ps %xmm1,%xmm1
- DB 15,89,13,73,235,0,0 ; mulps 0xeb49(%rip),%xmm1 # 2cfb0 <_sk_overlay_sse2_8bit+0x133b>
- DB 102,15,111,21,81,235,0,0 ; movdqa 0xeb51(%rip),%xmm2 # 2cfc0 <_sk_overlay_sse2_8bit+0x134b>
+ DB 15,89,13,137,234,0,0 ; mulps 0xea89(%rip),%xmm1 # 2cef0 <_sk_overlay_sse2_8bit+0x1340>
+ DB 102,15,111,21,145,234,0,0 ; movdqa 0xea91(%rip),%xmm2 # 2cf00 <_sk_overlay_sse2_8bit+0x1350>
DB 102,15,219,211 ; pand %xmm3,%xmm2
DB 15,91,210 ; cvtdq2ps %xmm2,%xmm2
- DB 15,89,21,83,235,0,0 ; mulps 0xeb53(%rip),%xmm2 # 2cfd0 <_sk_overlay_sse2_8bit+0x135b>
- DB 102,15,219,29,91,235,0,0 ; pand 0xeb5b(%rip),%xmm3 # 2cfe0 <_sk_overlay_sse2_8bit+0x136b>
+ DB 15,89,21,147,234,0,0 ; mulps 0xea93(%rip),%xmm2 # 2cf10 <_sk_overlay_sse2_8bit+0x1360>
+ DB 102,15,219,29,155,234,0,0 ; pand 0xea9b(%rip),%xmm3 # 2cf20 <_sk_overlay_sse2_8bit+0x1370>
DB 15,91,219 ; cvtdq2ps %xmm3,%xmm3
- DB 15,89,29,97,235,0,0 ; mulps 0xeb61(%rip),%xmm3 # 2cff0 <_sk_overlay_sse2_8bit+0x137b>
+ DB 15,89,29,161,234,0,0 ; mulps 0xeaa1(%rip),%xmm3 # 2cf30 <_sk_overlay_sse2_8bit+0x1380>
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
DB 65,137,249 ; mov %edi,%r9d
@@ -28774,21 +28774,21 @@ _sk_load_4444_dst_sse2 LABEL PROC
DB 117,98 ; jne 1e55d <_sk_load_4444_dst_sse2+0x7d>
DB 243,67,15,126,60,80 ; movq (%r8,%r10,2),%xmm7
DB 102,15,97,248 ; punpcklwd %xmm0,%xmm7
- DB 102,15,111,37,115,234,0,0 ; movdqa 0xea73(%rip),%xmm4 # 2cf80 <_sk_overlay_sse2_8bit+0x130b>
+ DB 102,15,111,37,179,233,0,0 ; movdqa 0xe9b3(%rip),%xmm4 # 2cec0 <_sk_overlay_sse2_8bit+0x1310>
DB 102,15,219,231 ; pand %xmm7,%xmm4
DB 15,91,228 ; cvtdq2ps %xmm4,%xmm4
- DB 15,89,37,117,234,0,0 ; mulps 0xea75(%rip),%xmm4 # 2cf90 <_sk_overlay_sse2_8bit+0x131b>
- DB 102,15,111,45,125,234,0,0 ; movdqa 0xea7d(%rip),%xmm5 # 2cfa0 <_sk_overlay_sse2_8bit+0x132b>
+ DB 15,89,37,181,233,0,0 ; mulps 0xe9b5(%rip),%xmm4 # 2ced0 <_sk_overlay_sse2_8bit+0x1320>
+ DB 102,15,111,45,189,233,0,0 ; movdqa 0xe9bd(%rip),%xmm5 # 2cee0 <_sk_overlay_sse2_8bit+0x1330>
DB 102,15,219,239 ; pand %xmm7,%xmm5
DB 15,91,237 ; cvtdq2ps %xmm5,%xmm5
- DB 15,89,45,127,234,0,0 ; mulps 0xea7f(%rip),%xmm5 # 2cfb0 <_sk_overlay_sse2_8bit+0x133b>
- DB 102,15,111,53,135,234,0,0 ; movdqa 0xea87(%rip),%xmm6 # 2cfc0 <_sk_overlay_sse2_8bit+0x134b>
+ DB 15,89,45,191,233,0,0 ; mulps 0xe9bf(%rip),%xmm5 # 2cef0 <_sk_overlay_sse2_8bit+0x1340>
+ DB 102,15,111,53,199,233,0,0 ; movdqa 0xe9c7(%rip),%xmm6 # 2cf00 <_sk_overlay_sse2_8bit+0x1350>
DB 102,15,219,247 ; pand %xmm7,%xmm6
DB 15,91,246 ; cvtdq2ps %xmm6,%xmm6
- DB 15,89,53,137,234,0,0 ; mulps 0xea89(%rip),%xmm6 # 2cfd0 <_sk_overlay_sse2_8bit+0x135b>
- DB 102,15,219,61,145,234,0,0 ; pand 0xea91(%rip),%xmm7 # 2cfe0 <_sk_overlay_sse2_8bit+0x136b>
+ DB 15,89,53,201,233,0,0 ; mulps 0xe9c9(%rip),%xmm6 # 2cf10 <_sk_overlay_sse2_8bit+0x1360>
+ DB 102,15,219,61,209,233,0,0 ; pand 0xe9d1(%rip),%xmm7 # 2cf20 <_sk_overlay_sse2_8bit+0x1370>
DB 15,91,255 ; cvtdq2ps %xmm7,%xmm7
- DB 15,89,61,151,234,0,0 ; mulps 0xea97(%rip),%xmm7 # 2cff0 <_sk_overlay_sse2_8bit+0x137b>
+ DB 15,89,61,215,233,0,0 ; mulps 0xe9d7(%rip),%xmm7 # 2cf30 <_sk_overlay_sse2_8bit+0x1380>
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
DB 65,137,249 ; mov %edi,%r9d
@@ -28841,21 +28841,21 @@ _sk_gather_4444_sse2 LABEL PROC
DB 102,15,196,216,3 ; pinsrw $0x3,%eax,%xmm3
DB 102,15,239,192 ; pxor %xmm0,%xmm0
DB 102,15,97,216 ; punpcklwd %xmm0,%xmm3
- DB 102,15,111,5,80,233,0,0 ; movdqa 0xe950(%rip),%xmm0 # 2cf80 <_sk_overlay_sse2_8bit+0x130b>
+ DB 102,15,111,5,144,232,0,0 ; movdqa 0xe890(%rip),%xmm0 # 2cec0 <_sk_overlay_sse2_8bit+0x1310>
DB 102,15,219,195 ; pand %xmm3,%xmm0
DB 15,91,192 ; cvtdq2ps %xmm0,%xmm0
- DB 15,89,5,82,233,0,0 ; mulps 0xe952(%rip),%xmm0 # 2cf90 <_sk_overlay_sse2_8bit+0x131b>
- DB 102,15,111,13,90,233,0,0 ; movdqa 0xe95a(%rip),%xmm1 # 2cfa0 <_sk_overlay_sse2_8bit+0x132b>
+ DB 15,89,5,146,232,0,0 ; mulps 0xe892(%rip),%xmm0 # 2ced0 <_sk_overlay_sse2_8bit+0x1320>
+ DB 102,15,111,13,154,232,0,0 ; movdqa 0xe89a(%rip),%xmm1 # 2cee0 <_sk_overlay_sse2_8bit+0x1330>
DB 102,15,219,203 ; pand %xmm3,%xmm1
DB 15,91,201 ; cvtdq2ps %xmm1,%xmm1
- DB 15,89,13,92,233,0,0 ; mulps 0xe95c(%rip),%xmm1 # 2cfb0 <_sk_overlay_sse2_8bit+0x133b>
- DB 102,15,111,21,100,233,0,0 ; movdqa 0xe964(%rip),%xmm2 # 2cfc0 <_sk_overlay_sse2_8bit+0x134b>
+ DB 15,89,13,156,232,0,0 ; mulps 0xe89c(%rip),%xmm1 # 2cef0 <_sk_overlay_sse2_8bit+0x1340>
+ DB 102,15,111,21,164,232,0,0 ; movdqa 0xe8a4(%rip),%xmm2 # 2cf00 <_sk_overlay_sse2_8bit+0x1350>
DB 102,15,219,211 ; pand %xmm3,%xmm2
DB 15,91,210 ; cvtdq2ps %xmm2,%xmm2
- DB 15,89,21,102,233,0,0 ; mulps 0xe966(%rip),%xmm2 # 2cfd0 <_sk_overlay_sse2_8bit+0x135b>
- DB 102,15,219,29,110,233,0,0 ; pand 0xe96e(%rip),%xmm3 # 2cfe0 <_sk_overlay_sse2_8bit+0x136b>
+ DB 15,89,21,166,232,0,0 ; mulps 0xe8a6(%rip),%xmm2 # 2cf10 <_sk_overlay_sse2_8bit+0x1360>
+ DB 102,15,219,29,174,232,0,0 ; pand 0xe8ae(%rip),%xmm3 # 2cf20 <_sk_overlay_sse2_8bit+0x1370>
DB 15,91,219 ; cvtdq2ps %xmm3,%xmm3
- DB 15,89,29,116,233,0,0 ; mulps 0xe974(%rip),%xmm3 # 2cff0 <_sk_overlay_sse2_8bit+0x137b>
+ DB 15,89,29,180,232,0,0 ; mulps 0xe8b4(%rip),%xmm3 # 2cf30 <_sk_overlay_sse2_8bit+0x1380>
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
@@ -28868,7 +28868,7 @@ _sk_store_4444_sse2 LABEL PROC
DB 77,1,192 ; add %r8,%r8
DB 76,3,0 ; add (%rax),%r8
DB 76,99,210 ; movslq %edx,%r10
- DB 68,15,40,5,98,233,0,0 ; movaps 0xe962(%rip),%xmm8 # 2d000 <_sk_overlay_sse2_8bit+0x138b>
+ DB 68,15,40,5,162,232,0,0 ; movaps 0xe8a2(%rip),%xmm8 # 2cf40 <_sk_overlay_sse2_8bit+0x1390>
DB 68,15,40,200 ; movaps %xmm0,%xmm9
DB 69,15,89,200 ; mulps %xmm8,%xmm9
DB 102,69,15,91,201 ; cvtps2dq %xmm9,%xmm9
@@ -28924,11 +28924,11 @@ _sk_load_8888_sse2 LABEL PROC
DB 72,133,255 ; test %rdi,%rdi
DB 117,98 ; jne 1e7d1 <_sk_load_8888_sse2+0x7e>
DB 243,69,15,111,12,128 ; movdqu (%r8,%rax,4),%xmm9
- DB 102,15,111,21,115,228,0,0 ; movdqa 0xe473(%rip),%xmm2 # 2cbf0 <_sk_overlay_sse2_8bit+0xf7b>
+ DB 102,15,111,21,179,227,0,0 ; movdqa 0xe3b3(%rip),%xmm2 # 2cb30 <_sk_overlay_sse2_8bit+0xf80>
DB 102,65,15,111,193 ; movdqa %xmm9,%xmm0
DB 102,15,219,194 ; pand %xmm2,%xmm0
DB 15,91,192 ; cvtdq2ps %xmm0,%xmm0
- DB 68,15,40,5,175,229,0,0 ; movaps 0xe5af(%rip),%xmm8 # 2cd40 <_sk_overlay_sse2_8bit+0x10cb>
+ DB 68,15,40,5,239,228,0,0 ; movaps 0xe4ef(%rip),%xmm8 # 2cc80 <_sk_overlay_sse2_8bit+0x10d0>
DB 65,15,89,192 ; mulps %xmm8,%xmm0
DB 102,65,15,111,201 ; movdqa %xmm9,%xmm1
DB 102,15,114,209,8 ; psrld $0x8,%xmm1
@@ -28973,11 +28973,11 @@ _sk_load_8888_dst_sse2 LABEL PROC
DB 72,133,255 ; test %rdi,%rdi
DB 117,98 ; jne 1e890 <_sk_load_8888_dst_sse2+0x7e>
DB 243,69,15,111,12,128 ; movdqu (%r8,%rax,4),%xmm9
- DB 102,15,111,53,180,227,0,0 ; movdqa 0xe3b4(%rip),%xmm6 # 2cbf0 <_sk_overlay_sse2_8bit+0xf7b>
+ DB 102,15,111,53,244,226,0,0 ; movdqa 0xe2f4(%rip),%xmm6 # 2cb30 <_sk_overlay_sse2_8bit+0xf80>
DB 102,65,15,111,225 ; movdqa %xmm9,%xmm4
DB 102,15,219,230 ; pand %xmm6,%xmm4
DB 15,91,228 ; cvtdq2ps %xmm4,%xmm4
- DB 68,15,40,5,240,228,0,0 ; movaps 0xe4f0(%rip),%xmm8 # 2cd40 <_sk_overlay_sse2_8bit+0x10cb>
+ DB 68,15,40,5,48,228,0,0 ; movaps 0xe430(%rip),%xmm8 # 2cc80 <_sk_overlay_sse2_8bit+0x10d0>
DB 65,15,89,224 ; mulps %xmm8,%xmm4
DB 102,65,15,111,233 ; movdqa %xmm9,%xmm5
DB 102,15,114,213,8 ; psrld $0x8,%xmm5
@@ -29039,11 +29039,11 @@ _sk_gather_8888_sse2 LABEL PROC
DB 102,67,15,110,12,136 ; movd (%r8,%r9,4),%xmm1
DB 102,68,15,98,201 ; punpckldq %xmm1,%xmm9
DB 102,68,15,98,200 ; punpckldq %xmm0,%xmm9
- DB 102,15,111,21,158,226,0,0 ; movdqa 0xe29e(%rip),%xmm2 # 2cbf0 <_sk_overlay_sse2_8bit+0xf7b>
+ DB 102,15,111,21,222,225,0,0 ; movdqa 0xe1de(%rip),%xmm2 # 2cb30 <_sk_overlay_sse2_8bit+0xf80>
DB 102,65,15,111,193 ; movdqa %xmm9,%xmm0
DB 102,15,219,194 ; pand %xmm2,%xmm0
DB 15,91,192 ; cvtdq2ps %xmm0,%xmm0
- DB 68,15,40,5,218,227,0,0 ; movaps 0xe3da(%rip),%xmm8 # 2cd40 <_sk_overlay_sse2_8bit+0x10cb>
+ DB 68,15,40,5,26,227,0,0 ; movaps 0xe31a(%rip),%xmm8 # 2cc80 <_sk_overlay_sse2_8bit+0x10d0>
DB 65,15,89,192 ; mulps %xmm8,%xmm0
DB 102,65,15,111,201 ; movdqa %xmm9,%xmm1
DB 102,15,114,209,8 ; psrld $0x8,%xmm1
@@ -29070,7 +29070,7 @@ _sk_store_8888_sse2 LABEL PROC
DB 73,193,224,2 ; shl $0x2,%r8
DB 76,3,0 ; add (%rax),%r8
DB 72,99,194 ; movslq %edx,%rax
- DB 68,15,40,5,91,226,0,0 ; movaps 0xe25b(%rip),%xmm8 # 2cc20 <_sk_overlay_sse2_8bit+0xfab>
+ DB 68,15,40,5,155,225,0,0 ; movaps 0xe19b(%rip),%xmm8 # 2cb60 <_sk_overlay_sse2_8bit+0xfb0>
DB 68,15,40,200 ; movaps %xmm0,%xmm9
DB 69,15,89,200 ; mulps %xmm8,%xmm9
DB 102,69,15,91,201 ; cvtps2dq %xmm9,%xmm9
@@ -29120,11 +29120,11 @@ _sk_load_bgra_sse2 LABEL PROC
DB 72,133,255 ; test %rdi,%rdi
DB 117,98 ; jne 1ead9 <_sk_load_bgra_sse2+0x7e>
DB 243,69,15,111,12,128 ; movdqu (%r8,%rax,4),%xmm9
- DB 102,15,111,5,107,225,0,0 ; movdqa 0xe16b(%rip),%xmm0 # 2cbf0 <_sk_overlay_sse2_8bit+0xf7b>
+ DB 102,15,111,5,171,224,0,0 ; movdqa 0xe0ab(%rip),%xmm0 # 2cb30 <_sk_overlay_sse2_8bit+0xf80>
DB 102,65,15,111,201 ; movdqa %xmm9,%xmm1
DB 102,15,219,200 ; pand %xmm0,%xmm1
DB 15,91,209 ; cvtdq2ps %xmm1,%xmm2
- DB 68,15,40,5,167,226,0,0 ; movaps 0xe2a7(%rip),%xmm8 # 2cd40 <_sk_overlay_sse2_8bit+0x10cb>
+ DB 68,15,40,5,231,225,0,0 ; movaps 0xe1e7(%rip),%xmm8 # 2cc80 <_sk_overlay_sse2_8bit+0x10d0>
DB 65,15,89,208 ; mulps %xmm8,%xmm2
DB 102,65,15,111,201 ; movdqa %xmm9,%xmm1
DB 102,15,114,209,8 ; psrld $0x8,%xmm1
@@ -29169,11 +29169,11 @@ _sk_load_bgra_dst_sse2 LABEL PROC
DB 72,133,255 ; test %rdi,%rdi
DB 117,98 ; jne 1eb98 <_sk_load_bgra_dst_sse2+0x7e>
DB 243,69,15,111,12,128 ; movdqu (%r8,%rax,4),%xmm9
- DB 102,15,111,37,172,224,0,0 ; movdqa 0xe0ac(%rip),%xmm4 # 2cbf0 <_sk_overlay_sse2_8bit+0xf7b>
+ DB 102,15,111,37,236,223,0,0 ; movdqa 0xdfec(%rip),%xmm4 # 2cb30 <_sk_overlay_sse2_8bit+0xf80>
DB 102,65,15,111,233 ; movdqa %xmm9,%xmm5
DB 102,15,219,236 ; pand %xmm4,%xmm5
DB 15,91,245 ; cvtdq2ps %xmm5,%xmm6
- DB 68,15,40,5,232,225,0,0 ; movaps 0xe1e8(%rip),%xmm8 # 2cd40 <_sk_overlay_sse2_8bit+0x10cb>
+ DB 68,15,40,5,40,225,0,0 ; movaps 0xe128(%rip),%xmm8 # 2cc80 <_sk_overlay_sse2_8bit+0x10d0>
DB 65,15,89,240 ; mulps %xmm8,%xmm6
DB 102,65,15,111,233 ; movdqa %xmm9,%xmm5
DB 102,15,114,213,8 ; psrld $0x8,%xmm5
@@ -29235,11 +29235,11 @@ _sk_gather_bgra_sse2 LABEL PROC
DB 102,67,15,110,12,136 ; movd (%r8,%r9,4),%xmm1
DB 102,68,15,98,201 ; punpckldq %xmm1,%xmm9
DB 102,68,15,98,200 ; punpckldq %xmm0,%xmm9
- DB 102,15,111,5,150,223,0,0 ; movdqa 0xdf96(%rip),%xmm0 # 2cbf0 <_sk_overlay_sse2_8bit+0xf7b>
+ DB 102,15,111,5,214,222,0,0 ; movdqa 0xded6(%rip),%xmm0 # 2cb30 <_sk_overlay_sse2_8bit+0xf80>
DB 102,65,15,111,201 ; movdqa %xmm9,%xmm1
DB 102,15,219,200 ; pand %xmm0,%xmm1
DB 15,91,209 ; cvtdq2ps %xmm1,%xmm2
- DB 68,15,40,5,210,224,0,0 ; movaps 0xe0d2(%rip),%xmm8 # 2cd40 <_sk_overlay_sse2_8bit+0x10cb>
+ DB 68,15,40,5,18,224,0,0 ; movaps 0xe012(%rip),%xmm8 # 2cc80 <_sk_overlay_sse2_8bit+0x10d0>
DB 65,15,89,208 ; mulps %xmm8,%xmm2
DB 102,65,15,111,201 ; movdqa %xmm9,%xmm1
DB 102,15,114,209,8 ; psrld $0x8,%xmm1
@@ -29266,7 +29266,7 @@ _sk_store_bgra_sse2 LABEL PROC
DB 73,193,224,2 ; shl $0x2,%r8
DB 76,3,0 ; add (%rax),%r8
DB 72,99,194 ; movslq %edx,%rax
- DB 68,15,40,5,83,223,0,0 ; movaps 0xdf53(%rip),%xmm8 # 2cc20 <_sk_overlay_sse2_8bit+0xfab>
+ DB 68,15,40,5,147,222,0,0 ; movaps 0xde93(%rip),%xmm8 # 2cb60 <_sk_overlay_sse2_8bit+0xfb0>
DB 68,15,40,202 ; movaps %xmm2,%xmm9
DB 69,15,89,200 ; mulps %xmm8,%xmm9
DB 102,69,15,91,201 ; cvtps2dq %xmm9,%xmm9
@@ -29326,7 +29326,7 @@ _sk_load_f16_sse2 LABEL PROC
DB 102,69,15,239,210 ; pxor %xmm10,%xmm10
DB 102,65,15,111,206 ; movdqa %xmm14,%xmm1
DB 102,65,15,97,202 ; punpcklwd %xmm10,%xmm1
- DB 102,68,15,111,13,75,226,0,0 ; movdqa 0xe24b(%rip),%xmm9 # 2d010 <_sk_overlay_sse2_8bit+0x139b>
+ DB 102,68,15,111,13,139,225,0,0 ; movdqa 0xe18b(%rip),%xmm9 # 2cf50 <_sk_overlay_sse2_8bit+0x13a0>
DB 102,15,111,193 ; movdqa %xmm1,%xmm0
DB 102,65,15,219,193 ; pand %xmm9,%xmm0
DB 102,15,239,200 ; pxor %xmm0,%xmm1
@@ -29334,11 +29334,11 @@ _sk_load_f16_sse2 LABEL PROC
DB 102,68,15,111,233 ; movdqa %xmm1,%xmm13
DB 102,65,15,114,245,13 ; pslld $0xd,%xmm13
DB 102,68,15,235,232 ; por %xmm0,%xmm13
- DB 102,68,15,111,29,64,226,0,0 ; movdqa 0xe240(%rip),%xmm11 # 2d030 <_sk_overlay_sse2_8bit+0x13bb>
+ DB 102,68,15,111,29,128,225,0,0 ; movdqa 0xe180(%rip),%xmm11 # 2cf70 <_sk_overlay_sse2_8bit+0x13c0>
DB 102,69,15,254,235 ; paddd %xmm11,%xmm13
- DB 102,68,15,111,37,66,226,0,0 ; movdqa 0xe242(%rip),%xmm12 # 2d040 <_sk_overlay_sse2_8bit+0x13cb>
+ DB 102,68,15,111,37,130,225,0,0 ; movdqa 0xe182(%rip),%xmm12 # 2cf80 <_sk_overlay_sse2_8bit+0x13d0>
DB 102,65,15,239,204 ; pxor %xmm12,%xmm1
- DB 102,15,111,29,229,227,0,0 ; movdqa 0xe3e5(%rip),%xmm3 # 2d1f0 <_sk_overlay_sse2_8bit+0x157b>
+ DB 102,15,111,29,37,227,0,0 ; movdqa 0xe325(%rip),%xmm3 # 2d130 <_sk_overlay_sse2_8bit+0x1580>
DB 102,15,111,195 ; movdqa %xmm3,%xmm0
DB 102,15,102,193 ; pcmpgtd %xmm1,%xmm0
DB 102,65,15,223,197 ; pandn %xmm13,%xmm0
@@ -29420,7 +29420,7 @@ _sk_load_f16_dst_sse2 LABEL PROC
DB 102,69,15,239,210 ; pxor %xmm10,%xmm10
DB 102,65,15,111,238 ; movdqa %xmm14,%xmm5
DB 102,65,15,97,234 ; punpcklwd %xmm10,%xmm5
- DB 102,68,15,111,13,139,224,0,0 ; movdqa 0xe08b(%rip),%xmm9 # 2d010 <_sk_overlay_sse2_8bit+0x139b>
+ DB 102,68,15,111,13,203,223,0,0 ; movdqa 0xdfcb(%rip),%xmm9 # 2cf50 <_sk_overlay_sse2_8bit+0x13a0>
DB 102,15,111,229 ; movdqa %xmm5,%xmm4
DB 102,65,15,219,225 ; pand %xmm9,%xmm4
DB 102,15,239,236 ; pxor %xmm4,%xmm5
@@ -29428,11 +29428,11 @@ _sk_load_f16_dst_sse2 LABEL PROC
DB 102,68,15,111,237 ; movdqa %xmm5,%xmm13
DB 102,65,15,114,245,13 ; pslld $0xd,%xmm13
DB 102,68,15,235,236 ; por %xmm4,%xmm13
- DB 102,68,15,111,29,128,224,0,0 ; movdqa 0xe080(%rip),%xmm11 # 2d030 <_sk_overlay_sse2_8bit+0x13bb>
+ DB 102,68,15,111,29,192,223,0,0 ; movdqa 0xdfc0(%rip),%xmm11 # 2cf70 <_sk_overlay_sse2_8bit+0x13c0>
DB 102,69,15,254,235 ; paddd %xmm11,%xmm13
- DB 102,68,15,111,37,130,224,0,0 ; movdqa 0xe082(%rip),%xmm12 # 2d040 <_sk_overlay_sse2_8bit+0x13cb>
+ DB 102,68,15,111,37,194,223,0,0 ; movdqa 0xdfc2(%rip),%xmm12 # 2cf80 <_sk_overlay_sse2_8bit+0x13d0>
DB 102,65,15,239,236 ; pxor %xmm12,%xmm5
- DB 102,15,111,61,37,226,0,0 ; movdqa 0xe225(%rip),%xmm7 # 2d1f0 <_sk_overlay_sse2_8bit+0x157b>
+ DB 102,15,111,61,101,225,0,0 ; movdqa 0xe165(%rip),%xmm7 # 2d130 <_sk_overlay_sse2_8bit+0x1580>
DB 102,15,111,231 ; movdqa %xmm7,%xmm4
DB 102,15,102,229 ; pcmpgtd %xmm5,%xmm4
DB 102,65,15,223,229 ; pandn %xmm13,%xmm4
@@ -29529,7 +29529,7 @@ _sk_gather_f16_sse2 LABEL PROC
DB 102,69,15,239,210 ; pxor %xmm10,%xmm10
DB 102,65,15,111,206 ; movdqa %xmm14,%xmm1
DB 102,65,15,97,202 ; punpcklwd %xmm10,%xmm1
- DB 102,68,15,111,13,133,222,0,0 ; movdqa 0xde85(%rip),%xmm9 # 2d010 <_sk_overlay_sse2_8bit+0x139b>
+ DB 102,68,15,111,13,197,221,0,0 ; movdqa 0xddc5(%rip),%xmm9 # 2cf50 <_sk_overlay_sse2_8bit+0x13a0>
DB 102,15,111,193 ; movdqa %xmm1,%xmm0
DB 102,65,15,219,193 ; pand %xmm9,%xmm0
DB 102,15,239,200 ; pxor %xmm0,%xmm1
@@ -29537,11 +29537,11 @@ _sk_gather_f16_sse2 LABEL PROC
DB 102,68,15,111,233 ; movdqa %xmm1,%xmm13
DB 102,65,15,114,245,13 ; pslld $0xd,%xmm13
DB 102,68,15,235,232 ; por %xmm0,%xmm13
- DB 102,68,15,111,29,122,222,0,0 ; movdqa 0xde7a(%rip),%xmm11 # 2d030 <_sk_overlay_sse2_8bit+0x13bb>
+ DB 102,68,15,111,29,186,221,0,0 ; movdqa 0xddba(%rip),%xmm11 # 2cf70 <_sk_overlay_sse2_8bit+0x13c0>
DB 102,69,15,254,235 ; paddd %xmm11,%xmm13
- DB 102,68,15,111,37,124,222,0,0 ; movdqa 0xde7c(%rip),%xmm12 # 2d040 <_sk_overlay_sse2_8bit+0x13cb>
+ DB 102,68,15,111,37,188,221,0,0 ; movdqa 0xddbc(%rip),%xmm12 # 2cf80 <_sk_overlay_sse2_8bit+0x13d0>
DB 102,65,15,239,204 ; pxor %xmm12,%xmm1
- DB 102,15,111,29,31,224,0,0 ; movdqa 0xe01f(%rip),%xmm3 # 2d1f0 <_sk_overlay_sse2_8bit+0x157b>
+ DB 102,15,111,29,95,223,0,0 ; movdqa 0xdf5f(%rip),%xmm3 # 2d130 <_sk_overlay_sse2_8bit+0x1580>
DB 102,15,111,195 ; movdqa %xmm3,%xmm0
DB 102,15,102,193 ; pcmpgtd %xmm1,%xmm0
DB 102,65,15,223,197 ; pandn %xmm13,%xmm0
@@ -29597,17 +29597,17 @@ _sk_store_f16_sse2 LABEL PROC
DB 73,193,224,3 ; shl $0x3,%r8
DB 76,3,0 ; add (%rax),%r8
DB 72,99,194 ; movslq %edx,%rax
- DB 102,68,15,111,21,117,221,0,0 ; movdqa 0xdd75(%rip),%xmm10 # 2d040 <_sk_overlay_sse2_8bit+0x13cb>
+ DB 102,68,15,111,21,181,220,0,0 ; movdqa 0xdcb5(%rip),%xmm10 # 2cf80 <_sk_overlay_sse2_8bit+0x13d0>
DB 102,68,15,111,224 ; movdqa %xmm0,%xmm12
DB 102,69,15,219,226 ; pand %xmm10,%xmm12
DB 102,68,15,111,232 ; movdqa %xmm0,%xmm13
DB 102,69,15,239,236 ; pxor %xmm12,%xmm13
- DB 102,68,15,111,13,104,221,0,0 ; movdqa 0xdd68(%rip),%xmm9 # 2d050 <_sk_overlay_sse2_8bit+0x13db>
+ DB 102,68,15,111,13,168,220,0,0 ; movdqa 0xdca8(%rip),%xmm9 # 2cf90 <_sk_overlay_sse2_8bit+0x13e0>
DB 102,65,15,114,212,16 ; psrld $0x10,%xmm12
DB 102,69,15,111,193 ; movdqa %xmm9,%xmm8
DB 102,69,15,102,197 ; pcmpgtd %xmm13,%xmm8
DB 102,65,15,114,213,13 ; psrld $0xd,%xmm13
- DB 102,68,15,111,29,89,221,0,0 ; movdqa 0xdd59(%rip),%xmm11 # 2d060 <_sk_overlay_sse2_8bit+0x13eb>
+ DB 102,68,15,111,29,153,220,0,0 ; movdqa 0xdc99(%rip),%xmm11 # 2cfa0 <_sk_overlay_sse2_8bit+0x13f0>
DB 102,69,15,235,227 ; por %xmm11,%xmm12
DB 102,69,15,254,229 ; paddd %xmm13,%xmm12
DB 102,65,15,114,244,16 ; pslld $0x10,%xmm12
@@ -29703,7 +29703,7 @@ _sk_load_u16_be_sse2 LABEL PROC
DB 102,69,15,239,201 ; pxor %xmm9,%xmm9
DB 102,65,15,97,201 ; punpcklwd %xmm9,%xmm1
DB 15,91,193 ; cvtdq2ps %xmm1,%xmm0
- DB 68,15,40,5,8,217,0,0 ; movaps 0xd908(%rip),%xmm8 # 2cdd0 <_sk_overlay_sse2_8bit+0x115b>
+ DB 68,15,40,5,72,216,0,0 ; movaps 0xd848(%rip),%xmm8 # 2cd10 <_sk_overlay_sse2_8bit+0x1160>
DB 65,15,89,192 ; mulps %xmm8,%xmm0
DB 102,15,111,203 ; movdqa %xmm3,%xmm1
DB 102,15,113,241,8 ; psllw $0x8,%xmm1
@@ -29777,7 +29777,7 @@ _sk_load_rgb_u16_be_sse2 LABEL PROC
DB 102,69,15,239,192 ; pxor %xmm8,%xmm8
DB 102,65,15,97,200 ; punpcklwd %xmm8,%xmm1
DB 15,91,193 ; cvtdq2ps %xmm1,%xmm0
- DB 68,15,40,13,206,215,0,0 ; movaps 0xd7ce(%rip),%xmm9 # 2cdd0 <_sk_overlay_sse2_8bit+0x115b>
+ DB 68,15,40,13,14,215,0,0 ; movaps 0xd70e(%rip),%xmm9 # 2cd10 <_sk_overlay_sse2_8bit+0x1160>
DB 65,15,89,193 ; mulps %xmm9,%xmm0
DB 102,15,111,203 ; movdqa %xmm3,%xmm1
DB 102,15,113,241,8 ; psllw $0x8,%xmm1
@@ -29794,7 +29794,7 @@ _sk_load_rgb_u16_be_sse2 LABEL PROC
DB 15,91,210 ; cvtdq2ps %xmm2,%xmm2
DB 65,15,89,209 ; mulps %xmm9,%xmm2
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 15,40,29,245,212,0,0 ; movaps 0xd4f5(%rip),%xmm3 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 15,40,29,53,212,0,0 ; movaps 0xd435(%rip),%xmm3 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 255,224 ; jmpq *%rax
DB 102,65,15,110,20,64 ; movd (%r8,%rax,2),%xmm2
DB 102,65,15,196,84,64,4,2 ; pinsrw $0x2,0x4(%r8,%rax,2),%xmm2
@@ -29826,7 +29826,7 @@ _sk_store_u16_be_sse2 LABEL PROC
DB 77,1,192 ; add %r8,%r8
DB 76,3,0 ; add (%rax),%r8
DB 73,99,193 ; movslq %r9d,%rax
- DB 68,15,40,21,158,217,0,0 ; movaps 0xd99e(%rip),%xmm10 # 2d070 <_sk_overlay_sse2_8bit+0x13fb>
+ DB 68,15,40,21,222,216,0,0 ; movaps 0xd8de(%rip),%xmm10 # 2cfb0 <_sk_overlay_sse2_8bit+0x1400>
DB 68,15,40,192 ; movaps %xmm0,%xmm8
DB 69,15,89,194 ; mulps %xmm10,%xmm8
DB 102,69,15,91,192 ; cvtps2dq %xmm8,%xmm8
@@ -30053,7 +30053,7 @@ _sk_repeat_x_sse2 LABEL PROC
DB 243,69,15,91,194 ; cvttps2dq %xmm10,%xmm8
DB 69,15,91,216 ; cvtdq2ps %xmm8,%xmm11
DB 69,15,194,211,1 ; cmpltps %xmm11,%xmm10
- DB 68,15,84,21,11,209,0,0 ; andps 0xd10b(%rip),%xmm10 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 68,15,84,21,75,208,0,0 ; andps 0xd04b(%rip),%xmm10 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 69,15,87,192 ; xorps %xmm8,%xmm8
DB 69,15,92,218 ; subps %xmm10,%xmm11
DB 69,15,198,201,0 ; shufps $0x0,%xmm9,%xmm9
@@ -30077,7 +30077,7 @@ _sk_repeat_y_sse2 LABEL PROC
DB 243,69,15,91,194 ; cvttps2dq %xmm10,%xmm8
DB 69,15,91,216 ; cvtdq2ps %xmm8,%xmm11
DB 69,15,194,211,1 ; cmpltps %xmm11,%xmm10
- DB 68,15,84,21,177,208,0,0 ; andps 0xd0b1(%rip),%xmm10 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 68,15,84,21,241,207,0,0 ; andps 0xcff1(%rip),%xmm10 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 69,15,87,192 ; xorps %xmm8,%xmm8
DB 69,15,92,218 ; subps %xmm10,%xmm11
DB 69,15,198,201,0 ; shufps $0x0,%xmm9,%xmm9
@@ -30101,13 +30101,13 @@ _sk_mirror_x_sse2 LABEL PROC
DB 65,15,92,193 ; subps %xmm9,%xmm0
DB 243,69,15,88,210 ; addss %xmm10,%xmm10
DB 69,15,198,210,0 ; shufps $0x0,%xmm10,%xmm10
- DB 243,68,15,89,29,246,197,0,0 ; mulss 0xc5f6(%rip),%xmm11 # 2c0e0 <_sk_overlay_sse2_8bit+0x46b>
+ DB 243,68,15,89,29,50,197,0,0 ; mulss 0xc532(%rip),%xmm11 # 2c01c <_sk_overlay_sse2_8bit+0x46c>
DB 69,15,198,219,0 ; shufps $0x0,%xmm11,%xmm11
DB 68,15,89,216 ; mulps %xmm0,%xmm11
DB 243,69,15,91,195 ; cvttps2dq %xmm11,%xmm8
DB 69,15,91,224 ; cvtdq2ps %xmm8,%xmm12
DB 69,15,194,220,1 ; cmpltps %xmm12,%xmm11
- DB 68,15,84,29,55,208,0,0 ; andps 0xd037(%rip),%xmm11 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 68,15,84,29,119,207,0,0 ; andps 0xcf77(%rip),%xmm11 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 69,15,87,192 ; xorps %xmm8,%xmm8
DB 69,15,92,227 ; subps %xmm11,%xmm12
DB 69,15,89,226 ; mulps %xmm10,%xmm12
@@ -30134,13 +30134,13 @@ _sk_mirror_y_sse2 LABEL PROC
DB 65,15,92,201 ; subps %xmm9,%xmm1
DB 243,69,15,88,210 ; addss %xmm10,%xmm10
DB 69,15,198,210,0 ; shufps $0x0,%xmm10,%xmm10
- DB 243,68,15,89,29,113,197,0,0 ; mulss 0xc571(%rip),%xmm11 # 2c0e0 <_sk_overlay_sse2_8bit+0x46b>
+ DB 243,68,15,89,29,173,196,0,0 ; mulss 0xc4ad(%rip),%xmm11 # 2c01c <_sk_overlay_sse2_8bit+0x46c>
DB 69,15,198,219,0 ; shufps $0x0,%xmm11,%xmm11
DB 68,15,89,217 ; mulps %xmm1,%xmm11
DB 243,69,15,91,195 ; cvttps2dq %xmm11,%xmm8
DB 69,15,91,224 ; cvtdq2ps %xmm8,%xmm12
DB 69,15,194,220,1 ; cmpltps %xmm12,%xmm11
- DB 68,15,84,29,178,207,0,0 ; andps 0xcfb2(%rip),%xmm11 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 68,15,84,29,242,206,0,0 ; andps 0xcef2(%rip),%xmm11 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 69,15,87,192 ; xorps %xmm8,%xmm8
DB 69,15,92,227 ; subps %xmm11,%xmm12
DB 69,15,89,226 ; mulps %xmm10,%xmm12
@@ -30161,7 +30161,7 @@ PUBLIC _sk_clamp_x_1_sse2
_sk_clamp_x_1_sse2 LABEL PROC
DB 69,15,87,192 ; xorps %xmm8,%xmm8
DB 68,15,95,192 ; maxps %xmm0,%xmm8
- DB 68,15,93,5,105,207,0,0 ; minps 0xcf69(%rip),%xmm8 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 68,15,93,5,169,206,0,0 ; minps 0xcea9(%rip),%xmm8 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 72,173 ; lods %ds:(%rsi),%rax
DB 65,15,40,192 ; movaps %xmm8,%xmm0
DB 255,224 ; jmpq *%rax
@@ -30172,7 +30172,7 @@ _sk_repeat_x_1_sse2 LABEL PROC
DB 69,15,91,192 ; cvtdq2ps %xmm8,%xmm8
DB 68,15,40,200 ; movaps %xmm0,%xmm9
DB 69,15,194,200,1 ; cmpltps %xmm8,%xmm9
- DB 68,15,84,13,71,207,0,0 ; andps 0xcf47(%rip),%xmm9 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 68,15,84,13,135,206,0,0 ; andps 0xce87(%rip),%xmm9 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 69,15,92,193 ; subps %xmm9,%xmm8
DB 65,15,92,192 ; subps %xmm8,%xmm0
DB 72,173 ; lods %ds:(%rsi),%rax
@@ -30180,14 +30180,14 @@ _sk_repeat_x_1_sse2 LABEL PROC
PUBLIC _sk_mirror_x_1_sse2
_sk_mirror_x_1_sse2 LABEL PROC
- DB 68,15,40,5,147,207,0,0 ; movaps 0xcf93(%rip),%xmm8 # 2cba0 <_sk_overlay_sse2_8bit+0xf2b>
+ DB 68,15,40,5,211,206,0,0 ; movaps 0xced3(%rip),%xmm8 # 2cae0 <_sk_overlay_sse2_8bit+0xf30>
DB 65,15,88,192 ; addps %xmm8,%xmm0
- DB 68,15,40,13,7,207,0,0 ; movaps 0xcf07(%rip),%xmm9 # 2cb20 <_sk_overlay_sse2_8bit+0xeab>
+ DB 68,15,40,13,71,206,0,0 ; movaps 0xce47(%rip),%xmm9 # 2ca60 <_sk_overlay_sse2_8bit+0xeb0>
DB 68,15,89,200 ; mulps %xmm0,%xmm9
DB 243,69,15,91,209 ; cvttps2dq %xmm9,%xmm10
DB 69,15,91,210 ; cvtdq2ps %xmm10,%xmm10
DB 69,15,194,202,1 ; cmpltps %xmm10,%xmm9
- DB 68,15,84,13,13,207,0,0 ; andps 0xcf0d(%rip),%xmm9 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 68,15,84,13,77,206,0,0 ; andps 0xce4d(%rip),%xmm9 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 69,15,87,219 ; xorps %xmm11,%xmm11
DB 69,15,92,209 ; subps %xmm9,%xmm10
DB 69,15,88,210 ; addps %xmm10,%xmm10
@@ -30201,10 +30201,10 @@ _sk_mirror_x_1_sse2 LABEL PROC
PUBLIC _sk_luminance_to_alpha_sse2
_sk_luminance_to_alpha_sse2 LABEL PROC
DB 15,40,218 ; movaps %xmm2,%xmm3
- DB 15,89,5,35,212,0,0 ; mulps 0xd423(%rip),%xmm0 # 2d080 <_sk_overlay_sse2_8bit+0x140b>
- DB 15,89,13,44,212,0,0 ; mulps 0xd42c(%rip),%xmm1 # 2d090 <_sk_overlay_sse2_8bit+0x141b>
+ DB 15,89,5,99,211,0,0 ; mulps 0xd363(%rip),%xmm0 # 2cfc0 <_sk_overlay_sse2_8bit+0x1410>
+ DB 15,89,13,108,211,0,0 ; mulps 0xd36c(%rip),%xmm1 # 2cfd0 <_sk_overlay_sse2_8bit+0x1420>
DB 15,88,200 ; addps %xmm0,%xmm1
- DB 15,89,29,50,212,0,0 ; mulps 0xd432(%rip),%xmm3 # 2d0a0 <_sk_overlay_sse2_8bit+0x142b>
+ DB 15,89,29,114,211,0,0 ; mulps 0xd372(%rip),%xmm3 # 2cfe0 <_sk_overlay_sse2_8bit+0x1430>
DB 15,88,217 ; addps %xmm1,%xmm3
DB 72,173 ; lods %ds:(%rsi),%rax
DB 15,87,192 ; xorps %xmm0,%xmm0
@@ -30598,15 +30598,15 @@ _sk_evenly_spaced_gradient_sse2 LABEL PROC
PUBLIC _sk_gauss_a_to_rgba_sse2
_sk_gauss_a_to_rgba_sse2 LABEL PROC
- DB 15,40,5,1,206,0,0 ; movaps 0xce01(%rip),%xmm0 # 2d0b0 <_sk_overlay_sse2_8bit+0x143b>
+ DB 15,40,5,65,205,0,0 ; movaps 0xcd41(%rip),%xmm0 # 2cff0 <_sk_overlay_sse2_8bit+0x1440>
DB 15,89,195 ; mulps %xmm3,%xmm0
- DB 15,88,5,7,206,0,0 ; addps 0xce07(%rip),%xmm0 # 2d0c0 <_sk_overlay_sse2_8bit+0x144b>
+ DB 15,88,5,71,205,0,0 ; addps 0xcd47(%rip),%xmm0 # 2d000 <_sk_overlay_sse2_8bit+0x1450>
DB 15,89,195 ; mulps %xmm3,%xmm0
- DB 15,88,5,13,206,0,0 ; addps 0xce0d(%rip),%xmm0 # 2d0d0 <_sk_overlay_sse2_8bit+0x145b>
+ DB 15,88,5,77,205,0,0 ; addps 0xcd4d(%rip),%xmm0 # 2d010 <_sk_overlay_sse2_8bit+0x1460>
DB 15,89,195 ; mulps %xmm3,%xmm0
- DB 15,88,5,19,206,0,0 ; addps 0xce13(%rip),%xmm0 # 2d0e0 <_sk_overlay_sse2_8bit+0x146b>
+ DB 15,88,5,83,205,0,0 ; addps 0xcd53(%rip),%xmm0 # 2d020 <_sk_overlay_sse2_8bit+0x1470>
DB 15,89,195 ; mulps %xmm3,%xmm0
- DB 15,88,5,25,206,0,0 ; addps 0xce19(%rip),%xmm0 # 2d0f0 <_sk_overlay_sse2_8bit+0x147b>
+ DB 15,88,5,89,205,0,0 ; addps 0xcd59(%rip),%xmm0 # 2d030 <_sk_overlay_sse2_8bit+0x1480>
DB 72,173 ; lods %ds:(%rsi),%rax
DB 15,40,200 ; movaps %xmm0,%xmm1
DB 15,40,208 ; movaps %xmm0,%xmm2
@@ -30624,7 +30624,7 @@ _sk_gradient_sse2 LABEL PROC
DB 73,255,200 ; dec %r8
DB 73,131,193,4 ; add $0x4,%r9
DB 102,15,239,201 ; pxor %xmm1,%xmm1
- DB 15,40,21,71,200,0,0 ; movaps 0xc847(%rip),%xmm2 # 2cb50 <_sk_overlay_sse2_8bit+0xedb>
+ DB 15,40,21,135,199,0,0 ; movaps 0xc787(%rip),%xmm2 # 2ca90 <_sk_overlay_sse2_8bit+0xee0>
DB 243,65,15,16,25 ; movss (%r9),%xmm3
DB 15,198,219,0 ; shufps $0x0,%xmm3,%xmm3
DB 15,194,216,2 ; cmpleps %xmm0,%xmm3
@@ -30768,29 +30768,29 @@ _sk_xy_to_unit_angle_sse2 LABEL PROC
DB 69,15,94,220 ; divps %xmm12,%xmm11
DB 69,15,40,227 ; movaps %xmm11,%xmm12
DB 69,15,89,228 ; mulps %xmm12,%xmm12
- DB 68,15,40,45,166,203,0,0 ; movaps 0xcba6(%rip),%xmm13 # 2d100 <_sk_overlay_sse2_8bit+0x148b>
+ DB 68,15,40,45,230,202,0,0 ; movaps 0xcae6(%rip),%xmm13 # 2d040 <_sk_overlay_sse2_8bit+0x1490>
DB 69,15,89,236 ; mulps %xmm12,%xmm13
- DB 68,15,88,45,170,203,0,0 ; addps 0xcbaa(%rip),%xmm13 # 2d110 <_sk_overlay_sse2_8bit+0x149b>
+ DB 68,15,88,45,234,202,0,0 ; addps 0xcaea(%rip),%xmm13 # 2d050 <_sk_overlay_sse2_8bit+0x14a0>
DB 69,15,89,236 ; mulps %xmm12,%xmm13
- DB 68,15,88,45,174,203,0,0 ; addps 0xcbae(%rip),%xmm13 # 2d120 <_sk_overlay_sse2_8bit+0x14ab>
+ DB 68,15,88,45,238,202,0,0 ; addps 0xcaee(%rip),%xmm13 # 2d060 <_sk_overlay_sse2_8bit+0x14b0>
DB 69,15,89,236 ; mulps %xmm12,%xmm13
- DB 68,15,88,45,178,203,0,0 ; addps 0xcbb2(%rip),%xmm13 # 2d130 <_sk_overlay_sse2_8bit+0x14bb>
+ DB 68,15,88,45,242,202,0,0 ; addps 0xcaf2(%rip),%xmm13 # 2d070 <_sk_overlay_sse2_8bit+0x14c0>
DB 69,15,89,235 ; mulps %xmm11,%xmm13
DB 69,15,194,202,1 ; cmpltps %xmm10,%xmm9
- DB 68,15,40,21,177,203,0,0 ; movaps 0xcbb1(%rip),%xmm10 # 2d140 <_sk_overlay_sse2_8bit+0x14cb>
+ DB 68,15,40,21,241,202,0,0 ; movaps 0xcaf1(%rip),%xmm10 # 2d080 <_sk_overlay_sse2_8bit+0x14d0>
DB 69,15,92,213 ; subps %xmm13,%xmm10
DB 69,15,84,209 ; andps %xmm9,%xmm10
DB 69,15,85,205 ; andnps %xmm13,%xmm9
DB 69,15,86,202 ; orps %xmm10,%xmm9
DB 68,15,194,192,1 ; cmpltps %xmm0,%xmm8
- DB 68,15,40,21,116,197,0,0 ; movaps 0xc574(%rip),%xmm10 # 2cb20 <_sk_overlay_sse2_8bit+0xeab>
+ DB 68,15,40,21,180,196,0,0 ; movaps 0xc4b4(%rip),%xmm10 # 2ca60 <_sk_overlay_sse2_8bit+0xeb0>
DB 69,15,92,209 ; subps %xmm9,%xmm10
DB 69,15,84,208 ; andps %xmm8,%xmm10
DB 69,15,85,193 ; andnps %xmm9,%xmm8
DB 69,15,86,194 ; orps %xmm10,%xmm8
DB 68,15,40,201 ; movaps %xmm1,%xmm9
DB 68,15,194,200,1 ; cmpltps %xmm0,%xmm9
- DB 68,15,40,21,115,197,0,0 ; movaps 0xc573(%rip),%xmm10 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 68,15,40,21,179,196,0,0 ; movaps 0xc4b3(%rip),%xmm10 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 69,15,92,208 ; subps %xmm8,%xmm10
DB 69,15,84,209 ; andps %xmm9,%xmm10
DB 69,15,85,200 ; andnps %xmm8,%xmm9
@@ -30821,7 +30821,7 @@ _sk_xy_to_2pt_conical_quadratic_max_sse2 LABEL PROC
DB 243,69,15,89,203 ; mulss %xmm11,%xmm9
DB 69,15,198,201,0 ; shufps $0x0,%xmm9,%xmm9
DB 68,15,88,200 ; addps %xmm0,%xmm9
- DB 68,15,89,13,26,203,0,0 ; mulps 0xcb1a(%rip),%xmm9 # 2d150 <_sk_overlay_sse2_8bit+0x14db>
+ DB 68,15,89,13,90,202,0,0 ; mulps 0xca5a(%rip),%xmm9 # 2d090 <_sk_overlay_sse2_8bit+0x14e0>
DB 15,89,192 ; mulps %xmm0,%xmm0
DB 68,15,40,225 ; movaps %xmm1,%xmm12
DB 69,15,89,228 ; mulps %xmm12,%xmm12
@@ -30829,7 +30829,7 @@ _sk_xy_to_2pt_conical_quadratic_max_sse2 LABEL PROC
DB 243,69,15,89,219 ; mulss %xmm11,%xmm11
DB 69,15,198,219,0 ; shufps $0x0,%xmm11,%xmm11
DB 69,15,92,227 ; subps %xmm11,%xmm12
- DB 68,15,89,21,5,203,0,0 ; mulps 0xcb05(%rip),%xmm10 # 2d160 <_sk_overlay_sse2_8bit+0x14eb>
+ DB 68,15,89,21,69,202,0,0 ; mulps 0xca45(%rip),%xmm10 # 2d0a0 <_sk_overlay_sse2_8bit+0x14f0>
DB 69,15,89,212 ; mulps %xmm12,%xmm10
DB 65,15,40,193 ; movaps %xmm9,%xmm0
DB 15,89,192 ; mulps %xmm0,%xmm0
@@ -30838,8 +30838,8 @@ _sk_xy_to_2pt_conical_quadratic_max_sse2 LABEL PROC
DB 69,15,198,192,0 ; shufps $0x0,%xmm8,%xmm8
DB 65,15,40,194 ; movaps %xmm10,%xmm0
DB 65,15,92,193 ; subps %xmm9,%xmm0
- DB 68,15,87,13,189,201,0,0 ; xorps 0xc9bd(%rip),%xmm9 # 2d040 <_sk_overlay_sse2_8bit+0x13cb>
- DB 68,15,89,5,149,196,0,0 ; mulps 0xc495(%rip),%xmm8 # 2cb20 <_sk_overlay_sse2_8bit+0xeab>
+ DB 68,15,87,13,253,200,0,0 ; xorps 0xc8fd(%rip),%xmm9 # 2cf80 <_sk_overlay_sse2_8bit+0x13d0>
+ DB 68,15,89,5,213,195,0,0 ; mulps 0xc3d5(%rip),%xmm8 # 2ca60 <_sk_overlay_sse2_8bit+0xeb0>
DB 65,15,89,192 ; mulps %xmm8,%xmm0
DB 69,15,92,202 ; subps %xmm10,%xmm9
DB 69,15,89,200 ; mulps %xmm8,%xmm9
@@ -30858,7 +30858,7 @@ _sk_xy_to_2pt_conical_quadratic_min_sse2 LABEL PROC
DB 243,69,15,89,203 ; mulss %xmm11,%xmm9
DB 69,15,198,201,0 ; shufps $0x0,%xmm9,%xmm9
DB 68,15,88,200 ; addps %xmm0,%xmm9
- DB 68,15,89,13,124,202,0,0 ; mulps 0xca7c(%rip),%xmm9 # 2d150 <_sk_overlay_sse2_8bit+0x14db>
+ DB 68,15,89,13,188,201,0,0 ; mulps 0xc9bc(%rip),%xmm9 # 2d090 <_sk_overlay_sse2_8bit+0x14e0>
DB 15,89,192 ; mulps %xmm0,%xmm0
DB 68,15,40,225 ; movaps %xmm1,%xmm12
DB 69,15,89,228 ; mulps %xmm12,%xmm12
@@ -30866,7 +30866,7 @@ _sk_xy_to_2pt_conical_quadratic_min_sse2 LABEL PROC
DB 243,69,15,89,219 ; mulss %xmm11,%xmm11
DB 69,15,198,219,0 ; shufps $0x0,%xmm11,%xmm11
DB 69,15,92,227 ; subps %xmm11,%xmm12
- DB 68,15,89,21,103,202,0,0 ; mulps 0xca67(%rip),%xmm10 # 2d160 <_sk_overlay_sse2_8bit+0x14eb>
+ DB 68,15,89,21,167,201,0,0 ; mulps 0xc9a7(%rip),%xmm10 # 2d0a0 <_sk_overlay_sse2_8bit+0x14f0>
DB 69,15,89,212 ; mulps %xmm12,%xmm10
DB 65,15,40,193 ; movaps %xmm9,%xmm0
DB 15,89,192 ; mulps %xmm0,%xmm0
@@ -30875,8 +30875,8 @@ _sk_xy_to_2pt_conical_quadratic_min_sse2 LABEL PROC
DB 69,15,198,192,0 ; shufps $0x0,%xmm8,%xmm8
DB 65,15,40,194 ; movaps %xmm10,%xmm0
DB 65,15,92,193 ; subps %xmm9,%xmm0
- DB 68,15,87,13,31,201,0,0 ; xorps 0xc91f(%rip),%xmm9 # 2d040 <_sk_overlay_sse2_8bit+0x13cb>
- DB 68,15,89,5,247,195,0,0 ; mulps 0xc3f7(%rip),%xmm8 # 2cb20 <_sk_overlay_sse2_8bit+0xeab>
+ DB 68,15,87,13,95,200,0,0 ; xorps 0xc85f(%rip),%xmm9 # 2cf80 <_sk_overlay_sse2_8bit+0x13d0>
+ DB 68,15,89,5,55,195,0,0 ; mulps 0xc337(%rip),%xmm8 # 2ca60 <_sk_overlay_sse2_8bit+0xeb0>
DB 65,15,89,192 ; mulps %xmm8,%xmm0
DB 69,15,92,202 ; subps %xmm10,%xmm9
DB 69,15,89,200 ; mulps %xmm8,%xmm9
@@ -30892,7 +30892,7 @@ _sk_xy_to_2pt_conical_linear_sse2 LABEL PROC
DB 243,69,15,89,200 ; mulss %xmm8,%xmm9
DB 69,15,198,201,0 ; shufps $0x0,%xmm9,%xmm9
DB 68,15,88,200 ; addps %xmm0,%xmm9
- DB 68,15,89,13,239,201,0,0 ; mulps 0xc9ef(%rip),%xmm9 # 2d150 <_sk_overlay_sse2_8bit+0x14db>
+ DB 68,15,89,13,47,201,0,0 ; mulps 0xc92f(%rip),%xmm9 # 2d090 <_sk_overlay_sse2_8bit+0x14e0>
DB 15,89,192 ; mulps %xmm0,%xmm0
DB 68,15,40,209 ; movaps %xmm1,%xmm10
DB 69,15,89,210 ; mulps %xmm10,%xmm10
@@ -30900,7 +30900,7 @@ _sk_xy_to_2pt_conical_linear_sse2 LABEL PROC
DB 243,69,15,89,192 ; mulss %xmm8,%xmm8
DB 69,15,198,192,0 ; shufps $0x0,%xmm8,%xmm8
DB 65,15,92,192 ; subps %xmm8,%xmm0
- DB 15,87,5,187,200,0,0 ; xorps 0xc8bb(%rip),%xmm0 # 2d040 <_sk_overlay_sse2_8bit+0x13cb>
+ DB 15,87,5,251,199,0,0 ; xorps 0xc7fb(%rip),%xmm0 # 2cf80 <_sk_overlay_sse2_8bit+0x13d0>
DB 65,15,94,193 ; divps %xmm9,%xmm0
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
@@ -30937,7 +30937,7 @@ _sk_apply_vector_mask_sse2 LABEL PROC
PUBLIC _sk_save_xy_sse2
_sk_save_xy_sse2 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 68,15,40,5,49,195,0,0 ; movaps 0xc331(%rip),%xmm8 # 2cb20 <_sk_overlay_sse2_8bit+0xeab>
+ DB 68,15,40,5,113,194,0,0 ; movaps 0xc271(%rip),%xmm8 # 2ca60 <_sk_overlay_sse2_8bit+0xeb0>
DB 15,17,0 ; movups %xmm0,(%rax)
DB 68,15,40,200 ; movaps %xmm0,%xmm9
DB 69,15,88,200 ; addps %xmm8,%xmm9
@@ -30945,7 +30945,7 @@ _sk_save_xy_sse2 LABEL PROC
DB 69,15,91,210 ; cvtdq2ps %xmm10,%xmm10
DB 69,15,40,217 ; movaps %xmm9,%xmm11
DB 69,15,194,218,1 ; cmpltps %xmm10,%xmm11
- DB 68,15,40,37,44,195,0,0 ; movaps 0xc32c(%rip),%xmm12 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 68,15,40,37,108,194,0,0 ; movaps 0xc26c(%rip),%xmm12 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 69,15,84,220 ; andps %xmm12,%xmm11
DB 69,15,92,211 ; subps %xmm11,%xmm10
DB 69,15,92,202 ; subps %xmm10,%xmm9
@@ -30988,8 +30988,8 @@ _sk_bilinear_nx_sse2 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 15,16,0 ; movups (%rax),%xmm0
DB 68,15,16,64,64 ; movups 0x40(%rax),%xmm8
- DB 15,88,5,197,200,0,0 ; addps 0xc8c5(%rip),%xmm0 # 2d170 <_sk_overlay_sse2_8bit+0x14fb>
- DB 68,15,40,13,141,194,0,0 ; movaps 0xc28d(%rip),%xmm9 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 15,88,5,5,200,0,0 ; addps 0xc805(%rip),%xmm0 # 2d0b0 <_sk_overlay_sse2_8bit+0x1500>
+ DB 68,15,40,13,205,193,0,0 ; movaps 0xc1cd(%rip),%xmm9 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 69,15,92,200 ; subps %xmm8,%xmm9
DB 68,15,17,136,128,0,0,0 ; movups %xmm9,0x80(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
@@ -31000,7 +31000,7 @@ _sk_bilinear_px_sse2 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 15,16,0 ; movups (%rax),%xmm0
DB 68,15,16,64,64 ; movups 0x40(%rax),%xmm8
- DB 15,88,5,76,194,0,0 ; addps 0xc24c(%rip),%xmm0 # 2cb20 <_sk_overlay_sse2_8bit+0xeab>
+ DB 15,88,5,140,193,0,0 ; addps 0xc18c(%rip),%xmm0 # 2ca60 <_sk_overlay_sse2_8bit+0xeb0>
DB 68,15,17,128,128,0,0,0 ; movups %xmm8,0x80(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
@@ -31010,8 +31010,8 @@ _sk_bilinear_ny_sse2 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 15,16,72,32 ; movups 0x20(%rax),%xmm1
DB 68,15,16,64,96 ; movups 0x60(%rax),%xmm8
- DB 15,88,13,126,200,0,0 ; addps 0xc87e(%rip),%xmm1 # 2d170 <_sk_overlay_sse2_8bit+0x14fb>
- DB 68,15,40,13,70,194,0,0 ; movaps 0xc246(%rip),%xmm9 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 15,88,13,190,199,0,0 ; addps 0xc7be(%rip),%xmm1 # 2d0b0 <_sk_overlay_sse2_8bit+0x1500>
+ DB 68,15,40,13,134,193,0,0 ; movaps 0xc186(%rip),%xmm9 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 69,15,92,200 ; subps %xmm8,%xmm9
DB 68,15,17,136,160,0,0,0 ; movups %xmm9,0xa0(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
@@ -31022,7 +31022,7 @@ _sk_bilinear_py_sse2 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 15,16,72,32 ; movups 0x20(%rax),%xmm1
DB 68,15,16,64,96 ; movups 0x60(%rax),%xmm8
- DB 15,88,13,4,194,0,0 ; addps 0xc204(%rip),%xmm1 # 2cb20 <_sk_overlay_sse2_8bit+0xeab>
+ DB 15,88,13,68,193,0,0 ; addps 0xc144(%rip),%xmm1 # 2ca60 <_sk_overlay_sse2_8bit+0xeb0>
DB 68,15,17,128,160,0,0,0 ; movups %xmm8,0xa0(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
@@ -31032,13 +31032,13 @@ _sk_bicubic_n3x_sse2 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 15,16,0 ; movups (%rax),%xmm0
DB 68,15,16,64,64 ; movups 0x40(%rax),%xmm8
- DB 15,88,5,71,200,0,0 ; addps 0xc847(%rip),%xmm0 # 2d180 <_sk_overlay_sse2_8bit+0x150b>
- DB 68,15,40,13,255,193,0,0 ; movaps 0xc1ff(%rip),%xmm9 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 15,88,5,135,199,0,0 ; addps 0xc787(%rip),%xmm0 # 2d0c0 <_sk_overlay_sse2_8bit+0x1510>
+ DB 68,15,40,13,63,193,0,0 ; movaps 0xc13f(%rip),%xmm9 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 69,15,92,200 ; subps %xmm8,%xmm9
DB 69,15,40,193 ; movaps %xmm9,%xmm8
DB 69,15,89,192 ; mulps %xmm8,%xmm8
- DB 68,15,89,13,59,200,0,0 ; mulps 0xc83b(%rip),%xmm9 # 2d190 <_sk_overlay_sse2_8bit+0x151b>
- DB 68,15,88,13,211,195,0,0 ; addps 0xc3d3(%rip),%xmm9 # 2cd30 <_sk_overlay_sse2_8bit+0x10bb>
+ DB 68,15,89,13,123,199,0,0 ; mulps 0xc77b(%rip),%xmm9 # 2d0d0 <_sk_overlay_sse2_8bit+0x1520>
+ DB 68,15,88,13,19,195,0,0 ; addps 0xc313(%rip),%xmm9 # 2cc70 <_sk_overlay_sse2_8bit+0x10c0>
DB 69,15,89,200 ; mulps %xmm8,%xmm9
DB 68,15,17,136,128,0,0,0 ; movups %xmm9,0x80(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
@@ -31049,16 +31049,16 @@ _sk_bicubic_n1x_sse2 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 15,16,0 ; movups (%rax),%xmm0
DB 68,15,16,64,64 ; movups 0x40(%rax),%xmm8
- DB 15,88,5,242,199,0,0 ; addps 0xc7f2(%rip),%xmm0 # 2d170 <_sk_overlay_sse2_8bit+0x14fb>
- DB 68,15,40,13,186,193,0,0 ; movaps 0xc1ba(%rip),%xmm9 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 15,88,5,50,199,0,0 ; addps 0xc732(%rip),%xmm0 # 2d0b0 <_sk_overlay_sse2_8bit+0x1500>
+ DB 68,15,40,13,250,192,0,0 ; movaps 0xc0fa(%rip),%xmm9 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 69,15,92,200 ; subps %xmm8,%xmm9
- DB 68,15,40,5,14,200,0,0 ; movaps 0xc80e(%rip),%xmm8 # 2d1a0 <_sk_overlay_sse2_8bit+0x152b>
+ DB 68,15,40,5,78,199,0,0 ; movaps 0xc74e(%rip),%xmm8 # 2d0e0 <_sk_overlay_sse2_8bit+0x1530>
DB 69,15,89,193 ; mulps %xmm9,%xmm8
- DB 68,15,88,5,18,200,0,0 ; addps 0xc812(%rip),%xmm8 # 2d1b0 <_sk_overlay_sse2_8bit+0x153b>
+ DB 68,15,88,5,82,199,0,0 ; addps 0xc752(%rip),%xmm8 # 2d0f0 <_sk_overlay_sse2_8bit+0x1540>
DB 69,15,89,193 ; mulps %xmm9,%xmm8
- DB 68,15,88,5,118,193,0,0 ; addps 0xc176(%rip),%xmm8 # 2cb20 <_sk_overlay_sse2_8bit+0xeab>
+ DB 68,15,88,5,182,192,0,0 ; addps 0xc0b6(%rip),%xmm8 # 2ca60 <_sk_overlay_sse2_8bit+0xeb0>
DB 69,15,89,193 ; mulps %xmm9,%xmm8
- DB 68,15,88,5,10,200,0,0 ; addps 0xc80a(%rip),%xmm8 # 2d1c0 <_sk_overlay_sse2_8bit+0x154b>
+ DB 68,15,88,5,74,199,0,0 ; addps 0xc74a(%rip),%xmm8 # 2d100 <_sk_overlay_sse2_8bit+0x1550>
DB 68,15,17,128,128,0,0,0 ; movups %xmm8,0x80(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
@@ -31066,17 +31066,17 @@ _sk_bicubic_n1x_sse2 LABEL PROC
PUBLIC _sk_bicubic_p1x_sse2
_sk_bicubic_p1x_sse2 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 68,15,40,5,84,193,0,0 ; movaps 0xc154(%rip),%xmm8 # 2cb20 <_sk_overlay_sse2_8bit+0xeab>
+ DB 68,15,40,5,148,192,0,0 ; movaps 0xc094(%rip),%xmm8 # 2ca60 <_sk_overlay_sse2_8bit+0xeb0>
DB 15,16,0 ; movups (%rax),%xmm0
DB 68,15,16,72,64 ; movups 0x40(%rax),%xmm9
DB 65,15,88,192 ; addps %xmm8,%xmm0
- DB 68,15,40,21,192,199,0,0 ; movaps 0xc7c0(%rip),%xmm10 # 2d1a0 <_sk_overlay_sse2_8bit+0x152b>
+ DB 68,15,40,21,0,199,0,0 ; movaps 0xc700(%rip),%xmm10 # 2d0e0 <_sk_overlay_sse2_8bit+0x1530>
DB 69,15,89,209 ; mulps %xmm9,%xmm10
- DB 68,15,88,21,196,199,0,0 ; addps 0xc7c4(%rip),%xmm10 # 2d1b0 <_sk_overlay_sse2_8bit+0x153b>
+ DB 68,15,88,21,4,199,0,0 ; addps 0xc704(%rip),%xmm10 # 2d0f0 <_sk_overlay_sse2_8bit+0x1540>
DB 69,15,89,209 ; mulps %xmm9,%xmm10
DB 69,15,88,208 ; addps %xmm8,%xmm10
DB 69,15,89,209 ; mulps %xmm9,%xmm10
- DB 68,15,88,21,192,199,0,0 ; addps 0xc7c0(%rip),%xmm10 # 2d1c0 <_sk_overlay_sse2_8bit+0x154b>
+ DB 68,15,88,21,0,199,0,0 ; addps 0xc700(%rip),%xmm10 # 2d100 <_sk_overlay_sse2_8bit+0x1550>
DB 68,15,17,144,128,0,0,0 ; movups %xmm10,0x80(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
@@ -31086,11 +31086,11 @@ _sk_bicubic_p3x_sse2 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 15,16,0 ; movups (%rax),%xmm0
DB 68,15,16,64,64 ; movups 0x40(%rax),%xmm8
- DB 15,88,5,147,199,0,0 ; addps 0xc793(%rip),%xmm0 # 2d1b0 <_sk_overlay_sse2_8bit+0x153b>
+ DB 15,88,5,211,198,0,0 ; addps 0xc6d3(%rip),%xmm0 # 2d0f0 <_sk_overlay_sse2_8bit+0x1540>
DB 69,15,40,200 ; movaps %xmm8,%xmm9
DB 69,15,89,201 ; mulps %xmm9,%xmm9
- DB 68,15,89,5,99,199,0,0 ; mulps 0xc763(%rip),%xmm8 # 2d190 <_sk_overlay_sse2_8bit+0x151b>
- DB 68,15,88,5,251,194,0,0 ; addps 0xc2fb(%rip),%xmm8 # 2cd30 <_sk_overlay_sse2_8bit+0x10bb>
+ DB 68,15,89,5,163,198,0,0 ; mulps 0xc6a3(%rip),%xmm8 # 2d0d0 <_sk_overlay_sse2_8bit+0x1520>
+ DB 68,15,88,5,59,194,0,0 ; addps 0xc23b(%rip),%xmm8 # 2cc70 <_sk_overlay_sse2_8bit+0x10c0>
DB 69,15,89,193 ; mulps %xmm9,%xmm8
DB 68,15,17,128,128,0,0,0 ; movups %xmm8,0x80(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
@@ -31101,13 +31101,13 @@ _sk_bicubic_n3y_sse2 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 15,16,72,32 ; movups 0x20(%rax),%xmm1
DB 68,15,16,64,96 ; movups 0x60(%rax),%xmm8
- DB 15,88,13,41,199,0,0 ; addps 0xc729(%rip),%xmm1 # 2d180 <_sk_overlay_sse2_8bit+0x150b>
- DB 68,15,40,13,225,192,0,0 ; movaps 0xc0e1(%rip),%xmm9 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 15,88,13,105,198,0,0 ; addps 0xc669(%rip),%xmm1 # 2d0c0 <_sk_overlay_sse2_8bit+0x1510>
+ DB 68,15,40,13,33,192,0,0 ; movaps 0xc021(%rip),%xmm9 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 69,15,92,200 ; subps %xmm8,%xmm9
DB 69,15,40,193 ; movaps %xmm9,%xmm8
DB 69,15,89,192 ; mulps %xmm8,%xmm8
- DB 68,15,89,13,29,199,0,0 ; mulps 0xc71d(%rip),%xmm9 # 2d190 <_sk_overlay_sse2_8bit+0x151b>
- DB 68,15,88,13,181,194,0,0 ; addps 0xc2b5(%rip),%xmm9 # 2cd30 <_sk_overlay_sse2_8bit+0x10bb>
+ DB 68,15,89,13,93,198,0,0 ; mulps 0xc65d(%rip),%xmm9 # 2d0d0 <_sk_overlay_sse2_8bit+0x1520>
+ DB 68,15,88,13,245,193,0,0 ; addps 0xc1f5(%rip),%xmm9 # 2cc70 <_sk_overlay_sse2_8bit+0x10c0>
DB 69,15,89,200 ; mulps %xmm8,%xmm9
DB 68,15,17,136,160,0,0,0 ; movups %xmm9,0xa0(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
@@ -31118,16 +31118,16 @@ _sk_bicubic_n1y_sse2 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 15,16,72,32 ; movups 0x20(%rax),%xmm1
DB 68,15,16,64,96 ; movups 0x60(%rax),%xmm8
- DB 15,88,13,211,198,0,0 ; addps 0xc6d3(%rip),%xmm1 # 2d170 <_sk_overlay_sse2_8bit+0x14fb>
- DB 68,15,40,13,155,192,0,0 ; movaps 0xc09b(%rip),%xmm9 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 15,88,13,19,198,0,0 ; addps 0xc613(%rip),%xmm1 # 2d0b0 <_sk_overlay_sse2_8bit+0x1500>
+ DB 68,15,40,13,219,191,0,0 ; movaps 0xbfdb(%rip),%xmm9 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 69,15,92,200 ; subps %xmm8,%xmm9
- DB 68,15,40,5,239,198,0,0 ; movaps 0xc6ef(%rip),%xmm8 # 2d1a0 <_sk_overlay_sse2_8bit+0x152b>
+ DB 68,15,40,5,47,198,0,0 ; movaps 0xc62f(%rip),%xmm8 # 2d0e0 <_sk_overlay_sse2_8bit+0x1530>
DB 69,15,89,193 ; mulps %xmm9,%xmm8
- DB 68,15,88,5,243,198,0,0 ; addps 0xc6f3(%rip),%xmm8 # 2d1b0 <_sk_overlay_sse2_8bit+0x153b>
+ DB 68,15,88,5,51,198,0,0 ; addps 0xc633(%rip),%xmm8 # 2d0f0 <_sk_overlay_sse2_8bit+0x1540>
DB 69,15,89,193 ; mulps %xmm9,%xmm8
- DB 68,15,88,5,87,192,0,0 ; addps 0xc057(%rip),%xmm8 # 2cb20 <_sk_overlay_sse2_8bit+0xeab>
+ DB 68,15,88,5,151,191,0,0 ; addps 0xbf97(%rip),%xmm8 # 2ca60 <_sk_overlay_sse2_8bit+0xeb0>
DB 69,15,89,193 ; mulps %xmm9,%xmm8
- DB 68,15,88,5,235,198,0,0 ; addps 0xc6eb(%rip),%xmm8 # 2d1c0 <_sk_overlay_sse2_8bit+0x154b>
+ DB 68,15,88,5,43,198,0,0 ; addps 0xc62b(%rip),%xmm8 # 2d100 <_sk_overlay_sse2_8bit+0x1550>
DB 68,15,17,128,160,0,0,0 ; movups %xmm8,0xa0(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
@@ -31135,17 +31135,17 @@ _sk_bicubic_n1y_sse2 LABEL PROC
PUBLIC _sk_bicubic_p1y_sse2
_sk_bicubic_p1y_sse2 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 68,15,40,5,53,192,0,0 ; movaps 0xc035(%rip),%xmm8 # 2cb20 <_sk_overlay_sse2_8bit+0xeab>
+ DB 68,15,40,5,117,191,0,0 ; movaps 0xbf75(%rip),%xmm8 # 2ca60 <_sk_overlay_sse2_8bit+0xeb0>
DB 15,16,72,32 ; movups 0x20(%rax),%xmm1
DB 68,15,16,72,96 ; movups 0x60(%rax),%xmm9
DB 65,15,88,200 ; addps %xmm8,%xmm1
- DB 68,15,40,21,160,198,0,0 ; movaps 0xc6a0(%rip),%xmm10 # 2d1a0 <_sk_overlay_sse2_8bit+0x152b>
+ DB 68,15,40,21,224,197,0,0 ; movaps 0xc5e0(%rip),%xmm10 # 2d0e0 <_sk_overlay_sse2_8bit+0x1530>
DB 69,15,89,209 ; mulps %xmm9,%xmm10
- DB 68,15,88,21,164,198,0,0 ; addps 0xc6a4(%rip),%xmm10 # 2d1b0 <_sk_overlay_sse2_8bit+0x153b>
+ DB 68,15,88,21,228,197,0,0 ; addps 0xc5e4(%rip),%xmm10 # 2d0f0 <_sk_overlay_sse2_8bit+0x1540>
DB 69,15,89,209 ; mulps %xmm9,%xmm10
DB 69,15,88,208 ; addps %xmm8,%xmm10
DB 69,15,89,209 ; mulps %xmm9,%xmm10
- DB 68,15,88,21,160,198,0,0 ; addps 0xc6a0(%rip),%xmm10 # 2d1c0 <_sk_overlay_sse2_8bit+0x154b>
+ DB 68,15,88,21,224,197,0,0 ; addps 0xc5e0(%rip),%xmm10 # 2d100 <_sk_overlay_sse2_8bit+0x1550>
DB 68,15,17,144,160,0,0,0 ; movups %xmm10,0xa0(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
@@ -31155,11 +31155,11 @@ _sk_bicubic_p3y_sse2 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 15,16,72,32 ; movups 0x20(%rax),%xmm1
DB 68,15,16,64,96 ; movups 0x60(%rax),%xmm8
- DB 15,88,13,114,198,0,0 ; addps 0xc672(%rip),%xmm1 # 2d1b0 <_sk_overlay_sse2_8bit+0x153b>
+ DB 15,88,13,178,197,0,0 ; addps 0xc5b2(%rip),%xmm1 # 2d0f0 <_sk_overlay_sse2_8bit+0x1540>
DB 69,15,40,200 ; movaps %xmm8,%xmm9
DB 69,15,89,201 ; mulps %xmm9,%xmm9
- DB 68,15,89,5,66,198,0,0 ; mulps 0xc642(%rip),%xmm8 # 2d190 <_sk_overlay_sse2_8bit+0x151b>
- DB 68,15,88,5,218,193,0,0 ; addps 0xc1da(%rip),%xmm8 # 2cd30 <_sk_overlay_sse2_8bit+0x10bb>
+ DB 68,15,89,5,130,197,0,0 ; mulps 0xc582(%rip),%xmm8 # 2d0d0 <_sk_overlay_sse2_8bit+0x1520>
+ DB 68,15,88,5,26,193,0,0 ; addps 0xc11a(%rip),%xmm8 # 2cc70 <_sk_overlay_sse2_8bit+0x10c0>
DB 69,15,89,193 ; mulps %xmm9,%xmm8
DB 68,15,17,128,160,0,0,0 ; movups %xmm8,0xa0(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
@@ -31289,7 +31289,7 @@ _sk_clut_3D_sse2 LABEL PROC
DB 102,15,254,216 ; paddd %xmm0,%xmm3
DB 102,65,15,111,198 ; movdqa %xmm14,%xmm0
DB 102,15,254,195 ; paddd %xmm3,%xmm0
- DB 102,15,111,45,154,196,0,0 ; movdqa 0xc49a(%rip),%xmm5 # 2d1e0 <_sk_overlay_sse2_8bit+0x156b>
+ DB 102,15,111,45,218,195,0,0 ; movdqa 0xc3da(%rip),%xmm5 # 2d120 <_sk_overlay_sse2_8bit+0x1570>
DB 102,15,112,200,245 ; pshufd $0xf5,%xmm0,%xmm1
DB 102,15,244,197 ; pmuludq %xmm5,%xmm0
DB 102,15,112,192,232 ; pshufd $0xe8,%xmm0,%xmm0
@@ -31312,7 +31312,7 @@ _sk_clut_3D_sse2 LABEL PROC
DB 15,20,241 ; unpcklps %xmm1,%xmm6
DB 15,20,245 ; unpcklps %xmm5,%xmm6
DB 102,15,111,200 ; movdqa %xmm0,%xmm1
- DB 102,15,254,13,157,189,0,0 ; paddd 0xbd9d(%rip),%xmm1 # 2cb50 <_sk_overlay_sse2_8bit+0xedb>
+ DB 102,15,254,13,221,188,0,0 ; paddd 0xbcdd(%rip),%xmm1 # 2ca90 <_sk_overlay_sse2_8bit+0xee0>
DB 102,15,112,233,78 ; pshufd $0x4e,%xmm1,%xmm5
DB 102,73,15,126,232 ; movq %xmm5,%r8
DB 102,73,15,126,201 ; movq %xmm1,%r9
@@ -31329,7 +31329,7 @@ _sk_clut_3D_sse2 LABEL PROC
DB 243,67,15,16,44,131 ; movss (%r11,%r8,4),%xmm5
DB 15,20,253 ; unpcklps %xmm5,%xmm7
DB 15,20,249 ; unpcklps %xmm1,%xmm7
- DB 102,15,254,5,113,189,0,0 ; paddd 0xbd71(%rip),%xmm0 # 2cb70 <_sk_overlay_sse2_8bit+0xefb>
+ DB 102,15,254,5,177,188,0,0 ; paddd 0xbcb1(%rip),%xmm0 # 2cab0 <_sk_overlay_sse2_8bit+0xf00>
DB 102,15,112,200,78 ; pshufd $0x4e,%xmm0,%xmm1
DB 102,73,15,126,200 ; movq %xmm1,%r8
DB 102,73,15,126,193 ; movq %xmm0,%r9
@@ -31346,7 +31346,7 @@ _sk_clut_3D_sse2 LABEL PROC
DB 243,67,15,16,44,131 ; movss (%r11,%r8,4),%xmm5
DB 15,20,205 ; unpcklps %xmm5,%xmm1
DB 15,20,200 ; unpcklps %xmm0,%xmm1
- DB 15,40,45,134,195,0,0 ; movaps 0xc386(%rip),%xmm5 # 2d1d0 <_sk_overlay_sse2_8bit+0x155b>
+ DB 15,40,45,198,194,0,0 ; movaps 0xc2c6(%rip),%xmm5 # 2d110 <_sk_overlay_sse2_8bit+0x1560>
DB 15,88,229 ; addps %xmm5,%xmm4
DB 15,41,100,36,64 ; movaps %xmm4,0x40(%rsp)
DB 68,15,88,213 ; addps %xmm5,%xmm10
@@ -31361,7 +31361,7 @@ _sk_clut_3D_sse2 LABEL PROC
DB 102,15,127,68,36,32 ; movdqa %xmm0,0x20(%rsp)
DB 102,15,254,216 ; paddd %xmm0,%xmm3
DB 102,15,112,227,245 ; pshufd $0xf5,%xmm3,%xmm4
- DB 102,15,111,5,79,195,0,0 ; movdqa 0xc34f(%rip),%xmm0 # 2d1e0 <_sk_overlay_sse2_8bit+0x156b>
+ DB 102,15,111,5,143,194,0,0 ; movdqa 0xc28f(%rip),%xmm0 # 2d120 <_sk_overlay_sse2_8bit+0x1570>
DB 102,15,244,216 ; pmuludq %xmm0,%xmm3
DB 102,15,112,211,232 ; pshufd $0xe8,%xmm3,%xmm2
DB 102,15,244,224 ; pmuludq %xmm0,%xmm4
@@ -31383,7 +31383,7 @@ _sk_clut_3D_sse2 LABEL PROC
DB 15,20,227 ; unpcklps %xmm3,%xmm4
DB 15,20,229 ; unpcklps %xmm5,%xmm4
DB 102,15,111,218 ; movdqa %xmm2,%xmm3
- DB 102,15,254,29,86,188,0,0 ; paddd 0xbc56(%rip),%xmm3 # 2cb50 <_sk_overlay_sse2_8bit+0xedb>
+ DB 102,15,254,29,150,187,0,0 ; paddd 0xbb96(%rip),%xmm3 # 2ca90 <_sk_overlay_sse2_8bit+0xee0>
DB 102,15,112,235,78 ; pshufd $0x4e,%xmm3,%xmm5
DB 102,73,15,126,232 ; movq %xmm5,%r8
DB 102,73,15,126,217 ; movq %xmm3,%r9
@@ -31400,7 +31400,7 @@ _sk_clut_3D_sse2 LABEL PROC
DB 243,67,15,16,4,131 ; movss (%r11,%r8,4),%xmm0
DB 15,20,216 ; unpcklps %xmm0,%xmm3
DB 15,20,221 ; unpcklps %xmm5,%xmm3
- DB 102,15,254,21,42,188,0,0 ; paddd 0xbc2a(%rip),%xmm2 # 2cb70 <_sk_overlay_sse2_8bit+0xefb>
+ DB 102,15,254,21,106,187,0,0 ; paddd 0xbb6a(%rip),%xmm2 # 2cab0 <_sk_overlay_sse2_8bit+0xf00>
DB 102,15,112,194,78 ; pshufd $0x4e,%xmm2,%xmm0
DB 102,73,15,126,192 ; movq %xmm0,%r8
DB 102,73,15,126,209 ; movq %xmm2,%r9
@@ -31462,7 +31462,7 @@ _sk_clut_3D_sse2 LABEL PROC
DB 68,15,20,193 ; unpcklps %xmm1,%xmm8
DB 68,15,20,199 ; unpcklps %xmm7,%xmm8
DB 102,15,111,200 ; movdqa %xmm0,%xmm1
- DB 102,68,15,111,21,242,186,0,0 ; movdqa 0xbaf2(%rip),%xmm10 # 2cb50 <_sk_overlay_sse2_8bit+0xedb>
+ DB 102,68,15,111,21,50,186,0,0 ; movdqa 0xba32(%rip),%xmm10 # 2ca90 <_sk_overlay_sse2_8bit+0xee0>
DB 102,65,15,254,202 ; paddd %xmm10,%xmm1
DB 102,15,112,249,78 ; pshufd $0x4e,%xmm1,%xmm7
DB 102,73,15,126,248 ; movq %xmm7,%r8
@@ -31480,7 +31480,7 @@ _sk_clut_3D_sse2 LABEL PROC
DB 243,67,15,16,44,131 ; movss (%r11,%r8,4),%xmm5
DB 15,20,205 ; unpcklps %xmm5,%xmm1
DB 15,20,207 ; unpcklps %xmm7,%xmm1
- DB 102,15,111,45,193,186,0,0 ; movdqa 0xbac1(%rip),%xmm5 # 2cb70 <_sk_overlay_sse2_8bit+0xefb>
+ DB 102,15,111,45,1,186,0,0 ; movdqa 0xba01(%rip),%xmm5 # 2cab0 <_sk_overlay_sse2_8bit+0xf00>
DB 102,15,254,197 ; paddd %xmm5,%xmm0
DB 102,15,112,232,78 ; pshufd $0x4e,%xmm0,%xmm5
DB 102,73,15,126,232 ; movq %xmm5,%r8
@@ -31538,7 +31538,7 @@ _sk_clut_3D_sse2 LABEL PROC
DB 243,67,15,16,60,131 ; movss (%r11,%r8,4),%xmm7
DB 68,15,20,223 ; unpcklps %xmm7,%xmm11
DB 68,15,20,221 ; unpcklps %xmm5,%xmm11
- DB 102,15,111,45,184,185,0,0 ; movdqa 0xb9b8(%rip),%xmm5 # 2cb70 <_sk_overlay_sse2_8bit+0xefb>
+ DB 102,15,111,45,248,184,0,0 ; movdqa 0xb8f8(%rip),%xmm5 # 2cab0 <_sk_overlay_sse2_8bit+0xf00>
DB 102,15,254,245 ; paddd %xmm5,%xmm6
DB 102,15,111,253 ; movdqa %xmm5,%xmm7
DB 102,15,112,238,78 ; pshufd $0x4e,%xmm6,%xmm5
@@ -31585,7 +31585,7 @@ _sk_clut_3D_sse2 LABEL PROC
DB 102,65,15,111,206 ; movdqa %xmm14,%xmm1
DB 102,65,15,254,201 ; paddd %xmm9,%xmm1
DB 102,15,112,209,245 ; pshufd $0xf5,%xmm1,%xmm2
- DB 102,15,111,5,90,191,0,0 ; movdqa 0xbf5a(%rip),%xmm0 # 2d1e0 <_sk_overlay_sse2_8bit+0x156b>
+ DB 102,15,111,5,154,190,0,0 ; movdqa 0xbe9a(%rip),%xmm0 # 2d120 <_sk_overlay_sse2_8bit+0x1570>
DB 102,15,244,200 ; pmuludq %xmm0,%xmm1
DB 102,15,112,217,232 ; pshufd $0xe8,%xmm1,%xmm3
DB 102,15,244,208 ; pmuludq %xmm0,%xmm2
@@ -31607,7 +31607,7 @@ _sk_clut_3D_sse2 LABEL PROC
DB 15,20,204 ; unpcklps %xmm4,%xmm1
DB 15,20,202 ; unpcklps %xmm2,%xmm1
DB 102,15,111,211 ; movdqa %xmm3,%xmm2
- DB 102,15,111,5,98,184,0,0 ; movdqa 0xb862(%rip),%xmm0 # 2cb50 <_sk_overlay_sse2_8bit+0xedb>
+ DB 102,15,111,5,162,183,0,0 ; movdqa 0xb7a2(%rip),%xmm0 # 2ca90 <_sk_overlay_sse2_8bit+0xee0>
DB 102,15,254,208 ; paddd %xmm0,%xmm2
DB 102,15,112,226,78 ; pshufd $0x4e,%xmm2,%xmm4
DB 102,73,15,126,224 ; movq %xmm4,%r8
@@ -31683,7 +31683,7 @@ _sk_clut_3D_sse2 LABEL PROC
DB 243,67,15,16,4,131 ; movss (%r11,%r8,4),%xmm0
DB 15,20,240 ; unpcklps %xmm0,%xmm6
DB 15,20,245 ; unpcklps %xmm5,%xmm6
- DB 102,15,254,29,44,183,0,0 ; paddd 0xb72c(%rip),%xmm3 # 2cb70 <_sk_overlay_sse2_8bit+0xefb>
+ DB 102,15,254,29,108,182,0,0 ; paddd 0xb66c(%rip),%xmm3 # 2cab0 <_sk_overlay_sse2_8bit+0xf00>
DB 102,15,112,195,78 ; pshufd $0x4e,%xmm3,%xmm0
DB 102,73,15,126,192 ; movq %xmm0,%r8
DB 102,73,15,126,217 ; movq %xmm3,%r9
@@ -31734,7 +31734,7 @@ _sk_clut_3D_sse2 LABEL PROC
DB 68,15,20,201 ; unpcklps %xmm1,%xmm9
DB 68,15,20,202 ; unpcklps %xmm2,%xmm9
DB 102,15,111,200 ; movdqa %xmm0,%xmm1
- DB 102,15,254,13,38,182,0,0 ; paddd 0xb626(%rip),%xmm1 # 2cb50 <_sk_overlay_sse2_8bit+0xedb>
+ DB 102,15,254,13,102,181,0,0 ; paddd 0xb566(%rip),%xmm1 # 2ca90 <_sk_overlay_sse2_8bit+0xee0>
DB 102,15,112,209,78 ; pshufd $0x4e,%xmm1,%xmm2
DB 102,73,15,126,208 ; movq %xmm2,%r8
DB 102,73,15,126,201 ; movq %xmm1,%r9
@@ -31751,7 +31751,7 @@ _sk_clut_3D_sse2 LABEL PROC
DB 243,67,15,16,20,131 ; movss (%r11,%r8,4),%xmm2
DB 68,15,20,242 ; unpcklps %xmm2,%xmm14
DB 68,15,20,241 ; unpcklps %xmm1,%xmm14
- DB 102,15,254,5,248,181,0,0 ; paddd 0xb5f8(%rip),%xmm0 # 2cb70 <_sk_overlay_sse2_8bit+0xefb>
+ DB 102,15,254,5,56,181,0,0 ; paddd 0xb538(%rip),%xmm0 # 2cab0 <_sk_overlay_sse2_8bit+0xf00>
DB 102,15,112,200,78 ; pshufd $0x4e,%xmm0,%xmm1
DB 102,73,15,126,200 ; movq %xmm1,%r8
DB 102,73,15,126,193 ; movq %xmm0,%r9
@@ -31789,7 +31789,7 @@ _sk_clut_3D_sse2 LABEL PROC
DB 243,67,15,16,60,131 ; movss (%r11,%r8,4),%xmm7
DB 15,20,199 ; unpcklps %xmm7,%xmm0
DB 15,20,193 ; unpcklps %xmm1,%xmm0
- DB 102,15,111,37,39,181,0,0 ; movdqa 0xb527(%rip),%xmm4 # 2cb50 <_sk_overlay_sse2_8bit+0xedb>
+ DB 102,15,111,37,103,180,0,0 ; movdqa 0xb467(%rip),%xmm4 # 2ca90 <_sk_overlay_sse2_8bit+0xee0>
DB 102,15,254,226 ; paddd %xmm2,%xmm4
DB 102,15,112,204,78 ; pshufd $0x4e,%xmm4,%xmm1
DB 102,73,15,126,200 ; movq %xmm1,%r8
@@ -31807,7 +31807,7 @@ _sk_clut_3D_sse2 LABEL PROC
DB 243,67,15,16,36,131 ; movss (%r11,%r8,4),%xmm4
DB 15,20,204 ; unpcklps %xmm4,%xmm1
DB 15,20,207 ; unpcklps %xmm7,%xmm1
- DB 102,15,254,21,247,180,0,0 ; paddd 0xb4f7(%rip),%xmm2 # 2cb70 <_sk_overlay_sse2_8bit+0xefb>
+ DB 102,15,254,21,55,180,0,0 ; paddd 0xb437(%rip),%xmm2 # 2cab0 <_sk_overlay_sse2_8bit+0xf00>
DB 102,15,112,226,78 ; pshufd $0x4e,%xmm2,%xmm4
DB 102,73,15,126,224 ; movq %xmm4,%r8
DB 102,73,15,126,209 ; movq %xmm2,%r9
@@ -31956,7 +31956,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 102,15,254,209 ; paddd %xmm1,%xmm2
DB 102,15,111,220 ; movdqa %xmm4,%xmm3
DB 102,15,254,218 ; paddd %xmm2,%xmm3
- DB 102,68,15,111,21,195,184,0,0 ; movdqa 0xb8c3(%rip),%xmm10 # 2d1e0 <_sk_overlay_sse2_8bit+0x156b>
+ DB 102,68,15,111,21,3,184,0,0 ; movdqa 0xb803(%rip),%xmm10 # 2d120 <_sk_overlay_sse2_8bit+0x1570>
DB 102,15,112,235,245 ; pshufd $0xf5,%xmm3,%xmm5
DB 102,65,15,244,218 ; pmuludq %xmm10,%xmm3
DB 102,15,112,227,232 ; pshufd $0xe8,%xmm3,%xmm4
@@ -31979,7 +31979,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 15,20,222 ; unpcklps %xmm6,%xmm3
DB 15,20,221 ; unpcklps %xmm5,%xmm3
DB 102,15,111,236 ; movdqa %xmm4,%xmm5
- DB 102,15,254,45,196,177,0,0 ; paddd 0xb1c4(%rip),%xmm5 # 2cb50 <_sk_overlay_sse2_8bit+0xedb>
+ DB 102,15,254,45,4,177,0,0 ; paddd 0xb104(%rip),%xmm5 # 2ca90 <_sk_overlay_sse2_8bit+0xee0>
DB 102,15,112,245,78 ; pshufd $0x4e,%xmm5,%xmm6
DB 102,73,15,126,240 ; movq %xmm6,%r8
DB 102,73,15,126,233 ; movq %xmm5,%r9
@@ -31996,7 +31996,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 243,67,15,16,60,131 ; movss (%r11,%r8,4),%xmm7
DB 15,20,247 ; unpcklps %xmm7,%xmm6
DB 15,20,245 ; unpcklps %xmm5,%xmm6
- DB 102,15,254,37,152,177,0,0 ; paddd 0xb198(%rip),%xmm4 # 2cb70 <_sk_overlay_sse2_8bit+0xefb>
+ DB 102,15,254,37,216,176,0,0 ; paddd 0xb0d8(%rip),%xmm4 # 2cab0 <_sk_overlay_sse2_8bit+0xf00>
DB 102,15,112,236,78 ; pshufd $0x4e,%xmm4,%xmm5
DB 102,73,15,126,232 ; movq %xmm5,%r8
DB 102,73,15,126,225 ; movq %xmm4,%r9
@@ -32013,7 +32013,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 243,67,15,16,60,131 ; movss (%r11,%r8,4),%xmm7
DB 15,20,239 ; unpcklps %xmm7,%xmm5
DB 15,20,236 ; unpcklps %xmm4,%xmm5
- DB 15,40,61,173,183,0,0 ; movaps 0xb7ad(%rip),%xmm7 # 2d1d0 <_sk_overlay_sse2_8bit+0x155b>
+ DB 15,40,61,237,182,0,0 ; movaps 0xb6ed(%rip),%xmm7 # 2d110 <_sk_overlay_sse2_8bit+0x1560>
DB 68,15,88,199 ; addps %xmm7,%xmm8
DB 68,15,41,68,36,48 ; movaps %xmm8,0x30(%rsp)
DB 68,15,88,207 ; addps %xmm7,%xmm9
@@ -32051,7 +32051,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 68,15,20,234 ; unpcklps %xmm2,%xmm13
DB 68,15,20,239 ; unpcklps %xmm7,%xmm13
DB 102,15,111,208 ; movdqa %xmm0,%xmm2
- DB 102,15,254,21,108,176,0,0 ; paddd 0xb06c(%rip),%xmm2 # 2cb50 <_sk_overlay_sse2_8bit+0xedb>
+ DB 102,15,254,21,172,175,0,0 ; paddd 0xafac(%rip),%xmm2 # 2ca90 <_sk_overlay_sse2_8bit+0xee0>
DB 102,15,112,250,78 ; pshufd $0x4e,%xmm2,%xmm7
DB 102,73,15,126,248 ; movq %xmm7,%r8
DB 102,73,15,126,209 ; movq %xmm2,%r9
@@ -32068,7 +32068,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 243,71,15,16,12,131 ; movss (%r11,%r8,4),%xmm9
DB 65,15,20,209 ; unpcklps %xmm9,%xmm2
DB 15,20,215 ; unpcklps %xmm7,%xmm2
- DB 102,15,254,5,63,176,0,0 ; paddd 0xb03f(%rip),%xmm0 # 2cb70 <_sk_overlay_sse2_8bit+0xefb>
+ DB 102,15,254,5,127,175,0,0 ; paddd 0xaf7f(%rip),%xmm0 # 2cab0 <_sk_overlay_sse2_8bit+0xf00>
DB 102,15,112,248,78 ; pshufd $0x4e,%xmm0,%xmm7
DB 102,73,15,126,248 ; movq %xmm7,%r8
DB 102,73,15,126,193 ; movq %xmm0,%r9
@@ -32109,7 +32109,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 102,15,111,217 ; movdqa %xmm1,%xmm3
DB 102,15,254,92,36,32 ; paddd 0x20(%rsp),%xmm3
DB 102,15,112,227,245 ; pshufd $0xf5,%xmm3,%xmm4
- DB 102,68,15,111,53,251,181,0,0 ; movdqa 0xb5fb(%rip),%xmm14 # 2d1e0 <_sk_overlay_sse2_8bit+0x156b>
+ DB 102,68,15,111,53,59,181,0,0 ; movdqa 0xb53b(%rip),%xmm14 # 2d120 <_sk_overlay_sse2_8bit+0x1570>
DB 102,65,15,244,222 ; pmuludq %xmm14,%xmm3
DB 102,15,112,219,232 ; pshufd $0xe8,%xmm3,%xmm3
DB 102,65,15,244,230 ; pmuludq %xmm14,%xmm4
@@ -32130,7 +32130,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 68,15,20,228 ; unpcklps %xmm4,%xmm12
DB 68,15,20,229 ; unpcklps %xmm5,%xmm12
DB 102,15,111,227 ; movdqa %xmm3,%xmm4
- DB 102,15,111,61,3,175,0,0 ; movdqa 0xaf03(%rip),%xmm7 # 2cb50 <_sk_overlay_sse2_8bit+0xedb>
+ DB 102,15,111,61,67,174,0,0 ; movdqa 0xae43(%rip),%xmm7 # 2ca90 <_sk_overlay_sse2_8bit+0xee0>
DB 102,15,254,231 ; paddd %xmm7,%xmm4
DB 102,15,112,236,78 ; pshufd $0x4e,%xmm4,%xmm5
DB 102,73,15,126,232 ; movq %xmm5,%r8
@@ -32148,7 +32148,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 243,67,15,16,44,131 ; movss (%r11,%r8,4),%xmm5
DB 15,20,245 ; unpcklps %xmm5,%xmm6
DB 15,20,244 ; unpcklps %xmm4,%xmm6
- DB 102,68,15,111,5,210,174,0,0 ; movdqa 0xaed2(%rip),%xmm8 # 2cb70 <_sk_overlay_sse2_8bit+0xefb>
+ DB 102,68,15,111,5,18,174,0,0 ; movdqa 0xae12(%rip),%xmm8 # 2cab0 <_sk_overlay_sse2_8bit+0xf00>
DB 102,65,15,254,216 ; paddd %xmm8,%xmm3
DB 102,15,112,227,78 ; pshufd $0x4e,%xmm3,%xmm4
DB 102,73,15,126,224 ; movq %xmm4,%r8
@@ -32262,7 +32262,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 102,68,15,111,108,36,32 ; movdqa 0x20(%rsp),%xmm13
DB 102,65,15,254,205 ; paddd %xmm13,%xmm1
DB 102,15,112,209,245 ; pshufd $0xf5,%xmm1,%xmm2
- DB 102,15,111,29,48,179,0,0 ; movdqa 0xb330(%rip),%xmm3 # 2d1e0 <_sk_overlay_sse2_8bit+0x156b>
+ DB 102,15,111,29,112,178,0,0 ; movdqa 0xb270(%rip),%xmm3 # 2d120 <_sk_overlay_sse2_8bit+0x1570>
DB 102,15,244,203 ; pmuludq %xmm3,%xmm1
DB 102,15,112,201,232 ; pshufd $0xe8,%xmm1,%xmm1
DB 102,15,244,211 ; pmuludq %xmm3,%xmm2
@@ -32284,7 +32284,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 68,15,20,202 ; unpcklps %xmm2,%xmm9
DB 68,15,20,205 ; unpcklps %xmm5,%xmm9
DB 102,15,111,209 ; movdqa %xmm1,%xmm2
- DB 102,15,111,29,54,172,0,0 ; movdqa 0xac36(%rip),%xmm3 # 2cb50 <_sk_overlay_sse2_8bit+0xedb>
+ DB 102,15,111,29,118,171,0,0 ; movdqa 0xab76(%rip),%xmm3 # 2ca90 <_sk_overlay_sse2_8bit+0xee0>
DB 102,15,254,211 ; paddd %xmm3,%xmm2
DB 102,15,112,234,78 ; pshufd $0x4e,%xmm2,%xmm5
DB 102,73,15,126,232 ; movq %xmm5,%r8
@@ -32392,7 +32392,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 102,65,15,111,211 ; movdqa %xmm11,%xmm2
DB 102,65,15,254,213 ; paddd %xmm13,%xmm2
DB 102,15,112,218,245 ; pshufd $0xf5,%xmm2,%xmm3
- DB 102,15,111,5,235,176,0,0 ; movdqa 0xb0eb(%rip),%xmm0 # 2d1e0 <_sk_overlay_sse2_8bit+0x156b>
+ DB 102,15,111,5,43,176,0,0 ; movdqa 0xb02b(%rip),%xmm0 # 2d120 <_sk_overlay_sse2_8bit+0x1570>
DB 102,15,244,208 ; pmuludq %xmm0,%xmm2
DB 102,15,112,250,232 ; pshufd $0xe8,%xmm2,%xmm7
DB 102,15,244,216 ; pmuludq %xmm0,%xmm3
@@ -32413,7 +32413,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 68,15,20,202 ; unpcklps %xmm2,%xmm9
DB 68,15,20,203 ; unpcklps %xmm3,%xmm9
DB 102,15,111,215 ; movdqa %xmm7,%xmm2
- DB 102,15,111,5,245,169,0,0 ; movdqa 0xa9f5(%rip),%xmm0 # 2cb50 <_sk_overlay_sse2_8bit+0xedb>
+ DB 102,15,111,5,53,169,0,0 ; movdqa 0xa935(%rip),%xmm0 # 2ca90 <_sk_overlay_sse2_8bit+0xee0>
DB 102,15,254,208 ; paddd %xmm0,%xmm2
DB 102,15,112,218,78 ; pshufd $0x4e,%xmm2,%xmm3
DB 102,73,15,126,216 ; movq %xmm3,%r8
@@ -32431,7 +32431,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 243,67,15,16,28,131 ; movss (%r11,%r8,4),%xmm3
DB 15,20,243 ; unpcklps %xmm3,%xmm6
DB 15,20,242 ; unpcklps %xmm2,%xmm6
- DB 102,68,15,111,45,196,169,0,0 ; movdqa 0xa9c4(%rip),%xmm13 # 2cb70 <_sk_overlay_sse2_8bit+0xefb>
+ DB 102,68,15,111,45,4,169,0,0 ; movdqa 0xa904(%rip),%xmm13 # 2cab0 <_sk_overlay_sse2_8bit+0xf00>
DB 102,65,15,254,253 ; paddd %xmm13,%xmm7
DB 102,15,112,215,78 ; pshufd $0x4e,%xmm7,%xmm2
DB 102,73,15,126,208 ; movq %xmm2,%r8
@@ -32451,7 +32451,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 15,20,250 ; unpcklps %xmm2,%xmm7
DB 102,68,15,254,220 ; paddd %xmm4,%xmm11
DB 102,65,15,112,219,245 ; pshufd $0xf5,%xmm11,%xmm3
- DB 102,15,111,37,216,175,0,0 ; movdqa 0xafd8(%rip),%xmm4 # 2d1e0 <_sk_overlay_sse2_8bit+0x156b>
+ DB 102,15,111,37,24,175,0,0 ; movdqa 0xaf18(%rip),%xmm4 # 2d120 <_sk_overlay_sse2_8bit+0x1570>
DB 102,68,15,244,220 ; pmuludq %xmm4,%xmm11
DB 102,65,15,112,211,232 ; pshufd $0xe8,%xmm11,%xmm2
DB 102,15,244,220 ; pmuludq %xmm4,%xmm3
@@ -32552,7 +32552,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 102,65,15,111,202 ; movdqa %xmm10,%xmm1
DB 102,15,254,200 ; paddd %xmm0,%xmm1
DB 102,15,112,209,245 ; pshufd $0xf5,%xmm1,%xmm2
- DB 102,15,111,29,11,174,0,0 ; movdqa 0xae0b(%rip),%xmm3 # 2d1e0 <_sk_overlay_sse2_8bit+0x156b>
+ DB 102,15,111,29,75,173,0,0 ; movdqa 0xad4b(%rip),%xmm3 # 2d120 <_sk_overlay_sse2_8bit+0x1570>
DB 102,15,244,203 ; pmuludq %xmm3,%xmm1
DB 102,15,112,201,232 ; pshufd $0xe8,%xmm1,%xmm1
DB 102,15,244,211 ; pmuludq %xmm3,%xmm2
@@ -32574,7 +32574,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 15,20,212 ; unpcklps %xmm4,%xmm2
DB 15,20,211 ; unpcklps %xmm3,%xmm2
DB 102,15,111,217 ; movdqa %xmm1,%xmm3
- DB 102,15,111,61,18,167,0,0 ; movdqa 0xa712(%rip),%xmm7 # 2cb50 <_sk_overlay_sse2_8bit+0xedb>
+ DB 102,15,111,61,82,166,0,0 ; movdqa 0xa652(%rip),%xmm7 # 2ca90 <_sk_overlay_sse2_8bit+0xee0>
DB 102,15,254,223 ; paddd %xmm7,%xmm3
DB 102,15,112,227,78 ; pshufd $0x4e,%xmm3,%xmm4
DB 102,73,15,126,224 ; movq %xmm4,%r8
@@ -32592,7 +32592,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 243,67,15,16,44,131 ; movss (%r11,%r8,4),%xmm5
DB 15,20,221 ; unpcklps %xmm5,%xmm3
DB 15,20,220 ; unpcklps %xmm4,%xmm3
- DB 102,68,15,111,13,225,166,0,0 ; movdqa 0xa6e1(%rip),%xmm9 # 2cb70 <_sk_overlay_sse2_8bit+0xefb>
+ DB 102,68,15,111,13,33,166,0,0 ; movdqa 0xa621(%rip),%xmm9 # 2cab0 <_sk_overlay_sse2_8bit+0xf00>
DB 102,65,15,254,201 ; paddd %xmm9,%xmm1
DB 102,15,112,225,78 ; pshufd $0x4e,%xmm1,%xmm4
DB 102,73,15,126,224 ; movq %xmm4,%r8
@@ -32704,7 +32704,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 68,15,20,246 ; unpcklps %xmm6,%xmm14
DB 68,15,20,243 ; unpcklps %xmm3,%xmm14
DB 102,15,111,220 ; movdqa %xmm4,%xmm3
- DB 102,68,15,111,21,200,164,0,0 ; movdqa 0xa4c8(%rip),%xmm10 # 2cb50 <_sk_overlay_sse2_8bit+0xedb>
+ DB 102,68,15,111,21,8,164,0,0 ; movdqa 0xa408(%rip),%xmm10 # 2ca90 <_sk_overlay_sse2_8bit+0xee0>
DB 102,65,15,254,218 ; paddd %xmm10,%xmm3
DB 102,15,112,243,78 ; pshufd $0x4e,%xmm3,%xmm6
DB 102,73,15,126,240 ; movq %xmm6,%r8
@@ -32825,7 +32825,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 102,15,111,116,36,32 ; movdqa 0x20(%rsp),%xmm6
DB 102,15,254,198 ; paddd %xmm6,%xmm0
DB 102,15,112,200,245 ; pshufd $0xf5,%xmm0,%xmm1
- DB 102,15,111,29,56,169,0,0 ; movdqa 0xa938(%rip),%xmm3 # 2d1e0 <_sk_overlay_sse2_8bit+0x156b>
+ DB 102,15,111,29,120,168,0,0 ; movdqa 0xa878(%rip),%xmm3 # 2d120 <_sk_overlay_sse2_8bit+0x1570>
DB 102,15,244,195 ; pmuludq %xmm3,%xmm0
DB 102,15,112,208,232 ; pshufd $0xe8,%xmm0,%xmm2
DB 102,15,244,203 ; pmuludq %xmm3,%xmm1
@@ -32847,7 +32847,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 15,20,195 ; unpcklps %xmm3,%xmm0
DB 15,20,193 ; unpcklps %xmm1,%xmm0
DB 102,15,111,202 ; movdqa %xmm2,%xmm1
- DB 102,68,15,111,5,62,162,0,0 ; movdqa 0xa23e(%rip),%xmm8 # 2cb50 <_sk_overlay_sse2_8bit+0xedb>
+ DB 102,68,15,111,5,126,161,0,0 ; movdqa 0xa17e(%rip),%xmm8 # 2ca90 <_sk_overlay_sse2_8bit+0xee0>
DB 102,65,15,254,200 ; paddd %xmm8,%xmm1
DB 102,15,112,217,78 ; pshufd $0x4e,%xmm1,%xmm3
DB 102,73,15,126,216 ; movq %xmm3,%r8
@@ -32953,7 +32953,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 102,15,254,60,36 ; paddd (%rsp),%xmm7
DB 102,15,254,247 ; paddd %xmm7,%xmm6
DB 102,15,112,206,245 ; pshufd $0xf5,%xmm6,%xmm1
- DB 102,15,111,21,249,166,0,0 ; movdqa 0xa6f9(%rip),%xmm2 # 2d1e0 <_sk_overlay_sse2_8bit+0x156b>
+ DB 102,15,111,21,57,166,0,0 ; movdqa 0xa639(%rip),%xmm2 # 2d120 <_sk_overlay_sse2_8bit+0x1570>
DB 102,15,244,242 ; pmuludq %xmm2,%xmm6
DB 102,15,112,198,232 ; pshufd $0xe8,%xmm6,%xmm0
DB 102,15,244,202 ; pmuludq %xmm2,%xmm1
@@ -32975,7 +32975,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 68,15,20,201 ; unpcklps %xmm1,%xmm9
DB 68,15,20,202 ; unpcklps %xmm2,%xmm9
DB 102,15,111,200 ; movdqa %xmm0,%xmm1
- DB 102,15,254,13,255,159,0,0 ; paddd 0x9fff(%rip),%xmm1 # 2cb50 <_sk_overlay_sse2_8bit+0xedb>
+ DB 102,15,254,13,63,159,0,0 ; paddd 0x9f3f(%rip),%xmm1 # 2ca90 <_sk_overlay_sse2_8bit+0xee0>
DB 102,15,112,209,78 ; pshufd $0x4e,%xmm1,%xmm2
DB 102,73,15,126,208 ; movq %xmm2,%r8
DB 102,73,15,126,201 ; movq %xmm1,%r9
@@ -33031,7 +33031,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 243,67,15,16,60,131 ; movss (%r11,%r8,4),%xmm7
DB 15,20,199 ; unpcklps %xmm7,%xmm0
DB 15,20,193 ; unpcklps %xmm1,%xmm0
- DB 102,15,111,53,251,158,0,0 ; movdqa 0x9efb(%rip),%xmm6 # 2cb50 <_sk_overlay_sse2_8bit+0xedb>
+ DB 102,15,111,53,59,158,0,0 ; movdqa 0x9e3b(%rip),%xmm6 # 2ca90 <_sk_overlay_sse2_8bit+0xee0>
DB 102,15,254,242 ; paddd %xmm2,%xmm6
DB 102,15,112,206,78 ; pshufd $0x4e,%xmm6,%xmm1
DB 102,73,15,126,200 ; movq %xmm1,%r8
@@ -33049,7 +33049,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 243,71,15,16,60,131 ; movss (%r11,%r8,4),%xmm15
DB 65,15,20,207 ; unpcklps %xmm15,%xmm1
DB 15,20,207 ; unpcklps %xmm7,%xmm1
- DB 102,15,254,21,202,158,0,0 ; paddd 0x9eca(%rip),%xmm2 # 2cb70 <_sk_overlay_sse2_8bit+0xefb>
+ DB 102,15,254,21,10,158,0,0 ; paddd 0x9e0a(%rip),%xmm2 # 2cab0 <_sk_overlay_sse2_8bit+0xf00>
DB 102,15,112,250,78 ; pshufd $0x4e,%xmm2,%xmm7
DB 102,73,15,126,248 ; movq %xmm7,%r8
DB 102,73,15,126,209 ; movq %xmm2,%r9
@@ -33111,7 +33111,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 15,89,212 ; mulps %xmm4,%xmm2
DB 65,15,88,213 ; addps %xmm13,%xmm2
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 15,40,29,164,157,0,0 ; movaps 0x9da4(%rip),%xmm3 # 2cb40 <_sk_overlay_sse2_8bit+0xecb>
+ DB 15,40,29,228,156,0,0 ; movaps 0x9ce4(%rip),%xmm3 # 2ca80 <_sk_overlay_sse2_8bit+0xed0>
DB 15,40,164,36,240,0,0,0 ; movaps 0xf0(%rsp),%xmm4
DB 15,40,172,36,0,1,0,0 ; movaps 0x100(%rsp),%xmm5
DB 15,40,180,36,16,1,0,0 ; movaps 0x110(%rsp),%xmm6
@@ -33133,7 +33133,7 @@ _sk_start_pipeline_hsw_8bit LABEL PROC
DB 86 ; push %rsi
DB 87 ; push %rdi
DB 83 ; push %rbx
- DB 72,129,236,216,0,0,0 ; sub $0xd8,%rsp
+ DB 72,129,236,200,0,0,0 ; sub $0xc8,%rsp
DB 197,120,41,125,176 ; vmovaps %xmm15,-0x50(%rbp)
DB 197,120,41,117,160 ; vmovaps %xmm14,-0x60(%rbp)
DB 197,120,41,109,144 ; vmovaps %xmm13,-0x70(%rbp)
@@ -33144,45 +33144,42 @@ _sk_start_pipeline_hsw_8bit LABEL PROC
DB 197,120,41,133,64,255,255,255 ; vmovaps %xmm8,-0xc0(%rbp)
DB 197,248,41,189,48,255,255,255 ; vmovaps %xmm7,-0xd0(%rbp)
DB 197,248,41,181,32,255,255,255 ; vmovaps %xmm6,-0xe0(%rbp)
- DB 76,137,195 ; mov %r8,%rbx
- DB 73,137,215 ; mov %rdx,%r15
+ DB 77,137,199 ; mov %r8,%r15
+ DB 72,137,211 ; mov %rdx,%rbx
DB 72,137,141,24,255,255,255 ; mov %rcx,-0xe8(%rbp)
DB 72,139,117,48 ; mov 0x30(%rbp),%rsi
DB 72,173 ; lods %ds:(%rsi),%rax
DB 73,137,197 ; mov %rax,%r13
DB 73,137,246 ; mov %rsi,%r14
- DB 76,137,141,240,254,255,255 ; mov %r9,-0x110(%rbp)
- DB 77,57,207 ; cmp %r9,%r15
- DB 15,131,138,0,0,0 ; jae 22ed5 <_sk_start_pipeline_hsw_8bit+0x10d>
+ DB 76,137,141,8,255,255,255 ; mov %r9,-0xf8(%rbp)
+ DB 76,57,203 ; cmp %r9,%rbx
+ DB 115,101 ; jae 22eac <_sk_start_pipeline_hsw_8bit+0xe4>
DB 72,139,133,24,255,255,255 ; mov -0xe8(%rbp),%rax
DB 72,141,64,16 ; lea 0x10(%rax),%rax
- DB 72,137,133,248,254,255,255 ; mov %rax,-0x108(%rbp)
- DB 76,141,165,0,255,255,255 ; lea -0x100(%rbp),%r12
- DB 72,139,133,24,255,255,255 ; mov -0xe8(%rbp),%rax
- DB 72,137,133,0,255,255,255 ; mov %rax,-0x100(%rbp)
- DB 76,137,189,8,255,255,255 ; mov %r15,-0xf8(%rbp)
- DB 72,199,133,16,255,255,255,0,0,0,0 ; movq $0x0,-0xf0(%rbp)
- DB 72,57,157,248,254,255,255 ; cmp %rbx,-0x108(%rbp)
- DB 119,36 ; ja 22eb1 <_sk_start_pipeline_hsw_8bit+0xe9>
- DB 76,137,231 ; mov %r12,%rdi
+ DB 72,137,133,16,255,255,255 ; mov %rax,-0xf0(%rbp)
+ DB 72,139,149,24,255,255,255 ; mov -0xe8(%rbp),%rdx
+ DB 76,57,189,16,255,255,255 ; cmp %r15,-0xf0(%rbp)
+ DB 119,38 ; ja 22e8f <_sk_start_pipeline_hsw_8bit+0xc7>
+ DB 76,139,165,24,255,255,255 ; mov -0xe8(%rbp),%r12
+ DB 49,255 ; xor %edi,%edi
DB 76,137,246 ; mov %r14,%rsi
- DB 65,255,213 ; callq *%r13
- DB 72,139,141,0,255,255,255 ; mov -0x100(%rbp),%rcx
- DB 72,141,65,16 ; lea 0x10(%rcx),%rax
- DB 72,137,133,0,255,255,255 ; mov %rax,-0x100(%rbp)
- DB 72,131,193,32 ; add $0x20,%rcx
- DB 72,57,217 ; cmp %rbx,%rcx
- DB 118,220 ; jbe 22e8d <_sk_start_pipeline_hsw_8bit+0xc5>
+ DB 76,137,226 ; mov %r12,%rdx
DB 72,137,217 ; mov %rbx,%rcx
- DB 72,41,193 ; sub %rax,%rcx
- DB 116,16 ; je 22ec9 <_sk_start_pipeline_hsw_8bit+0x101>
- DB 72,137,141,16,255,255,255 ; mov %rcx,-0xf0(%rbp)
- DB 76,137,231 ; mov %r12,%rdi
+ DB 65,255,213 ; callq *%r13
+ DB 73,141,84,36,16 ; lea 0x10(%r12),%rdx
+ DB 73,131,196,32 ; add $0x20,%r12
+ DB 77,57,252 ; cmp %r15,%r12
+ DB 73,137,212 ; mov %rdx,%r12
+ DB 118,225 ; jbe 22e70 <_sk_start_pipeline_hsw_8bit+0xa8>
+ DB 76,137,255 ; mov %r15,%rdi
+ DB 72,41,215 ; sub %rdx,%rdi
+ DB 116,9 ; je 22ea0 <_sk_start_pipeline_hsw_8bit+0xd8>
DB 76,137,246 ; mov %r14,%rsi
+ DB 72,137,217 ; mov %rbx,%rcx
DB 65,255,213 ; callq *%r13
- DB 73,255,199 ; inc %r15
- DB 76,59,189,240,254,255,255 ; cmp -0x110(%rbp),%r15
- DB 117,143 ; jne 22e64 <_sk_start_pipeline_hsw_8bit+0x9c>
+ DB 72,255,195 ; inc %rbx
+ DB 72,59,157,8,255,255,255 ; cmp -0xf8(%rbp),%rbx
+ DB 117,173 ; jne 22e59 <_sk_start_pipeline_hsw_8bit+0x91>
DB 197,248,40,181,32,255,255,255 ; vmovaps -0xe0(%rbp),%xmm6
DB 197,248,40,189,48,255,255,255 ; vmovaps -0xd0(%rbp),%xmm7
DB 197,120,40,133,64,255,255,255 ; vmovaps -0xc0(%rbp),%xmm8
@@ -33193,7 +33190,7 @@ _sk_start_pipeline_hsw_8bit LABEL PROC
DB 197,120,40,109,144 ; vmovaps -0x70(%rbp),%xmm13
DB 197,120,40,117,160 ; vmovaps -0x60(%rbp),%xmm14
DB 197,120,40,125,176 ; vmovaps -0x50(%rbp),%xmm15
- DB 72,129,196,216,0,0,0 ; add $0xd8,%rsp
+ DB 72,129,196,200,0,0,0 ; add $0xc8,%rsp
DB 91 ; pop %rbx
DB 95 ; pop %rdi
DB 94 ; pop %rsi
@@ -33220,20 +33217,20 @@ _sk_uniform_color_hsw_8bit LABEL PROC
PUBLIC _sk_set_rgb_hsw_8bit
_sk_set_rgb_hsw_8bit LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 197,250,16,37,197,145,0,0 ; vmovss 0x91c5(%rip),%xmm4 # 2c110 <_sk_overlay_sse2_8bit+0x49b>
+ DB 197,250,16,37,42,145,0,0 ; vmovss 0x912a(%rip),%xmm4 # 2c04c <_sk_overlay_sse2_8bit+0x49c>
DB 197,218,89,40 ; vmulss (%rax),%xmm4,%xmm5
- DB 196,225,250,44,205 ; vcvttss2si %xmm5,%rcx
+ DB 196,97,250,44,197 ; vcvttss2si %xmm5,%r8
DB 197,218,89,104,4 ; vmulss 0x4(%rax),%xmm4,%xmm5
- DB 196,225,250,44,213 ; vcvttss2si %xmm5,%rdx
- DB 193,226,8 ; shl $0x8,%edx
- DB 9,202 ; or %ecx,%edx
+ DB 196,97,250,44,205 ; vcvttss2si %xmm5,%r9
+ DB 65,193,225,8 ; shl $0x8,%r9d
+ DB 69,9,193 ; or %r8d,%r9d
DB 197,218,89,96,8 ; vmulss 0x8(%rax),%xmm4,%xmm4
DB 196,225,250,44,196 ; vcvttss2si %xmm4,%rax
DB 193,224,16 ; shl $0x10,%eax
- DB 9,208 ; or %edx,%eax
+ DB 68,9,200 ; or %r9d,%eax
DB 197,249,110,224 ; vmovd %eax,%xmm4
DB 196,226,125,88,228 ; vpbroadcastd %xmm4,%ymm4
- DB 197,253,111,45,93,151,0,0 ; vmovdqa 0x975d(%rip),%ymm5 # 2c6e0 <_sk_overlay_sse2_8bit+0xa6b>
+ DB 197,253,111,45,195,150,0,0 ; vmovdqa 0x96c3(%rip),%ymm5 # 2c620 <_sk_overlay_sse2_8bit+0xa70>
DB 197,245,219,205 ; vpand %ymm5,%ymm1,%ymm1
DB 197,253,219,197 ; vpand %ymm5,%ymm0,%ymm0
DB 197,221,235,192 ; vpor %ymm0,%ymm4,%ymm0
@@ -33243,10 +33240,10 @@ _sk_set_rgb_hsw_8bit LABEL PROC
PUBLIC _sk_premul_hsw_8bit
_sk_premul_hsw_8bit LABEL PROC
- DB 197,253,111,37,97,151,0,0 ; vmovdqa 0x9761(%rip),%ymm4 # 2c700 <_sk_overlay_sse2_8bit+0xa8b>
+ DB 197,253,111,37,199,150,0,0 ; vmovdqa 0x96c7(%rip),%ymm4 # 2c640 <_sk_overlay_sse2_8bit+0xa90>
DB 196,226,125,0,236 ; vpshufb %ymm4,%ymm0,%ymm5
DB 196,226,117,0,228 ; vpshufb %ymm4,%ymm1,%ymm4
- DB 197,253,111,53,111,151,0,0 ; vmovdqa 0x976f(%rip),%ymm6 # 2c720 <_sk_overlay_sse2_8bit+0xaab>
+ DB 197,253,111,53,213,150,0,0 ; vmovdqa 0x96d5(%rip),%ymm6 # 2c660 <_sk_overlay_sse2_8bit+0xab0>
DB 197,221,235,230 ; vpor %ymm6,%ymm4,%ymm4
DB 197,213,235,238 ; vpor %ymm6,%ymm5,%ymm5
DB 196,226,125,48,240 ; vpmovzxbw %xmm0,%ymm6
@@ -33284,7 +33281,7 @@ _sk_premul_hsw_8bit LABEL PROC
PUBLIC _sk_swap_rb_hsw_8bit
_sk_swap_rb_hsw_8bit LABEL PROC
- DB 197,253,111,37,231,150,0,0 ; vmovdqa 0x96e7(%rip),%ymm4 # 2c740 <_sk_overlay_sse2_8bit+0xacb>
+ DB 197,253,111,37,77,150,0,0 ; vmovdqa 0x964d(%rip),%ymm4 # 2c680 <_sk_overlay_sse2_8bit+0xad0>
DB 196,226,125,0,196 ; vpshufb %ymm4,%ymm0,%ymm0
DB 196,226,117,0,204 ; vpshufb %ymm4,%ymm1,%ymm1
DB 72,173 ; lods %ds:(%rsi),%rax
@@ -33300,77 +33297,77 @@ _sk_invert_hsw_8bit LABEL PROC
PUBLIC _sk_load_8888_hsw_8bit
_sk_load_8888_hsw_8bit LABEL PROC
- DB 76,99,7 ; movslq (%rdi),%r8
- DB 76,139,79,16 ; mov 0x10(%rdi),%r9
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 72,99,72,8 ; movslq 0x8(%rax),%rcx
- DB 72,99,87,8 ; movslq 0x8(%rdi),%rdx
- DB 72,15,175,209 ; imul %rcx,%rdx
- DB 72,193,226,2 ; shl $0x2,%rdx
- DB 72,3,16 ; add (%rax),%rdx
- DB 77,133,201 ; test %r9,%r9
- DB 117,17 ; jne 230a9 <_sk_load_8888_hsw_8bit+0x32>
- DB 196,161,126,111,76,130,32 ; vmovdqu 0x20(%rdx,%r8,4),%ymm1
- DB 196,161,126,111,4,130 ; vmovdqu (%rdx,%r8,4),%ymm0
+ DB 76,99,72,8 ; movslq 0x8(%rax),%r9
+ DB 76,99,193 ; movslq %ecx,%r8
+ DB 77,15,175,193 ; imul %r9,%r8
+ DB 73,193,224,2 ; shl $0x2,%r8
+ DB 76,3,0 ; add (%rax),%r8
+ DB 76,99,218 ; movslq %edx,%r11
+ DB 72,133,255 ; test %rdi,%rdi
+ DB 117,17 ; jne 2307e <_sk_load_8888_hsw_8bit+0x2d>
+ DB 196,129,126,111,76,152,32 ; vmovdqu 0x20(%r8,%r11,4),%ymm1
+ DB 196,129,126,111,4,152 ; vmovdqu (%r8,%r11,4),%ymm0
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
+ DB 65,137,249 ; mov %edi,%r9d
DB 65,128,225,15 ; and $0xf,%r9b
DB 197,245,239,201 ; vpxor %ymm1,%ymm1,%ymm1
DB 197,253,239,192 ; vpxor %ymm0,%ymm0,%ymm0
DB 65,254,201 ; dec %r9b
DB 65,128,249,14 ; cmp $0xe,%r9b
- DB 119,231 ; ja 230a5 <_sk_load_8888_hsw_8bit+0x2e>
- DB 65,15,182,193 ; movzbl %r9b,%eax
- DB 72,141,13,23,1,0,0 ; lea 0x117(%rip),%rcx # 231e0 <_sk_load_8888_hsw_8bit+0x169>
- DB 72,99,4,129 ; movslq (%rcx,%rax,4),%rax
- DB 72,1,200 ; add %rcx,%rax
+ DB 119,228 ; ja 2307a <_sk_load_8888_hsw_8bit+0x29>
+ DB 69,15,182,201 ; movzbl %r9b,%r9d
+ DB 76,141,21,23,1,0,0 ; lea 0x117(%rip),%r10 # 231b8 <_sk_load_8888_hsw_8bit+0x167>
+ DB 75,99,4,138 ; movslq (%r10,%r9,4),%rax
+ DB 76,1,208 ; add %r10,%rax
DB 255,224 ; jmpq *%rax
- DB 196,161,121,110,4,130 ; vmovd (%rdx,%r8,4),%xmm0
- DB 235,203 ; jmp 230a5 <_sk_load_8888_hsw_8bit+0x2e>
- DB 196,161,121,110,68,130,8 ; vmovd 0x8(%rdx,%r8,4),%xmm0
+ DB 196,129,121,110,4,152 ; vmovd (%r8,%r11,4),%xmm0
+ DB 235,200 ; jmp 2307a <_sk_load_8888_hsw_8bit+0x29>
+ DB 196,129,121,110,68,152,8 ; vmovd 0x8(%r8,%r11,4),%xmm0
DB 196,226,121,89,192 ; vpbroadcastq %xmm0,%xmm0
DB 197,245,239,201 ; vpxor %ymm1,%ymm1,%ymm1
DB 196,227,117,2,192,4 ; vpblendd $0x4,%ymm0,%ymm1,%ymm0
- DB 196,162,121,53,36,130 ; vpmovzxdq (%rdx,%r8,4),%xmm4
+ DB 196,130,121,53,36,152 ; vpmovzxdq (%r8,%r11,4),%xmm4
DB 197,249,112,228,232 ; vpshufd $0xe8,%xmm4,%xmm4
DB 196,227,125,2,196,3 ; vpblendd $0x3,%ymm4,%ymm0,%ymm0
- DB 235,162 ; jmp 230a5 <_sk_load_8888_hsw_8bit+0x2e>
- DB 196,161,121,110,68,130,24 ; vmovd 0x18(%rdx,%r8,4),%xmm0
+ DB 235,159 ; jmp 2307a <_sk_load_8888_hsw_8bit+0x29>
+ DB 196,129,121,110,68,152,24 ; vmovd 0x18(%r8,%r11,4),%xmm0
DB 196,226,125,89,192 ; vpbroadcastq %xmm0,%ymm0
DB 197,245,239,201 ; vpxor %ymm1,%ymm1,%ymm1
DB 196,227,117,2,192,64 ; vpblendd $0x40,%ymm0,%ymm1,%ymm0
DB 196,227,125,57,196,1 ; vextracti128 $0x1,%ymm0,%xmm4
- DB 196,163,89,34,100,130,20,1 ; vpinsrd $0x1,0x14(%rdx,%r8,4),%xmm4,%xmm4
+ DB 196,131,89,34,100,152,20,1 ; vpinsrd $0x1,0x14(%r8,%r11,4),%xmm4,%xmm4
DB 196,227,125,56,196,1 ; vinserti128 $0x1,%xmm4,%ymm0,%ymm0
DB 196,227,125,57,196,1 ; vextracti128 $0x1,%ymm0,%xmm4
- DB 196,163,89,34,100,130,16,0 ; vpinsrd $0x0,0x10(%rdx,%r8,4),%xmm4,%xmm4
+ DB 196,131,89,34,100,152,16,0 ; vpinsrd $0x0,0x10(%r8,%r11,4),%xmm4,%xmm4
DB 196,227,125,56,196,1 ; vinserti128 $0x1,%xmm4,%ymm0,%ymm0
- DB 196,161,122,111,36,130 ; vmovdqu (%rdx,%r8,4),%xmm4
+ DB 196,129,122,111,36,152 ; vmovdqu (%r8,%r11,4),%xmm4
DB 196,227,93,2,192,240 ; vpblendd $0xf0,%ymm0,%ymm4,%ymm0
- DB 233,83,255,255,255 ; jmpq 230a5 <_sk_load_8888_hsw_8bit+0x2e>
- DB 196,161,121,110,68,130,40 ; vmovd 0x28(%rdx,%r8,4),%xmm0
+ DB 233,80,255,255,255 ; jmpq 2307a <_sk_load_8888_hsw_8bit+0x29>
+ DB 196,129,121,110,68,152,40 ; vmovd 0x28(%r8,%r11,4),%xmm0
DB 196,226,121,89,192 ; vpbroadcastq %xmm0,%xmm0
DB 197,245,239,201 ; vpxor %ymm1,%ymm1,%ymm1
DB 196,227,117,2,200,4 ; vpblendd $0x4,%ymm0,%ymm1,%ymm1
- DB 196,163,113,34,68,130,36,1 ; vpinsrd $0x1,0x24(%rdx,%r8,4),%xmm1,%xmm0
+ DB 196,131,113,34,68,152,36,1 ; vpinsrd $0x1,0x24(%r8,%r11,4),%xmm1,%xmm0
DB 196,227,117,2,200,15 ; vpblendd $0xf,%ymm0,%ymm1,%ymm1
- DB 196,161,121,110,68,130,32 ; vmovd 0x20(%rdx,%r8,4),%xmm0
+ DB 196,129,121,110,68,152,32 ; vmovd 0x20(%r8,%r11,4),%xmm0
DB 196,227,117,2,200,1 ; vpblendd $0x1,%ymm0,%ymm1,%ymm1
- DB 233,23,255,255,255 ; jmpq 2309f <_sk_load_8888_hsw_8bit+0x28>
- DB 196,161,121,110,68,130,56 ; vmovd 0x38(%rdx,%r8,4),%xmm0
+ DB 233,20,255,255,255 ; jmpq 23074 <_sk_load_8888_hsw_8bit+0x23>
+ DB 196,129,121,110,68,152,56 ; vmovd 0x38(%r8,%r11,4),%xmm0
DB 196,226,125,89,192 ; vpbroadcastq %xmm0,%ymm0
DB 197,245,239,201 ; vpxor %ymm1,%ymm1,%ymm1
DB 196,227,117,2,200,64 ; vpblendd $0x40,%ymm0,%ymm1,%ymm1
DB 196,227,125,57,200,1 ; vextracti128 $0x1,%ymm1,%xmm0
- DB 196,163,121,34,68,130,52,1 ; vpinsrd $0x1,0x34(%rdx,%r8,4),%xmm0,%xmm0
+ DB 196,131,121,34,68,152,52,1 ; vpinsrd $0x1,0x34(%r8,%r11,4),%xmm0,%xmm0
DB 196,227,117,56,200,1 ; vinserti128 $0x1,%xmm0,%ymm1,%ymm1
DB 196,227,125,57,200,1 ; vextracti128 $0x1,%ymm1,%xmm0
- DB 196,163,121,34,68,130,48,0 ; vpinsrd $0x0,0x30(%rdx,%r8,4),%xmm0,%xmm0
+ DB 196,131,121,34,68,152,48,0 ; vpinsrd $0x0,0x30(%r8,%r11,4),%xmm0,%xmm0
DB 196,227,117,56,200,1 ; vinserti128 $0x1,%xmm0,%ymm1,%ymm1
- DB 196,161,126,111,4,130 ; vmovdqu (%rdx,%r8,4),%ymm0
- DB 196,161,122,111,100,130,32 ; vmovdqu 0x20(%rdx,%r8,4),%xmm4
+ DB 196,129,126,111,4,152 ; vmovdqu (%r8,%r11,4),%ymm0
+ DB 196,129,122,111,100,152,32 ; vmovdqu 0x20(%r8,%r11,4),%xmm4
DB 196,227,93,2,201,240 ; vpblendd $0xf0,%ymm1,%ymm4,%ymm1
- DB 233,199,254,255,255 ; jmpq 230a5 <_sk_load_8888_hsw_8bit+0x2e>
+ DB 233,196,254,255,255 ; jmpq 2307a <_sk_load_8888_hsw_8bit+0x29>
DB 102,144 ; xchg %ax,%ax
DB 242,254 ; repnz (bad)
DB 255 ; (bad)
@@ -33392,7 +33389,7 @@ _sk_load_8888_hsw_8bit LABEL PROC
DB 255 ; (bad)
DB 255 ; (bad)
DB 255 ; (bad)
- DB 191,254,255,255,150 ; mov $0x96fffffe,%edi
+ DB 188,254,255,255,150 ; mov $0x96fffffe,%esp
DB 255 ; (bad)
DB 255 ; (bad)
DB 255,136,255,255,255,114 ; decl 0x72ffffff(%rax)
@@ -33412,535 +33409,534 @@ _sk_load_8888_hsw_8bit LABEL PROC
PUBLIC _sk_load_8888_dst_hsw_8bit
_sk_load_8888_dst_hsw_8bit LABEL PROC
- DB 76,99,7 ; movslq (%rdi),%r8
- DB 76,139,79,16 ; mov 0x10(%rdi),%r9
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 72,99,72,8 ; movslq 0x8(%rax),%rcx
- DB 72,99,87,8 ; movslq 0x8(%rdi),%rdx
- DB 72,15,175,209 ; imul %rcx,%rdx
- DB 72,193,226,2 ; shl $0x2,%rdx
- DB 72,3,16 ; add (%rax),%rdx
- DB 77,133,201 ; test %r9,%r9
- DB 117,17 ; jne 2324e <_sk_load_8888_dst_hsw_8bit+0x32>
- DB 196,161,126,111,92,130,32 ; vmovdqu 0x20(%rdx,%r8,4),%ymm3
- DB 196,161,126,111,20,130 ; vmovdqu (%rdx,%r8,4),%ymm2
+ DB 76,99,72,8 ; movslq 0x8(%rax),%r9
+ DB 76,99,193 ; movslq %ecx,%r8
+ DB 77,15,175,193 ; imul %r9,%r8
+ DB 73,193,224,2 ; shl $0x2,%r8
+ DB 76,3,0 ; add (%rax),%r8
+ DB 76,99,218 ; movslq %edx,%r11
+ DB 72,133,255 ; test %rdi,%rdi
+ DB 117,17 ; jne 23221 <_sk_load_8888_dst_hsw_8bit+0x2d>
+ DB 196,129,126,111,92,152,32 ; vmovdqu 0x20(%r8,%r11,4),%ymm3
+ DB 196,129,126,111,20,152 ; vmovdqu (%r8,%r11,4),%ymm2
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
+ DB 65,137,249 ; mov %edi,%r9d
DB 65,128,225,15 ; and $0xf,%r9b
DB 197,229,239,219 ; vpxor %ymm3,%ymm3,%ymm3
DB 197,237,239,210 ; vpxor %ymm2,%ymm2,%ymm2
DB 65,254,201 ; dec %r9b
DB 65,128,249,14 ; cmp $0xe,%r9b
- DB 119,231 ; ja 2324a <_sk_load_8888_dst_hsw_8bit+0x2e>
- DB 65,15,182,193 ; movzbl %r9b,%eax
- DB 72,141,13,22,1,0,0 ; lea 0x116(%rip),%rcx # 23384 <_sk_load_8888_dst_hsw_8bit+0x168>
- DB 72,99,4,129 ; movslq (%rcx,%rax,4),%rax
- DB 72,1,200 ; add %rcx,%rax
+ DB 119,228 ; ja 2321d <_sk_load_8888_dst_hsw_8bit+0x29>
+ DB 69,15,182,201 ; movzbl %r9b,%r9d
+ DB 76,141,21,24,1,0,0 ; lea 0x118(%rip),%r10 # 2335c <_sk_load_8888_dst_hsw_8bit+0x168>
+ DB 75,99,4,138 ; movslq (%r10,%r9,4),%rax
+ DB 76,1,208 ; add %r10,%rax
DB 255,224 ; jmpq *%rax
- DB 196,161,121,110,20,130 ; vmovd (%rdx,%r8,4),%xmm2
- DB 235,203 ; jmp 2324a <_sk_load_8888_dst_hsw_8bit+0x2e>
- DB 196,161,121,110,84,130,8 ; vmovd 0x8(%rdx,%r8,4),%xmm2
+ DB 196,129,121,110,20,152 ; vmovd (%r8,%r11,4),%xmm2
+ DB 235,200 ; jmp 2321d <_sk_load_8888_dst_hsw_8bit+0x29>
+ DB 196,129,121,110,84,152,8 ; vmovd 0x8(%r8,%r11,4),%xmm2
DB 196,226,121,89,210 ; vpbroadcastq %xmm2,%xmm2
DB 197,229,239,219 ; vpxor %ymm3,%ymm3,%ymm3
DB 196,227,101,2,210,4 ; vpblendd $0x4,%ymm2,%ymm3,%ymm2
- DB 196,162,121,53,36,130 ; vpmovzxdq (%rdx,%r8,4),%xmm4
+ DB 196,130,121,53,36,152 ; vpmovzxdq (%r8,%r11,4),%xmm4
DB 197,249,112,228,232 ; vpshufd $0xe8,%xmm4,%xmm4
DB 196,227,109,2,212,3 ; vpblendd $0x3,%ymm4,%ymm2,%ymm2
- DB 235,162 ; jmp 2324a <_sk_load_8888_dst_hsw_8bit+0x2e>
- DB 196,161,121,110,84,130,24 ; vmovd 0x18(%rdx,%r8,4),%xmm2
+ DB 235,159 ; jmp 2321d <_sk_load_8888_dst_hsw_8bit+0x29>
+ DB 196,129,121,110,84,152,24 ; vmovd 0x18(%r8,%r11,4),%xmm2
DB 196,226,125,89,210 ; vpbroadcastq %xmm2,%ymm2
DB 197,229,239,219 ; vpxor %ymm3,%ymm3,%ymm3
DB 196,227,101,2,210,64 ; vpblendd $0x40,%ymm2,%ymm3,%ymm2
DB 196,227,125,57,212,1 ; vextracti128 $0x1,%ymm2,%xmm4
- DB 196,163,89,34,100,130,20,1 ; vpinsrd $0x1,0x14(%rdx,%r8,4),%xmm4,%xmm4
+ DB 196,131,89,34,100,152,20,1 ; vpinsrd $0x1,0x14(%r8,%r11,4),%xmm4,%xmm4
DB 196,227,109,56,212,1 ; vinserti128 $0x1,%xmm4,%ymm2,%ymm2
DB 196,227,125,57,212,1 ; vextracti128 $0x1,%ymm2,%xmm4
- DB 196,163,89,34,100,130,16,0 ; vpinsrd $0x0,0x10(%rdx,%r8,4),%xmm4,%xmm4
+ DB 196,131,89,34,100,152,16,0 ; vpinsrd $0x0,0x10(%r8,%r11,4),%xmm4,%xmm4
DB 196,227,109,56,212,1 ; vinserti128 $0x1,%xmm4,%ymm2,%ymm2
- DB 196,161,122,111,36,130 ; vmovdqu (%rdx,%r8,4),%xmm4
+ DB 196,129,122,111,36,152 ; vmovdqu (%r8,%r11,4),%xmm4
DB 196,227,93,2,210,240 ; vpblendd $0xf0,%ymm2,%ymm4,%ymm2
- DB 233,83,255,255,255 ; jmpq 2324a <_sk_load_8888_dst_hsw_8bit+0x2e>
- DB 196,161,121,110,84,130,40 ; vmovd 0x28(%rdx,%r8,4),%xmm2
+ DB 233,80,255,255,255 ; jmpq 2321d <_sk_load_8888_dst_hsw_8bit+0x29>
+ DB 196,129,121,110,84,152,40 ; vmovd 0x28(%r8,%r11,4),%xmm2
DB 196,226,121,89,210 ; vpbroadcastq %xmm2,%xmm2
DB 197,229,239,219 ; vpxor %ymm3,%ymm3,%ymm3
DB 196,227,101,2,218,4 ; vpblendd $0x4,%ymm2,%ymm3,%ymm3
- DB 196,163,97,34,84,130,36,1 ; vpinsrd $0x1,0x24(%rdx,%r8,4),%xmm3,%xmm2
+ DB 196,131,97,34,84,152,36,1 ; vpinsrd $0x1,0x24(%r8,%r11,4),%xmm3,%xmm2
DB 196,227,101,2,218,15 ; vpblendd $0xf,%ymm2,%ymm3,%ymm3
- DB 196,161,121,110,84,130,32 ; vmovd 0x20(%rdx,%r8,4),%xmm2
+ DB 196,129,121,110,84,152,32 ; vmovd 0x20(%r8,%r11,4),%xmm2
DB 196,227,101,2,218,1 ; vpblendd $0x1,%ymm2,%ymm3,%ymm3
- DB 233,23,255,255,255 ; jmpq 23244 <_sk_load_8888_dst_hsw_8bit+0x28>
- DB 196,161,121,110,84,130,56 ; vmovd 0x38(%rdx,%r8,4),%xmm2
+ DB 233,20,255,255,255 ; jmpq 23217 <_sk_load_8888_dst_hsw_8bit+0x23>
+ DB 196,129,121,110,84,152,56 ; vmovd 0x38(%r8,%r11,4),%xmm2
DB 196,226,125,89,210 ; vpbroadcastq %xmm2,%ymm2
DB 197,229,239,219 ; vpxor %ymm3,%ymm3,%ymm3
DB 196,227,101,2,218,64 ; vpblendd $0x40,%ymm2,%ymm3,%ymm3
DB 196,227,125,57,218,1 ; vextracti128 $0x1,%ymm3,%xmm2
- DB 196,163,105,34,84,130,52,1 ; vpinsrd $0x1,0x34(%rdx,%r8,4),%xmm2,%xmm2
+ DB 196,131,105,34,84,152,52,1 ; vpinsrd $0x1,0x34(%r8,%r11,4),%xmm2,%xmm2
DB 196,227,101,56,218,1 ; vinserti128 $0x1,%xmm2,%ymm3,%ymm3
DB 196,227,125,57,218,1 ; vextracti128 $0x1,%ymm3,%xmm2
- DB 196,163,105,34,84,130,48,0 ; vpinsrd $0x0,0x30(%rdx,%r8,4),%xmm2,%xmm2
+ DB 196,131,105,34,84,152,48,0 ; vpinsrd $0x0,0x30(%r8,%r11,4),%xmm2,%xmm2
DB 196,227,101,56,218,1 ; vinserti128 $0x1,%xmm2,%ymm3,%ymm3
- DB 196,161,126,111,20,130 ; vmovdqu (%rdx,%r8,4),%ymm2
- DB 196,161,122,111,100,130,32 ; vmovdqu 0x20(%rdx,%r8,4),%xmm4
+ DB 196,129,126,111,20,152 ; vmovdqu (%r8,%r11,4),%ymm2
+ DB 196,129,122,111,100,152,32 ; vmovdqu 0x20(%r8,%r11,4),%xmm4
DB 196,227,93,2,219,240 ; vpblendd $0xf0,%ymm3,%ymm4,%ymm3
- DB 233,199,254,255,255 ; jmpq 2324a <_sk_load_8888_dst_hsw_8bit+0x2e>
- DB 144 ; nop
- DB 243,254 ; repz (bad)
+ DB 233,196,254,255,255 ; jmpq 2321d <_sk_load_8888_dst_hsw_8bit+0x29>
+ DB 15,31,0 ; nopl (%rax)
+ DB 241 ; icebp
+ DB 254 ; (bad)
DB 255 ; (bad)
- DB 255,17 ; callq *(%rcx)
+ DB 255,15 ; decl (%rdi)
DB 255 ; (bad)
DB 255 ; (bad)
DB 255 ; (bad)
- DB 251 ; sti
+ DB 249 ; stc
DB 254 ; (bad)
DB 255 ; (bad)
- DB 255,98,255 ; jmpq *-0x1(%rdx)
+ DB 255,96,255 ; jmpq *-0x1(%rax)
DB 255 ; (bad)
- DB 255,78,255 ; decl -0x1(%rsi)
+ DB 255,76,255,255 ; decl -0x1(%rdi,%rdi,8)
DB 255 ; (bad)
+ DB 56,255 ; cmp %bh,%bh
DB 255 ; (bad)
- DB 58,255 ; cmp %bh,%bh
+ DB 255,34 ; jmpq *(%rdx)
DB 255 ; (bad)
- DB 255,36,255 ; jmpq *(%rdi,%rdi,8)
DB 255 ; (bad)
- DB 255,192 ; inc %eax
- DB 254 ; (bad)
DB 255 ; (bad)
- DB 255,151,255,255,255,137 ; callq *-0x76000001(%rdi)
+ DB 187,254,255,255,149 ; mov $0x95fffffe,%ebx
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,115,255 ; pushq -0x1(%rbx)
+ DB 255,135,255,255,255,113 ; incl 0x71ffffff(%rdi)
DB 255 ; (bad)
- DB 255,231 ; jmpq *%rdi
DB 255 ; (bad)
+ DB 255,229 ; jmpq *%rbp
DB 255 ; (bad)
- DB 255,211 ; callq *%rbx
DB 255 ; (bad)
+ DB 255,209 ; callq *%rcx
DB 255 ; (bad)
DB 255 ; (bad)
- DB 191,255,255,255,169 ; mov $0xa9ffffff,%edi
+ DB 255 ; (bad)
+ DB 189,255,255,255,167 ; mov $0xa7ffffff,%ebp
DB 255 ; (bad)
DB 255 ; (bad)
DB 255 ; .byte 0xff
PUBLIC _sk_store_8888_hsw_8bit
_sk_store_8888_hsw_8bit LABEL PROC
- DB 76,99,7 ; movslq (%rdi),%r8
- DB 76,139,79,16 ; mov 0x10(%rdi),%r9
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 72,99,72,8 ; movslq 0x8(%rax),%rcx
- DB 72,99,87,8 ; movslq 0x8(%rdi),%rdx
- DB 72,15,175,209 ; imul %rcx,%rdx
- DB 72,193,226,2 ; shl $0x2,%rdx
- DB 72,3,16 ; add (%rax),%rdx
- DB 77,133,201 ; test %r9,%r9
- DB 117,17 ; jne 233f2 <_sk_store_8888_hsw_8bit+0x32>
- DB 196,161,126,127,4,130 ; vmovdqu %ymm0,(%rdx,%r8,4)
- DB 196,161,126,127,76,130,32 ; vmovdqu %ymm1,0x20(%rdx,%r8,4)
+ DB 76,99,72,8 ; movslq 0x8(%rax),%r9
+ DB 76,99,193 ; movslq %ecx,%r8
+ DB 77,15,175,193 ; imul %r9,%r8
+ DB 73,193,224,2 ; shl $0x2,%r8
+ DB 76,3,0 ; add (%rax),%r8
+ DB 76,99,218 ; movslq %edx,%r11
+ DB 72,133,255 ; test %rdi,%rdi
+ DB 117,17 ; jne 233c5 <_sk_store_8888_hsw_8bit+0x2d>
+ DB 196,129,126,127,4,152 ; vmovdqu %ymm0,(%r8,%r11,4)
+ DB 196,129,126,127,76,152,32 ; vmovdqu %ymm1,0x20(%r8,%r11,4)
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
+ DB 65,137,249 ; mov %edi,%r9d
DB 65,128,225,15 ; and $0xf,%r9b
DB 65,254,201 ; dec %r9b
DB 65,128,249,14 ; cmp $0xe,%r9b
- DB 119,239 ; ja 233ee <_sk_store_8888_hsw_8bit+0x2e>
- DB 65,15,182,193 ; movzbl %r9b,%eax
- DB 72,141,13,178,0,0,0 ; lea 0xb2(%rip),%rcx # 234bc <_sk_store_8888_hsw_8bit+0xfc>
- DB 72,99,4,129 ; movslq (%rcx,%rax,4),%rax
- DB 72,1,200 ; add %rcx,%rax
- DB 255,224 ; jmpq *%rax
- DB 196,161,121,126,4,130 ; vmovd %xmm0,(%rdx,%r8,4)
- DB 235,211 ; jmp 233ee <_sk_store_8888_hsw_8bit+0x2e>
- DB 196,163,121,22,68,130,8,2 ; vpextrd $0x2,%xmm0,0x8(%rdx,%r8,4)
- DB 196,161,121,214,4,130 ; vmovq %xmm0,(%rdx,%r8,4)
- DB 235,195 ; jmp 233ee <_sk_store_8888_hsw_8bit+0x2e>
+ DB 119,236 ; ja 233c1 <_sk_store_8888_hsw_8bit+0x29>
+ DB 69,15,182,201 ; movzbl %r9b,%r9d
+ DB 76,141,21,176,0,0,0 ; lea 0xb0(%rip),%r10 # 23490 <_sk_store_8888_hsw_8bit+0xf8>
+ DB 75,99,4,138 ; movslq (%r10,%r9,4),%rax
+ DB 76,1,208 ; add %r10,%rax
+ DB 255,224 ; jmpq *%rax
+ DB 196,129,121,126,4,152 ; vmovd %xmm0,(%r8,%r11,4)
+ DB 235,208 ; jmp 233c1 <_sk_store_8888_hsw_8bit+0x29>
+ DB 196,131,121,22,68,152,8,2 ; vpextrd $0x2,%xmm0,0x8(%r8,%r11,4)
+ DB 196,129,121,214,4,152 ; vmovq %xmm0,(%r8,%r11,4)
+ DB 235,192 ; jmp 233c1 <_sk_store_8888_hsw_8bit+0x29>
DB 196,227,125,57,196,1 ; vextracti128 $0x1,%ymm0,%xmm4
- DB 196,163,121,22,100,130,24,2 ; vpextrd $0x2,%xmm4,0x18(%rdx,%r8,4)
+ DB 196,131,121,22,100,152,24,2 ; vpextrd $0x2,%xmm4,0x18(%r8,%r11,4)
DB 196,227,125,57,196,1 ; vextracti128 $0x1,%ymm0,%xmm4
- DB 196,163,121,22,100,130,20,1 ; vpextrd $0x1,%xmm4,0x14(%rdx,%r8,4)
+ DB 196,131,121,22,100,152,20,1 ; vpextrd $0x1,%xmm4,0x14(%r8,%r11,4)
DB 196,227,125,57,196,1 ; vextracti128 $0x1,%ymm0,%xmm4
- DB 196,161,121,126,100,130,16 ; vmovd %xmm4,0x10(%rdx,%r8,4)
- DB 196,161,122,127,4,130 ; vmovdqu %xmm0,(%rdx,%r8,4)
- DB 235,146 ; jmp 233ee <_sk_store_8888_hsw_8bit+0x2e>
- DB 196,163,121,22,76,130,40,2 ; vpextrd $0x2,%xmm1,0x28(%rdx,%r8,4)
- DB 196,163,121,22,76,130,36,1 ; vpextrd $0x1,%xmm1,0x24(%rdx,%r8,4)
- DB 196,161,121,126,76,130,32 ; vmovd %xmm1,0x20(%rdx,%r8,4)
- DB 196,161,126,127,4,130 ; vmovdqu %ymm0,(%rdx,%r8,4)
- DB 233,112,255,255,255 ; jmpq 233ee <_sk_store_8888_hsw_8bit+0x2e>
+ DB 196,129,121,126,100,152,16 ; vmovd %xmm4,0x10(%r8,%r11,4)
+ DB 196,129,122,127,4,152 ; vmovdqu %xmm0,(%r8,%r11,4)
+ DB 235,143 ; jmp 233c1 <_sk_store_8888_hsw_8bit+0x29>
+ DB 196,131,121,22,76,152,40,2 ; vpextrd $0x2,%xmm1,0x28(%r8,%r11,4)
+ DB 196,131,121,22,76,152,36,1 ; vpextrd $0x1,%xmm1,0x24(%r8,%r11,4)
+ DB 196,129,121,126,76,152,32 ; vmovd %xmm1,0x20(%r8,%r11,4)
+ DB 196,129,126,127,4,152 ; vmovdqu %ymm0,(%r8,%r11,4)
+ DB 233,109,255,255,255 ; jmpq 233c1 <_sk_store_8888_hsw_8bit+0x29>
DB 196,227,125,57,204,1 ; vextracti128 $0x1,%ymm1,%xmm4
- DB 196,163,121,22,100,130,56,2 ; vpextrd $0x2,%xmm4,0x38(%rdx,%r8,4)
+ DB 196,131,121,22,100,152,56,2 ; vpextrd $0x2,%xmm4,0x38(%r8,%r11,4)
DB 196,227,125,57,204,1 ; vextracti128 $0x1,%ymm1,%xmm4
- DB 196,163,121,22,100,130,52,1 ; vpextrd $0x1,%xmm4,0x34(%rdx,%r8,4)
+ DB 196,131,121,22,100,152,52,1 ; vpextrd $0x1,%xmm4,0x34(%r8,%r11,4)
DB 196,227,125,57,204,1 ; vextracti128 $0x1,%ymm1,%xmm4
- DB 196,161,121,126,100,130,48 ; vmovd %xmm4,0x30(%rdx,%r8,4)
- DB 196,161,126,127,4,130 ; vmovdqu %ymm0,(%rdx,%r8,4)
- DB 196,161,122,127,76,130,32 ; vmovdqu %xmm1,0x20(%rdx,%r8,4)
- DB 233,53,255,255,255 ; jmpq 233ee <_sk_store_8888_hsw_8bit+0x2e>
- DB 15,31,0 ; nopl (%rax)
- DB 87 ; push %rdi
+ DB 196,129,121,126,100,152,48 ; vmovd %xmm4,0x30(%r8,%r11,4)
+ DB 196,129,126,127,4,152 ; vmovdqu %ymm0,(%r8,%r11,4)
+ DB 196,129,122,127,76,152,32 ; vmovdqu %xmm1,0x20(%r8,%r11,4)
+ DB 233,50,255,255,255 ; jmpq 233c1 <_sk_store_8888_hsw_8bit+0x29>
+ DB 144 ; nop
+ DB 89 ; pop %rcx
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,103,255 ; jmpq *-0x1(%rdi)
+ DB 255,105,255 ; ljmp *-0x1(%rcx)
DB 255 ; (bad)
- DB 255,95,255 ; lcall *-0x1(%rdi)
+ DB 255,97,255 ; jmpq *-0x1(%rcx)
DB 255 ; (bad)
- DB 255,152,255,255,255,139 ; lcall *-0x74000001(%rax)
+ DB 255,154,255,255,255,141 ; lcall *-0x72000001(%rdx)
DB 255 ; (bad)
DB 255 ; (bad)
DB 255 ; (bad)
- DB 125,255 ; jge 234d1 <_sk_store_8888_hsw_8bit+0x111>
+ DB 127,255 ; jg 234a5 <_sk_store_8888_hsw_8bit+0x10d>
DB 255 ; (bad)
- DB 255,111,255 ; ljmp *-0x1(%rdi)
+ DB 255,113,255 ; pushq -0x1(%rcx)
DB 255 ; (bad)
- DB 255,183,255,255,255,176 ; pushq -0x4f000001(%rdi)
DB 255 ; (bad)
+ DB 185,255,255,255,178 ; mov $0xb2ffffff,%ecx
DB 255 ; (bad)
- DB 255,168,255,255,255,160 ; ljmp *-0x5f000001(%rax)
DB 255 ; (bad)
+ DB 255,170,255,255,255,162 ; ljmp *-0x5d000001(%rdx)
DB 255 ; (bad)
DB 255 ; (bad)
- DB 235,255 ; jmp 234e9 <_sk_store_8888_hsw_8bit+0x129>
DB 255 ; (bad)
+ DB 237 ; in (%dx),%eax
DB 255 ; (bad)
- DB 222,255 ; fdivrp %st,%st(7)
DB 255 ; (bad)
- DB 255,208 ; callq *%rax
+ DB 255,224 ; jmpq *%rax
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,194 ; inc %edx
+ DB 255,210 ; callq *%rdx
+ DB 255 ; (bad)
+ DB 255 ; (bad)
+ DB 255,196 ; inc %esp
DB 255 ; (bad)
DB 255 ; (bad)
DB 255 ; .byte 0xff
PUBLIC _sk_load_bgra_hsw_8bit
_sk_load_bgra_hsw_8bit LABEL PROC
- DB 76,99,7 ; movslq (%rdi),%r8
- DB 76,139,79,16 ; mov 0x10(%rdi),%r9
- DB 72,173 ; lods %ds:(%rsi),%rax
- DB 72,99,72,8 ; movslq 0x8(%rax),%rcx
- DB 72,99,87,8 ; movslq 0x8(%rdi),%rdx
- DB 72,15,175,209 ; imul %rcx,%rdx
- DB 72,193,226,2 ; shl $0x2,%rdx
- DB 72,3,16 ; add (%rax),%rdx
- DB 77,133,201 ; test %r9,%r9
- DB 117,35 ; jne 2353c <_sk_load_bgra_hsw_8bit+0x44>
- DB 196,161,126,111,76,130,32 ; vmovdqu 0x20(%rdx,%r8,4),%ymm1
- DB 196,161,126,111,4,130 ; vmovdqu (%rdx,%r8,4),%ymm0
- DB 197,253,111,37,50,146,0,0 ; vmovdqa 0x9232(%rip),%ymm4 # 2c760 <_sk_overlay_sse2_8bit+0xaeb>
+ DB 72,173 ; lods %ds:(%rsi),%rax
+ DB 76,99,72,8 ; movslq 0x8(%rax),%r9
+ DB 76,99,193 ; movslq %ecx,%r8
+ DB 77,15,175,193 ; imul %r9,%r8
+ DB 73,193,224,2 ; shl $0x2,%r8
+ DB 76,3,0 ; add (%rax),%r8
+ DB 76,99,218 ; movslq %edx,%r11
+ DB 72,133,255 ; test %rdi,%rdi
+ DB 117,35 ; jne 2350b <_sk_load_bgra_hsw_8bit+0x3f>
+ DB 196,129,126,111,76,152,32 ; vmovdqu 0x20(%r8,%r11,4),%ymm1
+ DB 196,129,126,111,4,152 ; vmovdqu (%r8,%r11,4),%ymm0
+ DB 197,253,111,37,163,145,0,0 ; vmovdqa 0x91a3(%rip),%ymm4 # 2c6a0 <_sk_overlay_sse2_8bit+0xaf0>
DB 196,226,125,0,196 ; vpshufb %ymm4,%ymm0,%ymm0
DB 196,226,117,0,204 ; vpshufb %ymm4,%ymm1,%ymm1
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
+ DB 65,137,249 ; mov %edi,%r9d
DB 65,128,225,15 ; and $0xf,%r9b
DB 197,245,239,201 ; vpxor %ymm1,%ymm1,%ymm1
DB 197,253,239,192 ; vpxor %ymm0,%ymm0,%ymm0
DB 65,254,201 ; dec %r9b
DB 65,128,249,14 ; cmp $0xe,%r9b
- DB 119,213 ; ja 23526 <_sk_load_bgra_hsw_8bit+0x2e>
- DB 65,15,182,193 ; movzbl %r9b,%eax
- DB 72,141,13,24,1,0,0 ; lea 0x118(%rip),%rcx # 23674 <_sk_load_bgra_hsw_8bit+0x17c>
- DB 72,99,4,129 ; movslq (%rcx,%rax,4),%rax
- DB 72,1,200 ; add %rcx,%rax
+ DB 119,210 ; ja 234f5 <_sk_load_bgra_hsw_8bit+0x29>
+ DB 69,15,182,201 ; movzbl %r9b,%r9d
+ DB 76,141,21,22,1,0,0 ; lea 0x116(%rip),%r10 # 23644 <_sk_load_bgra_hsw_8bit+0x178>
+ DB 75,99,4,138 ; movslq (%r10,%r9,4),%rax
+ DB 76,1,208 ; add %r10,%rax
DB 255,224 ; jmpq *%rax
- DB 196,161,121,110,4,130 ; vmovd (%rdx,%r8,4),%xmm0
- DB 235,185 ; jmp 23526 <_sk_load_bgra_hsw_8bit+0x2e>
- DB 196,161,121,110,68,130,8 ; vmovd 0x8(%rdx,%r8,4),%xmm0
+ DB 196,129,121,110,4,152 ; vmovd (%r8,%r11,4),%xmm0
+ DB 235,182 ; jmp 234f5 <_sk_load_bgra_hsw_8bit+0x29>
+ DB 196,129,121,110,68,152,8 ; vmovd 0x8(%r8,%r11,4),%xmm0
DB 196,226,121,89,192 ; vpbroadcastq %xmm0,%xmm0
DB 197,245,239,201 ; vpxor %ymm1,%ymm1,%ymm1
DB 196,227,117,2,192,4 ; vpblendd $0x4,%ymm0,%ymm1,%ymm0
- DB 196,162,121,53,36,130 ; vpmovzxdq (%rdx,%r8,4),%xmm4
+ DB 196,130,121,53,36,152 ; vpmovzxdq (%r8,%r11,4),%xmm4
DB 197,249,112,228,232 ; vpshufd $0xe8,%xmm4,%xmm4
DB 196,227,125,2,196,3 ; vpblendd $0x3,%ymm4,%ymm0,%ymm0
- DB 235,144 ; jmp 23526 <_sk_load_bgra_hsw_8bit+0x2e>
- DB 196,161,121,110,68,130,24 ; vmovd 0x18(%rdx,%r8,4),%xmm0
+ DB 235,141 ; jmp 234f5 <_sk_load_bgra_hsw_8bit+0x29>
+ DB 196,129,121,110,68,152,24 ; vmovd 0x18(%r8,%r11,4),%xmm0
DB 196,226,125,89,192 ; vpbroadcastq %xmm0,%ymm0
DB 197,245,239,201 ; vpxor %ymm1,%ymm1,%ymm1
DB 196,227,117,2,192,64 ; vpblendd $0x40,%ymm0,%ymm1,%ymm0
DB 196,227,125,57,196,1 ; vextracti128 $0x1,%ymm0,%xmm4
- DB 196,163,89,34,100,130,20,1 ; vpinsrd $0x1,0x14(%rdx,%r8,4),%xmm4,%xmm4
+ DB 196,131,89,34,100,152,20,1 ; vpinsrd $0x1,0x14(%r8,%r11,4),%xmm4,%xmm4
DB 196,227,125,56,196,1 ; vinserti128 $0x1,%xmm4,%ymm0,%ymm0
DB 196,227,125,57,196,1 ; vextracti128 $0x1,%ymm0,%xmm4
- DB 196,163,89,34,100,130,16,0 ; vpinsrd $0x0,0x10(%rdx,%r8,4),%xmm4,%xmm4
+ DB 196,131,89,34,100,152,16,0 ; vpinsrd $0x0,0x10(%r8,%r11,4),%xmm4,%xmm4
DB 196,227,125,56,196,1 ; vinserti128 $0x1,%xmm4,%ymm0,%ymm0
- DB 196,161,122,111,36,130 ; vmovdqu (%rdx,%r8,4),%xmm4
+ DB 196,129,122,111,36,152 ; vmovdqu (%r8,%r11,4),%xmm4
DB 196,227,93,2,192,240 ; vpblendd $0xf0,%ymm0,%ymm4,%ymm0
- DB 233,65,255,255,255 ; jmpq 23526 <_sk_load_bgra_hsw_8bit+0x2e>
- DB 196,161,121,110,68,130,40 ; vmovd 0x28(%rdx,%r8,4),%xmm0
+ DB 233,62,255,255,255 ; jmpq 234f5 <_sk_load_bgra_hsw_8bit+0x29>
+ DB 196,129,121,110,68,152,40 ; vmovd 0x28(%r8,%r11,4),%xmm0
DB 196,226,121,89,192 ; vpbroadcastq %xmm0,%xmm0
DB 197,245,239,201 ; vpxor %ymm1,%ymm1,%ymm1
DB 196,227,117,2,200,4 ; vpblendd $0x4,%ymm0,%ymm1,%ymm1
- DB 196,163,113,34,68,130,36,1 ; vpinsrd $0x1,0x24(%rdx,%r8,4),%xmm1,%xmm0
+ DB 196,131,113,34,68,152,36,1 ; vpinsrd $0x1,0x24(%r8,%r11,4),%xmm1,%xmm0
DB 196,227,117,2,200,15 ; vpblendd $0xf,%ymm0,%ymm1,%ymm1
- DB 196,161,121,110,68,130,32 ; vmovd 0x20(%rdx,%r8,4),%xmm0
+ DB 196,129,121,110,68,152,32 ; vmovd 0x20(%r8,%r11,4),%xmm0
DB 196,227,117,2,200,1 ; vpblendd $0x1,%ymm0,%ymm1,%ymm1
- DB 233,5,255,255,255 ; jmpq 23520 <_sk_load_bgra_hsw_8bit+0x28>
- DB 196,161,121,110,68,130,56 ; vmovd 0x38(%rdx,%r8,4),%xmm0
+ DB 233,2,255,255,255 ; jmpq 234ef <_sk_load_bgra_hsw_8bit+0x23>
+ DB 196,129,121,110,68,152,56 ; vmovd 0x38(%r8,%r11,4),%xmm0
DB 196,226,125,89,192 ; vpbroadcastq %xmm0,%ymm0
DB 197,245,239,201 ; vpxor %ymm1,%ymm1,%ymm1
DB 196,227,117,2,200,64 ; vpblendd $0x40,%ymm0,%ymm1,%ymm1
DB 196,227,125,57,200,1 ; vextracti128 $0x1,%ymm1,%xmm0
- DB 196,163,121,34,68,130,52,1 ; vpinsrd $0x1,0x34(%rdx,%r8,4),%xmm0,%xmm0
+ DB 196,131,121,34,68,152,52,1 ; vpinsrd $0x1,0x34(%r8,%r11,4),%xmm0,%xmm0
DB 196,227,117,56,200,1 ; vinserti128 $0x1,%xmm0,%ymm1,%ymm1
DB 196,227,125,57,200,1 ; vextracti128 $0x1,%ymm1,%xmm0
- DB 196,163,121,34,68,130,48,0 ; vpinsrd $0x0,0x30(%rdx,%r8,4),%xmm0,%xmm0
+ DB 196,131,121,34,68,152,48,0 ; vpinsrd $0x0,0x30(%r8,%r11,4),%xmm0,%xmm0
DB 196,227,117,56,200,1 ; vinserti128 $0x1,%xmm0,%ymm1,%ymm1
- DB 196,161,126,111,4,130 ; vmovdqu (%rdx,%r8,4),%ymm0
- DB 196,161,122,111,100,130,32 ; vmovdqu 0x20(%rdx,%r8,4),%xmm4
+ DB 196,129,126,111,4,152 ; vmovdqu (%r8,%r11,4),%ymm0
+ DB 196,129,122,111,100,152,32 ; vmovdqu 0x20(%r8,%r11,4),%xmm4
DB 196,227,93,2,201,240 ; vpblendd $0xf0,%ymm1,%ymm4,%ymm1
- DB 233,181,254,255,255 ; jmpq 23526 <_sk_load_bgra_hsw_8bit+0x2e>
- DB 15,31,0 ; nopl (%rax)
- DB 241 ; icebp
- DB 254 ; (bad)
+ DB 233,178,254,255,255 ; jmpq 234f5 <_sk_load_bgra_hsw_8bit+0x29>
+ DB 144 ; nop
+ DB 243,254 ; repz (bad)
DB 255 ; (bad)
- DB 255,15 ; decl (%rdi)
+ DB 255,17 ; callq *(%rcx)
DB 255 ; (bad)
DB 255 ; (bad)
DB 255 ; (bad)
- DB 249 ; stc
+ DB 251 ; sti
DB 254 ; (bad)
DB 255 ; (bad)
- DB 255,96,255 ; jmpq *-0x1(%rax)
+ DB 255,98,255 ; jmpq *-0x1(%rdx)
DB 255 ; (bad)
- DB 255,76,255,255 ; decl -0x1(%rdi,%rdi,8)
+ DB 255,78,255 ; decl -0x1(%rsi)
DB 255 ; (bad)
- DB 56,255 ; cmp %bh,%bh
DB 255 ; (bad)
- DB 255,34 ; jmpq *(%rdx)
+ DB 58,255 ; cmp %bh,%bh
DB 255 ; (bad)
+ DB 255,36,255 ; jmpq *(%rdi,%rdi,8)
DB 255 ; (bad)
- DB 255,172,254,255,255,149,255 ; ljmp *-0x6a0001(%rsi,%rdi,8)
+ DB 255,171,254,255,255,151 ; ljmp *-0x68000002(%rbx)
DB 255 ; (bad)
- DB 255,135,255,255,255,113 ; incl 0x71ffffff(%rdi)
DB 255 ; (bad)
+ DB 255,137,255,255,255,115 ; decl 0x73ffffff(%rcx)
DB 255 ; (bad)
- DB 255,229 ; jmpq *%rbp
DB 255 ; (bad)
+ DB 255,231 ; jmpq *%rdi
DB 255 ; (bad)
- DB 255,209 ; callq *%rcx
+ DB 255 ; (bad)
+ DB 255,211 ; callq *%rbx
DB 255 ; (bad)
DB 255 ; (bad)
DB 255 ; (bad)
- DB 189,255,255,255,167 ; mov $0xa7ffffff,%ebp
+ DB 191,255,255,255,169 ; mov $0xa9ffffff,%edi
DB 255 ; (bad)
DB 255 ; (bad)
DB 255 ; .byte 0xff
PUBLIC _sk_load_bgra_dst_hsw_8bit
_sk_load_bgra_dst_hsw_8bit LABEL PROC
- DB 76,99,7 ; movslq (%rdi),%r8
- DB 76,139,79,16 ; mov 0x10(%rdi),%r9
- DB 72,173 ; lods %ds:(%rsi),%rax
- DB 72,99,72,8 ; movslq 0x8(%rax),%rcx
- DB 72,99,87,8 ; movslq 0x8(%rdi),%rdx
- DB 72,15,175,209 ; imul %rcx,%rdx
- DB 72,193,226,2 ; shl $0x2,%rdx
- DB 72,3,16 ; add (%rax),%rdx
- DB 77,133,201 ; test %r9,%r9
- DB 117,35 ; jne 236f4 <_sk_load_bgra_dst_hsw_8bit+0x44>
- DB 196,161,126,111,92,130,32 ; vmovdqu 0x20(%rdx,%r8,4),%ymm3
- DB 196,161,126,111,20,130 ; vmovdqu (%rdx,%r8,4),%ymm2
- DB 197,253,111,37,154,144,0,0 ; vmovdqa 0x909a(%rip),%ymm4 # 2c780 <_sk_overlay_sse2_8bit+0xb0b>
+ DB 72,173 ; lods %ds:(%rsi),%rax
+ DB 76,99,72,8 ; movslq 0x8(%rax),%r9
+ DB 76,99,193 ; movslq %ecx,%r8
+ DB 77,15,175,193 ; imul %r9,%r8
+ DB 73,193,224,2 ; shl $0x2,%r8
+ DB 76,3,0 ; add (%rax),%r8
+ DB 76,99,218 ; movslq %edx,%r11
+ DB 72,133,255 ; test %rdi,%rdi
+ DB 117,35 ; jne 236bf <_sk_load_bgra_dst_hsw_8bit+0x3f>
+ DB 196,129,126,111,92,152,32 ; vmovdqu 0x20(%r8,%r11,4),%ymm3
+ DB 196,129,126,111,20,152 ; vmovdqu (%r8,%r11,4),%ymm2
+ DB 197,253,111,37,15,144,0,0 ; vmovdqa 0x900f(%rip),%ymm4 # 2c6c0 <_sk_overlay_sse2_8bit+0xb10>
DB 196,226,109,0,212 ; vpshufb %ymm4,%ymm2,%ymm2
DB 196,226,101,0,220 ; vpshufb %ymm4,%ymm3,%ymm3
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
+ DB 65,137,249 ; mov %edi,%r9d
DB 65,128,225,15 ; and $0xf,%r9b
DB 197,229,239,219 ; vpxor %ymm3,%ymm3,%ymm3
DB 197,237,239,210 ; vpxor %ymm2,%ymm2,%ymm2
DB 65,254,201 ; dec %r9b
DB 65,128,249,14 ; cmp $0xe,%r9b
- DB 119,213 ; ja 236de <_sk_load_bgra_dst_hsw_8bit+0x2e>
- DB 65,15,182,193 ; movzbl %r9b,%eax
- DB 72,141,13,24,1,0,0 ; lea 0x118(%rip),%rcx # 2382c <_sk_load_bgra_dst_hsw_8bit+0x17c>
- DB 72,99,4,129 ; movslq (%rcx,%rax,4),%rax
- DB 72,1,200 ; add %rcx,%rax
+ DB 119,210 ; ja 236a9 <_sk_load_bgra_dst_hsw_8bit+0x29>
+ DB 69,15,182,201 ; movzbl %r9b,%r9d
+ DB 76,141,21,22,1,0,0 ; lea 0x116(%rip),%r10 # 237f8 <_sk_load_bgra_dst_hsw_8bit+0x178>
+ DB 75,99,4,138 ; movslq (%r10,%r9,4),%rax
+ DB 76,1,208 ; add %r10,%rax
DB 255,224 ; jmpq *%rax
- DB 196,161,121,110,20,130 ; vmovd (%rdx,%r8,4),%xmm2
- DB 235,185 ; jmp 236de <_sk_load_bgra_dst_hsw_8bit+0x2e>
- DB 196,161,121,110,84,130,8 ; vmovd 0x8(%rdx,%r8,4),%xmm2
+ DB 196,129,121,110,20,152 ; vmovd (%r8,%r11,4),%xmm2
+ DB 235,182 ; jmp 236a9 <_sk_load_bgra_dst_hsw_8bit+0x29>
+ DB 196,129,121,110,84,152,8 ; vmovd 0x8(%r8,%r11,4),%xmm2
DB 196,226,121,89,210 ; vpbroadcastq %xmm2,%xmm2
DB 197,229,239,219 ; vpxor %ymm3,%ymm3,%ymm3
DB 196,227,101,2,210,4 ; vpblendd $0x4,%ymm2,%ymm3,%ymm2
- DB 196,162,121,53,36,130 ; vpmovzxdq (%rdx,%r8,4),%xmm4
+ DB 196,130,121,53,36,152 ; vpmovzxdq (%r8,%r11,4),%xmm4
DB 197,249,112,228,232 ; vpshufd $0xe8,%xmm4,%xmm4
DB 196,227,109,2,212,3 ; vpblendd $0x3,%ymm4,%ymm2,%ymm2
- DB 235,144 ; jmp 236de <_sk_load_bgra_dst_hsw_8bit+0x2e>
- DB 196,161,121,110,84,130,24 ; vmovd 0x18(%rdx,%r8,4),%xmm2
+ DB 235,141 ; jmp 236a9 <_sk_load_bgra_dst_hsw_8bit+0x29>
+ DB 196,129,121,110,84,152,24 ; vmovd 0x18(%r8,%r11,4),%xmm2
DB 196,226,125,89,210 ; vpbroadcastq %xmm2,%ymm2
DB 197,229,239,219 ; vpxor %ymm3,%ymm3,%ymm3
DB 196,227,101,2,210,64 ; vpblendd $0x40,%ymm2,%ymm3,%ymm2
DB 196,227,125,57,212,1 ; vextracti128 $0x1,%ymm2,%xmm4
- DB 196,163,89,34,100,130,20,1 ; vpinsrd $0x1,0x14(%rdx,%r8,4),%xmm4,%xmm4
+ DB 196,131,89,34,100,152,20,1 ; vpinsrd $0x1,0x14(%r8,%r11,4),%xmm4,%xmm4
DB 196,227,109,56,212,1 ; vinserti128 $0x1,%xmm4,%ymm2,%ymm2
DB 196,227,125,57,212,1 ; vextracti128 $0x1,%ymm2,%xmm4
- DB 196,163,89,34,100,130,16,0 ; vpinsrd $0x0,0x10(%rdx,%r8,4),%xmm4,%xmm4
+ DB 196,131,89,34,100,152,16,0 ; vpinsrd $0x0,0x10(%r8,%r11,4),%xmm4,%xmm4
DB 196,227,109,56,212,1 ; vinserti128 $0x1,%xmm4,%ymm2,%ymm2
- DB 196,161,122,111,36,130 ; vmovdqu (%rdx,%r8,4),%xmm4
+ DB 196,129,122,111,36,152 ; vmovdqu (%r8,%r11,4),%xmm4
DB 196,227,93,2,210,240 ; vpblendd $0xf0,%ymm2,%ymm4,%ymm2
- DB 233,65,255,255,255 ; jmpq 236de <_sk_load_bgra_dst_hsw_8bit+0x2e>
- DB 196,161,121,110,84,130,40 ; vmovd 0x28(%rdx,%r8,4),%xmm2
+ DB 233,62,255,255,255 ; jmpq 236a9 <_sk_load_bgra_dst_hsw_8bit+0x29>
+ DB 196,129,121,110,84,152,40 ; vmovd 0x28(%r8,%r11,4),%xmm2
DB 196,226,121,89,210 ; vpbroadcastq %xmm2,%xmm2
DB 197,229,239,219 ; vpxor %ymm3,%ymm3,%ymm3
DB 196,227,101,2,218,4 ; vpblendd $0x4,%ymm2,%ymm3,%ymm3
- DB 196,163,97,34,84,130,36,1 ; vpinsrd $0x1,0x24(%rdx,%r8,4),%xmm3,%xmm2
+ DB 196,131,97,34,84,152,36,1 ; vpinsrd $0x1,0x24(%r8,%r11,4),%xmm3,%xmm2
DB 196,227,101,2,218,15 ; vpblendd $0xf,%ymm2,%ymm3,%ymm3
- DB 196,161,121,110,84,130,32 ; vmovd 0x20(%rdx,%r8,4),%xmm2
+ DB 196,129,121,110,84,152,32 ; vmovd 0x20(%r8,%r11,4),%xmm2
DB 196,227,101,2,218,1 ; vpblendd $0x1,%ymm2,%ymm3,%ymm3
- DB 233,5,255,255,255 ; jmpq 236d8 <_sk_load_bgra_dst_hsw_8bit+0x28>
- DB 196,161,121,110,84,130,56 ; vmovd 0x38(%rdx,%r8,4),%xmm2
+ DB 233,2,255,255,255 ; jmpq 236a3 <_sk_load_bgra_dst_hsw_8bit+0x23>
+ DB 196,129,121,110,84,152,56 ; vmovd 0x38(%r8,%r11,4),%xmm2
DB 196,226,125,89,210 ; vpbroadcastq %xmm2,%ymm2
DB 197,229,239,219 ; vpxor %ymm3,%ymm3,%ymm3
DB 196,227,101,2,218,64 ; vpblendd $0x40,%ymm2,%ymm3,%ymm3
DB 196,227,125,57,218,1 ; vextracti128 $0x1,%ymm3,%xmm2
- DB 196,163,105,34,84,130,52,1 ; vpinsrd $0x1,0x34(%rdx,%r8,4),%xmm2,%xmm2
+ DB 196,131,105,34,84,152,52,1 ; vpinsrd $0x1,0x34(%r8,%r11,4),%xmm2,%xmm2
DB 196,227,101,56,218,1 ; vinserti128 $0x1,%xmm2,%ymm3,%ymm3
DB 196,227,125,57,218,1 ; vextracti128 $0x1,%ymm3,%xmm2
- DB 196,163,105,34,84,130,48,0 ; vpinsrd $0x0,0x30(%rdx,%r8,4),%xmm2,%xmm2
+ DB 196,131,105,34,84,152,48,0 ; vpinsrd $0x0,0x30(%r8,%r11,4),%xmm2,%xmm2
DB 196,227,101,56,218,1 ; vinserti128 $0x1,%xmm2,%ymm3,%ymm3
- DB 196,161,126,111,20,130 ; vmovdqu (%rdx,%r8,4),%ymm2
- DB 196,161,122,111,100,130,32 ; vmovdqu 0x20(%rdx,%r8,4),%xmm4
+ DB 196,129,126,111,20,152 ; vmovdqu (%r8,%r11,4),%ymm2
+ DB 196,129,122,111,100,152,32 ; vmovdqu 0x20(%r8,%r11,4),%xmm4
DB 196,227,93,2,219,240 ; vpblendd $0xf0,%ymm3,%ymm4,%ymm3
- DB 233,181,254,255,255 ; jmpq 236de <_sk_load_bgra_dst_hsw_8bit+0x2e>
- DB 15,31,0 ; nopl (%rax)
- DB 241 ; icebp
- DB 254 ; (bad)
+ DB 233,178,254,255,255 ; jmpq 236a9 <_sk_load_bgra_dst_hsw_8bit+0x29>
+ DB 144 ; nop
+ DB 243,254 ; repz (bad)
DB 255 ; (bad)
- DB 255,15 ; decl (%rdi)
+ DB 255,17 ; callq *(%rcx)
DB 255 ; (bad)
DB 255 ; (bad)
DB 255 ; (bad)
- DB 249 ; stc
+ DB 251 ; sti
DB 254 ; (bad)
DB 255 ; (bad)
- DB 255,96,255 ; jmpq *-0x1(%rax)
+ DB 255,98,255 ; jmpq *-0x1(%rdx)
DB 255 ; (bad)
- DB 255,76,255,255 ; decl -0x1(%rdi,%rdi,8)
+ DB 255,78,255 ; decl -0x1(%rsi)
DB 255 ; (bad)
- DB 56,255 ; cmp %bh,%bh
DB 255 ; (bad)
- DB 255,34 ; jmpq *(%rdx)
+ DB 58,255 ; cmp %bh,%bh
DB 255 ; (bad)
+ DB 255,36,255 ; jmpq *(%rdi,%rdi,8)
DB 255 ; (bad)
- DB 255,172,254,255,255,149,255 ; ljmp *-0x6a0001(%rsi,%rdi,8)
+ DB 255,171,254,255,255,151 ; ljmp *-0x68000002(%rbx)
DB 255 ; (bad)
- DB 255,135,255,255,255,113 ; incl 0x71ffffff(%rdi)
DB 255 ; (bad)
+ DB 255,137,255,255,255,115 ; decl 0x73ffffff(%rcx)
DB 255 ; (bad)
- DB 255,229 ; jmpq *%rbp
DB 255 ; (bad)
+ DB 255,231 ; jmpq *%rdi
DB 255 ; (bad)
- DB 255,209 ; callq *%rcx
DB 255 ; (bad)
+ DB 255,211 ; callq *%rbx
DB 255 ; (bad)
DB 255 ; (bad)
- DB 189,255,255,255,167 ; mov $0xa7ffffff,%ebp
+ DB 255 ; (bad)
+ DB 191,255,255,255,169 ; mov $0xa9ffffff,%edi
DB 255 ; (bad)
DB 255 ; (bad)
DB 255 ; .byte 0xff
PUBLIC _sk_store_bgra_hsw_8bit
_sk_store_bgra_hsw_8bit LABEL PROC
- DB 76,99,7 ; movslq (%rdi),%r8
- DB 76,139,79,16 ; mov 0x10(%rdi),%r9
- DB 72,173 ; lods %ds:(%rsi),%rax
- DB 72,99,72,8 ; movslq 0x8(%rax),%rcx
- DB 72,99,87,8 ; movslq 0x8(%rdi),%rdx
- DB 72,15,175,209 ; imul %rcx,%rdx
- DB 72,193,226,2 ; shl $0x2,%rdx
- DB 72,3,16 ; add (%rax),%rdx
- DB 197,253,111,37,20,143,0,0 ; vmovdqa 0x8f14(%rip),%ymm4 # 2c7a0 <_sk_overlay_sse2_8bit+0xb2b>
+ DB 72,173 ; lods %ds:(%rsi),%rax
+ DB 76,99,72,8 ; movslq 0x8(%rax),%r9
+ DB 76,99,193 ; movslq %ecx,%r8
+ DB 77,15,175,193 ; imul %r9,%r8
+ DB 73,193,224,2 ; shl $0x2,%r8
+ DB 76,3,0 ; add (%rax),%r8
+ DB 76,99,218 ; movslq %edx,%r11
+ DB 197,253,111,37,141,142,0,0 ; vmovdqa 0x8e8d(%rip),%ymm4 # 2c6e0 <_sk_overlay_sse2_8bit+0xb30>
DB 196,226,117,0,236 ; vpshufb %ymm4,%ymm1,%ymm5
DB 196,226,125,0,228 ; vpshufb %ymm4,%ymm0,%ymm4
- DB 77,133,201 ; test %r9,%r9
- DB 117,17 ; jne 238ac <_sk_store_bgra_hsw_8bit+0x44>
- DB 196,161,126,127,36,130 ; vmovdqu %ymm4,(%rdx,%r8,4)
- DB 196,161,126,127,108,130,32 ; vmovdqu %ymm5,0x20(%rdx,%r8,4)
+ DB 72,133,255 ; test %rdi,%rdi
+ DB 117,17 ; jne 23873 <_sk_store_bgra_hsw_8bit+0x3f>
+ DB 196,129,126,127,36,152 ; vmovdqu %ymm4,(%r8,%r11,4)
+ DB 196,129,126,127,108,152,32 ; vmovdqu %ymm5,0x20(%r8,%r11,4)
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
+ DB 65,137,249 ; mov %edi,%r9d
DB 65,128,225,15 ; and $0xf,%r9b
DB 65,254,201 ; dec %r9b
DB 65,128,249,14 ; cmp $0xe,%r9b
- DB 119,239 ; ja 238a8 <_sk_store_bgra_hsw_8bit+0x40>
- DB 65,15,182,193 ; movzbl %r9b,%eax
- DB 72,141,13,176,0,0,0 ; lea 0xb0(%rip),%rcx # 23974 <_sk_store_bgra_hsw_8bit+0x10c>
- DB 72,99,4,129 ; movslq (%rcx,%rax,4),%rax
- DB 72,1,200 ; add %rcx,%rax
- DB 255,224 ; jmpq *%rax
- DB 196,161,121,126,36,130 ; vmovd %xmm4,(%rdx,%r8,4)
- DB 235,211 ; jmp 238a8 <_sk_store_bgra_hsw_8bit+0x40>
- DB 196,163,121,22,100,130,8,2 ; vpextrd $0x2,%xmm4,0x8(%rdx,%r8,4)
- DB 196,161,121,214,36,130 ; vmovq %xmm4,(%rdx,%r8,4)
- DB 235,195 ; jmp 238a8 <_sk_store_bgra_hsw_8bit+0x40>
+ DB 119,236 ; ja 2386f <_sk_store_bgra_hsw_8bit+0x3b>
+ DB 69,15,182,201 ; movzbl %r9b,%r9d
+ DB 76,141,21,178,0,0,0 ; lea 0xb2(%rip),%r10 # 23940 <_sk_store_bgra_hsw_8bit+0x10c>
+ DB 75,99,4,138 ; movslq (%r10,%r9,4),%rax
+ DB 76,1,208 ; add %r10,%rax
+ DB 255,224 ; jmpq *%rax
+ DB 196,129,121,126,36,152 ; vmovd %xmm4,(%r8,%r11,4)
+ DB 235,208 ; jmp 2386f <_sk_store_bgra_hsw_8bit+0x3b>
+ DB 196,131,121,22,100,152,8,2 ; vpextrd $0x2,%xmm4,0x8(%r8,%r11,4)
+ DB 196,129,121,214,36,152 ; vmovq %xmm4,(%r8,%r11,4)
+ DB 235,192 ; jmp 2386f <_sk_store_bgra_hsw_8bit+0x3b>
DB 196,227,125,57,229,1 ; vextracti128 $0x1,%ymm4,%xmm5
- DB 196,163,121,22,108,130,24,2 ; vpextrd $0x2,%xmm5,0x18(%rdx,%r8,4)
+ DB 196,131,121,22,108,152,24,2 ; vpextrd $0x2,%xmm5,0x18(%r8,%r11,4)
DB 196,227,125,57,229,1 ; vextracti128 $0x1,%ymm4,%xmm5
- DB 196,163,121,22,108,130,20,1 ; vpextrd $0x1,%xmm5,0x14(%rdx,%r8,4)
+ DB 196,131,121,22,108,152,20,1 ; vpextrd $0x1,%xmm5,0x14(%r8,%r11,4)
DB 196,227,125,57,229,1 ; vextracti128 $0x1,%ymm4,%xmm5
- DB 196,161,121,126,108,130,16 ; vmovd %xmm5,0x10(%rdx,%r8,4)
- DB 196,161,122,127,36,130 ; vmovdqu %xmm4,(%rdx,%r8,4)
- DB 235,146 ; jmp 238a8 <_sk_store_bgra_hsw_8bit+0x40>
- DB 196,163,121,22,108,130,40,2 ; vpextrd $0x2,%xmm5,0x28(%rdx,%r8,4)
- DB 196,163,121,22,108,130,36,1 ; vpextrd $0x1,%xmm5,0x24(%rdx,%r8,4)
- DB 196,161,121,126,108,130,32 ; vmovd %xmm5,0x20(%rdx,%r8,4)
- DB 196,161,126,127,36,130 ; vmovdqu %ymm4,(%rdx,%r8,4)
- DB 233,112,255,255,255 ; jmpq 238a8 <_sk_store_bgra_hsw_8bit+0x40>
+ DB 196,129,121,126,108,152,16 ; vmovd %xmm5,0x10(%r8,%r11,4)
+ DB 196,129,122,127,36,152 ; vmovdqu %xmm4,(%r8,%r11,4)
+ DB 235,143 ; jmp 2386f <_sk_store_bgra_hsw_8bit+0x3b>
+ DB 196,131,121,22,108,152,40,2 ; vpextrd $0x2,%xmm5,0x28(%r8,%r11,4)
+ DB 196,131,121,22,108,152,36,1 ; vpextrd $0x1,%xmm5,0x24(%r8,%r11,4)
+ DB 196,129,121,126,108,152,32 ; vmovd %xmm5,0x20(%r8,%r11,4)
+ DB 196,129,126,127,36,152 ; vmovdqu %ymm4,(%r8,%r11,4)
+ DB 233,109,255,255,255 ; jmpq 2386f <_sk_store_bgra_hsw_8bit+0x3b>
DB 196,227,125,57,238,1 ; vextracti128 $0x1,%ymm5,%xmm6
- DB 196,163,121,22,116,130,56,2 ; vpextrd $0x2,%xmm6,0x38(%rdx,%r8,4)
+ DB 196,131,121,22,116,152,56,2 ; vpextrd $0x2,%xmm6,0x38(%r8,%r11,4)
DB 196,227,125,57,238,1 ; vextracti128 $0x1,%ymm5,%xmm6
- DB 196,163,121,22,116,130,52,1 ; vpextrd $0x1,%xmm6,0x34(%rdx,%r8,4)
+ DB 196,131,121,22,116,152,52,1 ; vpextrd $0x1,%xmm6,0x34(%r8,%r11,4)
DB 196,227,125,57,238,1 ; vextracti128 $0x1,%ymm5,%xmm6
- DB 196,161,121,126,116,130,48 ; vmovd %xmm6,0x30(%rdx,%r8,4)
- DB 196,161,126,127,36,130 ; vmovdqu %ymm4,(%rdx,%r8,4)
- DB 196,161,122,127,108,130,32 ; vmovdqu %xmm5,0x20(%rdx,%r8,4)
- DB 233,53,255,255,255 ; jmpq 238a8 <_sk_store_bgra_hsw_8bit+0x40>
- DB 144 ; nop
- DB 89 ; pop %rcx
- DB 255 ; (bad)
- DB 255 ; (bad)
- DB 255,105,255 ; ljmp *-0x1(%rcx)
+ DB 196,129,121,126,116,152,48 ; vmovd %xmm6,0x30(%r8,%r11,4)
+ DB 196,129,126,127,36,152 ; vmovdqu %ymm4,(%r8,%r11,4)
+ DB 196,129,122,127,108,152,32 ; vmovdqu %xmm5,0x20(%r8,%r11,4)
+ DB 233,50,255,255,255 ; jmpq 2386f <_sk_store_bgra_hsw_8bit+0x3b>
+ DB 15,31,0 ; nopl (%rax)
+ DB 87 ; push %rdi
DB 255 ; (bad)
- DB 255,97,255 ; jmpq *-0x1(%rcx)
DB 255 ; (bad)
- DB 255,154,255,255,255,141 ; lcall *-0x72000001(%rdx)
+ DB 255,103,255 ; jmpq *-0x1(%rdi)
DB 255 ; (bad)
+ DB 255,95,255 ; lcall *-0x1(%rdi)
DB 255 ; (bad)
+ DB 255,152,255,255,255,139 ; lcall *-0x74000001(%rax)
DB 255 ; (bad)
- DB 127,255 ; jg 23989 <_sk_store_bgra_hsw_8bit+0x121>
DB 255 ; (bad)
- DB 255,113,255 ; pushq -0x1(%rcx)
DB 255 ; (bad)
+ DB 125,255 ; jge 23955 <_sk_store_bgra_hsw_8bit+0x121>
DB 255 ; (bad)
- DB 185,255,255,255,178 ; mov $0xb2ffffff,%ecx
+ DB 255,111,255 ; ljmp *-0x1(%rdi)
DB 255 ; (bad)
+ DB 255,183,255,255,255,176 ; pushq -0x4f000001(%rdi)
DB 255 ; (bad)
- DB 255,170,255,255,255,162 ; ljmp *-0x5d000001(%rdx)
DB 255 ; (bad)
+ DB 255,168,255,255,255,160 ; ljmp *-0x5f000001(%rax)
DB 255 ; (bad)
DB 255 ; (bad)
- DB 237 ; in (%dx),%eax
DB 255 ; (bad)
+ DB 235,255 ; jmp 2396d <_sk_store_bgra_hsw_8bit+0x139>
DB 255 ; (bad)
- DB 255,224 ; jmpq *%rax
DB 255 ; (bad)
+ DB 222,255 ; fdivrp %st,%st(7)
DB 255 ; (bad)
- DB 255,210 ; callq *%rdx
+ DB 255,208 ; callq *%rax
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,196 ; inc %esp
+ DB 255,194 ; inc %edx
DB 255 ; (bad)
DB 255 ; (bad)
DB 255 ; .byte 0xff
PUBLIC _sk_load_a8_hsw_8bit
_sk_load_a8_hsw_8bit LABEL PROC
- DB 76,99,7 ; movslq (%rdi),%r8
- DB 76,139,79,16 ; mov 0x10(%rdi),%r9
- DB 72,173 ; lods %ds:(%rsi),%rax
- DB 72,99,72,8 ; movslq 0x8(%rax),%rcx
- DB 72,99,87,8 ; movslq 0x8(%rdi),%rdx
- DB 72,15,175,209 ; imul %rcx,%rdx
- DB 72,3,16 ; add (%rax),%rdx
- DB 77,133,201 ; test %r9,%r9
- DB 117,35 ; jne 239f0 <_sk_load_a8_hsw_8bit+0x40>
- DB 196,161,122,111,4,2 ; vmovdqu (%rdx,%r8,1),%xmm0
+ DB 72,173 ; lods %ds:(%rsi),%rax
+ DB 76,99,72,8 ; movslq 0x8(%rax),%r9
+ DB 76,99,193 ; movslq %ecx,%r8
+ DB 77,15,175,193 ; imul %r9,%r8
+ DB 76,3,0 ; add (%rax),%r8
+ DB 76,99,218 ; movslq %edx,%r11
+ DB 72,133,255 ; test %rdi,%rdi
+ DB 117,35 ; jne 239b7 <_sk_load_a8_hsw_8bit+0x3b>
+ DB 196,129,122,111,4,24 ; vmovdqu (%r8,%r11,1),%xmm0
DB 197,249,112,200,78 ; vpshufd $0x4e,%xmm0,%xmm1
DB 196,226,125,49,201 ; vpmovzxbd %xmm1,%ymm1
DB 196,226,125,49,192 ; vpmovzxbd %xmm0,%ymm0
@@ -33948,93 +33944,95 @@ _sk_load_a8_hsw_8bit LABEL PROC
DB 197,245,114,241,24 ; vpslld $0x18,%ymm1,%ymm1
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
+ DB 65,137,249 ; mov %edi,%r9d
DB 65,128,225,15 ; and $0xf,%r9b
DB 197,249,239,192 ; vpxor %xmm0,%xmm0,%xmm0
DB 65,254,201 ; dec %r9b
DB 65,128,249,14 ; cmp $0xe,%r9b
- DB 119,210 ; ja 239d3 <_sk_load_a8_hsw_8bit+0x23>
- DB 65,15,182,193 ; movzbl %r9b,%eax
- DB 72,141,13,192,0,0,0 ; lea 0xc0(%rip),%rcx # 23acc <_sk_load_a8_hsw_8bit+0x11c>
- DB 72,99,4,129 ; movslq (%rcx,%rax,4),%rax
- DB 72,1,200 ; add %rcx,%rax
+ DB 119,207 ; ja 2399a <_sk_load_a8_hsw_8bit+0x1e>
+ DB 69,15,182,201 ; movzbl %r9b,%r9d
+ DB 76,141,21,194,0,0,0 ; lea 0xc2(%rip),%r10 # 23a98 <_sk_load_a8_hsw_8bit+0x11c>
+ DB 75,99,4,138 ; movslq (%r10,%r9,4),%rax
+ DB 76,1,208 ; add %r10,%rax
DB 255,224 ; jmpq *%rax
- DB 66,15,182,4,2 ; movzbl (%rdx,%r8,1),%eax
+ DB 67,15,182,4,24 ; movzbl (%r8,%r11,1),%eax
DB 197,249,110,192 ; vmovd %eax,%xmm0
- DB 235,179 ; jmp 239d3 <_sk_load_a8_hsw_8bit+0x23>
+ DB 235,176 ; jmp 2399a <_sk_load_a8_hsw_8bit+0x1e>
DB 197,249,239,192 ; vpxor %xmm0,%xmm0,%xmm0
- DB 196,163,121,32,68,2,2,2 ; vpinsrb $0x2,0x2(%rdx,%r8,1),%xmm0,%xmm0
- DB 66,15,183,4,2 ; movzwl (%rdx,%r8,1),%eax
+ DB 196,131,121,32,68,24,2,2 ; vpinsrb $0x2,0x2(%r8,%r11,1),%xmm0,%xmm0
+ DB 67,15,183,4,24 ; movzwl (%r8,%r11,1),%eax
DB 197,249,110,200 ; vmovd %eax,%xmm1
DB 196,227,121,14,193,1 ; vpblendw $0x1,%xmm1,%xmm0,%xmm0
- DB 235,150 ; jmp 239d3 <_sk_load_a8_hsw_8bit+0x23>
+ DB 235,147 ; jmp 2399a <_sk_load_a8_hsw_8bit+0x1e>
DB 197,249,239,192 ; vpxor %xmm0,%xmm0,%xmm0
- DB 196,163,121,32,68,2,6,6 ; vpinsrb $0x6,0x6(%rdx,%r8,1),%xmm0,%xmm0
- DB 196,163,121,32,68,2,5,5 ; vpinsrb $0x5,0x5(%rdx,%r8,1),%xmm0,%xmm0
- DB 196,163,121,32,68,2,4,4 ; vpinsrb $0x4,0x4(%rdx,%r8,1),%xmm0,%xmm0
- DB 196,161,121,110,12,2 ; vmovd (%rdx,%r8,1),%xmm1
+ DB 196,131,121,32,68,24,6,6 ; vpinsrb $0x6,0x6(%r8,%r11,1),%xmm0,%xmm0
+ DB 196,131,121,32,68,24,5,5 ; vpinsrb $0x5,0x5(%r8,%r11,1),%xmm0,%xmm0
+ DB 196,131,121,32,68,24,4,4 ; vpinsrb $0x4,0x4(%r8,%r11,1),%xmm0,%xmm0
+ DB 196,129,121,110,12,24 ; vmovd (%r8,%r11,1),%xmm1
DB 196,227,121,2,193,1 ; vpblendd $0x1,%xmm1,%xmm0,%xmm0
- DB 233,105,255,255,255 ; jmpq 239d3 <_sk_load_a8_hsw_8bit+0x23>
+ DB 233,102,255,255,255 ; jmpq 2399a <_sk_load_a8_hsw_8bit+0x1e>
DB 197,249,239,192 ; vpxor %xmm0,%xmm0,%xmm0
- DB 196,163,121,32,68,2,10,10 ; vpinsrb $0xa,0xa(%rdx,%r8,1),%xmm0,%xmm0
- DB 196,163,121,32,68,2,9,9 ; vpinsrb $0x9,0x9(%rdx,%r8,1),%xmm0,%xmm0
- DB 196,163,121,32,68,2,8,8 ; vpinsrb $0x8,0x8(%rdx,%r8,1),%xmm0,%xmm0
- DB 196,161,122,126,12,2 ; vmovq (%rdx,%r8,1),%xmm1
+ DB 196,131,121,32,68,24,10,10 ; vpinsrb $0xa,0xa(%r8,%r11,1),%xmm0,%xmm0
+ DB 196,131,121,32,68,24,9,9 ; vpinsrb $0x9,0x9(%r8,%r11,1),%xmm0,%xmm0
+ DB 196,131,121,32,68,24,8,8 ; vpinsrb $0x8,0x8(%r8,%r11,1),%xmm0,%xmm0
+ DB 196,129,122,126,12,24 ; vmovq (%r8,%r11,1),%xmm1
DB 196,227,113,2,192,12 ; vpblendd $0xc,%xmm0,%xmm1,%xmm0
- DB 233,60,255,255,255 ; jmpq 239d3 <_sk_load_a8_hsw_8bit+0x23>
+ DB 233,57,255,255,255 ; jmpq 2399a <_sk_load_a8_hsw_8bit+0x1e>
DB 197,249,239,192 ; vpxor %xmm0,%xmm0,%xmm0
- DB 196,163,121,32,68,2,14,14 ; vpinsrb $0xe,0xe(%rdx,%r8,1),%xmm0,%xmm0
- DB 196,163,121,32,68,2,13,13 ; vpinsrb $0xd,0xd(%rdx,%r8,1),%xmm0,%xmm0
- DB 196,163,121,32,68,2,12,12 ; vpinsrb $0xc,0xc(%rdx,%r8,1),%xmm0,%xmm0
- DB 196,161,122,126,12,2 ; vmovq (%rdx,%r8,1),%xmm1
- DB 196,163,113,34,76,2,8,2 ; vpinsrd $0x2,0x8(%rdx,%r8,1),%xmm1,%xmm1
+ DB 196,131,121,32,68,24,14,14 ; vpinsrb $0xe,0xe(%r8,%r11,1),%xmm0,%xmm0
+ DB 196,131,121,32,68,24,13,13 ; vpinsrb $0xd,0xd(%r8,%r11,1),%xmm0,%xmm0
+ DB 196,131,121,32,68,24,12,12 ; vpinsrb $0xc,0xc(%r8,%r11,1),%xmm0,%xmm0
+ DB 196,129,122,126,12,24 ; vmovq (%r8,%r11,1),%xmm1
+ DB 196,131,113,34,76,24,8,2 ; vpinsrd $0x2,0x8(%r8,%r11,1),%xmm1,%xmm1
DB 196,227,113,2,192,8 ; vpblendd $0x8,%xmm0,%xmm1,%xmm0
- DB 233,7,255,255,255 ; jmpq 239d3 <_sk_load_a8_hsw_8bit+0x23>
- DB 73,255 ; rex.WB (bad)
+ DB 233,4,255,255,255 ; jmpq 2399a <_sk_load_a8_hsw_8bit+0x1e>
+ DB 102,144 ; xchg %ax,%ax
+ DB 71,255 ; rex.RXB (bad)
DB 255 ; (bad)
- DB 255,96,255 ; jmpq *-0x1(%rax)
+ DB 255,94,255 ; lcall *-0x1(%rsi)
DB 255 ; (bad)
- DB 255,84,255,255 ; callq *-0x1(%rdi,%rdi,8)
- DB 255,141,255,255,255,133 ; decl -0x7a000001(%rbp)
+ DB 255,82,255 ; callq *-0x1(%rdx)
DB 255 ; (bad)
+ DB 255,139,255,255,255,131 ; decl -0x7c000001(%rbx)
DB 255 ; (bad)
DB 255 ; (bad)
- DB 125,255 ; jge 23ae1 <_sk_load_a8_hsw_8bit+0x131>
DB 255 ; (bad)
- DB 255,113,255 ; pushq -0x1(%rcx)
+ DB 123,255 ; jnp 23aad <_sk_load_a8_hsw_8bit+0x131>
DB 255 ; (bad)
+ DB 255,111,255 ; ljmp *-0x1(%rdi)
DB 255 ; (bad)
- DB 186,255,255,255,178 ; mov $0xb2ffffff,%edx
DB 255 ; (bad)
+ DB 184,255,255,255,176 ; mov $0xb0ffffff,%eax
DB 255 ; (bad)
- DB 255,170,255,255,255,158 ; ljmp *-0x61000001(%rdx)
DB 255 ; (bad)
+ DB 255,168,255,255,255,156 ; ljmp *-0x63000001(%rax)
DB 255 ; (bad)
- DB 255,231 ; jmpq *%rdi
+ DB 255 ; (bad)
+ DB 255,229 ; jmpq *%rbp
DB 255 ; (bad)
DB 255 ; (bad)
DB 255 ; (bad)
- DB 223,255 ; (bad)
+ DB 221,255 ; (bad)
DB 255 ; (bad)
- DB 255,215 ; callq *%rdi
+ DB 255,213 ; callq *%rbp
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,203 ; dec %ebx
+ DB 255,201 ; dec %ecx
DB 255 ; (bad)
DB 255 ; (bad)
DB 255 ; .byte 0xff
PUBLIC _sk_load_a8_dst_hsw_8bit
_sk_load_a8_dst_hsw_8bit LABEL PROC
- DB 76,99,7 ; movslq (%rdi),%r8
- DB 76,139,79,16 ; mov 0x10(%rdi),%r9
- DB 72,173 ; lods %ds:(%rsi),%rax
- DB 72,99,72,8 ; movslq 0x8(%rax),%rcx
- DB 72,99,87,8 ; movslq 0x8(%rdi),%rdx
- DB 72,15,175,209 ; imul %rcx,%rdx
- DB 72,3,16 ; add (%rax),%rdx
- DB 77,133,201 ; test %r9,%r9
- DB 117,35 ; jne 23b48 <_sk_load_a8_dst_hsw_8bit+0x40>
- DB 196,161,122,111,20,2 ; vmovdqu (%rdx,%r8,1),%xmm2
+ DB 72,173 ; lods %ds:(%rsi),%rax
+ DB 76,99,72,8 ; movslq 0x8(%rax),%r9
+ DB 76,99,193 ; movslq %ecx,%r8
+ DB 77,15,175,193 ; imul %r9,%r8
+ DB 76,3,0 ; add (%rax),%r8
+ DB 76,99,218 ; movslq %edx,%r11
+ DB 72,133,255 ; test %rdi,%rdi
+ DB 117,35 ; jne 23b0f <_sk_load_a8_dst_hsw_8bit+0x3b>
+ DB 196,129,122,111,20,24 ; vmovdqu (%r8,%r11,1),%xmm2
DB 197,249,112,218,78 ; vpshufd $0x4e,%xmm2,%xmm3
DB 196,226,125,49,219 ; vpmovzxbd %xmm3,%ymm3
DB 196,226,125,49,210 ; vpmovzxbd %xmm2,%ymm2
@@ -34042,381 +34040,382 @@ _sk_load_a8_dst_hsw_8bit LABEL PROC
DB 197,229,114,243,24 ; vpslld $0x18,%ymm3,%ymm3
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
+ DB 65,137,249 ; mov %edi,%r9d
DB 65,128,225,15 ; and $0xf,%r9b
DB 197,233,239,210 ; vpxor %xmm2,%xmm2,%xmm2
DB 65,254,201 ; dec %r9b
DB 65,128,249,14 ; cmp $0xe,%r9b
- DB 119,210 ; ja 23b2b <_sk_load_a8_dst_hsw_8bit+0x23>
- DB 65,15,182,193 ; movzbl %r9b,%eax
- DB 72,141,13,192,0,0,0 ; lea 0xc0(%rip),%rcx # 23c24 <_sk_load_a8_dst_hsw_8bit+0x11c>
- DB 72,99,4,129 ; movslq (%rcx,%rax,4),%rax
- DB 72,1,200 ; add %rcx,%rax
+ DB 119,207 ; ja 23af2 <_sk_load_a8_dst_hsw_8bit+0x1e>
+ DB 69,15,182,201 ; movzbl %r9b,%r9d
+ DB 76,141,21,194,0,0,0 ; lea 0xc2(%rip),%r10 # 23bf0 <_sk_load_a8_dst_hsw_8bit+0x11c>
+ DB 75,99,4,138 ; movslq (%r10,%r9,4),%rax
+ DB 76,1,208 ; add %r10,%rax
DB 255,224 ; jmpq *%rax
- DB 66,15,182,4,2 ; movzbl (%rdx,%r8,1),%eax
+ DB 67,15,182,4,24 ; movzbl (%r8,%r11,1),%eax
DB 197,249,110,208 ; vmovd %eax,%xmm2
- DB 235,179 ; jmp 23b2b <_sk_load_a8_dst_hsw_8bit+0x23>
+ DB 235,176 ; jmp 23af2 <_sk_load_a8_dst_hsw_8bit+0x1e>
DB 197,233,239,210 ; vpxor %xmm2,%xmm2,%xmm2
- DB 196,163,105,32,84,2,2,2 ; vpinsrb $0x2,0x2(%rdx,%r8,1),%xmm2,%xmm2
- DB 66,15,183,4,2 ; movzwl (%rdx,%r8,1),%eax
+ DB 196,131,105,32,84,24,2,2 ; vpinsrb $0x2,0x2(%r8,%r11,1),%xmm2,%xmm2
+ DB 67,15,183,4,24 ; movzwl (%r8,%r11,1),%eax
DB 197,249,110,216 ; vmovd %eax,%xmm3
DB 196,227,105,14,211,1 ; vpblendw $0x1,%xmm3,%xmm2,%xmm2
- DB 235,150 ; jmp 23b2b <_sk_load_a8_dst_hsw_8bit+0x23>
+ DB 235,147 ; jmp 23af2 <_sk_load_a8_dst_hsw_8bit+0x1e>
DB 197,233,239,210 ; vpxor %xmm2,%xmm2,%xmm2
- DB 196,163,105,32,84,2,6,6 ; vpinsrb $0x6,0x6(%rdx,%r8,1),%xmm2,%xmm2
- DB 196,163,105,32,84,2,5,5 ; vpinsrb $0x5,0x5(%rdx,%r8,1),%xmm2,%xmm2
- DB 196,163,105,32,84,2,4,4 ; vpinsrb $0x4,0x4(%rdx,%r8,1),%xmm2,%xmm2
- DB 196,161,121,110,28,2 ; vmovd (%rdx,%r8,1),%xmm3
+ DB 196,131,105,32,84,24,6,6 ; vpinsrb $0x6,0x6(%r8,%r11,1),%xmm2,%xmm2
+ DB 196,131,105,32,84,24,5,5 ; vpinsrb $0x5,0x5(%r8,%r11,1),%xmm2,%xmm2
+ DB 196,131,105,32,84,24,4,4 ; vpinsrb $0x4,0x4(%r8,%r11,1),%xmm2,%xmm2
+ DB 196,129,121,110,28,24 ; vmovd (%r8,%r11,1),%xmm3
DB 196,227,105,2,211,1 ; vpblendd $0x1,%xmm3,%xmm2,%xmm2
- DB 233,105,255,255,255 ; jmpq 23b2b <_sk_load_a8_dst_hsw_8bit+0x23>
+ DB 233,102,255,255,255 ; jmpq 23af2 <_sk_load_a8_dst_hsw_8bit+0x1e>
DB 197,233,239,210 ; vpxor %xmm2,%xmm2,%xmm2
- DB 196,163,105,32,84,2,10,10 ; vpinsrb $0xa,0xa(%rdx,%r8,1),%xmm2,%xmm2
- DB 196,163,105,32,84,2,9,9 ; vpinsrb $0x9,0x9(%rdx,%r8,1),%xmm2,%xmm2
- DB 196,163,105,32,84,2,8,8 ; vpinsrb $0x8,0x8(%rdx,%r8,1),%xmm2,%xmm2
- DB 196,161,122,126,28,2 ; vmovq (%rdx,%r8,1),%xmm3
+ DB 196,131,105,32,84,24,10,10 ; vpinsrb $0xa,0xa(%r8,%r11,1),%xmm2,%xmm2
+ DB 196,131,105,32,84,24,9,9 ; vpinsrb $0x9,0x9(%r8,%r11,1),%xmm2,%xmm2
+ DB 196,131,105,32,84,24,8,8 ; vpinsrb $0x8,0x8(%r8,%r11,1),%xmm2,%xmm2
+ DB 196,129,122,126,28,24 ; vmovq (%r8,%r11,1),%xmm3
DB 196,227,97,2,210,12 ; vpblendd $0xc,%xmm2,%xmm3,%xmm2
- DB 233,60,255,255,255 ; jmpq 23b2b <_sk_load_a8_dst_hsw_8bit+0x23>
+ DB 233,57,255,255,255 ; jmpq 23af2 <_sk_load_a8_dst_hsw_8bit+0x1e>
DB 197,233,239,210 ; vpxor %xmm2,%xmm2,%xmm2
- DB 196,163,105,32,84,2,14,14 ; vpinsrb $0xe,0xe(%rdx,%r8,1),%xmm2,%xmm2
- DB 196,163,105,32,84,2,13,13 ; vpinsrb $0xd,0xd(%rdx,%r8,1),%xmm2,%xmm2
- DB 196,163,105,32,84,2,12,12 ; vpinsrb $0xc,0xc(%rdx,%r8,1),%xmm2,%xmm2
- DB 196,161,122,126,28,2 ; vmovq (%rdx,%r8,1),%xmm3
- DB 196,163,97,34,92,2,8,2 ; vpinsrd $0x2,0x8(%rdx,%r8,1),%xmm3,%xmm3
+ DB 196,131,105,32,84,24,14,14 ; vpinsrb $0xe,0xe(%r8,%r11,1),%xmm2,%xmm2
+ DB 196,131,105,32,84,24,13,13 ; vpinsrb $0xd,0xd(%r8,%r11,1),%xmm2,%xmm2
+ DB 196,131,105,32,84,24,12,12 ; vpinsrb $0xc,0xc(%r8,%r11,1),%xmm2,%xmm2
+ DB 196,129,122,126,28,24 ; vmovq (%r8,%r11,1),%xmm3
+ DB 196,131,97,34,92,24,8,2 ; vpinsrd $0x2,0x8(%r8,%r11,1),%xmm3,%xmm3
DB 196,227,97,2,210,8 ; vpblendd $0x8,%xmm2,%xmm3,%xmm2
- DB 233,7,255,255,255 ; jmpq 23b2b <_sk_load_a8_dst_hsw_8bit+0x23>
- DB 73,255 ; rex.WB (bad)
+ DB 233,4,255,255,255 ; jmpq 23af2 <_sk_load_a8_dst_hsw_8bit+0x1e>
+ DB 102,144 ; xchg %ax,%ax
+ DB 71,255 ; rex.RXB (bad)
DB 255 ; (bad)
- DB 255,96,255 ; jmpq *-0x1(%rax)
+ DB 255,94,255 ; lcall *-0x1(%rsi)
DB 255 ; (bad)
- DB 255,84,255,255 ; callq *-0x1(%rdi,%rdi,8)
- DB 255,141,255,255,255,133 ; decl -0x7a000001(%rbp)
+ DB 255,82,255 ; callq *-0x1(%rdx)
DB 255 ; (bad)
+ DB 255,139,255,255,255,131 ; decl -0x7c000001(%rbx)
DB 255 ; (bad)
DB 255 ; (bad)
- DB 125,255 ; jge 23c39 <_sk_load_a8_dst_hsw_8bit+0x131>
DB 255 ; (bad)
- DB 255,113,255 ; pushq -0x1(%rcx)
+ DB 123,255 ; jnp 23c05 <_sk_load_a8_dst_hsw_8bit+0x131>
DB 255 ; (bad)
+ DB 255,111,255 ; ljmp *-0x1(%rdi)
DB 255 ; (bad)
- DB 186,255,255,255,178 ; mov $0xb2ffffff,%edx
DB 255 ; (bad)
+ DB 184,255,255,255,176 ; mov $0xb0ffffff,%eax
DB 255 ; (bad)
- DB 255,170,255,255,255,158 ; ljmp *-0x61000001(%rdx)
DB 255 ; (bad)
+ DB 255,168,255,255,255,156 ; ljmp *-0x63000001(%rax)
DB 255 ; (bad)
- DB 255,231 ; jmpq *%rdi
DB 255 ; (bad)
+ DB 255,229 ; jmpq *%rbp
DB 255 ; (bad)
DB 255 ; (bad)
- DB 223,255 ; (bad)
DB 255 ; (bad)
- DB 255,215 ; callq *%rdi
+ DB 221,255 ; (bad)
DB 255 ; (bad)
+ DB 255,213 ; callq *%rbp
DB 255 ; (bad)
- DB 255,203 ; dec %ebx
+ DB 255 ; (bad)
+ DB 255,201 ; dec %ecx
DB 255 ; (bad)
DB 255 ; (bad)
DB 255 ; .byte 0xff
PUBLIC _sk_store_a8_hsw_8bit
_sk_store_a8_hsw_8bit LABEL PROC
- DB 76,99,7 ; movslq (%rdi),%r8
- DB 76,139,79,16 ; mov 0x10(%rdi),%r9
- DB 72,173 ; lods %ds:(%rsi),%rax
- DB 72,99,72,8 ; movslq 0x8(%rax),%rcx
- DB 72,99,87,8 ; movslq 0x8(%rdi),%rdx
- DB 72,15,175,209 ; imul %rcx,%rdx
- DB 72,3,16 ; add (%rax),%rdx
- DB 197,253,111,37,64,139,0,0 ; vmovdqa 0x8b40(%rip),%ymm4 # 2c7c0 <_sk_overlay_sse2_8bit+0xb4b>
+ DB 72,173 ; lods %ds:(%rsi),%rax
+ DB 76,99,72,8 ; movslq 0x8(%rax),%r9
+ DB 76,99,193 ; movslq %ecx,%r8
+ DB 77,15,175,193 ; imul %r9,%r8
+ DB 76,3,0 ; add (%rax),%r8
+ DB 76,99,218 ; movslq %edx,%r11
+ DB 197,253,111,37,185,138,0,0 ; vmovdqa 0x8ab9(%rip),%ymm4 # 2c700 <_sk_overlay_sse2_8bit+0xb50>
DB 196,226,117,0,236 ; vpshufb %ymm4,%ymm1,%ymm5
DB 196,227,253,0,237,232 ; vpermq $0xe8,%ymm5,%ymm5
- DB 197,249,111,53,109,149,0,0 ; vmovdqa 0x956d(%rip),%xmm6 # 2d200 <_sk_overlay_sse2_8bit+0x158b>
+ DB 197,249,111,53,230,148,0,0 ; vmovdqa 0x94e6(%rip),%xmm6 # 2d140 <_sk_overlay_sse2_8bit+0x1590>
DB 196,226,81,0,238 ; vpshufb %xmm6,%xmm5,%xmm5
DB 196,226,125,0,228 ; vpshufb %ymm4,%ymm0,%ymm4
DB 196,227,253,0,228,232 ; vpermq $0xe8,%ymm4,%ymm4
DB 196,226,89,0,230 ; vpshufb %xmm6,%xmm4,%xmm4
DB 197,217,108,229 ; vpunpcklqdq %xmm5,%xmm4,%xmm4
- DB 77,133,201 ; test %r9,%r9
- DB 117,10 ; jne 23cbb <_sk_store_a8_hsw_8bit+0x5b>
- DB 196,161,122,127,36,2 ; vmovdqu %xmm4,(%rdx,%r8,1)
+ DB 72,133,255 ; test %rdi,%rdi
+ DB 117,10 ; jne 23c82 <_sk_store_a8_hsw_8bit+0x56>
+ DB 196,129,122,127,36,24 ; vmovdqu %xmm4,(%r8,%r11,1)
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
+ DB 65,137,249 ; mov %edi,%r9d
DB 65,128,225,15 ; and $0xf,%r9b
DB 65,254,201 ; dec %r9b
DB 65,128,249,14 ; cmp $0xe,%r9b
- DB 119,239 ; ja 23cb7 <_sk_store_a8_hsw_8bit+0x57>
- DB 65,15,182,193 ; movzbl %r9b,%eax
- DB 72,141,13,137,0,0,0 ; lea 0x89(%rip),%rcx # 23d5c <_sk_store_a8_hsw_8bit+0xfc>
- DB 72,99,4,129 ; movslq (%rcx,%rax,4),%rax
- DB 72,1,200 ; add %rcx,%rax
- DB 255,224 ; jmpq *%rax
- DB 196,163,121,20,36,2,0 ; vpextrb $0x0,%xmm4,(%rdx,%r8,1)
- DB 235,210 ; jmp 23cb7 <_sk_store_a8_hsw_8bit+0x57>
- DB 196,163,121,20,100,2,2,2 ; vpextrb $0x2,%xmm4,0x2(%rdx,%r8,1)
- DB 196,163,121,21,36,2,0 ; vpextrw $0x0,%xmm4,(%rdx,%r8,1)
- DB 235,193 ; jmp 23cb7 <_sk_store_a8_hsw_8bit+0x57>
- DB 196,163,121,20,100,2,6,6 ; vpextrb $0x6,%xmm4,0x6(%rdx,%r8,1)
- DB 196,163,121,20,100,2,5,5 ; vpextrb $0x5,%xmm4,0x5(%rdx,%r8,1)
- DB 196,163,121,20,100,2,4,4 ; vpextrb $0x4,%xmm4,0x4(%rdx,%r8,1)
- DB 196,161,121,126,36,2 ; vmovd %xmm4,(%rdx,%r8,1)
- DB 235,161 ; jmp 23cb7 <_sk_store_a8_hsw_8bit+0x57>
- DB 196,163,121,20,100,2,10,10 ; vpextrb $0xa,%xmm4,0xa(%rdx,%r8,1)
- DB 196,163,121,20,100,2,9,9 ; vpextrb $0x9,%xmm4,0x9(%rdx,%r8,1)
- DB 196,163,121,20,100,2,8,8 ; vpextrb $0x8,%xmm4,0x8(%rdx,%r8,1)
- DB 235,32 ; jmp 23d50 <_sk_store_a8_hsw_8bit+0xf0>
- DB 196,163,121,20,100,2,14,14 ; vpextrb $0xe,%xmm4,0xe(%rdx,%r8,1)
- DB 196,163,121,20,100,2,13,13 ; vpextrb $0xd,%xmm4,0xd(%rdx,%r8,1)
- DB 196,163,121,20,100,2,12,12 ; vpextrb $0xc,%xmm4,0xc(%rdx,%r8,1)
- DB 196,163,121,22,100,2,8,2 ; vpextrd $0x2,%xmm4,0x8(%rdx,%r8,1)
- DB 196,161,121,214,36,2 ; vmovq %xmm4,(%rdx,%r8,1)
- DB 233,92,255,255,255 ; jmpq 23cb7 <_sk_store_a8_hsw_8bit+0x57>
- DB 144 ; nop
- DB 128,255,255 ; cmp $0xff,%bh
- DB 255,145,255,255,255,137 ; callq *-0x76000001(%rcx)
+ DB 119,236 ; ja 23c7e <_sk_store_a8_hsw_8bit+0x52>
+ DB 69,15,182,201 ; movzbl %r9b,%r9d
+ DB 76,141,21,139,0,0,0 ; lea 0x8b(%rip),%r10 # 23d28 <_sk_store_a8_hsw_8bit+0xfc>
+ DB 75,99,4,138 ; movslq (%r10,%r9,4),%rax
+ DB 76,1,208 ; add %r10,%rax
+ DB 255,224 ; jmpq *%rax
+ DB 196,131,121,20,36,24,0 ; vpextrb $0x0,%xmm4,(%r8,%r11,1)
+ DB 235,207 ; jmp 23c7e <_sk_store_a8_hsw_8bit+0x52>
+ DB 196,131,121,20,100,24,2,2 ; vpextrb $0x2,%xmm4,0x2(%r8,%r11,1)
+ DB 196,131,121,21,36,24,0 ; vpextrw $0x0,%xmm4,(%r8,%r11,1)
+ DB 235,190 ; jmp 23c7e <_sk_store_a8_hsw_8bit+0x52>
+ DB 196,131,121,20,100,24,6,6 ; vpextrb $0x6,%xmm4,0x6(%r8,%r11,1)
+ DB 196,131,121,20,100,24,5,5 ; vpextrb $0x5,%xmm4,0x5(%r8,%r11,1)
+ DB 196,131,121,20,100,24,4,4 ; vpextrb $0x4,%xmm4,0x4(%r8,%r11,1)
+ DB 196,129,121,126,36,24 ; vmovd %xmm4,(%r8,%r11,1)
+ DB 235,158 ; jmp 23c7e <_sk_store_a8_hsw_8bit+0x52>
+ DB 196,131,121,20,100,24,10,10 ; vpextrb $0xa,%xmm4,0xa(%r8,%r11,1)
+ DB 196,131,121,20,100,24,9,9 ; vpextrb $0x9,%xmm4,0x9(%r8,%r11,1)
+ DB 196,131,121,20,100,24,8,8 ; vpextrb $0x8,%xmm4,0x8(%r8,%r11,1)
+ DB 235,32 ; jmp 23d1a <_sk_store_a8_hsw_8bit+0xee>
+ DB 196,131,121,20,100,24,14,14 ; vpextrb $0xe,%xmm4,0xe(%r8,%r11,1)
+ DB 196,131,121,20,100,24,13,13 ; vpextrb $0xd,%xmm4,0xd(%r8,%r11,1)
+ DB 196,131,121,20,100,24,12,12 ; vpextrb $0xc,%xmm4,0xc(%r8,%r11,1)
+ DB 196,131,121,22,100,24,8,2 ; vpextrd $0x2,%xmm4,0x8(%r8,%r11,1)
+ DB 196,129,121,214,36,24 ; vmovq %xmm4,(%r8,%r11,1)
+ DB 233,89,255,255,255 ; jmpq 23c7e <_sk_store_a8_hsw_8bit+0x52>
+ DB 15,31,0 ; nopl (%rax)
+ DB 126,255 ; jle 23d29 <_sk_store_a8_hsw_8bit+0xfd>
DB 255 ; (bad)
+ DB 255,143,255,255,255,135 ; decl -0x78000001(%rdi)
DB 255 ; (bad)
- DB 255,178,255,255,255,170 ; pushq -0x55000001(%rdx)
DB 255 ; (bad)
+ DB 255,176,255,255,255,168 ; pushq -0x57000001(%rax)
DB 255 ; (bad)
- DB 255,162,255,255,255,154 ; jmpq *-0x65000001(%rdx)
DB 255 ; (bad)
+ DB 255,160,255,255,255,152 ; jmpq *-0x67000001(%rax)
DB 255 ; (bad)
- DB 255,244 ; push %rsp
DB 255 ; (bad)
+ DB 255,242 ; push %rdx
DB 255 ; (bad)
- DB 255,202 ; dec %edx
DB 255 ; (bad)
+ DB 255,200 ; dec %eax
DB 255 ; (bad)
- DB 255,194 ; inc %edx
DB 255 ; (bad)
+ DB 255,192 ; inc %eax
DB 255 ; (bad)
DB 255 ; (bad)
- DB 186,255,255,255,236 ; mov $0xecffffff,%edx
DB 255 ; (bad)
+ DB 184,255,255,255,234 ; mov $0xeaffffff,%eax
DB 255 ; (bad)
- DB 255,228 ; jmpq *%rsp
DB 255 ; (bad)
+ DB 255,226 ; jmpq *%rdx
DB 255 ; (bad)
DB 255 ; (bad)
- DB 220,255 ; fdivr %st,%st(7)
DB 255 ; (bad)
- DB 255,212 ; callq *%rsp
+ DB 218,255 ; (bad)
+ DB 255 ; (bad)
+ DB 255,210 ; callq *%rdx
DB 255 ; (bad)
DB 255 ; (bad)
DB 255 ; .byte 0xff
PUBLIC _sk_load_g8_hsw_8bit
_sk_load_g8_hsw_8bit LABEL PROC
- DB 76,99,7 ; movslq (%rdi),%r8
- DB 76,139,79,16 ; mov 0x10(%rdi),%r9
- DB 72,173 ; lods %ds:(%rsi),%rax
- DB 72,99,72,8 ; movslq 0x8(%rax),%rcx
- DB 72,99,87,8 ; movslq 0x8(%rdi),%rdx
- DB 72,15,175,209 ; imul %rcx,%rdx
- DB 72,3,16 ; add (%rax),%rdx
- DB 77,133,201 ; test %r9,%r9
- DB 117,61 ; jne 23df2 <_sk_load_g8_hsw_8bit+0x5a>
- DB 196,161,122,111,4,2 ; vmovdqu (%rdx,%r8,1),%xmm0
+ DB 72,173 ; lods %ds:(%rsi),%rax
+ DB 76,99,72,8 ; movslq 0x8(%rax),%r9
+ DB 76,99,193 ; movslq %ecx,%r8
+ DB 77,15,175,193 ; imul %r9,%r8
+ DB 76,3,0 ; add (%rax),%r8
+ DB 76,99,218 ; movslq %edx,%r11
+ DB 72,133,255 ; test %rdi,%rdi
+ DB 117,61 ; jne 23db9 <_sk_load_g8_hsw_8bit+0x55>
+ DB 196,129,122,111,4,24 ; vmovdqu (%r8,%r11,1),%xmm0
DB 196,226,125,49,200 ; vpmovzxbd %xmm0,%ymm1
DB 197,249,112,192,78 ; vpshufd $0x4e,%xmm0,%xmm0
DB 196,226,125,49,192 ; vpmovzxbd %xmm0,%ymm0
- DB 196,226,125,88,37,161,132,0,0 ; vpbroadcastd 0x84a1(%rip),%ymm4 # 2c274 <_sk_overlay_sse2_8bit+0x5ff>
+ DB 196,226,125,88,37,22,132,0,0 ; vpbroadcastd 0x8416(%rip),%ymm4 # 2c1b0 <_sk_overlay_sse2_8bit+0x600>
DB 196,226,125,64,236 ; vpmulld %ymm4,%ymm0,%ymm5
DB 196,226,117,64,196 ; vpmulld %ymm4,%ymm1,%ymm0
- DB 196,226,125,88,13,146,132,0,0 ; vpbroadcastd 0x8492(%rip),%ymm1 # 2c278 <_sk_overlay_sse2_8bit+0x603>
+ DB 196,226,125,88,13,7,132,0,0 ; vpbroadcastd 0x8407(%rip),%ymm1 # 2c1b4 <_sk_overlay_sse2_8bit+0x604>
DB 197,253,235,193 ; vpor %ymm1,%ymm0,%ymm0
DB 197,213,235,201 ; vpor %ymm1,%ymm5,%ymm1
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
+ DB 65,137,249 ; mov %edi,%r9d
DB 65,128,225,15 ; and $0xf,%r9b
DB 197,249,239,192 ; vpxor %xmm0,%xmm0,%xmm0
DB 65,254,201 ; dec %r9b
DB 65,128,249,14 ; cmp $0xe,%r9b
- DB 119,184 ; ja 23dbb <_sk_load_g8_hsw_8bit+0x23>
- DB 65,15,182,193 ; movzbl %r9b,%eax
- DB 72,141,13,198,0,0,0 ; lea 0xc6(%rip),%rcx # 23ed4 <_sk_load_g8_hsw_8bit+0x13c>
- DB 72,99,4,129 ; movslq (%rcx,%rax,4),%rax
- DB 72,1,200 ; add %rcx,%rax
+ DB 119,181 ; ja 23d82 <_sk_load_g8_hsw_8bit+0x1e>
+ DB 69,15,182,201 ; movzbl %r9b,%r9d
+ DB 76,141,21,196,0,0,0 ; lea 0xc4(%rip),%r10 # 23e9c <_sk_load_g8_hsw_8bit+0x138>
+ DB 75,99,4,138 ; movslq (%r10,%r9,4),%rax
+ DB 76,1,208 ; add %r10,%rax
DB 255,224 ; jmpq *%rax
- DB 66,15,182,4,2 ; movzbl (%rdx,%r8,1),%eax
+ DB 67,15,182,4,24 ; movzbl (%r8,%r11,1),%eax
DB 197,249,110,192 ; vmovd %eax,%xmm0
- DB 235,153 ; jmp 23dbb <_sk_load_g8_hsw_8bit+0x23>
+ DB 235,150 ; jmp 23d82 <_sk_load_g8_hsw_8bit+0x1e>
DB 197,249,239,192 ; vpxor %xmm0,%xmm0,%xmm0
- DB 196,163,121,32,68,2,2,2 ; vpinsrb $0x2,0x2(%rdx,%r8,1),%xmm0,%xmm0
- DB 66,15,183,4,2 ; movzwl (%rdx,%r8,1),%eax
+ DB 196,131,121,32,68,24,2,2 ; vpinsrb $0x2,0x2(%r8,%r11,1),%xmm0,%xmm0
+ DB 67,15,183,4,24 ; movzwl (%r8,%r11,1),%eax
DB 197,249,110,200 ; vmovd %eax,%xmm1
DB 196,227,121,14,193,1 ; vpblendw $0x1,%xmm1,%xmm0,%xmm0
- DB 233,121,255,255,255 ; jmpq 23dbb <_sk_load_g8_hsw_8bit+0x23>
+ DB 233,118,255,255,255 ; jmpq 23d82 <_sk_load_g8_hsw_8bit+0x1e>
DB 197,249,239,192 ; vpxor %xmm0,%xmm0,%xmm0
- DB 196,163,121,32,68,2,6,6 ; vpinsrb $0x6,0x6(%rdx,%r8,1),%xmm0,%xmm0
- DB 196,163,121,32,68,2,5,5 ; vpinsrb $0x5,0x5(%rdx,%r8,1),%xmm0,%xmm0
- DB 196,163,121,32,68,2,4,4 ; vpinsrb $0x4,0x4(%rdx,%r8,1),%xmm0,%xmm0
- DB 196,161,121,110,12,2 ; vmovd (%rdx,%r8,1),%xmm1
+ DB 196,131,121,32,68,24,6,6 ; vpinsrb $0x6,0x6(%r8,%r11,1),%xmm0,%xmm0
+ DB 196,131,121,32,68,24,5,5 ; vpinsrb $0x5,0x5(%r8,%r11,1),%xmm0,%xmm0
+ DB 196,131,121,32,68,24,4,4 ; vpinsrb $0x4,0x4(%r8,%r11,1),%xmm0,%xmm0
+ DB 196,129,121,110,12,24 ; vmovd (%r8,%r11,1),%xmm1
DB 196,227,121,2,193,1 ; vpblendd $0x1,%xmm1,%xmm0,%xmm0
- DB 233,76,255,255,255 ; jmpq 23dbb <_sk_load_g8_hsw_8bit+0x23>
+ DB 233,73,255,255,255 ; jmpq 23d82 <_sk_load_g8_hsw_8bit+0x1e>
DB 197,249,239,192 ; vpxor %xmm0,%xmm0,%xmm0
- DB 196,163,121,32,68,2,10,10 ; vpinsrb $0xa,0xa(%rdx,%r8,1),%xmm0,%xmm0
- DB 196,163,121,32,68,2,9,9 ; vpinsrb $0x9,0x9(%rdx,%r8,1),%xmm0,%xmm0
- DB 196,163,121,32,68,2,8,8 ; vpinsrb $0x8,0x8(%rdx,%r8,1),%xmm0,%xmm0
- DB 196,161,122,126,12,2 ; vmovq (%rdx,%r8,1),%xmm1
+ DB 196,131,121,32,68,24,10,10 ; vpinsrb $0xa,0xa(%r8,%r11,1),%xmm0,%xmm0
+ DB 196,131,121,32,68,24,9,9 ; vpinsrb $0x9,0x9(%r8,%r11,1),%xmm0,%xmm0
+ DB 196,131,121,32,68,24,8,8 ; vpinsrb $0x8,0x8(%r8,%r11,1),%xmm0,%xmm0
+ DB 196,129,122,126,12,24 ; vmovq (%r8,%r11,1),%xmm1
DB 196,227,113,2,192,12 ; vpblendd $0xc,%xmm0,%xmm1,%xmm0
- DB 233,31,255,255,255 ; jmpq 23dbb <_sk_load_g8_hsw_8bit+0x23>
+ DB 233,28,255,255,255 ; jmpq 23d82 <_sk_load_g8_hsw_8bit+0x1e>
DB 197,249,239,192 ; vpxor %xmm0,%xmm0,%xmm0
- DB 196,163,121,32,68,2,14,14 ; vpinsrb $0xe,0xe(%rdx,%r8,1),%xmm0,%xmm0
- DB 196,163,121,32,68,2,13,13 ; vpinsrb $0xd,0xd(%rdx,%r8,1),%xmm0,%xmm0
- DB 196,163,121,32,68,2,12,12 ; vpinsrb $0xc,0xc(%rdx,%r8,1),%xmm0,%xmm0
- DB 196,161,122,126,12,2 ; vmovq (%rdx,%r8,1),%xmm1
- DB 196,163,113,34,76,2,8,2 ; vpinsrd $0x2,0x8(%rdx,%r8,1),%xmm1,%xmm1
+ DB 196,131,121,32,68,24,14,14 ; vpinsrb $0xe,0xe(%r8,%r11,1),%xmm0,%xmm0
+ DB 196,131,121,32,68,24,13,13 ; vpinsrb $0xd,0xd(%r8,%r11,1),%xmm0,%xmm0
+ DB 196,131,121,32,68,24,12,12 ; vpinsrb $0xc,0xc(%r8,%r11,1),%xmm0,%xmm0
+ DB 196,129,122,126,12,24 ; vmovq (%r8,%r11,1),%xmm1
+ DB 196,131,113,34,76,24,8,2 ; vpinsrd $0x2,0x8(%r8,%r11,1),%xmm1,%xmm1
DB 196,227,113,2,192,8 ; vpblendd $0x8,%xmm0,%xmm1,%xmm0
- DB 233,234,254,255,255 ; jmpq 23dbb <_sk_load_g8_hsw_8bit+0x23>
- DB 15,31,0 ; nopl (%rax)
- DB 67,255 ; rex.XB (bad)
- DB 255 ; (bad)
- DB 255,90,255 ; lcall *-0x1(%rdx)
+ DB 233,231,254,255,255 ; jmpq 23d82 <_sk_load_g8_hsw_8bit+0x1e>
+ DB 144 ; nop
+ DB 69,255 ; rex.RB (bad)
DB 255 ; (bad)
- DB 255,78,255 ; decl -0x1(%rsi)
+ DB 255,92,255,255 ; lcall *-0x1(%rdi,%rdi,8)
+ DB 255,80,255 ; callq *-0x1(%rax)
DB 255 ; (bad)
- DB 255,138,255,255,255,130 ; decl -0x7d000001(%rdx)
+ DB 255,140,255,255,255,132,255 ; decl -0x7b0001(%rdi,%rdi,8)
DB 255 ; (bad)
DB 255 ; (bad)
+ DB 124,255 ; jl 23eb1 <_sk_load_g8_hsw_8bit+0x14d>
DB 255 ; (bad)
- DB 122,255 ; jp 23ee9 <_sk_load_g8_hsw_8bit+0x151>
+ DB 255,112,255 ; pushq -0x1(%rax)
DB 255 ; (bad)
- DB 255,110,255 ; ljmp *-0x1(%rsi)
DB 255 ; (bad)
- DB 255,183,255,255,255,175 ; pushq -0x50000001(%rdi)
+ DB 185,255,255,255,177 ; mov $0xb1ffffff,%ecx
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,167,255,255,255,155 ; jmpq *-0x64000001(%rdi)
+ DB 255,169,255,255,255,157 ; ljmp *-0x62000001(%rcx)
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,228 ; jmpq *%rsp
+ DB 255,230 ; jmpq *%rsi
DB 255 ; (bad)
DB 255 ; (bad)
DB 255 ; (bad)
- DB 220,255 ; fdivr %st,%st(7)
+ DB 222,255 ; fdivrp %st,%st(7)
DB 255 ; (bad)
- DB 255,212 ; callq *%rsp
+ DB 255,214 ; callq *%rsi
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,200 ; dec %eax
+ DB 255,202 ; dec %edx
DB 255 ; (bad)
DB 255 ; (bad)
DB 255 ; .byte 0xff
PUBLIC _sk_load_g8_dst_hsw_8bit
_sk_load_g8_dst_hsw_8bit LABEL PROC
- DB 76,99,7 ; movslq (%rdi),%r8
- DB 76,139,79,16 ; mov 0x10(%rdi),%r9
- DB 72,173 ; lods %ds:(%rsi),%rax
- DB 72,99,72,8 ; movslq 0x8(%rax),%rcx
- DB 72,99,87,8 ; movslq 0x8(%rdi),%rdx
- DB 72,15,175,209 ; imul %rcx,%rdx
- DB 72,3,16 ; add (%rax),%rdx
- DB 77,133,201 ; test %r9,%r9
- DB 117,61 ; jne 23f6a <_sk_load_g8_dst_hsw_8bit+0x5a>
- DB 196,161,122,111,20,2 ; vmovdqu (%rdx,%r8,1),%xmm2
+ DB 72,173 ; lods %ds:(%rsi),%rax
+ DB 76,99,72,8 ; movslq 0x8(%rax),%r9
+ DB 76,99,193 ; movslq %ecx,%r8
+ DB 77,15,175,193 ; imul %r9,%r8
+ DB 76,3,0 ; add (%rax),%r8
+ DB 76,99,218 ; movslq %edx,%r11
+ DB 72,133,255 ; test %rdi,%rdi
+ DB 117,61 ; jne 23f2d <_sk_load_g8_dst_hsw_8bit+0x55>
+ DB 196,129,122,111,20,24 ; vmovdqu (%r8,%r11,1),%xmm2
DB 196,226,125,49,218 ; vpmovzxbd %xmm2,%ymm3
DB 197,249,112,210,78 ; vpshufd $0x4e,%xmm2,%xmm2
DB 196,226,125,49,210 ; vpmovzxbd %xmm2,%ymm2
- DB 196,226,125,88,37,41,131,0,0 ; vpbroadcastd 0x8329(%rip),%ymm4 # 2c274 <_sk_overlay_sse2_8bit+0x5ff>
+ DB 196,226,125,88,37,162,130,0,0 ; vpbroadcastd 0x82a2(%rip),%ymm4 # 2c1b0 <_sk_overlay_sse2_8bit+0x600>
DB 196,226,109,64,236 ; vpmulld %ymm4,%ymm2,%ymm5
DB 196,226,101,64,212 ; vpmulld %ymm4,%ymm3,%ymm2
- DB 196,226,125,88,29,26,131,0,0 ; vpbroadcastd 0x831a(%rip),%ymm3 # 2c278 <_sk_overlay_sse2_8bit+0x603>
+ DB 196,226,125,88,29,147,130,0,0 ; vpbroadcastd 0x8293(%rip),%ymm3 # 2c1b4 <_sk_overlay_sse2_8bit+0x604>
DB 197,237,235,211 ; vpor %ymm3,%ymm2,%ymm2
DB 197,213,235,219 ; vpor %ymm3,%ymm5,%ymm3
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
+ DB 65,137,249 ; mov %edi,%r9d
DB 65,128,225,15 ; and $0xf,%r9b
DB 197,233,239,210 ; vpxor %xmm2,%xmm2,%xmm2
DB 65,254,201 ; dec %r9b
DB 65,128,249,14 ; cmp $0xe,%r9b
- DB 119,184 ; ja 23f33 <_sk_load_g8_dst_hsw_8bit+0x23>
- DB 65,15,182,193 ; movzbl %r9b,%eax
- DB 72,141,13,198,0,0,0 ; lea 0xc6(%rip),%rcx # 2404c <_sk_load_g8_dst_hsw_8bit+0x13c>
- DB 72,99,4,129 ; movslq (%rcx,%rax,4),%rax
- DB 72,1,200 ; add %rcx,%rax
+ DB 119,181 ; ja 23ef6 <_sk_load_g8_dst_hsw_8bit+0x1e>
+ DB 69,15,182,201 ; movzbl %r9b,%r9d
+ DB 76,141,21,196,0,0,0 ; lea 0xc4(%rip),%r10 # 24010 <_sk_load_g8_dst_hsw_8bit+0x138>
+ DB 75,99,4,138 ; movslq (%r10,%r9,4),%rax
+ DB 76,1,208 ; add %r10,%rax
DB 255,224 ; jmpq *%rax
- DB 66,15,182,4,2 ; movzbl (%rdx,%r8,1),%eax
+ DB 67,15,182,4,24 ; movzbl (%r8,%r11,1),%eax
DB 197,249,110,208 ; vmovd %eax,%xmm2
- DB 235,153 ; jmp 23f33 <_sk_load_g8_dst_hsw_8bit+0x23>
+ DB 235,150 ; jmp 23ef6 <_sk_load_g8_dst_hsw_8bit+0x1e>
DB 197,233,239,210 ; vpxor %xmm2,%xmm2,%xmm2
- DB 196,163,105,32,84,2,2,2 ; vpinsrb $0x2,0x2(%rdx,%r8,1),%xmm2,%xmm2
- DB 66,15,183,4,2 ; movzwl (%rdx,%r8,1),%eax
+ DB 196,131,105,32,84,24,2,2 ; vpinsrb $0x2,0x2(%r8,%r11,1),%xmm2,%xmm2
+ DB 67,15,183,4,24 ; movzwl (%r8,%r11,1),%eax
DB 197,249,110,216 ; vmovd %eax,%xmm3
DB 196,227,105,14,211,1 ; vpblendw $0x1,%xmm3,%xmm2,%xmm2
- DB 233,121,255,255,255 ; jmpq 23f33 <_sk_load_g8_dst_hsw_8bit+0x23>
+ DB 233,118,255,255,255 ; jmpq 23ef6 <_sk_load_g8_dst_hsw_8bit+0x1e>
DB 197,233,239,210 ; vpxor %xmm2,%xmm2,%xmm2
- DB 196,163,105,32,84,2,6,6 ; vpinsrb $0x6,0x6(%rdx,%r8,1),%xmm2,%xmm2
- DB 196,163,105,32,84,2,5,5 ; vpinsrb $0x5,0x5(%rdx,%r8,1),%xmm2,%xmm2
- DB 196,163,105,32,84,2,4,4 ; vpinsrb $0x4,0x4(%rdx,%r8,1),%xmm2,%xmm2
- DB 196,161,121,110,28,2 ; vmovd (%rdx,%r8,1),%xmm3
+ DB 196,131,105,32,84,24,6,6 ; vpinsrb $0x6,0x6(%r8,%r11,1),%xmm2,%xmm2
+ DB 196,131,105,32,84,24,5,5 ; vpinsrb $0x5,0x5(%r8,%r11,1),%xmm2,%xmm2
+ DB 196,131,105,32,84,24,4,4 ; vpinsrb $0x4,0x4(%r8,%r11,1),%xmm2,%xmm2
+ DB 196,129,121,110,28,24 ; vmovd (%r8,%r11,1),%xmm3
DB 196,227,105,2,211,1 ; vpblendd $0x1,%xmm3,%xmm2,%xmm2
- DB 233,76,255,255,255 ; jmpq 23f33 <_sk_load_g8_dst_hsw_8bit+0x23>
+ DB 233,73,255,255,255 ; jmpq 23ef6 <_sk_load_g8_dst_hsw_8bit+0x1e>
DB 197,233,239,210 ; vpxor %xmm2,%xmm2,%xmm2
- DB 196,163,105,32,84,2,10,10 ; vpinsrb $0xa,0xa(%rdx,%r8,1),%xmm2,%xmm2
- DB 196,163,105,32,84,2,9,9 ; vpinsrb $0x9,0x9(%rdx,%r8,1),%xmm2,%xmm2
- DB 196,163,105,32,84,2,8,8 ; vpinsrb $0x8,0x8(%rdx,%r8,1),%xmm2,%xmm2
- DB 196,161,122,126,28,2 ; vmovq (%rdx,%r8,1),%xmm3
+ DB 196,131,105,32,84,24,10,10 ; vpinsrb $0xa,0xa(%r8,%r11,1),%xmm2,%xmm2
+ DB 196,131,105,32,84,24,9,9 ; vpinsrb $0x9,0x9(%r8,%r11,1),%xmm2,%xmm2
+ DB 196,131,105,32,84,24,8,8 ; vpinsrb $0x8,0x8(%r8,%r11,1),%xmm2,%xmm2
+ DB 196,129,122,126,28,24 ; vmovq (%r8,%r11,1),%xmm3
DB 196,227,97,2,210,12 ; vpblendd $0xc,%xmm2,%xmm3,%xmm2
- DB 233,31,255,255,255 ; jmpq 23f33 <_sk_load_g8_dst_hsw_8bit+0x23>
+ DB 233,28,255,255,255 ; jmpq 23ef6 <_sk_load_g8_dst_hsw_8bit+0x1e>
DB 197,233,239,210 ; vpxor %xmm2,%xmm2,%xmm2
- DB 196,163,105,32,84,2,14,14 ; vpinsrb $0xe,0xe(%rdx,%r8,1),%xmm2,%xmm2
- DB 196,163,105,32,84,2,13,13 ; vpinsrb $0xd,0xd(%rdx,%r8,1),%xmm2,%xmm2
- DB 196,163,105,32,84,2,12,12 ; vpinsrb $0xc,0xc(%rdx,%r8,1),%xmm2,%xmm2
- DB 196,161,122,126,28,2 ; vmovq (%rdx,%r8,1),%xmm3
- DB 196,163,97,34,92,2,8,2 ; vpinsrd $0x2,0x8(%rdx,%r8,1),%xmm3,%xmm3
+ DB 196,131,105,32,84,24,14,14 ; vpinsrb $0xe,0xe(%r8,%r11,1),%xmm2,%xmm2
+ DB 196,131,105,32,84,24,13,13 ; vpinsrb $0xd,0xd(%r8,%r11,1),%xmm2,%xmm2
+ DB 196,131,105,32,84,24,12,12 ; vpinsrb $0xc,0xc(%r8,%r11,1),%xmm2,%xmm2
+ DB 196,129,122,126,28,24 ; vmovq (%r8,%r11,1),%xmm3
+ DB 196,131,97,34,92,24,8,2 ; vpinsrd $0x2,0x8(%r8,%r11,1),%xmm3,%xmm3
DB 196,227,97,2,210,8 ; vpblendd $0x8,%xmm2,%xmm3,%xmm2
- DB 233,234,254,255,255 ; jmpq 23f33 <_sk_load_g8_dst_hsw_8bit+0x23>
- DB 15,31,0 ; nopl (%rax)
- DB 67,255 ; rex.XB (bad)
- DB 255 ; (bad)
- DB 255,90,255 ; lcall *-0x1(%rdx)
+ DB 233,231,254,255,255 ; jmpq 23ef6 <_sk_load_g8_dst_hsw_8bit+0x1e>
+ DB 144 ; nop
+ DB 69,255 ; rex.RB (bad)
DB 255 ; (bad)
- DB 255,78,255 ; decl -0x1(%rsi)
+ DB 255,92,255,255 ; lcall *-0x1(%rdi,%rdi,8)
+ DB 255,80,255 ; callq *-0x1(%rax)
DB 255 ; (bad)
- DB 255,138,255,255,255,130 ; decl -0x7d000001(%rdx)
+ DB 255,140,255,255,255,132,255 ; decl -0x7b0001(%rdi,%rdi,8)
DB 255 ; (bad)
DB 255 ; (bad)
+ DB 124,255 ; jl 24025 <_sk_load_g8_dst_hsw_8bit+0x14d>
DB 255 ; (bad)
- DB 122,255 ; jp 24061 <_sk_load_g8_dst_hsw_8bit+0x151>
+ DB 255,112,255 ; pushq -0x1(%rax)
DB 255 ; (bad)
- DB 255,110,255 ; ljmp *-0x1(%rsi)
DB 255 ; (bad)
- DB 255,183,255,255,255,175 ; pushq -0x50000001(%rdi)
+ DB 185,255,255,255,177 ; mov $0xb1ffffff,%ecx
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,167,255,255,255,155 ; jmpq *-0x64000001(%rdi)
+ DB 255,169,255,255,255,157 ; ljmp *-0x62000001(%rcx)
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,228 ; jmpq *%rsp
+ DB 255,230 ; jmpq *%rsi
DB 255 ; (bad)
DB 255 ; (bad)
DB 255 ; (bad)
- DB 220,255 ; fdivr %st,%st(7)
+ DB 222,255 ; fdivrp %st,%st(7)
DB 255 ; (bad)
- DB 255,212 ; callq *%rsp
+ DB 255,214 ; callq *%rsi
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,200 ; dec %eax
+ DB 255,202 ; dec %edx
DB 255 ; (bad)
DB 255 ; (bad)
DB 255 ; .byte 0xff
PUBLIC _sk_srcover_rgba_8888_hsw_8bit
_sk_srcover_rgba_8888_hsw_8bit LABEL PROC
- DB 76,99,15 ; movslq (%rdi),%r9
- DB 76,139,71,16 ; mov 0x10(%rdi),%r8
- DB 72,173 ; lods %ds:(%rsi),%rax
- DB 72,99,72,8 ; movslq 0x8(%rax),%rcx
- DB 72,99,87,8 ; movslq 0x8(%rdi),%rdx
- DB 72,15,175,209 ; imul %rcx,%rdx
- DB 72,193,226,2 ; shl $0x2,%rdx
- DB 72,3,16 ; add (%rax),%rdx
- DB 77,133,192 ; test %r8,%r8
- DB 15,133,222,0,0,0 ; jne 2418b <_sk_srcover_rgba_8888_hsw_8bit+0x103>
- DB 196,33,126,111,76,138,32 ; vmovdqu 0x20(%rdx,%r9,4),%ymm9
- DB 196,33,126,111,28,138 ; vmovdqu (%rdx,%r9,4),%ymm11
- DB 197,253,111,53,30,135,0,0 ; vmovdqa 0x871e(%rip),%ymm6 # 2c7e0 <_sk_overlay_sse2_8bit+0xb6b>
+ DB 72,173 ; lods %ds:(%rsi),%rax
+ DB 76,99,72,8 ; movslq 0x8(%rax),%r9
+ DB 76,99,193 ; movslq %ecx,%r8
+ DB 77,15,175,193 ; imul %r9,%r8
+ DB 73,193,224,2 ; shl $0x2,%r8
+ DB 76,3,0 ; add (%rax),%r8
+ DB 76,99,218 ; movslq %edx,%r11
+ DB 72,133,255 ; test %rdi,%rdi
+ DB 15,133,222,0,0,0 ; jne 2414a <_sk_srcover_rgba_8888_hsw_8bit+0xfe>
+ DB 196,1,126,111,76,152,32 ; vmovdqu 0x20(%r8,%r11,4),%ymm9
+ DB 196,1,126,111,28,152 ; vmovdqu (%r8,%r11,4),%ymm11
+ DB 197,253,111,53,159,134,0,0 ; vmovdqa 0x869f(%rip),%ymm6 # 2c720 <_sk_overlay_sse2_8bit+0xb70>
DB 196,226,117,0,254 ; vpshufb %ymm6,%ymm1,%ymm7
DB 196,226,125,0,246 ; vpshufb %ymm6,%ymm0,%ymm6
DB 196,66,125,48,195 ; vpmovzxbw %xmm11,%ymm8
@@ -34453,108 +34452,108 @@ _sk_srcover_rgba_8888_hsw_8bit LABEL PROC
DB 197,165,248,228 ; vpsubb %ymm4,%ymm11,%ymm4
DB 197,221,252,224 ; vpaddb %ymm0,%ymm4,%ymm4
DB 197,213,252,233 ; vpaddb %ymm1,%ymm5,%ymm5
- DB 77,133,192 ; test %r8,%r8
- DB 117,72 ; jne 241c2 <_sk_srcover_rgba_8888_hsw_8bit+0x13a>
- DB 196,161,126,127,36,138 ; vmovdqu %ymm4,(%rdx,%r9,4)
- DB 196,161,126,127,108,138,32 ; vmovdqu %ymm5,0x20(%rdx,%r9,4)
+ DB 72,133,255 ; test %rdi,%rdi
+ DB 117,78 ; jne 24187 <_sk_srcover_rgba_8888_hsw_8bit+0x13b>
+ DB 196,129,126,127,36,152 ; vmovdqu %ymm4,(%r8,%r11,4)
+ DB 196,129,126,127,108,152,32 ; vmovdqu %ymm5,0x20(%r8,%r11,4)
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
- DB 68,137,192 ; mov %r8d,%eax
- DB 36,15 ; and $0xf,%al
+ DB 65,137,249 ; mov %edi,%r9d
+ DB 65,128,225,15 ; and $0xf,%r9b
DB 196,65,53,239,201 ; vpxor %ymm9,%ymm9,%ymm9
DB 196,65,37,239,219 ; vpxor %ymm11,%ymm11,%ymm11
- DB 254,200 ; dec %al
- DB 60,14 ; cmp $0xe,%al
- DB 15,135,22,255,255,255 ; ja 240ba <_sk_srcover_rgba_8888_hsw_8bit+0x32>
- DB 15,182,192 ; movzbl %al,%eax
- DB 72,141,13,234,1,0,0 ; lea 0x1ea(%rip),%rcx # 24398 <_sk_srcover_rgba_8888_hsw_8bit+0x310>
- DB 72,99,4,129 ; movslq (%rcx,%rax,4),%rax
- DB 72,1,200 ; add %rcx,%rax
- DB 255,224 ; jmpq *%rax
- DB 196,33,121,110,28,138 ; vmovd (%rdx,%r9,4),%xmm11
- DB 233,248,254,255,255 ; jmpq 240ba <_sk_srcover_rgba_8888_hsw_8bit+0x32>
- DB 65,128,224,15 ; and $0xf,%r8b
- DB 65,254,200 ; dec %r8b
- DB 65,128,248,14 ; cmp $0xe,%r8b
- DB 119,184 ; ja 24187 <_sk_srcover_rgba_8888_hsw_8bit+0xff>
- DB 65,15,182,192 ; movzbl %r8b,%eax
- DB 72,141,13,250,1,0,0 ; lea 0x1fa(%rip),%rcx # 243d4 <_sk_srcover_rgba_8888_hsw_8bit+0x34c>
- DB 72,99,4,129 ; movslq (%rcx,%rax,4),%rax
- DB 72,1,200 ; add %rcx,%rax
- DB 255,224 ; jmpq *%rax
- DB 196,161,121,126,36,138 ; vmovd %xmm4,(%rdx,%r9,4)
- DB 235,156 ; jmp 24187 <_sk_srcover_rgba_8888_hsw_8bit+0xff>
- DB 196,161,121,110,100,138,8 ; vmovd 0x8(%rdx,%r9,4),%xmm4
+ DB 65,254,201 ; dec %r9b
+ DB 65,128,249,14 ; cmp $0xe,%r9b
+ DB 15,135,17,255,255,255 ; ja 24079 <_sk_srcover_rgba_8888_hsw_8bit+0x2d>
+ DB 69,15,182,201 ; movzbl %r9b,%r9d
+ DB 76,141,21,237,1,0,0 ; lea 0x1ed(%rip),%r10 # 24360 <_sk_srcover_rgba_8888_hsw_8bit+0x314>
+ DB 75,99,4,138 ; movslq (%r10,%r9,4),%rax
+ DB 76,1,208 ; add %r10,%rax
+ DB 255,224 ; jmpq *%rax
+ DB 196,1,121,110,28,152 ; vmovd (%r8,%r11,4),%xmm11
+ DB 233,242,254,255,255 ; jmpq 24079 <_sk_srcover_rgba_8888_hsw_8bit+0x2d>
+ DB 65,137,249 ; mov %edi,%r9d
+ DB 65,128,225,15 ; and $0xf,%r9b
+ DB 65,254,201 ; dec %r9b
+ DB 65,128,249,14 ; cmp $0xe,%r9b
+ DB 119,175 ; ja 24146 <_sk_srcover_rgba_8888_hsw_8bit+0xfa>
+ DB 65,15,182,193 ; movzbl %r9b,%eax
+ DB 76,141,13,250,1,0,0 ; lea 0x1fa(%rip),%r9 # 2439c <_sk_srcover_rgba_8888_hsw_8bit+0x350>
+ DB 73,99,4,129 ; movslq (%r9,%rax,4),%rax
+ DB 76,1,200 ; add %r9,%rax
+ DB 255,224 ; jmpq *%rax
+ DB 196,129,121,126,36,152 ; vmovd %xmm4,(%r8,%r11,4)
+ DB 235,147 ; jmp 24146 <_sk_srcover_rgba_8888_hsw_8bit+0xfa>
+ DB 196,129,121,110,100,152,8 ; vmovd 0x8(%r8,%r11,4),%xmm4
DB 196,226,121,89,236 ; vpbroadcastq %xmm4,%xmm5
DB 196,65,53,239,201 ; vpxor %ymm9,%ymm9,%ymm9
DB 196,99,53,2,221,4 ; vpblendd $0x4,%ymm5,%ymm9,%ymm11
- DB 196,162,121,53,52,138 ; vpmovzxdq (%rdx,%r9,4),%xmm6
+ DB 196,130,121,53,52,152 ; vpmovzxdq (%r8,%r11,4),%xmm6
DB 197,249,112,246,232 ; vpshufd $0xe8,%xmm6,%xmm6
DB 196,99,37,2,222,3 ; vpblendd $0x3,%ymm6,%ymm11,%ymm11
- DB 233,162,254,255,255 ; jmpq 240ba <_sk_srcover_rgba_8888_hsw_8bit+0x32>
- DB 196,161,121,110,100,138,24 ; vmovd 0x18(%rdx,%r9,4),%xmm4
+ DB 233,153,254,255,255 ; jmpq 24079 <_sk_srcover_rgba_8888_hsw_8bit+0x2d>
+ DB 196,129,121,110,100,152,24 ; vmovd 0x18(%r8,%r11,4),%xmm4
DB 196,226,125,89,236 ; vpbroadcastq %xmm4,%ymm5
DB 196,65,53,239,201 ; vpxor %ymm9,%ymm9,%ymm9
DB 196,99,53,2,221,64 ; vpblendd $0x40,%ymm5,%ymm9,%ymm11
DB 196,99,125,57,222,1 ; vextracti128 $0x1,%ymm11,%xmm6
- DB 196,163,73,34,116,138,20,1 ; vpinsrd $0x1,0x14(%rdx,%r9,4),%xmm6,%xmm6
+ DB 196,131,73,34,116,152,20,1 ; vpinsrd $0x1,0x14(%r8,%r11,4),%xmm6,%xmm6
DB 196,99,37,56,222,1 ; vinserti128 $0x1,%xmm6,%ymm11,%ymm11
DB 196,99,125,57,222,1 ; vextracti128 $0x1,%ymm11,%xmm6
- DB 196,163,73,34,116,138,16,0 ; vpinsrd $0x0,0x10(%rdx,%r9,4),%xmm6,%xmm6
+ DB 196,131,73,34,116,152,16,0 ; vpinsrd $0x0,0x10(%r8,%r11,4),%xmm6,%xmm6
DB 196,99,37,56,222,1 ; vinserti128 $0x1,%xmm6,%ymm11,%ymm11
- DB 196,161,122,111,52,138 ; vmovdqu (%rdx,%r9,4),%xmm6
+ DB 196,129,122,111,52,152 ; vmovdqu (%r8,%r11,4),%xmm6
DB 196,67,77,2,219,240 ; vpblendd $0xf0,%ymm11,%ymm6,%ymm11
- DB 233,82,254,255,255 ; jmpq 240ba <_sk_srcover_rgba_8888_hsw_8bit+0x32>
- DB 196,161,121,110,100,138,40 ; vmovd 0x28(%rdx,%r9,4),%xmm4
+ DB 233,73,254,255,255 ; jmpq 24079 <_sk_srcover_rgba_8888_hsw_8bit+0x2d>
+ DB 196,129,121,110,100,152,40 ; vmovd 0x28(%r8,%r11,4),%xmm4
DB 196,226,121,89,228 ; vpbroadcastq %xmm4,%xmm4
DB 197,213,239,237 ; vpxor %ymm5,%ymm5,%ymm5
DB 196,99,85,2,204,4 ; vpblendd $0x4,%ymm4,%ymm5,%ymm9
- DB 196,163,49,34,108,138,36,1 ; vpinsrd $0x1,0x24(%rdx,%r9,4),%xmm9,%xmm5
+ DB 196,131,49,34,108,152,36,1 ; vpinsrd $0x1,0x24(%r8,%r11,4),%xmm9,%xmm5
DB 196,99,53,2,205,15 ; vpblendd $0xf,%ymm5,%ymm9,%ymm9
- DB 196,161,121,110,108,138,32 ; vmovd 0x20(%rdx,%r9,4),%xmm5
+ DB 196,129,121,110,108,152,32 ; vmovd 0x20(%r8,%r11,4),%xmm5
DB 196,99,53,2,205,1 ; vpblendd $0x1,%ymm5,%ymm9,%ymm9
- DB 233,22,254,255,255 ; jmpq 240b4 <_sk_srcover_rgba_8888_hsw_8bit+0x2c>
- DB 196,161,121,110,100,138,56 ; vmovd 0x38(%rdx,%r9,4),%xmm4
+ DB 233,13,254,255,255 ; jmpq 24073 <_sk_srcover_rgba_8888_hsw_8bit+0x27>
+ DB 196,129,121,110,100,152,56 ; vmovd 0x38(%r8,%r11,4),%xmm4
DB 196,226,125,89,228 ; vpbroadcastq %xmm4,%ymm4
DB 197,213,239,237 ; vpxor %ymm5,%ymm5,%ymm5
DB 196,99,85,2,204,64 ; vpblendd $0x40,%ymm4,%ymm5,%ymm9
DB 196,99,125,57,205,1 ; vextracti128 $0x1,%ymm9,%xmm5
- DB 196,163,81,34,108,138,52,1 ; vpinsrd $0x1,0x34(%rdx,%r9,4),%xmm5,%xmm5
+ DB 196,131,81,34,108,152,52,1 ; vpinsrd $0x1,0x34(%r8,%r11,4),%xmm5,%xmm5
DB 196,99,53,56,205,1 ; vinserti128 $0x1,%xmm5,%ymm9,%ymm9
DB 196,99,125,57,205,1 ; vextracti128 $0x1,%ymm9,%xmm5
- DB 196,163,81,34,108,138,48,0 ; vpinsrd $0x0,0x30(%rdx,%r9,4),%xmm5,%xmm5
+ DB 196,131,81,34,108,152,48,0 ; vpinsrd $0x0,0x30(%r8,%r11,4),%xmm5,%xmm5
DB 196,99,53,56,205,1 ; vinserti128 $0x1,%xmm5,%ymm9,%ymm9
- DB 196,33,126,111,28,138 ; vmovdqu (%rdx,%r9,4),%ymm11
- DB 196,161,122,111,116,138,32 ; vmovdqu 0x20(%rdx,%r9,4),%xmm6
+ DB 196,1,126,111,28,152 ; vmovdqu (%r8,%r11,4),%ymm11
+ DB 196,129,122,111,116,152,32 ; vmovdqu 0x20(%r8,%r11,4),%xmm6
DB 196,67,77,2,201,240 ; vpblendd $0xf0,%ymm9,%ymm6,%ymm9
- DB 233,198,253,255,255 ; jmpq 240ba <_sk_srcover_rgba_8888_hsw_8bit+0x32>
- DB 196,163,121,22,100,138,8,2 ; vpextrd $0x2,%xmm4,0x8(%rdx,%r9,4)
- DB 196,161,121,214,36,138 ; vmovq %xmm4,(%rdx,%r9,4)
- DB 233,128,254,255,255 ; jmpq 24187 <_sk_srcover_rgba_8888_hsw_8bit+0xff>
+ DB 233,189,253,255,255 ; jmpq 24079 <_sk_srcover_rgba_8888_hsw_8bit+0x2d>
+ DB 196,131,121,22,100,152,8,2 ; vpextrd $0x2,%xmm4,0x8(%r8,%r11,4)
+ DB 196,129,121,214,36,152 ; vmovq %xmm4,(%r8,%r11,4)
+ DB 233,119,254,255,255 ; jmpq 24146 <_sk_srcover_rgba_8888_hsw_8bit+0xfa>
DB 196,227,125,57,229,1 ; vextracti128 $0x1,%ymm4,%xmm5
- DB 196,163,121,22,108,138,24,2 ; vpextrd $0x2,%xmm5,0x18(%rdx,%r9,4)
+ DB 196,131,121,22,108,152,24,2 ; vpextrd $0x2,%xmm5,0x18(%r8,%r11,4)
DB 196,227,125,57,229,1 ; vextracti128 $0x1,%ymm4,%xmm5
- DB 196,163,121,22,108,138,20,1 ; vpextrd $0x1,%xmm5,0x14(%rdx,%r9,4)
+ DB 196,131,121,22,108,152,20,1 ; vpextrd $0x1,%xmm5,0x14(%r8,%r11,4)
DB 196,227,125,57,229,1 ; vextracti128 $0x1,%ymm4,%xmm5
- DB 196,161,121,126,108,138,16 ; vmovd %xmm5,0x10(%rdx,%r9,4)
- DB 196,161,122,127,36,138 ; vmovdqu %xmm4,(%rdx,%r9,4)
- DB 233,76,254,255,255 ; jmpq 24187 <_sk_srcover_rgba_8888_hsw_8bit+0xff>
- DB 196,163,121,22,108,138,40,2 ; vpextrd $0x2,%xmm5,0x28(%rdx,%r9,4)
- DB 196,163,121,22,108,138,36,1 ; vpextrd $0x1,%xmm5,0x24(%rdx,%r9,4)
- DB 196,161,121,126,108,138,32 ; vmovd %xmm5,0x20(%rdx,%r9,4)
- DB 196,161,126,127,36,138 ; vmovdqu %ymm4,(%rdx,%r9,4)
- DB 233,42,254,255,255 ; jmpq 24187 <_sk_srcover_rgba_8888_hsw_8bit+0xff>
+ DB 196,129,121,126,108,152,16 ; vmovd %xmm5,0x10(%r8,%r11,4)
+ DB 196,129,122,127,36,152 ; vmovdqu %xmm4,(%r8,%r11,4)
+ DB 233,67,254,255,255 ; jmpq 24146 <_sk_srcover_rgba_8888_hsw_8bit+0xfa>
+ DB 196,131,121,22,108,152,40,2 ; vpextrd $0x2,%xmm5,0x28(%r8,%r11,4)
+ DB 196,131,121,22,108,152,36,1 ; vpextrd $0x1,%xmm5,0x24(%r8,%r11,4)
+ DB 196,129,121,126,108,152,32 ; vmovd %xmm5,0x20(%r8,%r11,4)
+ DB 196,129,126,127,36,152 ; vmovdqu %ymm4,(%r8,%r11,4)
+ DB 233,33,254,255,255 ; jmpq 24146 <_sk_srcover_rgba_8888_hsw_8bit+0xfa>
DB 196,227,125,57,238,1 ; vextracti128 $0x1,%ymm5,%xmm6
- DB 196,163,121,22,116,138,56,2 ; vpextrd $0x2,%xmm6,0x38(%rdx,%r9,4)
+ DB 196,131,121,22,116,152,56,2 ; vpextrd $0x2,%xmm6,0x38(%r8,%r11,4)
DB 196,227,125,57,238,1 ; vextracti128 $0x1,%ymm5,%xmm6
- DB 196,163,121,22,116,138,52,1 ; vpextrd $0x1,%xmm6,0x34(%rdx,%r9,4)
+ DB 196,131,121,22,116,152,52,1 ; vpextrd $0x1,%xmm6,0x34(%r8,%r11,4)
DB 196,227,125,57,238,1 ; vextracti128 $0x1,%ymm5,%xmm6
- DB 196,161,121,126,116,138,48 ; vmovd %xmm6,0x30(%rdx,%r9,4)
- DB 196,161,126,127,36,138 ; vmovdqu %ymm4,(%rdx,%r9,4)
- DB 196,161,122,127,108,138,32 ; vmovdqu %xmm5,0x20(%rdx,%r9,4)
- DB 233,239,253,255,255 ; jmpq 24187 <_sk_srcover_rgba_8888_hsw_8bit+0xff>
- DB 31 ; (bad)
- DB 254 ; (bad)
+ DB 196,129,121,126,116,152,48 ; vmovd %xmm6,0x30(%r8,%r11,4)
+ DB 196,129,126,127,36,152 ; vmovdqu %ymm4,(%r8,%r11,4)
+ DB 196,129,122,127,108,152,32 ; vmovdqu %xmm5,0x20(%r8,%r11,4)
+ DB 233,230,253,255,255 ; jmpq 24146 <_sk_srcover_rgba_8888_hsw_8bit+0xfa>
+ DB 28,254 ; sbb $0xfe,%al
DB 255 ; (bad)
DB 255,106,254 ; ljmp *-0x2(%rdx)
DB 255 ; (bad)
@@ -34567,7 +34566,11 @@ _sk_srcover_rgba_8888_hsw_8bit LABEL PROC
DB 255,151,254,255,255,128 ; callq *-0x7f000002(%rdi)
DB 254 ; (bad)
DB 255 ; (bad)
- DB 255,28,253,255,255,244,254 ; lcall *-0x10b0001(,%rdi,8)
+ DB 255,19 ; callq *(%rbx)
+ DB 253 ; std
+ DB 255 ; (bad)
+ DB 255,244 ; push %rsp
+ DB 254 ; (bad)
DB 255 ; (bad)
DB 255,230 ; jmpq *%rsi
DB 254 ; (bad)
@@ -34602,7 +34605,7 @@ _sk_srcover_rgba_8888_hsw_8bit LABEL PROC
DB 255 ; (bad)
DB 255 ; (bad)
DB 255 ; (bad)
- DB 126,255 ; jle 243f1 <_sk_srcover_rgba_8888_hsw_8bit+0x369>
+ DB 126,255 ; jle 243b9 <_sk_srcover_rgba_8888_hsw_8bit+0x36d>
DB 255 ; (bad)
DB 255,119,255 ; pushq -0x1(%rdi)
DB 255 ; (bad)
@@ -34622,7 +34625,7 @@ PUBLIC _sk_scale_1_float_hsw_8bit
_sk_scale_1_float_hsw_8bit LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 197,250,16,32 ; vmovss (%rax),%xmm4
- DB 197,218,89,37,242,124,0,0 ; vmulss 0x7cf2(%rip),%xmm4,%xmm4 # 2c110 <_sk_overlay_sse2_8bit+0x49b>
+ DB 197,218,89,37,102,124,0,0 ; vmulss 0x7c66(%rip),%xmm4,%xmm4 # 2c04c <_sk_overlay_sse2_8bit+0x49c>
DB 197,250,44,196 ; vcvttss2si %xmm4,%eax
DB 197,249,110,224 ; vmovd %eax,%xmm4
DB 196,226,125,120,228 ; vpbroadcastb %xmm4,%ymm4
@@ -34632,7 +34635,7 @@ _sk_scale_1_float_hsw_8bit LABEL PROC
DB 196,226,125,48,241 ; vpmovzxbw %xmm1,%ymm6
DB 196,227,125,57,201,1 ; vextracti128 $0x1,%ymm1,%xmm1
DB 196,226,125,48,201 ; vpmovzxbw %xmm1,%ymm1
- DB 197,221,219,37,173,131,0,0 ; vpand 0x83ad(%rip),%ymm4,%ymm4 # 2c800 <_sk_overlay_sse2_8bit+0xb8b>
+ DB 197,221,219,37,37,131,0,0 ; vpand 0x8325(%rip),%ymm4,%ymm4 # 2c740 <_sk_overlay_sse2_8bit+0xb90>
DB 197,221,213,249 ; vpmullw %ymm1,%ymm4,%ymm7
DB 197,93,213,198 ; vpmullw %ymm6,%ymm4,%ymm8
DB 197,93,213,200 ; vpmullw %ymm0,%ymm4,%ymm9
@@ -34656,20 +34659,19 @@ _sk_scale_1_float_hsw_8bit LABEL PROC
PUBLIC _sk_scale_u8_hsw_8bit
_sk_scale_u8_hsw_8bit LABEL PROC
- DB 76,99,7 ; movslq (%rdi),%r8
- DB 76,139,79,16 ; mov 0x10(%rdi),%r9
- DB 72,173 ; lods %ds:(%rsi),%rax
- DB 72,99,72,8 ; movslq 0x8(%rax),%rcx
- DB 72,99,87,8 ; movslq 0x8(%rdi),%rdx
- DB 72,15,175,209 ; imul %rcx,%rdx
- DB 72,3,16 ; add (%rax),%rdx
- DB 77,133,201 ; test %r9,%r9
- DB 15,133,191,0,0,0 ; jne 2458b <_sk_scale_u8_hsw_8bit+0xe0>
- DB 196,161,122,111,36,2 ; vmovdqu (%rdx,%r8,1),%xmm4
+ DB 72,173 ; lods %ds:(%rsi),%rax
+ DB 76,99,72,8 ; movslq 0x8(%rax),%r9
+ DB 76,99,193 ; movslq %ecx,%r8
+ DB 77,15,175,193 ; imul %r9,%r8
+ DB 76,3,0 ; add (%rax),%r8
+ DB 76,99,218 ; movslq %edx,%r11
+ DB 72,133,255 ; test %rdi,%rdi
+ DB 15,133,191,0,0,0 ; jne 2454e <_sk_scale_u8_hsw_8bit+0xdb>
+ DB 196,129,122,111,36,24 ; vmovdqu (%r8,%r11,1),%xmm4
DB 196,226,125,49,236 ; vpmovzxbd %xmm4,%ymm5
DB 197,249,112,228,78 ; vpshufd $0x4e,%xmm4,%xmm4
DB 196,226,125,49,228 ; vpmovzxbd %xmm4,%ymm4
- DB 197,253,111,53,55,131,0,0 ; vmovdqa 0x8337(%rip),%ymm6 # 2c820 <_sk_overlay_sse2_8bit+0xbab>
+ DB 197,253,111,53,180,130,0,0 ; vmovdqa 0x82b4(%rip),%ymm6 # 2c760 <_sk_overlay_sse2_8bit+0xbb0>
DB 196,226,93,0,230 ; vpshufb %ymm6,%ymm4,%ymm4
DB 196,226,85,0,238 ; vpshufb %ymm6,%ymm5,%ymm5
DB 196,226,125,48,240 ; vpmovzxbw %xmm0,%ymm6
@@ -34704,78 +34706,78 @@ _sk_scale_u8_hsw_8bit LABEL PROC
DB 197,213,103,201 ; vpackuswb %ymm1,%ymm5,%ymm1
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
+ DB 65,137,249 ; mov %edi,%r9d
DB 65,128,225,15 ; and $0xf,%r9b
DB 197,217,239,228 ; vpxor %xmm4,%xmm4,%xmm4
DB 65,254,201 ; dec %r9b
DB 65,128,249,14 ; cmp $0xe,%r9b
- DB 15,135,50,255,255,255 ; ja 244d2 <_sk_scale_u8_hsw_8bit+0x27>
- DB 65,15,182,193 ; movzbl %r9b,%eax
- DB 72,141,13,201,0,0,0 ; lea 0xc9(%rip),%rcx # 24674 <_sk_scale_u8_hsw_8bit+0x1c9>
- DB 72,99,4,129 ; movslq (%rcx,%rax,4),%rax
- DB 72,1,200 ; add %rcx,%rax
+ DB 15,135,47,255,255,255 ; ja 24495 <_sk_scale_u8_hsw_8bit+0x22>
+ DB 69,15,182,201 ; movzbl %r9b,%r9d
+ DB 76,141,21,199,0,0,0 ; lea 0xc7(%rip),%r10 # 24638 <_sk_scale_u8_hsw_8bit+0x1c5>
+ DB 75,99,4,138 ; movslq (%r10,%r9,4),%rax
+ DB 76,1,208 ; add %r10,%rax
DB 255,224 ; jmpq *%rax
- DB 66,15,182,4,2 ; movzbl (%rdx,%r8,1),%eax
+ DB 67,15,182,4,24 ; movzbl (%r8,%r11,1),%eax
DB 197,249,110,224 ; vmovd %eax,%xmm4
- DB 233,16,255,255,255 ; jmpq 244d2 <_sk_scale_u8_hsw_8bit+0x27>
+ DB 233,13,255,255,255 ; jmpq 24495 <_sk_scale_u8_hsw_8bit+0x22>
DB 197,217,239,228 ; vpxor %xmm4,%xmm4,%xmm4
- DB 196,163,89,32,100,2,2,2 ; vpinsrb $0x2,0x2(%rdx,%r8,1),%xmm4,%xmm4
- DB 66,15,183,4,2 ; movzwl (%rdx,%r8,1),%eax
+ DB 196,131,89,32,100,24,2,2 ; vpinsrb $0x2,0x2(%r8,%r11,1),%xmm4,%xmm4
+ DB 67,15,183,4,24 ; movzwl (%r8,%r11,1),%eax
DB 197,249,110,232 ; vmovd %eax,%xmm5
DB 196,227,89,14,229,1 ; vpblendw $0x1,%xmm5,%xmm4,%xmm4
- DB 233,240,254,255,255 ; jmpq 244d2 <_sk_scale_u8_hsw_8bit+0x27>
+ DB 233,237,254,255,255 ; jmpq 24495 <_sk_scale_u8_hsw_8bit+0x22>
DB 197,217,239,228 ; vpxor %xmm4,%xmm4,%xmm4
- DB 196,163,89,32,100,2,6,6 ; vpinsrb $0x6,0x6(%rdx,%r8,1),%xmm4,%xmm4
- DB 196,163,89,32,100,2,5,5 ; vpinsrb $0x5,0x5(%rdx,%r8,1),%xmm4,%xmm4
- DB 196,163,89,32,100,2,4,4 ; vpinsrb $0x4,0x4(%rdx,%r8,1),%xmm4,%xmm4
- DB 196,161,121,110,44,2 ; vmovd (%rdx,%r8,1),%xmm5
+ DB 196,131,89,32,100,24,6,6 ; vpinsrb $0x6,0x6(%r8,%r11,1),%xmm4,%xmm4
+ DB 196,131,89,32,100,24,5,5 ; vpinsrb $0x5,0x5(%r8,%r11,1),%xmm4,%xmm4
+ DB 196,131,89,32,100,24,4,4 ; vpinsrb $0x4,0x4(%r8,%r11,1),%xmm4,%xmm4
+ DB 196,129,121,110,44,24 ; vmovd (%r8,%r11,1),%xmm5
DB 196,227,89,2,229,1 ; vpblendd $0x1,%xmm5,%xmm4,%xmm4
- DB 233,195,254,255,255 ; jmpq 244d2 <_sk_scale_u8_hsw_8bit+0x27>
+ DB 233,192,254,255,255 ; jmpq 24495 <_sk_scale_u8_hsw_8bit+0x22>
DB 197,217,239,228 ; vpxor %xmm4,%xmm4,%xmm4
- DB 196,163,89,32,100,2,10,10 ; vpinsrb $0xa,0xa(%rdx,%r8,1),%xmm4,%xmm4
- DB 196,163,89,32,100,2,9,9 ; vpinsrb $0x9,0x9(%rdx,%r8,1),%xmm4,%xmm4
- DB 196,163,89,32,100,2,8,8 ; vpinsrb $0x8,0x8(%rdx,%r8,1),%xmm4,%xmm4
- DB 196,161,122,126,44,2 ; vmovq (%rdx,%r8,1),%xmm5
+ DB 196,131,89,32,100,24,10,10 ; vpinsrb $0xa,0xa(%r8,%r11,1),%xmm4,%xmm4
+ DB 196,131,89,32,100,24,9,9 ; vpinsrb $0x9,0x9(%r8,%r11,1),%xmm4,%xmm4
+ DB 196,131,89,32,100,24,8,8 ; vpinsrb $0x8,0x8(%r8,%r11,1),%xmm4,%xmm4
+ DB 196,129,122,126,44,24 ; vmovq (%r8,%r11,1),%xmm5
DB 196,227,81,2,228,12 ; vpblendd $0xc,%xmm4,%xmm5,%xmm4
- DB 233,150,254,255,255 ; jmpq 244d2 <_sk_scale_u8_hsw_8bit+0x27>
+ DB 233,147,254,255,255 ; jmpq 24495 <_sk_scale_u8_hsw_8bit+0x22>
DB 197,217,239,228 ; vpxor %xmm4,%xmm4,%xmm4
- DB 196,163,89,32,100,2,14,14 ; vpinsrb $0xe,0xe(%rdx,%r8,1),%xmm4,%xmm4
- DB 196,163,89,32,100,2,13,13 ; vpinsrb $0xd,0xd(%rdx,%r8,1),%xmm4,%xmm4
- DB 196,163,89,32,100,2,12,12 ; vpinsrb $0xc,0xc(%rdx,%r8,1),%xmm4,%xmm4
- DB 196,161,122,126,44,2 ; vmovq (%rdx,%r8,1),%xmm5
- DB 196,163,81,34,108,2,8,2 ; vpinsrd $0x2,0x8(%rdx,%r8,1),%xmm5,%xmm5
+ DB 196,131,89,32,100,24,14,14 ; vpinsrb $0xe,0xe(%r8,%r11,1),%xmm4,%xmm4
+ DB 196,131,89,32,100,24,13,13 ; vpinsrb $0xd,0xd(%r8,%r11,1),%xmm4,%xmm4
+ DB 196,131,89,32,100,24,12,12 ; vpinsrb $0xc,0xc(%r8,%r11,1),%xmm4,%xmm4
+ DB 196,129,122,126,44,24 ; vmovq (%r8,%r11,1),%xmm5
+ DB 196,131,81,34,108,24,8,2 ; vpinsrd $0x2,0x8(%r8,%r11,1),%xmm5,%xmm5
DB 196,227,81,2,228,8 ; vpblendd $0x8,%xmm4,%xmm5,%xmm4
- DB 233,97,254,255,255 ; jmpq 244d2 <_sk_scale_u8_hsw_8bit+0x27>
- DB 15,31,0 ; nopl (%rax)
- DB 64,255 ; rex (bad)
- DB 255 ; (bad)
- DB 255,90,255 ; lcall *-0x1(%rdx)
+ DB 233,94,254,255,255 ; jmpq 24495 <_sk_scale_u8_hsw_8bit+0x22>
+ DB 144 ; nop
+ DB 66,255 ; rex.X (bad)
DB 255 ; (bad)
- DB 255,78,255 ; decl -0x1(%rsi)
+ DB 255,92,255,255 ; lcall *-0x1(%rdi,%rdi,8)
+ DB 255,80,255 ; callq *-0x1(%rax)
DB 255 ; (bad)
- DB 255,138,255,255,255,130 ; decl -0x7d000001(%rdx)
+ DB 255,140,255,255,255,132,255 ; decl -0x7b0001(%rdi,%rdi,8)
DB 255 ; (bad)
DB 255 ; (bad)
+ DB 124,255 ; jl 2464d <_sk_scale_u8_hsw_8bit+0x1da>
DB 255 ; (bad)
- DB 122,255 ; jp 24689 <_sk_scale_u8_hsw_8bit+0x1de>
+ DB 255,112,255 ; pushq -0x1(%rax)
DB 255 ; (bad)
- DB 255,110,255 ; ljmp *-0x1(%rsi)
DB 255 ; (bad)
- DB 255,183,255,255,255,175 ; pushq -0x50000001(%rdi)
+ DB 185,255,255,255,177 ; mov $0xb1ffffff,%ecx
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,167,255,255,255,155 ; jmpq *-0x64000001(%rdi)
+ DB 255,169,255,255,255,157 ; ljmp *-0x62000001(%rcx)
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,228 ; jmpq *%rsp
+ DB 255,230 ; jmpq *%rsi
DB 255 ; (bad)
DB 255 ; (bad)
DB 255 ; (bad)
- DB 220,255 ; fdivr %st,%st(7)
+ DB 222,255 ; fdivrp %st,%st(7)
DB 255 ; (bad)
- DB 255,212 ; callq *%rsp
+ DB 255,214 ; callq *%rsi
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,200 ; dec %eax
+ DB 255,202 ; dec %edx
DB 255 ; (bad)
DB 255 ; (bad)
DB 255 ; .byte 0xff
@@ -34784,7 +34786,7 @@ PUBLIC _sk_lerp_1_float_hsw_8bit
_sk_lerp_1_float_hsw_8bit LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 197,250,16,32 ; vmovss (%rax),%xmm4
- DB 197,218,89,37,82,122,0,0 ; vmulss 0x7a52(%rip),%xmm4,%xmm4 # 2c110 <_sk_overlay_sse2_8bit+0x49b>
+ DB 197,218,89,37,202,121,0,0 ; vmulss 0x79ca(%rip),%xmm4,%xmm4 # 2c04c <_sk_overlay_sse2_8bit+0x49c>
DB 197,250,44,196 ; vcvttss2si %xmm4,%eax
DB 197,249,110,224 ; vmovd %eax,%xmm4
DB 196,226,125,120,228 ; vpbroadcastb %xmm4,%ymm4
@@ -34794,7 +34796,7 @@ _sk_lerp_1_float_hsw_8bit LABEL PROC
DB 196,226,125,48,241 ; vpmovzxbw %xmm1,%ymm6
DB 196,227,125,57,201,1 ; vextracti128 $0x1,%ymm1,%xmm1
DB 196,226,125,48,201 ; vpmovzxbw %xmm1,%ymm1
- DB 197,221,219,61,77,129,0,0 ; vpand 0x814d(%rip),%ymm4,%ymm7 # 2c840 <_sk_overlay_sse2_8bit+0xbcb>
+ DB 197,221,219,61,201,128,0,0 ; vpand 0x80c9(%rip),%ymm4,%ymm7 # 2c780 <_sk_overlay_sse2_8bit+0xbd0>
DB 197,69,213,193 ; vpmullw %ymm1,%ymm7,%ymm8
DB 197,69,213,206 ; vpmullw %ymm6,%ymm7,%ymm9
DB 197,69,213,208 ; vpmullw %ymm0,%ymm7,%ymm10
@@ -34849,20 +34851,19 @@ _sk_lerp_1_float_hsw_8bit LABEL PROC
PUBLIC _sk_lerp_u8_hsw_8bit
_sk_lerp_u8_hsw_8bit LABEL PROC
- DB 76,99,7 ; movslq (%rdi),%r8
- DB 76,139,79,16 ; mov 0x10(%rdi),%r9
- DB 72,173 ; lods %ds:(%rsi),%rax
- DB 72,99,72,8 ; movslq 0x8(%rax),%rcx
- DB 72,99,87,8 ; movslq 0x8(%rdi),%rdx
- DB 72,15,175,209 ; imul %rcx,%rdx
- DB 72,3,16 ; add (%rax),%rdx
- DB 77,133,201 ; test %r9,%r9
- DB 15,133,106,1,0,0 ; jne 2496b <_sk_lerp_u8_hsw_8bit+0x18b>
- DB 196,161,122,111,36,2 ; vmovdqu (%rdx,%r8,1),%xmm4
+ DB 72,173 ; lods %ds:(%rsi),%rax
+ DB 76,99,72,8 ; movslq 0x8(%rax),%r9
+ DB 76,99,193 ; movslq %ecx,%r8
+ DB 77,15,175,193 ; imul %r9,%r8
+ DB 76,3,0 ; add (%rax),%r8
+ DB 76,99,218 ; movslq %edx,%r11
+ DB 72,133,255 ; test %rdi,%rdi
+ DB 15,133,106,1,0,0 ; jne 2492a <_sk_lerp_u8_hsw_8bit+0x186>
+ DB 196,129,122,111,36,24 ; vmovdqu (%r8,%r11,1),%xmm4
DB 196,226,125,49,236 ; vpmovzxbd %xmm4,%ymm5
DB 197,249,112,228,78 ; vpshufd $0x4e,%xmm4,%xmm4
DB 196,226,125,49,228 ; vpmovzxbd %xmm4,%ymm4
- DB 197,253,111,53,66,128,0,0 ; vmovdqa 0x8042(%rip),%ymm6 # 2c860 <_sk_overlay_sse2_8bit+0xbeb>
+ DB 197,253,111,53,195,127,0,0 ; vmovdqa 0x7fc3(%rip),%ymm6 # 2c7a0 <_sk_overlay_sse2_8bit+0xbf0>
DB 196,98,93,0,206 ; vpshufb %ymm6,%ymm4,%ymm9
DB 196,98,85,0,222 ; vpshufb %ymm6,%ymm5,%ymm11
DB 196,226,125,48,240 ; vpmovzxbw %xmm0,%ymm6
@@ -34932,78 +34933,78 @@ _sk_lerp_u8_hsw_8bit LABEL PROC
DB 197,213,252,201 ; vpaddb %ymm1,%ymm5,%ymm1
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
+ DB 65,137,249 ; mov %edi,%r9d
DB 65,128,225,15 ; and $0xf,%r9b
DB 197,217,239,228 ; vpxor %xmm4,%xmm4,%xmm4
DB 65,254,201 ; dec %r9b
DB 65,128,249,14 ; cmp $0xe,%r9b
- DB 15,135,135,254,255,255 ; ja 24807 <_sk_lerp_u8_hsw_8bit+0x27>
- DB 65,15,182,193 ; movzbl %r9b,%eax
- DB 72,141,13,201,0,0,0 ; lea 0xc9(%rip),%rcx # 24a54 <_sk_lerp_u8_hsw_8bit+0x274>
- DB 72,99,4,129 ; movslq (%rcx,%rax,4),%rax
- DB 72,1,200 ; add %rcx,%rax
+ DB 15,135,132,254,255,255 ; ja 247c6 <_sk_lerp_u8_hsw_8bit+0x22>
+ DB 69,15,182,201 ; movzbl %r9b,%r9d
+ DB 76,141,21,199,0,0,0 ; lea 0xc7(%rip),%r10 # 24a14 <_sk_lerp_u8_hsw_8bit+0x270>
+ DB 75,99,4,138 ; movslq (%r10,%r9,4),%rax
+ DB 76,1,208 ; add %r10,%rax
DB 255,224 ; jmpq *%rax
- DB 66,15,182,4,2 ; movzbl (%rdx,%r8,1),%eax
+ DB 67,15,182,4,24 ; movzbl (%r8,%r11,1),%eax
DB 197,249,110,224 ; vmovd %eax,%xmm4
- DB 233,101,254,255,255 ; jmpq 24807 <_sk_lerp_u8_hsw_8bit+0x27>
+ DB 233,98,254,255,255 ; jmpq 247c6 <_sk_lerp_u8_hsw_8bit+0x22>
DB 197,217,239,228 ; vpxor %xmm4,%xmm4,%xmm4
- DB 196,163,89,32,100,2,2,2 ; vpinsrb $0x2,0x2(%rdx,%r8,1),%xmm4,%xmm4
- DB 66,15,183,4,2 ; movzwl (%rdx,%r8,1),%eax
+ DB 196,131,89,32,100,24,2,2 ; vpinsrb $0x2,0x2(%r8,%r11,1),%xmm4,%xmm4
+ DB 67,15,183,4,24 ; movzwl (%r8,%r11,1),%eax
DB 197,249,110,232 ; vmovd %eax,%xmm5
DB 196,227,89,14,229,1 ; vpblendw $0x1,%xmm5,%xmm4,%xmm4
- DB 233,69,254,255,255 ; jmpq 24807 <_sk_lerp_u8_hsw_8bit+0x27>
+ DB 233,66,254,255,255 ; jmpq 247c6 <_sk_lerp_u8_hsw_8bit+0x22>
DB 197,217,239,228 ; vpxor %xmm4,%xmm4,%xmm4
- DB 196,163,89,32,100,2,6,6 ; vpinsrb $0x6,0x6(%rdx,%r8,1),%xmm4,%xmm4
- DB 196,163,89,32,100,2,5,5 ; vpinsrb $0x5,0x5(%rdx,%r8,1),%xmm4,%xmm4
- DB 196,163,89,32,100,2,4,4 ; vpinsrb $0x4,0x4(%rdx,%r8,1),%xmm4,%xmm4
- DB 196,161,121,110,44,2 ; vmovd (%rdx,%r8,1),%xmm5
+ DB 196,131,89,32,100,24,6,6 ; vpinsrb $0x6,0x6(%r8,%r11,1),%xmm4,%xmm4
+ DB 196,131,89,32,100,24,5,5 ; vpinsrb $0x5,0x5(%r8,%r11,1),%xmm4,%xmm4
+ DB 196,131,89,32,100,24,4,4 ; vpinsrb $0x4,0x4(%r8,%r11,1),%xmm4,%xmm4
+ DB 196,129,121,110,44,24 ; vmovd (%r8,%r11,1),%xmm5
DB 196,227,89,2,229,1 ; vpblendd $0x1,%xmm5,%xmm4,%xmm4
- DB 233,24,254,255,255 ; jmpq 24807 <_sk_lerp_u8_hsw_8bit+0x27>
+ DB 233,21,254,255,255 ; jmpq 247c6 <_sk_lerp_u8_hsw_8bit+0x22>
DB 197,217,239,228 ; vpxor %xmm4,%xmm4,%xmm4
- DB 196,163,89,32,100,2,10,10 ; vpinsrb $0xa,0xa(%rdx,%r8,1),%xmm4,%xmm4
- DB 196,163,89,32,100,2,9,9 ; vpinsrb $0x9,0x9(%rdx,%r8,1),%xmm4,%xmm4
- DB 196,163,89,32,100,2,8,8 ; vpinsrb $0x8,0x8(%rdx,%r8,1),%xmm4,%xmm4
- DB 196,161,122,126,44,2 ; vmovq (%rdx,%r8,1),%xmm5
+ DB 196,131,89,32,100,24,10,10 ; vpinsrb $0xa,0xa(%r8,%r11,1),%xmm4,%xmm4
+ DB 196,131,89,32,100,24,9,9 ; vpinsrb $0x9,0x9(%r8,%r11,1),%xmm4,%xmm4
+ DB 196,131,89,32,100,24,8,8 ; vpinsrb $0x8,0x8(%r8,%r11,1),%xmm4,%xmm4
+ DB 196,129,122,126,44,24 ; vmovq (%r8,%r11,1),%xmm5
DB 196,227,81,2,228,12 ; vpblendd $0xc,%xmm4,%xmm5,%xmm4
- DB 233,235,253,255,255 ; jmpq 24807 <_sk_lerp_u8_hsw_8bit+0x27>
+ DB 233,232,253,255,255 ; jmpq 247c6 <_sk_lerp_u8_hsw_8bit+0x22>
DB 197,217,239,228 ; vpxor %xmm4,%xmm4,%xmm4
- DB 196,163,89,32,100,2,14,14 ; vpinsrb $0xe,0xe(%rdx,%r8,1),%xmm4,%xmm4
- DB 196,163,89,32,100,2,13,13 ; vpinsrb $0xd,0xd(%rdx,%r8,1),%xmm4,%xmm4
- DB 196,163,89,32,100,2,12,12 ; vpinsrb $0xc,0xc(%rdx,%r8,1),%xmm4,%xmm4
- DB 196,161,122,126,44,2 ; vmovq (%rdx,%r8,1),%xmm5
- DB 196,163,81,34,108,2,8,2 ; vpinsrd $0x2,0x8(%rdx,%r8,1),%xmm5,%xmm5
+ DB 196,131,89,32,100,24,14,14 ; vpinsrb $0xe,0xe(%r8,%r11,1),%xmm4,%xmm4
+ DB 196,131,89,32,100,24,13,13 ; vpinsrb $0xd,0xd(%r8,%r11,1),%xmm4,%xmm4
+ DB 196,131,89,32,100,24,12,12 ; vpinsrb $0xc,0xc(%r8,%r11,1),%xmm4,%xmm4
+ DB 196,129,122,126,44,24 ; vmovq (%r8,%r11,1),%xmm5
+ DB 196,131,81,34,108,24,8,2 ; vpinsrd $0x2,0x8(%r8,%r11,1),%xmm5,%xmm5
DB 196,227,81,2,228,8 ; vpblendd $0x8,%xmm4,%xmm5,%xmm4
- DB 233,182,253,255,255 ; jmpq 24807 <_sk_lerp_u8_hsw_8bit+0x27>
- DB 15,31,0 ; nopl (%rax)
- DB 64,255 ; rex (bad)
- DB 255 ; (bad)
- DB 255,90,255 ; lcall *-0x1(%rdx)
+ DB 233,179,253,255,255 ; jmpq 247c6 <_sk_lerp_u8_hsw_8bit+0x22>
+ DB 144 ; nop
+ DB 66,255 ; rex.X (bad)
DB 255 ; (bad)
- DB 255,78,255 ; decl -0x1(%rsi)
+ DB 255,92,255,255 ; lcall *-0x1(%rdi,%rdi,8)
+ DB 255,80,255 ; callq *-0x1(%rax)
DB 255 ; (bad)
- DB 255,138,255,255,255,130 ; decl -0x7d000001(%rdx)
+ DB 255,140,255,255,255,132,255 ; decl -0x7b0001(%rdi,%rdi,8)
DB 255 ; (bad)
DB 255 ; (bad)
+ DB 124,255 ; jl 24a29 <_sk_lerp_u8_hsw_8bit+0x285>
DB 255 ; (bad)
- DB 122,255 ; jp 24a69 <_sk_lerp_u8_hsw_8bit+0x289>
+ DB 255,112,255 ; pushq -0x1(%rax)
DB 255 ; (bad)
- DB 255,110,255 ; ljmp *-0x1(%rsi)
DB 255 ; (bad)
- DB 255,183,255,255,255,175 ; pushq -0x50000001(%rdi)
+ DB 185,255,255,255,177 ; mov $0xb1ffffff,%ecx
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,167,255,255,255,155 ; jmpq *-0x64000001(%rdi)
+ DB 255,169,255,255,255,157 ; ljmp *-0x62000001(%rcx)
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,228 ; jmpq *%rsp
+ DB 255,230 ; jmpq *%rsi
DB 255 ; (bad)
DB 255 ; (bad)
DB 255 ; (bad)
- DB 220,255 ; fdivr %st,%st(7)
+ DB 222,255 ; fdivrp %st,%st(7)
DB 255 ; (bad)
- DB 255,212 ; callq *%rsp
+ DB 255,214 ; callq *%rsi
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,200 ; dec %eax
+ DB 255,202 ; dec %edx
DB 255 ; (bad)
DB 255 ; (bad)
DB 255 ; .byte 0xff
@@ -35025,7 +35026,7 @@ _sk_move_dst_src_hsw_8bit LABEL PROC
PUBLIC _sk_black_color_hsw_8bit
_sk_black_color_hsw_8bit LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,5,197,119,0,0 ; vbroadcastss 0x77c5(%rip),%ymm0 # 2c278 <_sk_overlay_sse2_8bit+0x603>
+ DB 196,226,125,24,5,65,119,0,0 ; vbroadcastss 0x7741(%rip),%ymm0 # 2c1b4 <_sk_overlay_sse2_8bit+0x604>
DB 197,252,40,200 ; vmovaps %ymm0,%ymm1
DB 255,224 ; jmpq *%rax
@@ -35045,7 +35046,7 @@ _sk_clear_hsw_8bit LABEL PROC
PUBLIC _sk_srcatop_hsw_8bit
_sk_srcatop_hsw_8bit LABEL PROC
- DB 197,125,111,5,167,125,0,0 ; vmovdqa 0x7da7(%rip),%ymm8 # 2c880 <_sk_overlay_sse2_8bit+0xc0b>
+ DB 197,125,111,5,39,125,0,0 ; vmovdqa 0x7d27(%rip),%ymm8 # 2c7c0 <_sk_overlay_sse2_8bit+0xc10>
DB 196,194,101,0,224 ; vpshufb %ymm8,%ymm3,%ymm4
DB 196,194,109,0,232 ; vpshufb %ymm8,%ymm2,%ymm5
DB 196,98,125,48,208 ; vpmovzxbw %xmm0,%ymm10
@@ -35120,7 +35121,7 @@ _sk_srcatop_hsw_8bit LABEL PROC
PUBLIC _sk_dstatop_hsw_8bit
_sk_dstatop_hsw_8bit LABEL PROC
- DB 197,125,111,5,98,124,0,0 ; vmovdqa 0x7c62(%rip),%ymm8 # 2c8a0 <_sk_overlay_sse2_8bit+0xc2b>
+ DB 197,125,111,5,226,123,0,0 ; vmovdqa 0x7be2(%rip),%ymm8 # 2c7e0 <_sk_overlay_sse2_8bit+0xc30>
DB 196,194,117,0,224 ; vpshufb %ymm8,%ymm1,%ymm4
DB 196,194,125,0,232 ; vpshufb %ymm8,%ymm0,%ymm5
DB 196,98,125,48,210 ; vpmovzxbw %xmm2,%ymm10
@@ -35195,7 +35196,7 @@ _sk_dstatop_hsw_8bit LABEL PROC
PUBLIC _sk_srcin_hsw_8bit
_sk_srcin_hsw_8bit LABEL PROC
- DB 197,253,111,37,25,123,0,0 ; vmovdqa 0x7b19(%rip),%ymm4 # 2c8c0 <_sk_overlay_sse2_8bit+0xc4b>
+ DB 197,253,111,37,153,122,0,0 ; vmovdqa 0x7a99(%rip),%ymm4 # 2c800 <_sk_overlay_sse2_8bit+0xc50>
DB 196,226,101,0,236 ; vpshufb %ymm4,%ymm3,%ymm5
DB 196,226,109,0,228 ; vpshufb %ymm4,%ymm2,%ymm4
DB 196,226,125,48,240 ; vpmovzxbw %xmm0,%ymm6
@@ -35233,7 +35234,7 @@ _sk_srcin_hsw_8bit LABEL PROC
PUBLIC _sk_dstin_hsw_8bit
_sk_dstin_hsw_8bit LABEL PROC
- DB 197,253,111,37,143,122,0,0 ; vmovdqa 0x7a8f(%rip),%ymm4 # 2c8e0 <_sk_overlay_sse2_8bit+0xc6b>
+ DB 197,253,111,37,15,122,0,0 ; vmovdqa 0x7a0f(%rip),%ymm4 # 2c820 <_sk_overlay_sse2_8bit+0xc70>
DB 196,226,117,0,204 ; vpshufb %ymm4,%ymm1,%ymm1
DB 196,226,125,0,196 ; vpshufb %ymm4,%ymm0,%ymm0
DB 196,226,125,48,226 ; vpmovzxbw %xmm2,%ymm4
@@ -35271,7 +35272,7 @@ _sk_dstin_hsw_8bit LABEL PROC
PUBLIC _sk_srcout_hsw_8bit
_sk_srcout_hsw_8bit LABEL PROC
- DB 197,253,111,37,3,122,0,0 ; vmovdqa 0x7a03(%rip),%ymm4 # 2c900 <_sk_overlay_sse2_8bit+0xc8b>
+ DB 197,253,111,37,131,121,0,0 ; vmovdqa 0x7983(%rip),%ymm4 # 2c840 <_sk_overlay_sse2_8bit+0xc90>
DB 196,226,109,0,236 ; vpshufb %ymm4,%ymm2,%ymm5
DB 196,226,101,0,228 ; vpshufb %ymm4,%ymm3,%ymm4
DB 197,205,118,246 ; vpcmpeqd %ymm6,%ymm6,%ymm6
@@ -35312,7 +35313,7 @@ _sk_srcout_hsw_8bit LABEL PROC
PUBLIC _sk_dstout_hsw_8bit
_sk_dstout_hsw_8bit LABEL PROC
- DB 197,253,111,37,109,121,0,0 ; vmovdqa 0x796d(%rip),%ymm4 # 2c920 <_sk_overlay_sse2_8bit+0xcab>
+ DB 197,253,111,37,237,120,0,0 ; vmovdqa 0x78ed(%rip),%ymm4 # 2c860 <_sk_overlay_sse2_8bit+0xcb0>
DB 196,226,125,0,196 ; vpshufb %ymm4,%ymm0,%ymm0
DB 196,226,117,0,204 ; vpshufb %ymm4,%ymm1,%ymm1
DB 197,221,118,228 ; vpcmpeqd %ymm4,%ymm4,%ymm4
@@ -35353,7 +35354,7 @@ _sk_dstout_hsw_8bit LABEL PROC
PUBLIC _sk_srcover_hsw_8bit
_sk_srcover_hsw_8bit LABEL PROC
- DB 197,253,111,37,213,120,0,0 ; vmovdqa 0x78d5(%rip),%ymm4 # 2c940 <_sk_overlay_sse2_8bit+0xccb>
+ DB 197,253,111,37,85,120,0,0 ; vmovdqa 0x7855(%rip),%ymm4 # 2c880 <_sk_overlay_sse2_8bit+0xcd0>
DB 196,226,117,0,236 ; vpshufb %ymm4,%ymm1,%ymm5
DB 196,226,125,0,228 ; vpshufb %ymm4,%ymm0,%ymm4
DB 196,98,125,48,202 ; vpmovzxbw %xmm2,%ymm9
@@ -35395,7 +35396,7 @@ _sk_srcover_hsw_8bit LABEL PROC
PUBLIC _sk_dstover_hsw_8bit
_sk_dstover_hsw_8bit LABEL PROC
- DB 197,253,111,37,54,120,0,0 ; vmovdqa 0x7836(%rip),%ymm4 # 2c960 <_sk_overlay_sse2_8bit+0xceb>
+ DB 197,253,111,37,182,119,0,0 ; vmovdqa 0x77b6(%rip),%ymm4 # 2c8a0 <_sk_overlay_sse2_8bit+0xcf0>
DB 196,226,101,0,236 ; vpshufb %ymm4,%ymm3,%ymm5
DB 196,226,109,0,228 ; vpshufb %ymm4,%ymm2,%ymm4
DB 196,98,125,48,200 ; vpmovzxbw %xmm0,%ymm9
@@ -35475,7 +35476,7 @@ _sk_multiply_hsw_8bit LABEL PROC
DB 72,131,236,56 ; sub $0x38,%rsp
DB 197,253,111,243 ; vmovdqa %ymm3,%ymm6
DB 197,253,111,218 ; vmovdqa %ymm2,%ymm3
- DB 197,125,111,13,243,118,0,0 ; vmovdqa 0x76f3(%rip),%ymm9 # 2c980 <_sk_overlay_sse2_8bit+0xd0b>
+ DB 197,125,111,13,115,118,0,0 ; vmovdqa 0x7673(%rip),%ymm9 # 2c8c0 <_sk_overlay_sse2_8bit+0xd10>
DB 196,194,101,0,225 ; vpshufb %ymm9,%ymm3,%ymm4
DB 196,194,77,0,233 ; vpshufb %ymm9,%ymm6,%ymm5
DB 196,65,45,118,210 ; vpcmpeqd %ymm10,%ymm10,%ymm10
@@ -35616,7 +35617,7 @@ _sk_screen_hsw_8bit LABEL PROC
PUBLIC _sk_xor__hsw_8bit
_sk_xor__hsw_8bit LABEL PROC
- DB 197,125,111,13,127,116,0,0 ; vmovdqa 0x747f(%rip),%ymm9 # 2c9a0 <_sk_overlay_sse2_8bit+0xd2b>
+ DB 197,125,111,13,255,115,0,0 ; vmovdqa 0x73ff(%rip),%ymm9 # 2c8e0 <_sk_overlay_sse2_8bit+0xd30>
DB 196,194,109,0,225 ; vpshufb %ymm9,%ymm2,%ymm4
DB 196,194,101,0,249 ; vpshufb %ymm9,%ymm3,%ymm7
DB 196,65,37,118,219 ; vpcmpeqd %ymm11,%ymm11,%ymm11
@@ -35700,7 +35701,7 @@ _sk_plus__hsw_8bit LABEL PROC
PUBLIC _sk_darken_hsw_8bit
_sk_darken_hsw_8bit LABEL PROC
- DB 197,125,111,5,33,115,0,0 ; vmovdqa 0x7321(%rip),%ymm8 # 2c9c0 <_sk_overlay_sse2_8bit+0xd4b>
+ DB 197,125,111,5,161,114,0,0 ; vmovdqa 0x72a1(%rip),%ymm8 # 2c900 <_sk_overlay_sse2_8bit+0xd50>
DB 196,194,101,0,224 ; vpshufb %ymm8,%ymm3,%ymm4
DB 196,194,109,0,240 ; vpshufb %ymm8,%ymm2,%ymm6
DB 196,98,125,48,208 ; vpmovzxbw %xmm0,%ymm10
@@ -35773,7 +35774,7 @@ _sk_darken_hsw_8bit LABEL PROC
DB 197,253,248,246 ; vpsubb %ymm6,%ymm0,%ymm6
DB 197,245,248,205 ; vpsubb %ymm5,%ymm1,%ymm1
DB 197,253,248,196 ; vpsubb %ymm4,%ymm0,%ymm0
- DB 196,226,125,88,37,110,106,0,0 ; vpbroadcastd 0x6a6e(%rip),%ymm4 # 2c27c <_sk_overlay_sse2_8bit+0x607>
+ DB 196,226,125,88,37,234,105,0,0 ; vpbroadcastd 0x69ea(%rip),%ymm4 # 2c1b8 <_sk_overlay_sse2_8bit+0x608>
DB 196,227,125,76,198,64 ; vpblendvb %ymm4,%ymm6,%ymm0,%ymm0
DB 196,227,117,76,207,64 ; vpblendvb %ymm4,%ymm7,%ymm1,%ymm1
DB 72,173 ; lods %ds:(%rsi),%rax
@@ -35781,7 +35782,7 @@ _sk_darken_hsw_8bit LABEL PROC
PUBLIC _sk_lighten_hsw_8bit
_sk_lighten_hsw_8bit LABEL PROC
- DB 197,125,111,5,186,113,0,0 ; vmovdqa 0x71ba(%rip),%ymm8 # 2c9e0 <_sk_overlay_sse2_8bit+0xd6b>
+ DB 197,125,111,5,58,113,0,0 ; vmovdqa 0x713a(%rip),%ymm8 # 2c920 <_sk_overlay_sse2_8bit+0xd70>
DB 196,194,101,0,224 ; vpshufb %ymm8,%ymm3,%ymm4
DB 196,194,109,0,240 ; vpshufb %ymm8,%ymm2,%ymm6
DB 196,98,125,48,208 ; vpmovzxbw %xmm0,%ymm10
@@ -35854,7 +35855,7 @@ _sk_lighten_hsw_8bit LABEL PROC
DB 197,253,248,246 ; vpsubb %ymm6,%ymm0,%ymm6
DB 197,245,248,205 ; vpsubb %ymm5,%ymm1,%ymm1
DB 197,253,248,196 ; vpsubb %ymm4,%ymm0,%ymm0
- DB 196,226,125,88,37,231,104,0,0 ; vpbroadcastd 0x68e7(%rip),%ymm4 # 2c27c <_sk_overlay_sse2_8bit+0x607>
+ DB 196,226,125,88,37,99,104,0,0 ; vpbroadcastd 0x6863(%rip),%ymm4 # 2c1b8 <_sk_overlay_sse2_8bit+0x608>
DB 196,227,125,76,198,64 ; vpblendvb %ymm4,%ymm6,%ymm0,%ymm0
DB 196,227,117,76,207,64 ; vpblendvb %ymm4,%ymm7,%ymm1,%ymm1
DB 72,173 ; lods %ds:(%rsi),%rax
@@ -35892,7 +35893,7 @@ _sk_exclusion_hsw_8bit LABEL PROC
DB 196,227,77,56,252,1 ; vinserti128 $0x1,%xmm4,%ymm6,%ymm7
DB 196,227,77,70,228,49 ; vperm2i128 $0x31,%ymm4,%ymm6,%ymm4
DB 197,197,103,228 ; vpackuswb %ymm4,%ymm7,%ymm4
- DB 197,253,111,53,188,111,0,0 ; vmovdqa 0x6fbc(%rip),%ymm6 # 2ca00 <_sk_overlay_sse2_8bit+0xd8b>
+ DB 197,253,111,53,60,111,0,0 ; vmovdqa 0x6f3c(%rip),%ymm6 # 2c940 <_sk_overlay_sse2_8bit+0xd90>
DB 197,221,219,254 ; vpand %ymm6,%ymm4,%ymm7
DB 197,213,219,246 ; vpand %ymm6,%ymm5,%ymm6
DB 197,237,252,192 ; vpaddb %ymm0,%ymm2,%ymm0
@@ -35906,7 +35907,7 @@ _sk_exclusion_hsw_8bit LABEL PROC
PUBLIC _sk_difference_hsw_8bit
_sk_difference_hsw_8bit LABEL PROC
- DB 197,125,111,5,176,111,0,0 ; vmovdqa 0x6fb0(%rip),%ymm8 # 2ca20 <_sk_overlay_sse2_8bit+0xdab>
+ DB 197,125,111,5,48,111,0,0 ; vmovdqa 0x6f30(%rip),%ymm8 # 2c960 <_sk_overlay_sse2_8bit+0xdb0>
DB 196,194,101,0,224 ; vpshufb %ymm8,%ymm3,%ymm4
DB 196,194,109,0,240 ; vpshufb %ymm8,%ymm2,%ymm6
DB 196,98,125,48,208 ; vpmovzxbw %xmm0,%ymm10
@@ -35973,7 +35974,7 @@ _sk_difference_hsw_8bit LABEL PROC
DB 197,197,103,237 ; vpackuswb %ymm5,%ymm7,%ymm5
DB 197,181,218,228 ; vpminub %ymm4,%ymm9,%ymm4
DB 197,165,218,237 ; vpminub %ymm5,%ymm11,%ymm5
- DB 197,253,111,53,122,110,0,0 ; vmovdqa 0x6e7a(%rip),%ymm6 # 2ca40 <_sk_overlay_sse2_8bit+0xdcb>
+ DB 197,253,111,53,250,109,0,0 ; vmovdqa 0x6dfa(%rip),%ymm6 # 2c980 <_sk_overlay_sse2_8bit+0xdd0>
DB 197,213,219,254 ; vpand %ymm6,%ymm5,%ymm7
DB 197,221,219,246 ; vpand %ymm6,%ymm4,%ymm6
DB 197,237,252,192 ; vpaddb %ymm0,%ymm2,%ymm0
@@ -35987,87 +35988,86 @@ _sk_difference_hsw_8bit LABEL PROC
PUBLIC _sk_hardlight_hsw_8bit
_sk_hardlight_hsw_8bit LABEL PROC
- DB 72,129,236,56,2,0,0 ; sub $0x238,%rsp
- DB 197,252,17,28,36 ; vmovups %ymm3,(%rsp)
- DB 196,226,125,48,248 ; vpmovzxbw %xmm0,%ymm7
- DB 196,227,125,57,195,1 ; vextracti128 $0x1,%ymm0,%xmm3
- DB 196,226,125,48,243 ; vpmovzxbw %xmm3,%ymm6
- DB 196,98,125,48,217 ; vpmovzxbw %xmm1,%ymm11
- DB 197,126,127,156,36,0,1,0,0 ; vmovdqu %ymm11,0x100(%rsp)
- DB 196,227,125,57,203,1 ; vextracti128 $0x1,%ymm1,%xmm3
- DB 196,98,125,48,195 ; vpmovzxbw %xmm3,%ymm8
- DB 197,126,127,132,36,64,1,0,0 ; vmovdqu %ymm8,0x140(%rsp)
- DB 197,253,111,29,48,110,0,0 ; vmovdqa 0x6e30(%rip),%ymm3 # 2ca60 <_sk_overlay_sse2_8bit+0xdeb>
- DB 196,226,125,0,227 ; vpshufb %ymm3,%ymm0,%ymm4
- DB 196,226,117,0,203 ; vpshufb %ymm3,%ymm1,%ymm1
+ DB 72,129,236,24,2,0,0 ; sub $0x218,%rsp
DB 197,125,111,251 ; vmovdqa %ymm3,%ymm15
+ DB 196,226,125,48,248 ; vpmovzxbw %xmm0,%ymm7
+ DB 196,227,125,57,196,1 ; vextracti128 $0x1,%ymm0,%xmm4
+ DB 196,226,125,48,244 ; vpmovzxbw %xmm4,%ymm6
+ DB 196,226,125,48,217 ; vpmovzxbw %xmm1,%ymm3
+ DB 196,227,125,57,204,1 ; vextracti128 $0x1,%ymm1,%xmm4
+ DB 196,98,125,48,196 ; vpmovzxbw %xmm4,%ymm8
+ DB 197,126,127,132,36,224,0,0,0 ; vmovdqu %ymm8,0xe0(%rsp)
+ DB 197,253,111,45,186,109,0,0 ; vmovdqa 0x6dba(%rip),%ymm5 # 2c9a0 <_sk_overlay_sse2_8bit+0xdf0>
+ DB 196,226,125,0,229 ; vpshufb %ymm5,%ymm0,%ymm4
+ DB 196,226,117,0,205 ; vpshufb %ymm5,%ymm1,%ymm1
DB 196,227,125,57,200,1 ; vextracti128 $0x1,%ymm1,%xmm0
- DB 196,98,125,48,232 ; vpmovzxbw %xmm0,%ymm13
+ DB 196,98,125,48,240 ; vpmovzxbw %xmm0,%ymm14
DB 196,226,125,48,233 ; vpmovzxbw %xmm1,%ymm5
- DB 196,227,125,57,227,1 ; vextracti128 $0x1,%ymm4,%xmm3
- DB 196,98,125,48,203 ; vpmovzxbw %xmm3,%ymm9
+ DB 196,227,125,57,224,1 ; vextracti128 $0x1,%ymm4,%xmm0
+ DB 196,98,125,48,200 ; vpmovzxbw %xmm0,%ymm9
DB 196,98,125,48,212 ; vpmovzxbw %xmm4,%ymm10
DB 197,197,253,199 ; vpaddw %ymm7,%ymm7,%ymm0
- DB 197,205,253,222 ; vpaddw %ymm6,%ymm6,%ymm3
- DB 196,65,37,253,227 ; vpaddw %ymm11,%ymm11,%ymm12
+ DB 197,205,253,206 ; vpaddw %ymm6,%ymm6,%ymm1
+ DB 197,101,253,227 ; vpaddw %ymm3,%ymm3,%ymm12
DB 196,65,61,253,216 ; vpaddw %ymm8,%ymm8,%ymm11
- DB 196,66,37,58,245 ; vpminuw %ymm13,%ymm11,%ymm14
- DB 196,193,37,117,206 ; vpcmpeqw %ymm14,%ymm11,%ymm1
- DB 197,254,127,140,36,224,1,0,0 ; vmovdqu %ymm1,0x1e0(%rsp)
- DB 196,98,29,58,245 ; vpminuw %ymm5,%ymm12,%ymm14
- DB 196,193,29,117,206 ; vpcmpeqw %ymm14,%ymm12,%ymm1
- DB 197,254,127,140,36,192,1,0,0 ; vmovdqu %ymm1,0x1c0(%rsp)
- DB 196,66,101,58,241 ; vpminuw %ymm9,%ymm3,%ymm14
- DB 196,193,101,117,206 ; vpcmpeqw %ymm14,%ymm3,%ymm1
- DB 197,254,127,140,36,128,1,0,0 ; vmovdqu %ymm1,0x180(%rsp)
- DB 196,194,125,58,218 ; vpminuw %ymm10,%ymm0,%ymm3
- DB 197,125,117,243 ; vpcmpeqw %ymm3,%ymm0,%ymm14
+ DB 196,66,37,58,238 ; vpminuw %ymm14,%ymm11,%ymm13
+ DB 196,193,37,117,229 ; vpcmpeqw %ymm13,%ymm11,%ymm4
+ DB 197,254,127,164,36,160,1,0,0 ; vmovdqu %ymm4,0x1a0(%rsp)
+ DB 196,98,29,58,237 ; vpminuw %ymm5,%ymm12,%ymm13
+ DB 196,193,29,117,229 ; vpcmpeqw %ymm13,%ymm12,%ymm4
+ DB 197,254,127,164,36,128,1,0,0 ; vmovdqu %ymm4,0x180(%rsp)
+ DB 196,66,117,58,233 ; vpminuw %ymm9,%ymm1,%ymm13
+ DB 196,193,117,117,205 ; vpcmpeqw %ymm13,%ymm1,%ymm1
+ DB 197,254,127,140,36,64,1,0,0 ; vmovdqu %ymm1,0x140(%rsp)
+ DB 196,194,125,58,202 ; vpminuw %ymm10,%ymm0,%ymm1
+ DB 197,253,117,193 ; vpcmpeqw %ymm1,%ymm0,%ymm0
+ DB 197,254,127,132,36,0,1,0,0 ; vmovdqu %ymm0,0x100(%rsp)
DB 197,253,111,226 ; vmovdqa %ymm2,%ymm4
- DB 196,65,125,111,231 ; vmovdqa %ymm15,%ymm12
- DB 196,194,93,0,220 ; vpshufb %ymm12,%ymm4,%ymm3
- DB 196,226,125,48,211 ; vpmovzxbw %xmm3,%ymm2
- DB 196,226,125,121,5,178,109,0,0 ; vpbroadcastw 0x6db2(%rip),%ymm0 # 2ca80 <_sk_overlay_sse2_8bit+0xe0b>
- DB 197,109,239,248 ; vpxor %ymm0,%ymm2,%ymm15
- DB 197,133,213,207 ; vpmullw %ymm7,%ymm15,%ymm1
- DB 197,254,127,140,36,160,1,0,0 ; vmovdqu %ymm1,0x1a0(%rsp)
+ DB 197,125,111,37,40,109,0,0 ; vmovdqa 0x6d28(%rip),%ymm12 # 2c9a0 <_sk_overlay_sse2_8bit+0xdf0>
+ DB 196,66,93,0,196 ; vpshufb %ymm12,%ymm4,%ymm8
+ DB 196,194,125,48,208 ; vpmovzxbw %xmm8,%ymm2
+ DB 196,226,125,121,5,53,109,0,0 ; vpbroadcastw 0x6d35(%rip),%ymm0 # 2c9c0 <_sk_overlay_sse2_8bit+0xe10>
+ DB 197,109,239,232 ; vpxor %ymm0,%ymm2,%ymm13
+ DB 197,149,213,207 ; vpmullw %ymm7,%ymm13,%ymm1
+ DB 197,254,127,140,36,96,1,0,0 ; vmovdqu %ymm1,0x160(%rsp)
DB 196,226,125,48,204 ; vpmovzxbw %xmm4,%ymm1
- DB 197,254,127,164,36,0,2,0,0 ; vmovdqu %ymm4,0x200(%rsp)
- DB 197,45,239,248 ; vpxor %ymm0,%ymm10,%ymm15
- DB 197,5,213,193 ; vpmullw %ymm1,%ymm15,%ymm8
- DB 197,126,127,132,36,96,1,0,0 ; vmovdqu %ymm8,0x160(%rsp)
- DB 197,117,213,199 ; vpmullw %ymm7,%ymm1,%ymm8
- DB 197,126,127,132,36,32,1,0,0 ; vmovdqu %ymm8,0x120(%rsp)
+ DB 197,254,127,164,36,224,1,0,0 ; vmovdqu %ymm4,0x1e0(%rsp)
+ DB 197,45,239,232 ; vpxor %ymm0,%ymm10,%ymm13
+ DB 197,21,213,217 ; vpmullw %ymm1,%ymm13,%ymm11
+ DB 197,126,127,156,36,32,1,0,0 ; vmovdqu %ymm11,0x120(%rsp)
+ DB 197,117,213,223 ; vpmullw %ymm7,%ymm1,%ymm11
+ DB 197,126,127,156,36,192,0,0,0 ; vmovdqu %ymm11,0xc0(%rsp)
DB 197,237,249,201 ; vpsubw %ymm1,%ymm2,%ymm1
- DB 197,254,127,76,36,64 ; vmovdqu %ymm1,0x40(%rsp)
+ DB 197,254,127,12,36 ; vmovdqu %ymm1,(%rsp)
DB 196,193,109,213,202 ; vpmullw %ymm10,%ymm2,%ymm1
- DB 197,254,127,140,36,160,0,0,0 ; vmovdqu %ymm1,0xa0(%rsp)
+ DB 197,254,127,76,36,96 ; vmovdqu %ymm1,0x60(%rsp)
DB 197,45,249,223 ; vpsubw %ymm7,%ymm10,%ymm11
DB 196,227,125,57,226,1 ; vextracti128 $0x1,%ymm4,%xmm2
DB 196,226,125,48,210 ; vpmovzxbw %xmm2,%ymm2
- DB 196,227,125,57,219,1 ; vextracti128 $0x1,%ymm3,%xmm3
- DB 196,226,125,48,219 ; vpmovzxbw %xmm3,%ymm3
- DB 197,101,239,208 ; vpxor %ymm0,%ymm3,%ymm10
- DB 197,173,213,206 ; vpmullw %ymm6,%ymm10,%ymm1
- DB 197,254,127,140,36,224,0,0,0 ; vmovdqu %ymm1,0xe0(%rsp)
+ DB 196,99,125,57,193,1 ; vextracti128 $0x1,%ymm8,%xmm1
+ DB 196,226,125,48,201 ; vpmovzxbw %xmm1,%ymm1
+ DB 197,117,239,208 ; vpxor %ymm0,%ymm1,%ymm10
+ DB 197,173,213,230 ; vpmullw %ymm6,%ymm10,%ymm4
+ DB 197,254,127,164,36,160,0,0,0 ; vmovdqu %ymm4,0xa0(%rsp)
DB 197,53,239,208 ; vpxor %ymm0,%ymm9,%ymm10
- DB 197,173,213,202 ; vpmullw %ymm2,%ymm10,%ymm1
- DB 197,254,127,140,36,192,0,0,0 ; vmovdqu %ymm1,0xc0(%rsp)
- DB 197,237,213,206 ; vpmullw %ymm6,%ymm2,%ymm1
- DB 197,254,127,76,36,32 ; vmovdqu %ymm1,0x20(%rsp)
- DB 197,229,249,226 ; vpsubw %ymm2,%ymm3,%ymm4
- DB 196,65,101,213,193 ; vpmullw %ymm9,%ymm3,%ymm8
+ DB 197,173,213,226 ; vpmullw %ymm2,%ymm10,%ymm4
+ DB 197,254,127,164,36,128,0,0,0 ; vmovdqu %ymm4,0x80(%rsp)
+ DB 197,109,213,238 ; vpmullw %ymm6,%ymm2,%ymm13
+ DB 197,245,249,226 ; vpsubw %ymm2,%ymm1,%ymm4
+ DB 196,65,117,213,193 ; vpmullw %ymm9,%ymm1,%ymm8
DB 197,181,249,246 ; vpsubw %ymm6,%ymm9,%ymm6
- DB 197,254,111,60,36 ; vmovdqu (%rsp),%ymm7
+ DB 197,125,127,255 ; vmovdqa %ymm15,%ymm7
+ DB 197,254,127,188,36,192,1,0,0 ; vmovdqu %ymm7,0x1c0(%rsp)
DB 196,66,69,0,204 ; vpshufb %ymm12,%ymm7,%ymm9
DB 196,194,125,48,209 ; vpmovzxbw %xmm9,%ymm2
DB 197,109,239,248 ; vpxor %ymm0,%ymm2,%ymm15
- DB 197,126,111,164,36,0,1,0,0 ; vmovdqu 0x100(%rsp),%ymm12
+ DB 197,125,111,227 ; vmovdqa %ymm3,%ymm12
DB 196,193,5,213,204 ; vpmullw %ymm12,%ymm15,%ymm1
- DB 197,254,127,140,36,128,0,0,0 ; vmovdqu %ymm1,0x80(%rsp)
+ DB 197,254,127,76,36,64 ; vmovdqu %ymm1,0x40(%rsp)
DB 196,226,125,48,207 ; vpmovzxbw %xmm7,%ymm1
DB 197,85,239,248 ; vpxor %ymm0,%ymm5,%ymm15
DB 197,133,213,217 ; vpmullw %ymm1,%ymm15,%ymm3
- DB 197,254,127,92,36,96 ; vmovdqu %ymm3,0x60(%rsp)
+ DB 197,254,127,92,36,32 ; vmovdqu %ymm3,0x20(%rsp)
DB 196,65,117,213,212 ; vpmullw %ymm12,%ymm1,%ymm10
DB 197,237,249,217 ; vpsubw %ymm1,%ymm2,%ymm3
DB 197,237,213,213 ; vpmullw %ymm5,%ymm2,%ymm2
@@ -36077,56 +36077,56 @@ _sk_hardlight_hsw_8bit LABEL PROC
DB 196,99,125,57,207,1 ; vextracti128 $0x1,%ymm9,%xmm7
DB 196,226,125,48,255 ; vpmovzxbw %xmm7,%ymm7
DB 197,69,239,200 ; vpxor %ymm0,%ymm7,%ymm9
- DB 197,254,111,140,36,64,1,0,0 ; vmovdqu 0x140(%rsp),%ymm1
+ DB 197,254,111,140,36,224,0,0,0 ; vmovdqu 0xe0(%rsp),%ymm1
DB 197,53,213,225 ; vpmullw %ymm1,%ymm9,%ymm12
- DB 197,149,239,192 ; vpxor %ymm0,%ymm13,%ymm0
+ DB 197,141,239,192 ; vpxor %ymm0,%ymm14,%ymm0
DB 196,65,125,213,207 ; vpmullw %ymm15,%ymm0,%ymm9
DB 197,133,213,193 ; vpmullw %ymm1,%ymm15,%ymm0
DB 196,65,69,249,255 ; vpsubw %ymm15,%ymm7,%ymm15
- DB 196,193,69,213,253 ; vpmullw %ymm13,%ymm7,%ymm7
- DB 197,21,249,233 ; vpsubw %ymm1,%ymm13,%ymm13
- DB 196,65,5,213,237 ; vpmullw %ymm13,%ymm15,%ymm13
+ DB 196,193,69,213,254 ; vpmullw %ymm14,%ymm7,%ymm7
+ DB 197,13,249,241 ; vpsubw %ymm1,%ymm14,%ymm14
+ DB 196,65,5,213,246 ; vpmullw %ymm14,%ymm15,%ymm14
DB 197,229,213,205 ; vpmullw %ymm5,%ymm3,%ymm1
DB 197,221,213,230 ; vpmullw %ymm6,%ymm4,%ymm4
- DB 197,165,213,108,36,64 ; vpmullw 0x40(%rsp),%ymm11,%ymm5
- DB 196,193,21,253,245 ; vpaddw %ymm13,%ymm13,%ymm6
+ DB 197,165,213,44,36 ; vpmullw (%rsp),%ymm11,%ymm5
+ DB 196,193,13,253,246 ; vpaddw %ymm14,%ymm14,%ymm6
DB 197,197,249,246 ; vpsubw %ymm6,%ymm7,%ymm6
DB 197,245,253,201 ; vpaddw %ymm1,%ymm1,%ymm1
DB 197,237,249,201 ; vpsubw %ymm1,%ymm2,%ymm1
DB 197,221,253,212 ; vpaddw %ymm4,%ymm4,%ymm2
DB 197,189,249,210 ; vpsubw %ymm2,%ymm8,%ymm2
DB 197,213,253,221 ; vpaddw %ymm5,%ymm5,%ymm3
- DB 197,254,111,164,36,160,0,0,0 ; vmovdqu 0xa0(%rsp),%ymm4
+ DB 197,254,111,100,36,96 ; vmovdqu 0x60(%rsp),%ymm4
DB 197,221,249,219 ; vpsubw %ymm3,%ymm4,%ymm3
- DB 197,254,111,164,36,32,1,0,0 ; vmovdqu 0x120(%rsp),%ymm4
+ DB 197,254,111,164,36,192,0,0,0 ; vmovdqu 0xc0(%rsp),%ymm4
DB 197,221,253,228 ; vpaddw %ymm4,%ymm4,%ymm4
- DB 197,141,223,219 ; vpandn %ymm3,%ymm14,%ymm3
- DB 196,193,93,219,230 ; vpand %ymm14,%ymm4,%ymm4
+ DB 197,254,111,172,36,0,1,0,0 ; vmovdqu 0x100(%rsp),%ymm5
+ DB 197,213,223,219 ; vpandn %ymm3,%ymm5,%ymm3
+ DB 197,221,219,229 ; vpand %ymm5,%ymm4,%ymm4
DB 197,221,235,219 ; vpor %ymm3,%ymm4,%ymm3
- DB 197,254,111,100,36,32 ; vmovdqu 0x20(%rsp),%ymm4
- DB 197,221,253,228 ; vpaddw %ymm4,%ymm4,%ymm4
- DB 197,254,111,172,36,128,1,0,0 ; vmovdqu 0x180(%rsp),%ymm5
+ DB 196,193,21,253,229 ; vpaddw %ymm13,%ymm13,%ymm4
+ DB 197,254,111,172,36,64,1,0,0 ; vmovdqu 0x140(%rsp),%ymm5
DB 197,213,223,210 ; vpandn %ymm2,%ymm5,%ymm2
DB 197,221,219,229 ; vpand %ymm5,%ymm4,%ymm4
DB 197,221,235,210 ; vpor %ymm2,%ymm4,%ymm2
DB 196,193,45,253,226 ; vpaddw %ymm10,%ymm10,%ymm4
- DB 197,254,111,172,36,192,1,0,0 ; vmovdqu 0x1c0(%rsp),%ymm5
+ DB 197,254,111,172,36,128,1,0,0 ; vmovdqu 0x180(%rsp),%ymm5
DB 197,213,223,201 ; vpandn %ymm1,%ymm5,%ymm1
DB 197,221,219,229 ; vpand %ymm5,%ymm4,%ymm4
DB 197,221,235,201 ; vpor %ymm1,%ymm4,%ymm1
DB 197,253,253,192 ; vpaddw %ymm0,%ymm0,%ymm0
- DB 197,254,111,172,36,224,1,0,0 ; vmovdqu 0x1e0(%rsp),%ymm5
+ DB 197,254,111,172,36,160,1,0,0 ; vmovdqu 0x1a0(%rsp),%ymm5
DB 197,213,223,230 ; vpandn %ymm6,%ymm5,%ymm4
DB 197,253,219,197 ; vpand %ymm5,%ymm0,%ymm0
DB 197,253,235,196 ; vpor %ymm4,%ymm0,%ymm0
- DB 197,254,111,164,36,96,1,0,0 ; vmovdqu 0x160(%rsp),%ymm4
- DB 197,221,253,164,36,160,1,0,0 ; vpaddw 0x1a0(%rsp),%ymm4,%ymm4
- DB 197,254,111,172,36,192,0,0,0 ; vmovdqu 0xc0(%rsp),%ymm5
- DB 197,213,253,172,36,224,0,0,0 ; vpaddw 0xe0(%rsp),%ymm5,%ymm5
- DB 197,254,111,116,36,96 ; vmovdqu 0x60(%rsp),%ymm6
- DB 197,205,253,180,36,128,0,0,0 ; vpaddw 0x80(%rsp),%ymm6,%ymm6
+ DB 197,254,111,164,36,32,1,0,0 ; vmovdqu 0x120(%rsp),%ymm4
+ DB 197,221,253,164,36,96,1,0,0 ; vpaddw 0x160(%rsp),%ymm4,%ymm4
+ DB 197,254,111,172,36,128,0,0,0 ; vmovdqu 0x80(%rsp),%ymm5
+ DB 197,213,253,172,36,160,0,0,0 ; vpaddw 0xa0(%rsp),%ymm5,%ymm5
+ DB 197,254,111,116,36,32 ; vmovdqu 0x20(%rsp),%ymm6
+ DB 197,205,253,116,36,64 ; vpaddw 0x40(%rsp),%ymm6,%ymm6
DB 196,193,53,253,252 ; vpaddw %ymm12,%ymm9,%ymm7
- DB 196,98,125,121,5,145,107,0,0 ; vpbroadcastw 0x6b91(%rip),%ymm8 # 2ca82 <_sk_overlay_sse2_8bit+0xe0d>
+ DB 196,98,125,121,5,34,107,0,0 ; vpbroadcastw 0x6b22(%rip),%ymm8 # 2c9c2 <_sk_overlay_sse2_8bit+0xe12>
DB 196,193,93,253,224 ; vpaddw %ymm8,%ymm4,%ymm4
DB 197,229,253,220 ; vpaddw %ymm4,%ymm3,%ymm3
DB 196,193,85,253,224 ; vpaddw %ymm8,%ymm5,%ymm4
@@ -36135,7 +36135,7 @@ _sk_hardlight_hsw_8bit LABEL PROC
DB 197,245,253,204 ; vpaddw %ymm4,%ymm1,%ymm1
DB 196,193,69,253,224 ; vpaddw %ymm8,%ymm7,%ymm4
DB 197,253,253,196 ; vpaddw %ymm4,%ymm0,%ymm0
- DB 196,226,125,121,37,102,107,0,0 ; vpbroadcastw 0x6b66(%rip),%ymm4 # 2ca84 <_sk_overlay_sse2_8bit+0xe0f>
+ DB 196,226,125,121,37,247,106,0,0 ; vpbroadcastw 0x6af7(%rip),%ymm4 # 2c9c4 <_sk_overlay_sse2_8bit+0xe14>
DB 197,253,228,196 ; vpmulhuw %ymm4,%ymm0,%ymm0
DB 197,245,228,204 ; vpmulhuw %ymm4,%ymm1,%ymm1
DB 197,237,228,212 ; vpmulhuw %ymm4,%ymm2,%ymm2
@@ -36151,16 +36151,16 @@ _sk_hardlight_hsw_8bit LABEL PROC
DB 196,227,117,70,203,49 ; vperm2i128 $0x31,%ymm3,%ymm1,%ymm1
DB 197,237,103,201 ; vpackuswb %ymm1,%ymm2,%ymm1
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 197,252,16,148,36,0,2,0,0 ; vmovups 0x200(%rsp),%ymm2
- DB 197,252,16,28,36 ; vmovups (%rsp),%ymm3
- DB 72,129,196,56,2,0,0 ; add $0x238,%rsp
+ DB 197,252,16,148,36,224,1,0,0 ; vmovups 0x1e0(%rsp),%ymm2
+ DB 197,252,16,156,36,192,1,0,0 ; vmovups 0x1c0(%rsp),%ymm3
+ DB 72,129,196,24,2,0,0 ; add $0x218,%rsp
DB 255,224 ; jmpq *%rax
PUBLIC _sk_overlay_hsw_8bit
_sk_overlay_hsw_8bit LABEL PROC
DB 72,129,236,24,2,0,0 ; sub $0x218,%rsp
DB 197,252,17,140,36,192,1,0,0 ; vmovups %ymm1,0x1c0(%rsp)
- DB 197,253,111,45,13,107,0,0 ; vmovdqa 0x6b0d(%rip),%ymm5 # 2caa0 <_sk_overlay_sse2_8bit+0xe2b>
+ DB 197,253,111,45,154,106,0,0 ; vmovdqa 0x6a9a(%rip),%ymm5 # 2c9e0 <_sk_overlay_sse2_8bit+0xe30>
DB 197,253,111,226 ; vmovdqa %ymm2,%ymm4
DB 196,227,125,57,225,1 ; vextracti128 $0x1,%ymm4,%xmm1
DB 196,98,125,48,193 ; vpmovzxbw %xmm1,%ymm8
@@ -36195,7 +36195,7 @@ _sk_overlay_hsw_8bit LABEL PROC
DB 197,93,117,251 ; vpcmpeqw %ymm3,%ymm4,%ymm15
DB 197,253,111,216 ; vmovdqa %ymm0,%ymm3
DB 196,226,125,48,227 ; vpmovzxbw %xmm3,%ymm4
- DB 196,226,125,121,5,103,106,0,0 ; vpbroadcastw 0x6a67(%rip),%ymm0 # 2cac0 <_sk_overlay_sse2_8bit+0xe4b>
+ DB 196,226,125,121,5,244,105,0,0 ; vpbroadcastw 0x69f4(%rip),%ymm0 # 2ca00 <_sk_overlay_sse2_8bit+0xe50>
DB 197,117,239,232 ; vpxor %ymm0,%ymm1,%ymm13
DB 197,21,213,212 ; vpmullw %ymm4,%ymm13,%ymm10
DB 197,126,127,148,36,64,1,0,0 ; vmovdqu %ymm10,0x140(%rsp)
@@ -36296,7 +36296,7 @@ _sk_overlay_hsw_8bit LABEL PROC
DB 197,254,111,116,36,64 ; vmovdqu 0x40(%rsp),%ymm6
DB 197,205,253,116,36,96 ; vpaddw 0x60(%rsp),%ymm6,%ymm6
DB 196,193,29,253,253 ; vpaddw %ymm13,%ymm12,%ymm7
- DB 196,98,125,121,5,90,104,0,0 ; vpbroadcastw 0x685a(%rip),%ymm8 # 2cac2 <_sk_overlay_sse2_8bit+0xe4d>
+ DB 196,98,125,121,5,231,103,0,0 ; vpbroadcastw 0x67e7(%rip),%ymm8 # 2ca02 <_sk_overlay_sse2_8bit+0xe52>
DB 196,193,109,253,208 ; vpaddw %ymm8,%ymm2,%ymm2
DB 197,229,253,210 ; vpaddw %ymm2,%ymm3,%ymm2
DB 196,193,85,253,216 ; vpaddw %ymm8,%ymm5,%ymm3
@@ -36305,7 +36305,7 @@ _sk_overlay_hsw_8bit LABEL PROC
DB 197,245,253,204 ; vpaddw %ymm4,%ymm1,%ymm1
DB 196,193,69,253,224 ; vpaddw %ymm8,%ymm7,%ymm4
DB 197,253,253,196 ; vpaddw %ymm4,%ymm0,%ymm0
- DB 196,226,125,121,37,47,104,0,0 ; vpbroadcastw 0x682f(%rip),%ymm4 # 2cac4 <_sk_overlay_sse2_8bit+0xe4f>
+ DB 196,226,125,121,37,188,103,0,0 ; vpbroadcastw 0x67bc(%rip),%ymm4 # 2ca04 <_sk_overlay_sse2_8bit+0xe54>
DB 197,253,228,196 ; vpmulhuw %ymm4,%ymm0,%ymm0
DB 197,245,228,204 ; vpmulhuw %ymm4,%ymm1,%ymm1
DB 197,229,228,220 ; vpmulhuw %ymm4,%ymm3,%ymm3
@@ -36327,6 +36327,7 @@ _sk_overlay_hsw_8bit LABEL PROC
DB 255,224 ; jmpq *%rax
DB 144 ; nop
DB 144 ; nop
+ DB 144 ; nop
PUBLIC _sk_start_pipeline_sse41_8bit
_sk_start_pipeline_sse41_8bit LABEL PROC
@@ -36339,7 +36340,7 @@ _sk_start_pipeline_sse41_8bit LABEL PROC
DB 86 ; push %rsi
DB 87 ; push %rdi
DB 83 ; push %rbx
- DB 72,129,236,216,0,0,0 ; sub $0xd8,%rsp
+ DB 72,129,236,200,0,0,0 ; sub $0xc8,%rsp
DB 68,15,41,125,176 ; movaps %xmm15,-0x50(%rbp)
DB 68,15,41,117,160 ; movaps %xmm14,-0x60(%rbp)
DB 68,15,41,109,144 ; movaps %xmm13,-0x70(%rbp)
@@ -36350,45 +36351,42 @@ _sk_start_pipeline_sse41_8bit LABEL PROC
DB 68,15,41,133,64,255,255,255 ; movaps %xmm8,-0xc0(%rbp)
DB 15,41,189,48,255,255,255 ; movaps %xmm7,-0xd0(%rbp)
DB 15,41,181,32,255,255,255 ; movaps %xmm6,-0xe0(%rbp)
- DB 76,137,195 ; mov %r8,%rbx
- DB 73,137,215 ; mov %rdx,%r15
+ DB 77,137,199 ; mov %r8,%r15
+ DB 72,137,211 ; mov %rdx,%rbx
DB 72,137,141,24,255,255,255 ; mov %rcx,-0xe8(%rbp)
DB 72,139,117,48 ; mov 0x30(%rbp),%rsi
DB 72,173 ; lods %ds:(%rsi),%rax
DB 73,137,197 ; mov %rax,%r13
DB 73,137,246 ; mov %rsi,%r14
- DB 76,137,141,240,254,255,255 ; mov %r9,-0x110(%rbp)
- DB 77,57,207 ; cmp %r9,%r15
- DB 15,131,138,0,0,0 ; jae 26403 <_sk_start_pipeline_sse41_8bit+0x10b>
+ DB 76,137,141,8,255,255,255 ; mov %r9,-0xf8(%rbp)
+ DB 76,57,203 ; cmp %r9,%rbx
+ DB 115,101 ; jae 2638e <_sk_start_pipeline_sse41_8bit+0xe2>
DB 72,139,133,24,255,255,255 ; mov -0xe8(%rbp),%rax
DB 72,141,64,8 ; lea 0x8(%rax),%rax
- DB 72,137,133,248,254,255,255 ; mov %rax,-0x108(%rbp)
- DB 76,141,165,0,255,255,255 ; lea -0x100(%rbp),%r12
- DB 72,57,157,248,254,255,255 ; cmp %rbx,-0x108(%rbp)
- DB 72,139,133,24,255,255,255 ; mov -0xe8(%rbp),%rax
- DB 72,137,133,0,255,255,255 ; mov %rax,-0x100(%rbp)
- DB 76,137,189,8,255,255,255 ; mov %r15,-0xf8(%rbp)
- DB 72,199,133,16,255,255,255,0,0,0,0 ; movq $0x0,-0xf0(%rbp)
- DB 119,36 ; ja 263df <_sk_start_pipeline_sse41_8bit+0xe7>
- DB 76,137,231 ; mov %r12,%rdi
+ DB 72,137,133,16,255,255,255 ; mov %rax,-0xf0(%rbp)
+ DB 76,57,189,16,255,255,255 ; cmp %r15,-0xf0(%rbp)
+ DB 72,139,149,24,255,255,255 ; mov -0xe8(%rbp),%rdx
+ DB 119,38 ; ja 26371 <_sk_start_pipeline_sse41_8bit+0xc5>
+ DB 76,139,165,24,255,255,255 ; mov -0xe8(%rbp),%r12
+ DB 49,255 ; xor %edi,%edi
DB 76,137,246 ; mov %r14,%rsi
- DB 65,255,213 ; callq *%r13
- DB 72,139,141,0,255,255,255 ; mov -0x100(%rbp),%rcx
- DB 72,141,65,8 ; lea 0x8(%rcx),%rax
- DB 72,137,133,0,255,255,255 ; mov %rax,-0x100(%rbp)
- DB 72,131,193,16 ; add $0x10,%rcx
- DB 72,57,217 ; cmp %rbx,%rcx
- DB 118,220 ; jbe 263bb <_sk_start_pipeline_sse41_8bit+0xc3>
+ DB 76,137,226 ; mov %r12,%rdx
DB 72,137,217 ; mov %rbx,%rcx
- DB 72,41,193 ; sub %rax,%rcx
- DB 116,16 ; je 263f7 <_sk_start_pipeline_sse41_8bit+0xff>
- DB 72,137,141,16,255,255,255 ; mov %rcx,-0xf0(%rbp)
- DB 76,137,231 ; mov %r12,%rdi
+ DB 65,255,213 ; callq *%r13
+ DB 73,141,84,36,8 ; lea 0x8(%r12),%rdx
+ DB 73,131,196,16 ; add $0x10,%r12
+ DB 77,57,252 ; cmp %r15,%r12
+ DB 73,137,212 ; mov %rdx,%r12
+ DB 118,225 ; jbe 26352 <_sk_start_pipeline_sse41_8bit+0xa6>
+ DB 76,137,255 ; mov %r15,%rdi
+ DB 72,41,215 ; sub %rdx,%rdi
+ DB 116,9 ; je 26382 <_sk_start_pipeline_sse41_8bit+0xd6>
DB 76,137,246 ; mov %r14,%rsi
+ DB 72,137,217 ; mov %rbx,%rcx
DB 65,255,213 ; callq *%r13
- DB 73,255,199 ; inc %r15
- DB 76,59,189,240,254,255,255 ; cmp -0x110(%rbp),%r15
- DB 117,143 ; jne 26392 <_sk_start_pipeline_sse41_8bit+0x9a>
+ DB 72,255,195 ; inc %rbx
+ DB 72,59,157,8,255,255,255 ; cmp -0xf8(%rbp),%rbx
+ DB 117,173 ; jne 2633b <_sk_start_pipeline_sse41_8bit+0x8f>
DB 15,40,181,32,255,255,255 ; movaps -0xe0(%rbp),%xmm6
DB 15,40,189,48,255,255,255 ; movaps -0xd0(%rbp),%xmm7
DB 68,15,40,133,64,255,255,255 ; movaps -0xc0(%rbp),%xmm8
@@ -36399,7 +36397,7 @@ _sk_start_pipeline_sse41_8bit LABEL PROC
DB 68,15,40,109,144 ; movaps -0x70(%rbp),%xmm13
DB 68,15,40,117,160 ; movaps -0x60(%rbp),%xmm14
DB 68,15,40,125,176 ; movaps -0x50(%rbp),%xmm15
- DB 72,129,196,216,0,0,0 ; add $0xd8,%rsp
+ DB 72,129,196,200,0,0,0 ; add $0xc8,%rsp
DB 91 ; pop %rbx
DB 95 ; pop %rdi
DB 94 ; pop %rsi
@@ -36426,22 +36424,22 @@ _sk_uniform_color_sse41_8bit LABEL PROC
PUBLIC _sk_set_rgb_sse41_8bit
_sk_set_rgb_sse41_8bit LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 243,15,16,37,152,92,0,0 ; movss 0x5c98(%rip),%xmm4 # 2c110 <_sk_overlay_sse2_8bit+0x49b>
+ DB 243,15,16,37,73,92,0,0 ; movss 0x5c49(%rip),%xmm4 # 2c04c <_sk_overlay_sse2_8bit+0x49c>
DB 243,15,16,40 ; movss (%rax),%xmm5
DB 243,15,89,236 ; mulss %xmm4,%xmm5
- DB 243,72,15,44,205 ; cvttss2si %xmm5,%rcx
+ DB 243,76,15,44,197 ; cvttss2si %xmm5,%r8
DB 243,15,16,104,4 ; movss 0x4(%rax),%xmm5
DB 243,15,89,236 ; mulss %xmm4,%xmm5
- DB 243,72,15,44,213 ; cvttss2si %xmm5,%rdx
- DB 193,226,8 ; shl $0x8,%edx
- DB 9,202 ; or %ecx,%edx
+ DB 243,76,15,44,205 ; cvttss2si %xmm5,%r9
+ DB 65,193,225,8 ; shl $0x8,%r9d
+ DB 69,9,193 ; or %r8d,%r9d
DB 243,15,89,96,8 ; mulss 0x8(%rax),%xmm4
DB 243,72,15,44,196 ; cvttss2si %xmm4,%rax
DB 193,224,16 ; shl $0x10,%eax
- DB 9,208 ; or %edx,%eax
+ DB 68,9,200 ; or %r9d,%eax
DB 102,15,110,224 ; movd %eax,%xmm4
DB 102,15,112,228,0 ; pshufd $0x0,%xmm4,%xmm4
- DB 102,15,111,45,88,109,0,0 ; movdqa 0x6d58(%rip),%xmm5 # 2d210 <_sk_overlay_sse2_8bit+0x159b>
+ DB 102,15,111,45,10,109,0,0 ; movdqa 0x6d0a(%rip),%xmm5 # 2d150 <_sk_overlay_sse2_8bit+0x15a0>
DB 102,15,219,205 ; pand %xmm5,%xmm1
DB 102,15,219,197 ; pand %xmm5,%xmm0
DB 102,15,235,196 ; por %xmm4,%xmm0
@@ -36453,12 +36451,12 @@ PUBLIC _sk_premul_sse41_8bit
_sk_premul_sse41_8bit LABEL PROC
DB 102,15,111,225 ; movdqa %xmm1,%xmm4
DB 102,15,111,232 ; movdqa %xmm0,%xmm5
- DB 102,15,111,5,68,109,0,0 ; movdqa 0x6d44(%rip),%xmm0 # 2d220 <_sk_overlay_sse2_8bit+0x15ab>
+ DB 102,15,111,5,246,108,0,0 ; movdqa 0x6cf6(%rip),%xmm0 # 2d160 <_sk_overlay_sse2_8bit+0x15b0>
DB 102,15,111,253 ; movdqa %xmm5,%xmm7
DB 102,15,56,0,248 ; pshufb %xmm0,%xmm7
DB 102,15,111,244 ; movdqa %xmm4,%xmm6
DB 102,15,56,0,240 ; pshufb %xmm0,%xmm6
- DB 102,15,111,5,26,109,0,0 ; movdqa 0x6d1a(%rip),%xmm0 # 2d210 <_sk_overlay_sse2_8bit+0x159b>
+ DB 102,15,111,5,204,108,0,0 ; movdqa 0x6ccc(%rip),%xmm0 # 2d150 <_sk_overlay_sse2_8bit+0x15a0>
DB 102,15,235,240 ; por %xmm0,%xmm6
DB 102,15,235,248 ; por %xmm0,%xmm7
DB 102,69,15,239,192 ; pxor %xmm8,%xmm8
@@ -36489,7 +36487,7 @@ _sk_premul_sse41_8bit LABEL PROC
PUBLIC _sk_swap_rb_sse41_8bit
_sk_swap_rb_sse41_8bit LABEL PROC
- DB 102,15,111,37,183,108,0,0 ; movdqa 0x6cb7(%rip),%xmm4 # 2d230 <_sk_overlay_sse2_8bit+0x15bb>
+ DB 102,15,111,37,105,108,0,0 ; movdqa 0x6c69(%rip),%xmm4 # 2d170 <_sk_overlay_sse2_8bit+0x15c0>
DB 102,15,56,0,196 ; pshufb %xmm4,%xmm0
DB 102,15,56,0,204 ; pshufb %xmm4,%xmm1
DB 72,173 ; lods %ds:(%rsi),%rax
@@ -36505,50 +36503,50 @@ _sk_invert_sse41_8bit LABEL PROC
PUBLIC _sk_load_8888_sse41_8bit
_sk_load_8888_sse41_8bit LABEL PROC
- DB 76,99,7 ; movslq (%rdi),%r8
- DB 76,139,79,16 ; mov 0x10(%rdi),%r9
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 72,99,72,8 ; movslq 0x8(%rax),%rcx
- DB 72,99,87,8 ; movslq 0x8(%rdi),%rdx
- DB 72,15,175,209 ; imul %rcx,%rdx
- DB 72,193,226,2 ; shl $0x2,%rdx
- DB 72,3,16 ; add (%rax),%rdx
- DB 77,133,201 ; test %r9,%r9
- DB 117,17 ; jne 265c9 <_sk_load_8888_sse41_8bit+0x32>
- DB 243,66,15,111,76,130,16 ; movdqu 0x10(%rdx,%r8,4),%xmm1
- DB 243,66,15,111,4,130 ; movdqu (%rdx,%r8,4),%xmm0
+ DB 76,99,72,8 ; movslq 0x8(%rax),%r9
+ DB 76,99,193 ; movslq %ecx,%r8
+ DB 77,15,175,193 ; imul %r9,%r8
+ DB 73,193,224,2 ; shl $0x2,%r8
+ DB 76,3,0 ; add (%rax),%r8
+ DB 76,99,218 ; movslq %edx,%r11
+ DB 72,133,255 ; test %rdi,%rdi
+ DB 117,17 ; jne 26552 <_sk_load_8888_sse41_8bit+0x2d>
+ DB 243,67,15,111,76,152,16 ; movdqu 0x10(%r8,%r11,4),%xmm1
+ DB 243,67,15,111,4,152 ; movdqu (%r8,%r11,4),%xmm0
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
+ DB 65,137,249 ; mov %edi,%r9d
DB 65,128,225,7 ; and $0x7,%r9b
DB 102,15,239,201 ; pxor %xmm1,%xmm1
DB 102,15,239,192 ; pxor %xmm0,%xmm0
DB 65,254,201 ; dec %r9b
DB 65,128,249,6 ; cmp $0x6,%r9b
- DB 119,231 ; ja 265c5 <_sk_load_8888_sse41_8bit+0x2e>
- DB 65,15,182,193 ; movzbl %r9b,%eax
- DB 72,141,13,75,0,0,0 ; lea 0x4b(%rip),%rcx # 26634 <_sk_load_8888_sse41_8bit+0x9d>
- DB 72,99,4,129 ; movslq (%rcx,%rax,4),%rax
- DB 72,1,200 ; add %rcx,%rax
+ DB 119,228 ; ja 2654e <_sk_load_8888_sse41_8bit+0x29>
+ DB 69,15,182,201 ; movzbl %r9b,%r9d
+ DB 76,141,21,75,0,0,0 ; lea 0x4b(%rip),%r10 # 265c0 <_sk_load_8888_sse41_8bit+0x9b>
+ DB 75,99,4,138 ; movslq (%r10,%r9,4),%rax
+ DB 76,1,208 ; add %r10,%rax
DB 255,224 ; jmpq *%rax
- DB 102,66,15,110,4,130 ; movd (%rdx,%r8,4),%xmm0
- DB 235,203 ; jmp 265c5 <_sk_load_8888_sse41_8bit+0x2e>
- DB 102,66,15,110,68,130,8 ; movd 0x8(%rdx,%r8,4),%xmm0
+ DB 102,67,15,110,4,152 ; movd (%r8,%r11,4),%xmm0
+ DB 235,200 ; jmp 2654e <_sk_load_8888_sse41_8bit+0x29>
+ DB 102,67,15,110,68,152,8 ; movd 0x8(%r8,%r11,4),%xmm0
DB 102,15,112,192,69 ; pshufd $0x45,%xmm0,%xmm0
- DB 243,66,15,126,36,130 ; movq (%rdx,%r8,4),%xmm4
+ DB 243,67,15,126,36,152 ; movq (%r8,%r11,4),%xmm4
DB 102,15,58,14,196,15 ; pblendw $0xf,%xmm4,%xmm0
- DB 235,177 ; jmp 265c5 <_sk_load_8888_sse41_8bit+0x2e>
- DB 102,66,15,110,68,130,24 ; movd 0x18(%rdx,%r8,4),%xmm0
+ DB 235,174 ; jmp 2654e <_sk_load_8888_sse41_8bit+0x29>
+ DB 102,67,15,110,68,152,24 ; movd 0x18(%r8,%r11,4),%xmm0
DB 102,15,112,200,69 ; pshufd $0x45,%xmm0,%xmm1
- DB 102,66,15,58,34,76,130,20,1 ; pinsrd $0x1,0x14(%rdx,%r8,4),%xmm1
- DB 102,66,15,58,34,76,130,16,0 ; pinsrd $0x0,0x10(%rdx,%r8,4),%xmm1
- DB 235,139 ; jmp 265bf <_sk_load_8888_sse41_8bit+0x28>
+ DB 102,67,15,58,34,76,152,20,1 ; pinsrd $0x1,0x14(%r8,%r11,4),%xmm1
+ DB 102,67,15,58,34,76,152,16,0 ; pinsrd $0x0,0x10(%r8,%r11,4),%xmm1
+ DB 235,136 ; jmp 26548 <_sk_load_8888_sse41_8bit+0x23>
DB 190,255,255,255,210 ; mov $0xd2ffffff,%esi
DB 255 ; (bad)
DB 255 ; (bad)
DB 255,198 ; inc %esi
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,139,255,255,255,245 ; decl -0xa000001(%rbx)
+ DB 255,136,255,255,255,245 ; decl -0xa000001(%rax)
DB 255 ; (bad)
DB 255 ; (bad)
DB 255 ; (bad)
@@ -36562,316 +36560,313 @@ _sk_load_8888_sse41_8bit LABEL PROC
PUBLIC _sk_load_8888_dst_sse41_8bit
_sk_load_8888_dst_sse41_8bit LABEL PROC
- DB 76,99,7 ; movslq (%rdi),%r8
- DB 76,139,79,16 ; mov 0x10(%rdi),%r9
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 72,99,72,8 ; movslq 0x8(%rax),%rcx
- DB 72,99,87,8 ; movslq 0x8(%rdi),%rdx
- DB 72,15,175,209 ; imul %rcx,%rdx
- DB 72,193,226,2 ; shl $0x2,%rdx
- DB 72,3,16 ; add (%rax),%rdx
- DB 77,133,201 ; test %r9,%r9
- DB 117,17 ; jne 26682 <_sk_load_8888_dst_sse41_8bit+0x32>
- DB 243,66,15,111,92,130,16 ; movdqu 0x10(%rdx,%r8,4),%xmm3
- DB 243,66,15,111,20,130 ; movdqu (%rdx,%r8,4),%xmm2
+ DB 76,99,72,8 ; movslq 0x8(%rax),%r9
+ DB 76,99,193 ; movslq %ecx,%r8
+ DB 77,15,175,193 ; imul %r9,%r8
+ DB 73,193,224,2 ; shl $0x2,%r8
+ DB 76,3,0 ; add (%rax),%r8
+ DB 76,99,218 ; movslq %edx,%r11
+ DB 72,133,255 ; test %rdi,%rdi
+ DB 117,17 ; jne 26609 <_sk_load_8888_dst_sse41_8bit+0x2d>
+ DB 243,67,15,111,92,152,16 ; movdqu 0x10(%r8,%r11,4),%xmm3
+ DB 243,67,15,111,20,152 ; movdqu (%r8,%r11,4),%xmm2
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
+ DB 65,137,249 ; mov %edi,%r9d
DB 65,128,225,7 ; and $0x7,%r9b
DB 102,15,239,219 ; pxor %xmm3,%xmm3
DB 102,15,239,210 ; pxor %xmm2,%xmm2
DB 65,254,201 ; dec %r9b
DB 65,128,249,6 ; cmp $0x6,%r9b
- DB 119,231 ; ja 2667e <_sk_load_8888_dst_sse41_8bit+0x2e>
- DB 65,15,182,193 ; movzbl %r9b,%eax
- DB 72,141,13,78,0,0,0 ; lea 0x4e(%rip),%rcx # 266f0 <_sk_load_8888_dst_sse41_8bit+0xa0>
- DB 72,99,4,129 ; movslq (%rcx,%rax,4),%rax
- DB 72,1,200 ; add %rcx,%rax
+ DB 119,228 ; ja 26605 <_sk_load_8888_dst_sse41_8bit+0x29>
+ DB 69,15,182,201 ; movzbl %r9b,%r9d
+ DB 76,141,21,76,0,0,0 ; lea 0x4c(%rip),%r10 # 26678 <_sk_load_8888_dst_sse41_8bit+0x9c>
+ DB 75,99,4,138 ; movslq (%r10,%r9,4),%rax
+ DB 76,1,208 ; add %r10,%rax
DB 255,224 ; jmpq *%rax
- DB 102,66,15,110,20,130 ; movd (%rdx,%r8,4),%xmm2
- DB 235,203 ; jmp 2667e <_sk_load_8888_dst_sse41_8bit+0x2e>
- DB 102,66,15,110,84,130,8 ; movd 0x8(%rdx,%r8,4),%xmm2
+ DB 102,67,15,110,20,152 ; movd (%r8,%r11,4),%xmm2
+ DB 235,200 ; jmp 26605 <_sk_load_8888_dst_sse41_8bit+0x29>
+ DB 102,67,15,110,84,152,8 ; movd 0x8(%r8,%r11,4),%xmm2
DB 102,15,112,210,69 ; pshufd $0x45,%xmm2,%xmm2
- DB 243,66,15,126,36,130 ; movq (%rdx,%r8,4),%xmm4
+ DB 243,67,15,126,36,152 ; movq (%r8,%r11,4),%xmm4
DB 102,15,58,14,212,15 ; pblendw $0xf,%xmm4,%xmm2
- DB 235,177 ; jmp 2667e <_sk_load_8888_dst_sse41_8bit+0x2e>
- DB 102,66,15,110,84,130,24 ; movd 0x18(%rdx,%r8,4),%xmm2
+ DB 235,174 ; jmp 26605 <_sk_load_8888_dst_sse41_8bit+0x29>
+ DB 102,67,15,110,84,152,24 ; movd 0x18(%r8,%r11,4),%xmm2
DB 102,15,112,218,69 ; pshufd $0x45,%xmm2,%xmm3
- DB 102,66,15,58,34,92,130,20,1 ; pinsrd $0x1,0x14(%rdx,%r8,4),%xmm3
- DB 102,66,15,58,34,92,130,16,0 ; pinsrd $0x0,0x10(%rdx,%r8,4),%xmm3
- DB 235,139 ; jmp 26678 <_sk_load_8888_dst_sse41_8bit+0x28>
- DB 15,31,0 ; nopl (%rax)
- DB 187,255,255,255,207 ; mov $0xcfffffff,%ebx
+ DB 102,67,15,58,34,92,152,20,1 ; pinsrd $0x1,0x14(%r8,%r11,4),%xmm3
+ DB 102,67,15,58,34,92,152,16,0 ; pinsrd $0x0,0x10(%r8,%r11,4),%xmm3
+ DB 235,136 ; jmp 265ff <_sk_load_8888_dst_sse41_8bit+0x23>
+ DB 144 ; nop
+ DB 189,255,255,255,209 ; mov $0xd1ffffff,%ebp
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,195 ; inc %ebx
+ DB 255,197 ; inc %ebp
+ DB 255 ; (bad)
DB 255 ; (bad)
+ DB 255,135,255,255,255,244 ; incl -0xb000001(%rdi)
DB 255 ; (bad)
- DB 255,136,255,255,255,242 ; decl -0xd000001(%rax)
DB 255 ; (bad)
DB 255 ; (bad)
+ DB 235,255 ; jmp 2668d <_sk_load_8888_dst_sse41_8bit+0xb1>
DB 255 ; (bad)
- DB 233,255,255,255,221 ; jmpq ffffffffde026708 <_sk_overlay_sse2_8bit+0xffffffffddffaa93>
DB 255 ; (bad)
+ DB 223,255 ; (bad)
DB 255 ; (bad)
DB 255 ; .byte 0xff
PUBLIC _sk_store_8888_sse41_8bit
_sk_store_8888_sse41_8bit LABEL PROC
- DB 76,99,15 ; movslq (%rdi),%r9
- DB 76,139,71,16 ; mov 0x10(%rdi),%r8
- DB 72,173 ; lods %ds:(%rsi),%rax
- DB 72,99,72,8 ; movslq 0x8(%rax),%rcx
- DB 72,99,87,8 ; movslq 0x8(%rdi),%rdx
- DB 72,15,175,209 ; imul %rcx,%rdx
- DB 72,193,226,2 ; shl $0x2,%rdx
- DB 72,3,16 ; add (%rax),%rdx
- DB 77,133,192 ; test %r8,%r8
- DB 117,17 ; jne 2673e <_sk_store_8888_sse41_8bit+0x32>
- DB 243,66,15,127,4,138 ; movdqu %xmm0,(%rdx,%r9,4)
- DB 243,66,15,127,76,138,16 ; movdqu %xmm1,0x10(%rdx,%r9,4)
- DB 72,173 ; lods %ds:(%rsi),%rax
- DB 255,224 ; jmpq *%rax
- DB 65,128,224,7 ; and $0x7,%r8b
- DB 65,254,200 ; dec %r8b
- DB 65,128,248,6 ; cmp $0x6,%r8b
- DB 119,239 ; ja 2673a <_sk_store_8888_sse41_8bit+0x2e>
- DB 65,15,182,192 ; movzbl %r8b,%eax
- DB 72,141,13,70,0,0,0 ; lea 0x46(%rip),%rcx # 2679c <_sk_store_8888_sse41_8bit+0x90>
- DB 72,99,4,129 ; movslq (%rcx,%rax,4),%rax
- DB 72,1,200 ; add %rcx,%rax
- DB 255,224 ; jmpq *%rax
- DB 102,66,15,126,4,138 ; movd %xmm0,(%rdx,%r9,4)
- DB 235,211 ; jmp 2673a <_sk_store_8888_sse41_8bit+0x2e>
- DB 102,66,15,58,22,68,138,8,2 ; pextrd $0x2,%xmm0,0x8(%rdx,%r9,4)
- DB 102,66,15,214,4,138 ; movq %xmm0,(%rdx,%r9,4)
- DB 235,194 ; jmp 2673a <_sk_store_8888_sse41_8bit+0x2e>
- DB 102,66,15,58,22,76,138,24,2 ; pextrd $0x2,%xmm1,0x18(%rdx,%r9,4)
- DB 102,66,15,58,22,76,138,20,1 ; pextrd $0x1,%xmm1,0x14(%rdx,%r9,4)
- DB 102,66,15,126,76,138,16 ; movd %xmm1,0x10(%rdx,%r9,4)
- DB 243,66,15,127,4,138 ; movdqu %xmm0,(%rdx,%r9,4)
- DB 235,161 ; jmp 2673a <_sk_store_8888_sse41_8bit+0x2e>
- DB 15,31,0 ; nopl (%rax)
- DB 195 ; retq
- DB 255 ; (bad)
- DB 255 ; (bad)
- DB 255,212 ; callq *%rsp
- DB 255 ; (bad)
+ DB 72,173 ; lods %ds:(%rsi),%rax
+ DB 76,99,72,8 ; movslq 0x8(%rax),%r9
+ DB 76,99,193 ; movslq %ecx,%r8
+ DB 77,15,175,193 ; imul %r9,%r8
+ DB 73,193,224,2 ; shl $0x2,%r8
+ DB 76,3,0 ; add (%rax),%r8
+ DB 76,99,218 ; movslq %edx,%r11
+ DB 72,133,255 ; test %rdi,%rdi
+ DB 117,17 ; jne 266c1 <_sk_store_8888_sse41_8bit+0x2d>
+ DB 243,67,15,127,4,152 ; movdqu %xmm0,(%r8,%r11,4)
+ DB 243,67,15,127,76,152,16 ; movdqu %xmm1,0x10(%r8,%r11,4)
+ DB 72,173 ; lods %ds:(%rsi),%rax
+ DB 255,224 ; jmpq *%rax
+ DB 65,137,249 ; mov %edi,%r9d
+ DB 65,128,225,7 ; and $0x7,%r9b
+ DB 65,254,201 ; dec %r9b
+ DB 65,128,249,6 ; cmp $0x6,%r9b
+ DB 119,236 ; ja 266bd <_sk_store_8888_sse41_8bit+0x29>
+ DB 69,15,182,201 ; movzbl %r9b,%r9d
+ DB 76,141,21,68,0,0,0 ; lea 0x44(%rip),%r10 # 26720 <_sk_store_8888_sse41_8bit+0x8c>
+ DB 75,99,4,138 ; movslq (%r10,%r9,4),%rax
+ DB 76,1,208 ; add %r10,%rax
+ DB 255,224 ; jmpq *%rax
+ DB 102,67,15,126,4,152 ; movd %xmm0,(%r8,%r11,4)
+ DB 235,208 ; jmp 266bd <_sk_store_8888_sse41_8bit+0x29>
+ DB 102,67,15,58,22,68,152,8,2 ; pextrd $0x2,%xmm0,0x8(%r8,%r11,4)
+ DB 102,67,15,214,4,152 ; movq %xmm0,(%r8,%r11,4)
+ DB 235,191 ; jmp 266bd <_sk_store_8888_sse41_8bit+0x29>
+ DB 102,67,15,58,22,76,152,24,2 ; pextrd $0x2,%xmm1,0x18(%r8,%r11,4)
+ DB 102,67,15,58,22,76,152,20,1 ; pextrd $0x1,%xmm1,0x14(%r8,%r11,4)
+ DB 102,67,15,126,76,152,16 ; movd %xmm1,0x10(%r8,%r11,4)
+ DB 243,67,15,127,4,152 ; movdqu %xmm0,(%r8,%r11,4)
+ DB 235,158 ; jmp 266bd <_sk_store_8888_sse41_8bit+0x29>
+ DB 144 ; nop
+ DB 197,255,255 ; (bad)
+ DB 255,214 ; callq *%rsi
DB 255 ; (bad)
- DB 255,203 ; dec %ebx
DB 255 ; (bad)
+ DB 255,205 ; dec %ebp
DB 255 ; (bad)
- DB 255,245 ; push %rbp
DB 255 ; (bad)
+ DB 255,247 ; push %rdi
DB 255 ; (bad)
DB 255 ; (bad)
- DB 238 ; out %al,(%dx)
+ DB 255,240 ; push %rax
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,229 ; jmpq *%rbp
+ DB 255,231 ; jmpq *%rdi
DB 255 ; (bad)
DB 255 ; (bad)
DB 255 ; (bad)
- DB 220,255 ; fdivr %st,%st(7)
+ DB 222,255 ; fdivrp %st,%st(7)
DB 255 ; (bad)
DB 255 ; .byte 0xff
PUBLIC _sk_load_bgra_sse41_8bit
_sk_load_bgra_sse41_8bit LABEL PROC
- DB 76,99,7 ; movslq (%rdi),%r8
- DB 76,139,79,16 ; mov 0x10(%rdi),%r9
- DB 72,173 ; lods %ds:(%rsi),%rax
- DB 72,99,72,8 ; movslq 0x8(%rax),%rcx
- DB 72,99,87,8 ; movslq 0x8(%rdi),%rdx
- DB 72,15,175,209 ; imul %rcx,%rdx
- DB 72,193,226,2 ; shl $0x2,%rdx
- DB 72,3,16 ; add (%rax),%rdx
- DB 77,133,201 ; test %r9,%r9
- DB 117,35 ; jne 267fc <_sk_load_bgra_sse41_8bit+0x44>
- DB 243,66,15,111,76,130,16 ; movdqu 0x10(%rdx,%r8,4),%xmm1
- DB 243,66,15,111,4,130 ; movdqu (%rdx,%r8,4),%xmm0
- DB 102,15,111,37,66,106,0,0 ; movdqa 0x6a42(%rip),%xmm4 # 2d230 <_sk_overlay_sse2_8bit+0x15bb>
+ DB 72,173 ; lods %ds:(%rsi),%rax
+ DB 76,99,72,8 ; movslq 0x8(%rax),%r9
+ DB 76,99,193 ; movslq %ecx,%r8
+ DB 77,15,175,193 ; imul %r9,%r8
+ DB 73,193,224,2 ; shl $0x2,%r8
+ DB 76,3,0 ; add (%rax),%r8
+ DB 76,99,218 ; movslq %edx,%r11
+ DB 72,133,255 ; test %rdi,%rdi
+ DB 117,35 ; jne 2677b <_sk_load_bgra_sse41_8bit+0x3f>
+ DB 243,67,15,111,76,152,16 ; movdqu 0x10(%r8,%r11,4),%xmm1
+ DB 243,67,15,111,4,152 ; movdqu (%r8,%r11,4),%xmm0
+ DB 102,15,111,37,3,106,0,0 ; movdqa 0x6a03(%rip),%xmm4 # 2d170 <_sk_overlay_sse2_8bit+0x15c0>
DB 102,15,56,0,196 ; pshufb %xmm4,%xmm0
DB 102,15,56,0,204 ; pshufb %xmm4,%xmm1
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
+ DB 65,137,249 ; mov %edi,%r9d
DB 65,128,225,7 ; and $0x7,%r9b
DB 102,15,239,201 ; pxor %xmm1,%xmm1
DB 102,15,239,192 ; pxor %xmm0,%xmm0
DB 65,254,201 ; dec %r9b
DB 65,128,249,6 ; cmp $0x6,%r9b
- DB 119,213 ; ja 267e6 <_sk_load_bgra_sse41_8bit+0x2e>
- DB 65,15,182,193 ; movzbl %r9b,%eax
- DB 72,141,13,80,0,0,0 ; lea 0x50(%rip),%rcx # 2686c <_sk_load_bgra_sse41_8bit+0xb4>
- DB 72,99,4,129 ; movslq (%rcx,%rax,4),%rax
- DB 72,1,200 ; add %rcx,%rax
+ DB 119,210 ; ja 26765 <_sk_load_bgra_sse41_8bit+0x29>
+ DB 69,15,182,201 ; movzbl %r9b,%r9d
+ DB 76,141,21,78,0,0,0 ; lea 0x4e(%rip),%r10 # 267ec <_sk_load_bgra_sse41_8bit+0xb0>
+ DB 75,99,4,138 ; movslq (%r10,%r9,4),%rax
+ DB 76,1,208 ; add %r10,%rax
DB 255,224 ; jmpq *%rax
- DB 102,66,15,110,4,130 ; movd (%rdx,%r8,4),%xmm0
- DB 235,185 ; jmp 267e6 <_sk_load_bgra_sse41_8bit+0x2e>
- DB 102,66,15,110,68,130,8 ; movd 0x8(%rdx,%r8,4),%xmm0
+ DB 102,67,15,110,4,152 ; movd (%r8,%r11,4),%xmm0
+ DB 235,182 ; jmp 26765 <_sk_load_bgra_sse41_8bit+0x29>
+ DB 102,67,15,110,68,152,8 ; movd 0x8(%r8,%r11,4),%xmm0
DB 102,15,112,192,69 ; pshufd $0x45,%xmm0,%xmm0
- DB 243,66,15,126,36,130 ; movq (%rdx,%r8,4),%xmm4
+ DB 243,67,15,126,36,152 ; movq (%r8,%r11,4),%xmm4
DB 102,15,58,14,196,15 ; pblendw $0xf,%xmm4,%xmm0
- DB 235,159 ; jmp 267e6 <_sk_load_bgra_sse41_8bit+0x2e>
- DB 102,66,15,110,68,130,24 ; movd 0x18(%rdx,%r8,4),%xmm0
+ DB 235,156 ; jmp 26765 <_sk_load_bgra_sse41_8bit+0x29>
+ DB 102,67,15,110,68,152,24 ; movd 0x18(%r8,%r11,4),%xmm0
DB 102,15,112,200,69 ; pshufd $0x45,%xmm0,%xmm1
- DB 102,66,15,58,34,76,130,20,1 ; pinsrd $0x1,0x14(%rdx,%r8,4),%xmm1
- DB 102,66,15,58,34,76,130,16,0 ; pinsrd $0x0,0x10(%rdx,%r8,4),%xmm1
- DB 233,118,255,255,255 ; jmpq 267e0 <_sk_load_bgra_sse41_8bit+0x28>
- DB 102,144 ; xchg %ax,%ax
- DB 185,255,255,255,205 ; mov $0xcdffffff,%ecx
+ DB 102,67,15,58,34,76,152,20,1 ; pinsrd $0x1,0x14(%r8,%r11,4),%xmm1
+ DB 102,67,15,58,34,76,152,16,0 ; pinsrd $0x0,0x10(%r8,%r11,4),%xmm1
+ DB 233,115,255,255,255 ; jmpq 2675f <_sk_load_bgra_sse41_8bit+0x23>
+ DB 187,255,255,255,207 ; mov $0xcfffffff,%ebx
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,193 ; inc %ecx
+ DB 255,195 ; inc %ebx
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,116,255,255 ; pushq -0x1(%rdi,%rdi,8)
- DB 255,240 ; push %rax
+ DB 255,115,255 ; pushq -0x1(%rbx)
DB 255 ; (bad)
+ DB 255,242 ; push %rdx
DB 255 ; (bad)
- DB 255,231 ; jmpq *%rdi
DB 255 ; (bad)
DB 255 ; (bad)
+ DB 233,255,255,255,221 ; jmpq ffffffffde026804 <_sk_overlay_sse2_8bit+0xffffffffddffac54>
DB 255 ; (bad)
- DB 219,255 ; (bad)
DB 255 ; (bad)
DB 255 ; .byte 0xff
PUBLIC _sk_load_bgra_dst_sse41_8bit
_sk_load_bgra_dst_sse41_8bit LABEL PROC
- DB 76,99,7 ; movslq (%rdi),%r8
- DB 76,139,79,16 ; mov 0x10(%rdi),%r9
- DB 72,173 ; lods %ds:(%rsi),%rax
- DB 72,99,72,8 ; movslq 0x8(%rax),%rcx
- DB 72,99,87,8 ; movslq 0x8(%rdi),%rdx
- DB 72,15,175,209 ; imul %rcx,%rdx
- DB 72,193,226,2 ; shl $0x2,%rdx
- DB 72,3,16 ; add (%rax),%rdx
- DB 77,133,201 ; test %r9,%r9
- DB 117,35 ; jne 268cc <_sk_load_bgra_dst_sse41_8bit+0x44>
- DB 243,66,15,111,92,130,16 ; movdqu 0x10(%rdx,%r8,4),%xmm3
- DB 243,66,15,111,20,130 ; movdqu (%rdx,%r8,4),%xmm2
- DB 102,15,111,37,114,105,0,0 ; movdqa 0x6972(%rip),%xmm4 # 2d230 <_sk_overlay_sse2_8bit+0x15bb>
+ DB 72,173 ; lods %ds:(%rsi),%rax
+ DB 76,99,72,8 ; movslq 0x8(%rax),%r9
+ DB 76,99,193 ; movslq %ecx,%r8
+ DB 77,15,175,193 ; imul %r9,%r8
+ DB 73,193,224,2 ; shl $0x2,%r8
+ DB 76,3,0 ; add (%rax),%r8
+ DB 76,99,218 ; movslq %edx,%r11
+ DB 72,133,255 ; test %rdi,%rdi
+ DB 117,35 ; jne 26847 <_sk_load_bgra_dst_sse41_8bit+0x3f>
+ DB 243,67,15,111,92,152,16 ; movdqu 0x10(%r8,%r11,4),%xmm3
+ DB 243,67,15,111,20,152 ; movdqu (%r8,%r11,4),%xmm2
+ DB 102,15,111,37,55,105,0,0 ; movdqa 0x6937(%rip),%xmm4 # 2d170 <_sk_overlay_sse2_8bit+0x15c0>
DB 102,15,56,0,212 ; pshufb %xmm4,%xmm2
DB 102,15,56,0,220 ; pshufb %xmm4,%xmm3
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
+ DB 65,137,249 ; mov %edi,%r9d
DB 65,128,225,7 ; and $0x7,%r9b
DB 102,15,239,219 ; pxor %xmm3,%xmm3
DB 102,15,239,210 ; pxor %xmm2,%xmm2
DB 65,254,201 ; dec %r9b
DB 65,128,249,6 ; cmp $0x6,%r9b
- DB 119,213 ; ja 268b6 <_sk_load_bgra_dst_sse41_8bit+0x2e>
- DB 65,15,182,193 ; movzbl %r9b,%eax
- DB 72,141,13,80,0,0,0 ; lea 0x50(%rip),%rcx # 2693c <_sk_load_bgra_dst_sse41_8bit+0xb4>
- DB 72,99,4,129 ; movslq (%rcx,%rax,4),%rax
- DB 72,1,200 ; add %rcx,%rax
+ DB 119,210 ; ja 26831 <_sk_load_bgra_dst_sse41_8bit+0x29>
+ DB 69,15,182,201 ; movzbl %r9b,%r9d
+ DB 76,141,21,78,0,0,0 ; lea 0x4e(%rip),%r10 # 268b8 <_sk_load_bgra_dst_sse41_8bit+0xb0>
+ DB 75,99,4,138 ; movslq (%r10,%r9,4),%rax
+ DB 76,1,208 ; add %r10,%rax
DB 255,224 ; jmpq *%rax
- DB 102,66,15,110,20,130 ; movd (%rdx,%r8,4),%xmm2
- DB 235,185 ; jmp 268b6 <_sk_load_bgra_dst_sse41_8bit+0x2e>
- DB 102,66,15,110,84,130,8 ; movd 0x8(%rdx,%r8,4),%xmm2
+ DB 102,67,15,110,20,152 ; movd (%r8,%r11,4),%xmm2
+ DB 235,182 ; jmp 26831 <_sk_load_bgra_dst_sse41_8bit+0x29>
+ DB 102,67,15,110,84,152,8 ; movd 0x8(%r8,%r11,4),%xmm2
DB 102,15,112,210,69 ; pshufd $0x45,%xmm2,%xmm2
- DB 243,66,15,126,36,130 ; movq (%rdx,%r8,4),%xmm4
+ DB 243,67,15,126,36,152 ; movq (%r8,%r11,4),%xmm4
DB 102,15,58,14,212,15 ; pblendw $0xf,%xmm4,%xmm2
- DB 235,159 ; jmp 268b6 <_sk_load_bgra_dst_sse41_8bit+0x2e>
- DB 102,66,15,110,84,130,24 ; movd 0x18(%rdx,%r8,4),%xmm2
+ DB 235,156 ; jmp 26831 <_sk_load_bgra_dst_sse41_8bit+0x29>
+ DB 102,67,15,110,84,152,24 ; movd 0x18(%r8,%r11,4),%xmm2
DB 102,15,112,218,69 ; pshufd $0x45,%xmm2,%xmm3
- DB 102,66,15,58,34,92,130,20,1 ; pinsrd $0x1,0x14(%rdx,%r8,4),%xmm3
- DB 102,66,15,58,34,92,130,16,0 ; pinsrd $0x0,0x10(%rdx,%r8,4),%xmm3
- DB 233,118,255,255,255 ; jmpq 268b0 <_sk_load_bgra_dst_sse41_8bit+0x28>
- DB 102,144 ; xchg %ax,%ax
- DB 185,255,255,255,205 ; mov $0xcdffffff,%ecx
+ DB 102,67,15,58,34,92,152,20,1 ; pinsrd $0x1,0x14(%r8,%r11,4),%xmm3
+ DB 102,67,15,58,34,92,152,16,0 ; pinsrd $0x0,0x10(%r8,%r11,4),%xmm3
+ DB 233,115,255,255,255 ; jmpq 2682b <_sk_load_bgra_dst_sse41_8bit+0x23>
+ DB 187,255,255,255,207 ; mov $0xcfffffff,%ebx
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,193 ; inc %ecx
+ DB 255,195 ; inc %ebx
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,116,255,255 ; pushq -0x1(%rdi,%rdi,8)
- DB 255,240 ; push %rax
+ DB 255,115,255 ; pushq -0x1(%rbx)
DB 255 ; (bad)
+ DB 255,242 ; push %rdx
DB 255 ; (bad)
- DB 255,231 ; jmpq *%rdi
DB 255 ; (bad)
DB 255 ; (bad)
+ DB 233,255,255,255,221 ; jmpq ffffffffde0268d0 <_sk_overlay_sse2_8bit+0xffffffffddffad20>
DB 255 ; (bad)
- DB 219,255 ; (bad)
DB 255 ; (bad)
DB 255 ; .byte 0xff
PUBLIC _sk_store_bgra_sse41_8bit
_sk_store_bgra_sse41_8bit LABEL PROC
- DB 76,99,15 ; movslq (%rdi),%r9
- DB 76,139,71,16 ; mov 0x10(%rdi),%r8
- DB 72,173 ; lods %ds:(%rsi),%rax
- DB 72,99,72,8 ; movslq 0x8(%rax),%rcx
- DB 72,99,87,8 ; movslq 0x8(%rdi),%rdx
- DB 72,15,175,209 ; imul %rcx,%rdx
- DB 72,193,226,2 ; shl $0x2,%rdx
- DB 72,3,16 ; add (%rax),%rdx
- DB 102,15,111,53,180,104,0,0 ; movdqa 0x68b4(%rip),%xmm6 # 2d230 <_sk_overlay_sse2_8bit+0x15bb>
+ DB 72,173 ; lods %ds:(%rsi),%rax
+ DB 76,99,72,8 ; movslq 0x8(%rax),%r9
+ DB 76,99,193 ; movslq %ecx,%r8
+ DB 77,15,175,193 ; imul %r9,%r8
+ DB 73,193,224,2 ; shl $0x2,%r8
+ DB 76,3,0 ; add (%rax),%r8
+ DB 76,99,218 ; movslq %edx,%r11
+ DB 102,15,111,53,125,104,0,0 ; movdqa 0x687d(%rip),%xmm6 # 2d170 <_sk_overlay_sse2_8bit+0x15c0>
DB 102,15,111,233 ; movdqa %xmm1,%xmm5
DB 102,15,56,0,238 ; pshufb %xmm6,%xmm5
DB 102,15,111,224 ; movdqa %xmm0,%xmm4
DB 102,15,56,0,230 ; pshufb %xmm6,%xmm4
- DB 77,133,192 ; test %r8,%r8
- DB 117,17 ; jne 269a4 <_sk_store_bgra_sse41_8bit+0x4c>
- DB 243,66,15,127,36,138 ; movdqu %xmm4,(%rdx,%r9,4)
- DB 243,66,15,127,108,138,16 ; movdqu %xmm5,0x10(%rdx,%r9,4)
- DB 72,173 ; lods %ds:(%rsi),%rax
- DB 255,224 ; jmpq *%rax
- DB 65,128,224,7 ; and $0x7,%r8b
- DB 65,254,200 ; dec %r8b
- DB 65,128,248,6 ; cmp $0x6,%r8b
- DB 119,239 ; ja 269a0 <_sk_store_bgra_sse41_8bit+0x48>
- DB 65,15,182,192 ; movzbl %r8b,%eax
- DB 72,141,13,68,0,0,0 ; lea 0x44(%rip),%rcx # 26a00 <_sk_store_bgra_sse41_8bit+0xa8>
- DB 72,99,4,129 ; movslq (%rcx,%rax,4),%rax
- DB 72,1,200 ; add %rcx,%rax
- DB 255,224 ; jmpq *%rax
- DB 102,66,15,126,36,138 ; movd %xmm4,(%rdx,%r9,4)
- DB 235,211 ; jmp 269a0 <_sk_store_bgra_sse41_8bit+0x48>
- DB 102,66,15,58,22,100,138,8,2 ; pextrd $0x2,%xmm4,0x8(%rdx,%r9,4)
- DB 102,66,15,214,36,138 ; movq %xmm4,(%rdx,%r9,4)
- DB 235,194 ; jmp 269a0 <_sk_store_bgra_sse41_8bit+0x48>
- DB 102,66,15,58,22,108,138,24,2 ; pextrd $0x2,%xmm5,0x18(%rdx,%r9,4)
- DB 102,66,15,58,22,108,138,20,1 ; pextrd $0x1,%xmm5,0x14(%rdx,%r9,4)
- DB 102,66,15,126,108,138,16 ; movd %xmm5,0x10(%rdx,%r9,4)
- DB 243,66,15,127,36,138 ; movdqu %xmm4,(%rdx,%r9,4)
- DB 235,161 ; jmp 269a0 <_sk_store_bgra_sse41_8bit+0x48>
- DB 144 ; nop
- DB 197,255,255 ; (bad)
- DB 255,214 ; callq *%rsi
+ DB 72,133,255 ; test %rdi,%rdi
+ DB 117,17 ; jne 2691b <_sk_store_bgra_sse41_8bit+0x47>
+ DB 243,67,15,127,36,152 ; movdqu %xmm4,(%r8,%r11,4)
+ DB 243,67,15,127,108,152,16 ; movdqu %xmm5,0x10(%r8,%r11,4)
+ DB 72,173 ; lods %ds:(%rsi),%rax
+ DB 255,224 ; jmpq *%rax
+ DB 65,137,249 ; mov %edi,%r9d
+ DB 65,128,225,7 ; and $0x7,%r9b
+ DB 65,254,201 ; dec %r9b
+ DB 65,128,249,6 ; cmp $0x6,%r9b
+ DB 119,236 ; ja 26917 <_sk_store_bgra_sse41_8bit+0x43>
+ DB 69,15,182,201 ; movzbl %r9b,%r9d
+ DB 76,141,21,70,0,0,0 ; lea 0x46(%rip),%r10 # 2697c <_sk_store_bgra_sse41_8bit+0xa8>
+ DB 75,99,4,138 ; movslq (%r10,%r9,4),%rax
+ DB 76,1,208 ; add %r10,%rax
+ DB 255,224 ; jmpq *%rax
+ DB 102,67,15,126,36,152 ; movd %xmm4,(%r8,%r11,4)
+ DB 235,208 ; jmp 26917 <_sk_store_bgra_sse41_8bit+0x43>
+ DB 102,67,15,58,22,100,152,8,2 ; pextrd $0x2,%xmm4,0x8(%r8,%r11,4)
+ DB 102,67,15,214,36,152 ; movq %xmm4,(%r8,%r11,4)
+ DB 235,191 ; jmp 26917 <_sk_store_bgra_sse41_8bit+0x43>
+ DB 102,67,15,58,22,108,152,24,2 ; pextrd $0x2,%xmm5,0x18(%r8,%r11,4)
+ DB 102,67,15,58,22,108,152,20,1 ; pextrd $0x1,%xmm5,0x14(%r8,%r11,4)
+ DB 102,67,15,126,108,152,16 ; movd %xmm5,0x10(%r8,%r11,4)
+ DB 243,67,15,127,36,152 ; movdqu %xmm4,(%r8,%r11,4)
+ DB 235,158 ; jmp 26917 <_sk_store_bgra_sse41_8bit+0x43>
+ DB 15,31,0 ; nopl (%rax)
+ DB 195 ; retq
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,205 ; dec %ebp
+ DB 255,212 ; callq *%rsp
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,247 ; push %rdi
+ DB 255,203 ; dec %ebx
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,240 ; push %rax
+ DB 255,245 ; push %rbp
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,231 ; jmpq *%rdi
DB 255 ; (bad)
+ DB 238 ; out %al,(%dx)
+ DB 255 ; (bad)
+ DB 255 ; (bad)
+ DB 255,229 ; jmpq *%rbp
DB 255 ; (bad)
DB 255 ; (bad)
- DB 222,255 ; fdivrp %st,%st(7)
+ DB 255 ; (bad)
+ DB 220,255 ; fdivr %st,%st(7)
DB 255 ; (bad)
DB 255 ; .byte 0xff
PUBLIC _sk_load_a8_sse41_8bit
_sk_load_a8_sse41_8bit LABEL PROC
- DB 76,99,7 ; movslq (%rdi),%r8
- DB 76,139,79,16 ; mov 0x10(%rdi),%r9
- DB 72,173 ; lods %ds:(%rsi),%rax
- DB 72,99,72,8 ; movslq 0x8(%rax),%rcx
- DB 72,99,87,8 ; movslq 0x8(%rdi),%rdx
- DB 72,15,175,209 ; imul %rcx,%rdx
- DB 72,3,16 ; add (%rax),%rdx
- DB 77,133,201 ; test %r9,%r9
- DB 117,42 ; jne 26a63 <_sk_load_a8_sse41_8bit+0x47>
- DB 102,66,15,56,48,12,2 ; pmovzxbw (%rdx,%r8,1),%xmm1
- DB 102,15,219,13,136,96,0,0 ; pand 0x6088(%rip),%xmm1 # 2cad0 <_sk_overlay_sse2_8bit+0xe5b>
+ DB 72,173 ; lods %ds:(%rsi),%rax
+ DB 76,99,72,8 ; movslq 0x8(%rax),%r9
+ DB 76,99,193 ; movslq %ecx,%r8
+ DB 77,15,175,193 ; imul %r9,%r8
+ DB 76,3,0 ; add (%rax),%r8
+ DB 76,99,218 ; movslq %edx,%r11
+ DB 72,133,255 ; test %rdi,%rdi
+ DB 117,42 ; jne 269da <_sk_load_a8_sse41_8bit+0x42>
+ DB 102,67,15,56,48,12,24 ; pmovzxbw (%r8,%r11,1),%xmm1
+ DB 102,15,219,13,81,96,0,0 ; pand 0x6051(%rip),%xmm1 # 2ca10 <_sk_overlay_sse2_8bit+0xe60>
DB 102,15,239,228 ; pxor %xmm4,%xmm4
DB 102,15,56,51,193 ; pmovzxwd %xmm1,%xmm0
DB 102,15,105,204 ; punpckhwd %xmm4,%xmm1
@@ -36879,70 +36874,71 @@ _sk_load_a8_sse41_8bit LABEL PROC
DB 102,15,114,240,24 ; pslld $0x18,%xmm0
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
+ DB 65,137,249 ; mov %edi,%r9d
DB 65,128,225,7 ; and $0x7,%r9b
DB 102,15,239,201 ; pxor %xmm1,%xmm1
DB 65,254,201 ; dec %r9b
DB 65,128,249,6 ; cmp $0x6,%r9b
- DB 119,204 ; ja 26a40 <_sk_load_a8_sse41_8bit+0x24>
- DB 65,15,182,193 ; movzbl %r9b,%eax
- DB 72,141,13,117,0,0,0 ; lea 0x75(%rip),%rcx # 26af4 <_sk_load_a8_sse41_8bit+0xd8>
- DB 72,99,4,129 ; movslq (%rcx,%rax,4),%rax
- DB 72,1,200 ; add %rcx,%rax
+ DB 119,201 ; ja 269b7 <_sk_load_a8_sse41_8bit+0x1f>
+ DB 69,15,182,201 ; movzbl %r9b,%r9d
+ DB 76,141,21,119,0,0,0 ; lea 0x77(%rip),%r10 # 26a70 <_sk_load_a8_sse41_8bit+0xd8>
+ DB 75,99,4,138 ; movslq (%r10,%r9,4),%rax
+ DB 76,1,208 ; add %r10,%rax
DB 255,224 ; jmpq *%rax
- DB 66,15,182,4,2 ; movzbl (%rdx,%r8,1),%eax
+ DB 67,15,182,4,24 ; movzbl (%r8,%r11,1),%eax
DB 102,15,110,200 ; movd %eax,%xmm1
- DB 235,173 ; jmp 26a40 <_sk_load_a8_sse41_8bit+0x24>
- DB 66,15,182,68,2,2 ; movzbl 0x2(%rdx,%r8,1),%eax
+ DB 235,170 ; jmp 269b7 <_sk_load_a8_sse41_8bit+0x1f>
+ DB 67,15,182,68,24,2 ; movzbl 0x2(%r8,%r11,1),%eax
DB 102,15,239,201 ; pxor %xmm1,%xmm1
DB 102,15,196,200,2 ; pinsrw $0x2,%eax,%xmm1
- DB 66,15,183,4,2 ; movzwl (%rdx,%r8,1),%eax
+ DB 67,15,183,4,24 ; movzwl (%r8,%r11,1),%eax
DB 102,15,110,192 ; movd %eax,%xmm0
DB 102,15,56,48,192 ; pmovzxbw %xmm0,%xmm0
DB 102,15,58,14,200,3 ; pblendw $0x3,%xmm0,%xmm1
- DB 235,136 ; jmp 26a40 <_sk_load_a8_sse41_8bit+0x24>
- DB 66,15,182,68,2,6 ; movzbl 0x6(%rdx,%r8,1),%eax
+ DB 235,133 ; jmp 269b7 <_sk_load_a8_sse41_8bit+0x1f>
+ DB 67,15,182,68,24,6 ; movzbl 0x6(%r8,%r11,1),%eax
DB 102,15,239,201 ; pxor %xmm1,%xmm1
DB 102,15,196,200,6 ; pinsrw $0x6,%eax,%xmm1
- DB 66,15,182,68,2,5 ; movzbl 0x5(%rdx,%r8,1),%eax
+ DB 67,15,182,68,24,5 ; movzbl 0x5(%r8,%r11,1),%eax
DB 102,15,196,200,5 ; pinsrw $0x5,%eax,%xmm1
- DB 66,15,182,68,2,4 ; movzbl 0x4(%rdx,%r8,1),%eax
+ DB 67,15,182,68,24,4 ; movzbl 0x4(%r8,%r11,1),%eax
DB 102,15,196,200,4 ; pinsrw $0x4,%eax,%xmm1
- DB 102,66,15,110,4,2 ; movd (%rdx,%r8,1),%xmm0
+ DB 102,67,15,110,4,24 ; movd (%r8,%r11,1),%xmm0
DB 102,15,56,48,192 ; pmovzxbw %xmm0,%xmm0
DB 102,15,58,14,200,15 ; pblendw $0xf,%xmm0,%xmm1
- DB 233,77,255,255,255 ; jmpq 26a40 <_sk_load_a8_sse41_8bit+0x24>
- DB 144 ; nop
- DB 148 ; xchg %eax,%esp
+ DB 233,74,255,255,255 ; jmpq 269b7 <_sk_load_a8_sse41_8bit+0x1f>
+ DB 15,31,0 ; nopl (%rax)
+ DB 146 ; xchg %eax,%edx
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,174,255,255,255,159 ; ljmp *-0x60000001(%rsi)
+ DB 255,172,255,255,255,157,255 ; ljmp *-0x620001(%rdi,%rdi,8)
DB 255 ; (bad)
+ DB 255,231 ; jmpq *%rdi
DB 255 ; (bad)
DB 255 ; (bad)
- DB 233,255,255,255,222 ; jmpq ffffffffdf026b04 <_sk_overlay_sse2_8bit+0xffffffffdeffae8f>
DB 255 ; (bad)
+ DB 220,255 ; fdivr %st,%st(7)
DB 255 ; (bad)
- DB 255,211 ; callq *%rbx
+ DB 255,209 ; callq *%rcx
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,196 ; inc %esp
+ DB 255,194 ; inc %edx
DB 255 ; (bad)
DB 255 ; (bad)
DB 255 ; .byte 0xff
PUBLIC _sk_load_a8_dst_sse41_8bit
_sk_load_a8_dst_sse41_8bit LABEL PROC
- DB 76,99,7 ; movslq (%rdi),%r8
- DB 76,139,79,16 ; mov 0x10(%rdi),%r9
- DB 72,173 ; lods %ds:(%rsi),%rax
- DB 72,99,72,8 ; movslq 0x8(%rax),%rcx
- DB 72,99,87,8 ; movslq 0x8(%rdi),%rdx
- DB 72,15,175,209 ; imul %rcx,%rdx
- DB 72,3,16 ; add (%rax),%rdx
- DB 77,133,201 ; test %r9,%r9
- DB 117,42 ; jne 26b57 <_sk_load_a8_dst_sse41_8bit+0x47>
- DB 102,66,15,56,48,28,2 ; pmovzxbw (%rdx,%r8,1),%xmm3
- DB 102,15,219,29,148,95,0,0 ; pand 0x5f94(%rip),%xmm3 # 2cad0 <_sk_overlay_sse2_8bit+0xe5b>
+ DB 72,173 ; lods %ds:(%rsi),%rax
+ DB 76,99,72,8 ; movslq 0x8(%rax),%r9
+ DB 76,99,193 ; movslq %ecx,%r8
+ DB 77,15,175,193 ; imul %r9,%r8
+ DB 76,3,0 ; add (%rax),%r8
+ DB 76,99,218 ; movslq %edx,%r11
+ DB 72,133,255 ; test %rdi,%rdi
+ DB 117,42 ; jne 26ace <_sk_load_a8_dst_sse41_8bit+0x42>
+ DB 102,67,15,56,48,28,24 ; pmovzxbw (%r8,%r11,1),%xmm3
+ DB 102,15,219,29,93,95,0,0 ; pand 0x5f5d(%rip),%xmm3 # 2ca10 <_sk_overlay_sse2_8bit+0xe60>
DB 102,15,239,228 ; pxor %xmm4,%xmm4
DB 102,15,56,51,211 ; pmovzxwd %xmm3,%xmm2
DB 102,15,105,220 ; punpckhwd %xmm4,%xmm3
@@ -36950,288 +36946,289 @@ _sk_load_a8_dst_sse41_8bit LABEL PROC
DB 102,15,114,242,24 ; pslld $0x18,%xmm2
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
+ DB 65,137,249 ; mov %edi,%r9d
DB 65,128,225,7 ; and $0x7,%r9b
DB 102,15,239,219 ; pxor %xmm3,%xmm3
DB 65,254,201 ; dec %r9b
DB 65,128,249,6 ; cmp $0x6,%r9b
- DB 119,204 ; ja 26b34 <_sk_load_a8_dst_sse41_8bit+0x24>
- DB 65,15,182,193 ; movzbl %r9b,%eax
- DB 72,141,13,117,0,0,0 ; lea 0x75(%rip),%rcx # 26be8 <_sk_load_a8_dst_sse41_8bit+0xd8>
- DB 72,99,4,129 ; movslq (%rcx,%rax,4),%rax
- DB 72,1,200 ; add %rcx,%rax
+ DB 119,201 ; ja 26aab <_sk_load_a8_dst_sse41_8bit+0x1f>
+ DB 69,15,182,201 ; movzbl %r9b,%r9d
+ DB 76,141,21,119,0,0,0 ; lea 0x77(%rip),%r10 # 26b64 <_sk_load_a8_dst_sse41_8bit+0xd8>
+ DB 75,99,4,138 ; movslq (%r10,%r9,4),%rax
+ DB 76,1,208 ; add %r10,%rax
DB 255,224 ; jmpq *%rax
- DB 66,15,182,4,2 ; movzbl (%rdx,%r8,1),%eax
+ DB 67,15,182,4,24 ; movzbl (%r8,%r11,1),%eax
DB 102,15,110,216 ; movd %eax,%xmm3
- DB 235,173 ; jmp 26b34 <_sk_load_a8_dst_sse41_8bit+0x24>
- DB 66,15,182,68,2,2 ; movzbl 0x2(%rdx,%r8,1),%eax
+ DB 235,170 ; jmp 26aab <_sk_load_a8_dst_sse41_8bit+0x1f>
+ DB 67,15,182,68,24,2 ; movzbl 0x2(%r8,%r11,1),%eax
DB 102,15,239,219 ; pxor %xmm3,%xmm3
DB 102,15,196,216,2 ; pinsrw $0x2,%eax,%xmm3
- DB 66,15,183,4,2 ; movzwl (%rdx,%r8,1),%eax
+ DB 67,15,183,4,24 ; movzwl (%r8,%r11,1),%eax
DB 102,15,110,208 ; movd %eax,%xmm2
DB 102,15,56,48,210 ; pmovzxbw %xmm2,%xmm2
DB 102,15,58,14,218,3 ; pblendw $0x3,%xmm2,%xmm3
- DB 235,136 ; jmp 26b34 <_sk_load_a8_dst_sse41_8bit+0x24>
- DB 66,15,182,68,2,6 ; movzbl 0x6(%rdx,%r8,1),%eax
+ DB 235,133 ; jmp 26aab <_sk_load_a8_dst_sse41_8bit+0x1f>
+ DB 67,15,182,68,24,6 ; movzbl 0x6(%r8,%r11,1),%eax
DB 102,15,239,219 ; pxor %xmm3,%xmm3
DB 102,15,196,216,6 ; pinsrw $0x6,%eax,%xmm3
- DB 66,15,182,68,2,5 ; movzbl 0x5(%rdx,%r8,1),%eax
+ DB 67,15,182,68,24,5 ; movzbl 0x5(%r8,%r11,1),%eax
DB 102,15,196,216,5 ; pinsrw $0x5,%eax,%xmm3
- DB 66,15,182,68,2,4 ; movzbl 0x4(%rdx,%r8,1),%eax
+ DB 67,15,182,68,24,4 ; movzbl 0x4(%r8,%r11,1),%eax
DB 102,15,196,216,4 ; pinsrw $0x4,%eax,%xmm3
- DB 102,66,15,110,20,2 ; movd (%rdx,%r8,1),%xmm2
+ DB 102,67,15,110,20,24 ; movd (%r8,%r11,1),%xmm2
DB 102,15,56,48,210 ; pmovzxbw %xmm2,%xmm2
DB 102,15,58,14,218,15 ; pblendw $0xf,%xmm2,%xmm3
- DB 233,77,255,255,255 ; jmpq 26b34 <_sk_load_a8_dst_sse41_8bit+0x24>
- DB 144 ; nop
- DB 148 ; xchg %eax,%esp
+ DB 233,74,255,255,255 ; jmpq 26aab <_sk_load_a8_dst_sse41_8bit+0x1f>
+ DB 15,31,0 ; nopl (%rax)
+ DB 146 ; xchg %eax,%edx
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,174,255,255,255,159 ; ljmp *-0x60000001(%rsi)
+ DB 255,172,255,255,255,157,255 ; ljmp *-0x620001(%rdi,%rdi,8)
DB 255 ; (bad)
+ DB 255,231 ; jmpq *%rdi
DB 255 ; (bad)
DB 255 ; (bad)
- DB 233,255,255,255,222 ; jmpq ffffffffdf026bf8 <_sk_overlay_sse2_8bit+0xffffffffdeffaf83>
DB 255 ; (bad)
+ DB 220,255 ; fdivr %st,%st(7)
DB 255 ; (bad)
- DB 255,211 ; callq *%rbx
+ DB 255,209 ; callq *%rcx
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,196 ; inc %esp
+ DB 255,194 ; inc %edx
DB 255 ; (bad)
DB 255 ; (bad)
DB 255 ; .byte 0xff
PUBLIC _sk_store_a8_sse41_8bit
_sk_store_a8_sse41_8bit LABEL PROC
- DB 76,99,7 ; movslq (%rdi),%r8
- DB 76,139,79,16 ; mov 0x10(%rdi),%r9
- DB 72,173 ; lods %ds:(%rsi),%rax
- DB 72,99,72,8 ; movslq 0x8(%rax),%rcx
- DB 72,99,87,8 ; movslq 0x8(%rdi),%rdx
- DB 72,15,175,209 ; imul %rcx,%rdx
- DB 72,3,16 ; add (%rax),%rdx
- DB 102,15,111,45,28,102,0,0 ; movdqa 0x661c(%rip),%xmm5 # 2d240 <_sk_overlay_sse2_8bit+0x15cb>
+ DB 72,173 ; lods %ds:(%rsi),%rax
+ DB 76,99,72,8 ; movslq 0x8(%rax),%r9
+ DB 76,99,193 ; movslq %ecx,%r8
+ DB 77,15,175,193 ; imul %r9,%r8
+ DB 76,3,0 ; add (%rax),%r8
+ DB 76,99,218 ; movslq %edx,%r11
+ DB 102,15,111,45,229,101,0,0 ; movdqa 0x65e5(%rip),%xmm5 # 2d180 <_sk_overlay_sse2_8bit+0x15d0>
DB 102,15,111,241 ; movdqa %xmm1,%xmm6
DB 102,15,56,0,245 ; pshufb %xmm5,%xmm6
DB 102,15,111,224 ; movdqa %xmm0,%xmm4
DB 102,15,56,0,229 ; pshufb %xmm5,%xmm4
DB 102,15,108,230 ; punpcklqdq %xmm6,%xmm4
- DB 77,133,201 ; test %r9,%r9
- DB 117,19 ; jne 26c52 <_sk_store_a8_sse41_8bit+0x4e>
- DB 102,15,56,0,37,184,101,0,0 ; pshufb 0x65b8(%rip),%xmm4 # 2d200 <_sk_overlay_sse2_8bit+0x158b>
- DB 102,66,15,214,36,2 ; movq %xmm4,(%rdx,%r8,1)
+ DB 72,133,255 ; test %rdi,%rdi
+ DB 117,19 ; jne 26bc9 <_sk_store_a8_sse41_8bit+0x49>
+ DB 102,15,56,0,37,129,101,0,0 ; pshufb 0x6581(%rip),%xmm4 # 2d140 <_sk_overlay_sse2_8bit+0x1590>
+ DB 102,67,15,214,36,24 ; movq %xmm4,(%r8,%r11,1)
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
+ DB 65,137,249 ; mov %edi,%r9d
DB 65,128,225,7 ; and $0x7,%r9b
DB 65,254,201 ; dec %r9b
DB 65,128,249,6 ; cmp $0x6,%r9b
- DB 119,239 ; ja 26c4e <_sk_store_a8_sse41_8bit+0x4a>
- DB 65,15,182,193 ; movzbl %r9b,%eax
- DB 72,141,13,94,0,0,0 ; lea 0x5e(%rip),%rcx # 26cc8 <_sk_store_a8_sse41_8bit+0xc4>
- DB 72,99,4,129 ; movslq (%rcx,%rax,4),%rax
- DB 72,1,200 ; add %rcx,%rax
- DB 255,224 ; jmpq *%rax
- DB 102,66,15,58,20,36,2,0 ; pextrb $0x0,%xmm4,(%rdx,%r8,1)
- DB 235,209 ; jmp 26c4e <_sk_store_a8_sse41_8bit+0x4a>
- DB 102,66,15,58,20,100,2,2,4 ; pextrb $0x4,%xmm4,0x2(%rdx,%r8,1)
- DB 102,15,56,0,37,81,94,0,0 ; pshufb 0x5e51(%rip),%xmm4 # 2cae0 <_sk_overlay_sse2_8bit+0xe6b>
- DB 102,66,15,58,21,36,2,0 ; pextrw $0x0,%xmm4,(%rdx,%r8,1)
- DB 235,181 ; jmp 26c4e <_sk_store_a8_sse41_8bit+0x4a>
- DB 102,66,15,58,20,100,2,6,12 ; pextrb $0xc,%xmm4,0x6(%rdx,%r8,1)
- DB 102,66,15,58,20,100,2,5,10 ; pextrb $0xa,%xmm4,0x5(%rdx,%r8,1)
- DB 102,66,15,58,20,100,2,4,8 ; pextrb $0x8,%xmm4,0x4(%rdx,%r8,1)
- DB 102,15,56,0,37,51,94,0,0 ; pshufb 0x5e33(%rip),%xmm4 # 2caf0 <_sk_overlay_sse2_8bit+0xe7b>
- DB 102,66,15,126,36,2 ; movd %xmm4,(%rdx,%r8,1)
- DB 235,137 ; jmp 26c4e <_sk_store_a8_sse41_8bit+0x4a>
- DB 15,31,0 ; nopl (%rax)
- DB 171 ; stos %eax,%es:(%rdi)
- DB 255 ; (bad)
- DB 255 ; (bad)
+ DB 119,236 ; ja 26bc5 <_sk_store_a8_sse41_8bit+0x45>
+ DB 69,15,182,201 ; movzbl %r9b,%r9d
+ DB 76,141,21,92,0,0,0 ; lea 0x5c(%rip),%r10 # 26c40 <_sk_store_a8_sse41_8bit+0xc0>
+ DB 75,99,4,138 ; movslq (%r10,%r9,4),%rax
+ DB 76,1,208 ; add %r10,%rax
+ DB 255,224 ; jmpq *%rax
+ DB 102,67,15,58,20,36,24,0 ; pextrb $0x0,%xmm4,(%r8,%r11,1)
+ DB 235,206 ; jmp 26bc5 <_sk_store_a8_sse41_8bit+0x45>
+ DB 102,67,15,58,20,100,24,2,4 ; pextrb $0x4,%xmm4,0x2(%r8,%r11,1)
+ DB 102,15,56,0,37,23,94,0,0 ; pshufb 0x5e17(%rip),%xmm4 # 2ca20 <_sk_overlay_sse2_8bit+0xe70>
+ DB 102,67,15,58,21,36,24,0 ; pextrw $0x0,%xmm4,(%r8,%r11,1)
+ DB 235,178 ; jmp 26bc5 <_sk_store_a8_sse41_8bit+0x45>
+ DB 102,67,15,58,20,100,24,6,12 ; pextrb $0xc,%xmm4,0x6(%r8,%r11,1)
+ DB 102,67,15,58,20,100,24,5,10 ; pextrb $0xa,%xmm4,0x5(%r8,%r11,1)
+ DB 102,67,15,58,20,100,24,4,8 ; pextrb $0x8,%xmm4,0x4(%r8,%r11,1)
+ DB 102,15,56,0,37,249,93,0,0 ; pshufb 0x5df9(%rip),%xmm4 # 2ca30 <_sk_overlay_sse2_8bit+0xe80>
+ DB 102,67,15,126,36,24 ; movd %xmm4,(%r8,%r11,1)
+ DB 235,134 ; jmp 26bc5 <_sk_store_a8_sse41_8bit+0x45>
+ DB 144 ; nop
+ DB 173 ; lods %ds:(%rsi),%eax
DB 255 ; (bad)
- DB 190,255,255,255,181 ; mov $0xb5ffffff,%esi
DB 255 ; (bad)
+ DB 255,192 ; inc %eax
DB 255 ; (bad)
DB 255 ; (bad)
- DB 236 ; in (%dx),%al
+ DB 255,183,255,255,255,238 ; pushq -0x11000001(%rdi)
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,227 ; jmpq *%rbx
+ DB 255,229 ; jmpq *%rbp
DB 255 ; (bad)
DB 255 ; (bad)
DB 255 ; (bad)
- DB 218,255 ; (bad)
+ DB 220,255 ; fdivr %st,%st(7)
DB 255 ; (bad)
- DB 255,209 ; callq *%rcx
+ DB 255,211 ; callq *%rbx
DB 255 ; (bad)
DB 255 ; (bad)
DB 255 ; .byte 0xff
PUBLIC _sk_load_g8_sse41_8bit
_sk_load_g8_sse41_8bit LABEL PROC
- DB 76,99,7 ; movslq (%rdi),%r8
- DB 76,139,79,16 ; mov 0x10(%rdi),%r9
- DB 72,173 ; lods %ds:(%rsi),%rax
- DB 72,99,72,8 ; movslq 0x8(%rax),%rcx
- DB 72,99,87,8 ; movslq 0x8(%rdi),%rdx
- DB 72,15,175,209 ; imul %rcx,%rdx
- DB 72,3,16 ; add (%rax),%rdx
- DB 77,133,201 ; test %r9,%r9
- DB 117,66 ; jne 26d43 <_sk_load_g8_sse41_8bit+0x5f>
- DB 102,66,15,56,48,12,2 ; pmovzxbw (%rdx,%r8,1),%xmm1
- DB 102,15,219,13,192,93,0,0 ; pand 0x5dc0(%rip),%xmm1 # 2cad0 <_sk_overlay_sse2_8bit+0xe5b>
+ DB 72,173 ; lods %ds:(%rsi),%rax
+ DB 76,99,72,8 ; movslq 0x8(%rax),%r9
+ DB 76,99,193 ; movslq %ecx,%r8
+ DB 77,15,175,193 ; imul %r9,%r8
+ DB 76,3,0 ; add (%rax),%r8
+ DB 76,99,218 ; movslq %edx,%r11
+ DB 72,133,255 ; test %rdi,%rdi
+ DB 117,66 ; jne 26cb6 <_sk_load_g8_sse41_8bit+0x5a>
+ DB 102,67,15,56,48,12,24 ; pmovzxbw (%r8,%r11,1),%xmm1
+ DB 102,15,219,13,141,93,0,0 ; pand 0x5d8d(%rip),%xmm1 # 2ca10 <_sk_overlay_sse2_8bit+0xe60>
DB 102,15,239,228 ; pxor %xmm4,%xmm4
DB 102,15,56,51,193 ; pmovzxwd %xmm1,%xmm0
DB 102,15,105,204 ; punpckhwd %xmm4,%xmm1
- DB 102,15,111,37,43,101,0,0 ; movdqa 0x652b(%rip),%xmm4 # 2d250 <_sk_overlay_sse2_8bit+0x15db>
+ DB 102,15,111,37,248,100,0,0 ; movdqa 0x64f8(%rip),%xmm4 # 2d190 <_sk_overlay_sse2_8bit+0x15e0>
DB 102,15,56,64,204 ; pmulld %xmm4,%xmm1
DB 102,15,56,64,196 ; pmulld %xmm4,%xmm0
- DB 102,15,111,37,217,100,0,0 ; movdqa 0x64d9(%rip),%xmm4 # 2d210 <_sk_overlay_sse2_8bit+0x159b>
+ DB 102,15,111,37,166,100,0,0 ; movdqa 0x64a6(%rip),%xmm4 # 2d150 <_sk_overlay_sse2_8bit+0x15a0>
DB 102,15,235,196 ; por %xmm4,%xmm0
DB 102,15,235,204 ; por %xmm4,%xmm1
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
+ DB 65,137,249 ; mov %edi,%r9d
DB 65,128,225,7 ; and $0x7,%r9b
DB 102,15,239,201 ; pxor %xmm1,%xmm1
DB 65,254,201 ; dec %r9b
DB 65,128,249,6 ; cmp $0x6,%r9b
- DB 119,180 ; ja 26d08 <_sk_load_g8_sse41_8bit+0x24>
- DB 65,15,182,193 ; movzbl %r9b,%eax
- DB 72,141,13,121,0,0,0 ; lea 0x79(%rip),%rcx # 26dd8 <_sk_load_g8_sse41_8bit+0xf4>
- DB 72,99,4,129 ; movslq (%rcx,%rax,4),%rax
- DB 72,1,200 ; add %rcx,%rax
+ DB 119,177 ; ja 26c7b <_sk_load_g8_sse41_8bit+0x1f>
+ DB 69,15,182,201 ; movzbl %r9b,%r9d
+ DB 76,141,21,119,0,0,0 ; lea 0x77(%rip),%r10 # 26d4c <_sk_load_g8_sse41_8bit+0xf0>
+ DB 75,99,4,138 ; movslq (%r10,%r9,4),%rax
+ DB 76,1,208 ; add %r10,%rax
DB 255,224 ; jmpq *%rax
- DB 66,15,182,4,2 ; movzbl (%rdx,%r8,1),%eax
+ DB 67,15,182,4,24 ; movzbl (%r8,%r11,1),%eax
DB 102,15,110,200 ; movd %eax,%xmm1
- DB 235,149 ; jmp 26d08 <_sk_load_g8_sse41_8bit+0x24>
- DB 66,15,182,68,2,2 ; movzbl 0x2(%rdx,%r8,1),%eax
+ DB 235,146 ; jmp 26c7b <_sk_load_g8_sse41_8bit+0x1f>
+ DB 67,15,182,68,24,2 ; movzbl 0x2(%r8,%r11,1),%eax
DB 102,15,239,201 ; pxor %xmm1,%xmm1
DB 102,15,196,200,2 ; pinsrw $0x2,%eax,%xmm1
- DB 66,15,183,4,2 ; movzwl (%rdx,%r8,1),%eax
+ DB 67,15,183,4,24 ; movzwl (%r8,%r11,1),%eax
DB 102,15,110,192 ; movd %eax,%xmm0
DB 102,15,56,48,192 ; pmovzxbw %xmm0,%xmm0
DB 102,15,58,14,200,3 ; pblendw $0x3,%xmm0,%xmm1
- DB 233,109,255,255,255 ; jmpq 26d08 <_sk_load_g8_sse41_8bit+0x24>
- DB 66,15,182,68,2,6 ; movzbl 0x6(%rdx,%r8,1),%eax
+ DB 233,106,255,255,255 ; jmpq 26c7b <_sk_load_g8_sse41_8bit+0x1f>
+ DB 67,15,182,68,24,6 ; movzbl 0x6(%r8,%r11,1),%eax
DB 102,15,239,201 ; pxor %xmm1,%xmm1
DB 102,15,196,200,6 ; pinsrw $0x6,%eax,%xmm1
- DB 66,15,182,68,2,5 ; movzbl 0x5(%rdx,%r8,1),%eax
+ DB 67,15,182,68,24,5 ; movzbl 0x5(%r8,%r11,1),%eax
DB 102,15,196,200,5 ; pinsrw $0x5,%eax,%xmm1
- DB 66,15,182,68,2,4 ; movzbl 0x4(%rdx,%r8,1),%eax
+ DB 67,15,182,68,24,4 ; movzbl 0x4(%r8,%r11,1),%eax
DB 102,15,196,200,4 ; pinsrw $0x4,%eax,%xmm1
- DB 102,66,15,110,4,2 ; movd (%rdx,%r8,1),%xmm0
+ DB 102,67,15,110,4,24 ; movd (%r8,%r11,1),%xmm0
DB 102,15,56,48,192 ; pmovzxbw %xmm0,%xmm0
DB 102,15,58,14,200,15 ; pblendw $0xf,%xmm0,%xmm1
- DB 233,50,255,255,255 ; jmpq 26d08 <_sk_load_g8_sse41_8bit+0x24>
- DB 102,144 ; xchg %ax,%ax
- DB 144 ; nop
+ DB 233,47,255,255,255 ; jmpq 26c7b <_sk_load_g8_sse41_8bit+0x1f>
+ DB 146 ; xchg %eax,%edx
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,170,255,255,255,155 ; ljmp *-0x64000001(%rdx)
+ DB 255,172,255,255,255,157,255 ; ljmp *-0x620001(%rdi,%rdi,8)
DB 255 ; (bad)
DB 255 ; (bad)
+ DB 234 ; (bad)
DB 255 ; (bad)
- DB 232,255,255,255,221 ; callq ffffffffde026de8 <_sk_overlay_sse2_8bit+0xffffffffddffb173>
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,210 ; callq *%rdx
+ DB 223,255 ; (bad)
DB 255 ; (bad)
+ DB 255,212 ; callq *%rsp
DB 255 ; (bad)
- DB 255,195 ; inc %ebx
+ DB 255 ; (bad)
+ DB 255,197 ; inc %ebp
DB 255 ; (bad)
DB 255 ; (bad)
DB 255 ; .byte 0xff
PUBLIC _sk_load_g8_dst_sse41_8bit
_sk_load_g8_dst_sse41_8bit LABEL PROC
- DB 76,99,7 ; movslq (%rdi),%r8
- DB 76,139,79,16 ; mov 0x10(%rdi),%r9
- DB 72,173 ; lods %ds:(%rsi),%rax
- DB 72,99,72,8 ; movslq 0x8(%rax),%rcx
- DB 72,99,87,8 ; movslq 0x8(%rdi),%rdx
- DB 72,15,175,209 ; imul %rcx,%rdx
- DB 72,3,16 ; add (%rax),%rdx
- DB 77,133,201 ; test %r9,%r9
- DB 117,66 ; jne 26e53 <_sk_load_g8_dst_sse41_8bit+0x5f>
- DB 102,66,15,56,48,28,2 ; pmovzxbw (%rdx,%r8,1),%xmm3
- DB 102,15,219,29,176,92,0,0 ; pand 0x5cb0(%rip),%xmm3 # 2cad0 <_sk_overlay_sse2_8bit+0xe5b>
+ DB 72,173 ; lods %ds:(%rsi),%rax
+ DB 76,99,72,8 ; movslq 0x8(%rax),%r9
+ DB 76,99,193 ; movslq %ecx,%r8
+ DB 77,15,175,193 ; imul %r9,%r8
+ DB 76,3,0 ; add (%rax),%r8
+ DB 76,99,218 ; movslq %edx,%r11
+ DB 72,133,255 ; test %rdi,%rdi
+ DB 117,66 ; jne 26dc2 <_sk_load_g8_dst_sse41_8bit+0x5a>
+ DB 102,67,15,56,48,28,24 ; pmovzxbw (%r8,%r11,1),%xmm3
+ DB 102,15,219,29,129,92,0,0 ; pand 0x5c81(%rip),%xmm3 # 2ca10 <_sk_overlay_sse2_8bit+0xe60>
DB 102,15,239,228 ; pxor %xmm4,%xmm4
DB 102,15,56,51,211 ; pmovzxwd %xmm3,%xmm2
DB 102,15,105,220 ; punpckhwd %xmm4,%xmm3
- DB 102,15,111,37,27,100,0,0 ; movdqa 0x641b(%rip),%xmm4 # 2d250 <_sk_overlay_sse2_8bit+0x15db>
+ DB 102,15,111,37,236,99,0,0 ; movdqa 0x63ec(%rip),%xmm4 # 2d190 <_sk_overlay_sse2_8bit+0x15e0>
DB 102,15,56,64,220 ; pmulld %xmm4,%xmm3
DB 102,15,56,64,212 ; pmulld %xmm4,%xmm2
- DB 102,15,111,37,201,99,0,0 ; movdqa 0x63c9(%rip),%xmm4 # 2d210 <_sk_overlay_sse2_8bit+0x159b>
+ DB 102,15,111,37,154,99,0,0 ; movdqa 0x639a(%rip),%xmm4 # 2d150 <_sk_overlay_sse2_8bit+0x15a0>
DB 102,15,235,212 ; por %xmm4,%xmm2
DB 102,15,235,220 ; por %xmm4,%xmm3
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
+ DB 65,137,249 ; mov %edi,%r9d
DB 65,128,225,7 ; and $0x7,%r9b
DB 102,15,239,219 ; pxor %xmm3,%xmm3
DB 65,254,201 ; dec %r9b
DB 65,128,249,6 ; cmp $0x6,%r9b
- DB 119,180 ; ja 26e18 <_sk_load_g8_dst_sse41_8bit+0x24>
- DB 65,15,182,193 ; movzbl %r9b,%eax
- DB 72,141,13,121,0,0,0 ; lea 0x79(%rip),%rcx # 26ee8 <_sk_load_g8_dst_sse41_8bit+0xf4>
- DB 72,99,4,129 ; movslq (%rcx,%rax,4),%rax
- DB 72,1,200 ; add %rcx,%rax
+ DB 119,177 ; ja 26d87 <_sk_load_g8_dst_sse41_8bit+0x1f>
+ DB 69,15,182,201 ; movzbl %r9b,%r9d
+ DB 76,141,21,119,0,0,0 ; lea 0x77(%rip),%r10 # 26e58 <_sk_load_g8_dst_sse41_8bit+0xf0>
+ DB 75,99,4,138 ; movslq (%r10,%r9,4),%rax
+ DB 76,1,208 ; add %r10,%rax
DB 255,224 ; jmpq *%rax
- DB 66,15,182,4,2 ; movzbl (%rdx,%r8,1),%eax
+ DB 67,15,182,4,24 ; movzbl (%r8,%r11,1),%eax
DB 102,15,110,216 ; movd %eax,%xmm3
- DB 235,149 ; jmp 26e18 <_sk_load_g8_dst_sse41_8bit+0x24>
- DB 66,15,182,68,2,2 ; movzbl 0x2(%rdx,%r8,1),%eax
+ DB 235,146 ; jmp 26d87 <_sk_load_g8_dst_sse41_8bit+0x1f>
+ DB 67,15,182,68,24,2 ; movzbl 0x2(%r8,%r11,1),%eax
DB 102,15,239,219 ; pxor %xmm3,%xmm3
DB 102,15,196,216,2 ; pinsrw $0x2,%eax,%xmm3
- DB 66,15,183,4,2 ; movzwl (%rdx,%r8,1),%eax
+ DB 67,15,183,4,24 ; movzwl (%r8,%r11,1),%eax
DB 102,15,110,208 ; movd %eax,%xmm2
DB 102,15,56,48,210 ; pmovzxbw %xmm2,%xmm2
DB 102,15,58,14,218,3 ; pblendw $0x3,%xmm2,%xmm3
- DB 233,109,255,255,255 ; jmpq 26e18 <_sk_load_g8_dst_sse41_8bit+0x24>
- DB 66,15,182,68,2,6 ; movzbl 0x6(%rdx,%r8,1),%eax
+ DB 233,106,255,255,255 ; jmpq 26d87 <_sk_load_g8_dst_sse41_8bit+0x1f>
+ DB 67,15,182,68,24,6 ; movzbl 0x6(%r8,%r11,1),%eax
DB 102,15,239,219 ; pxor %xmm3,%xmm3
DB 102,15,196,216,6 ; pinsrw $0x6,%eax,%xmm3
- DB 66,15,182,68,2,5 ; movzbl 0x5(%rdx,%r8,1),%eax
+ DB 67,15,182,68,24,5 ; movzbl 0x5(%r8,%r11,1),%eax
DB 102,15,196,216,5 ; pinsrw $0x5,%eax,%xmm3
- DB 66,15,182,68,2,4 ; movzbl 0x4(%rdx,%r8,1),%eax
+ DB 67,15,182,68,24,4 ; movzbl 0x4(%r8,%r11,1),%eax
DB 102,15,196,216,4 ; pinsrw $0x4,%eax,%xmm3
- DB 102,66,15,110,20,2 ; movd (%rdx,%r8,1),%xmm2
+ DB 102,67,15,110,20,24 ; movd (%r8,%r11,1),%xmm2
DB 102,15,56,48,210 ; pmovzxbw %xmm2,%xmm2
DB 102,15,58,14,218,15 ; pblendw $0xf,%xmm2,%xmm3
- DB 233,50,255,255,255 ; jmpq 26e18 <_sk_load_g8_dst_sse41_8bit+0x24>
- DB 102,144 ; xchg %ax,%ax
- DB 144 ; nop
+ DB 233,47,255,255,255 ; jmpq 26d87 <_sk_load_g8_dst_sse41_8bit+0x1f>
+ DB 146 ; xchg %eax,%edx
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,170,255,255,255,155 ; ljmp *-0x64000001(%rdx)
+ DB 255,172,255,255,255,157,255 ; ljmp *-0x620001(%rdi,%rdi,8)
DB 255 ; (bad)
DB 255 ; (bad)
+ DB 234 ; (bad)
DB 255 ; (bad)
- DB 232,255,255,255,221 ; callq ffffffffde026ef8 <_sk_overlay_sse2_8bit+0xffffffffddffb283>
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,210 ; callq *%rdx
+ DB 223,255 ; (bad)
DB 255 ; (bad)
+ DB 255,212 ; callq *%rsp
DB 255 ; (bad)
- DB 255,195 ; inc %ebx
+ DB 255 ; (bad)
+ DB 255,197 ; inc %ebp
DB 255 ; (bad)
DB 255 ; (bad)
DB 255 ; .byte 0xff
PUBLIC _sk_srcover_rgba_8888_sse41_8bit
_sk_srcover_rgba_8888_sse41_8bit LABEL PROC
- DB 76,99,15 ; movslq (%rdi),%r9
- DB 76,139,71,16 ; mov 0x10(%rdi),%r8
- DB 72,173 ; lods %ds:(%rsi),%rax
- DB 72,99,72,8 ; movslq 0x8(%rax),%rcx
- DB 72,99,87,8 ; movslq 0x8(%rdi),%rdx
- DB 72,15,175,209 ; imul %rcx,%rdx
- DB 72,193,226,2 ; shl $0x2,%rdx
- DB 72,3,16 ; add (%rax),%rdx
- DB 77,133,192 ; test %r8,%r8
- DB 15,133,206,0,0,0 ; jne 26ff7 <_sk_srcover_rgba_8888_sse41_8bit+0xf3>
- DB 243,70,15,111,68,138,16 ; movdqu 0x10(%rdx,%r9,4),%xmm8
- DB 243,70,15,111,12,138 ; movdqu (%rdx,%r9,4),%xmm9
- DB 77,133,192 ; test %r8,%r8
- DB 102,15,111,37,223,98,0,0 ; movdqa 0x62df(%rip),%xmm4 # 2d220 <_sk_overlay_sse2_8bit+0x15ab>
+ DB 72,173 ; lods %ds:(%rsi),%rax
+ DB 76,99,72,8 ; movslq 0x8(%rax),%r9
+ DB 76,99,193 ; movslq %ecx,%r8
+ DB 77,15,175,193 ; imul %r9,%r8
+ DB 73,193,224,2 ; shl $0x2,%r8
+ DB 76,3,0 ; add (%rax),%r8
+ DB 76,99,218 ; movslq %edx,%r11
+ DB 72,133,255 ; test %rdi,%rdi
+ DB 15,133,206,0,0,0 ; jne 26f62 <_sk_srcover_rgba_8888_sse41_8bit+0xee>
+ DB 243,71,15,111,68,152,16 ; movdqu 0x10(%r8,%r11,4),%xmm8
+ DB 243,71,15,111,12,152 ; movdqu (%r8,%r11,4),%xmm9
+ DB 72,133,255 ; test %rdi,%rdi
+ DB 102,15,111,37,180,98,0,0 ; movdqa 0x62b4(%rip),%xmm4 # 2d160 <_sk_overlay_sse2_8bit+0x15b0>
DB 102,15,111,241 ; movdqa %xmm1,%xmm6
DB 102,15,56,0,244 ; pshufb %xmm4,%xmm6
DB 102,15,111,248 ; movdqa %xmm0,%xmm7
@@ -37265,61 +37262,63 @@ _sk_srcover_rgba_8888_sse41_8bit LABEL PROC
DB 102,68,15,248,204 ; psubb %xmm4,%xmm9
DB 102,68,15,252,200 ; paddb %xmm0,%xmm9
DB 102,68,15,252,193 ; paddb %xmm1,%xmm8
- DB 117,72 ; jne 2702e <_sk_srcover_rgba_8888_sse41_8bit+0x12a>
- DB 243,70,15,127,12,138 ; movdqu %xmm9,(%rdx,%r9,4)
- DB 243,70,15,127,68,138,16 ; movdqu %xmm8,0x10(%rdx,%r9,4)
+ DB 117,78 ; jne 26f9f <_sk_srcover_rgba_8888_sse41_8bit+0x12b>
+ DB 243,71,15,127,12,152 ; movdqu %xmm9,(%r8,%r11,4)
+ DB 243,71,15,127,68,152,16 ; movdqu %xmm8,0x10(%r8,%r11,4)
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
- DB 68,137,192 ; mov %r8d,%eax
- DB 36,7 ; and $0x7,%al
+ DB 65,137,249 ; mov %edi,%r9d
+ DB 65,128,225,7 ; and $0x7,%r9b
DB 102,69,15,239,192 ; pxor %xmm8,%xmm8
DB 102,69,15,239,201 ; pxor %xmm9,%xmm9
- DB 254,200 ; dec %al
- DB 60,6 ; cmp $0x6,%al
- DB 15,135,38,255,255,255 ; ja 26f36 <_sk_srcover_rgba_8888_sse41_8bit+0x32>
- DB 15,182,192 ; movzbl %al,%eax
- DB 72,141,13,186,0,0,0 ; lea 0xba(%rip),%rcx # 270d4 <_sk_srcover_rgba_8888_sse41_8bit+0x1d0>
- DB 72,99,4,129 ; movslq (%rcx,%rax,4),%rax
- DB 72,1,200 ; add %rcx,%rax
- DB 255,224 ; jmpq *%rax
- DB 102,70,15,110,12,138 ; movd (%rdx,%r9,4),%xmm9
- DB 233,8,255,255,255 ; jmpq 26f36 <_sk_srcover_rgba_8888_sse41_8bit+0x32>
- DB 65,128,224,7 ; and $0x7,%r8b
- DB 65,254,200 ; dec %r8b
- DB 65,128,248,6 ; cmp $0x6,%r8b
- DB 119,184 ; ja 26ff3 <_sk_srcover_rgba_8888_sse41_8bit+0xef>
- DB 65,15,182,192 ; movzbl %r8b,%eax
- DB 72,141,13,170,0,0,0 ; lea 0xaa(%rip),%rcx # 270f0 <_sk_srcover_rgba_8888_sse41_8bit+0x1ec>
- DB 72,99,4,129 ; movslq (%rcx,%rax,4),%rax
- DB 72,1,200 ; add %rcx,%rax
- DB 255,224 ; jmpq *%rax
- DB 102,70,15,126,12,138 ; movd %xmm9,(%rdx,%r9,4)
- DB 235,156 ; jmp 26ff3 <_sk_srcover_rgba_8888_sse41_8bit+0xef>
- DB 102,66,15,110,100,138,8 ; movd 0x8(%rdx,%r9,4),%xmm4
+ DB 65,254,201 ; dec %r9b
+ DB 65,128,249,6 ; cmp $0x6,%r9b
+ DB 15,135,33,255,255,255 ; ja 26ea1 <_sk_srcover_rgba_8888_sse41_8bit+0x2d>
+ DB 69,15,182,201 ; movzbl %r9b,%r9d
+ DB 76,141,21,189,0,0,0 ; lea 0xbd(%rip),%r10 # 27048 <_sk_srcover_rgba_8888_sse41_8bit+0x1d4>
+ DB 75,99,4,138 ; movslq (%r10,%r9,4),%rax
+ DB 76,1,208 ; add %r10,%rax
+ DB 255,224 ; jmpq *%rax
+ DB 102,71,15,110,12,152 ; movd (%r8,%r11,4),%xmm9
+ DB 233,2,255,255,255 ; jmpq 26ea1 <_sk_srcover_rgba_8888_sse41_8bit+0x2d>
+ DB 65,137,249 ; mov %edi,%r9d
+ DB 65,128,225,7 ; and $0x7,%r9b
+ DB 65,254,201 ; dec %r9b
+ DB 65,128,249,6 ; cmp $0x6,%r9b
+ DB 119,175 ; ja 26f5e <_sk_srcover_rgba_8888_sse41_8bit+0xea>
+ DB 65,15,182,193 ; movzbl %r9b,%eax
+ DB 76,141,13,170,0,0,0 ; lea 0xaa(%rip),%r9 # 27064 <_sk_srcover_rgba_8888_sse41_8bit+0x1f0>
+ DB 73,99,4,129 ; movslq (%r9,%rax,4),%rax
+ DB 76,1,200 ; add %r9,%rax
+ DB 255,224 ; jmpq *%rax
+ DB 102,71,15,126,12,152 ; movd %xmm9,(%r8,%r11,4)
+ DB 235,147 ; jmp 26f5e <_sk_srcover_rgba_8888_sse41_8bit+0xea>
+ DB 102,67,15,110,100,152,8 ; movd 0x8(%r8,%r11,4),%xmm4
DB 102,68,15,112,204,69 ; pshufd $0x45,%xmm4,%xmm9
- DB 243,66,15,126,36,138 ; movq (%rdx,%r9,4),%xmm4
+ DB 243,67,15,126,36,152 ; movq (%r8,%r11,4),%xmm4
DB 102,68,15,58,14,204,15 ; pblendw $0xf,%xmm4,%xmm9
- DB 233,192,254,255,255 ; jmpq 26f36 <_sk_srcover_rgba_8888_sse41_8bit+0x32>
- DB 102,66,15,110,100,138,24 ; movd 0x18(%rdx,%r9,4),%xmm4
+ DB 233,183,254,255,255 ; jmpq 26ea1 <_sk_srcover_rgba_8888_sse41_8bit+0x2d>
+ DB 102,67,15,110,100,152,24 ; movd 0x18(%r8,%r11,4),%xmm4
DB 102,68,15,112,196,69 ; pshufd $0x45,%xmm4,%xmm8
- DB 102,70,15,58,34,68,138,20,1 ; pinsrd $0x1,0x14(%rdx,%r9,4),%xmm8
- DB 102,70,15,58,34,68,138,16,0 ; pinsrd $0x0,0x10(%rdx,%r9,4),%xmm8
- DB 233,150,254,255,255 ; jmpq 26f30 <_sk_srcover_rgba_8888_sse41_8bit+0x2c>
- DB 102,70,15,58,22,76,138,8,2 ; pextrd $0x2,%xmm9,0x8(%rdx,%r9,4)
- DB 102,70,15,214,12,138 ; movq %xmm9,(%rdx,%r9,4)
- DB 233,69,255,255,255 ; jmpq 26ff3 <_sk_srcover_rgba_8888_sse41_8bit+0xef>
- DB 102,70,15,58,22,68,138,24,2 ; pextrd $0x2,%xmm8,0x18(%rdx,%r9,4)
- DB 102,70,15,58,22,68,138,20,1 ; pextrd $0x1,%xmm8,0x14(%rdx,%r9,4)
- DB 102,70,15,126,68,138,16 ; movd %xmm8,0x10(%rdx,%r9,4)
- DB 243,70,15,127,12,138 ; movdqu %xmm9,(%rdx,%r9,4)
- DB 233,33,255,255,255 ; jmpq 26ff3 <_sk_srcover_rgba_8888_sse41_8bit+0xef>
+ DB 102,71,15,58,34,68,152,20,1 ; pinsrd $0x1,0x14(%r8,%r11,4),%xmm8
+ DB 102,71,15,58,34,68,152,16,0 ; pinsrd $0x0,0x10(%r8,%r11,4),%xmm8
+ DB 233,141,254,255,255 ; jmpq 26e9b <_sk_srcover_rgba_8888_sse41_8bit+0x27>
+ DB 102,71,15,58,22,76,152,8,2 ; pextrd $0x2,%xmm9,0x8(%r8,%r11,4)
+ DB 102,71,15,214,12,152 ; movq %xmm9,(%r8,%r11,4)
+ DB 233,60,255,255,255 ; jmpq 26f5e <_sk_srcover_rgba_8888_sse41_8bit+0xea>
+ DB 102,71,15,58,22,68,152,24,2 ; pextrd $0x2,%xmm8,0x18(%r8,%r11,4)
+ DB 102,71,15,58,22,68,152,20,1 ; pextrd $0x1,%xmm8,0x14(%r8,%r11,4)
+ DB 102,71,15,126,68,152,16 ; movd %xmm8,0x10(%r8,%r11,4)
+ DB 243,71,15,127,12,152 ; movdqu %xmm9,(%r8,%r11,4)
+ DB 233,24,255,255,255 ; jmpq 26f5e <_sk_srcover_rgba_8888_sse41_8bit+0xea>
DB 102,144 ; xchg %ax,%ax
- DB 79,255 ; rex.WRXB (bad)
+ DB 76,255 ; rex.WR (bad)
DB 255 ; (bad)
DB 255,144,255,255,255,131 ; callq *-0x7c000001(%rax)
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,92,254,255 ; lcall *-0x1(%rsi,%rdi,8)
+ DB 255,83,254 ; callq *-0x2(%rbx)
+ DB 255 ; (bad)
DB 255 ; (bad)
DB 184,255,255,255,175 ; mov $0xafffffff,%eax
DB 255 ; (bad)
@@ -37351,7 +37350,7 @@ _sk_scale_1_float_sse41_8bit LABEL PROC
DB 102,15,111,232 ; movdqa %xmm0,%xmm5
DB 72,173 ; lods %ds:(%rsi),%rax
DB 243,15,16,0 ; movss (%rax),%xmm0
- DB 243,15,89,5,238,79,0,0 ; mulss 0x4fee(%rip),%xmm0 # 2c110 <_sk_overlay_sse2_8bit+0x49b>
+ DB 243,15,89,5,182,79,0,0 ; mulss 0x4fb6(%rip),%xmm0 # 2c04c <_sk_overlay_sse2_8bit+0x49c>
DB 243,15,44,192 ; cvttss2si %xmm0,%eax
DB 15,87,192 ; xorps %xmm0,%xmm0
DB 102,68,15,56,48,197 ; pmovzxbw %xmm5,%xmm8
@@ -37359,7 +37358,7 @@ _sk_scale_1_float_sse41_8bit LABEL PROC
DB 102,68,15,56,48,204 ; pmovzxbw %xmm4,%xmm9
DB 102,15,104,224 ; punpckhbw %xmm0,%xmm4
DB 102,15,110,240 ; movd %eax,%xmm6
- DB 102,15,56,0,53,22,97,0,0 ; pshufb 0x6116(%rip),%xmm6 # 2d260 <_sk_overlay_sse2_8bit+0x15eb>
+ DB 102,15,56,0,53,226,96,0,0 ; pshufb 0x60e2(%rip),%xmm6 # 2d1a0 <_sk_overlay_sse2_8bit+0x15f0>
DB 102,15,111,206 ; movdqa %xmm6,%xmm1
DB 102,65,15,213,201 ; pmullw %xmm9,%xmm1
DB 102,15,111,198 ; movdqa %xmm6,%xmm0
@@ -37382,21 +37381,20 @@ _sk_scale_1_float_sse41_8bit LABEL PROC
PUBLIC _sk_scale_u8_sse41_8bit
_sk_scale_u8_sse41_8bit LABEL PROC
- DB 76,99,7 ; movslq (%rdi),%r8
- DB 76,139,79,16 ; mov 0x10(%rdi),%r9
- DB 72,173 ; lods %ds:(%rsi),%rax
- DB 72,99,72,8 ; movslq 0x8(%rax),%rcx
- DB 72,99,87,8 ; movslq 0x8(%rdi),%rdx
- DB 72,15,175,209 ; imul %rcx,%rdx
- DB 72,3,16 ; add (%rax),%rdx
- DB 77,133,201 ; test %r9,%r9
- DB 15,133,160,0,0,0 ; jne 2725b <_sk_scale_u8_sse41_8bit+0xc1>
- DB 102,66,15,56,48,52,2 ; pmovzxbw (%rdx,%r8,1),%xmm6
- DB 102,15,219,53,6,89,0,0 ; pand 0x5906(%rip),%xmm6 # 2cad0 <_sk_overlay_sse2_8bit+0xe5b>
+ DB 72,173 ; lods %ds:(%rsi),%rax
+ DB 76,99,72,8 ; movslq 0x8(%rax),%r9
+ DB 76,99,193 ; movslq %ecx,%r8
+ DB 77,15,175,193 ; imul %r9,%r8
+ DB 76,3,0 ; add (%rax),%r8
+ DB 76,99,218 ; movslq %edx,%r11
+ DB 72,133,255 ; test %rdi,%rdi
+ DB 15,133,160,0,0,0 ; jne 271ca <_sk_scale_u8_sse41_8bit+0xbc>
+ DB 102,67,15,56,48,52,24 ; pmovzxbw (%r8,%r11,1),%xmm6
+ DB 102,15,219,53,215,88,0,0 ; pand 0x58d7(%rip),%xmm6 # 2ca10 <_sk_overlay_sse2_8bit+0xe60>
DB 102,69,15,239,192 ; pxor %xmm8,%xmm8
DB 102,15,111,254 ; movdqa %xmm6,%xmm7
- DB 102,15,56,0,61,148,96,0,0 ; pshufb 0x6094(%rip),%xmm7 # 2d270 <_sk_overlay_sse2_8bit+0x15fb>
- DB 102,15,56,0,53,155,96,0,0 ; pshufb 0x609b(%rip),%xmm6 # 2d280 <_sk_overlay_sse2_8bit+0x160b>
+ DB 102,15,56,0,61,101,96,0,0 ; pshufb 0x6065(%rip),%xmm7 # 2d1b0 <_sk_overlay_sse2_8bit+0x1600>
+ DB 102,15,56,0,53,108,96,0,0 ; pshufb 0x606c(%rip),%xmm6 # 2d1c0 <_sk_overlay_sse2_8bit+0x1610>
DB 102,68,15,56,48,200 ; pmovzxbw %xmm0,%xmm9
DB 102,65,15,104,192 ; punpckhbw %xmm8,%xmm0
DB 102,68,15,56,48,209 ; pmovzxbw %xmm1,%xmm10
@@ -37423,54 +37421,53 @@ _sk_scale_u8_sse41_8bit LABEL PROC
DB 102,15,111,196 ; movdqa %xmm4,%xmm0
DB 102,15,111,205 ; movdqa %xmm5,%xmm1
DB 255,224 ; jmpq *%rax
+ DB 65,137,249 ; mov %edi,%r9d
DB 65,128,225,7 ; and $0x7,%r9b
DB 102,15,239,246 ; pxor %xmm6,%xmm6
DB 65,254,201 ; dec %r9b
DB 65,128,249,6 ; cmp $0x6,%r9b
- DB 15,135,82,255,255,255 ; ja 271c2 <_sk_scale_u8_sse41_8bit+0x28>
- DB 65,15,182,193 ; movzbl %r9b,%eax
- DB 72,141,13,125,0,0,0 ; lea 0x7d(%rip),%rcx # 272f8 <_sk_scale_u8_sse41_8bit+0x15e>
- DB 72,99,4,129 ; movslq (%rcx,%rax,4),%rax
- DB 72,1,200 ; add %rcx,%rax
+ DB 15,135,79,255,255,255 ; ja 27131 <_sk_scale_u8_sse41_8bit+0x23>
+ DB 69,15,182,201 ; movzbl %r9b,%r9d
+ DB 76,141,21,123,0,0,0 ; lea 0x7b(%rip),%r10 # 27268 <_sk_scale_u8_sse41_8bit+0x15a>
+ DB 75,99,4,138 ; movslq (%r10,%r9,4),%rax
+ DB 76,1,208 ; add %r10,%rax
DB 255,224 ; jmpq *%rax
- DB 66,15,182,4,2 ; movzbl (%rdx,%r8,1),%eax
+ DB 67,15,182,4,24 ; movzbl (%r8,%r11,1),%eax
DB 102,15,110,240 ; movd %eax,%xmm6
- DB 233,48,255,255,255 ; jmpq 271c2 <_sk_scale_u8_sse41_8bit+0x28>
- DB 66,15,182,68,2,2 ; movzbl 0x2(%rdx,%r8,1),%eax
+ DB 233,45,255,255,255 ; jmpq 27131 <_sk_scale_u8_sse41_8bit+0x23>
+ DB 67,15,182,68,24,2 ; movzbl 0x2(%r8,%r11,1),%eax
DB 102,15,239,246 ; pxor %xmm6,%xmm6
DB 102,15,196,240,2 ; pinsrw $0x2,%eax,%xmm6
- DB 66,15,183,4,2 ; movzwl (%rdx,%r8,1),%eax
+ DB 67,15,183,4,24 ; movzwl (%r8,%r11,1),%eax
DB 102,15,110,224 ; movd %eax,%xmm4
DB 102,15,56,48,228 ; pmovzxbw %xmm4,%xmm4
DB 102,15,58,14,244,3 ; pblendw $0x3,%xmm4,%xmm6
- DB 233,8,255,255,255 ; jmpq 271c2 <_sk_scale_u8_sse41_8bit+0x28>
- DB 66,15,182,68,2,6 ; movzbl 0x6(%rdx,%r8,1),%eax
+ DB 233,5,255,255,255 ; jmpq 27131 <_sk_scale_u8_sse41_8bit+0x23>
+ DB 67,15,182,68,24,6 ; movzbl 0x6(%r8,%r11,1),%eax
DB 102,15,239,246 ; pxor %xmm6,%xmm6
DB 102,15,196,240,6 ; pinsrw $0x6,%eax,%xmm6
- DB 66,15,182,68,2,5 ; movzbl 0x5(%rdx,%r8,1),%eax
+ DB 67,15,182,68,24,5 ; movzbl 0x5(%r8,%r11,1),%eax
DB 102,15,196,240,5 ; pinsrw $0x5,%eax,%xmm6
- DB 66,15,182,68,2,4 ; movzbl 0x4(%rdx,%r8,1),%eax
+ DB 67,15,182,68,24,4 ; movzbl 0x4(%r8,%r11,1),%eax
DB 102,15,196,240,4 ; pinsrw $0x4,%eax,%xmm6
- DB 102,66,15,110,36,2 ; movd (%rdx,%r8,1),%xmm4
+ DB 102,67,15,110,36,24 ; movd (%r8,%r11,1),%xmm4
DB 102,15,56,48,228 ; pmovzxbw %xmm4,%xmm4
DB 102,15,58,14,244,15 ; pblendw $0xf,%xmm4,%xmm6
- DB 233,205,254,255,255 ; jmpq 271c2 <_sk_scale_u8_sse41_8bit+0x28>
- DB 15,31,0 ; nopl (%rax)
- DB 140,255 ; mov %?,%edi
- DB 255 ; (bad)
- DB 255,169,255,255,255,154 ; ljmp *-0x65000001(%rcx)
+ DB 233,202,254,255,255 ; jmpq 27131 <_sk_scale_u8_sse41_8bit+0x23>
+ DB 144 ; nop
+ DB 142,255 ; mov %edi,%?
DB 255 ; (bad)
+ DB 255,171,255,255,255,156 ; ljmp *-0x63000001(%rbx)
DB 255 ; (bad)
- DB 255,231 ; jmpq *%rdi
DB 255 ; (bad)
DB 255 ; (bad)
+ DB 233,255,255,255,222 ; jmpq ffffffffdf027278 <_sk_overlay_sse2_8bit+0xffffffffdeffb6c8>
DB 255 ; (bad)
- DB 220,255 ; fdivr %st,%st(7)
DB 255 ; (bad)
- DB 255,209 ; callq *%rcx
+ DB 255,211 ; callq *%rbx
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,194 ; inc %edx
+ DB 255,196 ; inc %esp
DB 255 ; (bad)
DB 255 ; (bad)
DB 255 ; .byte 0xff
@@ -37479,7 +37476,7 @@ PUBLIC _sk_lerp_1_float_sse41_8bit
_sk_lerp_1_float_sse41_8bit LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 243,15,16,32 ; movss (%rax),%xmm4
- DB 243,15,89,37,238,77,0,0 ; mulss 0x4dee(%rip),%xmm4 # 2c110 <_sk_overlay_sse2_8bit+0x49b>
+ DB 243,15,89,37,186,77,0,0 ; mulss 0x4dba(%rip),%xmm4 # 2c04c <_sk_overlay_sse2_8bit+0x49c>
DB 243,15,44,196 ; cvttss2si %xmm4,%eax
DB 102,15,110,224 ; movd %eax,%xmm4
DB 102,15,96,228 ; punpcklbw %xmm4,%xmm4
@@ -37490,7 +37487,7 @@ _sk_lerp_1_float_sse41_8bit LABEL PROC
DB 102,65,15,104,193 ; punpckhbw %xmm9,%xmm0
DB 102,68,15,56,48,217 ; pmovzxbw %xmm1,%xmm11
DB 102,65,15,104,201 ; punpckhbw %xmm9,%xmm1
- DB 102,15,56,0,61,51,95,0,0 ; pshufb 0x5f33(%rip),%xmm7 # 2d290 <_sk_overlay_sse2_8bit+0x161b>
+ DB 102,15,56,0,61,3,95,0,0 ; pshufb 0x5f03(%rip),%xmm7 # 2d1d0 <_sk_overlay_sse2_8bit+0x1620>
DB 102,68,15,111,231 ; movdqa %xmm7,%xmm12
DB 102,69,15,213,227 ; pmullw %xmm11,%xmm12
DB 102,68,15,111,239 ; movdqa %xmm7,%xmm13
@@ -37541,21 +37538,20 @@ _sk_lerp_1_float_sse41_8bit LABEL PROC
PUBLIC _sk_lerp_u8_sse41_8bit
_sk_lerp_u8_sse41_8bit LABEL PROC
- DB 76,99,7 ; movslq (%rdi),%r8
- DB 76,139,79,16 ; mov 0x10(%rdi),%r9
- DB 72,173 ; lods %ds:(%rsi),%rax
- DB 72,99,72,8 ; movslq 0x8(%rax),%rcx
- DB 72,99,87,8 ; movslq 0x8(%rdi),%rdx
- DB 72,15,175,209 ; imul %rcx,%rdx
- DB 72,3,16 ; add (%rax),%rdx
- DB 77,133,201 ; test %r9,%r9
- DB 15,133,46,1,0,0 ; jne 27585 <_sk_lerp_u8_sse41_8bit+0x14f>
- DB 102,66,15,56,48,60,2 ; pmovzxbw (%rdx,%r8,1),%xmm7
- DB 102,15,219,61,106,86,0,0 ; pand 0x566a(%rip),%xmm7 # 2cad0 <_sk_overlay_sse2_8bit+0xe5b>
+ DB 72,173 ; lods %ds:(%rsi),%rax
+ DB 76,99,72,8 ; movslq 0x8(%rax),%r9
+ DB 76,99,193 ; movslq %ecx,%r8
+ DB 77,15,175,193 ; imul %r9,%r8
+ DB 76,3,0 ; add (%rax),%r8
+ DB 76,99,218 ; movslq %edx,%r11
+ DB 72,133,255 ; test %rdi,%rdi
+ DB 15,133,46,1,0,0 ; jne 274f0 <_sk_lerp_u8_sse41_8bit+0x14a>
+ DB 102,67,15,56,48,60,24 ; pmovzxbw (%r8,%r11,1),%xmm7
+ DB 102,15,219,61,63,86,0,0 ; pand 0x563f(%rip),%xmm7 # 2ca10 <_sk_overlay_sse2_8bit+0xe60>
DB 102,69,15,239,192 ; pxor %xmm8,%xmm8
DB 102,15,111,247 ; movdqa %xmm7,%xmm6
- DB 102,15,56,0,53,248,93,0,0 ; pshufb 0x5df8(%rip),%xmm6 # 2d270 <_sk_overlay_sse2_8bit+0x15fb>
- DB 102,15,56,0,61,255,93,0,0 ; pshufb 0x5dff(%rip),%xmm7 # 2d280 <_sk_overlay_sse2_8bit+0x160b>
+ DB 102,15,56,0,53,205,93,0,0 ; pshufb 0x5dcd(%rip),%xmm6 # 2d1b0 <_sk_overlay_sse2_8bit+0x1600>
+ DB 102,15,56,0,61,212,93,0,0 ; pshufb 0x5dd4(%rip),%xmm7 # 2d1c0 <_sk_overlay_sse2_8bit+0x1610>
DB 102,68,15,56,48,200 ; pmovzxbw %xmm0,%xmm9
DB 102,65,15,104,192 ; punpckhbw %xmm8,%xmm0
DB 102,68,15,56,48,209 ; pmovzxbw %xmm1,%xmm10
@@ -37611,52 +37607,55 @@ _sk_lerp_u8_sse41_8bit LABEL PROC
DB 102,65,15,252,203 ; paddb %xmm11,%xmm1
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
+ DB 65,137,249 ; mov %edi,%r9d
DB 65,128,225,7 ; and $0x7,%r9b
DB 102,15,239,255 ; pxor %xmm7,%xmm7
DB 65,254,201 ; dec %r9b
DB 65,128,249,6 ; cmp $0x6,%r9b
- DB 15,135,196,254,255,255 ; ja 2745e <_sk_lerp_u8_sse41_8bit+0x28>
- DB 65,15,182,193 ; movzbl %r9b,%eax
- DB 72,141,13,123,0,0,0 ; lea 0x7b(%rip),%rcx # 27620 <_sk_lerp_u8_sse41_8bit+0x1ea>
- DB 72,99,4,129 ; movslq (%rcx,%rax,4),%rax
- DB 72,1,200 ; add %rcx,%rax
+ DB 15,135,193,254,255,255 ; ja 273c9 <_sk_lerp_u8_sse41_8bit+0x23>
+ DB 69,15,182,201 ; movzbl %r9b,%r9d
+ DB 76,141,21,125,0,0,0 ; lea 0x7d(%rip),%r10 # 27590 <_sk_lerp_u8_sse41_8bit+0x1ea>
+ DB 75,99,4,138 ; movslq (%r10,%r9,4),%rax
+ DB 76,1,208 ; add %r10,%rax
DB 255,224 ; jmpq *%rax
- DB 66,15,182,4,2 ; movzbl (%rdx,%r8,1),%eax
+ DB 67,15,182,4,24 ; movzbl (%r8,%r11,1),%eax
DB 102,15,110,248 ; movd %eax,%xmm7
- DB 233,162,254,255,255 ; jmpq 2745e <_sk_lerp_u8_sse41_8bit+0x28>
- DB 66,15,182,68,2,2 ; movzbl 0x2(%rdx,%r8,1),%eax
+ DB 233,159,254,255,255 ; jmpq 273c9 <_sk_lerp_u8_sse41_8bit+0x23>
+ DB 67,15,182,68,24,2 ; movzbl 0x2(%r8,%r11,1),%eax
DB 102,15,239,255 ; pxor %xmm7,%xmm7
DB 102,15,196,248,2 ; pinsrw $0x2,%eax,%xmm7
- DB 66,15,183,4,2 ; movzwl (%rdx,%r8,1),%eax
+ DB 67,15,183,4,24 ; movzwl (%r8,%r11,1),%eax
DB 102,15,110,232 ; movd %eax,%xmm5
DB 102,15,56,48,237 ; pmovzxbw %xmm5,%xmm5
DB 102,15,58,14,253,3 ; pblendw $0x3,%xmm5,%xmm7
- DB 233,122,254,255,255 ; jmpq 2745e <_sk_lerp_u8_sse41_8bit+0x28>
- DB 66,15,182,68,2,6 ; movzbl 0x6(%rdx,%r8,1),%eax
+ DB 233,119,254,255,255 ; jmpq 273c9 <_sk_lerp_u8_sse41_8bit+0x23>
+ DB 67,15,182,68,24,6 ; movzbl 0x6(%r8,%r11,1),%eax
DB 102,15,239,255 ; pxor %xmm7,%xmm7
DB 102,15,196,248,6 ; pinsrw $0x6,%eax,%xmm7
- DB 66,15,182,68,2,5 ; movzbl 0x5(%rdx,%r8,1),%eax
+ DB 67,15,182,68,24,5 ; movzbl 0x5(%r8,%r11,1),%eax
DB 102,15,196,248,5 ; pinsrw $0x5,%eax,%xmm7
- DB 66,15,182,68,2,4 ; movzbl 0x4(%rdx,%r8,1),%eax
+ DB 67,15,182,68,24,4 ; movzbl 0x4(%r8,%r11,1),%eax
DB 102,15,196,248,4 ; pinsrw $0x4,%eax,%xmm7
- DB 102,66,15,110,44,2 ; movd (%rdx,%r8,1),%xmm5
+ DB 102,67,15,110,44,24 ; movd (%r8,%r11,1),%xmm5
DB 102,15,56,48,237 ; pmovzxbw %xmm5,%xmm5
DB 102,15,58,14,253,15 ; pblendw $0xf,%xmm5,%xmm7
- DB 233,63,254,255,255 ; jmpq 2745e <_sk_lerp_u8_sse41_8bit+0x28>
- DB 144 ; nop
- DB 142,255 ; mov %edi,%?
+ DB 233,60,254,255,255 ; jmpq 273c9 <_sk_lerp_u8_sse41_8bit+0x23>
+ DB 15,31,0 ; nopl (%rax)
+ DB 140,255 ; mov %?,%edi
DB 255 ; (bad)
- DB 255,171,255,255,255,156 ; ljmp *-0x63000001(%rbx)
+ DB 255,169,255,255,255,154 ; ljmp *-0x65000001(%rcx)
DB 255 ; (bad)
DB 255 ; (bad)
+ DB 255,231 ; jmpq *%rdi
DB 255 ; (bad)
- DB 233,255,255,255,222 ; jmpq ffffffffdf027630 <_sk_overlay_sse2_8bit+0xffffffffdeffb9bb>
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,211 ; callq *%rbx
+ DB 220,255 ; fdivr %st,%st(7)
DB 255 ; (bad)
+ DB 255,209 ; callq *%rcx
DB 255 ; (bad)
- DB 255,196 ; inc %esp
+ DB 255 ; (bad)
+ DB 255,194 ; inc %edx
DB 255 ; (bad)
DB 255 ; (bad)
DB 255 ; .byte 0xff
@@ -37678,7 +37677,7 @@ _sk_move_dst_src_sse41_8bit LABEL PROC
PUBLIC _sk_black_color_sse41_8bit
_sk_black_color_sse41_8bit LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 15,40,5,183,91,0,0 ; movaps 0x5bb7(%rip),%xmm0 # 2d210 <_sk_overlay_sse2_8bit+0x159b>
+ DB 15,40,5,135,91,0,0 ; movaps 0x5b87(%rip),%xmm0 # 2d150 <_sk_overlay_sse2_8bit+0x15a0>
DB 15,40,200 ; movaps %xmm0,%xmm1
DB 255,224 ; jmpq *%rax
@@ -37698,7 +37697,7 @@ _sk_clear_sse41_8bit LABEL PROC
PUBLIC _sk_srcatop_sse41_8bit
_sk_srcatop_sse41_8bit LABEL PROC
- DB 102,68,15,111,21,163,91,0,0 ; movdqa 0x5ba3(%rip),%xmm10 # 2d220 <_sk_overlay_sse2_8bit+0x15ab>
+ DB 102,68,15,111,21,115,91,0,0 ; movdqa 0x5b73(%rip),%xmm10 # 2d160 <_sk_overlay_sse2_8bit+0x15b0>
DB 102,68,15,111,219 ; movdqa %xmm3,%xmm11
DB 102,68,15,56,48,195 ; pmovzxbw %xmm3,%xmm8
DB 102,15,111,235 ; movdqa %xmm3,%xmm5
@@ -37766,7 +37765,7 @@ _sk_srcatop_sse41_8bit LABEL PROC
PUBLIC _sk_dstatop_sse41_8bit
_sk_dstatop_sse41_8bit LABEL PROC
- DB 102,68,15,111,29,104,90,0,0 ; movdqa 0x5a68(%rip),%xmm11 # 2d220 <_sk_overlay_sse2_8bit+0x15ab>
+ DB 102,68,15,111,29,56,90,0,0 ; movdqa 0x5a38(%rip),%xmm11 # 2d160 <_sk_overlay_sse2_8bit+0x15b0>
DB 102,68,15,111,233 ; movdqa %xmm1,%xmm13
DB 102,69,15,56,0,235 ; pshufb %xmm11,%xmm13
DB 102,68,15,111,248 ; movdqa %xmm0,%xmm15
@@ -37836,7 +37835,7 @@ PUBLIC _sk_srcin_sse41_8bit
_sk_srcin_sse41_8bit LABEL PROC
DB 102,15,111,225 ; movdqa %xmm1,%xmm4
DB 102,15,111,232 ; movdqa %xmm0,%xmm5
- DB 102,15,111,5,31,89,0,0 ; movdqa 0x591f(%rip),%xmm0 # 2d220 <_sk_overlay_sse2_8bit+0x15ab>
+ DB 102,15,111,5,239,88,0,0 ; movdqa 0x58ef(%rip),%xmm0 # 2d160 <_sk_overlay_sse2_8bit+0x15b0>
DB 102,15,111,243 ; movdqa %xmm3,%xmm6
DB 102,15,56,0,240 ; pshufb %xmm0,%xmm6
DB 102,15,111,250 ; movdqa %xmm2,%xmm7
@@ -37869,9 +37868,10 @@ _sk_srcin_sse41_8bit LABEL PROC
PUBLIC _sk_dstin_sse41_8bit
_sk_dstin_sse41_8bit LABEL PROC
- DB 102,15,111,37,146,88,0,0 ; movdqa 0x5892(%rip),%xmm4 # 2d220 <_sk_overlay_sse2_8bit+0x15ab>
- DB 102,15,56,0,204 ; pshufb %xmm4,%xmm1
- DB 102,15,56,0,196 ; pshufb %xmm4,%xmm0
+ DB 102,15,111,232 ; movdqa %xmm0,%xmm5
+ DB 102,15,111,5,94,88,0,0 ; movdqa 0x585e(%rip),%xmm0 # 2d160 <_sk_overlay_sse2_8bit+0x15b0>
+ DB 102,15,56,0,200 ; pshufb %xmm0,%xmm1
+ DB 102,15,56,0,232 ; pshufb %xmm0,%xmm5
DB 102,69,15,239,210 ; pxor %xmm10,%xmm10
DB 102,68,15,56,48,194 ; pmovzxbw %xmm2,%xmm8
DB 102,15,111,250 ; movdqa %xmm2,%xmm7
@@ -37879,34 +37879,33 @@ _sk_dstin_sse41_8bit LABEL PROC
DB 102,68,15,56,48,203 ; pmovzxbw %xmm3,%xmm9
DB 102,15,111,243 ; movdqa %xmm3,%xmm6
DB 102,65,15,104,242 ; punpckhbw %xmm10,%xmm6
- DB 102,15,56,48,224 ; pmovzxbw %xmm0,%xmm4
- DB 102,15,56,48,233 ; pmovzxbw %xmm1,%xmm5
- DB 102,65,15,104,194 ; punpckhbw %xmm10,%xmm0
+ DB 102,15,56,48,197 ; pmovzxbw %xmm5,%xmm0
+ DB 102,15,56,48,225 ; pmovzxbw %xmm1,%xmm4
+ DB 102,65,15,104,234 ; punpckhbw %xmm10,%xmm5
DB 102,65,15,104,202 ; punpckhbw %xmm10,%xmm1
DB 102,15,213,206 ; pmullw %xmm6,%xmm1
- DB 102,15,213,199 ; pmullw %xmm7,%xmm0
- DB 102,65,15,213,233 ; pmullw %xmm9,%xmm5
- DB 102,65,15,213,224 ; pmullw %xmm8,%xmm4
- DB 102,15,253,199 ; paddw %xmm7,%xmm0
+ DB 102,15,213,239 ; pmullw %xmm7,%xmm5
+ DB 102,65,15,213,225 ; pmullw %xmm9,%xmm4
+ DB 102,65,15,213,192 ; pmullw %xmm8,%xmm0
+ DB 102,15,253,239 ; paddw %xmm7,%xmm5
DB 102,15,253,206 ; paddw %xmm6,%xmm1
- DB 102,65,15,253,224 ; paddw %xmm8,%xmm4
- DB 102,65,15,253,233 ; paddw %xmm9,%xmm5
+ DB 102,65,15,253,192 ; paddw %xmm8,%xmm0
+ DB 102,65,15,253,225 ; paddw %xmm9,%xmm4
DB 102,15,113,209,8 ; psrlw $0x8,%xmm1
- DB 102,15,113,208,8 ; psrlw $0x8,%xmm0
DB 102,15,113,213,8 ; psrlw $0x8,%xmm5
DB 102,15,113,212,8 ; psrlw $0x8,%xmm4
- DB 102,15,103,224 ; packuswb %xmm0,%xmm4
- DB 102,15,103,233 ; packuswb %xmm1,%xmm5
+ DB 102,15,113,208,8 ; psrlw $0x8,%xmm0
+ DB 102,15,103,197 ; packuswb %xmm5,%xmm0
+ DB 102,15,103,225 ; packuswb %xmm1,%xmm4
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 102,15,111,196 ; movdqa %xmm4,%xmm0
- DB 102,15,111,205 ; movdqa %xmm5,%xmm1
+ DB 102,15,111,204 ; movdqa %xmm4,%xmm1
DB 255,224 ; jmpq *%rax
PUBLIC _sk_srcout_sse41_8bit
_sk_srcout_sse41_8bit LABEL PROC
DB 102,15,111,225 ; movdqa %xmm1,%xmm4
DB 102,15,111,232 ; movdqa %xmm0,%xmm5
- DB 102,15,111,5,245,87,0,0 ; movdqa 0x57f5(%rip),%xmm0 # 2d220 <_sk_overlay_sse2_8bit+0x15ab>
+ DB 102,15,111,5,197,87,0,0 ; movdqa 0x57c5(%rip),%xmm0 # 2d160 <_sk_overlay_sse2_8bit+0x15b0>
DB 102,15,111,250 ; movdqa %xmm2,%xmm7
DB 102,15,56,0,248 ; pshufb %xmm0,%xmm7
DB 102,15,111,243 ; movdqa %xmm3,%xmm6
@@ -37942,7 +37941,7 @@ _sk_srcout_sse41_8bit LABEL PROC
PUBLIC _sk_dstout_sse41_8bit
_sk_dstout_sse41_8bit LABEL PROC
- DB 102,15,111,37,92,87,0,0 ; movdqa 0x575c(%rip),%xmm4 # 2d220 <_sk_overlay_sse2_8bit+0x15ab>
+ DB 102,15,111,37,44,87,0,0 ; movdqa 0x572c(%rip),%xmm4 # 2d160 <_sk_overlay_sse2_8bit+0x15b0>
DB 102,15,56,0,196 ; pshufb %xmm4,%xmm0
DB 102,15,56,0,204 ; pshufb %xmm4,%xmm1
DB 102,15,118,228 ; pcmpeqd %xmm4,%xmm4
@@ -37980,7 +37979,7 @@ _sk_dstout_sse41_8bit LABEL PROC
PUBLIC _sk_srcover_sse41_8bit
_sk_srcover_sse41_8bit LABEL PROC
- DB 102,15,111,53,187,86,0,0 ; movdqa 0x56bb(%rip),%xmm6 # 2d220 <_sk_overlay_sse2_8bit+0x15ab>
+ DB 102,15,111,53,139,86,0,0 ; movdqa 0x568b(%rip),%xmm6 # 2d160 <_sk_overlay_sse2_8bit+0x15b0>
DB 102,68,15,111,217 ; movdqa %xmm1,%xmm11
DB 102,68,15,56,0,222 ; pshufb %xmm6,%xmm11
DB 102,15,111,232 ; movdqa %xmm0,%xmm5
@@ -38019,7 +38018,7 @@ _sk_srcover_sse41_8bit LABEL PROC
PUBLIC _sk_dstover_sse41_8bit
_sk_dstover_sse41_8bit LABEL PROC
- DB 102,68,15,111,5,11,86,0,0 ; movdqa 0x560b(%rip),%xmm8 # 2d220 <_sk_overlay_sse2_8bit+0x15ab>
+ DB 102,68,15,111,5,219,85,0,0 ; movdqa 0x55db(%rip),%xmm8 # 2d160 <_sk_overlay_sse2_8bit+0x15b0>
DB 102,68,15,111,209 ; movdqa %xmm1,%xmm10
DB 102,68,15,56,48,201 ; pmovzxbw %xmm1,%xmm9
DB 102,15,252,203 ; paddb %xmm3,%xmm1
@@ -38094,7 +38093,7 @@ _sk_multiply_sse41_8bit LABEL PROC
DB 102,15,111,218 ; movdqa %xmm2,%xmm3
DB 102,15,111,209 ; movdqa %xmm1,%xmm2
DB 102,15,111,200 ; movdqa %xmm0,%xmm1
- DB 102,68,15,111,53,201,84,0,0 ; movdqa 0x54c9(%rip),%xmm14 # 2d220 <_sk_overlay_sse2_8bit+0x15ab>
+ DB 102,68,15,111,53,153,84,0,0 ; movdqa 0x5499(%rip),%xmm14 # 2d160 <_sk_overlay_sse2_8bit+0x15b0>
DB 102,68,15,111,195 ; movdqa %xmm3,%xmm8
DB 102,15,111,235 ; movdqa %xmm3,%xmm5
DB 102,65,15,56,0,238 ; pshufb %xmm14,%xmm5
@@ -38219,7 +38218,7 @@ _sk_screen_sse41_8bit LABEL PROC
PUBLIC _sk_xor__sse41_8bit
_sk_xor__sse41_8bit LABEL PROC
- DB 102,68,15,111,21,135,82,0,0 ; movdqa 0x5287(%rip),%xmm10 # 2d220 <_sk_overlay_sse2_8bit+0x15ab>
+ DB 102,68,15,111,21,87,82,0,0 ; movdqa 0x5257(%rip),%xmm10 # 2d160 <_sk_overlay_sse2_8bit+0x15b0>
DB 102,68,15,111,226 ; movdqa %xmm2,%xmm12
DB 102,68,15,56,48,194 ; pmovzxbw %xmm2,%xmm8
DB 102,15,111,234 ; movdqa %xmm2,%xmm5
@@ -38297,7 +38296,7 @@ _sk_plus__sse41_8bit LABEL PROC
PUBLIC _sk_darken_sse41_8bit
_sk_darken_sse41_8bit LABEL PROC
DB 102,68,15,111,240 ; movdqa %xmm0,%xmm14
- DB 102,68,15,111,5,46,81,0,0 ; movdqa 0x512e(%rip),%xmm8 # 2d220 <_sk_overlay_sse2_8bit+0x15ab>
+ DB 102,68,15,111,5,254,80,0,0 ; movdqa 0x50fe(%rip),%xmm8 # 2d160 <_sk_overlay_sse2_8bit+0x15b0>
DB 102,68,15,111,219 ; movdqa %xmm3,%xmm11
DB 102,68,15,56,48,203 ; pmovzxbw %xmm3,%xmm9
DB 102,15,111,243 ; movdqa %xmm3,%xmm6
@@ -38364,7 +38363,7 @@ _sk_darken_sse41_8bit LABEL PROC
DB 102,15,248,231 ; psubb %xmm7,%xmm4
DB 102,15,248,206 ; psubb %xmm6,%xmm1
DB 102,68,15,248,245 ; psubb %xmm5,%xmm14
- DB 15,40,5,98,80,0,0 ; movaps 0x5062(%rip),%xmm0 # 2d2a0 <_sk_overlay_sse2_8bit+0x162b>
+ DB 15,40,5,50,80,0,0 ; movaps 0x5032(%rip),%xmm0 # 2d1e0 <_sk_overlay_sse2_8bit+0x1630>
DB 102,68,15,56,16,244 ; pblendvb %xmm0,%xmm4,%xmm14
DB 102,65,15,56,16,200 ; pblendvb %xmm0,%xmm8,%xmm1
DB 72,173 ; lods %ds:(%rsi),%rax
@@ -38374,7 +38373,7 @@ _sk_darken_sse41_8bit LABEL PROC
PUBLIC _sk_lighten_sse41_8bit
_sk_lighten_sse41_8bit LABEL PROC
DB 102,68,15,111,240 ; movdqa %xmm0,%xmm14
- DB 102,68,15,111,5,191,79,0,0 ; movdqa 0x4fbf(%rip),%xmm8 # 2d220 <_sk_overlay_sse2_8bit+0x15ab>
+ DB 102,68,15,111,5,143,79,0,0 ; movdqa 0x4f8f(%rip),%xmm8 # 2d160 <_sk_overlay_sse2_8bit+0x15b0>
DB 102,68,15,111,219 ; movdqa %xmm3,%xmm11
DB 102,68,15,56,48,203 ; pmovzxbw %xmm3,%xmm9
DB 102,15,111,243 ; movdqa %xmm3,%xmm6
@@ -38441,7 +38440,7 @@ _sk_lighten_sse41_8bit LABEL PROC
DB 102,15,248,231 ; psubb %xmm7,%xmm4
DB 102,15,248,206 ; psubb %xmm6,%xmm1
DB 102,68,15,248,245 ; psubb %xmm5,%xmm14
- DB 15,40,5,243,78,0,0 ; movaps 0x4ef3(%rip),%xmm0 # 2d2a0 <_sk_overlay_sse2_8bit+0x162b>
+ DB 15,40,5,195,78,0,0 ; movaps 0x4ec3(%rip),%xmm0 # 2d1e0 <_sk_overlay_sse2_8bit+0x1630>
DB 102,68,15,56,16,244 ; pblendvb %xmm0,%xmm4,%xmm14
DB 102,65,15,56,16,200 ; pblendvb %xmm0,%xmm8,%xmm1
DB 72,173 ; lods %ds:(%rsi),%rax
@@ -38479,7 +38478,7 @@ _sk_exclusion_sse41_8bit LABEL PROC
DB 102,15,113,215,8 ; psrlw $0x8,%xmm7
DB 102,15,103,253 ; packuswb %xmm5,%xmm7
DB 102,15,103,230 ; packuswb %xmm6,%xmm4
- DB 102,15,111,45,73,78,0,0 ; movdqa 0x4e49(%rip),%xmm5 # 2d2a0 <_sk_overlay_sse2_8bit+0x162b>
+ DB 102,15,111,45,25,78,0,0 ; movdqa 0x4e19(%rip),%xmm5 # 2d1e0 <_sk_overlay_sse2_8bit+0x1630>
DB 102,15,248,204 ; psubb %xmm4,%xmm1
DB 102,15,219,229 ; pand %xmm5,%xmm4
DB 102,15,219,239 ; pand %xmm7,%xmm5
@@ -38492,7 +38491,7 @@ _sk_exclusion_sse41_8bit LABEL PROC
PUBLIC _sk_difference_sse41_8bit
_sk_difference_sse41_8bit LABEL PROC
DB 102,68,15,111,193 ; movdqa %xmm1,%xmm8
- DB 102,15,111,13,160,77,0,0 ; movdqa 0x4da0(%rip),%xmm1 # 2d220 <_sk_overlay_sse2_8bit+0x15ab>
+ DB 102,15,111,13,112,77,0,0 ; movdqa 0x4d70(%rip),%xmm1 # 2d160 <_sk_overlay_sse2_8bit+0x15b0>
DB 102,68,15,111,219 ; movdqa %xmm3,%xmm11
DB 102,68,15,56,48,203 ; pmovzxbw %xmm3,%xmm9
DB 102,15,111,243 ; movdqa %xmm3,%xmm6
@@ -38530,7 +38529,7 @@ _sk_difference_sse41_8bit LABEL PROC
DB 102,15,113,214,8 ; psrlw $0x8,%xmm6
DB 102,15,113,215,8 ; psrlw $0x8,%xmm7
DB 102,15,103,254 ; packuswb %xmm6,%xmm7
- DB 102,15,111,37,229,76,0,0 ; movdqa 0x4ce5(%rip),%xmm4 # 2d220 <_sk_overlay_sse2_8bit+0x15ab>
+ DB 102,15,111,37,181,76,0,0 ; movdqa 0x4cb5(%rip),%xmm4 # 2d160 <_sk_overlay_sse2_8bit+0x15b0>
DB 102,15,56,0,204 ; pshufb %xmm4,%xmm1
DB 102,15,56,0,236 ; pshufb %xmm4,%xmm5
DB 102,69,15,104,236 ; punpckhbw %xmm12,%xmm13
@@ -38555,7 +38554,7 @@ _sk_difference_sse41_8bit LABEL PROC
DB 102,15,103,241 ; packuswb %xmm1,%xmm6
DB 102,65,15,218,230 ; pminub %xmm14,%xmm4
DB 102,15,218,247 ; pminub %xmm7,%xmm6
- DB 102,15,111,13,232,76,0,0 ; movdqa 0x4ce8(%rip),%xmm1 # 2d2a0 <_sk_overlay_sse2_8bit+0x162b>
+ DB 102,15,111,13,184,76,0,0 ; movdqa 0x4cb8(%rip),%xmm1 # 2d1e0 <_sk_overlay_sse2_8bit+0x1630>
DB 102,68,15,248,198 ; psubb %xmm6,%xmm8
DB 102,15,219,241 ; pand %xmm1,%xmm6
DB 102,15,219,204 ; pand %xmm4,%xmm1
@@ -38569,138 +38568,142 @@ _sk_difference_sse41_8bit LABEL PROC
PUBLIC _sk_hardlight_sse41_8bit
_sk_hardlight_sse41_8bit LABEL PROC
DB 72,129,236,24,1,0,0 ; sub $0x118,%rsp
- DB 102,68,15,111,251 ; movdqa %xmm3,%xmm15
+ DB 102,68,15,111,211 ; movdqa %xmm3,%xmm10
DB 102,68,15,111,233 ; movdqa %xmm1,%xmm13
DB 102,68,15,111,240 ; movdqa %xmm0,%xmm14
DB 102,15,239,192 ; pxor %xmm0,%xmm0
- DB 102,69,15,111,198 ; movdqa %xmm14,%xmm8
- DB 102,68,15,104,192 ; punpckhbw %xmm0,%xmm8
- DB 102,15,104,200 ; punpckhbw %xmm0,%xmm1
- DB 102,15,111,225 ; movdqa %xmm1,%xmm4
- DB 102,15,127,100,36,16 ; movdqa %xmm4,0x10(%rsp)
+ DB 102,65,15,111,230 ; movdqa %xmm14,%xmm4
+ DB 102,15,104,224 ; punpckhbw %xmm0,%xmm4
+ DB 102,65,15,111,253 ; movdqa %xmm13,%xmm7
+ DB 102,15,104,248 ; punpckhbw %xmm0,%xmm7
DB 102,65,15,56,48,206 ; pmovzxbw %xmm14,%xmm1
DB 102,15,127,12,36 ; movdqa %xmm1,(%rsp)
DB 102,69,15,56,48,221 ; pmovzxbw %xmm13,%xmm11
DB 102,68,15,127,156,36,176,0,0,0 ; movdqa %xmm11,0xb0(%rsp)
- DB 102,15,111,13,240,75,0,0 ; movdqa 0x4bf0(%rip),%xmm1 # 2d220 <_sk_overlay_sse2_8bit+0x15ab>
+ DB 102,15,111,13,198,75,0,0 ; movdqa 0x4bc6(%rip),%xmm1 # 2d160 <_sk_overlay_sse2_8bit+0x15b0>
DB 102,68,15,56,0,241 ; pshufb %xmm1,%xmm14
DB 102,68,15,56,0,233 ; pshufb %xmm1,%xmm13
- DB 102,69,15,56,48,205 ; pmovzxbw %xmm13,%xmm9
+ DB 102,69,15,56,48,197 ; pmovzxbw %xmm13,%xmm8
DB 102,68,15,104,232 ; punpckhbw %xmm0,%xmm13
- DB 102,69,15,56,48,214 ; pmovzxbw %xmm14,%xmm10
+ DB 102,69,15,56,48,254 ; pmovzxbw %xmm14,%xmm15
DB 102,68,15,104,240 ; punpckhbw %xmm0,%xmm14
- DB 102,15,127,84,36,64 ; movdqa %xmm2,0x40(%rsp)
+ DB 102,15,127,84,36,80 ; movdqa %xmm2,0x50(%rsp)
DB 102,15,111,242 ; movdqa %xmm2,%xmm6
DB 102,15,111,234 ; movdqa %xmm2,%xmm5
DB 102,15,104,232 ; punpckhbw %xmm0,%xmm5
- DB 102,68,15,127,124,36,80 ; movdqa %xmm15,0x50(%rsp)
- DB 102,65,15,111,215 ; movdqa %xmm15,%xmm2
- DB 102,68,15,104,248 ; punpckhbw %xmm0,%xmm15
+ DB 102,68,15,127,84,36,96 ; movdqa %xmm10,0x60(%rsp)
+ DB 102,65,15,111,210 ; movdqa %xmm10,%xmm2
+ DB 102,68,15,104,208 ; punpckhbw %xmm0,%xmm10
DB 102,15,56,0,241 ; pshufb %xmm1,%xmm6
DB 102,15,56,0,209 ; pshufb %xmm1,%xmm2
- DB 102,68,15,56,48,226 ; pmovzxbw %xmm2,%xmm12
- DB 102,68,15,127,100,36,32 ; movdqa %xmm12,0x20(%rsp)
+ DB 102,15,56,48,202 ; pmovzxbw %xmm2,%xmm1
+ DB 102,15,127,76,36,16 ; movdqa %xmm1,0x10(%rsp)
DB 102,15,104,208 ; punpckhbw %xmm0,%xmm2
+ DB 102,15,127,84,36,64 ; movdqa %xmm2,0x40(%rsp)
+ DB 102,15,56,48,214 ; pmovzxbw %xmm6,%xmm2
DB 102,15,127,84,36,48 ; movdqa %xmm2,0x30(%rsp)
- DB 102,15,56,48,222 ; pmovzxbw %xmm6,%xmm3
DB 102,15,104,240 ; punpckhbw %xmm0,%xmm6
- DB 102,15,111,254 ; movdqa %xmm6,%xmm7
- DB 102,15,111,196 ; movdqa %xmm4,%xmm0
+ DB 102,68,15,111,206 ; movdqa %xmm6,%xmm9
+ DB 102,15,111,199 ; movdqa %xmm7,%xmm0
DB 102,15,253,192 ; paddw %xmm0,%xmm0
- DB 102,15,111,200 ; movdqa %xmm0,%xmm1
- DB 102,65,15,56,58,205 ; pminuw %xmm13,%xmm1
- DB 102,15,117,200 ; pcmpeqw %xmm0,%xmm1
- DB 102,15,127,140,36,240,0,0,0 ; movdqa %xmm1,0xf0(%rsp)
- DB 102,65,15,111,192 ; movdqa %xmm8,%xmm0
+ DB 102,15,111,208 ; movdqa %xmm0,%xmm2
+ DB 102,65,15,56,58,213 ; pminuw %xmm13,%xmm2
+ DB 102,15,117,208 ; pcmpeqw %xmm0,%xmm2
+ DB 102,15,127,148,36,240,0,0,0 ; movdqa %xmm2,0xf0(%rsp)
+ DB 102,15,111,196 ; movdqa %xmm4,%xmm0
DB 102,15,253,192 ; paddw %xmm0,%xmm0
- DB 102,15,111,200 ; movdqa %xmm0,%xmm1
- DB 102,65,15,56,58,206 ; pminuw %xmm14,%xmm1
- DB 102,15,117,200 ; pcmpeqw %xmm0,%xmm1
- DB 102,15,127,140,36,208,0,0,0 ; movdqa %xmm1,0xd0(%rsp)
+ DB 102,15,111,208 ; movdqa %xmm0,%xmm2
+ DB 102,65,15,56,58,214 ; pminuw %xmm14,%xmm2
+ DB 102,15,117,208 ; pcmpeqw %xmm0,%xmm2
+ DB 102,15,127,148,36,208,0,0,0 ; movdqa %xmm2,0xd0(%rsp)
DB 102,65,15,111,195 ; movdqa %xmm11,%xmm0
DB 102,15,253,192 ; paddw %xmm0,%xmm0
DB 102,15,111,208 ; movdqa %xmm0,%xmm2
- DB 102,65,15,111,225 ; movdqa %xmm9,%xmm4
- DB 102,15,127,100,36,96 ; movdqa %xmm4,0x60(%rsp)
- DB 102,15,56,58,212 ; pminuw %xmm4,%xmm2
+ DB 102,65,15,111,216 ; movdqa %xmm8,%xmm3
+ DB 102,15,127,92,36,112 ; movdqa %xmm3,0x70(%rsp)
+ DB 102,15,56,58,211 ; pminuw %xmm3,%xmm2
DB 102,15,117,208 ; pcmpeqw %xmm0,%xmm2
DB 102,15,127,148,36,0,1,0,0 ; movdqa %xmm2,0x100(%rsp)
DB 102,15,111,4,36 ; movdqa (%rsp),%xmm0
DB 102,15,253,192 ; paddw %xmm0,%xmm0
DB 102,15,111,240 ; movdqa %xmm0,%xmm6
- DB 102,65,15,56,58,242 ; pminuw %xmm10,%xmm6
+ DB 102,65,15,56,58,247 ; pminuw %xmm15,%xmm6
DB 102,15,117,240 ; pcmpeqw %xmm0,%xmm6
DB 102,15,127,180,36,192,0,0,0 ; movdqa %xmm6,0xc0(%rsp)
- DB 102,15,111,53,156,67,0,0 ; movdqa 0x439c(%rip),%xmm6 # 2cad0 <_sk_overlay_sse2_8bit+0xe5b>
- DB 102,15,111,199 ; movdqa %xmm7,%xmm0
+ DB 102,15,111,53,110,67,0,0 ; movdqa 0x436e(%rip),%xmm6 # 2ca10 <_sk_overlay_sse2_8bit+0xe60>
+ DB 102,65,15,111,193 ; movdqa %xmm9,%xmm0
DB 102,15,239,198 ; pxor %xmm6,%xmm0
- DB 102,65,15,213,192 ; pmullw %xmm8,%xmm0
+ DB 102,15,213,196 ; pmullw %xmm4,%xmm0
DB 102,15,127,132,36,224,0,0,0 ; movdqa %xmm0,0xe0(%rsp)
DB 102,69,15,111,222 ; movdqa %xmm14,%xmm11
DB 102,68,15,239,222 ; pxor %xmm6,%xmm11
DB 102,68,15,213,221 ; pmullw %xmm5,%xmm11
- DB 102,15,111,199 ; movdqa %xmm7,%xmm0
- DB 102,15,249,253 ; psubw %xmm5,%xmm7
- DB 102,15,127,188,36,128,0,0,0 ; movdqa %xmm7,0x80(%rsp)
+ DB 102,65,15,111,193 ; movdqa %xmm9,%xmm0
+ DB 102,68,15,249,205 ; psubw %xmm5,%xmm9
+ DB 102,68,15,127,140,36,128,0,0,0 ; movdqa %xmm9,0x80(%rsp)
DB 102,68,15,111,205 ; movdqa %xmm5,%xmm9
- DB 102,69,15,213,200 ; pmullw %xmm8,%xmm9
+ DB 102,68,15,213,204 ; pmullw %xmm4,%xmm9
DB 102,65,15,213,198 ; pmullw %xmm14,%xmm0
DB 102,15,127,132,36,144,0,0,0 ; movdqa %xmm0,0x90(%rsp)
- DB 102,69,15,249,240 ; psubw %xmm8,%xmm14
- DB 102,15,111,195 ; movdqa %xmm3,%xmm0
+ DB 102,68,15,249,244 ; psubw %xmm4,%xmm14
+ DB 102,15,111,108,36,48 ; movdqa 0x30(%rsp),%xmm5
+ DB 102,15,111,197 ; movdqa %xmm5,%xmm0
DB 102,15,239,198 ; pxor %xmm6,%xmm0
- DB 102,68,15,111,192 ; movdqa %xmm0,%xmm8
- DB 102,65,15,111,212 ; movdqa %xmm12,%xmm2
+ DB 102,15,127,68,36,32 ; movdqa %xmm0,0x20(%rsp)
+ DB 102,15,111,209 ; movdqa %xmm1,%xmm2
DB 102,15,239,214 ; pxor %xmm6,%xmm2
- DB 102,15,111,76,36,48 ; movdqa 0x30(%rsp),%xmm1
- DB 102,15,111,193 ; movdqa %xmm1,%xmm0
+ DB 102,15,111,100,36,64 ; movdqa 0x40(%rsp),%xmm4
+ DB 102,15,111,196 ; movdqa %xmm4,%xmm0
DB 102,15,239,198 ; pxor %xmm6,%xmm0
- DB 102,68,15,111,100,36,16 ; movdqa 0x10(%rsp),%xmm12
- DB 102,65,15,213,196 ; pmullw %xmm12,%xmm0
+ DB 102,15,111,207 ; movdqa %xmm7,%xmm1
+ DB 102,15,213,193 ; pmullw %xmm1,%xmm0
DB 102,15,127,132,36,160,0,0,0 ; movdqa %xmm0,0xa0(%rsp)
- DB 102,65,15,111,194 ; movdqa %xmm10,%xmm0
- DB 102,15,111,248 ; movdqa %xmm0,%xmm7
+ DB 102,65,15,111,199 ; movdqa %xmm15,%xmm0
+ DB 102,68,15,111,192 ; movdqa %xmm0,%xmm8
+ DB 102,68,15,239,198 ; pxor %xmm6,%xmm8
+ DB 102,15,111,251 ; movdqa %xmm3,%xmm7
DB 102,15,239,254 ; pxor %xmm6,%xmm7
- DB 102,15,111,236 ; movdqa %xmm4,%xmm5
- DB 102,15,239,238 ; pxor %xmm6,%xmm5
DB 102,65,15,239,245 ; pxor %xmm13,%xmm6
- DB 102,65,15,111,231 ; movdqa %xmm15,%xmm4
- DB 102,15,213,244 ; pmullw %xmm4,%xmm6
- DB 102,68,15,111,249 ; movdqa %xmm1,%xmm15
- DB 102,15,249,204 ; psubw %xmm4,%xmm1
- DB 102,15,127,76,36,48 ; movdqa %xmm1,0x30(%rsp)
- DB 102,65,15,213,228 ; pmullw %xmm12,%xmm4
+ DB 102,65,15,213,242 ; pmullw %xmm10,%xmm6
+ DB 102,68,15,111,252 ; movdqa %xmm4,%xmm15
+ DB 102,65,15,249,226 ; psubw %xmm10,%xmm4
+ DB 102,15,127,100,36,64 ; movdqa %xmm4,0x40(%rsp)
+ DB 102,65,15,111,226 ; movdqa %xmm10,%xmm4
+ DB 102,15,213,225 ; pmullw %xmm1,%xmm4
DB 102,69,15,213,253 ; pmullw %xmm13,%xmm15
- DB 102,69,15,249,236 ; psubw %xmm12,%xmm13
- DB 102,68,15,111,20,36 ; movdqa (%rsp),%xmm10
- DB 102,69,15,213,194 ; pmullw %xmm10,%xmm8
- DB 102,68,15,127,68,36,16 ; movdqa %xmm8,0x10(%rsp)
- DB 102,68,15,56,48,68,36,64 ; pmovzxbw 0x40(%rsp),%xmm8
- DB 102,65,15,213,248 ; pmullw %xmm8,%xmm7
- DB 102,68,15,111,227 ; movdqa %xmm3,%xmm12
- DB 102,65,15,249,216 ; psubw %xmm8,%xmm3
- DB 102,15,127,92,36,112 ; movdqa %xmm3,0x70(%rsp)
- DB 102,69,15,213,194 ; pmullw %xmm10,%xmm8
+ DB 102,68,15,249,233 ; psubw %xmm1,%xmm13
+ DB 102,15,111,28,36 ; movdqa (%rsp),%xmm3
+ DB 102,15,111,76,36,32 ; movdqa 0x20(%rsp),%xmm1
+ DB 102,15,213,203 ; pmullw %xmm3,%xmm1
+ DB 102,15,127,76,36,32 ; movdqa %xmm1,0x20(%rsp)
+ DB 102,15,56,48,76,36,80 ; pmovzxbw 0x50(%rsp),%xmm1
+ DB 102,68,15,213,193 ; pmullw %xmm1,%xmm8
+ DB 102,68,15,111,229 ; movdqa %xmm5,%xmm12
+ DB 102,15,249,233 ; psubw %xmm1,%xmm5
+ DB 102,15,127,108,36,48 ; movdqa %xmm5,0x30(%rsp)
+ DB 102,15,111,233 ; movdqa %xmm1,%xmm5
+ DB 102,68,15,111,211 ; movdqa %xmm3,%xmm10
+ DB 102,65,15,213,234 ; pmullw %xmm10,%xmm5
DB 102,68,15,213,224 ; pmullw %xmm0,%xmm12
DB 102,65,15,249,194 ; psubw %xmm10,%xmm0
DB 102,15,111,200 ; movdqa %xmm0,%xmm1
DB 102,15,111,156,36,176,0,0,0 ; movdqa 0xb0(%rsp),%xmm3
DB 102,15,213,211 ; pmullw %xmm3,%xmm2
DB 102,15,127,20,36 ; movdqa %xmm2,(%rsp)
- DB 102,15,56,48,84,36,80 ; pmovzxbw 0x50(%rsp),%xmm2
- DB 102,15,213,234 ; pmullw %xmm2,%xmm5
- DB 102,15,111,68,36,32 ; movdqa 0x20(%rsp),%xmm0
+ DB 102,15,56,48,84,36,96 ; pmovzxbw 0x60(%rsp),%xmm2
+ DB 102,15,213,250 ; pmullw %xmm2,%xmm7
+ DB 102,15,111,68,36,16 ; movdqa 0x10(%rsp),%xmm0
DB 102,68,15,111,208 ; movdqa %xmm0,%xmm10
DB 102,15,249,194 ; psubw %xmm2,%xmm0
- DB 102,15,127,68,36,32 ; movdqa %xmm0,0x20(%rsp)
+ DB 102,15,127,68,36,16 ; movdqa %xmm0,0x10(%rsp)
DB 102,15,213,211 ; pmullw %xmm3,%xmm2
- DB 102,15,111,68,36,96 ; movdqa 0x60(%rsp),%xmm0
+ DB 102,15,111,68,36,112 ; movdqa 0x70(%rsp),%xmm0
DB 102,68,15,213,208 ; pmullw %xmm0,%xmm10
DB 102,15,249,195 ; psubw %xmm3,%xmm0
- DB 102,68,15,213,108,36,48 ; pmullw 0x30(%rsp),%xmm13
+ DB 102,68,15,213,108,36,64 ; pmullw 0x40(%rsp),%xmm13
DB 102,68,15,213,180,36,128,0,0,0 ; pmullw 0x80(%rsp),%xmm14
- DB 102,15,213,68,36,32 ; pmullw 0x20(%rsp),%xmm0
- DB 102,15,213,76,36,112 ; pmullw 0x70(%rsp),%xmm1
+ DB 102,15,213,68,36,16 ; pmullw 0x10(%rsp),%xmm0
+ DB 102,15,213,76,36,48 ; pmullw 0x30(%rsp),%xmm1
DB 102,15,253,192 ; paddw %xmm0,%xmm0
DB 102,68,15,249,208 ; psubw %xmm0,%xmm10
DB 102,15,253,201 ; paddw %xmm1,%xmm1
@@ -38722,11 +38725,11 @@ _sk_hardlight_sse41_8bit LABEL PROC
DB 102,65,15,223,199 ; pandn %xmm15,%xmm0
DB 102,15,235,196 ; por %xmm4,%xmm0
DB 102,15,111,200 ; movdqa %xmm0,%xmm1
- DB 102,69,15,253,192 ; paddw %xmm8,%xmm8
+ DB 102,15,253,237 ; paddw %xmm5,%xmm5
DB 102,15,111,132,36,192,0,0,0 ; movdqa 0xc0(%rsp),%xmm0
- DB 102,68,15,219,192 ; pand %xmm0,%xmm8
+ DB 102,15,219,232 ; pand %xmm0,%xmm5
DB 102,65,15,223,196 ; pandn %xmm12,%xmm0
- DB 102,65,15,235,192 ; por %xmm8,%xmm0
+ DB 102,15,235,197 ; por %xmm5,%xmm0
DB 102,15,111,224 ; movdqa %xmm0,%xmm4
DB 102,15,253,210 ; paddw %xmm2,%xmm2
DB 102,15,111,132,36,0,1,0,0 ; movdqa 0x100(%rsp),%xmm0
@@ -38736,33 +38739,33 @@ _sk_hardlight_sse41_8bit LABEL PROC
DB 102,15,111,208 ; movdqa %xmm0,%xmm2
DB 102,68,15,253,156,36,224,0,0,0 ; paddw 0xe0(%rsp),%xmm11
DB 102,15,253,180,36,160,0,0,0 ; paddw 0xa0(%rsp),%xmm6
- DB 102,15,253,124,36,16 ; paddw 0x10(%rsp),%xmm7
- DB 102,15,253,44,36 ; paddw (%rsp),%xmm5
- DB 102,15,111,5,57,73,0,0 ; movdqa 0x4939(%rip),%xmm0 # 2d2b0 <_sk_overlay_sse2_8bit+0x163b>
+ DB 102,68,15,253,68,36,32 ; paddw 0x20(%rsp),%xmm8
+ DB 102,15,253,60,36 ; paddw (%rsp),%xmm7
+ DB 102,15,111,5,251,72,0,0 ; movdqa 0x48fb(%rip),%xmm0 # 2d1f0 <_sk_overlay_sse2_8bit+0x1640>
DB 102,68,15,253,216 ; paddw %xmm0,%xmm11
DB 102,68,15,253,219 ; paddw %xmm3,%xmm11
DB 102,15,253,240 ; paddw %xmm0,%xmm6
DB 102,15,253,241 ; paddw %xmm1,%xmm6
+ DB 102,68,15,253,192 ; paddw %xmm0,%xmm8
+ DB 102,68,15,253,196 ; paddw %xmm4,%xmm8
DB 102,15,253,248 ; paddw %xmm0,%xmm7
- DB 102,15,253,252 ; paddw %xmm4,%xmm7
- DB 102,15,253,232 ; paddw %xmm0,%xmm5
- DB 102,15,253,234 ; paddw %xmm2,%xmm5
- DB 102,15,111,5,31,73,0,0 ; movdqa 0x491f(%rip),%xmm0 # 2d2c0 <_sk_overlay_sse2_8bit+0x164b>
+ DB 102,15,253,250 ; paddw %xmm2,%xmm7
+ DB 102,15,111,5,223,72,0,0 ; movdqa 0x48df(%rip),%xmm0 # 2d200 <_sk_overlay_sse2_8bit+0x1650>
DB 102,15,228,240 ; pmulhuw %xmm0,%xmm6
DB 102,68,15,228,216 ; pmulhuw %xmm0,%xmm11
- DB 102,15,228,232 ; pmulhuw %xmm0,%xmm5
DB 102,15,228,248 ; pmulhuw %xmm0,%xmm7
+ DB 102,68,15,228,192 ; pmulhuw %xmm0,%xmm8
DB 102,65,15,113,211,7 ; psrlw $0x7,%xmm11
- DB 102,15,113,215,7 ; psrlw $0x7,%xmm7
- DB 102,65,15,103,251 ; packuswb %xmm11,%xmm7
+ DB 102,65,15,113,208,7 ; psrlw $0x7,%xmm8
+ DB 102,69,15,103,195 ; packuswb %xmm11,%xmm8
DB 102,15,113,214,7 ; psrlw $0x7,%xmm6
- DB 102,15,113,213,7 ; psrlw $0x7,%xmm5
- DB 102,15,103,238 ; packuswb %xmm6,%xmm5
+ DB 102,15,113,215,7 ; psrlw $0x7,%xmm7
+ DB 102,15,103,254 ; packuswb %xmm6,%xmm7
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 15,40,84,36,64 ; movaps 0x40(%rsp),%xmm2
- DB 15,40,92,36,80 ; movaps 0x50(%rsp),%xmm3
- DB 102,15,111,199 ; movdqa %xmm7,%xmm0
- DB 102,15,111,205 ; movdqa %xmm5,%xmm1
+ DB 15,40,84,36,80 ; movaps 0x50(%rsp),%xmm2
+ DB 15,40,92,36,96 ; movaps 0x60(%rsp),%xmm3
+ DB 102,65,15,111,192 ; movdqa %xmm8,%xmm0
+ DB 102,15,111,207 ; movdqa %xmm7,%xmm1
DB 72,129,196,24,1,0,0 ; add $0x118,%rsp
DB 255,224 ; jmpq *%rax
@@ -38780,7 +38783,7 @@ _sk_overlay_sse41_8bit LABEL PROC
DB 102,15,127,12,36 ; movdqa %xmm1,(%rsp)
DB 102,65,15,56,48,206 ; pmovzxbw %xmm14,%xmm1
DB 102,15,127,140,36,16,1,0,0 ; movdqa %xmm1,0x110(%rsp)
- DB 102,15,111,13,233,71,0,0 ; movdqa 0x47e9(%rip),%xmm1 # 2d220 <_sk_overlay_sse2_8bit+0x15ab>
+ DB 102,15,111,13,166,71,0,0 ; movdqa 0x47a6(%rip),%xmm1 # 2d160 <_sk_overlay_sse2_8bit+0x15b0>
DB 102,68,15,56,0,249 ; pshufb %xmm1,%xmm15
DB 102,68,15,56,0,241 ; pshufb %xmm1,%xmm14
DB 102,65,15,56,48,238 ; pmovzxbw %xmm14,%xmm5
@@ -38832,7 +38835,7 @@ _sk_overlay_sse41_8bit LABEL PROC
DB 102,65,15,56,58,221 ; pminuw %xmm13,%xmm3
DB 102,15,117,216 ; pcmpeqw %xmm0,%xmm3
DB 102,15,127,156,36,176,0,0,0 ; movdqa %xmm3,0xb0(%rsp)
- DB 102,15,111,53,124,63,0,0 ; movdqa 0x3f7c(%rip),%xmm6 # 2cad0 <_sk_overlay_sse2_8bit+0xe5b>
+ DB 102,15,111,53,57,63,0,0 ; movdqa 0x3f39(%rip),%xmm6 # 2ca10 <_sk_overlay_sse2_8bit+0xe60>
DB 102,65,15,111,193 ; movdqa %xmm9,%xmm0
DB 102,15,239,198 ; pxor %xmm6,%xmm0
DB 102,15,213,196 ; pmullw %xmm4,%xmm0
@@ -38941,7 +38944,7 @@ _sk_overlay_sse41_8bit LABEL PROC
DB 102,15,253,180,36,160,0,0,0 ; paddw 0xa0(%rsp),%xmm6
DB 102,68,15,253,132,36,128,0,0,0 ; paddw 0x80(%rsp),%xmm8
DB 102,15,253,44,36 ; paddw (%rsp),%xmm5
- DB 102,15,111,5,24,69,0,0 ; movdqa 0x4518(%rip),%xmm0 # 2d2b0 <_sk_overlay_sse2_8bit+0x163b>
+ DB 102,15,111,5,213,68,0,0 ; movdqa 0x44d5(%rip),%xmm0 # 2d1f0 <_sk_overlay_sse2_8bit+0x1640>
DB 102,68,15,253,216 ; paddw %xmm0,%xmm11
DB 102,69,15,253,217 ; paddw %xmm9,%xmm11
DB 102,15,253,240 ; paddw %xmm0,%xmm6
@@ -38950,7 +38953,7 @@ _sk_overlay_sse41_8bit LABEL PROC
DB 102,68,15,253,195 ; paddw %xmm3,%xmm8
DB 102,15,253,232 ; paddw %xmm0,%xmm5
DB 102,15,253,234 ; paddw %xmm2,%xmm5
- DB 102,15,111,5,252,68,0,0 ; movdqa 0x44fc(%rip),%xmm0 # 2d2c0 <_sk_overlay_sse2_8bit+0x164b>
+ DB 102,15,111,5,185,68,0,0 ; movdqa 0x44b9(%rip),%xmm0 # 2d200 <_sk_overlay_sse2_8bit+0x1650>
DB 102,15,228,240 ; pmulhuw %xmm0,%xmm6
DB 102,68,15,228,216 ; pmulhuw %xmm0,%xmm11
DB 102,15,228,232 ; pmulhuw %xmm0,%xmm5
@@ -38968,9 +38971,6 @@ _sk_overlay_sse41_8bit LABEL PROC
DB 102,15,111,205 ; movdqa %xmm5,%xmm1
DB 72,129,196,72,1,0,0 ; add $0x148,%rsp
DB 255,224 ; jmpq *%rax
- DB 144 ; nop
- DB 144 ; nop
- DB 144 ; nop
PUBLIC _sk_start_pipeline_sse2_8bit
_sk_start_pipeline_sse2_8bit LABEL PROC
@@ -38983,7 +38983,7 @@ _sk_start_pipeline_sse2_8bit LABEL PROC
DB 86 ; push %rsi
DB 87 ; push %rdi
DB 83 ; push %rbx
- DB 72,129,236,216,0,0,0 ; sub $0xd8,%rsp
+ DB 72,129,236,200,0,0,0 ; sub $0xc8,%rsp
DB 68,15,41,125,176 ; movaps %xmm15,-0x50(%rbp)
DB 68,15,41,117,160 ; movaps %xmm14,-0x60(%rbp)
DB 68,15,41,109,144 ; movaps %xmm13,-0x70(%rbp)
@@ -38994,45 +38994,42 @@ _sk_start_pipeline_sse2_8bit LABEL PROC
DB 68,15,41,133,64,255,255,255 ; movaps %xmm8,-0xc0(%rbp)
DB 15,41,189,48,255,255,255 ; movaps %xmm7,-0xd0(%rbp)
DB 15,41,181,32,255,255,255 ; movaps %xmm6,-0xe0(%rbp)
- DB 76,137,195 ; mov %r8,%rbx
- DB 73,137,215 ; mov %rdx,%r15
+ DB 77,137,199 ; mov %r8,%r15
+ DB 72,137,211 ; mov %rdx,%rbx
DB 72,137,141,24,255,255,255 ; mov %rcx,-0xe8(%rbp)
DB 72,139,117,48 ; mov 0x30(%rbp),%rsi
DB 72,173 ; lods %ds:(%rsi),%rax
DB 73,137,197 ; mov %rax,%r13
DB 73,137,246 ; mov %rsi,%r14
- DB 76,137,141,240,254,255,255 ; mov %r9,-0x110(%rbp)
- DB 77,57,207 ; cmp %r9,%r15
- DB 15,131,138,0,0,0 ; jae 28f27 <_sk_start_pipeline_sse2_8bit+0x10b>
+ DB 76,137,141,8,255,255,255 ; mov %r9,-0xf8(%rbp)
+ DB 76,57,203 ; cmp %r9,%rbx
+ DB 115,101 ; jae 28e7e <_sk_start_pipeline_sse2_8bit+0xe2>
DB 72,139,133,24,255,255,255 ; mov -0xe8(%rbp),%rax
DB 72,141,64,8 ; lea 0x8(%rax),%rax
- DB 72,137,133,248,254,255,255 ; mov %rax,-0x108(%rbp)
- DB 76,141,165,0,255,255,255 ; lea -0x100(%rbp),%r12
- DB 72,57,157,248,254,255,255 ; cmp %rbx,-0x108(%rbp)
- DB 72,139,133,24,255,255,255 ; mov -0xe8(%rbp),%rax
- DB 72,137,133,0,255,255,255 ; mov %rax,-0x100(%rbp)
- DB 76,137,189,8,255,255,255 ; mov %r15,-0xf8(%rbp)
- DB 72,199,133,16,255,255,255,0,0,0,0 ; movq $0x0,-0xf0(%rbp)
- DB 119,36 ; ja 28f03 <_sk_start_pipeline_sse2_8bit+0xe7>
- DB 76,137,231 ; mov %r12,%rdi
+ DB 72,137,133,16,255,255,255 ; mov %rax,-0xf0(%rbp)
+ DB 76,57,189,16,255,255,255 ; cmp %r15,-0xf0(%rbp)
+ DB 72,139,149,24,255,255,255 ; mov -0xe8(%rbp),%rdx
+ DB 119,38 ; ja 28e61 <_sk_start_pipeline_sse2_8bit+0xc5>
+ DB 76,139,165,24,255,255,255 ; mov -0xe8(%rbp),%r12
+ DB 49,255 ; xor %edi,%edi
DB 76,137,246 ; mov %r14,%rsi
- DB 65,255,213 ; callq *%r13
- DB 72,139,141,0,255,255,255 ; mov -0x100(%rbp),%rcx
- DB 72,141,65,8 ; lea 0x8(%rcx),%rax
- DB 72,137,133,0,255,255,255 ; mov %rax,-0x100(%rbp)
- DB 72,131,193,16 ; add $0x10,%rcx
- DB 72,57,217 ; cmp %rbx,%rcx
- DB 118,220 ; jbe 28edf <_sk_start_pipeline_sse2_8bit+0xc3>
+ DB 76,137,226 ; mov %r12,%rdx
DB 72,137,217 ; mov %rbx,%rcx
- DB 72,41,193 ; sub %rax,%rcx
- DB 116,16 ; je 28f1b <_sk_start_pipeline_sse2_8bit+0xff>
- DB 72,137,141,16,255,255,255 ; mov %rcx,-0xf0(%rbp)
- DB 76,137,231 ; mov %r12,%rdi
+ DB 65,255,213 ; callq *%r13
+ DB 73,141,84,36,8 ; lea 0x8(%r12),%rdx
+ DB 73,131,196,16 ; add $0x10,%r12
+ DB 77,57,252 ; cmp %r15,%r12
+ DB 73,137,212 ; mov %rdx,%r12
+ DB 118,225 ; jbe 28e42 <_sk_start_pipeline_sse2_8bit+0xa6>
+ DB 76,137,255 ; mov %r15,%rdi
+ DB 72,41,215 ; sub %rdx,%rdi
+ DB 116,9 ; je 28e72 <_sk_start_pipeline_sse2_8bit+0xd6>
DB 76,137,246 ; mov %r14,%rsi
+ DB 72,137,217 ; mov %rbx,%rcx
DB 65,255,213 ; callq *%r13
- DB 73,255,199 ; inc %r15
- DB 76,59,189,240,254,255,255 ; cmp -0x110(%rbp),%r15
- DB 117,143 ; jne 28eb6 <_sk_start_pipeline_sse2_8bit+0x9a>
+ DB 72,255,195 ; inc %rbx
+ DB 72,59,157,8,255,255,255 ; cmp -0xf8(%rbp),%rbx
+ DB 117,173 ; jne 28e2b <_sk_start_pipeline_sse2_8bit+0x8f>
DB 15,40,181,32,255,255,255 ; movaps -0xe0(%rbp),%xmm6
DB 15,40,189,48,255,255,255 ; movaps -0xd0(%rbp),%xmm7
DB 68,15,40,133,64,255,255,255 ; movaps -0xc0(%rbp),%xmm8
@@ -39043,7 +39040,7 @@ _sk_start_pipeline_sse2_8bit LABEL PROC
DB 68,15,40,109,144 ; movaps -0x70(%rbp),%xmm13
DB 68,15,40,117,160 ; movaps -0x60(%rbp),%xmm14
DB 68,15,40,125,176 ; movaps -0x50(%rbp),%xmm15
- DB 72,129,196,216,0,0,0 ; add $0xd8,%rsp
+ DB 72,129,196,200,0,0,0 ; add $0xc8,%rsp
DB 91 ; pop %rbx
DB 95 ; pop %rdi
DB 94 ; pop %rsi
@@ -39070,22 +39067,22 @@ _sk_uniform_color_sse2_8bit LABEL PROC
PUBLIC _sk_set_rgb_sse2_8bit
_sk_set_rgb_sse2_8bit LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 243,15,16,37,116,49,0,0 ; movss 0x3174(%rip),%xmm4 # 2c110 <_sk_overlay_sse2_8bit+0x49b>
+ DB 243,15,16,37,89,49,0,0 ; movss 0x3159(%rip),%xmm4 # 2c04c <_sk_overlay_sse2_8bit+0x49c>
DB 243,15,16,40 ; movss (%rax),%xmm5
DB 243,15,89,236 ; mulss %xmm4,%xmm5
- DB 243,72,15,44,205 ; cvttss2si %xmm5,%rcx
+ DB 243,76,15,44,197 ; cvttss2si %xmm5,%r8
DB 243,15,16,104,4 ; movss 0x4(%rax),%xmm5
DB 243,15,89,236 ; mulss %xmm4,%xmm5
- DB 243,72,15,44,213 ; cvttss2si %xmm5,%rdx
- DB 193,226,8 ; shl $0x8,%edx
- DB 9,202 ; or %ecx,%edx
+ DB 243,76,15,44,205 ; cvttss2si %xmm5,%r9
+ DB 65,193,225,8 ; shl $0x8,%r9d
+ DB 69,9,193 ; or %r8d,%r9d
DB 243,15,89,96,8 ; mulss 0x8(%rax),%xmm4
DB 243,72,15,44,196 ; cvttss2si %xmm4,%rax
DB 193,224,16 ; shl $0x10,%eax
- DB 9,208 ; or %edx,%eax
+ DB 68,9,200 ; or %r9d,%eax
DB 102,15,110,224 ; movd %eax,%xmm4
DB 102,15,112,228,0 ; pshufd $0x0,%xmm4,%xmm4
- DB 102,15,111,45,52,66,0,0 ; movdqa 0x4234(%rip),%xmm5 # 2d210 <_sk_overlay_sse2_8bit+0x159b>
+ DB 102,15,111,45,26,66,0,0 ; movdqa 0x421a(%rip),%xmm5 # 2d150 <_sk_overlay_sse2_8bit+0x15a0>
DB 102,15,219,205 ; pand %xmm5,%xmm1
DB 102,15,219,197 ; pand %xmm5,%xmm0
DB 102,15,235,196 ; por %xmm4,%xmm0
@@ -39108,7 +39105,7 @@ _sk_premul_sse2_8bit LABEL PROC
DB 102,15,96,192 ; punpcklbw %xmm0,%xmm0
DB 242,15,112,192,95 ; pshuflw $0x5f,%xmm0,%xmm0
DB 243,15,112,248,95 ; pshufhw $0x5f,%xmm0,%xmm7
- DB 102,15,111,5,216,65,0,0 ; movdqa 0x41d8(%rip),%xmm0 # 2d210 <_sk_overlay_sse2_8bit+0x159b>
+ DB 102,15,111,5,190,65,0,0 ; movdqa 0x41be(%rip),%xmm0 # 2d150 <_sk_overlay_sse2_8bit+0x15a0>
DB 102,15,235,248 ; por %xmm0,%xmm7
DB 102,15,235,240 ; por %xmm0,%xmm6
DB 102,69,15,239,201 ; pxor %xmm9,%xmm9
@@ -39174,53 +39171,53 @@ _sk_invert_sse2_8bit LABEL PROC
PUBLIC _sk_load_8888_sse2_8bit
_sk_load_8888_sse2_8bit LABEL PROC
- DB 76,99,7 ; movslq (%rdi),%r8
- DB 76,139,79,16 ; mov 0x10(%rdi),%r9
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 72,99,72,8 ; movslq 0x8(%rax),%rcx
- DB 72,99,87,8 ; movslq 0x8(%rdi),%rdx
- DB 72,15,175,209 ; imul %rcx,%rdx
- DB 72,193,226,2 ; shl $0x2,%rdx
- DB 72,3,16 ; add (%rax),%rdx
- DB 77,133,201 ; test %r9,%r9
- DB 117,16 ; jne 29158 <_sk_load_8888_sse2_8bit+0x31>
- DB 66,15,16,76,130,16 ; movups 0x10(%rdx,%r8,4),%xmm1
- DB 102,66,15,16,4,130 ; movupd (%rdx,%r8,4),%xmm0
+ DB 76,99,72,8 ; movslq 0x8(%rax),%r9
+ DB 76,99,193 ; movslq %ecx,%r8
+ DB 77,15,175,193 ; imul %r9,%r8
+ DB 73,193,224,2 ; shl $0x2,%r8
+ DB 76,3,0 ; add (%rax),%r8
+ DB 76,99,218 ; movslq %edx,%r11
+ DB 72,133,255 ; test %rdi,%rdi
+ DB 117,16 ; jne 290ad <_sk_load_8888_sse2_8bit+0x2c>
+ DB 67,15,16,76,152,16 ; movups 0x10(%r8,%r11,4),%xmm1
+ DB 102,67,15,16,4,152 ; movupd (%r8,%r11,4),%xmm0
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
+ DB 65,137,249 ; mov %edi,%r9d
DB 65,128,225,7 ; and $0x7,%r9b
DB 102,15,239,201 ; pxor %xmm1,%xmm1
DB 102,15,239,192 ; pxor %xmm0,%xmm0
DB 65,254,201 ; dec %r9b
DB 65,128,249,6 ; cmp $0x6,%r9b
- DB 119,231 ; ja 29154 <_sk_load_8888_sse2_8bit+0x2d>
- DB 65,15,182,193 ; movzbl %r9b,%eax
- DB 72,141,13,80,0,0,0 ; lea 0x50(%rip),%rcx # 291c8 <_sk_load_8888_sse2_8bit+0xa1>
- DB 72,99,4,129 ; movslq (%rcx,%rax,4),%rax
- DB 72,1,200 ; add %rcx,%rax
+ DB 119,228 ; ja 290a9 <_sk_load_8888_sse2_8bit+0x28>
+ DB 69,15,182,201 ; movzbl %r9b,%r9d
+ DB 76,141,21,80,0,0,0 ; lea 0x50(%rip),%r10 # 29120 <_sk_load_8888_sse2_8bit+0x9f>
+ DB 75,99,4,138 ; movslq (%r10,%r9,4),%rax
+ DB 76,1,208 ; add %r10,%rax
DB 255,224 ; jmpq *%rax
- DB 243,66,15,16,4,130 ; movss (%rdx,%r8,4),%xmm0
- DB 235,203 ; jmp 29154 <_sk_load_8888_sse2_8bit+0x2d>
- DB 102,66,15,110,68,130,8 ; movd 0x8(%rdx,%r8,4),%xmm0
+ DB 243,67,15,16,4,152 ; movss (%r8,%r11,4),%xmm0
+ DB 235,200 ; jmp 290a9 <_sk_load_8888_sse2_8bit+0x28>
+ DB 102,67,15,110,68,152,8 ; movd 0x8(%r8,%r11,4),%xmm0
DB 102,15,112,192,69 ; pshufd $0x45,%xmm0,%xmm0
- DB 102,66,15,18,4,130 ; movlpd (%rdx,%r8,4),%xmm0
- DB 235,183 ; jmp 29154 <_sk_load_8888_sse2_8bit+0x2d>
- DB 102,66,15,110,68,130,24 ; movd 0x18(%rdx,%r8,4),%xmm0
+ DB 102,67,15,18,4,152 ; movlpd (%r8,%r11,4),%xmm0
+ DB 235,180 ; jmp 290a9 <_sk_load_8888_sse2_8bit+0x28>
+ DB 102,67,15,110,68,152,24 ; movd 0x18(%r8,%r11,4),%xmm0
DB 102,15,112,200,69 ; pshufd $0x45,%xmm0,%xmm1
- DB 243,66,15,16,68,130,20 ; movss 0x14(%rdx,%r8,4),%xmm0
+ DB 243,67,15,16,68,152,20 ; movss 0x14(%r8,%r11,4),%xmm0
DB 15,198,193,0 ; shufps $0x0,%xmm1,%xmm0
DB 15,198,193,226 ; shufps $0xe2,%xmm1,%xmm0
DB 15,40,200 ; movaps %xmm0,%xmm1
- DB 243,66,15,16,68,130,16 ; movss 0x10(%rdx,%r8,4),%xmm0
+ DB 243,67,15,16,68,152,16 ; movss 0x10(%r8,%r11,4),%xmm0
DB 243,15,16,200 ; movss %xmm0,%xmm1
- DB 235,134 ; jmp 2914e <_sk_load_8888_sse2_8bit+0x27>
+ DB 235,131 ; jmp 290a3 <_sk_load_8888_sse2_8bit+0x22>
DB 185,255,255,255,205 ; mov $0xcdffffff,%ecx
DB 255 ; (bad)
DB 255 ; (bad)
DB 255,193 ; inc %ecx
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,134,255,255,255,243 ; incl -0xc000001(%rsi)
+ DB 255,131,255,255,255,243 ; incl -0xc000001(%rbx)
DB 255 ; (bad)
DB 255 ; (bad)
DB 255,225 ; jmpq *%rcx
@@ -39233,141 +39230,136 @@ _sk_load_8888_sse2_8bit LABEL PROC
PUBLIC _sk_load_8888_dst_sse2_8bit
_sk_load_8888_dst_sse2_8bit LABEL PROC
- DB 76,99,7 ; movslq (%rdi),%r8
- DB 76,139,79,16 ; mov 0x10(%rdi),%r9
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 72,99,72,8 ; movslq 0x8(%rax),%rcx
- DB 72,99,87,8 ; movslq 0x8(%rdi),%rdx
- DB 72,15,175,209 ; imul %rcx,%rdx
- DB 72,193,226,2 ; shl $0x2,%rdx
- DB 72,3,16 ; add (%rax),%rdx
- DB 77,133,201 ; test %r9,%r9
- DB 117,16 ; jne 29215 <_sk_load_8888_dst_sse2_8bit+0x31>
- DB 66,15,16,92,130,16 ; movups 0x10(%rdx,%r8,4),%xmm3
- DB 102,66,15,16,20,130 ; movupd (%rdx,%r8,4),%xmm2
+ DB 76,99,72,8 ; movslq 0x8(%rax),%r9
+ DB 76,99,193 ; movslq %ecx,%r8
+ DB 77,15,175,193 ; imul %r9,%r8
+ DB 73,193,224,2 ; shl $0x2,%r8
+ DB 76,3,0 ; add (%rax),%r8
+ DB 76,99,218 ; movslq %edx,%r11
+ DB 72,133,255 ; test %rdi,%rdi
+ DB 117,16 ; jne 29168 <_sk_load_8888_dst_sse2_8bit+0x2c>
+ DB 67,15,16,92,152,16 ; movups 0x10(%r8,%r11,4),%xmm3
+ DB 102,67,15,16,20,152 ; movupd (%r8,%r11,4),%xmm2
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
+ DB 65,137,249 ; mov %edi,%r9d
DB 65,128,225,7 ; and $0x7,%r9b
DB 102,15,239,219 ; pxor %xmm3,%xmm3
DB 102,15,239,210 ; pxor %xmm2,%xmm2
DB 65,254,201 ; dec %r9b
DB 65,128,249,6 ; cmp $0x6,%r9b
- DB 119,231 ; ja 29211 <_sk_load_8888_dst_sse2_8bit+0x2d>
- DB 65,15,182,193 ; movzbl %r9b,%eax
- DB 72,141,13,83,0,0,0 ; lea 0x53(%rip),%rcx # 29288 <_sk_load_8888_dst_sse2_8bit+0xa4>
- DB 72,99,4,129 ; movslq (%rcx,%rax,4),%rax
- DB 72,1,200 ; add %rcx,%rax
+ DB 119,228 ; ja 29164 <_sk_load_8888_dst_sse2_8bit+0x28>
+ DB 69,15,182,201 ; movzbl %r9b,%r9d
+ DB 76,141,21,81,0,0,0 ; lea 0x51(%rip),%r10 # 291dc <_sk_load_8888_dst_sse2_8bit+0xa0>
+ DB 75,99,4,138 ; movslq (%r10,%r9,4),%rax
+ DB 76,1,208 ; add %r10,%rax
DB 255,224 ; jmpq *%rax
- DB 243,66,15,16,20,130 ; movss (%rdx,%r8,4),%xmm2
- DB 235,203 ; jmp 29211 <_sk_load_8888_dst_sse2_8bit+0x2d>
- DB 102,66,15,110,84,130,8 ; movd 0x8(%rdx,%r8,4),%xmm2
+ DB 243,67,15,16,20,152 ; movss (%r8,%r11,4),%xmm2
+ DB 235,200 ; jmp 29164 <_sk_load_8888_dst_sse2_8bit+0x28>
+ DB 102,67,15,110,84,152,8 ; movd 0x8(%r8,%r11,4),%xmm2
DB 102,15,112,210,69 ; pshufd $0x45,%xmm2,%xmm2
- DB 102,66,15,18,20,130 ; movlpd (%rdx,%r8,4),%xmm2
- DB 235,183 ; jmp 29211 <_sk_load_8888_dst_sse2_8bit+0x2d>
- DB 102,66,15,110,84,130,24 ; movd 0x18(%rdx,%r8,4),%xmm2
+ DB 102,67,15,18,20,152 ; movlpd (%r8,%r11,4),%xmm2
+ DB 235,180 ; jmp 29164 <_sk_load_8888_dst_sse2_8bit+0x28>
+ DB 102,67,15,110,84,152,24 ; movd 0x18(%r8,%r11,4),%xmm2
DB 102,15,112,218,69 ; pshufd $0x45,%xmm2,%xmm3
- DB 243,66,15,16,84,130,20 ; movss 0x14(%rdx,%r8,4),%xmm2
+ DB 243,67,15,16,84,152,20 ; movss 0x14(%r8,%r11,4),%xmm2
DB 15,198,211,0 ; shufps $0x0,%xmm3,%xmm2
DB 15,198,211,226 ; shufps $0xe2,%xmm3,%xmm2
DB 15,40,218 ; movaps %xmm2,%xmm3
- DB 243,66,15,16,84,130,16 ; movss 0x10(%rdx,%r8,4),%xmm2
+ DB 243,67,15,16,84,152,16 ; movss 0x10(%r8,%r11,4),%xmm2
DB 243,15,16,218 ; movss %xmm2,%xmm3
- DB 235,134 ; jmp 2920b <_sk_load_8888_dst_sse2_8bit+0x27>
- DB 15,31,0 ; nopl (%rax)
- DB 182,255 ; mov $0xff,%dh
- DB 255 ; (bad)
- DB 255,202 ; dec %edx
+ DB 235,131 ; jmp 2915e <_sk_load_8888_dst_sse2_8bit+0x22>
+ DB 144 ; nop
+ DB 184,255,255,255,204 ; mov $0xccffffff,%eax
DB 255 ; (bad)
DB 255 ; (bad)
+ DB 255,192 ; inc %eax
DB 255 ; (bad)
- DB 190,255,255,255,131 ; mov $0x83ffffff,%esi
DB 255 ; (bad)
- DB 255 ; (bad)
- DB 255,240 ; push %rax
+ DB 255,130,255,255,255,242 ; incl -0xd000001(%rdx)
DB 255 ; (bad)
DB 255 ; (bad)
+ DB 255,224 ; jmpq *%rax
DB 255 ; (bad)
- DB 222,255 ; fdivrp %st,%st(7)
DB 255 ; (bad)
- DB 255,210 ; callq *%rdx
+ DB 255,212 ; callq *%rsp
DB 255 ; (bad)
DB 255 ; (bad)
DB 255 ; .byte 0xff
PUBLIC _sk_store_8888_sse2_8bit
_sk_store_8888_sse2_8bit LABEL PROC
- DB 76,99,15 ; movslq (%rdi),%r9
- DB 76,139,71,16 ; mov 0x10(%rdi),%r8
- DB 72,173 ; lods %ds:(%rsi),%rax
- DB 72,99,72,8 ; movslq 0x8(%rax),%rcx
- DB 72,99,87,8 ; movslq 0x8(%rdi),%rdx
- DB 72,15,175,209 ; imul %rcx,%rdx
- DB 72,193,226,2 ; shl $0x2,%rdx
- DB 72,3,16 ; add (%rax),%rdx
- DB 77,133,192 ; test %r8,%r8
- DB 117,17 ; jne 292d6 <_sk_store_8888_sse2_8bit+0x32>
- DB 243,66,15,127,4,138 ; movdqu %xmm0,(%rdx,%r9,4)
- DB 243,66,15,127,76,138,16 ; movdqu %xmm1,0x10(%rdx,%r9,4)
- DB 72,173 ; lods %ds:(%rsi),%rax
- DB 255,224 ; jmpq *%rax
- DB 65,128,224,7 ; and $0x7,%r8b
- DB 65,254,200 ; dec %r8b
- DB 65,128,248,6 ; cmp $0x6,%r8b
- DB 119,239 ; ja 292d2 <_sk_store_8888_sse2_8bit+0x2e>
- DB 65,15,182,192 ; movzbl %r8b,%eax
- DB 72,141,13,78,0,0,0 ; lea 0x4e(%rip),%rcx # 2933c <_sk_store_8888_sse2_8bit+0x98>
- DB 72,99,4,129 ; movslq (%rcx,%rax,4),%rax
- DB 72,1,200 ; add %rcx,%rax
- DB 255,224 ; jmpq *%rax
- DB 102,66,15,126,4,138 ; movd %xmm0,(%rdx,%r9,4)
- DB 235,211 ; jmp 292d2 <_sk_store_8888_sse2_8bit+0x2e>
+ DB 72,173 ; lods %ds:(%rsi),%rax
+ DB 76,99,72,8 ; movslq 0x8(%rax),%r9
+ DB 76,99,193 ; movslq %ecx,%r8
+ DB 77,15,175,193 ; imul %r9,%r8
+ DB 73,193,224,2 ; shl $0x2,%r8
+ DB 76,3,0 ; add (%rax),%r8
+ DB 76,99,218 ; movslq %edx,%r11
+ DB 72,133,255 ; test %rdi,%rdi
+ DB 117,17 ; jne 29225 <_sk_store_8888_sse2_8bit+0x2d>
+ DB 243,67,15,127,4,152 ; movdqu %xmm0,(%r8,%r11,4)
+ DB 243,67,15,127,76,152,16 ; movdqu %xmm1,0x10(%r8,%r11,4)
+ DB 72,173 ; lods %ds:(%rsi),%rax
+ DB 255,224 ; jmpq *%rax
+ DB 65,137,249 ; mov %edi,%r9d
+ DB 65,128,225,7 ; and $0x7,%r9b
+ DB 65,254,201 ; dec %r9b
+ DB 65,128,249,6 ; cmp $0x6,%r9b
+ DB 119,236 ; ja 29221 <_sk_store_8888_sse2_8bit+0x29>
+ DB 69,15,182,201 ; movzbl %r9b,%r9d
+ DB 76,141,21,76,0,0,0 ; lea 0x4c(%rip),%r10 # 2928c <_sk_store_8888_sse2_8bit+0x94>
+ DB 75,99,4,138 ; movslq (%r10,%r9,4),%rax
+ DB 76,1,208 ; add %r10,%rax
+ DB 255,224 ; jmpq *%rax
+ DB 102,67,15,126,4,152 ; movd %xmm0,(%r8,%r11,4)
+ DB 235,208 ; jmp 29221 <_sk_store_8888_sse2_8bit+0x29>
DB 102,15,112,224,78 ; pshufd $0x4e,%xmm0,%xmm4
- DB 102,66,15,126,100,138,8 ; movd %xmm4,0x8(%rdx,%r9,4)
- DB 102,66,15,214,4,138 ; movq %xmm0,(%rdx,%r9,4)
- DB 235,191 ; jmp 292d2 <_sk_store_8888_sse2_8bit+0x2e>
+ DB 102,67,15,126,100,152,8 ; movd %xmm4,0x8(%r8,%r11,4)
+ DB 102,67,15,214,4,152 ; movq %xmm0,(%r8,%r11,4)
+ DB 235,188 ; jmp 29221 <_sk_store_8888_sse2_8bit+0x29>
DB 102,15,112,225,78 ; pshufd $0x4e,%xmm1,%xmm4
- DB 102,66,15,126,100,138,24 ; movd %xmm4,0x18(%rdx,%r9,4)
+ DB 102,67,15,126,100,152,24 ; movd %xmm4,0x18(%r8,%r11,4)
DB 102,15,112,225,229 ; pshufd $0xe5,%xmm1,%xmm4
- DB 102,66,15,126,100,138,20 ; movd %xmm4,0x14(%rdx,%r9,4)
- DB 102,66,15,126,76,138,16 ; movd %xmm1,0x10(%rdx,%r9,4)
- DB 243,66,15,127,4,138 ; movdqu %xmm0,(%rdx,%r9,4)
- DB 235,152 ; jmp 292d2 <_sk_store_8888_sse2_8bit+0x2e>
- DB 102,144 ; xchg %ax,%ax
- DB 187,255,255,255,207 ; mov $0xcfffffff,%ebx
+ DB 102,67,15,126,100,152,20 ; movd %xmm4,0x14(%r8,%r11,4)
+ DB 102,67,15,126,76,152,16 ; movd %xmm1,0x10(%r8,%r11,4)
+ DB 243,67,15,127,4,152 ; movdqu %xmm0,(%r8,%r11,4)
+ DB 235,149 ; jmp 29221 <_sk_store_8888_sse2_8bit+0x29>
+ DB 189,255,255,255,209 ; mov $0xd1ffffff,%ebp
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,195 ; inc %ebx
+ DB 255,197 ; inc %ebp
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,246 ; push %rsi
DB 255 ; (bad)
+ DB 248 ; clc
DB 255 ; (bad)
DB 255 ; (bad)
- DB 239 ; out %eax,(%dx)
+ DB 255,241 ; push %rcx
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,227 ; jmpq *%rbx
+ DB 255,229 ; jmpq *%rbp
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,215 ; callq *%rdi
DB 255 ; (bad)
+ DB 217,255 ; fcos
DB 255 ; (bad)
DB 255 ; .byte 0xff
PUBLIC _sk_load_bgra_sse2_8bit
_sk_load_bgra_sse2_8bit LABEL PROC
- DB 76,99,7 ; movslq (%rdi),%r8
- DB 76,139,79,16 ; mov 0x10(%rdi),%r9
- DB 72,173 ; lods %ds:(%rsi),%rax
- DB 72,99,72,8 ; movslq 0x8(%rax),%rcx
- DB 72,99,87,8 ; movslq 0x8(%rdi),%rdx
- DB 72,15,175,209 ; imul %rcx,%rdx
- DB 72,193,226,2 ; shl $0x2,%rdx
- DB 72,3,16 ; add (%rax),%rdx
- DB 77,133,201 ; test %r9,%r9
- DB 117,92 ; jne 293d5 <_sk_load_bgra_sse2_8bit+0x7d>
- DB 66,15,16,76,130,16 ; movups 0x10(%rdx,%r8,4),%xmm1
- DB 102,66,15,16,4,130 ; movupd (%rdx,%r8,4),%xmm0
+ DB 72,173 ; lods %ds:(%rsi),%rax
+ DB 76,99,72,8 ; movslq 0x8(%rax),%r9
+ DB 76,99,193 ; movslq %ecx,%r8
+ DB 77,15,175,193 ; imul %r9,%r8
+ DB 73,193,224,2 ; shl $0x2,%r8
+ DB 76,3,0 ; add (%rax),%r8
+ DB 76,99,218 ; movslq %edx,%r11
+ DB 72,133,255 ; test %rdi,%rdi
+ DB 117,92 ; jne 29320 <_sk_load_bgra_sse2_8bit+0x78>
+ DB 67,15,16,76,152,16 ; movups 0x10(%r8,%r11,4),%xmm1
+ DB 102,67,15,16,4,152 ; movupd (%r8,%r11,4),%xmm0
DB 102,15,239,228 ; pxor %xmm4,%xmm4
DB 102,15,40,232 ; movapd %xmm0,%xmm5
DB 102,15,104,236 ; punpckhbw %xmm4,%xmm5
@@ -39387,69 +39379,66 @@ _sk_load_bgra_sse2_8bit LABEL PROC
DB 102,15,103,205 ; packuswb %xmm5,%xmm1
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
+ DB 65,137,249 ; mov %edi,%r9d
DB 65,128,225,7 ; and $0x7,%r9b
DB 102,15,239,201 ; pxor %xmm1,%xmm1
DB 102,15,239,192 ; pxor %xmm0,%xmm0
DB 65,254,201 ; dec %r9b
DB 65,128,249,6 ; cmp $0x6,%r9b
- DB 119,155 ; ja 29385 <_sk_load_bgra_sse2_8bit+0x2d>
- DB 65,15,182,193 ; movzbl %r9b,%eax
- DB 72,141,13,91,0,0,0 ; lea 0x5b(%rip),%rcx # 29450 <_sk_load_bgra_sse2_8bit+0xf8>
- DB 72,99,4,129 ; movslq (%rcx,%rax,4),%rax
- DB 72,1,200 ; add %rcx,%rax
+ DB 119,152 ; ja 292d0 <_sk_load_bgra_sse2_8bit+0x28>
+ DB 69,15,182,201 ; movzbl %r9b,%r9d
+ DB 76,141,21,89,0,0,0 ; lea 0x59(%rip),%r10 # 2939c <_sk_load_bgra_sse2_8bit+0xf4>
+ DB 75,99,4,138 ; movslq (%r10,%r9,4),%rax
+ DB 76,1,208 ; add %r10,%rax
DB 255,224 ; jmpq *%rax
- DB 243,66,15,16,4,130 ; movss (%rdx,%r8,4),%xmm0
- DB 233,124,255,255,255 ; jmpq 29385 <_sk_load_bgra_sse2_8bit+0x2d>
- DB 102,66,15,110,68,130,8 ; movd 0x8(%rdx,%r8,4),%xmm0
+ DB 243,67,15,16,4,152 ; movss (%r8,%r11,4),%xmm0
+ DB 233,121,255,255,255 ; jmpq 292d0 <_sk_load_bgra_sse2_8bit+0x28>
+ DB 102,67,15,110,68,152,8 ; movd 0x8(%r8,%r11,4),%xmm0
DB 102,15,112,192,69 ; pshufd $0x45,%xmm0,%xmm0
- DB 102,66,15,18,4,130 ; movlpd (%rdx,%r8,4),%xmm0
- DB 233,101,255,255,255 ; jmpq 29385 <_sk_load_bgra_sse2_8bit+0x2d>
- DB 102,66,15,110,68,130,24 ; movd 0x18(%rdx,%r8,4),%xmm0
+ DB 102,67,15,18,4,152 ; movlpd (%r8,%r11,4),%xmm0
+ DB 233,98,255,255,255 ; jmpq 292d0 <_sk_load_bgra_sse2_8bit+0x28>
+ DB 102,67,15,110,68,152,24 ; movd 0x18(%r8,%r11,4),%xmm0
DB 102,15,112,200,69 ; pshufd $0x45,%xmm0,%xmm1
- DB 243,66,15,16,68,130,20 ; movss 0x14(%rdx,%r8,4),%xmm0
+ DB 243,67,15,16,68,152,20 ; movss 0x14(%r8,%r11,4),%xmm0
DB 15,198,193,0 ; shufps $0x0,%xmm1,%xmm0
DB 15,198,193,226 ; shufps $0xe2,%xmm1,%xmm0
DB 15,40,200 ; movaps %xmm0,%xmm1
- DB 243,66,15,16,68,130,16 ; movss 0x10(%rdx,%r8,4),%xmm0
+ DB 243,67,15,16,68,152,16 ; movss 0x10(%r8,%r11,4),%xmm0
DB 243,15,16,200 ; movss %xmm0,%xmm1
- DB 233,49,255,255,255 ; jmpq 2937f <_sk_load_bgra_sse2_8bit+0x27>
- DB 102,144 ; xchg %ax,%ax
- DB 174 ; scas %es:(%rdi),%al
- DB 255 ; (bad)
- DB 255 ; (bad)
- DB 255,197 ; inc %ebp
+ DB 233,46,255,255,255 ; jmpq 292ca <_sk_load_bgra_sse2_8bit+0x22>
+ DB 176,255 ; mov $0xff,%al
DB 255 ; (bad)
+ DB 255,199 ; inc %edi
DB 255 ; (bad)
DB 255 ; (bad)
- DB 185,255,255,255,47 ; mov $0x2fffffff,%ecx
DB 255 ; (bad)
+ DB 187,255,255,255,46 ; mov $0x2effffff,%ebx
DB 255 ; (bad)
DB 255 ; (bad)
- DB 238 ; out %al,(%dx)
+ DB 255,240 ; push %rax
DB 255 ; (bad)
DB 255 ; (bad)
DB 255 ; (bad)
- DB 220,255 ; fdivr %st,%st(7)
+ DB 222,255 ; fdivrp %st,%st(7)
DB 255 ; (bad)
- DB 255,208 ; callq *%rax
+ DB 255,210 ; callq *%rdx
DB 255 ; (bad)
DB 255 ; (bad)
DB 255 ; .byte 0xff
PUBLIC _sk_load_bgra_dst_sse2_8bit
_sk_load_bgra_dst_sse2_8bit LABEL PROC
- DB 76,99,7 ; movslq (%rdi),%r8
- DB 76,139,79,16 ; mov 0x10(%rdi),%r9
- DB 72,173 ; lods %ds:(%rsi),%rax
- DB 72,99,72,8 ; movslq 0x8(%rax),%rcx
- DB 72,99,87,8 ; movslq 0x8(%rdi),%rdx
- DB 72,15,175,209 ; imul %rcx,%rdx
- DB 72,193,226,2 ; shl $0x2,%rdx
- DB 72,3,16 ; add (%rax),%rdx
- DB 77,133,201 ; test %r9,%r9
- DB 117,92 ; jne 294e9 <_sk_load_bgra_dst_sse2_8bit+0x7d>
- DB 66,15,16,92,130,16 ; movups 0x10(%rdx,%r8,4),%xmm3
- DB 102,66,15,16,20,130 ; movupd (%rdx,%r8,4),%xmm2
+ DB 72,173 ; lods %ds:(%rsi),%rax
+ DB 76,99,72,8 ; movslq 0x8(%rax),%r9
+ DB 76,99,193 ; movslq %ecx,%r8
+ DB 77,15,175,193 ; imul %r9,%r8
+ DB 73,193,224,2 ; shl $0x2,%r8
+ DB 76,3,0 ; add (%rax),%r8
+ DB 76,99,218 ; movslq %edx,%r11
+ DB 72,133,255 ; test %rdi,%rdi
+ DB 117,92 ; jne 29430 <_sk_load_bgra_dst_sse2_8bit+0x78>
+ DB 67,15,16,92,152,16 ; movups 0x10(%r8,%r11,4),%xmm3
+ DB 102,67,15,16,20,152 ; movupd (%r8,%r11,4),%xmm2
DB 102,15,239,228 ; pxor %xmm4,%xmm4
DB 102,15,40,234 ; movapd %xmm2,%xmm5
DB 102,15,104,236 ; punpckhbw %xmm4,%xmm5
@@ -39469,65 +39458,62 @@ _sk_load_bgra_dst_sse2_8bit LABEL PROC
DB 102,15,103,221 ; packuswb %xmm5,%xmm3
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
+ DB 65,137,249 ; mov %edi,%r9d
DB 65,128,225,7 ; and $0x7,%r9b
DB 102,15,239,219 ; pxor %xmm3,%xmm3
DB 102,15,239,210 ; pxor %xmm2,%xmm2
DB 65,254,201 ; dec %r9b
DB 65,128,249,6 ; cmp $0x6,%r9b
- DB 119,155 ; ja 29499 <_sk_load_bgra_dst_sse2_8bit+0x2d>
- DB 65,15,182,193 ; movzbl %r9b,%eax
- DB 72,141,13,91,0,0,0 ; lea 0x5b(%rip),%rcx # 29564 <_sk_load_bgra_dst_sse2_8bit+0xf8>
- DB 72,99,4,129 ; movslq (%rcx,%rax,4),%rax
- DB 72,1,200 ; add %rcx,%rax
+ DB 119,152 ; ja 293e0 <_sk_load_bgra_dst_sse2_8bit+0x28>
+ DB 69,15,182,201 ; movzbl %r9b,%r9d
+ DB 76,141,21,89,0,0,0 ; lea 0x59(%rip),%r10 # 294ac <_sk_load_bgra_dst_sse2_8bit+0xf4>
+ DB 75,99,4,138 ; movslq (%r10,%r9,4),%rax
+ DB 76,1,208 ; add %r10,%rax
DB 255,224 ; jmpq *%rax
- DB 243,66,15,16,20,130 ; movss (%rdx,%r8,4),%xmm2
- DB 233,124,255,255,255 ; jmpq 29499 <_sk_load_bgra_dst_sse2_8bit+0x2d>
- DB 102,66,15,110,84,130,8 ; movd 0x8(%rdx,%r8,4),%xmm2
+ DB 243,67,15,16,20,152 ; movss (%r8,%r11,4),%xmm2
+ DB 233,121,255,255,255 ; jmpq 293e0 <_sk_load_bgra_dst_sse2_8bit+0x28>
+ DB 102,67,15,110,84,152,8 ; movd 0x8(%r8,%r11,4),%xmm2
DB 102,15,112,210,69 ; pshufd $0x45,%xmm2,%xmm2
- DB 102,66,15,18,20,130 ; movlpd (%rdx,%r8,4),%xmm2
- DB 233,101,255,255,255 ; jmpq 29499 <_sk_load_bgra_dst_sse2_8bit+0x2d>
- DB 102,66,15,110,84,130,24 ; movd 0x18(%rdx,%r8,4),%xmm2
+ DB 102,67,15,18,20,152 ; movlpd (%r8,%r11,4),%xmm2
+ DB 233,98,255,255,255 ; jmpq 293e0 <_sk_load_bgra_dst_sse2_8bit+0x28>
+ DB 102,67,15,110,84,152,24 ; movd 0x18(%r8,%r11,4),%xmm2
DB 102,15,112,218,69 ; pshufd $0x45,%xmm2,%xmm3
- DB 243,66,15,16,84,130,20 ; movss 0x14(%rdx,%r8,4),%xmm2
+ DB 243,67,15,16,84,152,20 ; movss 0x14(%r8,%r11,4),%xmm2
DB 15,198,211,0 ; shufps $0x0,%xmm3,%xmm2
DB 15,198,211,226 ; shufps $0xe2,%xmm3,%xmm2
DB 15,40,218 ; movaps %xmm2,%xmm3
- DB 243,66,15,16,84,130,16 ; movss 0x10(%rdx,%r8,4),%xmm2
+ DB 243,67,15,16,84,152,16 ; movss 0x10(%r8,%r11,4),%xmm2
DB 243,15,16,218 ; movss %xmm2,%xmm3
- DB 233,49,255,255,255 ; jmpq 29493 <_sk_load_bgra_dst_sse2_8bit+0x27>
- DB 102,144 ; xchg %ax,%ax
- DB 174 ; scas %es:(%rdi),%al
- DB 255 ; (bad)
- DB 255 ; (bad)
- DB 255,197 ; inc %ebp
+ DB 233,46,255,255,255 ; jmpq 293da <_sk_load_bgra_dst_sse2_8bit+0x22>
+ DB 176,255 ; mov $0xff,%al
DB 255 ; (bad)
+ DB 255,199 ; inc %edi
DB 255 ; (bad)
DB 255 ; (bad)
- DB 185,255,255,255,47 ; mov $0x2fffffff,%ecx
DB 255 ; (bad)
+ DB 187,255,255,255,46 ; mov $0x2effffff,%ebx
DB 255 ; (bad)
DB 255 ; (bad)
- DB 238 ; out %al,(%dx)
+ DB 255,240 ; push %rax
DB 255 ; (bad)
DB 255 ; (bad)
DB 255 ; (bad)
- DB 220,255 ; fdivr %st,%st(7)
+ DB 222,255 ; fdivrp %st,%st(7)
DB 255 ; (bad)
- DB 255,208 ; callq *%rax
+ DB 255,210 ; callq *%rdx
DB 255 ; (bad)
DB 255 ; (bad)
DB 255 ; .byte 0xff
PUBLIC _sk_store_bgra_sse2_8bit
_sk_store_bgra_sse2_8bit LABEL PROC
- DB 76,99,15 ; movslq (%rdi),%r9
- DB 76,139,71,16 ; mov 0x10(%rdi),%r8
- DB 72,173 ; lods %ds:(%rsi),%rax
- DB 72,99,72,8 ; movslq 0x8(%rax),%rcx
- DB 72,99,87,8 ; movslq 0x8(%rdi),%rdx
- DB 72,15,175,209 ; imul %rcx,%rdx
- DB 72,193,226,2 ; shl $0x2,%rdx
- DB 72,3,16 ; add (%rax),%rdx
+ DB 72,173 ; lods %ds:(%rsi),%rax
+ DB 76,99,72,8 ; movslq 0x8(%rax),%r9
+ DB 76,99,193 ; movslq %ecx,%r8
+ DB 77,15,175,193 ; imul %r9,%r8
+ DB 73,193,224,2 ; shl $0x2,%r8
+ DB 76,3,0 ; add (%rax),%r8
+ DB 76,99,218 ; movslq %edx,%r11
DB 102,15,239,237 ; pxor %xmm5,%xmm5
DB 102,15,111,225 ; movdqa %xmm1,%xmm4
DB 102,15,104,229 ; punpckhbw %xmm5,%xmm4
@@ -39547,70 +39533,69 @@ _sk_store_bgra_sse2_8bit LABEL PROC
DB 242,15,112,239,198 ; pshuflw $0xc6,%xmm7,%xmm5
DB 243,15,112,237,198 ; pshufhw $0xc6,%xmm5,%xmm5
DB 102,15,103,238 ; packuswb %xmm6,%xmm5
- DB 77,133,192 ; test %r8,%r8
- DB 117,17 ; jne 29606 <_sk_store_bgra_sse2_8bit+0x86>
- DB 243,66,15,127,44,138 ; movdqu %xmm5,(%rdx,%r9,4)
- DB 243,66,15,127,100,138,16 ; movdqu %xmm4,0x10(%rdx,%r9,4)
- DB 72,173 ; lods %ds:(%rsi),%rax
- DB 255,224 ; jmpq *%rax
- DB 65,128,224,7 ; and $0x7,%r8b
- DB 65,254,200 ; dec %r8b
- DB 65,128,248,6 ; cmp $0x6,%r8b
- DB 119,239 ; ja 29602 <_sk_store_bgra_sse2_8bit+0x82>
- DB 65,15,182,192 ; movzbl %r8b,%eax
- DB 72,141,13,78,0,0,0 ; lea 0x4e(%rip),%rcx # 2966c <_sk_store_bgra_sse2_8bit+0xec>
- DB 72,99,4,129 ; movslq (%rcx,%rax,4),%rax
- DB 72,1,200 ; add %rcx,%rax
- DB 255,224 ; jmpq *%rax
- DB 102,66,15,126,44,138 ; movd %xmm5,(%rdx,%r9,4)
- DB 235,211 ; jmp 29602 <_sk_store_bgra_sse2_8bit+0x82>
+ DB 72,133,255 ; test %rdi,%rdi
+ DB 117,17 ; jne 29549 <_sk_store_bgra_sse2_8bit+0x81>
+ DB 243,67,15,127,44,152 ; movdqu %xmm5,(%r8,%r11,4)
+ DB 243,67,15,127,100,152,16 ; movdqu %xmm4,0x10(%r8,%r11,4)
+ DB 72,173 ; lods %ds:(%rsi),%rax
+ DB 255,224 ; jmpq *%rax
+ DB 65,137,249 ; mov %edi,%r9d
+ DB 65,128,225,7 ; and $0x7,%r9b
+ DB 65,254,201 ; dec %r9b
+ DB 65,128,249,6 ; cmp $0x6,%r9b
+ DB 119,236 ; ja 29545 <_sk_store_bgra_sse2_8bit+0x7d>
+ DB 69,15,182,201 ; movzbl %r9b,%r9d
+ DB 76,141,21,76,0,0,0 ; lea 0x4c(%rip),%r10 # 295b0 <_sk_store_bgra_sse2_8bit+0xe8>
+ DB 75,99,4,138 ; movslq (%r10,%r9,4),%rax
+ DB 76,1,208 ; add %r10,%rax
+ DB 255,224 ; jmpq *%rax
+ DB 102,67,15,126,44,152 ; movd %xmm5,(%r8,%r11,4)
+ DB 235,208 ; jmp 29545 <_sk_store_bgra_sse2_8bit+0x7d>
DB 102,15,112,229,78 ; pshufd $0x4e,%xmm5,%xmm4
- DB 102,66,15,126,100,138,8 ; movd %xmm4,0x8(%rdx,%r9,4)
- DB 102,66,15,214,44,138 ; movq %xmm5,(%rdx,%r9,4)
- DB 235,191 ; jmp 29602 <_sk_store_bgra_sse2_8bit+0x82>
+ DB 102,67,15,126,100,152,8 ; movd %xmm4,0x8(%r8,%r11,4)
+ DB 102,67,15,214,44,152 ; movq %xmm5,(%r8,%r11,4)
+ DB 235,188 ; jmp 29545 <_sk_store_bgra_sse2_8bit+0x7d>
DB 102,15,112,244,78 ; pshufd $0x4e,%xmm4,%xmm6
- DB 102,66,15,126,116,138,24 ; movd %xmm6,0x18(%rdx,%r9,4)
+ DB 102,67,15,126,116,152,24 ; movd %xmm6,0x18(%r8,%r11,4)
DB 102,15,112,244,229 ; pshufd $0xe5,%xmm4,%xmm6
- DB 102,66,15,126,116,138,20 ; movd %xmm6,0x14(%rdx,%r9,4)
- DB 102,66,15,126,100,138,16 ; movd %xmm4,0x10(%rdx,%r9,4)
- DB 243,66,15,127,44,138 ; movdqu %xmm5,(%rdx,%r9,4)
- DB 235,152 ; jmp 29602 <_sk_store_bgra_sse2_8bit+0x82>
- DB 102,144 ; xchg %ax,%ax
- DB 187,255,255,255,207 ; mov $0xcfffffff,%ebx
+ DB 102,67,15,126,116,152,20 ; movd %xmm6,0x14(%r8,%r11,4)
+ DB 102,67,15,126,100,152,16 ; movd %xmm4,0x10(%r8,%r11,4)
+ DB 243,67,15,127,44,152 ; movdqu %xmm5,(%r8,%r11,4)
+ DB 235,149 ; jmp 29545 <_sk_store_bgra_sse2_8bit+0x7d>
+ DB 189,255,255,255,209 ; mov $0xd1ffffff,%ebp
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,195 ; inc %ebx
+ DB 255,197 ; inc %ebp
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,246 ; push %rsi
DB 255 ; (bad)
+ DB 248 ; clc
DB 255 ; (bad)
DB 255 ; (bad)
- DB 239 ; out %eax,(%dx)
+ DB 255,241 ; push %rcx
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,227 ; jmpq *%rbx
+ DB 255,229 ; jmpq *%rbp
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,215 ; callq *%rdi
DB 255 ; (bad)
+ DB 217,255 ; fcos
DB 255 ; (bad)
DB 255 ; .byte 0xff
PUBLIC _sk_load_a8_sse2_8bit
_sk_load_a8_sse2_8bit LABEL PROC
- DB 76,99,7 ; movslq (%rdi),%r8
- DB 76,139,79,16 ; mov 0x10(%rdi),%r9
- DB 72,173 ; lods %ds:(%rsi),%rax
- DB 72,99,72,8 ; movslq 0x8(%rax),%rcx
- DB 72,99,87,8 ; movslq 0x8(%rdi),%rdx
- DB 72,15,175,209 ; imul %rcx,%rdx
- DB 72,3,16 ; add (%rax),%rdx
- DB 77,133,201 ; test %r9,%r9
- DB 117,48 ; jne 296d5 <_sk_load_a8_sse2_8bit+0x4d>
- DB 243,66,15,126,4,2 ; movq (%rdx,%r8,1),%xmm0
+ DB 72,173 ; lods %ds:(%rsi),%rax
+ DB 76,99,72,8 ; movslq 0x8(%rax),%r9
+ DB 76,99,193 ; movslq %ecx,%r8
+ DB 77,15,175,193 ; imul %r9,%r8
+ DB 76,3,0 ; add (%rax),%r8
+ DB 76,99,218 ; movslq %edx,%r11
+ DB 72,133,255 ; test %rdi,%rdi
+ DB 117,48 ; jne 29614 <_sk_load_a8_sse2_8bit+0x48>
+ DB 243,67,15,126,4,24 ; movq (%r8,%r11,1),%xmm0
DB 102,15,96,192 ; punpcklbw %xmm0,%xmm0
- DB 102,15,219,5,25,52,0,0 ; pand 0x3419(%rip),%xmm0 # 2cad0 <_sk_overlay_sse2_8bit+0xe5b>
+ DB 102,15,219,5,26,52,0,0 ; pand 0x341a(%rip),%xmm0 # 2ca10 <_sk_overlay_sse2_8bit+0xe60>
DB 102,15,239,228 ; pxor %xmm4,%xmm4
DB 102,15,111,200 ; movdqa %xmm0,%xmm1
DB 102,15,105,204 ; punpckhwd %xmm4,%xmm1
@@ -39619,73 +39604,74 @@ _sk_load_a8_sse2_8bit LABEL PROC
DB 102,15,114,241,24 ; pslld $0x18,%xmm1
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
+ DB 65,137,249 ; mov %edi,%r9d
DB 65,128,225,7 ; and $0x7,%r9b
DB 102,15,239,192 ; pxor %xmm0,%xmm0
DB 65,254,201 ; dec %r9b
DB 65,128,249,6 ; cmp $0x6,%r9b
- DB 119,201 ; ja 296af <_sk_load_a8_sse2_8bit+0x27>
- DB 65,15,182,193 ; movzbl %r9b,%eax
- DB 72,141,13,111,0,0,0 ; lea 0x6f(%rip),%rcx # 29760 <_sk_load_a8_sse2_8bit+0xd8>
- DB 72,99,4,129 ; movslq (%rcx,%rax,4),%rax
- DB 72,1,200 ; add %rcx,%rax
+ DB 119,198 ; ja 295ee <_sk_load_a8_sse2_8bit+0x22>
+ DB 69,15,182,201 ; movzbl %r9b,%r9d
+ DB 76,141,21,113,0,0,0 ; lea 0x71(%rip),%r10 # 296a4 <_sk_load_a8_sse2_8bit+0xd8>
+ DB 75,99,4,138 ; movslq (%r10,%r9,4),%rax
+ DB 76,1,208 ; add %r10,%rax
DB 255,224 ; jmpq *%rax
- DB 66,15,182,4,2 ; movzbl (%rdx,%r8,1),%eax
+ DB 67,15,182,4,24 ; movzbl (%r8,%r11,1),%eax
DB 102,15,110,192 ; movd %eax,%xmm0
- DB 235,170 ; jmp 296af <_sk_load_a8_sse2_8bit+0x27>
- DB 66,15,182,68,2,2 ; movzbl 0x2(%rdx,%r8,1),%eax
+ DB 235,167 ; jmp 295ee <_sk_load_a8_sse2_8bit+0x22>
+ DB 67,15,182,68,24,2 ; movzbl 0x2(%r8,%r11,1),%eax
DB 102,15,239,192 ; pxor %xmm0,%xmm0
DB 102,15,196,192,2 ; pinsrw $0x2,%eax,%xmm0
- DB 66,15,183,4,2 ; movzwl (%rdx,%r8,1),%eax
+ DB 67,15,183,4,24 ; movzwl (%r8,%r11,1),%eax
DB 102,15,110,200 ; movd %eax,%xmm1
DB 102,15,96,200 ; punpcklbw %xmm0,%xmm1
DB 243,15,16,193 ; movss %xmm1,%xmm0
- DB 235,136 ; jmp 296af <_sk_load_a8_sse2_8bit+0x27>
- DB 66,15,182,68,2,6 ; movzbl 0x6(%rdx,%r8,1),%eax
+ DB 235,133 ; jmp 295ee <_sk_load_a8_sse2_8bit+0x22>
+ DB 67,15,182,68,24,6 ; movzbl 0x6(%r8,%r11,1),%eax
DB 102,15,239,192 ; pxor %xmm0,%xmm0
DB 102,15,196,192,6 ; pinsrw $0x6,%eax,%xmm0
- DB 66,15,182,68,2,5 ; movzbl 0x5(%rdx,%r8,1),%eax
+ DB 67,15,182,68,24,5 ; movzbl 0x5(%r8,%r11,1),%eax
DB 102,15,196,192,5 ; pinsrw $0x5,%eax,%xmm0
- DB 66,15,182,68,2,4 ; movzbl 0x4(%rdx,%r8,1),%eax
+ DB 67,15,182,68,24,4 ; movzbl 0x4(%r8,%r11,1),%eax
DB 102,15,196,192,4 ; pinsrw $0x4,%eax,%xmm0
- DB 102,66,15,110,12,2 ; movd (%rdx,%r8,1),%xmm1
+ DB 102,67,15,110,12,24 ; movd (%r8,%r11,1),%xmm1
DB 102,15,96,200 ; punpcklbw %xmm0,%xmm1
DB 242,15,16,193 ; movsd %xmm1,%xmm0
- DB 233,80,255,255,255 ; jmpq 296af <_sk_load_a8_sse2_8bit+0x27>
- DB 144 ; nop
- DB 154 ; (bad)
+ DB 233,77,255,255,255 ; jmpq 295ee <_sk_load_a8_sse2_8bit+0x22>
+ DB 15,31,0 ; nopl (%rax)
+ DB 152 ; cwtl
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,180,255,255,255,165,255 ; pushq -0x5a0001(%rdi,%rdi,8)
+ DB 255,178,255,255,255,163 ; pushq -0x5c000001(%rdx)
DB 255 ; (bad)
DB 255 ; (bad)
- DB 236 ; in (%dx),%al
+ DB 255 ; (bad)
+ DB 234 ; (bad)
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,225 ; jmpq *%rcx
DB 255 ; (bad)
+ DB 223,255 ; (bad)
DB 255 ; (bad)
- DB 255,214 ; callq *%rsi
+ DB 255,212 ; callq *%rsp
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,199 ; inc %edi
+ DB 255,197 ; inc %ebp
DB 255 ; (bad)
DB 255 ; (bad)
DB 255 ; .byte 0xff
PUBLIC _sk_load_a8_dst_sse2_8bit
_sk_load_a8_dst_sse2_8bit LABEL PROC
- DB 76,99,7 ; movslq (%rdi),%r8
- DB 76,139,79,16 ; mov 0x10(%rdi),%r9
- DB 72,173 ; lods %ds:(%rsi),%rax
- DB 72,99,72,8 ; movslq 0x8(%rax),%rcx
- DB 72,99,87,8 ; movslq 0x8(%rdi),%rdx
- DB 72,15,175,209 ; imul %rcx,%rdx
- DB 72,3,16 ; add (%rax),%rdx
- DB 77,133,201 ; test %r9,%r9
- DB 117,48 ; jne 297c9 <_sk_load_a8_dst_sse2_8bit+0x4d>
- DB 243,66,15,126,20,2 ; movq (%rdx,%r8,1),%xmm2
+ DB 72,173 ; lods %ds:(%rsi),%rax
+ DB 76,99,72,8 ; movslq 0x8(%rax),%r9
+ DB 76,99,193 ; movslq %ecx,%r8
+ DB 77,15,175,193 ; imul %r9,%r8
+ DB 76,3,0 ; add (%rax),%r8
+ DB 76,99,218 ; movslq %edx,%r11
+ DB 72,133,255 ; test %rdi,%rdi
+ DB 117,48 ; jne 29708 <_sk_load_a8_dst_sse2_8bit+0x48>
+ DB 243,67,15,126,20,24 ; movq (%r8,%r11,1),%xmm2
DB 102,15,96,208 ; punpcklbw %xmm0,%xmm2
- DB 102,15,219,21,37,51,0,0 ; pand 0x3325(%rip),%xmm2 # 2cad0 <_sk_overlay_sse2_8bit+0xe5b>
+ DB 102,15,219,21,38,51,0,0 ; pand 0x3326(%rip),%xmm2 # 2ca10 <_sk_overlay_sse2_8bit+0xe60>
DB 102,15,239,228 ; pxor %xmm4,%xmm4
DB 102,15,111,218 ; movdqa %xmm2,%xmm3
DB 102,15,105,220 ; punpckhwd %xmm4,%xmm3
@@ -39694,55 +39680,57 @@ _sk_load_a8_dst_sse2_8bit LABEL PROC
DB 102,15,114,243,24 ; pslld $0x18,%xmm3
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
+ DB 65,137,249 ; mov %edi,%r9d
DB 65,128,225,7 ; and $0x7,%r9b
DB 102,15,239,210 ; pxor %xmm2,%xmm2
DB 65,254,201 ; dec %r9b
DB 65,128,249,6 ; cmp $0x6,%r9b
- DB 119,201 ; ja 297a3 <_sk_load_a8_dst_sse2_8bit+0x27>
- DB 65,15,182,193 ; movzbl %r9b,%eax
- DB 72,141,13,111,0,0,0 ; lea 0x6f(%rip),%rcx # 29854 <_sk_load_a8_dst_sse2_8bit+0xd8>
- DB 72,99,4,129 ; movslq (%rcx,%rax,4),%rax
- DB 72,1,200 ; add %rcx,%rax
+ DB 119,198 ; ja 296e2 <_sk_load_a8_dst_sse2_8bit+0x22>
+ DB 69,15,182,201 ; movzbl %r9b,%r9d
+ DB 76,141,21,113,0,0,0 ; lea 0x71(%rip),%r10 # 29798 <_sk_load_a8_dst_sse2_8bit+0xd8>
+ DB 75,99,4,138 ; movslq (%r10,%r9,4),%rax
+ DB 76,1,208 ; add %r10,%rax
DB 255,224 ; jmpq *%rax
- DB 66,15,182,4,2 ; movzbl (%rdx,%r8,1),%eax
+ DB 67,15,182,4,24 ; movzbl (%r8,%r11,1),%eax
DB 102,15,110,208 ; movd %eax,%xmm2
- DB 235,170 ; jmp 297a3 <_sk_load_a8_dst_sse2_8bit+0x27>
- DB 66,15,182,68,2,2 ; movzbl 0x2(%rdx,%r8,1),%eax
+ DB 235,167 ; jmp 296e2 <_sk_load_a8_dst_sse2_8bit+0x22>
+ DB 67,15,182,68,24,2 ; movzbl 0x2(%r8,%r11,1),%eax
DB 102,15,239,210 ; pxor %xmm2,%xmm2
DB 102,15,196,208,2 ; pinsrw $0x2,%eax,%xmm2
- DB 66,15,183,4,2 ; movzwl (%rdx,%r8,1),%eax
+ DB 67,15,183,4,24 ; movzwl (%r8,%r11,1),%eax
DB 102,15,110,216 ; movd %eax,%xmm3
DB 102,15,96,216 ; punpcklbw %xmm0,%xmm3
DB 243,15,16,211 ; movss %xmm3,%xmm2
- DB 235,136 ; jmp 297a3 <_sk_load_a8_dst_sse2_8bit+0x27>
- DB 66,15,182,68,2,6 ; movzbl 0x6(%rdx,%r8,1),%eax
+ DB 235,133 ; jmp 296e2 <_sk_load_a8_dst_sse2_8bit+0x22>
+ DB 67,15,182,68,24,6 ; movzbl 0x6(%r8,%r11,1),%eax
DB 102,15,239,210 ; pxor %xmm2,%xmm2
DB 102,15,196,208,6 ; pinsrw $0x6,%eax,%xmm2
- DB 66,15,182,68,2,5 ; movzbl 0x5(%rdx,%r8,1),%eax
+ DB 67,15,182,68,24,5 ; movzbl 0x5(%r8,%r11,1),%eax
DB 102,15,196,208,5 ; pinsrw $0x5,%eax,%xmm2
- DB 66,15,182,68,2,4 ; movzbl 0x4(%rdx,%r8,1),%eax
+ DB 67,15,182,68,24,4 ; movzbl 0x4(%r8,%r11,1),%eax
DB 102,15,196,208,4 ; pinsrw $0x4,%eax,%xmm2
- DB 102,66,15,110,28,2 ; movd (%rdx,%r8,1),%xmm3
+ DB 102,67,15,110,28,24 ; movd (%r8,%r11,1),%xmm3
DB 102,15,96,216 ; punpcklbw %xmm0,%xmm3
DB 242,15,16,211 ; movsd %xmm3,%xmm2
- DB 233,80,255,255,255 ; jmpq 297a3 <_sk_load_a8_dst_sse2_8bit+0x27>
- DB 144 ; nop
- DB 154 ; (bad)
+ DB 233,77,255,255,255 ; jmpq 296e2 <_sk_load_a8_dst_sse2_8bit+0x22>
+ DB 15,31,0 ; nopl (%rax)
+ DB 152 ; cwtl
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,180,255,255,255,165,255 ; pushq -0x5a0001(%rdi,%rdi,8)
+ DB 255,178,255,255,255,163 ; pushq -0x5c000001(%rdx)
DB 255 ; (bad)
DB 255 ; (bad)
- DB 236 ; in (%dx),%al
DB 255 ; (bad)
+ DB 234 ; (bad)
DB 255 ; (bad)
- DB 255,225 ; jmpq *%rcx
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,214 ; callq *%rsi
+ DB 223,255 ; (bad)
DB 255 ; (bad)
+ DB 255,212 ; callq *%rsp
DB 255 ; (bad)
- DB 255,199 ; inc %edi
+ DB 255 ; (bad)
+ DB 255,197 ; inc %ebp
DB 255 ; (bad)
DB 255 ; (bad)
DB 255 ; .byte 0xff
@@ -39750,13 +39738,12 @@ _sk_load_a8_dst_sse2_8bit LABEL PROC
PUBLIC _sk_store_a8_sse2_8bit
_sk_store_a8_sse2_8bit LABEL PROC
DB 72,131,236,88 ; sub $0x58,%rsp
- DB 76,99,7 ; movslq (%rdi),%r8
- DB 76,139,79,16 ; mov 0x10(%rdi),%r9
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 72,99,72,8 ; movslq 0x8(%rax),%rcx
- DB 72,99,87,8 ; movslq 0x8(%rdi),%rdx
- DB 72,15,175,209 ; imul %rcx,%rdx
- DB 72,3,16 ; add (%rax),%rdx
+ DB 76,99,72,8 ; movslq 0x8(%rax),%r9
+ DB 76,99,193 ; movslq %ecx,%r8
+ DB 77,15,175,193 ; imul %r9,%r8
+ DB 76,3,0 ; add (%rax),%r8
+ DB 76,99,218 ; movslq %edx,%r11
DB 102,15,111,224 ; movdqa %xmm0,%xmm4
DB 102,15,114,212,24 ; psrld $0x18,%xmm4
DB 102,15,111,233 ; movdqa %xmm1,%xmm5
@@ -39766,86 +39753,88 @@ _sk_store_a8_sse2_8bit LABEL PROC
DB 102,15,114,244,16 ; pslld $0x10,%xmm4
DB 102,15,114,228,16 ; psrad $0x10,%xmm4
DB 102,15,107,229 ; packssdw %xmm5,%xmm4
- DB 77,133,201 ; test %r9,%r9
- DB 117,26 ; jne 298d5 <_sk_store_a8_sse2_8bit+0x65>
- DB 102,15,219,37,13,50,0,0 ; pand 0x320d(%rip),%xmm4 # 2cad0 <_sk_overlay_sse2_8bit+0xe5b>
+ DB 72,133,255 ; test %rdi,%rdi
+ DB 117,26 ; jne 29814 <_sk_store_a8_sse2_8bit+0x60>
+ DB 102,15,219,37,14,50,0,0 ; pand 0x320e(%rip),%xmm4 # 2ca10 <_sk_overlay_sse2_8bit+0xe60>
DB 102,15,103,228 ; packuswb %xmm4,%xmm4
- DB 102,66,15,214,36,2 ; movq %xmm4,(%rdx,%r8,1)
+ DB 102,67,15,214,36,24 ; movq %xmm4,(%r8,%r11,1)
DB 72,173 ; lods %ds:(%rsi),%rax
DB 72,131,196,88 ; add $0x58,%rsp
DB 255,224 ; jmpq *%rax
+ DB 65,137,249 ; mov %edi,%r9d
DB 65,128,225,7 ; and $0x7,%r9b
DB 65,254,201 ; dec %r9b
DB 65,128,249,6 ; cmp $0x6,%r9b
- DB 119,235 ; ja 298cd <_sk_store_a8_sse2_8bit+0x5d>
- DB 65,15,182,193 ; movzbl %r9b,%eax
- DB 72,141,13,131,0,0,0 ; lea 0x83(%rip),%rcx # 29970 <_sk_store_a8_sse2_8bit+0x100>
- DB 72,99,4,129 ; movslq (%rcx,%rax,4),%rax
- DB 72,1,200 ; add %rcx,%rax
+ DB 119,232 ; ja 2980c <_sk_store_a8_sse2_8bit+0x58>
+ DB 69,15,182,201 ; movzbl %r9b,%r9d
+ DB 76,141,21,133,0,0,0 ; lea 0x85(%rip),%r10 # 298b4 <_sk_store_a8_sse2_8bit+0x100>
+ DB 75,99,4,138 ; movslq (%r10,%r9,4),%rax
+ DB 76,1,208 ; add %r10,%rax
DB 255,224 ; jmpq *%rax
DB 102,15,127,100,36,64 ; movdqa %xmm4,0x40(%rsp)
DB 138,68,36,64 ; mov 0x40(%rsp),%al
- DB 66,136,4,2 ; mov %al,(%rdx,%r8,1)
- DB 235,199 ; jmp 298cd <_sk_store_a8_sse2_8bit+0x5d>
+ DB 67,136,4,24 ; mov %al,(%r8,%r11,1)
+ DB 235,196 ; jmp 2980c <_sk_store_a8_sse2_8bit+0x58>
DB 102,15,127,100,36,48 ; movdqa %xmm4,0x30(%rsp)
DB 138,68,36,52 ; mov 0x34(%rsp),%al
- DB 66,136,68,2,2 ; mov %al,0x2(%rdx,%r8,1)
- DB 102,15,219,37,179,49,0,0 ; pand 0x31b3(%rip),%xmm4 # 2cad0 <_sk_overlay_sse2_8bit+0xe5b>
+ DB 67,136,68,24,2 ; mov %al,0x2(%r8,%r11,1)
+ DB 102,15,219,37,177,49,0,0 ; pand 0x31b1(%rip),%xmm4 # 2ca10 <_sk_overlay_sse2_8bit+0xe60>
DB 102,15,103,228 ; packuswb %xmm4,%xmm4
DB 102,15,126,224 ; movd %xmm4,%eax
- DB 102,66,137,4,2 ; mov %ax,(%rdx,%r8,1)
- DB 235,161 ; jmp 298cd <_sk_store_a8_sse2_8bit+0x5d>
+ DB 102,67,137,4,24 ; mov %ax,(%r8,%r11,1)
+ DB 235,158 ; jmp 2980c <_sk_store_a8_sse2_8bit+0x58>
DB 102,15,127,100,36,32 ; movdqa %xmm4,0x20(%rsp)
DB 138,68,36,44 ; mov 0x2c(%rsp),%al
- DB 66,136,68,2,6 ; mov %al,0x6(%rdx,%r8,1)
+ DB 67,136,68,24,6 ; mov %al,0x6(%r8,%r11,1)
DB 102,15,127,100,36,16 ; movdqa %xmm4,0x10(%rsp)
DB 138,68,36,26 ; mov 0x1a(%rsp),%al
- DB 66,136,68,2,5 ; mov %al,0x5(%rdx,%r8,1)
+ DB 67,136,68,24,5 ; mov %al,0x5(%r8,%r11,1)
DB 102,15,127,36,36 ; movdqa %xmm4,(%rsp)
DB 138,68,36,8 ; mov 0x8(%rsp),%al
- DB 66,136,68,2,4 ; mov %al,0x4(%rdx,%r8,1)
- DB 102,15,219,37,112,49,0,0 ; pand 0x3170(%rip),%xmm4 # 2cad0 <_sk_overlay_sse2_8bit+0xe5b>
+ DB 67,136,68,24,4 ; mov %al,0x4(%r8,%r11,1)
+ DB 102,15,219,37,110,49,0,0 ; pand 0x316e(%rip),%xmm4 # 2ca10 <_sk_overlay_sse2_8bit+0xe60>
DB 102,15,103,228 ; packuswb %xmm4,%xmm4
- DB 102,66,15,126,36,2 ; movd %xmm4,(%rdx,%r8,1)
- DB 233,94,255,255,255 ; jmpq 298cd <_sk_store_a8_sse2_8bit+0x5d>
- DB 144 ; nop
- DB 134,255 ; xchg %bh,%bh
+ DB 102,67,15,126,36,24 ; movd %xmm4,(%r8,%r11,1)
+ DB 233,91,255,255,255 ; jmpq 2980c <_sk_store_a8_sse2_8bit+0x58>
+ DB 15,31,0 ; nopl (%rax)
+ DB 132,255 ; test %bh,%bh
DB 255 ; (bad)
- DB 255,165,255,255,255,150 ; jmpq *-0x69000001(%rbp)
+ DB 255,163,255,255,255,148 ; jmpq *-0x6b000001(%rbx)
DB 255 ; (bad)
DB 255 ; (bad)
+ DB 255,230 ; jmpq *%rsi
DB 255 ; (bad)
- DB 232,255,255,255,218 ; callq ffffffffdb029980 <_sk_overlay_sse2_8bit+0xffffffffdaffdd0b>
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,203 ; dec %ebx
+ DB 216,255 ; fdivr %st(7),%st
+ DB 255 ; (bad)
+ DB 255,201 ; dec %ecx
DB 255 ; (bad)
DB 255 ; (bad)
DB 255 ; (bad)
- DB 188 ; .byte 0xbc
+ DB 186 ; .byte 0xba
DB 255 ; (bad)
DB 255 ; (bad)
DB 255 ; .byte 0xff
PUBLIC _sk_load_g8_sse2_8bit
_sk_load_g8_sse2_8bit LABEL PROC
- DB 76,99,7 ; movslq (%rdi),%r8
- DB 76,139,79,16 ; mov 0x10(%rdi),%r9
- DB 72,173 ; lods %ds:(%rsi),%rax
- DB 72,99,72,8 ; movslq 0x8(%rax),%rcx
- DB 72,99,87,8 ; movslq 0x8(%rdi),%rdx
- DB 72,15,175,209 ; imul %rcx,%rdx
- DB 72,3,16 ; add (%rax),%rdx
- DB 77,133,201 ; test %r9,%r9
- DB 117,116 ; jne 29a1d <_sk_load_g8_sse2_8bit+0x91>
- DB 243,66,15,126,4,2 ; movq (%rdx,%r8,1),%xmm0
+ DB 72,173 ; lods %ds:(%rsi),%rax
+ DB 76,99,72,8 ; movslq 0x8(%rax),%r9
+ DB 76,99,193 ; movslq %ecx,%r8
+ DB 77,15,175,193 ; imul %r9,%r8
+ DB 76,3,0 ; add (%rax),%r8
+ DB 76,99,218 ; movslq %edx,%r11
+ DB 72,133,255 ; test %rdi,%rdi
+ DB 117,116 ; jne 2995c <_sk_load_g8_sse2_8bit+0x8c>
+ DB 243,67,15,126,4,24 ; movq (%r8,%r11,1),%xmm0
DB 102,15,96,192 ; punpcklbw %xmm0,%xmm0
- DB 102,15,219,5,21,49,0,0 ; pand 0x3115(%rip),%xmm0 # 2cad0 <_sk_overlay_sse2_8bit+0xe5b>
+ DB 102,15,219,5,22,49,0,0 ; pand 0x3116(%rip),%xmm0 # 2ca10 <_sk_overlay_sse2_8bit+0xe60>
DB 102,15,239,201 ; pxor %xmm1,%xmm1
DB 102,15,111,224 ; movdqa %xmm0,%xmm4
DB 102,15,97,225 ; punpcklwd %xmm1,%xmm4
DB 102,15,105,193 ; punpckhwd %xmm1,%xmm0
- DB 102,15,111,45,125,56,0,0 ; movdqa 0x387d(%rip),%xmm5 # 2d250 <_sk_overlay_sse2_8bit+0x15db>
+ DB 102,15,111,45,126,56,0,0 ; movdqa 0x387e(%rip),%xmm5 # 2d190 <_sk_overlay_sse2_8bit+0x15e0>
DB 102,15,112,240,245 ; pshufd $0xf5,%xmm0,%xmm6
DB 102,15,244,197 ; pmuludq %xmm5,%xmm0
DB 102,15,112,200,232 ; pshufd $0xe8,%xmm0,%xmm1
@@ -39858,84 +39847,84 @@ _sk_load_g8_sse2_8bit LABEL PROC
DB 102,15,244,245 ; pmuludq %xmm5,%xmm6
DB 102,15,112,230,232 ; pshufd $0xe8,%xmm6,%xmm4
DB 102,15,98,196 ; punpckldq %xmm4,%xmm0
- DB 102,15,111,37,255,55,0,0 ; movdqa 0x37ff(%rip),%xmm4 # 2d210 <_sk_overlay_sse2_8bit+0x159b>
+ DB 102,15,111,37,0,56,0,0 ; movdqa 0x3800(%rip),%xmm4 # 2d150 <_sk_overlay_sse2_8bit+0x15a0>
DB 102,15,235,196 ; por %xmm4,%xmm0
DB 102,15,235,204 ; por %xmm4,%xmm1
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
+ DB 65,137,249 ; mov %edi,%r9d
DB 65,128,225,7 ; and $0x7,%r9b
DB 102,15,239,192 ; pxor %xmm0,%xmm0
DB 65,254,201 ; dec %r9b
DB 65,128,249,6 ; cmp $0x6,%r9b
- DB 119,133 ; ja 299b3 <_sk_load_g8_sse2_8bit+0x27>
- DB 65,15,182,193 ; movzbl %r9b,%eax
- DB 72,141,13,119,0,0,0 ; lea 0x77(%rip),%rcx # 29ab0 <_sk_load_g8_sse2_8bit+0x124>
- DB 72,99,4,129 ; movslq (%rcx,%rax,4),%rax
- DB 72,1,200 ; add %rcx,%rax
+ DB 119,130 ; ja 298f2 <_sk_load_g8_sse2_8bit+0x22>
+ DB 69,15,182,201 ; movzbl %r9b,%r9d
+ DB 76,141,21,117,0,0,0 ; lea 0x75(%rip),%r10 # 299f0 <_sk_load_g8_sse2_8bit+0x120>
+ DB 75,99,4,138 ; movslq (%r10,%r9,4),%rax
+ DB 76,1,208 ; add %r10,%rax
DB 255,224 ; jmpq *%rax
- DB 66,15,182,4,2 ; movzbl (%rdx,%r8,1),%eax
+ DB 67,15,182,4,24 ; movzbl (%r8,%r11,1),%eax
DB 102,15,110,192 ; movd %eax,%xmm0
- DB 233,99,255,255,255 ; jmpq 299b3 <_sk_load_g8_sse2_8bit+0x27>
- DB 66,15,182,68,2,2 ; movzbl 0x2(%rdx,%r8,1),%eax
+ DB 233,96,255,255,255 ; jmpq 298f2 <_sk_load_g8_sse2_8bit+0x22>
+ DB 67,15,182,68,24,2 ; movzbl 0x2(%r8,%r11,1),%eax
DB 102,15,239,192 ; pxor %xmm0,%xmm0
DB 102,15,196,192,2 ; pinsrw $0x2,%eax,%xmm0
- DB 66,15,183,4,2 ; movzwl (%rdx,%r8,1),%eax
+ DB 67,15,183,4,24 ; movzwl (%r8,%r11,1),%eax
DB 102,15,110,200 ; movd %eax,%xmm1
DB 102,15,96,200 ; punpcklbw %xmm0,%xmm1
DB 243,15,16,193 ; movss %xmm1,%xmm0
- DB 233,62,255,255,255 ; jmpq 299b3 <_sk_load_g8_sse2_8bit+0x27>
- DB 66,15,182,68,2,6 ; movzbl 0x6(%rdx,%r8,1),%eax
+ DB 233,59,255,255,255 ; jmpq 298f2 <_sk_load_g8_sse2_8bit+0x22>
+ DB 67,15,182,68,24,6 ; movzbl 0x6(%r8,%r11,1),%eax
DB 102,15,239,192 ; pxor %xmm0,%xmm0
DB 102,15,196,192,6 ; pinsrw $0x6,%eax,%xmm0
- DB 66,15,182,68,2,5 ; movzbl 0x5(%rdx,%r8,1),%eax
+ DB 67,15,182,68,24,5 ; movzbl 0x5(%r8,%r11,1),%eax
DB 102,15,196,192,5 ; pinsrw $0x5,%eax,%xmm0
- DB 66,15,182,68,2,4 ; movzbl 0x4(%rdx,%r8,1),%eax
+ DB 67,15,182,68,24,4 ; movzbl 0x4(%r8,%r11,1),%eax
DB 102,15,196,192,4 ; pinsrw $0x4,%eax,%xmm0
- DB 102,66,15,110,12,2 ; movd (%rdx,%r8,1),%xmm1
+ DB 102,67,15,110,12,24 ; movd (%r8,%r11,1),%xmm1
DB 102,15,96,200 ; punpcklbw %xmm0,%xmm1
DB 242,15,16,193 ; movsd %xmm1,%xmm0
- DB 233,6,255,255,255 ; jmpq 299b3 <_sk_load_g8_sse2_8bit+0x27>
- DB 15,31,0 ; nopl (%rax)
- DB 146 ; xchg %eax,%edx
+ DB 233,3,255,255,255 ; jmpq 298f2 <_sk_load_g8_sse2_8bit+0x22>
+ DB 144 ; nop
+ DB 148 ; xchg %eax,%esp
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,175,255,255,255,160 ; ljmp *-0x5f000001(%rdi)
+ DB 255,177,255,255,255,162 ; pushq -0x5d000001(%rcx)
DB 255 ; (bad)
DB 255 ; (bad)
DB 255 ; (bad)
- DB 234 ; (bad)
+ DB 236 ; in (%dx),%al
DB 255 ; (bad)
DB 255 ; (bad)
+ DB 255,225 ; jmpq *%rcx
DB 255 ; (bad)
- DB 223,255 ; (bad)
DB 255 ; (bad)
- DB 255,212 ; callq *%rsp
+ DB 255,214 ; callq *%rsi
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,197 ; inc %ebp
+ DB 255,199 ; inc %edi
DB 255 ; (bad)
DB 255 ; (bad)
DB 255 ; .byte 0xff
PUBLIC _sk_load_g8_dst_sse2_8bit
_sk_load_g8_dst_sse2_8bit LABEL PROC
- DB 76,99,7 ; movslq (%rdi),%r8
- DB 76,139,79,16 ; mov 0x10(%rdi),%r9
- DB 72,173 ; lods %ds:(%rsi),%rax
- DB 72,99,72,8 ; movslq 0x8(%rax),%rcx
- DB 72,99,87,8 ; movslq 0x8(%rdi),%rdx
- DB 72,15,175,209 ; imul %rcx,%rdx
- DB 72,3,16 ; add (%rax),%rdx
- DB 77,133,201 ; test %r9,%r9
- DB 117,116 ; jne 29b5d <_sk_load_g8_dst_sse2_8bit+0x91>
- DB 243,66,15,126,20,2 ; movq (%rdx,%r8,1),%xmm2
+ DB 72,173 ; lods %ds:(%rsi),%rax
+ DB 76,99,72,8 ; movslq 0x8(%rax),%r9
+ DB 76,99,193 ; movslq %ecx,%r8
+ DB 77,15,175,193 ; imul %r9,%r8
+ DB 76,3,0 ; add (%rax),%r8
+ DB 76,99,218 ; movslq %edx,%r11
+ DB 72,133,255 ; test %rdi,%rdi
+ DB 117,116 ; jne 29a98 <_sk_load_g8_dst_sse2_8bit+0x8c>
+ DB 243,67,15,126,20,24 ; movq (%r8,%r11,1),%xmm2
DB 102,15,96,208 ; punpcklbw %xmm0,%xmm2
- DB 102,15,219,21,213,47,0,0 ; pand 0x2fd5(%rip),%xmm2 # 2cad0 <_sk_overlay_sse2_8bit+0xe5b>
+ DB 102,15,219,21,218,47,0,0 ; pand 0x2fda(%rip),%xmm2 # 2ca10 <_sk_overlay_sse2_8bit+0xe60>
DB 102,15,239,219 ; pxor %xmm3,%xmm3
DB 102,15,111,226 ; movdqa %xmm2,%xmm4
DB 102,15,97,227 ; punpcklwd %xmm3,%xmm4
DB 102,15,105,211 ; punpckhwd %xmm3,%xmm2
- DB 102,15,111,45,61,55,0,0 ; movdqa 0x373d(%rip),%xmm5 # 2d250 <_sk_overlay_sse2_8bit+0x15db>
+ DB 102,15,111,45,66,55,0,0 ; movdqa 0x3742(%rip),%xmm5 # 2d190 <_sk_overlay_sse2_8bit+0x15e0>
DB 102,15,112,242,245 ; pshufd $0xf5,%xmm2,%xmm6
DB 102,15,244,213 ; pmuludq %xmm5,%xmm2
DB 102,15,112,218,232 ; pshufd $0xe8,%xmm2,%xmm3
@@ -39948,80 +39937,80 @@ _sk_load_g8_dst_sse2_8bit LABEL PROC
DB 102,15,244,245 ; pmuludq %xmm5,%xmm6
DB 102,15,112,230,232 ; pshufd $0xe8,%xmm6,%xmm4
DB 102,15,98,212 ; punpckldq %xmm4,%xmm2
- DB 102,15,111,37,191,54,0,0 ; movdqa 0x36bf(%rip),%xmm4 # 2d210 <_sk_overlay_sse2_8bit+0x159b>
+ DB 102,15,111,37,196,54,0,0 ; movdqa 0x36c4(%rip),%xmm4 # 2d150 <_sk_overlay_sse2_8bit+0x15a0>
DB 102,15,235,212 ; por %xmm4,%xmm2
DB 102,15,235,220 ; por %xmm4,%xmm3
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
+ DB 65,137,249 ; mov %edi,%r9d
DB 65,128,225,7 ; and $0x7,%r9b
DB 102,15,239,210 ; pxor %xmm2,%xmm2
DB 65,254,201 ; dec %r9b
DB 65,128,249,6 ; cmp $0x6,%r9b
- DB 119,133 ; ja 29af3 <_sk_load_g8_dst_sse2_8bit+0x27>
- DB 65,15,182,193 ; movzbl %r9b,%eax
- DB 72,141,13,119,0,0,0 ; lea 0x77(%rip),%rcx # 29bf0 <_sk_load_g8_dst_sse2_8bit+0x124>
- DB 72,99,4,129 ; movslq (%rcx,%rax,4),%rax
- DB 72,1,200 ; add %rcx,%rax
+ DB 119,130 ; ja 29a2e <_sk_load_g8_dst_sse2_8bit+0x22>
+ DB 69,15,182,201 ; movzbl %r9b,%r9d
+ DB 76,141,21,117,0,0,0 ; lea 0x75(%rip),%r10 # 29b2c <_sk_load_g8_dst_sse2_8bit+0x120>
+ DB 75,99,4,138 ; movslq (%r10,%r9,4),%rax
+ DB 76,1,208 ; add %r10,%rax
DB 255,224 ; jmpq *%rax
- DB 66,15,182,4,2 ; movzbl (%rdx,%r8,1),%eax
+ DB 67,15,182,4,24 ; movzbl (%r8,%r11,1),%eax
DB 102,15,110,208 ; movd %eax,%xmm2
- DB 233,99,255,255,255 ; jmpq 29af3 <_sk_load_g8_dst_sse2_8bit+0x27>
- DB 66,15,182,68,2,2 ; movzbl 0x2(%rdx,%r8,1),%eax
+ DB 233,96,255,255,255 ; jmpq 29a2e <_sk_load_g8_dst_sse2_8bit+0x22>
+ DB 67,15,182,68,24,2 ; movzbl 0x2(%r8,%r11,1),%eax
DB 102,15,239,210 ; pxor %xmm2,%xmm2
DB 102,15,196,208,2 ; pinsrw $0x2,%eax,%xmm2
- DB 66,15,183,4,2 ; movzwl (%rdx,%r8,1),%eax
+ DB 67,15,183,4,24 ; movzwl (%r8,%r11,1),%eax
DB 102,15,110,216 ; movd %eax,%xmm3
DB 102,15,96,216 ; punpcklbw %xmm0,%xmm3
DB 243,15,16,211 ; movss %xmm3,%xmm2
- DB 233,62,255,255,255 ; jmpq 29af3 <_sk_load_g8_dst_sse2_8bit+0x27>
- DB 66,15,182,68,2,6 ; movzbl 0x6(%rdx,%r8,1),%eax
+ DB 233,59,255,255,255 ; jmpq 29a2e <_sk_load_g8_dst_sse2_8bit+0x22>
+ DB 67,15,182,68,24,6 ; movzbl 0x6(%r8,%r11,1),%eax
DB 102,15,239,210 ; pxor %xmm2,%xmm2
DB 102,15,196,208,6 ; pinsrw $0x6,%eax,%xmm2
- DB 66,15,182,68,2,5 ; movzbl 0x5(%rdx,%r8,1),%eax
+ DB 67,15,182,68,24,5 ; movzbl 0x5(%r8,%r11,1),%eax
DB 102,15,196,208,5 ; pinsrw $0x5,%eax,%xmm2
- DB 66,15,182,68,2,4 ; movzbl 0x4(%rdx,%r8,1),%eax
+ DB 67,15,182,68,24,4 ; movzbl 0x4(%r8,%r11,1),%eax
DB 102,15,196,208,4 ; pinsrw $0x4,%eax,%xmm2
- DB 102,66,15,110,28,2 ; movd (%rdx,%r8,1),%xmm3
+ DB 102,67,15,110,28,24 ; movd (%r8,%r11,1),%xmm3
DB 102,15,96,216 ; punpcklbw %xmm0,%xmm3
DB 242,15,16,211 ; movsd %xmm3,%xmm2
- DB 233,6,255,255,255 ; jmpq 29af3 <_sk_load_g8_dst_sse2_8bit+0x27>
- DB 15,31,0 ; nopl (%rax)
- DB 146 ; xchg %eax,%edx
+ DB 233,3,255,255,255 ; jmpq 29a2e <_sk_load_g8_dst_sse2_8bit+0x22>
+ DB 144 ; nop
+ DB 148 ; xchg %eax,%esp
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,175,255,255,255,160 ; ljmp *-0x5f000001(%rdi)
+ DB 255,177,255,255,255,162 ; pushq -0x5d000001(%rcx)
DB 255 ; (bad)
DB 255 ; (bad)
DB 255 ; (bad)
- DB 234 ; (bad)
+ DB 236 ; in (%dx),%al
DB 255 ; (bad)
DB 255 ; (bad)
+ DB 255,225 ; jmpq *%rcx
DB 255 ; (bad)
- DB 223,255 ; (bad)
DB 255 ; (bad)
- DB 255,212 ; callq *%rsp
+ DB 255,214 ; callq *%rsi
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,197 ; inc %ebp
+ DB 255,199 ; inc %edi
DB 255 ; (bad)
DB 255 ; (bad)
DB 255 ; .byte 0xff
PUBLIC _sk_srcover_rgba_8888_sse2_8bit
_sk_srcover_rgba_8888_sse2_8bit LABEL PROC
- DB 76,99,15 ; movslq (%rdi),%r9
- DB 76,139,71,16 ; mov 0x10(%rdi),%r8
- DB 72,173 ; lods %ds:(%rsi),%rax
- DB 72,99,72,8 ; movslq 0x8(%rax),%rcx
- DB 72,99,87,8 ; movslq 0x8(%rdi),%rdx
- DB 72,15,175,209 ; imul %rcx,%rdx
- DB 72,193,226,2 ; shl $0x2,%rdx
- DB 72,3,16 ; add (%rax),%rdx
- DB 77,133,192 ; test %r8,%r8
- DB 15,133,253,0,0,0 ; jne 29d2e <_sk_srcover_rgba_8888_sse2_8bit+0x122>
- DB 70,15,16,68,138,16 ; movups 0x10(%rdx,%r9,4),%xmm8
- DB 102,70,15,16,12,138 ; movupd (%rdx,%r9,4),%xmm9
- DB 77,133,192 ; test %r8,%r8
+ DB 72,173 ; lods %ds:(%rsi),%rax
+ DB 76,99,72,8 ; movslq 0x8(%rax),%r9
+ DB 76,99,193 ; movslq %ecx,%r8
+ DB 77,15,175,193 ; imul %r9,%r8
+ DB 73,193,224,2 ; shl $0x2,%r8
+ DB 76,3,0 ; add (%rax),%r8
+ DB 76,99,218 ; movslq %edx,%r11
+ DB 72,133,255 ; test %rdi,%rdi
+ DB 15,133,253,0,0,0 ; jne 29c65 <_sk_srcover_rgba_8888_sse2_8bit+0x11d>
+ DB 71,15,16,68,152,16 ; movups 0x10(%r8,%r11,4),%xmm8
+ DB 102,71,15,16,12,152 ; movupd (%r8,%r11,4),%xmm9
+ DB 72,133,255 ; test %rdi,%rdi
DB 242,15,112,225,231 ; pshuflw $0xe7,%xmm1,%xmm4
DB 243,15,112,228,231 ; pshufhw $0xe7,%xmm4,%xmm4
DB 102,15,112,228,232 ; pshufd $0xe8,%xmm4,%xmm4
@@ -40067,69 +40056,71 @@ _sk_srcover_rgba_8888_sse2_8bit LABEL PROC
DB 102,68,15,248,207 ; psubb %xmm7,%xmm9
DB 102,68,15,252,200 ; paddb %xmm0,%xmm9
DB 102,68,15,252,193 ; paddb %xmm1,%xmm8
- DB 117,72 ; jne 29d65 <_sk_srcover_rgba_8888_sse2_8bit+0x159>
- DB 243,70,15,127,12,138 ; movdqu %xmm9,(%rdx,%r9,4)
- DB 243,70,15,127,68,138,16 ; movdqu %xmm8,0x10(%rdx,%r9,4)
+ DB 117,78 ; jne 29ca2 <_sk_srcover_rgba_8888_sse2_8bit+0x15a>
+ DB 243,71,15,127,12,152 ; movdqu %xmm9,(%r8,%r11,4)
+ DB 243,71,15,127,68,152,16 ; movdqu %xmm8,0x10(%r8,%r11,4)
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
- DB 68,137,192 ; mov %r8d,%eax
- DB 36,7 ; and $0x7,%al
+ DB 65,137,249 ; mov %edi,%r9d
+ DB 65,128,225,7 ; and $0x7,%r9b
DB 102,69,15,239,192 ; pxor %xmm8,%xmm8
DB 102,69,15,239,201 ; pxor %xmm9,%xmm9
- DB 254,200 ; dec %al
- DB 60,6 ; cmp $0x6,%al
- DB 15,135,246,254,255,255 ; ja 29c3d <_sk_srcover_rgba_8888_sse2_8bit+0x31>
- DB 15,182,192 ; movzbl %al,%eax
- DB 72,141,13,207,0,0,0 ; lea 0xcf(%rip),%rcx # 29e20 <_sk_srcover_rgba_8888_sse2_8bit+0x214>
- DB 72,99,4,129 ; movslq (%rcx,%rax,4),%rax
- DB 72,1,200 ; add %rcx,%rax
- DB 255,224 ; jmpq *%rax
- DB 243,70,15,16,12,138 ; movss (%rdx,%r9,4),%xmm9
- DB 233,216,254,255,255 ; jmpq 29c3d <_sk_srcover_rgba_8888_sse2_8bit+0x31>
- DB 65,128,224,7 ; and $0x7,%r8b
- DB 65,254,200 ; dec %r8b
- DB 65,128,248,6 ; cmp $0x6,%r8b
- DB 119,184 ; ja 29d2a <_sk_srcover_rgba_8888_sse2_8bit+0x11e>
- DB 65,15,182,192 ; movzbl %r8b,%eax
- DB 72,141,13,191,0,0,0 ; lea 0xbf(%rip),%rcx # 29e3c <_sk_srcover_rgba_8888_sse2_8bit+0x230>
- DB 72,99,4,129 ; movslq (%rcx,%rax,4),%rax
- DB 72,1,200 ; add %rcx,%rax
- DB 255,224 ; jmpq *%rax
- DB 102,70,15,126,12,138 ; movd %xmm9,(%rdx,%r9,4)
- DB 235,156 ; jmp 29d2a <_sk_srcover_rgba_8888_sse2_8bit+0x11e>
- DB 102,66,15,110,100,138,8 ; movd 0x8(%rdx,%r9,4),%xmm4
+ DB 65,254,201 ; dec %r9b
+ DB 65,128,249,6 ; cmp $0x6,%r9b
+ DB 15,135,241,254,255,255 ; ja 29b74 <_sk_srcover_rgba_8888_sse2_8bit+0x2c>
+ DB 69,15,182,201 ; movzbl %r9b,%r9d
+ DB 76,141,21,210,0,0,0 ; lea 0xd2(%rip),%r10 # 29d60 <_sk_srcover_rgba_8888_sse2_8bit+0x218>
+ DB 75,99,4,138 ; movslq (%r10,%r9,4),%rax
+ DB 76,1,208 ; add %r10,%rax
+ DB 255,224 ; jmpq *%rax
+ DB 243,71,15,16,12,152 ; movss (%r8,%r11,4),%xmm9
+ DB 233,210,254,255,255 ; jmpq 29b74 <_sk_srcover_rgba_8888_sse2_8bit+0x2c>
+ DB 65,137,249 ; mov %edi,%r9d
+ DB 65,128,225,7 ; and $0x7,%r9b
+ DB 65,254,201 ; dec %r9b
+ DB 65,128,249,6 ; cmp $0x6,%r9b
+ DB 119,175 ; ja 29c61 <_sk_srcover_rgba_8888_sse2_8bit+0x119>
+ DB 65,15,182,193 ; movzbl %r9b,%eax
+ DB 76,141,13,191,0,0,0 ; lea 0xbf(%rip),%r9 # 29d7c <_sk_srcover_rgba_8888_sse2_8bit+0x234>
+ DB 73,99,4,129 ; movslq (%r9,%rax,4),%rax
+ DB 76,1,200 ; add %r9,%rax
+ DB 255,224 ; jmpq *%rax
+ DB 102,71,15,126,12,152 ; movd %xmm9,(%r8,%r11,4)
+ DB 235,147 ; jmp 29c61 <_sk_srcover_rgba_8888_sse2_8bit+0x119>
+ DB 102,67,15,110,100,152,8 ; movd 0x8(%r8,%r11,4),%xmm4
DB 102,68,15,112,204,69 ; pshufd $0x45,%xmm4,%xmm9
- DB 102,70,15,18,12,138 ; movlpd (%rdx,%r9,4),%xmm9
- DB 233,151,254,255,255 ; jmpq 29c3d <_sk_srcover_rgba_8888_sse2_8bit+0x31>
- DB 102,66,15,110,100,138,24 ; movd 0x18(%rdx,%r9,4),%xmm4
+ DB 102,71,15,18,12,152 ; movlpd (%r8,%r11,4),%xmm9
+ DB 233,142,254,255,255 ; jmpq 29b74 <_sk_srcover_rgba_8888_sse2_8bit+0x2c>
+ DB 102,67,15,110,100,152,24 ; movd 0x18(%r8,%r11,4),%xmm4
DB 102,68,15,112,196,69 ; pshufd $0x45,%xmm4,%xmm8
- DB 243,66,15,16,100,138,20 ; movss 0x14(%rdx,%r9,4),%xmm4
+ DB 243,67,15,16,100,152,20 ; movss 0x14(%r8,%r11,4),%xmm4
DB 65,15,198,224,0 ; shufps $0x0,%xmm8,%xmm4
DB 65,15,198,224,226 ; shufps $0xe2,%xmm8,%xmm4
DB 68,15,40,196 ; movaps %xmm4,%xmm8
- DB 243,66,15,16,100,138,16 ; movss 0x10(%rdx,%r9,4),%xmm4
+ DB 243,67,15,16,100,152,16 ; movss 0x10(%r8,%r11,4),%xmm4
DB 243,68,15,16,196 ; movss %xmm4,%xmm8
- DB 233,94,254,255,255 ; jmpq 29c37 <_sk_srcover_rgba_8888_sse2_8bit+0x2b>
+ DB 233,85,254,255,255 ; jmpq 29b6e <_sk_srcover_rgba_8888_sse2_8bit+0x26>
DB 102,65,15,112,225,78 ; pshufd $0x4e,%xmm9,%xmm4
- DB 102,66,15,126,100,138,8 ; movd %xmm4,0x8(%rdx,%r9,4)
- DB 102,70,15,214,12,138 ; movq %xmm9,(%rdx,%r9,4)
- DB 233,57,255,255,255 ; jmpq 29d2a <_sk_srcover_rgba_8888_sse2_8bit+0x11e>
+ DB 102,67,15,126,100,152,8 ; movd %xmm4,0x8(%r8,%r11,4)
+ DB 102,71,15,214,12,152 ; movq %xmm9,(%r8,%r11,4)
+ DB 233,48,255,255,255 ; jmpq 29c61 <_sk_srcover_rgba_8888_sse2_8bit+0x119>
DB 102,65,15,112,224,78 ; pshufd $0x4e,%xmm8,%xmm4
- DB 102,66,15,126,100,138,24 ; movd %xmm4,0x18(%rdx,%r9,4)
+ DB 102,67,15,126,100,152,24 ; movd %xmm4,0x18(%r8,%r11,4)
DB 102,65,15,112,224,229 ; pshufd $0xe5,%xmm8,%xmm4
- DB 102,66,15,126,100,138,20 ; movd %xmm4,0x14(%rdx,%r9,4)
- DB 102,70,15,126,68,138,16 ; movd %xmm8,0x10(%rdx,%r9,4)
- DB 243,70,15,127,12,138 ; movdqu %xmm9,(%rdx,%r9,4)
- DB 233,13,255,255,255 ; jmpq 29d2a <_sk_srcover_rgba_8888_sse2_8bit+0x11e>
+ DB 102,67,15,126,100,152,20 ; movd %xmm4,0x14(%r8,%r11,4)
+ DB 102,71,15,126,68,152,16 ; movd %xmm8,0x10(%r8,%r11,4)
+ DB 243,71,15,127,12,152 ; movdqu %xmm9,(%r8,%r11,4)
+ DB 233,4,255,255,255 ; jmpq 29c61 <_sk_srcover_rgba_8888_sse2_8bit+0x119>
DB 15,31,0 ; nopl (%rax)
- DB 58,255 ; cmp %bh,%bh
+ DB 55 ; (bad)
+ DB 255 ; (bad)
DB 255 ; (bad)
DB 255 ; (bad)
- DB 123,255 ; jnp 29e25 <_sk_srcover_rgba_8888_sse2_8bit+0x219>
+ DB 123,255 ; jnp 29d65 <_sk_srcover_rgba_8888_sse2_8bit+0x21d>
DB 255 ; (bad)
DB 255,110,255 ; ljmp *-0x1(%rsi)
DB 255 ; (bad)
- DB 255,23 ; callq *(%rdi)
+ DB 255,14 ; decl (%rsi)
DB 254 ; (bad)
DB 255 ; (bad)
DB 255,168,255,255,255,147 ; ljmp *-0x6c000001(%rax)
@@ -40161,7 +40152,7 @@ _sk_scale_1_float_sse2_8bit LABEL PROC
DB 102,68,15,111,200 ; movdqa %xmm0,%xmm9
DB 72,173 ; lods %ds:(%rsi),%rax
DB 243,15,16,0 ; movss (%rax),%xmm0
- DB 243,15,89,5,160,34,0,0 ; mulss 0x22a0(%rip),%xmm0 # 2c110 <_sk_overlay_sse2_8bit+0x49b>
+ DB 243,15,89,5,156,34,0,0 ; mulss 0x229c(%rip),%xmm0 # 2c04c <_sk_overlay_sse2_8bit+0x49c>
DB 243,15,44,192 ; cvttss2si %xmm0,%eax
DB 102,15,239,246 ; pxor %xmm6,%xmm6
DB 102,65,15,111,193 ; movdqa %xmm9,%xmm0
@@ -40173,7 +40164,7 @@ _sk_scale_1_float_sse2_8bit LABEL PROC
DB 102,15,96,246 ; punpcklbw %xmm6,%xmm6
DB 242,15,112,246,0 ; pshuflw $0x0,%xmm6,%xmm6
DB 102,15,112,246,80 ; pshufd $0x50,%xmm6,%xmm6
- DB 102,15,219,53,39,44,0,0 ; pand 0x2c27(%rip),%xmm6 # 2cad0 <_sk_overlay_sse2_8bit+0xe5b>
+ DB 102,15,219,53,39,44,0,0 ; pand 0x2c27(%rip),%xmm6 # 2ca10 <_sk_overlay_sse2_8bit+0xe60>
DB 102,15,111,254 ; movdqa %xmm6,%xmm7
DB 102,65,15,213,248 ; pmullw %xmm8,%xmm7
DB 102,15,111,230 ; movdqa %xmm6,%xmm4
@@ -40196,18 +40187,17 @@ _sk_scale_1_float_sse2_8bit LABEL PROC
PUBLIC _sk_scale_u8_sse2_8bit
_sk_scale_u8_sse2_8bit LABEL PROC
- DB 76,99,7 ; movslq (%rdi),%r8
- DB 76,139,79,16 ; mov 0x10(%rdi),%r9
- DB 72,173 ; lods %ds:(%rsi),%rax
- DB 72,99,72,8 ; movslq 0x8(%rax),%rcx
- DB 72,99,87,8 ; movslq 0x8(%rdi),%rdx
- DB 72,15,175,209 ; imul %rcx,%rdx
- DB 72,3,16 ; add (%rax),%rdx
- DB 77,133,201 ; test %r9,%r9
- DB 15,133,239,0,0,0 ; jne 2a009 <_sk_scale_u8_sse2_8bit+0x110>
- DB 243,66,15,126,36,2 ; movq (%rdx,%r8,1),%xmm4
+ DB 72,173 ; lods %ds:(%rsi),%rax
+ DB 76,99,72,8 ; movslq 0x8(%rax),%r9
+ DB 76,99,193 ; movslq %ecx,%r8
+ DB 77,15,175,193 ; imul %r9,%r8
+ DB 76,3,0 ; add (%rax),%r8
+ DB 76,99,218 ; movslq %edx,%r11
+ DB 72,133,255 ; test %rdi,%rdi
+ DB 15,133,239,0,0,0 ; jne 29f44 <_sk_scale_u8_sse2_8bit+0x10b>
+ DB 243,67,15,126,36,24 ; movq (%r8,%r11,1),%xmm4
DB 102,15,96,224 ; punpcklbw %xmm0,%xmm4
- DB 102,15,219,37,164,43,0,0 ; pand 0x2ba4(%rip),%xmm4 # 2cad0 <_sk_overlay_sse2_8bit+0xe5b>
+ DB 102,15,219,37,169,43,0,0 ; pand 0x2ba9(%rip),%xmm4 # 2ca10 <_sk_overlay_sse2_8bit+0xe60>
DB 102,69,15,239,192 ; pxor %xmm8,%xmm8
DB 102,15,111,236 ; movdqa %xmm4,%xmm5
DB 102,65,15,105,232 ; punpckhwd %xmm8,%xmm5
@@ -40256,56 +40246,57 @@ _sk_scale_u8_sse2_8bit LABEL PROC
DB 102,15,111,196 ; movdqa %xmm4,%xmm0
DB 102,15,111,205 ; movdqa %xmm5,%xmm1
DB 255,224 ; jmpq *%rax
+ DB 65,137,249 ; mov %edi,%r9d
DB 65,128,225,7 ; and $0x7,%r9b
DB 102,15,239,228 ; pxor %xmm4,%xmm4
DB 65,254,201 ; dec %r9b
DB 65,128,249,6 ; cmp $0x6,%r9b
- DB 15,135,6,255,255,255 ; ja 29f24 <_sk_scale_u8_sse2_8bit+0x2b>
- DB 65,15,182,193 ; movzbl %r9b,%eax
- DB 72,141,13,119,0,0,0 ; lea 0x77(%rip),%rcx # 2a0a0 <_sk_scale_u8_sse2_8bit+0x1a7>
- DB 72,99,4,129 ; movslq (%rcx,%rax,4),%rax
- DB 72,1,200 ; add %rcx,%rax
+ DB 15,135,3,255,255,255 ; ja 29e5f <_sk_scale_u8_sse2_8bit+0x26>
+ DB 69,15,182,201 ; movzbl %r9b,%r9d
+ DB 76,141,21,117,0,0,0 ; lea 0x75(%rip),%r10 # 29fdc <_sk_scale_u8_sse2_8bit+0x1a3>
+ DB 75,99,4,138 ; movslq (%r10,%r9,4),%rax
+ DB 76,1,208 ; add %r10,%rax
DB 255,224 ; jmpq *%rax
- DB 66,15,182,4,2 ; movzbl (%rdx,%r8,1),%eax
+ DB 67,15,182,4,24 ; movzbl (%r8,%r11,1),%eax
DB 102,15,110,224 ; movd %eax,%xmm4
- DB 233,228,254,255,255 ; jmpq 29f24 <_sk_scale_u8_sse2_8bit+0x2b>
- DB 66,15,182,68,2,2 ; movzbl 0x2(%rdx,%r8,1),%eax
+ DB 233,225,254,255,255 ; jmpq 29e5f <_sk_scale_u8_sse2_8bit+0x26>
+ DB 67,15,182,68,24,2 ; movzbl 0x2(%r8,%r11,1),%eax
DB 102,15,239,228 ; pxor %xmm4,%xmm4
DB 102,15,196,224,2 ; pinsrw $0x2,%eax,%xmm4
- DB 66,15,183,4,2 ; movzwl (%rdx,%r8,1),%eax
+ DB 67,15,183,4,24 ; movzwl (%r8,%r11,1),%eax
DB 102,15,110,232 ; movd %eax,%xmm5
DB 102,15,96,232 ; punpcklbw %xmm0,%xmm5
DB 243,15,16,229 ; movss %xmm5,%xmm4
- DB 233,191,254,255,255 ; jmpq 29f24 <_sk_scale_u8_sse2_8bit+0x2b>
- DB 66,15,182,68,2,6 ; movzbl 0x6(%rdx,%r8,1),%eax
+ DB 233,188,254,255,255 ; jmpq 29e5f <_sk_scale_u8_sse2_8bit+0x26>
+ DB 67,15,182,68,24,6 ; movzbl 0x6(%r8,%r11,1),%eax
DB 102,15,239,228 ; pxor %xmm4,%xmm4
DB 102,15,196,224,6 ; pinsrw $0x6,%eax,%xmm4
- DB 66,15,182,68,2,5 ; movzbl 0x5(%rdx,%r8,1),%eax
+ DB 67,15,182,68,24,5 ; movzbl 0x5(%r8,%r11,1),%eax
DB 102,15,196,224,5 ; pinsrw $0x5,%eax,%xmm4
- DB 66,15,182,68,2,4 ; movzbl 0x4(%rdx,%r8,1),%eax
+ DB 67,15,182,68,24,4 ; movzbl 0x4(%r8,%r11,1),%eax
DB 102,15,196,224,4 ; pinsrw $0x4,%eax,%xmm4
- DB 102,66,15,110,44,2 ; movd (%rdx,%r8,1),%xmm5
+ DB 102,67,15,110,44,24 ; movd (%r8,%r11,1),%xmm5
DB 102,15,96,232 ; punpcklbw %xmm0,%xmm5
DB 242,15,16,229 ; movsd %xmm5,%xmm4
- DB 233,135,254,255,255 ; jmpq 29f24 <_sk_scale_u8_sse2_8bit+0x2b>
- DB 15,31,0 ; nopl (%rax)
- DB 146 ; xchg %eax,%edx
+ DB 233,132,254,255,255 ; jmpq 29e5f <_sk_scale_u8_sse2_8bit+0x26>
+ DB 144 ; nop
+ DB 148 ; xchg %eax,%esp
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,175,255,255,255,160 ; ljmp *-0x5f000001(%rdi)
+ DB 255,177,255,255,255,162 ; pushq -0x5d000001(%rcx)
DB 255 ; (bad)
DB 255 ; (bad)
DB 255 ; (bad)
- DB 234 ; (bad)
+ DB 236 ; in (%dx),%al
DB 255 ; (bad)
DB 255 ; (bad)
+ DB 255,225 ; jmpq *%rcx
DB 255 ; (bad)
- DB 223,255 ; (bad)
DB 255 ; (bad)
- DB 255,212 ; callq *%rsp
+ DB 255,214 ; callq *%rsi
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,197 ; inc %ebp
+ DB 255,199 ; inc %edi
DB 255 ; (bad)
DB 255 ; (bad)
DB 255 ; .byte 0xff
@@ -40314,7 +40305,7 @@ PUBLIC _sk_lerp_1_float_sse2_8bit
_sk_lerp_1_float_sse2_8bit LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 243,15,16,32 ; movss (%rax),%xmm4
- DB 243,15,89,37,70,32,0,0 ; mulss 0x2046(%rip),%xmm4 # 2c110 <_sk_overlay_sse2_8bit+0x49b>
+ DB 243,15,89,37,70,32,0,0 ; mulss 0x2046(%rip),%xmm4 # 2c04c <_sk_overlay_sse2_8bit+0x49c>
DB 243,15,44,196 ; cvttss2si %xmm4,%eax
DB 102,15,110,224 ; movd %eax,%xmm4
DB 102,15,96,228 ; punpcklbw %xmm4,%xmm4
@@ -40327,7 +40318,7 @@ _sk_lerp_1_float_sse2_8bit LABEL PROC
DB 102,68,15,111,217 ; movdqa %xmm1,%xmm11
DB 102,69,15,96,217 ; punpcklbw %xmm9,%xmm11
DB 102,65,15,104,201 ; punpckhbw %xmm9,%xmm1
- DB 102,15,111,53,197,41,0,0 ; movdqa 0x29c5(%rip),%xmm6 # 2cad0 <_sk_overlay_sse2_8bit+0xe5b>
+ DB 102,15,111,53,201,41,0,0 ; movdqa 0x29c9(%rip),%xmm6 # 2ca10 <_sk_overlay_sse2_8bit+0xe60>
DB 102,65,15,219,240 ; pand %xmm8,%xmm6
DB 102,15,111,230 ; movdqa %xmm6,%xmm4
DB 102,15,213,225 ; pmullw %xmm1,%xmm4
@@ -40382,18 +40373,17 @@ _sk_lerp_1_float_sse2_8bit LABEL PROC
PUBLIC _sk_lerp_u8_sse2_8bit
_sk_lerp_u8_sse2_8bit LABEL PROC
- DB 76,99,7 ; movslq (%rdi),%r8
- DB 76,139,79,16 ; mov 0x10(%rdi),%r9
- DB 72,173 ; lods %ds:(%rsi),%rax
- DB 72,99,72,8 ; movslq 0x8(%rax),%rcx
- DB 72,99,87,8 ; movslq 0x8(%rdi),%rdx
- DB 72,15,175,209 ; imul %rcx,%rdx
- DB 72,3,16 ; add (%rax),%rdx
- DB 77,133,201 ; test %r9,%r9
- DB 15,133,141,1,0,0 ; jne 2a3a0 <_sk_lerp_u8_sse2_8bit+0x1ae>
- DB 243,66,15,126,44,2 ; movq (%rdx,%r8,1),%xmm5
+ DB 72,173 ; lods %ds:(%rsi),%rax
+ DB 76,99,72,8 ; movslq 0x8(%rax),%r9
+ DB 76,99,193 ; movslq %ecx,%r8
+ DB 77,15,175,193 ; imul %r9,%r8
+ DB 76,3,0 ; add (%rax),%r8
+ DB 76,99,218 ; movslq %edx,%r11
+ DB 72,133,255 ; test %rdi,%rdi
+ DB 15,133,141,1,0,0 ; jne 2a2d7 <_sk_lerp_u8_sse2_8bit+0x1a9>
+ DB 243,67,15,126,44,24 ; movq (%r8,%r11,1),%xmm5
DB 102,15,96,232 ; punpcklbw %xmm0,%xmm5
- DB 102,15,219,45,171,40,0,0 ; pand 0x28ab(%rip),%xmm5 # 2cad0 <_sk_overlay_sse2_8bit+0xe5b>
+ DB 102,15,219,45,180,40,0,0 ; pand 0x28b4(%rip),%xmm5 # 2ca10 <_sk_overlay_sse2_8bit+0xe60>
DB 102,69,15,239,192 ; pxor %xmm8,%xmm8
DB 102,15,111,229 ; movdqa %xmm5,%xmm4
DB 102,65,15,105,224 ; punpckhwd %xmm8,%xmm4
@@ -40475,55 +40465,56 @@ _sk_lerp_u8_sse2_8bit LABEL PROC
DB 102,65,15,252,204 ; paddb %xmm12,%xmm1
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
+ DB 65,137,249 ; mov %edi,%r9d
DB 65,128,225,7 ; and $0x7,%r9b
DB 102,15,239,237 ; pxor %xmm5,%xmm5
DB 65,254,201 ; dec %r9b
DB 65,128,249,6 ; cmp $0x6,%r9b
- DB 15,135,104,254,255,255 ; ja 2a21d <_sk_lerp_u8_sse2_8bit+0x2b>
- DB 65,15,182,193 ; movzbl %r9b,%eax
- DB 72,141,13,116,0,0,0 ; lea 0x74(%rip),%rcx # 2a434 <_sk_lerp_u8_sse2_8bit+0x242>
- DB 72,99,4,129 ; movslq (%rcx,%rax,4),%rax
- DB 72,1,200 ; add %rcx,%rax
+ DB 15,135,101,254,255,255 ; ja 2a154 <_sk_lerp_u8_sse2_8bit+0x26>
+ DB 69,15,182,201 ; movzbl %r9b,%r9d
+ DB 76,141,21,118,0,0,0 ; lea 0x76(%rip),%r10 # 2a370 <_sk_lerp_u8_sse2_8bit+0x242>
+ DB 75,99,4,138 ; movslq (%r10,%r9,4),%rax
+ DB 76,1,208 ; add %r10,%rax
DB 255,224 ; jmpq *%rax
- DB 66,15,182,4,2 ; movzbl (%rdx,%r8,1),%eax
+ DB 67,15,182,4,24 ; movzbl (%r8,%r11,1),%eax
DB 102,15,110,232 ; movd %eax,%xmm5
- DB 233,70,254,255,255 ; jmpq 2a21d <_sk_lerp_u8_sse2_8bit+0x2b>
- DB 66,15,182,68,2,2 ; movzbl 0x2(%rdx,%r8,1),%eax
+ DB 233,67,254,255,255 ; jmpq 2a154 <_sk_lerp_u8_sse2_8bit+0x26>
+ DB 67,15,182,68,24,2 ; movzbl 0x2(%r8,%r11,1),%eax
DB 102,15,239,237 ; pxor %xmm5,%xmm5
DB 102,15,196,232,2 ; pinsrw $0x2,%eax,%xmm5
- DB 66,15,183,4,2 ; movzwl (%rdx,%r8,1),%eax
+ DB 67,15,183,4,24 ; movzwl (%r8,%r11,1),%eax
DB 102,15,110,224 ; movd %eax,%xmm4
DB 102,15,96,224 ; punpcklbw %xmm0,%xmm4
DB 243,15,16,236 ; movss %xmm4,%xmm5
- DB 233,33,254,255,255 ; jmpq 2a21d <_sk_lerp_u8_sse2_8bit+0x2b>
- DB 66,15,182,68,2,6 ; movzbl 0x6(%rdx,%r8,1),%eax
+ DB 233,30,254,255,255 ; jmpq 2a154 <_sk_lerp_u8_sse2_8bit+0x26>
+ DB 67,15,182,68,24,6 ; movzbl 0x6(%r8,%r11,1),%eax
DB 102,15,239,237 ; pxor %xmm5,%xmm5
DB 102,15,196,232,6 ; pinsrw $0x6,%eax,%xmm5
- DB 66,15,182,68,2,5 ; movzbl 0x5(%rdx,%r8,1),%eax
+ DB 67,15,182,68,24,5 ; movzbl 0x5(%r8,%r11,1),%eax
DB 102,15,196,232,5 ; pinsrw $0x5,%eax,%xmm5
- DB 66,15,182,68,2,4 ; movzbl 0x4(%rdx,%r8,1),%eax
+ DB 67,15,182,68,24,4 ; movzbl 0x4(%r8,%r11,1),%eax
DB 102,15,196,232,4 ; pinsrw $0x4,%eax,%xmm5
- DB 102,66,15,110,36,2 ; movd (%rdx,%r8,1),%xmm4
+ DB 102,67,15,110,36,24 ; movd (%r8,%r11,1),%xmm4
DB 102,15,96,224 ; punpcklbw %xmm0,%xmm4
DB 242,15,16,236 ; movsd %xmm4,%xmm5
- DB 233,233,253,255,255 ; jmpq 2a21d <_sk_lerp_u8_sse2_8bit+0x2b>
- DB 149 ; xchg %eax,%ebp
- DB 255 ; (bad)
+ DB 233,230,253,255,255 ; jmpq 2a154 <_sk_lerp_u8_sse2_8bit+0x26>
+ DB 102,144 ; xchg %ax,%ax
+ DB 147 ; xchg %eax,%ebx
DB 255 ; (bad)
- DB 255,178,255,255,255,163 ; pushq -0x5c000001(%rdx)
DB 255 ; (bad)
+ DB 255,176,255,255,255,161 ; pushq -0x5e000001(%rax)
DB 255 ; (bad)
DB 255 ; (bad)
- DB 237 ; in (%dx),%eax
DB 255 ; (bad)
+ DB 235,255 ; jmp 2a37d <_sk_lerp_u8_sse2_8bit+0x24f>
DB 255 ; (bad)
- DB 255,226 ; jmpq *%rdx
+ DB 255,224 ; jmpq *%rax
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,215 ; callq *%rdi
+ DB 255,213 ; callq *%rbp
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,200 ; dec %eax
+ DB 255,198 ; inc %esi
DB 255 ; (bad)
DB 255 ; (bad)
DB 255 ; .byte 0xff
@@ -40545,7 +40536,7 @@ _sk_move_dst_src_sse2_8bit LABEL PROC
PUBLIC _sk_black_color_sse2_8bit
_sk_black_color_sse2_8bit LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 15,40,5,163,45,0,0 ; movaps 0x2da3(%rip),%xmm0 # 2d210 <_sk_overlay_sse2_8bit+0x159b>
+ DB 15,40,5,167,45,0,0 ; movaps 0x2da7(%rip),%xmm0 # 2d150 <_sk_overlay_sse2_8bit+0x15a0>
DB 15,40,200 ; movaps %xmm0,%xmm1
DB 255,224 ; jmpq *%rax
@@ -41083,9 +41074,9 @@ _sk_multiply_sse2_8bit LABEL PROC
DB 102,15,112,210,232 ; pshufd $0xe8,%xmm2,%xmm2
DB 102,15,96,210 ; punpcklbw %xmm2,%xmm2
DB 242,15,112,210,95 ; pshuflw $0x5f,%xmm2,%xmm2
- DB 243,15,112,226,95 ; pshufhw $0x5f,%xmm2,%xmm4
+ DB 243,15,112,234,95 ; pshufhw $0x5f,%xmm2,%xmm5
DB 102,69,15,118,192 ; pcmpeqd %xmm8,%xmm8
- DB 102,65,15,239,224 ; pxor %xmm8,%xmm4
+ DB 102,65,15,239,232 ; pxor %xmm8,%xmm5
DB 102,65,15,239,248 ; pxor %xmm8,%xmm7
DB 102,69,15,239,237 ; pxor %xmm13,%xmm13
DB 102,68,15,111,200 ; movdqa %xmm0,%xmm9
@@ -41101,23 +41092,23 @@ _sk_multiply_sse2_8bit LABEL PROC
DB 102,68,15,111,255 ; movdqa %xmm7,%xmm15
DB 102,69,15,96,253 ; punpcklbw %xmm13,%xmm15
DB 102,65,15,104,253 ; punpckhbw %xmm13,%xmm7
- DB 102,15,111,236 ; movdqa %xmm4,%xmm5
- DB 102,65,15,96,237 ; punpcklbw %xmm13,%xmm5
- DB 102,65,15,104,229 ; punpckhbw %xmm13,%xmm4
- DB 102,65,15,213,226 ; pmullw %xmm10,%xmm4
- DB 102,65,15,213,236 ; pmullw %xmm12,%xmm5
+ DB 102,15,111,229 ; movdqa %xmm5,%xmm4
+ DB 102,65,15,96,229 ; punpcklbw %xmm13,%xmm4
+ DB 102,65,15,104,237 ; punpckhbw %xmm13,%xmm5
+ DB 102,65,15,213,234 ; pmullw %xmm10,%xmm5
+ DB 102,65,15,213,228 ; pmullw %xmm12,%xmm4
DB 102,65,15,213,249 ; pmullw %xmm9,%xmm7
DB 102,69,15,213,251 ; pmullw %xmm11,%xmm15
DB 102,69,15,253,251 ; paddw %xmm11,%xmm15
DB 102,65,15,253,249 ; paddw %xmm9,%xmm7
- DB 102,65,15,253,236 ; paddw %xmm12,%xmm5
- DB 102,65,15,253,226 ; paddw %xmm10,%xmm4
- DB 102,15,113,212,8 ; psrlw $0x8,%xmm4
+ DB 102,65,15,253,228 ; paddw %xmm12,%xmm4
+ DB 102,65,15,253,234 ; paddw %xmm10,%xmm5
DB 102,15,113,213,8 ; psrlw $0x8,%xmm5
+ DB 102,15,113,212,8 ; psrlw $0x8,%xmm4
DB 102,15,113,215,8 ; psrlw $0x8,%xmm7
DB 102,65,15,113,215,8 ; psrlw $0x8,%xmm15
DB 102,68,15,103,255 ; packuswb %xmm7,%xmm15
- DB 102,15,103,236 ; packuswb %xmm4,%xmm5
+ DB 102,15,103,229 ; packuswb %xmm5,%xmm4
DB 243,15,112,194,231 ; pshufhw $0xe7,%xmm2,%xmm0
DB 102,15,112,192,232 ; pshufd $0xe8,%xmm0,%xmm0
DB 102,15,96,192 ; punpcklbw %xmm0,%xmm0
@@ -41130,28 +41121,28 @@ _sk_multiply_sse2_8bit LABEL PROC
DB 243,15,112,241,95 ; pshufhw $0x5f,%xmm1,%xmm6
DB 102,65,15,239,240 ; pxor %xmm8,%xmm6
DB 102,65,15,239,192 ; pxor %xmm8,%xmm0
- DB 102,68,15,111,195 ; movdqa %xmm3,%xmm8
DB 102,15,111,211 ; movdqa %xmm3,%xmm2
- DB 102,65,15,96,213 ; punpcklbw %xmm13,%xmm2
- DB 102,69,15,104,197 ; punpckhbw %xmm13,%xmm8
+ DB 102,15,111,235 ; movdqa %xmm3,%xmm5
+ DB 102,65,15,96,237 ; punpcklbw %xmm13,%xmm5
+ DB 102,65,15,104,213 ; punpckhbw %xmm13,%xmm2
DB 102,65,15,111,206 ; movdqa %xmm14,%xmm1
DB 102,15,127,12,36 ; movdqa %xmm1,(%rsp)
DB 102,15,111,249 ; movdqa %xmm1,%xmm7
DB 102,65,15,96,253 ; punpcklbw %xmm13,%xmm7
DB 102,69,15,104,245 ; punpckhbw %xmm13,%xmm14
- DB 102,15,111,224 ; movdqa %xmm0,%xmm4
- DB 102,65,15,96,229 ; punpcklbw %xmm13,%xmm4
+ DB 102,68,15,111,192 ; movdqa %xmm0,%xmm8
+ DB 102,69,15,96,197 ; punpcklbw %xmm13,%xmm8
DB 102,65,15,104,197 ; punpckhbw %xmm13,%xmm0
DB 102,15,111,206 ; movdqa %xmm6,%xmm1
DB 102,65,15,96,205 ; punpcklbw %xmm13,%xmm1
DB 102,65,15,104,245 ; punpckhbw %xmm13,%xmm6
- DB 102,65,15,213,192 ; pmullw %xmm8,%xmm0
- DB 102,15,213,226 ; pmullw %xmm2,%xmm4
- DB 102,15,253,226 ; paddw %xmm2,%xmm4
- DB 102,65,15,253,192 ; paddw %xmm8,%xmm0
+ DB 102,15,213,194 ; pmullw %xmm2,%xmm0
+ DB 102,68,15,213,197 ; pmullw %xmm5,%xmm8
+ DB 102,68,15,253,197 ; paddw %xmm5,%xmm8
+ DB 102,15,253,194 ; paddw %xmm2,%xmm0
DB 102,15,113,208,8 ; psrlw $0x8,%xmm0
- DB 102,15,113,212,8 ; psrlw $0x8,%xmm4
- DB 102,15,103,224 ; packuswb %xmm0,%xmm4
+ DB 102,65,15,113,208,8 ; psrlw $0x8,%xmm8
+ DB 102,68,15,103,192 ; packuswb %xmm0,%xmm8
DB 102,65,15,213,246 ; pmullw %xmm14,%xmm6
DB 102,15,213,207 ; pmullw %xmm7,%xmm1
DB 102,15,253,207 ; paddw %xmm7,%xmm1
@@ -41159,70 +41150,70 @@ _sk_multiply_sse2_8bit LABEL PROC
DB 102,15,113,214,8 ; psrlw $0x8,%xmm6
DB 102,15,113,209,8 ; psrlw $0x8,%xmm1
DB 102,15,103,206 ; packuswb %xmm6,%xmm1
- DB 102,15,252,205 ; paddb %xmm5,%xmm1
- DB 102,65,15,252,231 ; paddb %xmm15,%xmm4
- DB 102,65,15,213,211 ; pmullw %xmm11,%xmm2
- DB 102,65,15,253,211 ; paddw %xmm11,%xmm2
- DB 102,69,15,213,193 ; pmullw %xmm9,%xmm8
- DB 102,69,15,253,193 ; paddw %xmm9,%xmm8
+ DB 102,15,252,204 ; paddb %xmm4,%xmm1
+ DB 102,69,15,252,199 ; paddb %xmm15,%xmm8
+ DB 102,65,15,213,235 ; pmullw %xmm11,%xmm5
+ DB 102,65,15,253,235 ; paddw %xmm11,%xmm5
+ DB 102,65,15,213,209 ; pmullw %xmm9,%xmm2
+ DB 102,65,15,253,209 ; paddw %xmm9,%xmm2
DB 102,65,15,213,252 ; pmullw %xmm12,%xmm7
DB 102,65,15,253,252 ; paddw %xmm12,%xmm7
DB 102,69,15,213,242 ; pmullw %xmm10,%xmm14
DB 102,69,15,253,242 ; paddw %xmm10,%xmm14
- DB 102,65,15,113,208,8 ; psrlw $0x8,%xmm8
DB 102,15,113,210,8 ; psrlw $0x8,%xmm2
- DB 102,65,15,103,208 ; packuswb %xmm8,%xmm2
+ DB 102,15,113,213,8 ; psrlw $0x8,%xmm5
+ DB 102,15,103,234 ; packuswb %xmm2,%xmm5
DB 102,65,15,113,214,8 ; psrlw $0x8,%xmm14
DB 102,15,113,215,8 ; psrlw $0x8,%xmm7
DB 102,65,15,103,254 ; packuswb %xmm14,%xmm7
- DB 102,15,252,226 ; paddb %xmm2,%xmm4
+ DB 102,68,15,252,197 ; paddb %xmm5,%xmm8
DB 102,15,252,207 ; paddb %xmm7,%xmm1
DB 72,173 ; lods %ds:(%rsi),%rax
DB 102,15,111,211 ; movdqa %xmm3,%xmm2
DB 15,40,28,36 ; movaps (%rsp),%xmm3
- DB 102,15,111,196 ; movdqa %xmm4,%xmm0
+ DB 102,65,15,111,192 ; movdqa %xmm8,%xmm0
DB 72,131,196,24 ; add $0x18,%rsp
DB 255,224 ; jmpq *%rax
PUBLIC _sk_screen_sse2_8bit
_sk_screen_sse2_8bit LABEL PROC
- DB 102,69,15,118,219 ; pcmpeqd %xmm11,%xmm11
- DB 102,68,15,111,201 ; movdqa %xmm1,%xmm9
- DB 102,69,15,239,203 ; pxor %xmm11,%xmm9
- DB 102,68,15,239,216 ; pxor %xmm0,%xmm11
- DB 102,69,15,239,192 ; pxor %xmm8,%xmm8
- DB 102,65,15,111,235 ; movdqa %xmm11,%xmm5
- DB 102,65,15,96,232 ; punpcklbw %xmm8,%xmm5
- DB 102,69,15,104,216 ; punpckhbw %xmm8,%xmm11
- DB 102,65,15,111,225 ; movdqa %xmm9,%xmm4
- DB 102,65,15,96,224 ; punpcklbw %xmm8,%xmm4
- DB 102,69,15,104,200 ; punpckhbw %xmm8,%xmm9
- DB 102,15,111,242 ; movdqa %xmm2,%xmm6
- DB 102,68,15,111,210 ; movdqa %xmm2,%xmm10
- DB 102,69,15,96,208 ; punpcklbw %xmm8,%xmm10
- DB 102,65,15,104,240 ; punpckhbw %xmm8,%xmm6
- DB 102,15,111,251 ; movdqa %xmm3,%xmm7
+ DB 102,68,15,111,193 ; movdqa %xmm1,%xmm8
+ DB 102,15,118,255 ; pcmpeqd %xmm7,%xmm7
+ DB 102,69,15,111,208 ; movdqa %xmm8,%xmm10
+ DB 102,68,15,239,215 ; pxor %xmm7,%xmm10
+ DB 102,15,239,248 ; pxor %xmm0,%xmm7
+ DB 102,69,15,239,201 ; pxor %xmm9,%xmm9
+ DB 102,15,111,239 ; movdqa %xmm7,%xmm5
+ DB 102,65,15,96,233 ; punpcklbw %xmm9,%xmm5
+ DB 102,65,15,104,249 ; punpckhbw %xmm9,%xmm7
+ DB 102,65,15,111,202 ; movdqa %xmm10,%xmm1
+ DB 102,65,15,96,201 ; punpcklbw %xmm9,%xmm1
+ DB 102,69,15,104,209 ; punpckhbw %xmm9,%xmm10
+ DB 102,15,111,226 ; movdqa %xmm2,%xmm4
+ DB 102,68,15,111,218 ; movdqa %xmm2,%xmm11
+ DB 102,69,15,96,217 ; punpcklbw %xmm9,%xmm11
+ DB 102,65,15,104,225 ; punpckhbw %xmm9,%xmm4
+ DB 102,15,111,243 ; movdqa %xmm3,%xmm6
DB 102,68,15,111,227 ; movdqa %xmm3,%xmm12
- DB 102,69,15,96,224 ; punpcklbw %xmm8,%xmm12
- DB 102,65,15,104,248 ; punpckhbw %xmm8,%xmm7
- DB 102,65,15,213,249 ; pmullw %xmm9,%xmm7
- DB 102,68,15,213,228 ; pmullw %xmm4,%xmm12
- DB 102,65,15,213,243 ; pmullw %xmm11,%xmm6
- DB 102,68,15,213,213 ; pmullw %xmm5,%xmm10
- DB 102,65,15,253,234 ; paddw %xmm10,%xmm5
- DB 102,65,15,253,243 ; paddw %xmm11,%xmm6
- DB 102,65,15,253,228 ; paddw %xmm12,%xmm4
- DB 102,65,15,253,249 ; paddw %xmm9,%xmm7
- DB 102,15,113,215,8 ; psrlw $0x8,%xmm7
- DB 102,15,113,212,8 ; psrlw $0x8,%xmm4
+ DB 102,69,15,96,225 ; punpcklbw %xmm9,%xmm12
+ DB 102,65,15,104,241 ; punpckhbw %xmm9,%xmm6
+ DB 102,65,15,213,242 ; pmullw %xmm10,%xmm6
+ DB 102,68,15,213,225 ; pmullw %xmm1,%xmm12
+ DB 102,15,213,231 ; pmullw %xmm7,%xmm4
+ DB 102,68,15,213,221 ; pmullw %xmm5,%xmm11
+ DB 102,65,15,253,235 ; paddw %xmm11,%xmm5
+ DB 102,15,253,231 ; paddw %xmm7,%xmm4
+ DB 102,65,15,253,204 ; paddw %xmm12,%xmm1
+ DB 102,65,15,253,242 ; paddw %xmm10,%xmm6
DB 102,15,113,214,8 ; psrlw $0x8,%xmm6
+ DB 102,15,113,209,8 ; psrlw $0x8,%xmm1
+ DB 102,15,113,212,8 ; psrlw $0x8,%xmm4
DB 102,15,113,213,8 ; psrlw $0x8,%xmm5
- DB 102,15,103,238 ; packuswb %xmm6,%xmm5
- DB 102,15,103,231 ; packuswb %xmm7,%xmm4
+ DB 102,15,103,236 ; packuswb %xmm4,%xmm5
+ DB 102,15,103,206 ; packuswb %xmm6,%xmm1
DB 102,15,252,197 ; paddb %xmm5,%xmm0
- DB 102,15,252,225 ; paddb %xmm1,%xmm4
+ DB 102,65,15,252,200 ; paddb %xmm8,%xmm1
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 102,15,111,204 ; movdqa %xmm4,%xmm1
DB 255,224 ; jmpq *%rax
PUBLIC _sk_xor__sse2_8bit
@@ -41416,7 +41407,7 @@ _sk_darken_sse2_8bit LABEL PROC
DB 102,65,15,248,234 ; psubb %xmm10,%xmm5
DB 102,15,248,207 ; psubb %xmm7,%xmm1
DB 102,15,248,196 ; psubb %xmm4,%xmm0
- DB 102,15,111,37,44,31,0,0 ; movdqa 0x1f2c(%rip),%xmm4 # 2d2a0 <_sk_overlay_sse2_8bit+0x162b>
+ DB 102,15,111,37,49,31,0,0 ; movdqa 0x1f31(%rip),%xmm4 # 2d1e0 <_sk_overlay_sse2_8bit+0x1630>
DB 102,15,219,236 ; pand %xmm4,%xmm5
DB 102,15,111,252 ; movdqa %xmm4,%xmm7
DB 102,15,223,248 ; pandn %xmm0,%xmm7
@@ -41522,7 +41513,7 @@ _sk_lighten_sse2_8bit LABEL PROC
DB 102,65,15,248,234 ; psubb %xmm10,%xmm5
DB 102,15,248,207 ; psubb %xmm7,%xmm1
DB 102,15,248,196 ; psubb %xmm4,%xmm0
- DB 102,15,111,37,64,29,0,0 ; movdqa 0x1d40(%rip),%xmm4 # 2d2a0 <_sk_overlay_sse2_8bit+0x162b>
+ DB 102,15,111,37,69,29,0,0 ; movdqa 0x1d45(%rip),%xmm4 # 2d1e0 <_sk_overlay_sse2_8bit+0x1630>
DB 102,15,219,236 ; pand %xmm4,%xmm5
DB 102,15,111,252 ; movdqa %xmm4,%xmm7
DB 102,15,223,248 ; pandn %xmm0,%xmm7
@@ -41570,7 +41561,7 @@ _sk_exclusion_sse2_8bit LABEL PROC
DB 102,15,113,214,8 ; psrlw $0x8,%xmm6
DB 102,15,103,244 ; packuswb %xmm4,%xmm6
DB 102,15,103,239 ; packuswb %xmm7,%xmm5
- DB 102,15,111,37,115,28,0,0 ; movdqa 0x1c73(%rip),%xmm4 # 2d2a0 <_sk_overlay_sse2_8bit+0x162b>
+ DB 102,15,111,37,120,28,0,0 ; movdqa 0x1c78(%rip),%xmm4 # 2d1e0 <_sk_overlay_sse2_8bit+0x1630>
DB 102,15,248,205 ; psubb %xmm5,%xmm1
DB 102,15,219,236 ; pand %xmm4,%xmm5
DB 102,15,219,230 ; pand %xmm6,%xmm4
@@ -41667,7 +41658,7 @@ _sk_difference_sse2_8bit LABEL PROC
DB 102,65,15,103,244 ; packuswb %xmm12,%xmm6
DB 102,65,15,218,226 ; pminub %xmm10,%xmm4
DB 102,65,15,218,243 ; pminub %xmm11,%xmm6
- DB 102,15,111,45,176,26,0,0 ; movdqa 0x1ab0(%rip),%xmm5 # 2d2a0 <_sk_overlay_sse2_8bit+0x162b>
+ DB 102,15,111,45,181,26,0,0 ; movdqa 0x1ab5(%rip),%xmm5 # 2d1e0 <_sk_overlay_sse2_8bit+0x1630>
DB 102,15,248,206 ; psubb %xmm6,%xmm1
DB 102,15,219,245 ; pand %xmm5,%xmm6
DB 102,15,219,236 ; pand %xmm4,%xmm5
@@ -41681,15 +41672,15 @@ PUBLIC _sk_hardlight_sse2_8bit
_sk_hardlight_sse2_8bit LABEL PROC
DB 72,129,236,56,1,0,0 ; sub $0x138,%rsp
DB 102,68,15,111,250 ; movdqa %xmm2,%xmm15
- DB 102,68,15,111,200 ; movdqa %xmm0,%xmm9
+ DB 102,68,15,111,192 ; movdqa %xmm0,%xmm8
DB 102,15,239,237 ; pxor %xmm5,%xmm5
- DB 102,69,15,111,241 ; movdqa %xmm9,%xmm14
+ DB 102,69,15,111,240 ; movdqa %xmm8,%xmm14
DB 102,68,15,96,245 ; punpcklbw %xmm5,%xmm14
DB 102,15,111,193 ; movdqa %xmm1,%xmm0
DB 102,15,96,197 ; punpcklbw %xmm5,%xmm0
- DB 102,68,15,111,192 ; movdqa %xmm0,%xmm8
- DB 242,65,15,112,193,231 ; pshuflw $0xe7,%xmm9,%xmm0
- DB 102,68,15,104,205 ; punpckhbw %xmm5,%xmm9
+ DB 102,68,15,111,200 ; movdqa %xmm0,%xmm9
+ DB 242,65,15,112,192,231 ; pshuflw $0xe7,%xmm8,%xmm0
+ DB 102,68,15,104,197 ; punpckhbw %xmm5,%xmm8
DB 243,15,112,192,231 ; pshufhw $0xe7,%xmm0,%xmm0
DB 102,15,112,192,232 ; pshufd $0xe8,%xmm0,%xmm0
DB 102,15,96,192 ; punpcklbw %xmm0,%xmm0
@@ -41744,17 +41735,17 @@ _sk_hardlight_sse2_8bit LABEL PROC
DB 102,15,96,245 ; punpcklbw %xmm5,%xmm6
DB 102,69,15,111,214 ; movdqa %xmm14,%xmm10
DB 102,69,15,253,210 ; paddw %xmm10,%xmm10
- DB 102,65,15,111,193 ; movdqa %xmm9,%xmm0
+ DB 102,65,15,111,192 ; movdqa %xmm8,%xmm0
DB 102,15,253,192 ; paddw %xmm0,%xmm0
- DB 102,65,15,111,216 ; movdqa %xmm8,%xmm3
- DB 102,69,15,253,192 ; paddw %xmm8,%xmm8
+ DB 102,65,15,111,217 ; movdqa %xmm9,%xmm3
+ DB 102,69,15,253,201 ; paddw %xmm9,%xmm9
DB 102,15,111,84,36,64 ; movdqa 0x40(%rsp),%xmm2
DB 102,15,253,210 ; paddw %xmm2,%xmm2
DB 102,15,217,215 ; psubusw %xmm7,%xmm2
DB 102,15,117,213 ; pcmpeqw %xmm5,%xmm2
DB 102,15,127,148,36,240,0,0,0 ; movdqa %xmm2,0xf0(%rsp)
- DB 102,69,15,217,196 ; psubusw %xmm12,%xmm8
- DB 102,68,15,117,197 ; pcmpeqw %xmm5,%xmm8
+ DB 102,69,15,217,204 ; psubusw %xmm12,%xmm9
+ DB 102,68,15,117,205 ; pcmpeqw %xmm5,%xmm9
DB 102,15,111,84,36,32 ; movdqa 0x20(%rsp),%xmm2
DB 102,15,217,194 ; psubusw %xmm2,%xmm0
DB 102,15,117,197 ; pcmpeqw %xmm5,%xmm0
@@ -41762,7 +41753,7 @@ _sk_hardlight_sse2_8bit LABEL PROC
DB 102,68,15,111,220 ; movdqa %xmm4,%xmm11
DB 102,69,15,217,211 ; psubusw %xmm11,%xmm10
DB 102,68,15,117,213 ; pcmpeqw %xmm5,%xmm10
- DB 102,15,111,45,19,17,0,0 ; movdqa 0x1113(%rip),%xmm5 # 2cad0 <_sk_overlay_sse2_8bit+0xe5b>
+ DB 102,15,111,45,24,17,0,0 ; movdqa 0x1118(%rip),%xmm5 # 2ca10 <_sk_overlay_sse2_8bit+0xe60>
DB 102,15,111,198 ; movdqa %xmm6,%xmm0
DB 102,15,239,197 ; pxor %xmm5,%xmm0
DB 102,65,15,213,198 ; pmullw %xmm14,%xmm0
@@ -41781,7 +41772,7 @@ _sk_hardlight_sse2_8bit LABEL PROC
DB 102,69,15,249,222 ; psubw %xmm14,%xmm11
DB 102,15,111,193 ; movdqa %xmm1,%xmm0
DB 102,15,239,197 ; pxor %xmm5,%xmm0
- DB 102,65,15,213,193 ; pmullw %xmm9,%xmm0
+ DB 102,65,15,213,192 ; pmullw %xmm8,%xmm0
DB 102,15,127,132,36,160,0,0,0 ; movdqa %xmm0,0xa0(%rsp)
DB 102,68,15,111,250 ; movdqa %xmm2,%xmm15
DB 102,68,15,239,253 ; pxor %xmm5,%xmm15
@@ -41790,20 +41781,20 @@ _sk_hardlight_sse2_8bit LABEL PROC
DB 102,15,111,193 ; movdqa %xmm1,%xmm0
DB 102,15,249,206 ; psubw %xmm6,%xmm1
DB 102,15,127,76,36,96 ; movdqa %xmm1,0x60(%rsp)
- DB 102,65,15,213,241 ; pmullw %xmm9,%xmm6
+ DB 102,65,15,213,240 ; pmullw %xmm8,%xmm6
DB 102,15,213,194 ; pmullw %xmm2,%xmm0
DB 102,15,127,68,36,112 ; movdqa %xmm0,0x70(%rsp)
- DB 102,65,15,249,209 ; psubw %xmm9,%xmm2
+ DB 102,65,15,249,208 ; psubw %xmm8,%xmm2
DB 102,15,127,84,36,32 ; movdqa %xmm2,0x20(%rsp)
DB 102,65,15,111,197 ; movdqa %xmm13,%xmm0
DB 102,15,111,200 ; movdqa %xmm0,%xmm1
DB 102,15,239,205 ; pxor %xmm5,%xmm1
DB 102,15,213,203 ; pmullw %xmm3,%xmm1
DB 102,15,127,76,36,16 ; movdqa %xmm1,0x10(%rsp)
- DB 102,69,15,111,204 ; movdqa %xmm12,%xmm9
- DB 102,68,15,239,205 ; pxor %xmm5,%xmm9
+ DB 102,69,15,111,196 ; movdqa %xmm12,%xmm8
+ DB 102,68,15,239,197 ; pxor %xmm5,%xmm8
DB 102,15,111,36,36 ; movdqa (%rsp),%xmm4
- DB 102,68,15,213,204 ; pmullw %xmm4,%xmm9
+ DB 102,68,15,213,196 ; pmullw %xmm4,%xmm8
DB 102,68,15,111,232 ; movdqa %xmm0,%xmm13
DB 102,15,249,196 ; psubw %xmm4,%xmm0
DB 102,15,127,68,36,80 ; movdqa %xmm0,0x50(%rsp)
@@ -41852,9 +41843,9 @@ _sk_hardlight_sse2_8bit LABEL PROC
DB 102,15,235,198 ; por %xmm6,%xmm0
DB 102,15,111,216 ; movdqa %xmm0,%xmm3
DB 102,15,253,228 ; paddw %xmm4,%xmm4
- DB 102,65,15,219,224 ; pand %xmm8,%xmm4
- DB 102,69,15,223,197 ; pandn %xmm13,%xmm8
- DB 102,68,15,235,196 ; por %xmm4,%xmm8
+ DB 102,65,15,219,225 ; pand %xmm9,%xmm4
+ DB 102,69,15,223,205 ; pandn %xmm13,%xmm9
+ DB 102,68,15,235,204 ; por %xmm4,%xmm9
DB 102,15,253,210 ; paddw %xmm2,%xmm2
DB 102,15,111,132,36,240,0,0,0 ; movdqa 0xf0(%rsp),%xmm0
DB 102,15,219,208 ; pand %xmm0,%xmm2
@@ -41864,33 +41855,33 @@ _sk_hardlight_sse2_8bit LABEL PROC
DB 102,15,111,148,36,208,0,0,0 ; movdqa 0xd0(%rsp),%xmm2
DB 102,15,253,148,36,224,0,0,0 ; paddw 0xe0(%rsp),%xmm2
DB 102,68,15,253,188,36,160,0,0,0 ; paddw 0xa0(%rsp),%xmm15
- DB 102,68,15,253,76,36,16 ; paddw 0x10(%rsp),%xmm9
+ DB 102,68,15,253,68,36,16 ; paddw 0x10(%rsp),%xmm8
DB 102,15,253,44,36 ; paddw (%rsp),%xmm5
- DB 102,15,111,5,193,22,0,0 ; movdqa 0x16c1(%rip),%xmm0 # 2d2b0 <_sk_overlay_sse2_8bit+0x163b>
+ DB 102,15,111,5,198,22,0,0 ; movdqa 0x16c6(%rip),%xmm0 # 2d1f0 <_sk_overlay_sse2_8bit+0x1640>
DB 102,15,253,208 ; paddw %xmm0,%xmm2
DB 102,68,15,253,210 ; paddw %xmm2,%xmm10
DB 102,68,15,253,248 ; paddw %xmm0,%xmm15
DB 102,68,15,253,251 ; paddw %xmm3,%xmm15
- DB 102,68,15,253,200 ; paddw %xmm0,%xmm9
- DB 102,69,15,253,193 ; paddw %xmm9,%xmm8
+ DB 102,68,15,253,192 ; paddw %xmm0,%xmm8
+ DB 102,69,15,253,200 ; paddw %xmm8,%xmm9
DB 102,15,253,232 ; paddw %xmm0,%xmm5
DB 102,15,253,233 ; paddw %xmm1,%xmm5
- DB 102,15,111,5,164,22,0,0 ; movdqa 0x16a4(%rip),%xmm0 # 2d2c0 <_sk_overlay_sse2_8bit+0x164b>
+ DB 102,15,111,5,169,22,0,0 ; movdqa 0x16a9(%rip),%xmm0 # 2d200 <_sk_overlay_sse2_8bit+0x1650>
DB 102,15,228,232 ; pmulhuw %xmm0,%xmm5
- DB 102,68,15,228,192 ; pmulhuw %xmm0,%xmm8
+ DB 102,68,15,228,200 ; pmulhuw %xmm0,%xmm9
DB 102,68,15,228,248 ; pmulhuw %xmm0,%xmm15
DB 102,68,15,228,208 ; pmulhuw %xmm0,%xmm10
DB 102,65,15,113,215,7 ; psrlw $0x7,%xmm15
DB 102,65,15,113,210,7 ; psrlw $0x7,%xmm10
DB 102,69,15,103,215 ; packuswb %xmm15,%xmm10
DB 102,15,113,213,7 ; psrlw $0x7,%xmm5
- DB 102,65,15,113,208,7 ; psrlw $0x7,%xmm8
- DB 102,68,15,103,197 ; packuswb %xmm5,%xmm8
+ DB 102,65,15,113,209,7 ; psrlw $0x7,%xmm9
+ DB 102,68,15,103,205 ; packuswb %xmm5,%xmm9
DB 72,173 ; lods %ds:(%rsi),%rax
DB 15,40,148,36,32,1,0,0 ; movaps 0x120(%rsp),%xmm2
DB 15,40,156,36,16,1,0,0 ; movaps 0x110(%rsp),%xmm3
DB 102,65,15,111,194 ; movdqa %xmm10,%xmm0
- DB 102,65,15,111,200 ; movdqa %xmm8,%xmm1
+ DB 102,65,15,111,201 ; movdqa %xmm9,%xmm1
DB 72,129,196,56,1,0,0 ; add $0x138,%rsp
DB 255,224 ; jmpq *%rax
@@ -41978,7 +41969,7 @@ _sk_overlay_sse2_8bit LABEL PROC
DB 102,15,217,234 ; psubusw %xmm2,%xmm5
DB 102,15,117,236 ; pcmpeqw %xmm4,%xmm5
DB 102,15,127,172,36,160,0,0,0 ; movdqa %xmm5,0xa0(%rsp)
- DB 102,15,111,53,168,12,0,0 ; movdqa 0xca8(%rip),%xmm6 # 2cad0 <_sk_overlay_sse2_8bit+0xe5b>
+ DB 102,15,111,53,173,12,0,0 ; movdqa 0xcad(%rip),%xmm6 # 2ca10 <_sk_overlay_sse2_8bit+0xe60>
DB 102,15,111,194 ; movdqa %xmm2,%xmm0
DB 102,15,239,198 ; pxor %xmm6,%xmm0
DB 102,65,15,213,199 ; pmullw %xmm15,%xmm0
@@ -42086,7 +42077,7 @@ _sk_overlay_sse2_8bit LABEL PROC
DB 102,68,15,253,92,36,112 ; paddw 0x70(%rsp),%xmm11
DB 102,15,253,44,36 ; paddw (%rsp),%xmm5
DB 102,15,253,116,36,16 ; paddw 0x10(%rsp),%xmm6
- DB 102,15,111,5,82,18,0,0 ; movdqa 0x1252(%rip),%xmm0 # 2d2b0 <_sk_overlay_sse2_8bit+0x163b>
+ DB 102,15,111,5,87,18,0,0 ; movdqa 0x1257(%rip),%xmm0 # 2d1f0 <_sk_overlay_sse2_8bit+0x1640>
DB 102,68,15,253,224 ; paddw %xmm0,%xmm12
DB 102,68,15,253,227 ; paddw %xmm3,%xmm12
DB 102,68,15,253,216 ; paddw %xmm0,%xmm11
@@ -42095,7 +42086,7 @@ _sk_overlay_sse2_8bit LABEL PROC
DB 102,15,253,234 ; paddw %xmm2,%xmm5
DB 102,15,253,240 ; paddw %xmm0,%xmm6
DB 102,15,253,241 ; paddw %xmm1,%xmm6
- DB 102,15,111,5,54,18,0,0 ; movdqa 0x1236(%rip),%xmm0 # 2d2c0 <_sk_overlay_sse2_8bit+0x164b>
+ DB 102,15,111,5,59,18,0,0 ; movdqa 0x123b(%rip),%xmm0 # 2d200 <_sk_overlay_sse2_8bit+0x1650>
DB 102,15,228,240 ; pmulhuw %xmm0,%xmm6
DB 102,15,228,232 ; pmulhuw %xmm0,%xmm5
DB 102,68,15,228,216 ; pmulhuw %xmm0,%xmm11
@@ -42129,14 +42120,14 @@ ALIGN 4
DB 252 ; cld
DB 190,0,0,128,191 ; mov $0xbf800000,%esi
DB 0,0 ; add %al,(%rax)
- DB 224,64 ; loopne 2c144 <.literal4+0x64>
+ DB 224,64 ; loopne 2c080 <.literal4+0x64>
DB 154 ; (bad)
DB 153 ; cltd
DB 153 ; cltd
DB 62,61,10,23,63,174 ; ds cmp $0xae3f170a,%eax
- DB 71,225,61 ; rex.RXB loope 2c14d <.literal4+0x6d>
+ DB 71,225,61 ; rex.RXB loope 2c089 <.literal4+0x6d>
DB 0,0 ; add %al,(%rax)
- DB 127,67 ; jg 2c157 <.literal4+0x77>
+ DB 127,67 ; jg 2c093 <.literal4+0x77>
DB 145 ; xchg %eax,%ecx
DB 131,158,61,92,143,50,63 ; sbbl $0x3f,0x328f5c3d(%rsi)
DB 10,215 ; or %bh,%dl
@@ -42169,7 +42160,7 @@ ALIGN 4
DB 0,0 ; add %al,(%rax)
DB 8,33 ; or %ah,(%rcx)
DB 132,55 ; test %dh,(%rdi)
- DB 224,7 ; loopne 2c16d <.literal4+0x8d>
+ DB 224,7 ; loopne 2c0a9 <.literal4+0x8d>
DB 0,0 ; add %al,(%rax)
DB 33,8 ; and %ecx,(%rax)
DB 2,58 ; add (%rdx),%bh
@@ -42180,8 +42171,8 @@ ALIGN 4
DB 0,0 ; add %al,(%rax)
DB 0,52,255 ; add %dh,(%rdi,%rdi,8)
DB 255 ; (bad)
- DB 127,0 ; jg 2c180 <.literal4+0xa0>
- DB 119,115 ; ja 2c1f5 <.literal4+0x115>
+ DB 127,0 ; jg 2c0bc <.literal4+0xa0>
+ DB 119,115 ; ja 2c131 <.literal4+0x115>
DB 248 ; clc
DB 194,117,191 ; retq $0xbf75
DB 191,63,249,68,180 ; mov $0xb444f93f,%edi
@@ -42204,12 +42195,12 @@ ALIGN 4
DB 190,80,128,3,62 ; mov $0x3e038050,%esi
DB 31 ; (bad)
DB 215 ; xlat %ds:(%rbx)
- DB 118,63 ; jbe 2c20b <.literal4+0x12b>
+ DB 118,63 ; jbe 2c147 <.literal4+0x12b>
DB 246,64,83,63 ; testb $0x3f,0x53(%rax)
DB 0,0 ; add %al,(%rax)
DB 248 ; clc
DB 65,0,0 ; add %al,(%r8)
- DB 124,66 ; jl 2c21a <.literal4+0x13a>
+ DB 124,66 ; jl 2c156 <.literal4+0x13a>
DB 0,240 ; add %dh,%al
DB 0,0 ; add %al,(%rax)
DB 137,136,136,55,0,15 ; mov %ecx,0xf003788(%rax)
@@ -42219,9 +42210,9 @@ ALIGN 4
DB 137,136,136,59,15,0 ; mov %ecx,0xf3b88(%rax)
DB 0,0 ; add %al,(%rax)
DB 137,136,136,61,0,0 ; mov %ecx,0x3d88(%rax)
- DB 112,65 ; jo 2c23d <.literal4+0x15d>
+ DB 112,65 ; jo 2c179 <.literal4+0x15d>
DB 0,255 ; add %bh,%bh
- DB 127,71 ; jg 2c247 <.literal4+0x167>
+ DB 127,71 ; jg 2c183 <.literal4+0x167>
DB 208 ; (bad)
DB 179,89 ; mov $0x59,%bl
DB 62,89 ; ds pop %rcx
@@ -42248,15 +42239,15 @@ ALIGN 4
DB 0,0 ; add %al,(%rax)
DB 128,0,0 ; addb $0x0,(%rax)
DB 0,191,0,0,192,191 ; add %bh,-0x40400000(%rdi)
- DB 114,28 ; jb 2c266 <.literal4+0x186>
+ DB 114,28 ; jb 2c1a2 <.literal4+0x186>
DB 199 ; (bad)
DB 62,0,0 ; add %al,%ds:(%rax)
DB 192,63,85 ; sarb $0x55,(%rdi)
DB 85 ; push %rbp
DB 149 ; xchg %eax,%ebp
DB 191,57,142,99,61 ; mov $0x3d638e39,%edi
- DB 114,249 ; jb 2c253 <.literal4+0x173>
- DB 127,63 ; jg 2c29b <_sk_overlay_sse2_8bit+0x626>
+ DB 114,249 ; jb 2c18f <.literal4+0x173>
+ DB 127,63 ; jg 2c1d7 <_sk_overlay_sse2_8bit+0x627>
DB 3,0 ; add (%rax),%eax
DB 0,0 ; add %al,(%rax)
DB 0,128,0,0,0,4 ; add %al,0x4000000(%rax)
@@ -42317,16 +42308,16 @@ ALIGN 32
DB 0,1 ; add %al,(%rcx)
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,5,255,255,255,9 ; incl 0x9ffffff(%rip) # a02c2e8 <_sk_overlay_sse2_8bit+0xa000673>
+ DB 255,5,255,255,255,9 ; incl 0x9ffffff(%rip) # a02c228 <_sk_overlay_sse2_8bit+0xa000678>
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,13,255,255,255,17 ; decl 0x11ffffff(%rip) # 1202c2f0 <_sk_overlay_sse2_8bit+0x1200067b>
+ DB 255,13,255,255,255,17 ; decl 0x11ffffff(%rip) # 1202c230 <_sk_overlay_sse2_8bit+0x12000680>
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,21,255,255,255,25 ; callq *0x19ffffff(%rip) # 1a02c2f8 <_sk_overlay_sse2_8bit+0x1a000683>
+ DB 255,21,255,255,255,25 ; callq *0x19ffffff(%rip) # 1a02c238 <_sk_overlay_sse2_8bit+0x1a000688>
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,29,255,255,255,2 ; lcall *0x2ffffff(%rip) # 302c300 <_sk_overlay_sse2_8bit+0x300068b>
+ DB 255,29,255,255,255,2 ; lcall *0x2ffffff(%rip) # 302c240 <_sk_overlay_sse2_8bit+0x3000690>
DB 255 ; (bad)
DB 255 ; (bad)
DB 255,6 ; incl (%rsi)
@@ -42369,16 +42360,16 @@ ALIGN 32
DB 0,0 ; add %al,(%rax)
DB 1,255 ; add %edi,%edi
DB 255 ; (bad)
- DB 255,5,255,255,255,9 ; incl 0x9ffffff(%rip) # a02c348 <_sk_overlay_sse2_8bit+0xa0006d3>
+ DB 255,5,255,255,255,9 ; incl 0x9ffffff(%rip) # a02c288 <_sk_overlay_sse2_8bit+0xa0006d8>
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,13,255,255,255,17 ; decl 0x11ffffff(%rip) # 1202c350 <_sk_overlay_sse2_8bit+0x120006db>
+ DB 255,13,255,255,255,17 ; decl 0x11ffffff(%rip) # 1202c290 <_sk_overlay_sse2_8bit+0x120006e0>
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,21,255,255,255,25 ; callq *0x19ffffff(%rip) # 1a02c358 <_sk_overlay_sse2_8bit+0x1a0006e3>
+ DB 255,21,255,255,255,25 ; callq *0x19ffffff(%rip) # 1a02c298 <_sk_overlay_sse2_8bit+0x1a0006e8>
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,29,255,255,255,2 ; lcall *0x2ffffff(%rip) # 302c360 <_sk_overlay_sse2_8bit+0x30006eb>
+ DB 255,29,255,255,255,2 ; lcall *0x2ffffff(%rip) # 302c2a0 <_sk_overlay_sse2_8bit+0x30006f0>
DB 255 ; (bad)
DB 255 ; (bad)
DB 255,6 ; incl (%rsi)
@@ -42421,16 +42412,16 @@ ALIGN 32
DB 0,0 ; add %al,(%rax)
DB 1,255 ; add %edi,%edi
DB 255 ; (bad)
- DB 255,5,255,255,255,9 ; incl 0x9ffffff(%rip) # a02c3a8 <_sk_overlay_sse2_8bit+0xa000733>
+ DB 255,5,255,255,255,9 ; incl 0x9ffffff(%rip) # a02c2e8 <_sk_overlay_sse2_8bit+0xa000738>
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,13,255,255,255,17 ; decl 0x11ffffff(%rip) # 1202c3b0 <_sk_overlay_sse2_8bit+0x1200073b>
+ DB 255,13,255,255,255,17 ; decl 0x11ffffff(%rip) # 1202c2f0 <_sk_overlay_sse2_8bit+0x12000740>
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,21,255,255,255,25 ; callq *0x19ffffff(%rip) # 1a02c3b8 <_sk_overlay_sse2_8bit+0x1a000743>
+ DB 255,21,255,255,255,25 ; callq *0x19ffffff(%rip) # 1a02c2f8 <_sk_overlay_sse2_8bit+0x1a000748>
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,29,255,255,255,2 ; lcall *0x2ffffff(%rip) # 302c3c0 <_sk_overlay_sse2_8bit+0x300074b>
+ DB 255,29,255,255,255,2 ; lcall *0x2ffffff(%rip) # 302c300 <_sk_overlay_sse2_8bit+0x3000750>
DB 255 ; (bad)
DB 255 ; (bad)
DB 255,6 ; incl (%rsi)
@@ -42473,16 +42464,16 @@ ALIGN 32
DB 0,0 ; add %al,(%rax)
DB 1,255 ; add %edi,%edi
DB 255 ; (bad)
- DB 255,5,255,255,255,9 ; incl 0x9ffffff(%rip) # a02c408 <_sk_overlay_sse2_8bit+0xa000793>
+ DB 255,5,255,255,255,9 ; incl 0x9ffffff(%rip) # a02c348 <_sk_overlay_sse2_8bit+0xa000798>
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,13,255,255,255,17 ; decl 0x11ffffff(%rip) # 1202c410 <_sk_overlay_sse2_8bit+0x1200079b>
+ DB 255,13,255,255,255,17 ; decl 0x11ffffff(%rip) # 1202c350 <_sk_overlay_sse2_8bit+0x120007a0>
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,21,255,255,255,25 ; callq *0x19ffffff(%rip) # 1a02c418 <_sk_overlay_sse2_8bit+0x1a0007a3>
+ DB 255,21,255,255,255,25 ; callq *0x19ffffff(%rip) # 1a02c358 <_sk_overlay_sse2_8bit+0x1a0007a8>
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,29,255,255,255,2 ; lcall *0x2ffffff(%rip) # 302c420 <_sk_overlay_sse2_8bit+0x30007ab>
+ DB 255,29,255,255,255,2 ; lcall *0x2ffffff(%rip) # 302c360 <_sk_overlay_sse2_8bit+0x30007b0>
DB 255 ; (bad)
DB 255 ; (bad)
DB 255,6 ; incl (%rsi)
@@ -42525,16 +42516,16 @@ ALIGN 32
DB 0,0 ; add %al,(%rax)
DB 1,255 ; add %edi,%edi
DB 255 ; (bad)
- DB 255,5,255,255,255,9 ; incl 0x9ffffff(%rip) # a02c468 <_sk_overlay_sse2_8bit+0xa0007f3>
+ DB 255,5,255,255,255,9 ; incl 0x9ffffff(%rip) # a02c3a8 <_sk_overlay_sse2_8bit+0xa0007f8>
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,13,255,255,255,17 ; decl 0x11ffffff(%rip) # 1202c470 <_sk_overlay_sse2_8bit+0x120007fb>
+ DB 255,13,255,255,255,17 ; decl 0x11ffffff(%rip) # 1202c3b0 <_sk_overlay_sse2_8bit+0x12000800>
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,21,255,255,255,25 ; callq *0x19ffffff(%rip) # 1a02c478 <_sk_overlay_sse2_8bit+0x1a000803>
+ DB 255,21,255,255,255,25 ; callq *0x19ffffff(%rip) # 1a02c3b8 <_sk_overlay_sse2_8bit+0x1a000808>
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,29,255,255,255,2 ; lcall *0x2ffffff(%rip) # 302c480 <_sk_overlay_sse2_8bit+0x300080b>
+ DB 255,29,255,255,255,2 ; lcall *0x2ffffff(%rip) # 302c3c0 <_sk_overlay_sse2_8bit+0x3000810>
DB 255 ; (bad)
DB 255 ; (bad)
DB 255,6 ; incl (%rsi)
@@ -42577,16 +42568,16 @@ ALIGN 32
DB 0,0 ; add %al,(%rax)
DB 1,255 ; add %edi,%edi
DB 255 ; (bad)
- DB 255,5,255,255,255,9 ; incl 0x9ffffff(%rip) # a02c4c8 <_sk_overlay_sse2_8bit+0xa000853>
+ DB 255,5,255,255,255,9 ; incl 0x9ffffff(%rip) # a02c408 <_sk_overlay_sse2_8bit+0xa000858>
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,13,255,255,255,17 ; decl 0x11ffffff(%rip) # 1202c4d0 <_sk_overlay_sse2_8bit+0x1200085b>
+ DB 255,13,255,255,255,17 ; decl 0x11ffffff(%rip) # 1202c410 <_sk_overlay_sse2_8bit+0x12000860>
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,21,255,255,255,25 ; callq *0x19ffffff(%rip) # 1a02c4d8 <_sk_overlay_sse2_8bit+0x1a000863>
+ DB 255,21,255,255,255,25 ; callq *0x19ffffff(%rip) # 1a02c418 <_sk_overlay_sse2_8bit+0x1a000868>
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,29,255,255,255,2 ; lcall *0x2ffffff(%rip) # 302c4e0 <_sk_overlay_sse2_8bit+0x300086b>
+ DB 255,29,255,255,255,2 ; lcall *0x2ffffff(%rip) # 302c420 <_sk_overlay_sse2_8bit+0x3000870>
DB 255 ; (bad)
DB 255 ; (bad)
DB 255,6 ; incl (%rsi)
@@ -42629,16 +42620,16 @@ ALIGN 32
DB 0,0 ; add %al,(%rax)
DB 1,255 ; add %edi,%edi
DB 255 ; (bad)
- DB 255,5,255,255,255,9 ; incl 0x9ffffff(%rip) # a02c528 <_sk_overlay_sse2_8bit+0xa0008b3>
+ DB 255,5,255,255,255,9 ; incl 0x9ffffff(%rip) # a02c468 <_sk_overlay_sse2_8bit+0xa0008b8>
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,13,255,255,255,17 ; decl 0x11ffffff(%rip) # 1202c530 <_sk_overlay_sse2_8bit+0x120008bb>
+ DB 255,13,255,255,255,17 ; decl 0x11ffffff(%rip) # 1202c470 <_sk_overlay_sse2_8bit+0x120008c0>
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,21,255,255,255,25 ; callq *0x19ffffff(%rip) # 1a02c538 <_sk_overlay_sse2_8bit+0x1a0008c3>
+ DB 255,21,255,255,255,25 ; callq *0x19ffffff(%rip) # 1a02c478 <_sk_overlay_sse2_8bit+0x1a0008c8>
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,29,255,255,255,2 ; lcall *0x2ffffff(%rip) # 302c540 <_sk_overlay_sse2_8bit+0x30008cb>
+ DB 255,29,255,255,255,2 ; lcall *0x2ffffff(%rip) # 302c480 <_sk_overlay_sse2_8bit+0x30008d0>
DB 255 ; (bad)
DB 255 ; (bad)
DB 255,6 ; incl (%rsi)
@@ -42681,16 +42672,16 @@ ALIGN 32
DB 0,0 ; add %al,(%rax)
DB 1,255 ; add %edi,%edi
DB 255 ; (bad)
- DB 255,5,255,255,255,9 ; incl 0x9ffffff(%rip) # a02c588 <_sk_overlay_sse2_8bit+0xa000913>
+ DB 255,5,255,255,255,9 ; incl 0x9ffffff(%rip) # a02c4c8 <_sk_overlay_sse2_8bit+0xa000918>
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,13,255,255,255,17 ; decl 0x11ffffff(%rip) # 1202c590 <_sk_overlay_sse2_8bit+0x1200091b>
+ DB 255,13,255,255,255,17 ; decl 0x11ffffff(%rip) # 1202c4d0 <_sk_overlay_sse2_8bit+0x12000920>
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,21,255,255,255,25 ; callq *0x19ffffff(%rip) # 1a02c598 <_sk_overlay_sse2_8bit+0x1a000923>
+ DB 255,21,255,255,255,25 ; callq *0x19ffffff(%rip) # 1a02c4d8 <_sk_overlay_sse2_8bit+0x1a000928>
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,29,255,255,255,2 ; lcall *0x2ffffff(%rip) # 302c5a0 <_sk_overlay_sse2_8bit+0x300092b>
+ DB 255,29,255,255,255,2 ; lcall *0x2ffffff(%rip) # 302c4e0 <_sk_overlay_sse2_8bit+0x3000930>
DB 255 ; (bad)
DB 255 ; (bad)
DB 255,6 ; incl (%rsi)
@@ -43557,11 +43548,11 @@ ALIGN 16
DB 0,128,191,0,0,128 ; add %al,-0x7fffff41(%rax)
DB 191,0,0,224,64 ; mov $0x40e00000,%edi
DB 0,0 ; add %al,(%rax)
- DB 224,64 ; loopne 2cbf8 <.literal16+0x128>
+ DB 224,64 ; loopne 2cb38 <.literal16+0x128>
DB 0,0 ; add %al,(%rax)
- DB 224,64 ; loopne 2cbfc <.literal16+0x12c>
+ DB 224,64 ; loopne 2cb3c <.literal16+0x12c>
DB 0,0 ; add %al,(%rax)
- DB 224,64 ; loopne 2cc00 <.literal16+0x130>
+ DB 224,64 ; loopne 2cb40 <.literal16+0x130>
DB 154 ; (bad)
DB 153 ; cltd
DB 153 ; cltd
@@ -43581,13 +43572,13 @@ ALIGN 16
DB 10,23 ; or (%rdi),%dl
DB 63 ; (bad)
DB 174 ; scas %es:(%rdi),%al
- DB 71,225,61 ; rex.RXB loope 2cc21 <.literal16+0x151>
+ DB 71,225,61 ; rex.RXB loope 2cb61 <.literal16+0x151>
DB 174 ; scas %es:(%rdi),%al
- DB 71,225,61 ; rex.RXB loope 2cc25 <.literal16+0x155>
+ DB 71,225,61 ; rex.RXB loope 2cb65 <.literal16+0x155>
DB 174 ; scas %es:(%rdi),%al
- DB 71,225,61 ; rex.RXB loope 2cc29 <.literal16+0x159>
+ DB 71,225,61 ; rex.RXB loope 2cb69 <.literal16+0x159>
DB 174 ; scas %es:(%rdi),%al
- DB 71,225,61 ; rex.RXB loope 2cc2d <.literal16+0x15d>
+ DB 71,225,61 ; rex.RXB loope 2cb6d <.literal16+0x15d>
DB 255,0 ; incl (%rax)
DB 0,0 ; add %al,(%rax)
DB 255,0 ; incl (%rax)
@@ -43598,10 +43589,10 @@ ALIGN 16
DB 0,0 ; add %al,(%rax)
DB 1,255 ; add %edi,%edi
DB 255 ; (bad)
- DB 255,5,255,255,255,9 ; incl 0x9ffffff(%rip) # a02cc08 <_sk_overlay_sse2_8bit+0xa000f93>
+ DB 255,5,255,255,255,9 ; incl 0x9ffffff(%rip) # a02cb48 <_sk_overlay_sse2_8bit+0xa000f98>
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,13,255,255,255,2 ; decl 0x2ffffff(%rip) # 302cc10 <_sk_overlay_sse2_8bit+0x3000f9b>
+ DB 255,13,255,255,255,2 ; decl 0x2ffffff(%rip) # 302cb50 <_sk_overlay_sse2_8bit+0x3000fa0>
DB 255 ; (bad)
DB 255 ; (bad)
DB 255,6 ; incl (%rsi)
@@ -43616,11 +43607,11 @@ ALIGN 16
DB 255,0 ; incl (%rax)
DB 0,127,67 ; add %bh,0x43(%rdi)
DB 0,0 ; add %al,(%rax)
- DB 127,67 ; jg 2cc6b <.literal16+0x19b>
+ DB 127,67 ; jg 2cbab <.literal16+0x19b>
DB 0,0 ; add %al,(%rax)
- DB 127,67 ; jg 2cc6f <.literal16+0x19f>
+ DB 127,67 ; jg 2cbaf <.literal16+0x19f>
DB 0,0 ; add %al,(%rax)
- DB 127,67 ; jg 2cc73 <.literal16+0x1a3>
+ DB 127,67 ; jg 2cbb3 <.literal16+0x1a3>
DB 145 ; xchg %eax,%ecx
DB 131,158,61,145,131,158,61 ; sbbl $0x3d,-0x617c6ec3(%rsi)
DB 145 ; xchg %eax,%ecx
@@ -43771,13 +43762,13 @@ ALIGN 16
DB 132,55 ; test %dh,(%rdi)
DB 8,33 ; or %ah,(%rcx)
DB 132,55 ; test %dh,(%rdi)
- DB 224,7 ; loopne 2cd79 <.literal16+0x2a9>
+ DB 224,7 ; loopne 2ccb9 <.literal16+0x2a9>
DB 0,0 ; add %al,(%rax)
- DB 224,7 ; loopne 2cd7d <.literal16+0x2ad>
+ DB 224,7 ; loopne 2ccbd <.literal16+0x2ad>
DB 0,0 ; add %al,(%rax)
- DB 224,7 ; loopne 2cd81 <.literal16+0x2b1>
+ DB 224,7 ; loopne 2ccc1 <.literal16+0x2b1>
DB 0,0 ; add %al,(%rax)
- DB 224,7 ; loopne 2cd85 <.literal16+0x2b5>
+ DB 224,7 ; loopne 2ccc5 <.literal16+0x2b5>
DB 0,0 ; add %al,(%rax)
DB 33,8 ; and %ecx,(%rax)
DB 2,58 ; add (%rdx),%bh
@@ -43837,17 +43828,17 @@ ALIGN 16
DB 0,0 ; add %al,(%rax)
DB 52,255 ; xor $0xff,%al
DB 255 ; (bad)
- DB 127,0 ; jg 2ce04 <.literal16+0x334>
+ DB 127,0 ; jg 2cd44 <.literal16+0x334>
DB 255 ; (bad)
DB 255 ; (bad)
- DB 127,0 ; jg 2ce08 <.literal16+0x338>
+ DB 127,0 ; jg 2cd48 <.literal16+0x338>
DB 255 ; (bad)
DB 255 ; (bad)
- DB 127,0 ; jg 2ce0c <.literal16+0x33c>
+ DB 127,0 ; jg 2cd4c <.literal16+0x33c>
DB 255 ; (bad)
DB 255 ; (bad)
- DB 127,0 ; jg 2ce10 <.literal16+0x340>
- DB 119,115 ; ja 2ce85 <.literal16+0x3b5>
+ DB 127,0 ; jg 2cd50 <.literal16+0x340>
+ DB 119,115 ; ja 2cdc5 <.literal16+0x3b5>
DB 248 ; clc
DB 194,119,115 ; retq $0x7377
DB 248 ; clc
@@ -43858,7 +43849,7 @@ ALIGN 16
DB 194,117,191 ; retq $0xbf75
DB 191,63,117,191,191 ; mov $0xbfbf753f,%edi
DB 63 ; (bad)
- DB 117,191 ; jne 2cde9 <.literal16+0x319>
+ DB 117,191 ; jne 2cd29 <.literal16+0x319>
DB 191,63,117,191,191 ; mov $0xbfbf753f,%edi
DB 63 ; (bad)
DB 249 ; stc
@@ -43870,7 +43861,7 @@ ALIGN 16
DB 249 ; stc
DB 68,180,62 ; rex.R mov $0x3e,%spl
DB 163,233,220,63,163,233,220,63,163 ; movabs %eax,0xa33fdce9a33fdce9
- DB 233,220,63,163,233 ; jmpq ffffffffe9a60e2a <_sk_overlay_sse2_8bit+0xffffffffe9a351b5>
+ DB 233,220,63,163,233 ; jmpq ffffffffe9a60d6a <_sk_overlay_sse2_8bit+0xffffffffe9a351ba>
DB 220,63 ; fdivrl (%rdi)
DB 81 ; push %rcx
DB 140,242 ; mov %?,%edx
@@ -43960,16 +43951,16 @@ ALIGN 16
DB 128,3,62 ; addb $0x3e,(%rbx)
DB 31 ; (bad)
DB 215 ; xlat %ds:(%rbx)
- DB 118,63 ; jbe 2cf73 <.literal16+0x4a3>
+ DB 118,63 ; jbe 2ceb3 <.literal16+0x4a3>
DB 31 ; (bad)
DB 215 ; xlat %ds:(%rbx)
- DB 118,63 ; jbe 2cf77 <.literal16+0x4a7>
+ DB 118,63 ; jbe 2ceb7 <.literal16+0x4a7>
DB 31 ; (bad)
DB 215 ; xlat %ds:(%rbx)
- DB 118,63 ; jbe 2cf7b <.literal16+0x4ab>
+ DB 118,63 ; jbe 2cebb <.literal16+0x4ab>
DB 31 ; (bad)
DB 215 ; xlat %ds:(%rbx)
- DB 118,63 ; jbe 2cf7f <.literal16+0x4af>
+ DB 118,63 ; jbe 2cebf <.literal16+0x4af>
DB 246,64,83,63 ; testb $0x3f,0x53(%rax)
DB 246,64,83,63 ; testb $0x3f,0x53(%rax)
DB 246,64,83,63 ; testb $0x3f,0x53(%rax)
@@ -43990,13 +43981,13 @@ ALIGN 16
DB 65,0,0 ; add %al,(%r8)
DB 248 ; clc
DB 65,0,0 ; add %al,(%r8)
- DB 124,66 ; jl 2cfb6 <.literal16+0x4e6>
+ DB 124,66 ; jl 2cef6 <.literal16+0x4e6>
DB 0,0 ; add %al,(%rax)
- DB 124,66 ; jl 2cfba <.literal16+0x4ea>
+ DB 124,66 ; jl 2cefa <.literal16+0x4ea>
DB 0,0 ; add %al,(%rax)
- DB 124,66 ; jl 2cfbe <.literal16+0x4ee>
+ DB 124,66 ; jl 2cefe <.literal16+0x4ee>
DB 0,0 ; add %al,(%rax)
- DB 124,66 ; jl 2cfc2 <.literal16+0x4f2>
+ DB 124,66 ; jl 2cf02 <.literal16+0x4f2>
DB 0,240 ; add %dh,%al
DB 0,0 ; add %al,(%rax)
DB 0,240 ; add %dh,%al
@@ -44042,13 +44033,13 @@ ALIGN 16
DB 136,136,61,137,136,136 ; mov %cl,-0x777776c3(%rax)
DB 61,137,136,136,61 ; cmp $0x3d888889,%eax
DB 0,0 ; add %al,(%rax)
- DB 112,65 ; jo 2d045 <.literal16+0x575>
+ DB 112,65 ; jo 2cf85 <.literal16+0x575>
DB 0,0 ; add %al,(%rax)
- DB 112,65 ; jo 2d049 <.literal16+0x579>
+ DB 112,65 ; jo 2cf89 <.literal16+0x579>
DB 0,0 ; add %al,(%rax)
- DB 112,65 ; jo 2d04d <.literal16+0x57d>
+ DB 112,65 ; jo 2cf8d <.literal16+0x57d>
DB 0,0 ; add %al,(%rax)
- DB 112,65 ; jo 2d051 <.literal16+0x581>
+ DB 112,65 ; jo 2cf91 <.literal16+0x581>
DB 0,128,0,0,0,128 ; add %al,-0x80000000(%rax)
DB 0,0 ; add %al,(%rax)
DB 0,128,0,0,0,128 ; add %al,-0x80000000(%rax)
@@ -44087,13 +44078,13 @@ ALIGN 16
DB 64,254 ; rex (bad)
DB 255,0 ; incl (%rax)
DB 255 ; (bad)
- DB 127,71 ; jg 2d0bb <.literal16+0x5eb>
+ DB 127,71 ; jg 2cffb <.literal16+0x5eb>
DB 0,255 ; add %bh,%bh
- DB 127,71 ; jg 2d0bf <.literal16+0x5ef>
+ DB 127,71 ; jg 2cfff <.literal16+0x5ef>
DB 0,255 ; add %bh,%bh
- DB 127,71 ; jg 2d0c3 <.literal16+0x5f3>
+ DB 127,71 ; jg 2d003 <.literal16+0x5f3>
DB 0,255 ; add %bh,%bh
- DB 127,71 ; jg 2d0c7 <.literal16+0x5f7>
+ DB 127,71 ; jg 2d007 <.literal16+0x5f7>
DB 208 ; (bad)
DB 179,89 ; mov $0x59,%bl
DB 62,208 ; ds (bad)
@@ -44123,10 +44114,10 @@ ALIGN 16
DB 61,152,221,147,61 ; cmp $0x3d93dd98,%eax
DB 152 ; cwtl
DB 221,147,61,45,16,17 ; fstl 0x11102d3d(%rbx)
- DB 192,45,16,17,192,45,16 ; shrb $0x10,0x2dc01110(%rip) # 2dc2e1ca <_sk_overlay_sse2_8bit+0x2dc02555>
+ DB 192,45,16,17,192,45,16 ; shrb $0x10,0x2dc01110(%rip) # 2dc2e10a <_sk_overlay_sse2_8bit+0x2dc0255a>
DB 17,192 ; adc %eax,%eax
DB 45,16,17,192,18 ; sub $0x12c01110,%eax
- DB 120,57 ; js 2d0fc <.literal16+0x62c>
+ DB 120,57 ; js 2d03c <.literal16+0x62c>
DB 64,18,120,57 ; adc 0x39(%rax),%dil
DB 64,18,120,57 ; adc 0x39(%rax),%dil
DB 64,18,120,57 ; adc 0x39(%rax),%dil
@@ -44191,13 +44182,13 @@ ALIGN 16
DB 192,191,0,0,192,191,0 ; sarb $0x0,-0x40400000(%rdi)
DB 0,192 ; add %al,%al
DB 191,0,0,192,191 ; mov $0xbfc00000,%edi
- DB 114,28 ; jb 2d1ae <.literal16+0x6de>
+ DB 114,28 ; jb 2d0ee <.literal16+0x6de>
DB 199 ; (bad)
- DB 62,114,28 ; jb,pt 2d1b2 <.literal16+0x6e2>
+ DB 62,114,28 ; jb,pt 2d0f2 <.literal16+0x6e2>
DB 199 ; (bad)
- DB 62,114,28 ; jb,pt 2d1b6 <.literal16+0x6e6>
+ DB 62,114,28 ; jb,pt 2d0f6 <.literal16+0x6e6>
DB 199 ; (bad)
- DB 62,114,28 ; jb,pt 2d1ba <.literal16+0x6ea>
+ DB 62,114,28 ; jb,pt 2d0fa <.literal16+0x6ea>
DB 199 ; (bad)
DB 62,85 ; ds push %rbp
DB 85 ; push %rbp
@@ -44216,15 +44207,15 @@ ALIGN 16
DB 0,192 ; add %al,%al
DB 63 ; (bad)
DB 57,142,99,61,57,142 ; cmp %ecx,-0x71c6c29d(%rsi)
- DB 99,61,57,142,99,61 ; movslq 0x3d638e39(%rip),%edi # 3d666005 <_sk_overlay_sse2_8bit+0x3d63a390>
+ DB 99,61,57,142,99,61 ; movslq 0x3d638e39(%rip),%edi # 3d665f45 <_sk_overlay_sse2_8bit+0x3d63a395>
DB 57,142,99,61,114,249 ; cmp %ecx,-0x68dc29d(%rsi)
- DB 127,63 ; jg 2d213 <.literal16+0x743>
- DB 114,249 ; jb 2d1cf <.literal16+0x6ff>
- DB 127,63 ; jg 2d217 <.literal16+0x747>
- DB 114,249 ; jb 2d1d3 <.literal16+0x703>
- DB 127,63 ; jg 2d21b <.literal16+0x74b>
- DB 114,249 ; jb 2d1d7 <.literal16+0x707>
- DB 127,63 ; jg 2d21f <.literal16+0x74f>
+ DB 127,63 ; jg 2d153 <.literal16+0x743>
+ DB 114,249 ; jb 2d10f <.literal16+0x6ff>
+ DB 127,63 ; jg 2d157 <.literal16+0x747>
+ DB 114,249 ; jb 2d113 <.literal16+0x703>
+ DB 127,63 ; jg 2d15b <.literal16+0x74b>
+ DB 114,249 ; jb 2d117 <.literal16+0x707>
+ DB 127,63 ; jg 2d15f <.literal16+0x74f>
DB 3,0 ; add (%rax),%eax
DB 0,0 ; add %al,(%rax)
DB 3,0 ; add (%rax),%eax
@@ -44331,14 +44322,14 @@ ALIGN 16
DB 255 ; (bad)
DB 255 ; (bad)
DB 255,0 ; incl (%rax)
- DB 127,0 ; jg 2d2b2 <.literal16+0x7e2>
- DB 127,0 ; jg 2d2b4 <.literal16+0x7e4>
- DB 127,0 ; jg 2d2b6 <.literal16+0x7e6>
- DB 127,0 ; jg 2d2b8 <.literal16+0x7e8>
- DB 127,0 ; jg 2d2ba <.literal16+0x7ea>
- DB 127,0 ; jg 2d2bc <.literal16+0x7ec>
- DB 127,0 ; jg 2d2be <.literal16+0x7ee>
- DB 127,0 ; jg 2d2c0 <.literal16+0x7f0>
+ DB 127,0 ; jg 2d1f2 <.literal16+0x7e2>
+ DB 127,0 ; jg 2d1f4 <.literal16+0x7e4>
+ DB 127,0 ; jg 2d1f6 <.literal16+0x7e6>
+ DB 127,0 ; jg 2d1f8 <.literal16+0x7e8>
+ DB 127,0 ; jg 2d1fa <.literal16+0x7ea>
+ DB 127,0 ; jg 2d1fc <.literal16+0x7ec>
+ DB 127,0 ; jg 2d1fe <.literal16+0x7ee>
+ DB 127,0 ; jg 2d200 <.literal16+0x7f0>
DB 129,128,129,128,129,128,129,128,129,128; addl $0x80818081,-0x7f7e7f7f(%rax)
DB 129 ; .byte 0x81
DB 128 ; .byte 0x80