aboutsummaryrefslogtreecommitdiffhomepage
path: root/src/jumper
diff options
context:
space:
mode:
authorGravatar Mike Klein <mtklein@chromium.org>2017-09-27 11:42:30 -0400
committerGravatar Skia Commit-Bot <skia-commit-bot@chromium.org>2017-09-28 18:08:28 +0000
commitf7729c262076b88b2635e7f8d09e7f3340eea79b (patch)
tree20ecc274046d229721ae9383359e4e5ff370a2a1 /src/jumper
parent6c08b7bbe47201a21d9e53a907b4baa906bb20b4 (diff)
Move context types into STAGE() macros.
This is something I came up with while writing _lowp.cpp. This should all be a logical no-op, but there are some code generation changes. I'm not exactly sure why. Change-Id: Iaad36b5298b37fe26ebd375a147a48852f98e1e4 Reviewed-on: https://skia-review.googlesource.com/52003 Commit-Queue: Mike Klein <mtklein@chromium.org> Reviewed-by: Herb Derby <herb@google.com>
Diffstat (limited to 'src/jumper')
-rw-r--r--src/jumper/SkJumper_generated.S2008
-rw-r--r--src/jumper/SkJumper_generated_win.S1736
-rw-r--r--src/jumper/SkJumper_misc.h4
-rw-r--r--src/jumper/SkJumper_stages.cpp346
4 files changed, 2007 insertions, 2087 deletions
diff --git a/src/jumper/SkJumper_generated.S b/src/jumper/SkJumper_generated.S
index ac9aef2434..337703b096 100644
--- a/src/jumper/SkJumper_generated.S
+++ b/src/jumper/SkJumper_generated.S
@@ -6808,11 +6808,11 @@ _sk_evenly_spaced_gradient_vfp4:
.long 0xed2d8b10 // vpush {d8-d15}
.long 0xe24dd010 // sub sp, sp, #16
.long 0xe58d0008 // str r0, [sp, #8]
- .long 0xe2810004 // add r0, r1, #4
- .long 0xe58d000c // str r0, [sp, #12]
- .long 0xe1a0c001 // mov ip, r1
- .long 0xe49c7008 // ldr r7, [ip], #8
.long 0xf2600150 // vorr q8, q0, q0
+ .long 0xe5917000 // ldr r7, [r1]
+ .long 0xe5910004 // ldr r0, [r1, #4]
+ .long 0xe2811008 // add r1, r1, #8
+ .long 0xe58d000c // str r0, [sp, #12]
.long 0xe8974204 // ldm r7, {r2, r9, lr}
.long 0xe2422001 // sub r2, r2, #1
.long 0xe5970010 // ldr r0, [r7, #16]
@@ -6848,34 +6848,31 @@ _sk_evenly_spaced_gradient_vfp4:
.long 0xed90ca00 // vldr s24, [r0]
.long 0xe597001c // ldr r0, [r7, #28]
.long 0xe0806103 // add r6, r0, r3, lsl #2
+ .long 0xe0808102 // add r8, r0, r2, lsl #2
.long 0xe080a104 // add sl, r0, r4, lsl #2
.long 0xedd65a00 // vldr s11, [r6]
.long 0xe0806105 // add r6, r0, r5, lsl #2
.long 0xe58d6004 // str r6, [sp, #4]
- .long 0xe0806102 // add r6, r0, r2, lsl #2
- .long 0xe58d6000 // str r6, [sp]
.long 0xe5970018 // ldr r0, [r7, #24]
- .long 0xed9a5a00 // vldr s10, [sl]
- .long 0xe0808103 // add r8, r0, r3, lsl #2
+ .long 0xe5977014 // ldr r7, [r7, #20]
+ .long 0xe080c103 // add ip, r0, r3, lsl #2
.long 0xe0806104 // add r6, r0, r4, lsl #2
- .long 0xedd83a00 // vldr s7, [r8]
+ .long 0xed9a5a00 // vldr s10, [sl]
+ .long 0xeddc3a00 // vldr s7, [ip]
+ .long 0xedd84a00 // vldr s9, [r8]
.long 0xed963a00 // vldr s6, [r6]
.long 0xe0806102 // add r6, r0, r2, lsl #2
.long 0xe0800105 // add r0, r0, r5, lsl #2
.long 0xedd62a00 // vldr s5, [r6]
- .long 0xe5976014 // ldr r6, [r7, #20]
+ .long 0xe0876103 // add r6, r7, r3, lsl #2
+ .long 0xedd69a00 // vldr s19, [r6]
+ .long 0xe0876104 // add r6, r7, r4, lsl #2
.long 0xed902a00 // vldr s4, [r0]
- .long 0xe0867103 // add r7, r6, r3, lsl #2
- .long 0xe59d0000 // ldr r0, [sp]
- .long 0xedd79a00 // vldr s19, [r7]
- .long 0xe0867104 // add r7, r6, r4, lsl #2
- .long 0xedd04a00 // vldr s9, [r0]
- .long 0xed979a00 // vldr s18, [r7]
- .long 0xe08e7103 // add r7, lr, r3, lsl #2
+ .long 0xed969a00 // vldr s18, [r6]
+ .long 0xe08e6103 // add r6, lr, r3, lsl #2
.long 0xe0893103 // add r3, r9, r3, lsl #2
.long 0xe59d0004 // ldr r0, [sp, #4]
- .long 0xedd71a00 // vldr s3, [r7]
- .long 0xe08e7105 // add r7, lr, r5, lsl #2
+ .long 0xedd61a00 // vldr s3, [r6]
.long 0xedd3fa00 // vldr s31, [r3]
.long 0xe0893104 // add r3, r9, r4, lsl #2
.long 0xed904a00 // vldr s8, [r0]
@@ -6888,16 +6885,16 @@ _sk_evenly_spaced_gradient_vfp4:
.long 0xe0893105 // add r3, r9, r5, lsl #2
.long 0xe59d0008 // ldr r0, [sp, #8]
.long 0xed93ea00 // vldr s28, [r3]
- .long 0xe0863102 // add r3, r6, r2, lsl #2
+ .long 0xe0873102 // add r3, r7, r2, lsl #2
.long 0xedd38a00 // vldr s17, [r3]
- .long 0xe0863105 // add r3, r6, r5, lsl #2
+ .long 0xe0873105 // add r3, r7, r5, lsl #2
+ .long 0xe08e7105 // add r7, lr, r5, lsl #2
.long 0xed938a00 // vldr s16, [r3]
.long 0xe08e3104 // add r3, lr, r4, lsl #2
.long 0xf2008cde // vfma.f32 q4, q8, q7
.long 0xed931a00 // vldr s2, [r3]
.long 0xe08e3102 // add r3, lr, r2, lsl #2
- .long 0xe5912004 // ldr r2, [r1, #4]
- .long 0xe1a0100c // mov r1, ip
+ .long 0xe59d200c // ldr r2, [sp, #12]
.long 0xedd30a00 // vldr s1, [r3]
.long 0xe08b3105 // add r3, fp, r5, lsl #2
.long 0xed936a00 // vldr s12, [r3]
@@ -6910,7 +6907,6 @@ _sk_evenly_spaced_gradient_vfp4:
.long 0xe28dd004 // add sp, sp, #4
.long 0xe8bd4ff0 // pop {r4, r5, r6, r7, r8, r9, sl, fp, lr}
.long 0xe12fff12 // bx r2
- .long 0xe320f000 // nop {0}
HIDDEN _sk_gauss_a_to_rgba_vfp4
.globl _sk_gauss_a_to_rgba_vfp4
@@ -6964,110 +6960,107 @@ _sk_gradient_vfp4:
.long 0xe92d4ff0 // push {r4, r5, r6, r7, r8, r9, sl, fp, lr}
.long 0xe24dd004 // sub sp, sp, #4
.long 0xed2d8b10 // vpush {d8-d15}
- .long 0xe24dd008 // sub sp, sp, #8
- .long 0xe2812004 // add r2, r1, #4
- .long 0xe58d2004 // str r2, [sp, #4]
- .long 0xe5913000 // ldr r3, [r1]
+ .long 0xe5912000 // ldr r2, [r1]
.long 0xf2606150 // vorr q11, q0, q0
.long 0xf2c02050 // vmov.i32 q9, #0
.long 0xf2c00050 // vmov.i32 q8, #0
- .long 0xe5931000 // ldr r1, [r3]
- .long 0xe3510002 // cmp r1, #2
- .long 0x3a00000a // bcc 62e8 <sk_gradient_vfp4+0x60>
- .long 0xe5932024 // ldr r2, [r3, #36]
+ .long 0xe5923000 // ldr r3, [r2]
+ .long 0xe3530002 // cmp r3, #2
+ .long 0x3a00000a // bcc 62cc <sk_gradient_vfp4+0x54>
+ .long 0xe5927024 // ldr r7, [r2, #36]
.long 0xf2c04051 // vmov.i32 q10, #1
.long 0xf2c00050 // vmov.i32 q8, #0
- .long 0xe2411001 // sub r1, r1, #1
- .long 0xe2822004 // add r2, r2, #4
- .long 0xf4e28cbd // vld1.32 {d24[]-d25[]}, [r2 :32]!
- .long 0xe2511001 // subs r1, r1, #1
+ .long 0xe2433001 // sub r3, r3, #1
+ .long 0xe2877004 // add r7, r7, #4
+ .long 0xf4e78cbd // vld1.32 {d24[]-d25[]}, [r7 :32]!
+ .long 0xe2533001 // subs r3, r3, #1
.long 0xf3468ee8 // vcge.f32 q12, q11, q12
.long 0xf35481f2 // vbsl q12, q10, q9
.long 0xf26008e8 // vadd.i32 q8, q8, q12
- .long 0x1afffff9 // bne 62d0 <sk_gradient_vfp4+0x48>
- .long 0xee317b90 // vmov.32 r7, d17[1]
- .long 0xe9934400 // ldmib r3, {sl, lr}
- .long 0xee111b90 // vmov.32 r1, d17[0]
- .long 0xe5935010 // ldr r5, [r3, #16]
- .long 0xe593c020 // ldr ip, [r3, #32]
- .long 0xe593600c // ldr r6, [r3, #12]
- .long 0xe593b01c // ldr fp, [r3, #28]
- .long 0xe0852107 // add r2, r5, r7, lsl #2
- .long 0xedd2ba00 // vldr s23, [r2]
- .long 0xe0852101 // add r2, r5, r1, lsl #2
- .long 0xed92ba00 // vldr s22, [r2]
- .long 0xee302b90 // vmov.32 r2, d16[1]
- .long 0xe0854102 // add r4, r5, r2, lsl #2
- .long 0xedd4aa00 // vldr s21, [r4]
- .long 0xee104b90 // vmov.32 r4, d16[0]
- .long 0xe0855104 // add r5, r5, r4, lsl #2
- .long 0xed95aa00 // vldr s20, [r5]
- .long 0xe08c5107 // add r5, ip, r7, lsl #2
- .long 0xedd57a00 // vldr s15, [r5]
- .long 0xe08c5101 // add r5, ip, r1, lsl #2
- .long 0xed957a00 // vldr s14, [r5]
- .long 0xe0865107 // add r5, r6, r7, lsl #2
- .long 0xedd5da00 // vldr s27, [r5]
- .long 0xe0865101 // add r5, r6, r1, lsl #2
- .long 0xed95da00 // vldr s26, [r5]
- .long 0xe0865102 // add r5, r6, r2, lsl #2
- .long 0xedd5ca00 // vldr s25, [r5]
- .long 0xe0865104 // add r5, r6, r4, lsl #2
- .long 0xed95ca00 // vldr s24, [r5]
- .long 0xe08b5107 // add r5, fp, r7, lsl #2
- .long 0xedd55a00 // vldr s11, [r5]
- .long 0xe5935018 // ldr r5, [r3, #24]
- .long 0xe5933014 // ldr r3, [r3, #20]
- .long 0xe0856107 // add r6, r5, r7, lsl #2
- .long 0xe0858104 // add r8, r5, r4, lsl #2
- .long 0xe0859102 // add r9, r5, r2, lsl #2
- .long 0xedd63a00 // vldr s7, [r6]
- .long 0xe0856101 // add r6, r5, r1, lsl #2
- .long 0xe08e5107 // add r5, lr, r7, lsl #2
- .long 0xed963a00 // vldr s6, [r6]
- .long 0xe08a6101 // add r6, sl, r1, lsl #2
- .long 0xedd5fa00 // vldr s31, [r5]
- .long 0xe08e5101 // add r5, lr, r1, lsl #2
- .long 0xedd92a00 // vldr s5, [r9]
- .long 0xed95fa00 // vldr s30, [r5]
- .long 0xe0835107 // add r5, r3, r7, lsl #2
- .long 0xed982a00 // vldr s4, [r8]
- .long 0xedd59a00 // vldr s19, [r5]
- .long 0xe0835101 // add r5, r3, r1, lsl #2
- .long 0xe08b1101 // add r1, fp, r1, lsl #2
- .long 0xed959a00 // vldr s18, [r5]
- .long 0xe0835102 // add r5, r3, r2, lsl #2
- .long 0xe0833104 // add r3, r3, r4, lsl #2
- .long 0xed915a00 // vldr s10, [r1]
- .long 0xedd58a00 // vldr s17, [r5]
- .long 0xe08a5107 // add r5, sl, r7, lsl #2
- .long 0xe08e7104 // add r7, lr, r4, lsl #2
- .long 0xe08c1102 // add r1, ip, r2, lsl #2
- .long 0xedd51a00 // vldr s3, [r5]
- .long 0xe08e5102 // add r5, lr, r2, lsl #2
- .long 0xed938a00 // vldr s16, [r3]
- .long 0xe08c3104 // add r3, ip, r4, lsl #2
+ .long 0x1afffff9 // bne 62b4 <sk_gradient_vfp4+0x3c>
+ .long 0xee314b90 // vmov.32 r4, d17[1]
+ .long 0xe5926010 // ldr r6, [r2, #16]
+ .long 0xee11cb90 // vmov.32 ip, d17[0]
+ .long 0xe592e020 // ldr lr, [r2, #32]
+ .long 0xe592700c // ldr r7, [r2, #12]
+ .long 0xe592901c // ldr r9, [r2, #28]
+ .long 0xe5928008 // ldr r8, [r2, #8]
+ .long 0xe592b004 // ldr fp, [r2, #4]
+ .long 0xe0863104 // add r3, r6, r4, lsl #2
+ .long 0xedd3ba00 // vldr s23, [r3]
+ .long 0xe086310c // add r3, r6, ip, lsl #2
+ .long 0xed93ba00 // vldr s22, [r3]
+ .long 0xee303b90 // vmov.32 r3, d16[1]
+ .long 0xe0865103 // add r5, r6, r3, lsl #2
+ .long 0xedd5aa00 // vldr s21, [r5]
+ .long 0xee105b90 // vmov.32 r5, d16[0]
+ .long 0xe0866105 // add r6, r6, r5, lsl #2
+ .long 0xed96aa00 // vldr s20, [r6]
+ .long 0xe08e6104 // add r6, lr, r4, lsl #2
+ .long 0xedd67a00 // vldr s15, [r6]
+ .long 0xe08e610c // add r6, lr, ip, lsl #2
+ .long 0xed967a00 // vldr s14, [r6]
+ .long 0xe0876104 // add r6, r7, r4, lsl #2
+ .long 0xedd6da00 // vldr s27, [r6]
+ .long 0xe087610c // add r6, r7, ip, lsl #2
+ .long 0xed96da00 // vldr s26, [r6]
+ .long 0xe0876103 // add r6, r7, r3, lsl #2
+ .long 0xedd6ca00 // vldr s25, [r6]
+ .long 0xe0876105 // add r6, r7, r5, lsl #2
+ .long 0xed96ca00 // vldr s24, [r6]
+ .long 0xe0896104 // add r6, r9, r4, lsl #2
+ .long 0xedd65a00 // vldr s11, [r6]
+ .long 0xe5926018 // ldr r6, [r2, #24]
+ .long 0xe5922014 // ldr r2, [r2, #20]
+ .long 0xe0867104 // add r7, r6, r4, lsl #2
+ .long 0xe086a103 // add sl, r6, r3, lsl #2
+ .long 0xedd73a00 // vldr s7, [r7]
+ .long 0xe086710c // add r7, r6, ip, lsl #2
+ .long 0xed973a00 // vldr s6, [r7]
+ .long 0xe0867105 // add r7, r6, r5, lsl #2
+ .long 0xe0886104 // add r6, r8, r4, lsl #2
+ .long 0xedda2a00 // vldr s5, [sl]
+ .long 0xedd6fa00 // vldr s31, [r6]
+ .long 0xe088610c // add r6, r8, ip, lsl #2
+ .long 0xed972a00 // vldr s4, [r7]
+ .long 0xe089710c // add r7, r9, ip, lsl #2
+ .long 0xed96fa00 // vldr s30, [r6]
+ .long 0xe0826104 // add r6, r2, r4, lsl #2
+ .long 0xe08b4104 // add r4, fp, r4, lsl #2
+ .long 0xed975a00 // vldr s10, [r7]
+ .long 0xedd69a00 // vldr s19, [r6]
+ .long 0xe082610c // add r6, r2, ip, lsl #2
+ .long 0xedd41a00 // vldr s3, [r4]
+ .long 0xe0884103 // add r4, r8, r3, lsl #2
+ .long 0xed969a00 // vldr s18, [r6]
+ .long 0xe0826103 // add r6, r2, r3, lsl #2
+ .long 0xe0822105 // add r2, r2, r5, lsl #2
+ .long 0xedd4ea00 // vldr s29, [r4]
+ .long 0xedd68a00 // vldr s17, [r6]
+ .long 0xe08b610c // add r6, fp, ip, lsl #2
+ .long 0xe0894105 // add r4, r9, r5, lsl #2
.long 0xed961a00 // vldr s2, [r6]
- .long 0xe08a6102 // add r6, sl, r2, lsl #2
- .long 0xedd5ea00 // vldr s29, [r5]
- .long 0xe08b5104 // add r5, fp, r4, lsl #2
+ .long 0xe08b6103 // add r6, fp, r3, lsl #2
+ .long 0xed928a00 // vldr s16, [r2]
+ .long 0xe08e2105 // add r2, lr, r5, lsl #2
.long 0xedd60a00 // vldr s1, [r6]
- .long 0xe08a6104 // add r6, sl, r4, lsl #2
- .long 0xed97ea00 // vldr s28, [r7]
- .long 0xe08b7102 // add r7, fp, r2, lsl #2
+ .long 0xe08b6105 // add r6, fp, r5, lsl #2
+ .long 0xe0885105 // add r5, r8, r5, lsl #2
.long 0xed960a00 // vldr s0, [r6]
- .long 0xedd16a00 // vldr s13, [r1]
- .long 0xf2062cde // vfma.f32 q1, q11, q7
- .long 0xedd74a00 // vldr s9, [r7]
+ .long 0xed95ea00 // vldr s28, [r5]
+ .long 0xe0895103 // add r5, r9, r3, lsl #2
.long 0xf2068cd0 // vfma.f32 q4, q11, q0
- .long 0xe59d1004 // ldr r1, [sp, #4]
- .long 0xed954a00 // vldr s8, [r5]
- .long 0xed936a00 // vldr s12, [r3]
+ .long 0xe08e3103 // add r3, lr, r3, lsl #2
+ .long 0xedd54a00 // vldr s9, [r5]
+ .long 0xedd36a00 // vldr s13, [r3]
+ .long 0xf2062cde // vfma.f32 q1, q11, q7
+ .long 0xed944a00 // vldr s8, [r4]
+ .long 0xed926a00 // vldr s12, [r2]
+ .long 0xe5912004 // ldr r2, [r1, #4]
.long 0xf2064cdc // vfma.f32 q2, q11, q6
- .long 0xe4912004 // ldr r2, [r1], #4
+ .long 0xe2811008 // add r1, r1, #8
.long 0xf2066cda // vfma.f32 q3, q11, q5
.long 0xf2280158 // vorr q0, q4, q4
- .long 0xe28dd008 // add sp, sp, #8
.long 0xecbd8b10 // vpop {d8-d15}
.long 0xe28dd004 // add sp, sp, #4
.long 0xe8bd4ff0 // pop {r4, r5, r6, r7, r8, r9, sl, fp, lr}
@@ -7079,31 +7072,30 @@ FUNCTION(_sk_evenly_spaced_2_stop_gradient_vfp4)
_sk_evenly_spaced_2_stop_gradient_vfp4:
.long 0xe92d4010 // push {r4, lr}
.long 0xe8911008 // ldm r1, {r3, ip}
- .long 0xe3a0e014 // mov lr, #20
+ .long 0xe3a0e01c // mov lr, #28
.long 0xe2811008 // add r1, r1, #8
- .long 0xe2832004 // add r2, r3, #4
+ .long 0xe283200c // add r2, r3, #12
.long 0xe1a04003 // mov r4, r3
.long 0xf4e24cbf // vld1.32 {d20[]-d21[]}, [r2 :32]
- .long 0xe283200c // add r2, r3, #12
- .long 0xf4e26cbf // vld1.32 {d22[]-d23[]}, [r2 :32]
.long 0xe2832008 // add r2, r3, #8
+ .long 0xf4e26cbf // vld1.32 {d22[]-d23[]}, [r2 :32]
+ .long 0xe2832004 // add r2, r3, #4
.long 0xf4e28cbf // vld1.32 {d24[]-d25[]}, [r2 :32]
.long 0xe2832010 // add r2, r3, #16
.long 0xf4e42cbe // vld1.32 {d18[]-d19[]}, [r4 :32], lr
.long 0xf4e20cbf // vld1.32 {d16[]-d17[]}, [r2 :32]
- .long 0xe2832018 // add r2, r3, #24
+ .long 0xe2832014 // add r2, r3, #20
.long 0xf2400c72 // vfma.f32 q8, q0, q9
+ .long 0xf4a22cbf // vld1.32 {d2[]-d3[]}, [r2 :32]
+ .long 0xe2832018 // add r2, r3, #24
+ .long 0xf2002c78 // vfma.f32 q1, q0, q12
.long 0xf4a24cbf // vld1.32 {d4[]-d5[]}, [r2 :32]
- .long 0xe283201c // add r2, r3, #28
- .long 0xf2004c78 // vfma.f32 q2, q0, q12
- .long 0xf4a26cbf // vld1.32 {d6[]-d7[]}, [r2 :32]
- .long 0xf2006c76 // vfma.f32 q3, q0, q11
- .long 0xf4a42cbf // vld1.32 {d2[]-d3[]}, [r4 :32]
- .long 0xf2002c74 // vfma.f32 q1, q0, q10
+ .long 0xf2004c76 // vfma.f32 q2, q0, q11
+ .long 0xf4a46cbf // vld1.32 {d6[]-d7[]}, [r4 :32]
+ .long 0xf2006c74 // vfma.f32 q3, q0, q10
.long 0xf22001f0 // vorr q0, q8, q8
.long 0xe8bd4010 // pop {r4, lr}
.long 0xe12fff1c // bx ip
- .long 0xe320f000 // nop {0}
HIDDEN _sk_xy_to_unit_angle_vfp4
.globl _sk_xy_to_unit_angle_vfp4
@@ -7815,13 +7807,11 @@ FUNCTION(_sk_clut_3D_vfp4)
_sk_clut_3D_vfp4:
.long 0xe92d4830 // push {r4, r5, fp, lr}
.long 0xed2d8b10 // vpush {d8-d15}
- .long 0xe24dd0b0 // sub sp, sp, #176
+ .long 0xe24dd0a0 // sub sp, sp, #160
.long 0xe28de070 // add lr, sp, #112
- .long 0xe2812004 // add r2, r1, #4
- .long 0xe1a0c001 // mov ip, r1
.long 0xec8e6b04 // vstmia lr, {d6-d7}
- .long 0xe58d20ac // str r2, [sp, #172]
- .long 0xe49c2008 // ldr r2, [ip], #8
+ .long 0xe8911004 // ldm r1, {r2, ip}
+ .long 0xe2811008 // add r1, r1, #8
.long 0xe8924008 // ldm r2, {r3, lr}
.long 0xe5924008 // ldr r4, [r2, #8]
.long 0xe592200c // ldr r2, [r2, #12]
@@ -8131,7 +8121,7 @@ _sk_clut_3D_vfp4:
.long 0xe0835105 // add r5, r3, r5, lsl #2
.long 0xedd55a00 // vldr s11, [r5]
.long 0xee325b90 // vmov.32 r5, d18[1]
- .long 0xea000004 // b 7308 <sk_clut_3D_vfp4+0x510>
+ .long 0xea000004 // b 72e0 <sk_clut_3D_vfp4+0x508>
.long 0xe320f000 // nop {0}
.long 0x3f7ff972 // .word 0x3f7ff972
.long 0x3f7ff972 // .word 0x3f7ff972
@@ -8299,8 +8289,6 @@ _sk_clut_3D_vfp4:
.long 0xe28de090 // add lr, sp, #144
.long 0xed92ea00 // vldr s28, [r2]
.long 0xf3fb2662 // vcvt.f32.s32 q9, q9
- .long 0xe5912004 // ldr r2, [r1, #4]
- .long 0xe1a0100c // mov r1, ip
.long 0xf26e0d44 // vsub.f32 q8, q7, q2
.long 0xf2004cf4 // vfma.f32 q2, q8, q10
.long 0xf2684d42 // vsub.f32 q10, q4, q1
@@ -8316,10 +8304,10 @@ _sk_clut_3D_vfp4:
.long 0xf2020cf0 // vfma.f32 q0, q9, q8
.long 0xf206ccf0 // vfma.f32 q6, q11, q8
.long 0xf22c415c // vorr q2, q6, q6
- .long 0xe28dd0b0 // add sp, sp, #176
+ .long 0xe28dd0a0 // add sp, sp, #160
.long 0xecbd8b10 // vpop {d8-d15}
.long 0xe8bd4830 // pop {r4, r5, fp, lr}
- .long 0xe12fff12 // bx r2
+ .long 0xe12fff1c // bx ip
.long 0xe320f000 // nop {0}
HIDDEN _sk_clut_4D_vfp4
@@ -8329,11 +8317,9 @@ _sk_clut_4D_vfp4:
.long 0xe92d41f0 // push {r4, r5, r6, r7, r8, lr}
.long 0xed2d8b10 // vpush {d8-d15}
.long 0xe24ddf6a // sub sp, sp, #424
- .long 0xe2812004 // add r2, r1, #4
- .long 0xe58d21a4 // str r2, [sp, #420]
- .long 0xe1a0c001 // mov ip, r1
+ .long 0xe8911004 // ldm r1, {r2, ip}
.long 0xf2c0c052 // vmov.i32 q14, #2
- .long 0xe49c2008 // ldr r2, [ip], #8
+ .long 0xe2811008 // add r1, r1, #8
.long 0xe8924008 // ldm r2, {r3, lr}
.long 0xe592500c // ldr r5, [r2, #12]
.long 0xe5924008 // ldr r4, [r2, #8]
@@ -8652,7 +8638,7 @@ _sk_clut_4D_vfp4:
.long 0xf2802051 // vmov.i32 q1, #1
.long 0xf22e29e0 // vmla.i32 q1, q15, q8
.long 0xedd20a00 // vldr s1, [r2]
- .long 0xea000004 // b 7b18 <sk_clut_4D_vfp4+0x530>
+ .long 0xea000004 // b 7ae0 <sk_clut_4D_vfp4+0x528>
.long 0xe320f000 // nop {0}
.long 0x3f7ff972 // .word 0x3f7ff972
.long 0x3f7ff972 // .word 0x3f7ff972
@@ -9357,12 +9343,10 @@ _sk_clut_4D_vfp4:
.long 0xe28de0e0 // add lr, sp, #224
.long 0xf2600de2 // vsub.f32 q8, q8, q9
.long 0xecde8b04 // vldmia lr, {d24-d25}
- .long 0xe28f203c // add r2, pc, #60
+ .long 0xe28f2034 // add r2, pc, #52
.long 0xf26c4d6a // vsub.f32 q10, q6, q13
.long 0xf4226acf // vld1.64 {d6-d7}, [r2]
.long 0xf2642d40 // vsub.f32 q9, q2, q0
- .long 0xe5912004 // ldr r2, [r1, #4]
- .long 0xe1a0100c // mov r1, ip
.long 0xf26a6d68 // vsub.f32 q11, q5, q12
.long 0xf244acf0 // vfma.f32 q13, q10, q8
.long 0xf2020cf0 // vfma.f32 q0, q9, q8
@@ -9372,7 +9356,7 @@ _sk_clut_4D_vfp4:
.long 0xe28ddf6a // add sp, sp, #424
.long 0xecbd8b10 // vpop {d8-d15}
.long 0xe8bd41f0 // pop {r4, r5, r6, r7, r8, lr}
- .long 0xe12fff12 // bx r2
+ .long 0xe12fff1c // bx ip
.long 0xe320f000 // nop {0}
.long 0x3f800000 // .word 0x3f800000
.long 0x3f800000 // .word 0x3f800000
@@ -54257,11 +54241,11 @@ _sk_seed_shader_sse2:
.byte 102,15,110,2 // movd (%edx),%xmm0
.byte 102,15,112,192,0 // pshufd $0x0,%xmm0,%xmm0
.byte 15,91,192 // cvtdq2ps %xmm0,%xmm0
- .byte 15,88,128,247,203,0,0 // addps 0xcbf7(%eax),%xmm0
+ .byte 15,88,128,215,203,0,0 // addps 0xcbd7(%eax),%xmm0
.byte 102,15,110,74,4 // movd 0x4(%edx),%xmm1
.byte 102,15,112,201,0 // pshufd $0x0,%xmm1,%xmm1
.byte 15,91,201 // cvtdq2ps %xmm1,%xmm1
- .byte 15,88,136,7,204,0,0 // addps 0xcc07(%eax),%xmm1
+ .byte 15,88,136,231,203,0,0 // addps 0xcbe7(%eax),%xmm1
.byte 141,113,4 // lea 0x4(%ecx),%esi
.byte 15,87,210 // xorps %xmm2,%xmm2
.byte 15,41,82,64 // movaps %xmm2,0x40(%edx)
@@ -54269,7 +54253,7 @@ _sk_seed_shader_sse2:
.byte 15,41,82,32 // movaps %xmm2,0x20(%edx)
.byte 15,41,82,16 // movaps %xmm2,0x10(%edx)
.byte 131,236,8 // sub $0x8,%esp
- .byte 15,40,144,23,204,0,0 // movaps 0xcc17(%eax),%xmm2
+ .byte 15,40,144,247,203,0,0 // movaps 0xcbf7(%eax),%xmm2
.byte 15,87,219 // xorps %xmm3,%xmm3
.byte 86 // push %esi
.byte 82 // push %edx
@@ -54296,15 +54280,15 @@ _sk_dither_sse2:
.byte 139,69,8 // mov 0x8(%ebp),%eax
.byte 102,15,110,32 // movd (%eax),%xmm4
.byte 102,15,112,228,0 // pshufd $0x0,%xmm4,%xmm4
- .byte 102,15,254,161,178,203,0,0 // paddd 0xcbb2(%ecx),%xmm4
+ .byte 102,15,254,161,146,203,0,0 // paddd 0xcb92(%ecx),%xmm4
.byte 102,15,110,104,4 // movd 0x4(%eax),%xmm5
.byte 102,15,112,253,0 // pshufd $0x0,%xmm5,%xmm7
.byte 102,15,239,252 // pxor %xmm4,%xmm7
- .byte 102,15,111,177,194,203,0,0 // movdqa 0xcbc2(%ecx),%xmm6
+ .byte 102,15,111,177,162,203,0,0 // movdqa 0xcba2(%ecx),%xmm6
.byte 102,15,111,207 // movdqa %xmm7,%xmm1
.byte 102,15,219,206 // pand %xmm6,%xmm1
.byte 102,15,114,241,5 // pslld $0x5,%xmm1
- .byte 102,15,111,129,226,203,0,0 // movdqa 0xcbe2(%ecx),%xmm0
+ .byte 102,15,111,129,194,203,0,0 // movdqa 0xcbc2(%ecx),%xmm0
.byte 102,15,111,239 // movdqa %xmm7,%xmm5
.byte 102,15,219,232 // pand %xmm0,%xmm5
.byte 102,15,114,245,2 // pslld $0x2,%xmm5
@@ -54314,7 +54298,7 @@ _sk_dither_sse2:
.byte 102,15,219,196 // pand %xmm4,%xmm0
.byte 102,15,254,192 // paddd %xmm0,%xmm0
.byte 102,15,235,198 // por %xmm6,%xmm0
- .byte 102,15,111,137,210,203,0,0 // movdqa 0xcbd2(%ecx),%xmm1
+ .byte 102,15,111,137,178,203,0,0 // movdqa 0xcbb2(%ecx),%xmm1
.byte 102,15,219,249 // pand %xmm1,%xmm7
.byte 102,15,219,225 // pand %xmm1,%xmm4
.byte 102,15,114,212,2 // psrld $0x2,%xmm4
@@ -54325,8 +54309,8 @@ _sk_dither_sse2:
.byte 102,15,114,215,1 // psrld $0x1,%xmm7
.byte 102,15,235,231 // por %xmm7,%xmm4
.byte 15,91,196 // cvtdq2ps %xmm4,%xmm0
- .byte 15,89,129,242,203,0,0 // mulps 0xcbf2(%ecx),%xmm0
- .byte 15,88,129,2,204,0,0 // addps 0xcc02(%ecx),%xmm0
+ .byte 15,89,129,210,203,0,0 // mulps 0xcbd2(%ecx),%xmm0
+ .byte 15,88,129,226,203,0,0 // addps 0xcbe2(%ecx),%xmm0
.byte 243,15,16,14 // movss (%esi),%xmm1
.byte 15,198,201,0 // shufps $0x0,%xmm1,%xmm1
.byte 15,89,200 // mulps %xmm0,%xmm1
@@ -54394,7 +54378,7 @@ _sk_black_color_sse2:
.byte 139,77,12 // mov 0xc(%ebp),%ecx
.byte 141,81,4 // lea 0x4(%ecx),%edx
.byte 131,236,8 // sub $0x8,%esp
- .byte 15,40,152,102,202,0,0 // movaps 0xca66(%eax),%xmm3
+ .byte 15,40,152,70,202,0,0 // movaps 0xca46(%eax),%xmm3
.byte 15,87,192 // xorps %xmm0,%xmm0
.byte 15,87,201 // xorps %xmm1,%xmm1
.byte 15,87,210 // xorps %xmm2,%xmm2
@@ -54417,7 +54401,7 @@ _sk_white_color_sse2:
.byte 139,77,12 // mov 0xc(%ebp),%ecx
.byte 141,81,4 // lea 0x4(%ecx),%edx
.byte 131,236,8 // sub $0x8,%esp
- .byte 15,40,128,54,202,0,0 // movaps 0xca36(%eax),%xmm0
+ .byte 15,40,128,22,202,0,0 // movaps 0xca16(%eax),%xmm0
.byte 15,40,200 // movaps %xmm0,%xmm1
.byte 15,40,208 // movaps %xmm0,%xmm2
.byte 15,40,216 // movaps %xmm0,%xmm3
@@ -54507,7 +54491,7 @@ _sk_srcatop_sse2:
.byte 139,77,8 // mov 0x8(%ebp),%ecx
.byte 15,40,97,64 // movaps 0x40(%ecx),%xmm4
.byte 15,89,196 // mulps %xmm4,%xmm0
- .byte 15,40,170,135,201,0,0 // movaps 0xc987(%edx),%xmm5
+ .byte 15,40,170,103,201,0,0 // movaps 0xc967(%edx),%xmm5
.byte 15,92,235 // subps %xmm3,%xmm5
.byte 15,40,113,16 // movaps 0x10(%ecx),%xmm6
.byte 15,89,245 // mulps %xmm5,%xmm6
@@ -54546,7 +54530,7 @@ _sk_dstatop_sse2:
.byte 15,40,105,64 // movaps 0x40(%ecx),%xmm5
.byte 15,40,113,16 // movaps 0x10(%ecx),%xmm6
.byte 15,89,243 // mulps %xmm3,%xmm6
- .byte 15,40,162,40,201,0,0 // movaps 0xc928(%edx),%xmm4
+ .byte 15,40,162,8,201,0,0 // movaps 0xc908(%edx),%xmm4
.byte 15,92,229 // subps %xmm5,%xmm4
.byte 15,89,196 // mulps %xmm4,%xmm0
.byte 15,88,198 // addps %xmm6,%xmm0
@@ -54630,7 +54614,7 @@ _sk_srcout_sse2:
.byte 88 // pop %eax
.byte 139,77,12 // mov 0xc(%ebp),%ecx
.byte 139,85,8 // mov 0x8(%ebp),%edx
- .byte 15,40,160,103,200,0,0 // movaps 0xc867(%eax),%xmm4
+ .byte 15,40,160,71,200,0,0 // movaps 0xc847(%eax),%xmm4
.byte 15,92,98,64 // subps 0x40(%edx),%xmm4
.byte 15,89,196 // mulps %xmm4,%xmm0
.byte 15,89,204 // mulps %xmm4,%xmm1
@@ -54656,7 +54640,7 @@ _sk_dstout_sse2:
.byte 88 // pop %eax
.byte 139,77,12 // mov 0xc(%ebp),%ecx
.byte 139,85,8 // mov 0x8(%ebp),%edx
- .byte 15,40,160,47,200,0,0 // movaps 0xc82f(%eax),%xmm4
+ .byte 15,40,160,15,200,0,0 // movaps 0xc80f(%eax),%xmm4
.byte 15,92,227 // subps %xmm3,%xmm4
.byte 15,40,66,16 // movaps 0x10(%edx),%xmm0
.byte 15,89,196 // mulps %xmm4,%xmm0
@@ -54686,7 +54670,7 @@ _sk_srcover_sse2:
.byte 88 // pop %eax
.byte 139,77,12 // mov 0xc(%ebp),%ecx
.byte 139,85,8 // mov 0x8(%ebp),%edx
- .byte 15,40,160,232,199,0,0 // movaps 0xc7e8(%eax),%xmm4
+ .byte 15,40,160,200,199,0,0 // movaps 0xc7c8(%eax),%xmm4
.byte 15,92,227 // subps %xmm3,%xmm4
.byte 15,40,106,16 // movaps 0x10(%edx),%xmm5
.byte 15,89,236 // mulps %xmm4,%xmm5
@@ -54720,7 +54704,7 @@ _sk_dstover_sse2:
.byte 139,77,12 // mov 0xc(%ebp),%ecx
.byte 139,85,8 // mov 0x8(%ebp),%edx
.byte 15,40,106,64 // movaps 0x40(%edx),%xmm5
- .byte 15,40,160,152,199,0,0 // movaps 0xc798(%eax),%xmm4
+ .byte 15,40,160,120,199,0,0 // movaps 0xc778(%eax),%xmm4
.byte 15,92,229 // subps %xmm5,%xmm4
.byte 15,89,196 // mulps %xmm4,%xmm0
.byte 15,88,66,16 // addps 0x10(%edx),%xmm0
@@ -54776,7 +54760,7 @@ _sk_multiply_sse2:
.byte 139,69,8 // mov 0x8(%ebp),%eax
.byte 15,40,80,64 // movaps 0x40(%eax),%xmm2
.byte 15,41,85,200 // movaps %xmm2,-0x38(%ebp)
- .byte 15,40,129,25,199,0,0 // movaps 0xc719(%ecx),%xmm0
+ .byte 15,40,129,249,198,0,0 // movaps 0xc6f9(%ecx),%xmm0
.byte 15,40,240 // movaps %xmm0,%xmm6
.byte 15,92,242 // subps %xmm2,%xmm6
.byte 15,40,254 // movaps %xmm6,%xmm7
@@ -54836,7 +54820,7 @@ _sk_plus__sse2:
.byte 139,77,12 // mov 0xc(%ebp),%ecx
.byte 139,85,8 // mov 0x8(%ebp),%edx
.byte 15,88,66,16 // addps 0x10(%edx),%xmm0
- .byte 15,40,160,115,198,0,0 // movaps 0xc673(%eax),%xmm4
+ .byte 15,40,160,83,198,0,0 // movaps 0xc653(%eax),%xmm4
.byte 15,93,196 // minps %xmm4,%xmm0
.byte 15,88,74,32 // addps 0x20(%edx),%xmm1
.byte 15,93,204 // minps %xmm4,%xmm1
@@ -54908,7 +54892,7 @@ _sk_xor__sse2:
.byte 139,69,12 // mov 0xc(%ebp),%eax
.byte 139,77,8 // mov 0x8(%ebp),%ecx
.byte 15,40,105,64 // movaps 0x40(%ecx),%xmm5
- .byte 15,40,154,197,197,0,0 // movaps 0xc5c5(%edx),%xmm3
+ .byte 15,40,154,165,197,0,0 // movaps 0xc5a5(%edx),%xmm3
.byte 15,40,243 // movaps %xmm3,%xmm6
.byte 15,92,245 // subps %xmm5,%xmm6
.byte 15,89,198 // mulps %xmm6,%xmm0
@@ -54970,7 +54954,7 @@ _sk_darken_sse2:
.byte 15,89,203 // mulps %xmm3,%xmm1
.byte 15,95,209 // maxps %xmm1,%xmm2
.byte 15,92,234 // subps %xmm2,%xmm5
- .byte 15,40,138,93,197,0,0 // movaps 0xc55d(%edx),%xmm1
+ .byte 15,40,138,61,197,0,0 // movaps 0xc53d(%edx),%xmm1
.byte 15,92,203 // subps %xmm3,%xmm1
.byte 15,89,206 // mulps %xmm6,%xmm1
.byte 15,88,217 // addps %xmm1,%xmm3
@@ -55019,7 +55003,7 @@ _sk_lighten_sse2:
.byte 15,89,203 // mulps %xmm3,%xmm1
.byte 15,93,209 // minps %xmm1,%xmm2
.byte 15,92,234 // subps %xmm2,%xmm5
- .byte 15,40,138,221,196,0,0 // movaps 0xc4dd(%edx),%xmm1
+ .byte 15,40,138,189,196,0,0 // movaps 0xc4bd(%edx),%xmm1
.byte 15,92,203 // subps %xmm3,%xmm1
.byte 15,89,206 // mulps %xmm6,%xmm1
.byte 15,88,217 // addps %xmm1,%xmm3
@@ -55072,7 +55056,7 @@ _sk_difference_sse2:
.byte 15,93,214 // minps %xmm6,%xmm2
.byte 15,88,210 // addps %xmm2,%xmm2
.byte 15,92,226 // subps %xmm2,%xmm4
- .byte 15,40,146,90,196,0,0 // movaps 0xc45a(%edx),%xmm2
+ .byte 15,40,146,58,196,0,0 // movaps 0xc43a(%edx),%xmm2
.byte 15,92,211 // subps %xmm3,%xmm2
.byte 15,89,213 // mulps %xmm5,%xmm2
.byte 15,88,218 // addps %xmm2,%xmm3
@@ -55116,7 +55100,7 @@ _sk_exclusion_sse2:
.byte 15,89,202 // mulps %xmm2,%xmm1
.byte 15,88,201 // addps %xmm1,%xmm1
.byte 15,92,233 // subps %xmm1,%xmm5
- .byte 15,40,138,212,195,0,0 // movaps 0xc3d4(%edx),%xmm1
+ .byte 15,40,138,180,195,0,0 // movaps 0xc3b4(%edx),%xmm1
.byte 15,92,203 // subps %xmm3,%xmm1
.byte 15,89,73,64 // mulps 0x40(%ecx),%xmm1
.byte 15,88,217 // addps %xmm1,%xmm3
@@ -55157,7 +55141,7 @@ _sk_colorburn_sse2:
.byte 15,93,198 // minps %xmm6,%xmm0
.byte 15,40,233 // movaps %xmm1,%xmm5
.byte 15,92,232 // subps %xmm0,%xmm5
- .byte 15,40,177,85,195,0,0 // movaps 0xc355(%ecx),%xmm6
+ .byte 15,40,177,53,195,0,0 // movaps 0xc335(%ecx),%xmm6
.byte 15,40,198 // movaps %xmm6,%xmm0
.byte 15,92,193 // subps %xmm1,%xmm0
.byte 15,41,69,200 // movaps %xmm0,-0x38(%ebp)
@@ -55274,7 +55258,7 @@ _sk_colordodge_sse2:
.byte 89 // pop %ecx
.byte 139,69,8 // mov 0x8(%ebp),%eax
.byte 15,40,72,16 // movaps 0x10(%eax),%xmm1
- .byte 15,40,145,204,193,0,0 // movaps 0xc1cc(%ecx),%xmm2
+ .byte 15,40,145,172,193,0,0 // movaps 0xc1ac(%ecx),%xmm2
.byte 15,40,226 // movaps %xmm2,%xmm4
.byte 15,92,214 // subps %xmm6,%xmm2
.byte 15,40,250 // movaps %xmm2,%xmm7
@@ -55391,7 +55375,7 @@ _sk_hardlight_sse2:
.byte 89 // pop %ecx
.byte 139,69,8 // mov 0x8(%ebp),%eax
.byte 15,40,72,64 // movaps 0x40(%eax),%xmm1
- .byte 15,40,145,107,192,0,0 // movaps 0xc06b(%ecx),%xmm2
+ .byte 15,40,145,75,192,0,0 // movaps 0xc04b(%ecx),%xmm2
.byte 15,40,234 // movaps %xmm2,%xmm5
.byte 15,92,233 // subps %xmm1,%xmm5
.byte 15,40,225 // movaps %xmm1,%xmm4
@@ -55501,7 +55485,7 @@ _sk_overlay_sse2:
.byte 89 // pop %ecx
.byte 139,69,8 // mov 0x8(%ebp),%eax
.byte 15,40,80,64 // movaps 0x40(%eax),%xmm2
- .byte 15,40,161,32,191,0,0 // movaps 0xbf20(%ecx),%xmm4
+ .byte 15,40,161,0,191,0,0 // movaps 0xbf00(%ecx),%xmm4
.byte 15,40,244 // movaps %xmm4,%xmm6
.byte 15,92,242 // subps %xmm2,%xmm6
.byte 15,40,206 // movaps %xmm6,%xmm1
@@ -55629,17 +55613,17 @@ _sk_softlight_sse2:
.byte 232,0,0,0,0 // call f50 <_sk_softlight_sse2+0x52>
.byte 89 // pop %ecx
.byte 15,40,194 // movaps %xmm2,%xmm0
- .byte 15,40,137,0,190,0,0 // movaps 0xbe00(%ecx),%xmm1
+ .byte 15,40,137,224,189,0,0 // movaps 0xbde0(%ecx),%xmm1
.byte 15,41,141,104,255,255,255 // movaps %xmm1,-0x98(%ebp)
.byte 15,88,193 // addps %xmm1,%xmm0
.byte 15,89,198 // mulps %xmm6,%xmm0
- .byte 15,40,185,144,189,0,0 // movaps 0xbd90(%ecx),%xmm7
+ .byte 15,40,185,112,189,0,0 // movaps 0xbd70(%ecx),%xmm7
.byte 15,41,125,232 // movaps %xmm7,-0x18(%ebp)
.byte 15,92,250 // subps %xmm2,%xmm7
.byte 15,82,242 // rsqrtps %xmm2,%xmm6
.byte 15,83,206 // rcpps %xmm6,%xmm1
.byte 15,92,202 // subps %xmm2,%xmm1
- .byte 15,40,161,16,190,0,0 // movaps 0xbe10(%ecx),%xmm4
+ .byte 15,40,161,240,189,0,0 // movaps 0xbdf0(%ecx),%xmm4
.byte 15,41,101,152 // movaps %xmm4,-0x68(%ebp)
.byte 15,89,212 // mulps %xmm4,%xmm2
.byte 15,88,208 // addps %xmm0,%xmm2
@@ -55845,7 +55829,7 @@ _sk_hue_sse2:
.byte 15,40,226 // movaps %xmm2,%xmm4
.byte 15,40,72,64 // movaps 0x40(%eax),%xmm1
.byte 15,41,77,216 // movaps %xmm1,-0x28(%ebp)
- .byte 15,40,169,207,186,0,0 // movaps 0xbacf(%ecx),%xmm5
+ .byte 15,40,169,175,186,0,0 // movaps 0xbaaf(%ecx),%xmm5
.byte 15,92,233 // subps %xmm1,%xmm5
.byte 15,89,197 // mulps %xmm5,%xmm0
.byte 15,41,133,72,255,255,255 // movaps %xmm0,-0xb8(%ebp)
@@ -55878,17 +55862,17 @@ _sk_hue_sse2:
.byte 15,89,233 // mulps %xmm1,%xmm5
.byte 15,41,173,120,255,255,255 // movaps %xmm5,-0x88(%ebp)
.byte 15,89,193 // mulps %xmm1,%xmm0
- .byte 15,40,153,95,187,0,0 // movaps 0xbb5f(%ecx),%xmm3
+ .byte 15,40,153,63,187,0,0 // movaps 0xbb3f(%ecx),%xmm3
.byte 15,41,93,232 // movaps %xmm3,-0x18(%ebp)
.byte 15,40,117,152 // movaps -0x68(%ebp),%xmm6
.byte 15,40,206 // movaps %xmm6,%xmm1
.byte 15,89,203 // mulps %xmm3,%xmm1
- .byte 15,40,153,111,187,0,0 // movaps 0xbb6f(%ecx),%xmm3
+ .byte 15,40,153,79,187,0,0 // movaps 0xbb4f(%ecx),%xmm3
.byte 15,40,109,136 // movaps -0x78(%ebp),%xmm5
.byte 15,40,253 // movaps %xmm5,%xmm7
.byte 15,89,251 // mulps %xmm3,%xmm7
.byte 15,88,249 // addps %xmm1,%xmm7
- .byte 15,40,137,207,186,0,0 // movaps 0xbacf(%ecx),%xmm1
+ .byte 15,40,137,175,186,0,0 // movaps 0xbaaf(%ecx),%xmm1
.byte 15,92,77,184 // subps -0x48(%ebp),%xmm1
.byte 15,89,241 // mulps %xmm1,%xmm6
.byte 15,41,117,152 // movaps %xmm6,-0x68(%ebp)
@@ -55898,7 +55882,7 @@ _sk_hue_sse2:
.byte 15,40,77,200 // movaps -0x38(%ebp),%xmm1
.byte 15,89,241 // mulps %xmm1,%xmm6
.byte 15,41,117,168 // movaps %xmm6,-0x58(%ebp)
- .byte 15,40,169,127,187,0,0 // movaps 0xbb7f(%ecx),%xmm5
+ .byte 15,40,169,95,187,0,0 // movaps 0xbb5f(%ecx),%xmm5
.byte 15,89,205 // mulps %xmm5,%xmm1
.byte 15,88,207 // addps %xmm7,%xmm1
.byte 15,94,212 // divps %xmm4,%xmm2
@@ -56091,17 +56075,17 @@ _sk_saturation_sse2:
.byte 15,89,253 // mulps %xmm5,%xmm7
.byte 232,0,0,0,0 // call 1565 <_sk_saturation_sse2+0xb0>
.byte 89 // pop %ecx
- .byte 15,40,153,11,184,0,0 // movaps 0xb80b(%ecx),%xmm3
+ .byte 15,40,153,235,183,0,0 // movaps 0xb7eb(%ecx),%xmm3
.byte 15,41,157,88,255,255,255 // movaps %xmm3,-0xa8(%ebp)
.byte 15,40,77,184 // movaps -0x48(%ebp),%xmm1
.byte 15,40,193 // movaps %xmm1,%xmm0
.byte 15,89,195 // mulps %xmm3,%xmm0
- .byte 15,40,153,27,184,0,0 // movaps 0xb81b(%ecx),%xmm3
+ .byte 15,40,153,251,183,0,0 // movaps 0xb7fb(%ecx),%xmm3
.byte 15,41,93,232 // movaps %xmm3,-0x18(%ebp)
.byte 15,40,238 // movaps %xmm6,%xmm5
.byte 15,89,235 // mulps %xmm3,%xmm5
.byte 15,88,232 // addps %xmm0,%xmm5
- .byte 15,40,129,123,183,0,0 // movaps 0xb77b(%ecx),%xmm0
+ .byte 15,40,129,91,183,0,0 // movaps 0xb75b(%ecx),%xmm0
.byte 15,41,133,104,255,255,255 // movaps %xmm0,-0x98(%ebp)
.byte 15,92,69,216 // subps -0x28(%ebp),%xmm0
.byte 15,89,200 // mulps %xmm0,%xmm1
@@ -56113,7 +56097,7 @@ _sk_saturation_sse2:
.byte 15,89,200 // mulps %xmm0,%xmm1
.byte 15,41,141,120,255,255,255 // movaps %xmm1,-0x88(%ebp)
.byte 15,40,200 // movaps %xmm0,%xmm1
- .byte 15,40,129,43,184,0,0 // movaps 0xb82b(%ecx),%xmm0
+ .byte 15,40,129,11,184,0,0 // movaps 0xb80b(%ecx),%xmm0
.byte 15,89,200 // mulps %xmm0,%xmm1
.byte 15,88,205 // addps %xmm5,%xmm1
.byte 15,40,109,168 // movaps -0x58(%ebp),%xmm5
@@ -56272,16 +56256,16 @@ _sk_color_sse2:
.byte 139,69,8 // mov 0x8(%ebp),%eax
.byte 15,40,80,16 // movaps 0x10(%eax),%xmm2
.byte 15,40,72,32 // movaps 0x20(%eax),%xmm1
- .byte 15,40,177,176,181,0,0 // movaps 0xb5b0(%ecx),%xmm6
+ .byte 15,40,177,144,181,0,0 // movaps 0xb590(%ecx),%xmm6
.byte 15,41,117,216 // movaps %xmm6,-0x28(%ebp)
.byte 15,40,194 // movaps %xmm2,%xmm0
.byte 15,89,198 // mulps %xmm6,%xmm0
- .byte 15,40,153,192,181,0,0 // movaps 0xb5c0(%ecx),%xmm3
+ .byte 15,40,153,160,181,0,0 // movaps 0xb5a0(%ecx),%xmm3
.byte 15,41,93,184 // movaps %xmm3,-0x48(%ebp)
.byte 15,40,241 // movaps %xmm1,%xmm6
.byte 15,89,243 // mulps %xmm3,%xmm6
.byte 15,88,240 // addps %xmm0,%xmm6
- .byte 15,40,129,32,181,0,0 // movaps 0xb520(%ecx),%xmm0
+ .byte 15,40,129,0,181,0,0 // movaps 0xb500(%ecx),%xmm0
.byte 15,41,69,168 // movaps %xmm0,-0x58(%ebp)
.byte 15,92,69,200 // subps -0x38(%ebp),%xmm0
.byte 15,89,208 // mulps %xmm0,%xmm2
@@ -56291,7 +56275,7 @@ _sk_color_sse2:
.byte 15,40,80,48 // movaps 0x30(%eax),%xmm2
.byte 15,89,194 // mulps %xmm2,%xmm0
.byte 15,41,133,72,255,255,255 // movaps %xmm0,-0xb8(%ebp)
- .byte 15,40,137,208,181,0,0 // movaps 0xb5d0(%ecx),%xmm1
+ .byte 15,40,137,176,181,0,0 // movaps 0xb5b0(%ecx),%xmm1
.byte 15,89,209 // mulps %xmm1,%xmm2
.byte 15,88,214 // addps %xmm6,%xmm2
.byte 15,40,88,64 // movaps 0x40(%eax),%xmm3
@@ -56450,18 +56434,18 @@ _sk_luminosity_sse2:
.byte 232,0,0,0,0 // call 1a23 <_sk_luminosity_sse2+0x11>
.byte 89 // pop %ecx
.byte 139,69,8 // mov 0x8(%ebp),%eax
- .byte 15,40,161,77,179,0,0 // movaps 0xb34d(%ecx),%xmm4
+ .byte 15,40,161,45,179,0,0 // movaps 0xb32d(%ecx),%xmm4
.byte 15,41,101,232 // movaps %xmm4,-0x18(%ebp)
.byte 15,40,208 // movaps %xmm0,%xmm2
.byte 15,89,212 // mulps %xmm4,%xmm2
- .byte 15,40,161,93,179,0,0 // movaps 0xb35d(%ecx),%xmm4
+ .byte 15,40,161,61,179,0,0 // movaps 0xb33d(%ecx),%xmm4
.byte 15,41,101,216 // movaps %xmm4,-0x28(%ebp)
.byte 15,40,233 // movaps %xmm1,%xmm5
.byte 15,89,236 // mulps %xmm4,%xmm5
.byte 15,88,234 // addps %xmm2,%xmm5
.byte 15,40,80,64 // movaps 0x40(%eax),%xmm2
.byte 15,41,85,184 // movaps %xmm2,-0x48(%ebp)
- .byte 15,40,161,189,178,0,0 // movaps 0xb2bd(%ecx),%xmm4
+ .byte 15,40,161,157,178,0,0 // movaps 0xb29d(%ecx),%xmm4
.byte 15,40,252 // movaps %xmm4,%xmm7
.byte 15,92,250 // subps %xmm2,%xmm7
.byte 15,89,199 // mulps %xmm7,%xmm0
@@ -56471,7 +56455,7 @@ _sk_luminosity_sse2:
.byte 15,89,254 // mulps %xmm6,%xmm7
.byte 15,41,189,104,255,255,255 // movaps %xmm7,-0x98(%ebp)
.byte 15,40,214 // movaps %xmm6,%xmm2
- .byte 15,40,137,109,179,0,0 // movaps 0xb36d(%ecx),%xmm1
+ .byte 15,40,137,77,179,0,0 // movaps 0xb34d(%ecx),%xmm1
.byte 15,89,209 // mulps %xmm1,%xmm2
.byte 15,88,213 // addps %xmm5,%xmm2
.byte 15,40,104,16 // movaps 0x10(%eax),%xmm5
@@ -56647,7 +56631,7 @@ _sk_srcover_rgba_8888_sse2:
.byte 139,49 // mov (%ecx),%esi
.byte 15,133,224,0,0,0 // jne 1d90 <_sk_srcover_rgba_8888_sse2+0x119>
.byte 243,15,111,20,178 // movdqu (%edx,%esi,4),%xmm2
- .byte 102,15,111,167,18,177,0,0 // movdqa 0xb112(%edi),%xmm4
+ .byte 102,15,111,167,242,176,0,0 // movdqa 0xb0f2(%edi),%xmm4
.byte 102,15,111,234 // movdqa %xmm2,%xmm5
.byte 102,15,219,236 // pand %xmm4,%xmm5
.byte 102,15,111,242 // movdqa %xmm2,%xmm6
@@ -56658,9 +56642,9 @@ _sk_srcover_rgba_8888_sse2:
.byte 102,15,219,252 // pand %xmm4,%xmm7
.byte 15,91,229 // cvtdq2ps %xmm5,%xmm4
.byte 15,41,97,16 // movaps %xmm4,0x10(%ecx)
- .byte 15,40,175,82,176,0,0 // movaps 0xb052(%edi),%xmm5
+ .byte 15,40,175,50,176,0,0 // movaps 0xb032(%edi),%xmm5
.byte 15,92,235 // subps %xmm3,%xmm5
- .byte 15,40,143,34,177,0,0 // movaps 0xb122(%edi),%xmm1
+ .byte 15,40,143,2,177,0,0 // movaps 0xb102(%edi),%xmm1
.byte 15,89,193 // mulps %xmm1,%xmm0
.byte 15,89,229 // mulps %xmm5,%xmm4
.byte 15,88,224 // addps %xmm0,%xmm4
@@ -56774,7 +56758,7 @@ _sk_clamp_1_sse2:
.byte 232,0,0,0,0 // call 1e3a <_sk_clamp_1_sse2+0xb>
.byte 88 // pop %eax
.byte 139,77,12 // mov 0xc(%ebp),%ecx
- .byte 15,40,160,166,174,0,0 // movaps 0xaea6(%eax),%xmm4
+ .byte 15,40,160,134,174,0,0 // movaps 0xae86(%eax),%xmm4
.byte 15,93,196 // minps %xmm4,%xmm0
.byte 15,93,204 // minps %xmm4,%xmm1
.byte 15,93,212 // minps %xmm4,%xmm2
@@ -56798,7 +56782,7 @@ _sk_clamp_a_sse2:
.byte 232,0,0,0,0 // call 1e6d <_sk_clamp_a_sse2+0xb>
.byte 88 // pop %eax
.byte 139,77,12 // mov 0xc(%ebp),%ecx
- .byte 15,93,152,115,174,0,0 // minps 0xae73(%eax),%xmm3
+ .byte 15,93,152,83,174,0,0 // minps 0xae53(%eax),%xmm3
.byte 15,93,195 // minps %xmm3,%xmm0
.byte 15,93,203 // minps %xmm3,%xmm1
.byte 15,93,211 // minps %xmm3,%xmm2
@@ -56823,7 +56807,7 @@ _sk_clamp_a_dst_sse2:
.byte 139,77,12 // mov 0xc(%ebp),%ecx
.byte 139,85,8 // mov 0x8(%ebp),%edx
.byte 15,40,98,64 // movaps 0x40(%edx),%xmm4
- .byte 15,93,160,67,174,0,0 // minps 0xae43(%eax),%xmm4
+ .byte 15,93,160,35,174,0,0 // minps 0xae23(%eax),%xmm4
.byte 15,41,98,64 // movaps %xmm4,0x40(%edx)
.byte 15,40,106,16 // movaps 0x10(%edx),%xmm5
.byte 15,40,114,32 // movaps 0x20(%edx),%xmm6
@@ -56897,7 +56881,7 @@ _sk_invert_sse2:
.byte 232,0,0,0,0 // call 1f48 <_sk_invert_sse2+0xb>
.byte 88 // pop %eax
.byte 139,77,12 // mov 0xc(%ebp),%ecx
- .byte 15,40,160,152,173,0,0 // movaps 0xad98(%eax),%xmm4
+ .byte 15,40,160,120,173,0,0 // movaps 0xad78(%eax),%xmm4
.byte 15,40,236 // movaps %xmm4,%xmm5
.byte 15,92,232 // subps %xmm0,%xmm5
.byte 15,40,244 // movaps %xmm4,%xmm6
@@ -57020,7 +57004,7 @@ _sk_unpremul_sse2:
.byte 88 // pop %eax
.byte 139,77,12 // mov 0xc(%ebp),%ecx
.byte 15,87,228 // xorps %xmm4,%xmm4
- .byte 15,40,168,154,172,0,0 // movaps 0xac9a(%eax),%xmm5
+ .byte 15,40,168,122,172,0,0 // movaps 0xac7a(%eax),%xmm5
.byte 15,94,235 // divps %xmm3,%xmm5
.byte 15,194,227,4 // cmpneqps %xmm3,%xmm4
.byte 15,84,229 // andps %xmm5,%xmm4
@@ -57051,19 +57035,19 @@ _sk_from_srgb_sse2:
.byte 88 // pop %eax
.byte 15,40,202 // movaps %xmm2,%xmm1
.byte 15,89,201 // mulps %xmm1,%xmm1
- .byte 15,40,160,224,172,0,0 // movaps 0xace0(%eax),%xmm4
+ .byte 15,40,160,192,172,0,0 // movaps 0xacc0(%eax),%xmm4
.byte 15,89,196 // mulps %xmm4,%xmm0
- .byte 15,40,176,64,173,0,0 // movaps 0xad40(%eax),%xmm6
+ .byte 15,40,176,32,173,0,0 // movaps 0xad20(%eax),%xmm6
.byte 15,41,117,216 // movaps %xmm6,-0x28(%ebp)
.byte 15,88,198 // addps %xmm6,%xmm0
.byte 15,89,193 // mulps %xmm1,%xmm0
- .byte 15,40,176,48,173,0,0 // movaps 0xad30(%eax),%xmm6
+ .byte 15,40,176,16,173,0,0 // movaps 0xad10(%eax),%xmm6
.byte 15,40,202 // movaps %xmm2,%xmm1
.byte 15,89,206 // mulps %xmm6,%xmm1
- .byte 15,40,184,80,173,0,0 // movaps 0xad50(%eax),%xmm7
+ .byte 15,40,184,48,173,0,0 // movaps 0xad30(%eax),%xmm7
.byte 15,41,125,232 // movaps %xmm7,-0x18(%ebp)
.byte 15,88,199 // addps %xmm7,%xmm0
- .byte 15,40,184,96,173,0,0 // movaps 0xad60(%eax),%xmm7
+ .byte 15,40,184,64,173,0,0 // movaps 0xad40(%eax),%xmm7
.byte 15,194,215,1 // cmpltps %xmm7,%xmm2
.byte 15,84,202 // andps %xmm2,%xmm1
.byte 15,85,208 // andnps %xmm0,%xmm2
@@ -57123,18 +57107,18 @@ _sk_from_srgb_dst_sse2:
.byte 15,40,72,16 // movaps 0x10(%eax),%xmm1
.byte 15,40,233 // movaps %xmm1,%xmm5
.byte 15,89,237 // mulps %xmm5,%xmm5
- .byte 15,40,161,5,172,0,0 // movaps 0xac05(%ecx),%xmm4
+ .byte 15,40,161,229,171,0,0 // movaps 0xabe5(%ecx),%xmm4
.byte 15,40,193 // movaps %xmm1,%xmm0
.byte 15,89,196 // mulps %xmm4,%xmm0
- .byte 15,40,177,101,172,0,0 // movaps 0xac65(%ecx),%xmm6
+ .byte 15,40,177,69,172,0,0 // movaps 0xac45(%ecx),%xmm6
.byte 15,88,198 // addps %xmm6,%xmm0
.byte 15,89,197 // mulps %xmm5,%xmm0
- .byte 15,40,169,85,172,0,0 // movaps 0xac55(%ecx),%xmm5
+ .byte 15,40,169,53,172,0,0 // movaps 0xac35(%ecx),%xmm5
.byte 15,40,209 // movaps %xmm1,%xmm2
.byte 15,89,213 // mulps %xmm5,%xmm2
- .byte 15,40,185,117,172,0,0 // movaps 0xac75(%ecx),%xmm7
+ .byte 15,40,185,85,172,0,0 // movaps 0xac55(%ecx),%xmm7
.byte 15,88,199 // addps %xmm7,%xmm0
- .byte 15,40,153,133,172,0,0 // movaps 0xac85(%ecx),%xmm3
+ .byte 15,40,153,101,172,0,0 // movaps 0xac65(%ecx),%xmm3
.byte 15,194,203,1 // cmpltps %xmm3,%xmm1
.byte 15,84,209 // andps %xmm1,%xmm2
.byte 15,85,200 // andnps %xmm0,%xmm1
@@ -57196,25 +57180,25 @@ _sk_to_srgb_sse2:
.byte 232,0,0,0,0 // call 2256 <_sk_to_srgb_sse2+0x18>
.byte 88 // pop %eax
.byte 15,82,218 // rsqrtps %xmm2,%xmm3
- .byte 15,40,160,186,171,0,0 // movaps 0xabba(%eax),%xmm4
+ .byte 15,40,160,154,171,0,0 // movaps 0xab9a(%eax),%xmm4
.byte 15,40,235 // movaps %xmm3,%xmm5
.byte 15,89,236 // mulps %xmm4,%xmm5
- .byte 15,40,128,202,171,0,0 // movaps 0xabca(%eax),%xmm0
+ .byte 15,40,128,170,171,0,0 // movaps 0xabaa(%eax),%xmm0
.byte 15,41,69,232 // movaps %xmm0,-0x18(%ebp)
.byte 15,88,232 // addps %xmm0,%xmm5
.byte 15,89,235 // mulps %xmm3,%xmm5
- .byte 15,40,128,218,171,0,0 // movaps 0xabda(%eax),%xmm0
+ .byte 15,40,128,186,171,0,0 // movaps 0xabba(%eax),%xmm0
.byte 15,41,69,200 // movaps %xmm0,-0x38(%ebp)
.byte 15,88,232 // addps %xmm0,%xmm5
- .byte 15,40,128,234,171,0,0 // movaps 0xabea(%eax),%xmm0
+ .byte 15,40,128,202,171,0,0 // movaps 0xabca(%eax),%xmm0
.byte 15,41,69,216 // movaps %xmm0,-0x28(%ebp)
.byte 15,88,216 // addps %xmm0,%xmm3
.byte 15,83,195 // rcpps %xmm3,%xmm0
.byte 15,89,197 // mulps %xmm5,%xmm0
- .byte 15,40,168,170,171,0,0 // movaps 0xabaa(%eax),%xmm5
+ .byte 15,40,168,138,171,0,0 // movaps 0xab8a(%eax),%xmm5
.byte 15,40,202 // movaps %xmm2,%xmm1
.byte 15,89,205 // mulps %xmm5,%xmm1
- .byte 15,40,152,250,171,0,0 // movaps 0xabfa(%eax),%xmm3
+ .byte 15,40,152,218,171,0,0 // movaps 0xabda(%eax),%xmm3
.byte 15,194,211,1 // cmpltps %xmm3,%xmm2
.byte 15,84,202 // andps %xmm2,%xmm1
.byte 15,85,208 // andnps %xmm0,%xmm2
@@ -57285,14 +57269,14 @@ _sk_rgb_to_hsl_sse2:
.byte 15,40,195 // movaps %xmm3,%xmm0
.byte 15,92,193 // subps %xmm1,%xmm0
.byte 15,41,69,216 // movaps %xmm0,-0x28(%ebp)
- .byte 15,40,136,147,169,0,0 // movaps 0xa993(%eax),%xmm1
+ .byte 15,40,136,115,169,0,0 // movaps 0xa973(%eax),%xmm1
.byte 15,94,200 // divps %xmm0,%xmm1
.byte 15,40,199 // movaps %xmm7,%xmm0
.byte 15,92,194 // subps %xmm2,%xmm0
.byte 15,89,193 // mulps %xmm1,%xmm0
.byte 15,40,239 // movaps %xmm7,%xmm5
.byte 15,194,234,1 // cmpltps %xmm2,%xmm5
- .byte 15,84,168,19,171,0,0 // andps 0xab13(%eax),%xmm5
+ .byte 15,84,168,243,170,0,0 // andps 0xaaf3(%eax),%xmm5
.byte 15,88,232 // addps %xmm0,%xmm5
.byte 15,40,195 // movaps %xmm3,%xmm0
.byte 15,194,196,0 // cmpeqps %xmm4,%xmm0
@@ -57302,9 +57286,9 @@ _sk_rgb_to_hsl_sse2:
.byte 15,92,231 // subps %xmm7,%xmm4
.byte 15,89,209 // mulps %xmm1,%xmm2
.byte 15,89,225 // mulps %xmm1,%xmm4
- .byte 15,40,136,35,171,0,0 // movaps 0xab23(%eax),%xmm1
+ .byte 15,40,136,3,171,0,0 // movaps 0xab03(%eax),%xmm1
.byte 15,88,209 // addps %xmm1,%xmm2
- .byte 15,88,160,51,171,0,0 // addps 0xab33(%eax),%xmm4
+ .byte 15,88,160,19,171,0,0 // addps 0xab13(%eax),%xmm4
.byte 15,84,214 // andps %xmm6,%xmm2
.byte 15,85,244 // andnps %xmm4,%xmm6
.byte 15,86,242 // orps %xmm2,%xmm6
@@ -57316,7 +57300,7 @@ _sk_rgb_to_hsl_sse2:
.byte 15,194,226,4 // cmpneqps %xmm2,%xmm4
.byte 15,92,203 // subps %xmm3,%xmm1
.byte 15,88,218 // addps %xmm2,%xmm3
- .byte 15,40,168,131,169,0,0 // movaps 0xa983(%eax),%xmm5
+ .byte 15,40,168,99,169,0,0 // movaps 0xa963(%eax),%xmm5
.byte 15,92,202 // subps %xmm2,%xmm1
.byte 15,40,211 // movaps %xmm3,%xmm2
.byte 15,89,213 // mulps %xmm5,%xmm2
@@ -57326,7 +57310,7 @@ _sk_rgb_to_hsl_sse2:
.byte 15,86,233 // orps %xmm1,%xmm5
.byte 15,40,77,216 // movaps -0x28(%ebp),%xmm1
.byte 15,94,205 // divps %xmm5,%xmm1
- .byte 15,89,128,67,171,0,0 // mulps 0xab43(%eax),%xmm0
+ .byte 15,89,128,35,171,0,0 // mulps 0xab23(%eax),%xmm0
.byte 15,84,196 // andps %xmm4,%xmm0
.byte 15,84,204 // andps %xmm4,%xmm1
.byte 139,69,12 // mov 0xc(%ebp),%eax
@@ -57351,7 +57335,7 @@ _sk_hsl_to_rgb_sse2:
.byte 15,41,69,184 // movaps %xmm0,-0x48(%ebp)
.byte 232,0,0,0,0 // call 2448 <_sk_hsl_to_rgb_sse2+0x19>
.byte 88 // pop %eax
- .byte 15,40,160,136,168,0,0 // movaps 0xa888(%eax),%xmm4
+ .byte 15,40,160,104,168,0,0 // movaps 0xa868(%eax),%xmm4
.byte 15,40,220 // movaps %xmm4,%xmm3
.byte 15,41,165,104,255,255,255 // movaps %xmm4,-0x98(%ebp)
.byte 15,194,218,2 // cmpleps %xmm2,%xmm3
@@ -57364,13 +57348,13 @@ _sk_hsl_to_rgb_sse2:
.byte 15,84,243 // andps %xmm3,%xmm6
.byte 15,85,217 // andnps %xmm1,%xmm3
.byte 15,86,222 // orps %xmm6,%xmm3
- .byte 15,40,168,88,170,0,0 // movaps 0xaa58(%eax),%xmm5
+ .byte 15,40,168,56,170,0,0 // movaps 0xaa38(%eax),%xmm5
.byte 15,88,232 // addps %xmm0,%xmm5
.byte 243,15,91,205 // cvttps2dq %xmm5,%xmm1
.byte 15,91,201 // cvtdq2ps %xmm1,%xmm1
.byte 15,40,197 // movaps %xmm5,%xmm0
.byte 15,194,193,1 // cmpltps %xmm1,%xmm0
- .byte 15,40,176,152,168,0,0 // movaps 0xa898(%eax),%xmm6
+ .byte 15,40,176,120,168,0,0 // movaps 0xa878(%eax),%xmm6
.byte 15,41,117,136 // movaps %xmm6,-0x78(%ebp)
.byte 15,84,198 // andps %xmm6,%xmm0
.byte 15,92,200 // subps %xmm0,%xmm1
@@ -57380,19 +57364,19 @@ _sk_hsl_to_rgb_sse2:
.byte 15,41,93,216 // movaps %xmm3,-0x28(%ebp)
.byte 15,88,210 // addps %xmm2,%xmm2
.byte 15,92,211 // subps %xmm3,%xmm2
- .byte 15,40,184,104,170,0,0 // movaps 0xaa68(%eax),%xmm7
+ .byte 15,40,184,72,170,0,0 // movaps 0xaa48(%eax),%xmm7
.byte 15,41,189,88,255,255,255 // movaps %xmm7,-0xa8(%ebp)
.byte 15,194,253,2 // cmpleps %xmm5,%xmm7
.byte 15,92,218 // subps %xmm2,%xmm3
.byte 15,41,93,200 // movaps %xmm3,-0x38(%ebp)
.byte 15,40,204 // movaps %xmm4,%xmm1
.byte 15,194,205,2 // cmpleps %xmm5,%xmm1
- .byte 15,40,160,72,170,0,0 // movaps 0xaa48(%eax),%xmm4
+ .byte 15,40,160,40,170,0,0 // movaps 0xaa28(%eax),%xmm4
.byte 15,41,165,120,255,255,255 // movaps %xmm4,-0x88(%ebp)
.byte 15,194,229,2 // cmpleps %xmm5,%xmm4
- .byte 15,40,176,24,170,0,0 // movaps 0xaa18(%eax),%xmm6
+ .byte 15,40,176,248,169,0,0 // movaps 0xa9f8(%eax),%xmm6
.byte 15,89,238 // mulps %xmm6,%xmm5
- .byte 15,40,128,56,170,0,0 // movaps 0xaa38(%eax),%xmm0
+ .byte 15,40,128,24,170,0,0 // movaps 0xaa18(%eax),%xmm0
.byte 15,41,69,168 // movaps %xmm0,-0x58(%ebp)
.byte 15,92,197 // subps %xmm5,%xmm0
.byte 15,89,195 // mulps %xmm3,%xmm0
@@ -57418,18 +57402,18 @@ _sk_hsl_to_rgb_sse2:
.byte 15,91,192 // cvtdq2ps %xmm0,%xmm0
.byte 15,40,203 // movaps %xmm3,%xmm1
.byte 15,194,200,1 // cmpltps %xmm0,%xmm1
- .byte 15,84,136,152,168,0,0 // andps 0xa898(%eax),%xmm1
+ .byte 15,84,136,120,168,0,0 // andps 0xa878(%eax),%xmm1
.byte 15,92,193 // subps %xmm1,%xmm0
.byte 15,40,203 // movaps %xmm3,%xmm1
.byte 15,92,200 // subps %xmm0,%xmm1
- .byte 15,40,128,104,170,0,0 // movaps 0xaa68(%eax),%xmm0
+ .byte 15,40,128,72,170,0,0 // movaps 0xaa48(%eax),%xmm0
.byte 15,194,193,2 // cmpleps %xmm1,%xmm0
- .byte 15,40,152,136,168,0,0 // movaps 0xa888(%eax),%xmm3
+ .byte 15,40,152,104,168,0,0 // movaps 0xa868(%eax),%xmm3
.byte 15,194,217,2 // cmpleps %xmm1,%xmm3
- .byte 15,40,160,72,170,0,0 // movaps 0xaa48(%eax),%xmm4
+ .byte 15,40,160,40,170,0,0 // movaps 0xaa28(%eax),%xmm4
.byte 15,194,225,2 // cmpleps %xmm1,%xmm4
.byte 15,89,206 // mulps %xmm6,%xmm1
- .byte 15,40,168,56,170,0,0 // movaps 0xaa38(%eax),%xmm5
+ .byte 15,40,168,24,170,0,0 // movaps 0xaa18(%eax),%xmm5
.byte 15,92,233 // subps %xmm1,%xmm5
.byte 15,89,239 // mulps %xmm7,%xmm5
.byte 15,88,234 // addps %xmm2,%xmm5
@@ -57449,7 +57433,7 @@ _sk_hsl_to_rgb_sse2:
.byte 15,40,125,232 // movaps -0x18(%ebp),%xmm7
.byte 15,85,252 // andnps %xmm4,%xmm7
.byte 15,40,93,184 // movaps -0x48(%ebp),%xmm3
- .byte 15,88,152,120,170,0,0 // addps 0xaa78(%eax),%xmm3
+ .byte 15,88,152,88,170,0,0 // addps 0xaa58(%eax),%xmm3
.byte 243,15,91,195 // cvttps2dq %xmm3,%xmm0
.byte 15,91,192 // cvtdq2ps %xmm0,%xmm0
.byte 15,40,203 // movaps %xmm3,%xmm1
@@ -57551,9 +57535,9 @@ _sk_scale_u8_sse2:
.byte 102,15,110,36,62 // movd (%esi,%edi,1),%xmm4
.byte 102,15,96,224 // punpcklbw %xmm0,%xmm4
.byte 102,15,97,224 // punpcklwd %xmm0,%xmm4
- .byte 102,15,219,162,222,166,0,0 // pand 0xa6de(%edx),%xmm4
+ .byte 102,15,219,162,190,166,0,0 // pand 0xa6be(%edx),%xmm4
.byte 15,91,228 // cvtdq2ps %xmm4,%xmm4
- .byte 15,89,162,14,168,0,0 // mulps 0xa80e(%edx),%xmm4
+ .byte 15,89,162,238,167,0,0 // mulps 0xa7ee(%edx),%xmm4
.byte 15,89,196 // mulps %xmm4,%xmm0
.byte 15,89,204 // mulps %xmm4,%xmm1
.byte 15,89,212 // mulps %xmm4,%xmm2
@@ -57619,17 +57603,17 @@ _sk_scale_565_sse2:
.byte 15,133,157,0,0,0 // jne 283a <_sk_scale_565_sse2+0xd8>
.byte 243,15,126,52,126 // movq (%esi,%edi,2),%xmm6
.byte 102,15,97,240 // punpcklwd %xmm0,%xmm6
- .byte 102,15,111,162,100,167,0,0 // movdqa 0xa764(%edx),%xmm4
+ .byte 102,15,111,162,68,167,0,0 // movdqa 0xa744(%edx),%xmm4
.byte 102,15,219,230 // pand %xmm6,%xmm4
.byte 15,91,212 // cvtdq2ps %xmm4,%xmm2
- .byte 15,89,146,116,167,0,0 // mulps 0xa774(%edx),%xmm2
- .byte 102,15,111,170,132,167,0,0 // movdqa 0xa784(%edx),%xmm5
+ .byte 15,89,146,84,167,0,0 // mulps 0xa754(%edx),%xmm2
+ .byte 102,15,111,170,100,167,0,0 // movdqa 0xa764(%edx),%xmm5
.byte 102,15,219,238 // pand %xmm6,%xmm5
.byte 15,91,237 // cvtdq2ps %xmm5,%xmm5
- .byte 15,89,170,148,167,0,0 // mulps 0xa794(%edx),%xmm5
- .byte 102,15,219,178,164,167,0,0 // pand 0xa7a4(%edx),%xmm6
+ .byte 15,89,170,116,167,0,0 // mulps 0xa774(%edx),%xmm5
+ .byte 102,15,219,178,132,167,0,0 // pand 0xa784(%edx),%xmm6
.byte 15,91,246 // cvtdq2ps %xmm6,%xmm6
- .byte 15,89,178,180,167,0,0 // mulps 0xa7b4(%edx),%xmm6
+ .byte 15,89,178,148,167,0,0 // mulps 0xa794(%edx),%xmm6
.byte 15,40,253 // movaps %xmm5,%xmm7
.byte 15,93,254 // minps %xmm6,%xmm7
.byte 15,40,226 // movaps %xmm2,%xmm4
@@ -57743,9 +57727,9 @@ _sk_lerp_u8_sse2:
.byte 102,15,110,36,62 // movd (%esi,%edi,1),%xmm4
.byte 102,15,96,224 // punpcklbw %xmm0,%xmm4
.byte 102,15,97,224 // punpcklwd %xmm0,%xmm4
- .byte 102,15,219,162,182,164,0,0 // pand 0xa4b6(%edx),%xmm4
+ .byte 102,15,219,162,150,164,0,0 // pand 0xa496(%edx),%xmm4
.byte 15,91,228 // cvtdq2ps %xmm4,%xmm4
- .byte 15,89,162,230,165,0,0 // mulps 0xa5e6(%edx),%xmm4
+ .byte 15,89,162,198,165,0,0 // mulps 0xa5c6(%edx),%xmm4
.byte 15,40,105,16 // movaps 0x10(%ecx),%xmm5
.byte 15,40,113,32 // movaps 0x20(%ecx),%xmm6
.byte 15,92,197 // subps %xmm5,%xmm0
@@ -57823,17 +57807,17 @@ _sk_lerp_565_sse2:
.byte 15,133,211,0,0,0 // jne 2ac8 <_sk_lerp_565_sse2+0x113>
.byte 243,15,126,44,126 // movq (%esi,%edi,2),%xmm5
.byte 102,15,97,232 // punpcklwd %xmm0,%xmm5
- .byte 102,15,111,162,12,165,0,0 // movdqa 0xa50c(%edx),%xmm4
+ .byte 102,15,111,162,236,164,0,0 // movdqa 0xa4ec(%edx),%xmm4
.byte 102,15,219,229 // pand %xmm5,%xmm4
.byte 15,91,204 // cvtdq2ps %xmm4,%xmm1
- .byte 15,89,138,28,165,0,0 // mulps 0xa51c(%edx),%xmm1
- .byte 102,15,111,178,44,165,0,0 // movdqa 0xa52c(%edx),%xmm6
+ .byte 15,89,138,252,164,0,0 // mulps 0xa4fc(%edx),%xmm1
+ .byte 102,15,111,178,12,165,0,0 // movdqa 0xa50c(%edx),%xmm6
.byte 102,15,219,245 // pand %xmm5,%xmm6
.byte 15,91,246 // cvtdq2ps %xmm6,%xmm6
- .byte 15,89,178,60,165,0,0 // mulps 0xa53c(%edx),%xmm6
- .byte 102,15,219,170,76,165,0,0 // pand 0xa54c(%edx),%xmm5
+ .byte 15,89,178,28,165,0,0 // mulps 0xa51c(%edx),%xmm6
+ .byte 102,15,219,170,44,165,0,0 // pand 0xa52c(%edx),%xmm5
.byte 15,91,213 // cvtdq2ps %xmm5,%xmm2
- .byte 15,89,146,92,165,0,0 // mulps 0xa55c(%edx),%xmm2
+ .byte 15,89,146,60,165,0,0 // mulps 0xa53c(%edx),%xmm2
.byte 15,40,218 // movaps %xmm2,%xmm3
.byte 15,41,93,200 // movaps %xmm3,-0x38(%ebp)
.byte 15,40,254 // movaps %xmm6,%xmm7
@@ -57912,16 +57896,16 @@ _sk_load_tables_sse2:
.byte 131,236,12 // sub $0xc,%esp
.byte 232,0,0,0,0 // call 2b1e <_sk_load_tables_sse2+0xe>
.byte 90 // pop %edx
- .byte 139,117,12 // mov 0xc(%ebp),%esi
+ .byte 139,69,12 // mov 0xc(%ebp),%eax
.byte 139,77,8 // mov 0x8(%ebp),%ecx
- .byte 139,57 // mov (%ecx),%edi
+ .byte 139,48 // mov (%eax),%esi
.byte 139,65,8 // mov 0x8(%ecx),%eax
.byte 133,192 // test %eax,%eax
- .byte 139,54 // mov (%esi),%esi
+ .byte 139,57 // mov (%ecx),%edi
.byte 139,30 // mov (%esi),%ebx
.byte 15,133,22,1,0,0 // jne 2c4c <_sk_load_tables_sse2+0x13c>
.byte 243,15,111,28,187 // movdqu (%ebx,%edi,4),%xmm3
- .byte 102,15,111,146,130,162,0,0 // movdqa 0xa282(%edx),%xmm2
+ .byte 102,15,111,146,98,162,0,0 // movdqa 0xa262(%edx),%xmm2
.byte 102,15,111,195 // movdqa %xmm3,%xmm0
.byte 102,15,219,194 // pand %xmm2,%xmm0
.byte 102,15,112,200,78 // pshufd $0x4e,%xmm0,%xmm1
@@ -57977,7 +57961,7 @@ _sk_load_tables_sse2:
.byte 102,15,20,215 // unpcklpd %xmm7,%xmm2
.byte 102,15,114,211,24 // psrld $0x18,%xmm3
.byte 15,91,219 // cvtdq2ps %xmm3,%xmm3
- .byte 15,89,154,178,163,0,0 // mulps 0xa3b2(%edx),%xmm3
+ .byte 15,89,154,146,163,0,0 // mulps 0xa392(%edx),%xmm3
.byte 139,69,12 // mov 0xc(%ebp),%eax
.byte 137,194 // mov %eax,%edx
.byte 141,66,8 // lea 0x8(%edx),%eax
@@ -58018,17 +58002,17 @@ _sk_load_tables_u16_be_sse2:
.byte 131,236,44 // sub $0x2c,%esp
.byte 232,0,0,0,0 // call 2c8f <_sk_load_tables_u16_be_sse2+0xe>
.byte 90 // pop %edx
- .byte 139,69,12 // mov 0xc(%ebp),%eax
+ .byte 139,117,12 // mov 0xc(%ebp),%esi
.byte 139,77,8 // mov 0x8(%ebp),%ecx
.byte 139,57 // mov (%ecx),%edi
- .byte 139,89,8 // mov 0x8(%ecx),%ebx
+ .byte 139,65,8 // mov 0x8(%ecx),%eax
.byte 193,231,2 // shl $0x2,%edi
- .byte 133,219 // test %ebx,%ebx
- .byte 139,48 // mov (%eax),%esi
- .byte 139,6 // mov (%esi),%eax
+ .byte 133,192 // test %eax,%eax
+ .byte 139,54 // mov (%esi),%esi
+ .byte 139,30 // mov (%esi),%ebx
.byte 15,133,210,1,0,0 // jne 2e7c <_sk_load_tables_u16_be_sse2+0x1fb>
- .byte 102,15,16,4,120 // movupd (%eax,%edi,2),%xmm0
- .byte 243,15,111,76,120,16 // movdqu 0x10(%eax,%edi,2),%xmm1
+ .byte 102,15,16,4,123 // movupd (%ebx,%edi,2),%xmm0
+ .byte 243,15,111,76,123,16 // movdqu 0x10(%ebx,%edi,2),%xmm1
.byte 102,15,40,216 // movapd %xmm0,%xmm3
.byte 102,15,97,217 // punpcklwd %xmm1,%xmm3
.byte 102,15,105,193 // punpckhwd %xmm1,%xmm0
@@ -58052,7 +58036,7 @@ _sk_load_tables_u16_be_sse2:
.byte 242,15,112,192,232 // pshuflw $0xe8,%xmm0,%xmm0
.byte 243,15,112,192,232 // pshufhw $0xe8,%xmm0,%xmm0
.byte 102,15,112,192,232 // pshufd $0xe8,%xmm0,%xmm0
- .byte 102,15,111,146,177,162,0,0 // movdqa 0xa2b1(%edx),%xmm2
+ .byte 102,15,111,146,145,162,0,0 // movdqa 0xa291(%edx),%xmm2
.byte 102,15,219,194 // pand %xmm2,%xmm0
.byte 102,15,239,228 // pxor %xmm4,%xmm4
.byte 102,15,97,196 // punpcklwd %xmm4,%xmm0
@@ -58124,7 +58108,7 @@ _sk_load_tables_u16_be_sse2:
.byte 243,15,126,93,232 // movq -0x18(%ebp),%xmm3
.byte 102,15,97,220 // punpcklwd %xmm4,%xmm3
.byte 15,91,219 // cvtdq2ps %xmm3,%xmm3
- .byte 15,89,154,193,162,0,0 // mulps 0xa2c1(%edx),%xmm3
+ .byte 15,89,154,161,162,0,0 // mulps 0xa2a1(%edx),%xmm3
.byte 139,69,12 // mov 0xc(%ebp),%eax
.byte 137,194 // mov %eax,%edx
.byte 141,66,8 // lea 0x8(%edx),%eax
@@ -58138,14 +58122,14 @@ _sk_load_tables_u16_be_sse2:
.byte 91 // pop %ebx
.byte 93 // pop %ebp
.byte 195 // ret
- .byte 242,15,16,4,120 // movsd (%eax,%edi,2),%xmm0
+ .byte 242,15,16,4,123 // movsd (%ebx,%edi,2),%xmm0
.byte 102,15,239,201 // pxor %xmm1,%xmm1
- .byte 131,251,1 // cmp $0x1,%ebx
+ .byte 131,248,1 // cmp $0x1,%eax
.byte 15,132,39,254,255,255 // je 2cb5 <_sk_load_tables_u16_be_sse2+0x34>
- .byte 102,15,22,68,120,8 // movhpd 0x8(%eax,%edi,2),%xmm0
- .byte 131,251,3 // cmp $0x3,%ebx
+ .byte 102,15,22,68,123,8 // movhpd 0x8(%ebx,%edi,2),%xmm0
+ .byte 131,248,3 // cmp $0x3,%eax
.byte 15,130,24,254,255,255 // jb 2cb5 <_sk_load_tables_u16_be_sse2+0x34>
- .byte 243,15,126,76,120,16 // movq 0x10(%eax,%edi,2),%xmm1
+ .byte 243,15,126,76,123,16 // movq 0x10(%ebx,%edi,2),%xmm1
.byte 233,13,254,255,255 // jmp 2cb5 <_sk_load_tables_u16_be_sse2+0x34>
HIDDEN _sk_load_tables_rgb_u16_be_sse2
@@ -58197,7 +58181,7 @@ _sk_load_tables_rgb_u16_be_sse2:
.byte 242,15,112,194,232 // pshuflw $0xe8,%xmm2,%xmm0
.byte 243,15,112,192,232 // pshufhw $0xe8,%xmm0,%xmm0
.byte 102,15,112,192,232 // pshufd $0xe8,%xmm0,%xmm0
- .byte 102,15,111,146,138,160,0,0 // movdqa 0xa08a(%edx),%xmm2
+ .byte 102,15,111,146,106,160,0,0 // movdqa 0xa06a(%edx),%xmm2
.byte 102,15,219,194 // pand %xmm2,%xmm0
.byte 102,15,239,219 // pxor %xmm3,%xmm3
.byte 102,15,97,195 // punpcklwd %xmm3,%xmm0
@@ -58262,7 +58246,7 @@ _sk_load_tables_rgb_u16_be_sse2:
.byte 137,198 // mov %eax,%esi
.byte 141,70,8 // lea 0x8(%esi),%eax
.byte 131,236,8 // sub $0x8,%esp
- .byte 15,40,154,42,158,0,0 // movaps 0x9e2a(%edx),%xmm3
+ .byte 15,40,154,10,158,0,0 // movaps 0x9e0a(%edx),%xmm3
.byte 80 // push %eax
.byte 81 // push %ecx
.byte 255,86,4 // call *0x4(%esi)
@@ -58305,7 +58289,7 @@ _sk_byte_tables_sse2:
.byte 90 // pop %edx
.byte 139,69,12 // mov 0xc(%ebp),%eax
.byte 139,8 // mov (%eax),%ecx
- .byte 15,40,162,205,156,0,0 // movaps 0x9ccd(%edx),%xmm4
+ .byte 15,40,162,173,156,0,0 // movaps 0x9cad(%edx),%xmm4
.byte 15,89,196 // mulps %xmm4,%xmm0
.byte 102,15,91,192 // cvtps2dq %xmm0,%xmm0
.byte 102,15,112,232,78 // pshufd $0x4e,%xmm0,%xmm5
@@ -58327,7 +58311,7 @@ _sk_byte_tables_sse2:
.byte 102,15,110,192 // movd %eax,%xmm0
.byte 139,65,4 // mov 0x4(%ecx),%eax
.byte 102,15,196,195,1 // pinsrw $0x1,%ebx,%xmm0
- .byte 15,40,170,237,157,0,0 // movaps 0x9ded(%edx),%xmm5
+ .byte 15,40,170,205,157,0,0 // movaps 0x9dcd(%edx),%xmm5
.byte 15,89,204 // mulps %xmm4,%xmm1
.byte 102,15,91,201 // cvtps2dq %xmm1,%xmm1
.byte 102,15,112,241,78 // pshufd $0x4e,%xmm1,%xmm6
@@ -58457,7 +58441,7 @@ _sk_byte_tables_rgb_sse2:
.byte 102,15,110,199 // movd %edi,%xmm0
.byte 139,121,4 // mov 0x4(%ecx),%edi
.byte 102,15,196,198,1 // pinsrw $0x1,%esi,%xmm0
- .byte 15,40,170,241,155,0,0 // movaps 0x9bf1(%edx),%xmm5
+ .byte 15,40,170,209,155,0,0 // movaps 0x9bd1(%edx),%xmm5
.byte 15,89,204 // mulps %xmm4,%xmm1
.byte 102,15,91,201 // cvtps2dq %xmm1,%xmm1
.byte 102,15,112,241,78 // pshufd $0x4e,%xmm1,%xmm6
@@ -58713,15 +58697,15 @@ _sk_parametric_r_sse2:
.byte 15,198,237,0 // shufps $0x0,%xmm5,%xmm5
.byte 15,88,245 // addps %xmm5,%xmm6
.byte 15,91,238 // cvtdq2ps %xmm6,%xmm5
- .byte 15,89,170,177,153,0,0 // mulps 0x99b1(%edx),%xmm5
- .byte 15,84,178,193,153,0,0 // andps 0x99c1(%edx),%xmm6
- .byte 15,86,178,33,151,0,0 // orps 0x9721(%edx),%xmm6
- .byte 15,88,170,209,153,0,0 // addps 0x99d1(%edx),%xmm5
- .byte 15,40,186,225,153,0,0 // movaps 0x99e1(%edx),%xmm7
+ .byte 15,89,170,145,153,0,0 // mulps 0x9991(%edx),%xmm5
+ .byte 15,84,178,161,153,0,0 // andps 0x99a1(%edx),%xmm6
+ .byte 15,86,178,1,151,0,0 // orps 0x9701(%edx),%xmm6
+ .byte 15,88,170,177,153,0,0 // addps 0x99b1(%edx),%xmm5
+ .byte 15,40,186,193,153,0,0 // movaps 0x99c1(%edx),%xmm7
.byte 15,89,254 // mulps %xmm6,%xmm7
.byte 15,92,239 // subps %xmm7,%xmm5
- .byte 15,88,178,241,153,0,0 // addps 0x99f1(%edx),%xmm6
- .byte 15,40,186,1,154,0,0 // movaps 0x9a01(%edx),%xmm7
+ .byte 15,88,178,209,153,0,0 // addps 0x99d1(%edx),%xmm6
+ .byte 15,40,186,225,153,0,0 // movaps 0x99e1(%edx),%xmm7
.byte 15,94,254 // divps %xmm6,%xmm7
.byte 243,15,16,49 // movss (%ecx),%xmm6
.byte 15,198,246,0 // shufps $0x0,%xmm6,%xmm6
@@ -58731,21 +58715,21 @@ _sk_parametric_r_sse2:
.byte 15,91,254 // cvtdq2ps %xmm6,%xmm7
.byte 15,40,197 // movaps %xmm5,%xmm0
.byte 15,194,199,1 // cmpltps %xmm7,%xmm0
- .byte 15,40,178,49,151,0,0 // movaps 0x9731(%edx),%xmm6
+ .byte 15,40,178,17,151,0,0 // movaps 0x9711(%edx),%xmm6
.byte 15,84,198 // andps %xmm6,%xmm0
.byte 15,92,248 // subps %xmm0,%xmm7
.byte 15,40,197 // movaps %xmm5,%xmm0
.byte 15,92,199 // subps %xmm7,%xmm0
- .byte 15,88,170,17,154,0,0 // addps 0x9a11(%edx),%xmm5
- .byte 15,40,186,33,154,0,0 // movaps 0x9a21(%edx),%xmm7
+ .byte 15,88,170,241,153,0,0 // addps 0x99f1(%edx),%xmm5
+ .byte 15,40,186,1,154,0,0 // movaps 0x9a01(%edx),%xmm7
.byte 15,89,248 // mulps %xmm0,%xmm7
.byte 15,92,239 // subps %xmm7,%xmm5
- .byte 15,40,186,49,154,0,0 // movaps 0x9a31(%edx),%xmm7
+ .byte 15,40,186,17,154,0,0 // movaps 0x9a11(%edx),%xmm7
.byte 15,92,248 // subps %xmm0,%xmm7
- .byte 15,40,130,65,154,0,0 // movaps 0x9a41(%edx),%xmm0
+ .byte 15,40,130,33,154,0,0 // movaps 0x9a21(%edx),%xmm0
.byte 15,94,199 // divps %xmm7,%xmm0
.byte 15,88,197 // addps %xmm5,%xmm0
- .byte 15,89,130,81,154,0,0 // mulps 0x9a51(%edx),%xmm0
+ .byte 15,89,130,49,154,0,0 // mulps 0x9a31(%edx),%xmm0
.byte 102,15,91,192 // cvtps2dq %xmm0,%xmm0
.byte 243,15,16,105,20 // movss 0x14(%ecx),%xmm5
.byte 15,198,237,0 // shufps $0x0,%xmm5,%xmm5
@@ -58799,15 +58783,15 @@ _sk_parametric_g_sse2:
.byte 15,198,237,0 // shufps $0x0,%xmm5,%xmm5
.byte 15,88,245 // addps %xmm5,%xmm6
.byte 15,91,238 // cvtdq2ps %xmm6,%xmm5
- .byte 15,89,170,122,152,0,0 // mulps 0x987a(%edx),%xmm5
- .byte 15,84,178,138,152,0,0 // andps 0x988a(%edx),%xmm6
- .byte 15,86,178,234,149,0,0 // orps 0x95ea(%edx),%xmm6
- .byte 15,88,170,154,152,0,0 // addps 0x989a(%edx),%xmm5
- .byte 15,40,186,170,152,0,0 // movaps 0x98aa(%edx),%xmm7
+ .byte 15,89,170,90,152,0,0 // mulps 0x985a(%edx),%xmm5
+ .byte 15,84,178,106,152,0,0 // andps 0x986a(%edx),%xmm6
+ .byte 15,86,178,202,149,0,0 // orps 0x95ca(%edx),%xmm6
+ .byte 15,88,170,122,152,0,0 // addps 0x987a(%edx),%xmm5
+ .byte 15,40,186,138,152,0,0 // movaps 0x988a(%edx),%xmm7
.byte 15,89,254 // mulps %xmm6,%xmm7
.byte 15,92,239 // subps %xmm7,%xmm5
- .byte 15,88,178,186,152,0,0 // addps 0x98ba(%edx),%xmm6
- .byte 15,40,186,202,152,0,0 // movaps 0x98ca(%edx),%xmm7
+ .byte 15,88,178,154,152,0,0 // addps 0x989a(%edx),%xmm6
+ .byte 15,40,186,170,152,0,0 // movaps 0x98aa(%edx),%xmm7
.byte 15,94,254 // divps %xmm6,%xmm7
.byte 243,15,16,49 // movss (%ecx),%xmm6
.byte 15,198,246,0 // shufps $0x0,%xmm6,%xmm6
@@ -58817,21 +58801,21 @@ _sk_parametric_g_sse2:
.byte 15,91,254 // cvtdq2ps %xmm6,%xmm7
.byte 15,40,197 // movaps %xmm5,%xmm0
.byte 15,194,199,1 // cmpltps %xmm7,%xmm0
- .byte 15,40,178,250,149,0,0 // movaps 0x95fa(%edx),%xmm6
+ .byte 15,40,178,218,149,0,0 // movaps 0x95da(%edx),%xmm6
.byte 15,84,198 // andps %xmm6,%xmm0
.byte 15,92,248 // subps %xmm0,%xmm7
.byte 15,40,197 // movaps %xmm5,%xmm0
.byte 15,92,199 // subps %xmm7,%xmm0
- .byte 15,88,170,218,152,0,0 // addps 0x98da(%edx),%xmm5
- .byte 15,40,186,234,152,0,0 // movaps 0x98ea(%edx),%xmm7
+ .byte 15,88,170,186,152,0,0 // addps 0x98ba(%edx),%xmm5
+ .byte 15,40,186,202,152,0,0 // movaps 0x98ca(%edx),%xmm7
.byte 15,89,248 // mulps %xmm0,%xmm7
.byte 15,92,239 // subps %xmm7,%xmm5
- .byte 15,40,186,250,152,0,0 // movaps 0x98fa(%edx),%xmm7
+ .byte 15,40,186,218,152,0,0 // movaps 0x98da(%edx),%xmm7
.byte 15,92,248 // subps %xmm0,%xmm7
- .byte 15,40,130,10,153,0,0 // movaps 0x990a(%edx),%xmm0
+ .byte 15,40,130,234,152,0,0 // movaps 0x98ea(%edx),%xmm0
.byte 15,94,199 // divps %xmm7,%xmm0
.byte 15,88,197 // addps %xmm5,%xmm0
- .byte 15,89,130,26,153,0,0 // mulps 0x991a(%edx),%xmm0
+ .byte 15,89,130,250,152,0,0 // mulps 0x98fa(%edx),%xmm0
.byte 102,15,91,192 // cvtps2dq %xmm0,%xmm0
.byte 243,15,16,105,20 // movss 0x14(%ecx),%xmm5
.byte 15,198,237,0 // shufps $0x0,%xmm5,%xmm5
@@ -58884,15 +58868,15 @@ _sk_parametric_b_sse2:
.byte 15,198,237,0 // shufps $0x0,%xmm5,%xmm5
.byte 15,88,245 // addps %xmm5,%xmm6
.byte 15,91,238 // cvtdq2ps %xmm6,%xmm5
- .byte 15,89,170,70,151,0,0 // mulps 0x9746(%edx),%xmm5
- .byte 15,84,178,86,151,0,0 // andps 0x9756(%edx),%xmm6
- .byte 15,86,178,182,148,0,0 // orps 0x94b6(%edx),%xmm6
- .byte 15,88,170,102,151,0,0 // addps 0x9766(%edx),%xmm5
- .byte 15,40,186,118,151,0,0 // movaps 0x9776(%edx),%xmm7
+ .byte 15,89,170,38,151,0,0 // mulps 0x9726(%edx),%xmm5
+ .byte 15,84,178,54,151,0,0 // andps 0x9736(%edx),%xmm6
+ .byte 15,86,178,150,148,0,0 // orps 0x9496(%edx),%xmm6
+ .byte 15,88,170,70,151,0,0 // addps 0x9746(%edx),%xmm5
+ .byte 15,40,186,86,151,0,0 // movaps 0x9756(%edx),%xmm7
.byte 15,89,254 // mulps %xmm6,%xmm7
.byte 15,92,239 // subps %xmm7,%xmm5
- .byte 15,88,178,134,151,0,0 // addps 0x9786(%edx),%xmm6
- .byte 15,40,186,150,151,0,0 // movaps 0x9796(%edx),%xmm7
+ .byte 15,88,178,102,151,0,0 // addps 0x9766(%edx),%xmm6
+ .byte 15,40,186,118,151,0,0 // movaps 0x9776(%edx),%xmm7
.byte 15,94,254 // divps %xmm6,%xmm7
.byte 243,15,16,49 // movss (%ecx),%xmm6
.byte 15,198,246,0 // shufps $0x0,%xmm6,%xmm6
@@ -58902,21 +58886,21 @@ _sk_parametric_b_sse2:
.byte 15,91,254 // cvtdq2ps %xmm6,%xmm7
.byte 15,40,197 // movaps %xmm5,%xmm0
.byte 15,194,199,1 // cmpltps %xmm7,%xmm0
- .byte 15,40,178,198,148,0,0 // movaps 0x94c6(%edx),%xmm6
+ .byte 15,40,178,166,148,0,0 // movaps 0x94a6(%edx),%xmm6
.byte 15,84,198 // andps %xmm6,%xmm0
.byte 15,92,248 // subps %xmm0,%xmm7
.byte 15,40,197 // movaps %xmm5,%xmm0
.byte 15,92,199 // subps %xmm7,%xmm0
- .byte 15,88,170,166,151,0,0 // addps 0x97a6(%edx),%xmm5
- .byte 15,40,186,182,151,0,0 // movaps 0x97b6(%edx),%xmm7
+ .byte 15,88,170,134,151,0,0 // addps 0x9786(%edx),%xmm5
+ .byte 15,40,186,150,151,0,0 // movaps 0x9796(%edx),%xmm7
.byte 15,89,248 // mulps %xmm0,%xmm7
.byte 15,92,239 // subps %xmm7,%xmm5
- .byte 15,40,186,198,151,0,0 // movaps 0x97c6(%edx),%xmm7
+ .byte 15,40,186,166,151,0,0 // movaps 0x97a6(%edx),%xmm7
.byte 15,92,248 // subps %xmm0,%xmm7
- .byte 15,40,130,214,151,0,0 // movaps 0x97d6(%edx),%xmm0
+ .byte 15,40,130,182,151,0,0 // movaps 0x97b6(%edx),%xmm0
.byte 15,94,199 // divps %xmm7,%xmm0
.byte 15,88,197 // addps %xmm5,%xmm0
- .byte 15,89,130,230,151,0,0 // mulps 0x97e6(%edx),%xmm0
+ .byte 15,89,130,198,151,0,0 // mulps 0x97c6(%edx),%xmm0
.byte 102,15,91,192 // cvtps2dq %xmm0,%xmm0
.byte 243,15,16,105,20 // movss 0x14(%ecx),%xmm5
.byte 15,198,237,0 // shufps $0x0,%xmm5,%xmm5
@@ -58969,15 +58953,15 @@ _sk_parametric_a_sse2:
.byte 15,198,237,0 // shufps $0x0,%xmm5,%xmm5
.byte 15,88,245 // addps %xmm5,%xmm6
.byte 15,91,238 // cvtdq2ps %xmm6,%xmm5
- .byte 15,89,170,18,150,0,0 // mulps 0x9612(%edx),%xmm5
- .byte 15,84,178,34,150,0,0 // andps 0x9622(%edx),%xmm6
- .byte 15,86,178,130,147,0,0 // orps 0x9382(%edx),%xmm6
- .byte 15,88,170,50,150,0,0 // addps 0x9632(%edx),%xmm5
- .byte 15,40,186,66,150,0,0 // movaps 0x9642(%edx),%xmm7
+ .byte 15,89,170,242,149,0,0 // mulps 0x95f2(%edx),%xmm5
+ .byte 15,84,178,2,150,0,0 // andps 0x9602(%edx),%xmm6
+ .byte 15,86,178,98,147,0,0 // orps 0x9362(%edx),%xmm6
+ .byte 15,88,170,18,150,0,0 // addps 0x9612(%edx),%xmm5
+ .byte 15,40,186,34,150,0,0 // movaps 0x9622(%edx),%xmm7
.byte 15,89,254 // mulps %xmm6,%xmm7
.byte 15,92,239 // subps %xmm7,%xmm5
- .byte 15,88,178,82,150,0,0 // addps 0x9652(%edx),%xmm6
- .byte 15,40,186,98,150,0,0 // movaps 0x9662(%edx),%xmm7
+ .byte 15,88,178,50,150,0,0 // addps 0x9632(%edx),%xmm6
+ .byte 15,40,186,66,150,0,0 // movaps 0x9642(%edx),%xmm7
.byte 15,94,254 // divps %xmm6,%xmm7
.byte 243,15,16,49 // movss (%ecx),%xmm6
.byte 15,198,246,0 // shufps $0x0,%xmm6,%xmm6
@@ -58987,21 +58971,21 @@ _sk_parametric_a_sse2:
.byte 15,91,254 // cvtdq2ps %xmm6,%xmm7
.byte 15,40,197 // movaps %xmm5,%xmm0
.byte 15,194,199,1 // cmpltps %xmm7,%xmm0
- .byte 15,40,178,146,147,0,0 // movaps 0x9392(%edx),%xmm6
+ .byte 15,40,178,114,147,0,0 // movaps 0x9372(%edx),%xmm6
.byte 15,84,198 // andps %xmm6,%xmm0
.byte 15,92,248 // subps %xmm0,%xmm7
.byte 15,40,197 // movaps %xmm5,%xmm0
.byte 15,92,199 // subps %xmm7,%xmm0
- .byte 15,88,170,114,150,0,0 // addps 0x9672(%edx),%xmm5
- .byte 15,40,186,130,150,0,0 // movaps 0x9682(%edx),%xmm7
+ .byte 15,88,170,82,150,0,0 // addps 0x9652(%edx),%xmm5
+ .byte 15,40,186,98,150,0,0 // movaps 0x9662(%edx),%xmm7
.byte 15,89,248 // mulps %xmm0,%xmm7
.byte 15,92,239 // subps %xmm7,%xmm5
- .byte 15,40,186,146,150,0,0 // movaps 0x9692(%edx),%xmm7
+ .byte 15,40,186,114,150,0,0 // movaps 0x9672(%edx),%xmm7
.byte 15,92,248 // subps %xmm0,%xmm7
- .byte 15,40,130,162,150,0,0 // movaps 0x96a2(%edx),%xmm0
+ .byte 15,40,130,130,150,0,0 // movaps 0x9682(%edx),%xmm0
.byte 15,94,199 // divps %xmm7,%xmm0
.byte 15,88,197 // addps %xmm5,%xmm0
- .byte 15,89,130,178,150,0,0 // mulps 0x96b2(%edx),%xmm0
+ .byte 15,89,130,146,150,0,0 // mulps 0x9692(%edx),%xmm0
.byte 102,15,91,192 // cvtps2dq %xmm0,%xmm0
.byte 243,15,16,105,20 // movss 0x14(%ecx),%xmm5
.byte 15,198,237,0 // shufps $0x0,%xmm5,%xmm5
@@ -59036,15 +59020,15 @@ _sk_gamma_sse2:
.byte 232,0,0,0,0 // call 3a7f <_sk_gamma_sse2+0x12>
.byte 88 // pop %eax
.byte 15,91,195 // cvtdq2ps %xmm3,%xmm0
- .byte 15,89,128,225,148,0,0 // mulps 0x94e1(%eax),%xmm0
- .byte 15,84,152,241,148,0,0 // andps 0x94f1(%eax),%xmm3
- .byte 15,86,152,81,146,0,0 // orps 0x9251(%eax),%xmm3
- .byte 15,88,128,1,149,0,0 // addps 0x9501(%eax),%xmm0
+ .byte 15,89,128,193,148,0,0 // mulps 0x94c1(%eax),%xmm0
+ .byte 15,84,152,209,148,0,0 // andps 0x94d1(%eax),%xmm3
+ .byte 15,86,152,49,146,0,0 // orps 0x9231(%eax),%xmm3
+ .byte 15,88,128,225,148,0,0 // addps 0x94e1(%eax),%xmm0
.byte 15,40,227 // movaps %xmm3,%xmm4
- .byte 15,89,160,17,149,0,0 // mulps 0x9511(%eax),%xmm4
+ .byte 15,89,160,241,148,0,0 // mulps 0x94f1(%eax),%xmm4
.byte 15,92,196 // subps %xmm4,%xmm0
- .byte 15,88,152,33,149,0,0 // addps 0x9521(%eax),%xmm3
- .byte 15,40,160,49,149,0,0 // movaps 0x9531(%eax),%xmm4
+ .byte 15,88,152,1,149,0,0 // addps 0x9501(%eax),%xmm3
+ .byte 15,40,160,17,149,0,0 // movaps 0x9511(%eax),%xmm4
.byte 15,94,227 // divps %xmm3,%xmm4
.byte 15,92,196 // subps %xmm4,%xmm0
.byte 139,77,12 // mov 0xc(%ebp),%ecx
@@ -59057,30 +59041,30 @@ _sk_gamma_sse2:
.byte 15,91,219 // cvtdq2ps %xmm3,%xmm3
.byte 15,40,224 // movaps %xmm0,%xmm4
.byte 15,194,227,1 // cmpltps %xmm3,%xmm4
- .byte 15,84,160,97,146,0,0 // andps 0x9261(%eax),%xmm4
+ .byte 15,84,160,65,146,0,0 // andps 0x9241(%eax),%xmm4
.byte 15,92,220 // subps %xmm4,%xmm3
.byte 15,40,224 // movaps %xmm0,%xmm4
.byte 15,92,227 // subps %xmm3,%xmm4
- .byte 15,88,128,65,149,0,0 // addps 0x9541(%eax),%xmm0
- .byte 15,40,176,97,149,0,0 // movaps 0x9561(%eax),%xmm6
+ .byte 15,88,128,33,149,0,0 // addps 0x9521(%eax),%xmm0
+ .byte 15,40,176,65,149,0,0 // movaps 0x9541(%eax),%xmm6
.byte 15,92,244 // subps %xmm4,%xmm6
- .byte 15,40,168,81,149,0,0 // movaps 0x9551(%eax),%xmm5
+ .byte 15,40,168,49,149,0,0 // movaps 0x9531(%eax),%xmm5
.byte 15,89,229 // mulps %xmm5,%xmm4
.byte 15,92,196 // subps %xmm4,%xmm0
- .byte 15,40,152,113,149,0,0 // movaps 0x9571(%eax),%xmm3
+ .byte 15,40,152,81,149,0,0 // movaps 0x9551(%eax),%xmm3
.byte 15,40,227 // movaps %xmm3,%xmm4
.byte 15,94,230 // divps %xmm6,%xmm4
.byte 15,88,224 // addps %xmm0,%xmm4
.byte 15,91,193 // cvtdq2ps %xmm1,%xmm0
- .byte 15,89,128,225,148,0,0 // mulps 0x94e1(%eax),%xmm0
- .byte 15,84,136,241,148,0,0 // andps 0x94f1(%eax),%xmm1
- .byte 15,86,136,81,146,0,0 // orps 0x9251(%eax),%xmm1
- .byte 15,88,128,1,149,0,0 // addps 0x9501(%eax),%xmm0
+ .byte 15,89,128,193,148,0,0 // mulps 0x94c1(%eax),%xmm0
+ .byte 15,84,136,209,148,0,0 // andps 0x94d1(%eax),%xmm1
+ .byte 15,86,136,49,146,0,0 // orps 0x9231(%eax),%xmm1
+ .byte 15,88,128,225,148,0,0 // addps 0x94e1(%eax),%xmm0
.byte 15,40,241 // movaps %xmm1,%xmm6
- .byte 15,89,176,17,149,0,0 // mulps 0x9511(%eax),%xmm6
+ .byte 15,89,176,241,148,0,0 // mulps 0x94f1(%eax),%xmm6
.byte 15,92,198 // subps %xmm6,%xmm0
- .byte 15,88,136,33,149,0,0 // addps 0x9521(%eax),%xmm1
- .byte 15,40,176,49,149,0,0 // movaps 0x9531(%eax),%xmm6
+ .byte 15,88,136,1,149,0,0 // addps 0x9501(%eax),%xmm1
+ .byte 15,40,176,17,149,0,0 // movaps 0x9511(%eax),%xmm6
.byte 15,94,241 // divps %xmm1,%xmm6
.byte 15,92,198 // subps %xmm6,%xmm0
.byte 15,89,199 // mulps %xmm7,%xmm0
@@ -59088,12 +59072,12 @@ _sk_gamma_sse2:
.byte 15,91,201 // cvtdq2ps %xmm1,%xmm1
.byte 15,40,240 // movaps %xmm0,%xmm6
.byte 15,194,241,1 // cmpltps %xmm1,%xmm6
- .byte 15,84,176,97,146,0,0 // andps 0x9261(%eax),%xmm6
+ .byte 15,84,176,65,146,0,0 // andps 0x9241(%eax),%xmm6
.byte 15,92,206 // subps %xmm6,%xmm1
.byte 15,40,240 // movaps %xmm0,%xmm6
.byte 15,92,241 // subps %xmm1,%xmm6
- .byte 15,88,128,65,149,0,0 // addps 0x9541(%eax),%xmm0
- .byte 15,40,184,97,149,0,0 // movaps 0x9561(%eax),%xmm7
+ .byte 15,88,128,33,149,0,0 // addps 0x9521(%eax),%xmm0
+ .byte 15,40,184,65,149,0,0 // movaps 0x9541(%eax),%xmm7
.byte 15,92,254 // subps %xmm6,%xmm7
.byte 15,89,245 // mulps %xmm5,%xmm6
.byte 15,92,198 // subps %xmm6,%xmm0
@@ -59101,15 +59085,15 @@ _sk_gamma_sse2:
.byte 15,94,207 // divps %xmm7,%xmm1
.byte 15,88,200 // addps %xmm0,%xmm1
.byte 15,91,194 // cvtdq2ps %xmm2,%xmm0
- .byte 15,89,128,225,148,0,0 // mulps 0x94e1(%eax),%xmm0
- .byte 15,84,144,241,148,0,0 // andps 0x94f1(%eax),%xmm2
- .byte 15,86,144,81,146,0,0 // orps 0x9251(%eax),%xmm2
- .byte 15,88,128,1,149,0,0 // addps 0x9501(%eax),%xmm0
- .byte 15,40,176,17,149,0,0 // movaps 0x9511(%eax),%xmm6
+ .byte 15,89,128,193,148,0,0 // mulps 0x94c1(%eax),%xmm0
+ .byte 15,84,144,209,148,0,0 // andps 0x94d1(%eax),%xmm2
+ .byte 15,86,144,49,146,0,0 // orps 0x9231(%eax),%xmm2
+ .byte 15,88,128,225,148,0,0 // addps 0x94e1(%eax),%xmm0
+ .byte 15,40,176,241,148,0,0 // movaps 0x94f1(%eax),%xmm6
.byte 15,89,242 // mulps %xmm2,%xmm6
.byte 15,92,198 // subps %xmm6,%xmm0
- .byte 15,88,144,33,149,0,0 // addps 0x9521(%eax),%xmm2
- .byte 15,40,176,49,149,0,0 // movaps 0x9531(%eax),%xmm6
+ .byte 15,88,144,1,149,0,0 // addps 0x9501(%eax),%xmm2
+ .byte 15,40,176,17,149,0,0 // movaps 0x9511(%eax),%xmm6
.byte 15,94,242 // divps %xmm2,%xmm6
.byte 15,92,198 // subps %xmm6,%xmm0
.byte 15,89,69,232 // mulps -0x18(%ebp),%xmm0
@@ -59117,18 +59101,18 @@ _sk_gamma_sse2:
.byte 15,91,210 // cvtdq2ps %xmm2,%xmm2
.byte 15,40,240 // movaps %xmm0,%xmm6
.byte 15,194,242,1 // cmpltps %xmm2,%xmm6
- .byte 15,84,176,97,146,0,0 // andps 0x9261(%eax),%xmm6
+ .byte 15,84,176,65,146,0,0 // andps 0x9241(%eax),%xmm6
.byte 15,92,214 // subps %xmm6,%xmm2
.byte 15,40,240 // movaps %xmm0,%xmm6
.byte 15,92,242 // subps %xmm2,%xmm6
- .byte 15,88,128,65,149,0,0 // addps 0x9541(%eax),%xmm0
+ .byte 15,88,128,33,149,0,0 // addps 0x9521(%eax),%xmm0
.byte 15,89,238 // mulps %xmm6,%xmm5
.byte 15,92,197 // subps %xmm5,%xmm0
- .byte 15,40,144,97,149,0,0 // movaps 0x9561(%eax),%xmm2
+ .byte 15,40,144,65,149,0,0 // movaps 0x9541(%eax),%xmm2
.byte 15,92,214 // subps %xmm6,%xmm2
.byte 15,94,218 // divps %xmm2,%xmm3
.byte 15,88,216 // addps %xmm0,%xmm3
- .byte 15,40,128,129,149,0,0 // movaps 0x9581(%eax),%xmm0
+ .byte 15,40,128,97,149,0,0 // movaps 0x9561(%eax),%xmm0
.byte 15,89,224 // mulps %xmm0,%xmm4
.byte 15,89,200 // mulps %xmm0,%xmm1
.byte 15,89,216 // mulps %xmm0,%xmm3
@@ -59157,29 +59141,29 @@ _sk_lab_to_xyz_sse2:
.byte 15,40,208 // movaps %xmm0,%xmm2
.byte 232,0,0,0,0 // call 3c67 <_sk_lab_to_xyz_sse2+0x15>
.byte 88 // pop %eax
- .byte 15,89,144,169,147,0,0 // mulps 0x93a9(%eax),%xmm2
- .byte 15,40,160,73,145,0,0 // movaps 0x9149(%eax),%xmm4
+ .byte 15,89,144,137,147,0,0 // mulps 0x9389(%eax),%xmm2
+ .byte 15,40,160,41,145,0,0 // movaps 0x9129(%eax),%xmm4
.byte 15,89,204 // mulps %xmm4,%xmm1
- .byte 15,40,168,185,147,0,0 // movaps 0x93b9(%eax),%xmm5
+ .byte 15,40,168,153,147,0,0 // movaps 0x9399(%eax),%xmm5
.byte 15,88,205 // addps %xmm5,%xmm1
.byte 15,89,220 // mulps %xmm4,%xmm3
.byte 15,88,221 // addps %xmm5,%xmm3
- .byte 15,88,144,201,147,0,0 // addps 0x93c9(%eax),%xmm2
- .byte 15,89,144,217,147,0,0 // mulps 0x93d9(%eax),%xmm2
- .byte 15,89,136,233,147,0,0 // mulps 0x93e9(%eax),%xmm1
+ .byte 15,88,144,169,147,0,0 // addps 0x93a9(%eax),%xmm2
+ .byte 15,89,144,185,147,0,0 // mulps 0x93b9(%eax),%xmm2
+ .byte 15,89,136,201,147,0,0 // mulps 0x93c9(%eax),%xmm1
.byte 15,88,202 // addps %xmm2,%xmm1
- .byte 15,89,152,249,147,0,0 // mulps 0x93f9(%eax),%xmm3
+ .byte 15,89,152,217,147,0,0 // mulps 0x93d9(%eax),%xmm3
.byte 15,40,234 // movaps %xmm2,%xmm5
.byte 15,92,235 // subps %xmm3,%xmm5
.byte 15,40,193 // movaps %xmm1,%xmm0
.byte 15,89,192 // mulps %xmm0,%xmm0
.byte 15,89,193 // mulps %xmm1,%xmm0
- .byte 15,40,152,9,148,0,0 // movaps 0x9409(%eax),%xmm3
+ .byte 15,40,152,233,147,0,0 // movaps 0x93e9(%eax),%xmm3
.byte 15,40,227 // movaps %xmm3,%xmm4
.byte 15,194,224,1 // cmpltps %xmm0,%xmm4
- .byte 15,40,176,25,148,0,0 // movaps 0x9419(%eax),%xmm6
+ .byte 15,40,176,249,147,0,0 // movaps 0x93f9(%eax),%xmm6
.byte 15,88,206 // addps %xmm6,%xmm1
- .byte 15,40,184,41,148,0,0 // movaps 0x9429(%eax),%xmm7
+ .byte 15,40,184,9,148,0,0 // movaps 0x9409(%eax),%xmm7
.byte 15,89,207 // mulps %xmm7,%xmm1
.byte 15,84,196 // andps %xmm4,%xmm0
.byte 15,85,225 // andnps %xmm1,%xmm4
@@ -59204,8 +59188,8 @@ _sk_lab_to_xyz_sse2:
.byte 15,85,221 // andnps %xmm5,%xmm3
.byte 15,86,216 // orps %xmm0,%xmm3
.byte 139,77,12 // mov 0xc(%ebp),%ecx
- .byte 15,89,160,57,148,0,0 // mulps 0x9439(%eax),%xmm4
- .byte 15,89,152,73,148,0,0 // mulps 0x9449(%eax),%xmm3
+ .byte 15,89,160,25,148,0,0 // mulps 0x9419(%eax),%xmm4
+ .byte 15,89,152,41,148,0,0 // mulps 0x9429(%eax),%xmm3
.byte 141,65,4 // lea 0x4(%ecx),%eax
.byte 131,236,8 // sub $0x8,%esp
.byte 15,40,196 // movaps %xmm4,%xmm0
@@ -59243,9 +59227,9 @@ _sk_load_a8_sse2:
.byte 102,15,110,4,62 // movd (%esi,%edi,1),%xmm0
.byte 102,15,96,192 // punpcklbw %xmm0,%xmm0
.byte 102,15,97,192 // punpcklwd %xmm0,%xmm0
- .byte 102,15,219,130,73,144,0,0 // pand 0x9049(%edx),%xmm0
+ .byte 102,15,219,130,41,144,0,0 // pand 0x9029(%edx),%xmm0
.byte 15,91,216 // cvtdq2ps %xmm0,%xmm3
- .byte 15,89,154,121,145,0,0 // mulps 0x9179(%edx),%xmm3
+ .byte 15,89,154,89,145,0,0 // mulps 0x9159(%edx),%xmm3
.byte 141,80,8 // lea 0x8(%eax),%edx
.byte 131,236,8 // sub $0x8,%esp
.byte 15,87,192 // xorps %xmm0,%xmm0
@@ -59293,8 +59277,8 @@ _sk_load_a8_dst_sse2:
.byte 131,236,12 // sub $0xc,%esp
.byte 139,69,12 // mov 0xc(%ebp),%eax
.byte 139,77,8 // mov 0x8(%ebp),%ecx
- .byte 139,49 // mov (%ecx),%esi
.byte 139,16 // mov (%eax),%edx
+ .byte 139,49 // mov (%ecx),%esi
.byte 139,122,4 // mov 0x4(%edx),%edi
.byte 15,175,121,4 // imul 0x4(%ecx),%edi
.byte 3,58 // add (%edx),%edi
@@ -59310,9 +59294,9 @@ _sk_load_a8_dst_sse2:
.byte 102,15,110,36,55 // movd (%edi,%esi,1),%xmm4
.byte 102,15,96,224 // punpcklbw %xmm0,%xmm4
.byte 102,15,97,224 // punpcklwd %xmm0,%xmm4
- .byte 102,15,219,162,117,143,0,0 // pand 0x8f75(%edx),%xmm4
+ .byte 102,15,219,162,85,143,0,0 // pand 0x8f55(%edx),%xmm4
.byte 15,91,228 // cvtdq2ps %xmm4,%xmm4
- .byte 15,89,162,165,144,0,0 // mulps 0x90a5(%edx),%xmm4
+ .byte 15,89,162,133,144,0,0 // mulps 0x9085(%edx),%xmm4
.byte 15,41,97,64 // movaps %xmm4,0x40(%ecx)
.byte 141,80,8 // lea 0x8(%eax),%edx
.byte 131,236,8 // sub $0x8,%esp
@@ -59403,7 +59387,7 @@ _sk_gather_a8_sse2:
.byte 102,15,96,193 // punpcklbw %xmm1,%xmm0
.byte 102,15,97,193 // punpcklwd %xmm1,%xmm0
.byte 15,91,216 // cvtdq2ps %xmm0,%xmm3
- .byte 15,89,153,120,143,0,0 // mulps 0x8f78(%ecx),%xmm3
+ .byte 15,89,153,88,143,0,0 // mulps 0x8f58(%ecx),%xmm3
.byte 141,72,8 // lea 0x8(%eax),%ecx
.byte 131,236,8 // sub $0x8,%esp
.byte 15,87,192 // xorps %xmm0,%xmm0
@@ -59437,7 +59421,7 @@ _sk_store_a8_sse2:
.byte 15,175,81,4 // imul 0x4(%ecx),%edx
.byte 3,23 // add (%edi),%edx
.byte 139,89,8 // mov 0x8(%ecx),%ebx
- .byte 15,40,166,20,142,0,0 // movaps 0x8e14(%esi),%xmm4
+ .byte 15,40,166,244,141,0,0 // movaps 0x8df4(%esi),%xmm4
.byte 15,89,227 // mulps %xmm3,%xmm4
.byte 102,15,91,228 // cvtps2dq %xmm4,%xmm4
.byte 102,15,114,244,16 // pslld $0x10,%xmm4
@@ -59472,7 +59456,7 @@ _sk_store_a8_sse2:
.byte 102,15,197,220,4 // pextrw $0x4,%xmm4,%ebx
.byte 136,92,58,2 // mov %bl,0x2(%edx,%edi,1)
.byte 102,15,112,228,212 // pshufd $0xd4,%xmm4,%xmm4
- .byte 102,15,219,166,36,145,0,0 // pand 0x9124(%esi),%xmm4
+ .byte 102,15,219,166,4,145,0,0 // pand 0x9104(%esi),%xmm4
.byte 102,15,103,228 // packuswb %xmm4,%xmm4
.byte 102,15,103,228 // packuswb %xmm4,%xmm4
.byte 102,15,103,228 // packuswb %xmm4,%xmm4
@@ -59508,12 +59492,12 @@ _sk_load_g8_sse2:
.byte 102,15,110,4,62 // movd (%esi,%edi,1),%xmm0
.byte 102,15,96,192 // punpcklbw %xmm0,%xmm0
.byte 102,15,97,192 // punpcklwd %xmm0,%xmm0
- .byte 102,15,219,130,82,141,0,0 // pand 0x8d52(%edx),%xmm0
+ .byte 102,15,219,130,50,141,0,0 // pand 0x8d32(%edx),%xmm0
.byte 15,91,192 // cvtdq2ps %xmm0,%xmm0
- .byte 15,89,130,130,142,0,0 // mulps 0x8e82(%edx),%xmm0
+ .byte 15,89,130,98,142,0,0 // mulps 0x8e62(%edx),%xmm0
.byte 141,112,8 // lea 0x8(%eax),%esi
.byte 131,236,8 // sub $0x8,%esp
- .byte 15,40,154,146,140,0,0 // movaps 0x8c92(%edx),%xmm3
+ .byte 15,40,154,114,140,0,0 // movaps 0x8c72(%edx),%xmm3
.byte 15,40,200 // movaps %xmm0,%xmm1
.byte 15,40,208 // movaps %xmm0,%xmm2
.byte 86 // push %esi
@@ -59571,13 +59555,13 @@ _sk_load_g8_dst_sse2:
.byte 102,15,110,36,62 // movd (%esi,%edi,1),%xmm4
.byte 102,15,96,224 // punpcklbw %xmm0,%xmm4
.byte 102,15,97,224 // punpcklwd %xmm0,%xmm4
- .byte 102,15,219,162,166,140,0,0 // pand 0x8ca6(%edx),%xmm4
+ .byte 102,15,219,162,134,140,0,0 // pand 0x8c86(%edx),%xmm4
.byte 15,91,228 // cvtdq2ps %xmm4,%xmm4
- .byte 15,89,162,214,141,0,0 // mulps 0x8dd6(%edx),%xmm4
+ .byte 15,89,162,182,141,0,0 // mulps 0x8db6(%edx),%xmm4
.byte 15,41,97,48 // movaps %xmm4,0x30(%ecx)
.byte 15,41,97,32 // movaps %xmm4,0x20(%ecx)
.byte 15,41,97,16 // movaps %xmm4,0x10(%ecx)
- .byte 15,40,162,230,139,0,0 // movaps 0x8be6(%edx),%xmm4
+ .byte 15,40,162,198,139,0,0 // movaps 0x8bc6(%edx),%xmm4
.byte 15,41,97,64 // movaps %xmm4,0x40(%ecx)
.byte 141,80,8 // lea 0x8(%eax),%edx
.byte 131,236,8 // sub $0x8,%esp
@@ -59669,10 +59653,10 @@ _sk_gather_g8_sse2:
.byte 102,15,96,193 // punpcklbw %xmm1,%xmm0
.byte 102,15,97,193 // punpcklwd %xmm1,%xmm0
.byte 15,91,192 // cvtdq2ps %xmm0,%xmm0
- .byte 15,89,129,127,140,0,0 // mulps 0x8c7f(%ecx),%xmm0
+ .byte 15,89,129,95,140,0,0 // mulps 0x8c5f(%ecx),%xmm0
.byte 141,80,8 // lea 0x8(%eax),%edx
.byte 131,236,8 // sub $0x8,%esp
- .byte 15,40,153,143,138,0,0 // movaps 0x8a8f(%ecx),%xmm3
+ .byte 15,40,153,111,138,0,0 // movaps 0x8a6f(%ecx),%xmm3
.byte 15,40,200 // movaps %xmm0,%xmm1
.byte 15,40,208 // movaps %xmm0,%xmm2
.byte 82 // push %edx
@@ -59709,20 +59693,20 @@ _sk_load_565_sse2:
.byte 117,97 // jne 431a <_sk_load_565_sse2+0x8c>
.byte 243,15,126,20,126 // movq (%esi,%edi,2),%xmm2
.byte 102,15,97,208 // punpcklwd %xmm0,%xmm2
- .byte 102,15,111,130,68,140,0,0 // movdqa 0x8c44(%edx),%xmm0
+ .byte 102,15,111,130,36,140,0,0 // movdqa 0x8c24(%edx),%xmm0
.byte 102,15,219,194 // pand %xmm2,%xmm0
.byte 15,91,192 // cvtdq2ps %xmm0,%xmm0
- .byte 15,89,130,84,140,0,0 // mulps 0x8c54(%edx),%xmm0
- .byte 102,15,111,138,100,140,0,0 // movdqa 0x8c64(%edx),%xmm1
+ .byte 15,89,130,52,140,0,0 // mulps 0x8c34(%edx),%xmm0
+ .byte 102,15,111,138,68,140,0,0 // movdqa 0x8c44(%edx),%xmm1
.byte 102,15,219,202 // pand %xmm2,%xmm1
.byte 15,91,201 // cvtdq2ps %xmm1,%xmm1
- .byte 15,89,138,116,140,0,0 // mulps 0x8c74(%edx),%xmm1
- .byte 102,15,219,146,132,140,0,0 // pand 0x8c84(%edx),%xmm2
+ .byte 15,89,138,84,140,0,0 // mulps 0x8c54(%edx),%xmm1
+ .byte 102,15,219,146,100,140,0,0 // pand 0x8c64(%edx),%xmm2
.byte 15,91,210 // cvtdq2ps %xmm2,%xmm2
- .byte 15,89,146,148,140,0,0 // mulps 0x8c94(%edx),%xmm2
+ .byte 15,89,146,116,140,0,0 // mulps 0x8c74(%edx),%xmm2
.byte 141,112,8 // lea 0x8(%eax),%esi
.byte 131,236,8 // sub $0x8,%esp
- .byte 15,40,154,68,138,0,0 // movaps 0x8a44(%edx),%xmm3
+ .byte 15,40,154,36,138,0,0 // movaps 0x8a24(%edx),%xmm3
.byte 86 // push %esi
.byte 81 // push %ecx
.byte 255,80,4 // call *0x4(%eax)
@@ -59776,21 +59760,21 @@ _sk_load_565_dst_sse2:
.byte 117,113 // jne 43fa <_sk_load_565_dst_sse2+0x9c>
.byte 243,15,126,36,126 // movq (%esi,%edi,2),%xmm4
.byte 102,15,97,224 // punpcklwd %xmm0,%xmm4
- .byte 102,15,111,170,116,139,0,0 // movdqa 0x8b74(%edx),%xmm5
+ .byte 102,15,111,170,84,139,0,0 // movdqa 0x8b54(%edx),%xmm5
.byte 102,15,219,236 // pand %xmm4,%xmm5
.byte 15,91,237 // cvtdq2ps %xmm5,%xmm5
- .byte 15,89,170,132,139,0,0 // mulps 0x8b84(%edx),%xmm5
+ .byte 15,89,170,100,139,0,0 // mulps 0x8b64(%edx),%xmm5
.byte 15,41,105,16 // movaps %xmm5,0x10(%ecx)
- .byte 102,15,111,170,148,139,0,0 // movdqa 0x8b94(%edx),%xmm5
+ .byte 102,15,111,170,116,139,0,0 // movdqa 0x8b74(%edx),%xmm5
.byte 102,15,219,236 // pand %xmm4,%xmm5
.byte 15,91,237 // cvtdq2ps %xmm5,%xmm5
- .byte 15,89,170,164,139,0,0 // mulps 0x8ba4(%edx),%xmm5
+ .byte 15,89,170,132,139,0,0 // mulps 0x8b84(%edx),%xmm5
.byte 15,41,105,32 // movaps %xmm5,0x20(%ecx)
- .byte 102,15,219,162,180,139,0,0 // pand 0x8bb4(%edx),%xmm4
+ .byte 102,15,219,162,148,139,0,0 // pand 0x8b94(%edx),%xmm4
.byte 15,91,228 // cvtdq2ps %xmm4,%xmm4
- .byte 15,89,162,196,139,0,0 // mulps 0x8bc4(%edx),%xmm4
+ .byte 15,89,162,164,139,0,0 // mulps 0x8ba4(%edx),%xmm4
.byte 15,41,97,48 // movaps %xmm4,0x30(%ecx)
- .byte 15,40,162,116,137,0,0 // movaps 0x8974(%edx),%xmm4
+ .byte 15,40,162,84,137,0,0 // movaps 0x8954(%edx),%xmm4
.byte 15,41,97,64 // movaps %xmm4,0x40(%ecx)
.byte 141,80,8 // lea 0x8(%eax),%edx
.byte 131,236,8 // sub $0x8,%esp
@@ -59875,20 +59859,20 @@ _sk_gather_565_sse2:
.byte 102,15,239,192 // pxor %xmm0,%xmm0
.byte 102,15,196,209,3 // pinsrw $0x3,%ecx,%xmm2
.byte 102,15,97,208 // punpcklwd %xmm0,%xmm2
- .byte 102,15,111,130,242,137,0,0 // movdqa 0x89f2(%edx),%xmm0
+ .byte 102,15,111,130,210,137,0,0 // movdqa 0x89d2(%edx),%xmm0
.byte 102,15,219,194 // pand %xmm2,%xmm0
.byte 15,91,192 // cvtdq2ps %xmm0,%xmm0
- .byte 15,89,130,2,138,0,0 // mulps 0x8a02(%edx),%xmm0
- .byte 102,15,111,138,18,138,0,0 // movdqa 0x8a12(%edx),%xmm1
+ .byte 15,89,130,226,137,0,0 // mulps 0x89e2(%edx),%xmm0
+ .byte 102,15,111,138,242,137,0,0 // movdqa 0x89f2(%edx),%xmm1
.byte 102,15,219,202 // pand %xmm2,%xmm1
.byte 15,91,201 // cvtdq2ps %xmm1,%xmm1
- .byte 15,89,138,34,138,0,0 // mulps 0x8a22(%edx),%xmm1
- .byte 102,15,219,146,50,138,0,0 // pand 0x8a32(%edx),%xmm2
+ .byte 15,89,138,2,138,0,0 // mulps 0x8a02(%edx),%xmm1
+ .byte 102,15,219,146,18,138,0,0 // pand 0x8a12(%edx),%xmm2
.byte 15,91,210 // cvtdq2ps %xmm2,%xmm2
- .byte 15,89,146,66,138,0,0 // mulps 0x8a42(%edx),%xmm2
+ .byte 15,89,146,34,138,0,0 // mulps 0x8a22(%edx),%xmm2
.byte 141,72,8 // lea 0x8(%eax),%ecx
.byte 131,236,8 // sub $0x8,%esp
- .byte 15,40,154,242,135,0,0 // movaps 0x87f2(%edx),%xmm3
+ .byte 15,40,154,210,135,0,0 // movaps 0x87d2(%edx),%xmm3
.byte 81 // push %ecx
.byte 255,117,8 // pushl 0x8(%ebp)
.byte 255,80,4 // call *0x4(%eax)
@@ -59916,8 +59900,8 @@ _sk_store_565_sse2:
.byte 1,210 // add %edx,%edx
.byte 3,22 // add (%esi),%edx
.byte 139,49 // mov (%ecx),%esi
- .byte 15,40,167,111,139,0,0 // movaps 0x8b6f(%edi),%xmm4
- .byte 15,40,175,127,139,0,0 // movaps 0x8b7f(%edi),%xmm5
+ .byte 15,40,167,79,139,0,0 // movaps 0x8b4f(%edi),%xmm4
+ .byte 15,40,175,95,139,0,0 // movaps 0x8b5f(%edi),%xmm5
.byte 139,89,8 // mov 0x8(%ecx),%ebx
.byte 15,40,240 // movaps %xmm0,%xmm6
.byte 15,89,244 // mulps %xmm4,%xmm6
@@ -59997,21 +59981,21 @@ _sk_load_4444_sse2:
.byte 117,112 // jne 46d0 <_sk_load_4444_sse2+0x9b>
.byte 243,15,126,28,126 // movq (%esi,%edi,2),%xmm3
.byte 102,15,97,216 // punpcklwd %xmm0,%xmm3
- .byte 102,15,111,130,173,138,0,0 // movdqa 0x8aad(%edx),%xmm0
+ .byte 102,15,111,130,141,138,0,0 // movdqa 0x8a8d(%edx),%xmm0
.byte 102,15,219,195 // pand %xmm3,%xmm0
.byte 15,91,192 // cvtdq2ps %xmm0,%xmm0
- .byte 15,89,130,189,138,0,0 // mulps 0x8abd(%edx),%xmm0
- .byte 102,15,111,138,205,138,0,0 // movdqa 0x8acd(%edx),%xmm1
+ .byte 15,89,130,157,138,0,0 // mulps 0x8a9d(%edx),%xmm0
+ .byte 102,15,111,138,173,138,0,0 // movdqa 0x8aad(%edx),%xmm1
.byte 102,15,219,203 // pand %xmm3,%xmm1
.byte 15,91,201 // cvtdq2ps %xmm1,%xmm1
- .byte 15,89,138,221,138,0,0 // mulps 0x8add(%edx),%xmm1
- .byte 102,15,111,146,237,138,0,0 // movdqa 0x8aed(%edx),%xmm2
+ .byte 15,89,138,189,138,0,0 // mulps 0x8abd(%edx),%xmm1
+ .byte 102,15,111,146,205,138,0,0 // movdqa 0x8acd(%edx),%xmm2
.byte 102,15,219,211 // pand %xmm3,%xmm2
.byte 15,91,210 // cvtdq2ps %xmm2,%xmm2
- .byte 15,89,146,253,138,0,0 // mulps 0x8afd(%edx),%xmm2
- .byte 102,15,219,154,13,139,0,0 // pand 0x8b0d(%edx),%xmm3
+ .byte 15,89,146,221,138,0,0 // mulps 0x8add(%edx),%xmm2
+ .byte 102,15,219,154,237,138,0,0 // pand 0x8aed(%edx),%xmm3
.byte 15,91,219 // cvtdq2ps %xmm3,%xmm3
- .byte 15,89,154,29,139,0,0 // mulps 0x8b1d(%edx),%xmm3
+ .byte 15,89,154,253,138,0,0 // mulps 0x8afd(%edx),%xmm3
.byte 141,80,8 // lea 0x8(%eax),%edx
.byte 131,236,8 // sub $0x8,%esp
.byte 82 // push %edx
@@ -60067,24 +60051,24 @@ _sk_load_4444_dst_sse2:
.byte 15,133,128,0,0,0 // jne 47c3 <_sk_load_4444_dst_sse2+0xaf>
.byte 243,15,126,36,126 // movq (%esi,%edi,2),%xmm4
.byte 102,15,97,224 // punpcklwd %xmm0,%xmm4
- .byte 102,15,111,170,206,137,0,0 // movdqa 0x89ce(%edx),%xmm5
+ .byte 102,15,111,170,174,137,0,0 // movdqa 0x89ae(%edx),%xmm5
.byte 102,15,219,236 // pand %xmm4,%xmm5
.byte 15,91,237 // cvtdq2ps %xmm5,%xmm5
- .byte 15,89,170,222,137,0,0 // mulps 0x89de(%edx),%xmm5
+ .byte 15,89,170,190,137,0,0 // mulps 0x89be(%edx),%xmm5
.byte 15,41,105,16 // movaps %xmm5,0x10(%ecx)
- .byte 102,15,111,170,238,137,0,0 // movdqa 0x89ee(%edx),%xmm5
+ .byte 102,15,111,170,206,137,0,0 // movdqa 0x89ce(%edx),%xmm5
.byte 102,15,219,236 // pand %xmm4,%xmm5
.byte 15,91,237 // cvtdq2ps %xmm5,%xmm5
- .byte 15,89,170,254,137,0,0 // mulps 0x89fe(%edx),%xmm5
+ .byte 15,89,170,222,137,0,0 // mulps 0x89de(%edx),%xmm5
.byte 15,41,105,32 // movaps %xmm5,0x20(%ecx)
- .byte 102,15,111,170,14,138,0,0 // movdqa 0x8a0e(%edx),%xmm5
+ .byte 102,15,111,170,238,137,0,0 // movdqa 0x89ee(%edx),%xmm5
.byte 102,15,219,236 // pand %xmm4,%xmm5
.byte 15,91,237 // cvtdq2ps %xmm5,%xmm5
- .byte 15,89,170,30,138,0,0 // mulps 0x8a1e(%edx),%xmm5
+ .byte 15,89,170,254,137,0,0 // mulps 0x89fe(%edx),%xmm5
.byte 15,41,105,48 // movaps %xmm5,0x30(%ecx)
- .byte 102,15,219,162,46,138,0,0 // pand 0x8a2e(%edx),%xmm4
+ .byte 102,15,219,162,14,138,0,0 // pand 0x8a0e(%edx),%xmm4
.byte 15,91,228 // cvtdq2ps %xmm4,%xmm4
- .byte 15,89,162,62,138,0,0 // mulps 0x8a3e(%edx),%xmm4
+ .byte 15,89,162,30,138,0,0 // mulps 0x8a1e(%edx),%xmm4
.byte 15,41,97,64 // movaps %xmm4,0x40(%ecx)
.byte 141,80,8 // lea 0x8(%eax),%edx
.byte 131,236,8 // sub $0x8,%esp
@@ -60169,21 +60153,21 @@ _sk_gather_4444_sse2:
.byte 89 // pop %ecx
.byte 102,15,239,192 // pxor %xmm0,%xmm0
.byte 102,15,97,216 // punpcklwd %xmm0,%xmm3
- .byte 102,15,111,129,48,136,0,0 // movdqa 0x8830(%ecx),%xmm0
+ .byte 102,15,111,129,16,136,0,0 // movdqa 0x8810(%ecx),%xmm0
.byte 102,15,219,195 // pand %xmm3,%xmm0
.byte 15,91,192 // cvtdq2ps %xmm0,%xmm0
- .byte 15,89,129,64,136,0,0 // mulps 0x8840(%ecx),%xmm0
- .byte 102,15,111,137,80,136,0,0 // movdqa 0x8850(%ecx),%xmm1
+ .byte 15,89,129,32,136,0,0 // mulps 0x8820(%ecx),%xmm0
+ .byte 102,15,111,137,48,136,0,0 // movdqa 0x8830(%ecx),%xmm1
.byte 102,15,219,203 // pand %xmm3,%xmm1
.byte 15,91,201 // cvtdq2ps %xmm1,%xmm1
- .byte 15,89,137,96,136,0,0 // mulps 0x8860(%ecx),%xmm1
- .byte 102,15,111,145,112,136,0,0 // movdqa 0x8870(%ecx),%xmm2
+ .byte 15,89,137,64,136,0,0 // mulps 0x8840(%ecx),%xmm1
+ .byte 102,15,111,145,80,136,0,0 // movdqa 0x8850(%ecx),%xmm2
.byte 102,15,219,211 // pand %xmm3,%xmm2
.byte 15,91,210 // cvtdq2ps %xmm2,%xmm2
- .byte 15,89,145,128,136,0,0 // mulps 0x8880(%ecx),%xmm2
- .byte 102,15,219,153,144,136,0,0 // pand 0x8890(%ecx),%xmm3
+ .byte 15,89,145,96,136,0,0 // mulps 0x8860(%ecx),%xmm2
+ .byte 102,15,219,153,112,136,0,0 // pand 0x8870(%ecx),%xmm3
.byte 15,91,219 // cvtdq2ps %xmm3,%xmm3
- .byte 15,89,153,160,136,0,0 // mulps 0x88a0(%ecx),%xmm3
+ .byte 15,89,153,128,136,0,0 // mulps 0x8880(%ecx),%xmm3
.byte 141,72,8 // lea 0x8(%eax),%ecx
.byte 131,236,8 // sub $0x8,%esp
.byte 81 // push %ecx
@@ -60213,7 +60197,7 @@ _sk_store_4444_sse2:
.byte 1,210 // add %edx,%edx
.byte 3,22 // add (%esi),%edx
.byte 139,49 // mov (%ecx),%esi
- .byte 15,40,167,51,136,0,0 // movaps 0x8833(%edi),%xmm4
+ .byte 15,40,167,19,136,0,0 // movaps 0x8813(%edi),%xmm4
.byte 139,89,8 // mov 0x8(%ecx),%ebx
.byte 15,40,232 // movaps %xmm0,%xmm5
.byte 15,89,236 // mulps %xmm4,%xmm5
@@ -60298,11 +60282,11 @@ _sk_load_8888_sse2:
.byte 139,57 // mov (%ecx),%edi
.byte 117,102 // jne 4ab2 <_sk_load_8888_sse2+0x92>
.byte 243,15,111,28,190 // movdqu (%esi,%edi,4),%xmm3
- .byte 102,15,111,146,114,131,0,0 // movdqa 0x8372(%edx),%xmm2
+ .byte 102,15,111,146,82,131,0,0 // movdqa 0x8352(%edx),%xmm2
.byte 102,15,111,195 // movdqa %xmm3,%xmm0
.byte 102,15,219,194 // pand %xmm2,%xmm0
.byte 15,91,192 // cvtdq2ps %xmm0,%xmm0
- .byte 15,40,162,162,132,0,0 // movaps 0x84a2(%edx),%xmm4
+ .byte 15,40,162,130,132,0,0 // movaps 0x8482(%edx),%xmm4
.byte 15,89,196 // mulps %xmm4,%xmm0
.byte 102,15,111,203 // movdqa %xmm3,%xmm1
.byte 102,15,114,209,8 // psrld $0x8,%xmm1
@@ -60367,11 +60351,11 @@ _sk_load_8888_dst_sse2:
.byte 139,57 // mov (%ecx),%edi
.byte 117,118 // jne 4b89 <_sk_load_8888_dst_sse2+0xa2>
.byte 243,15,111,36,190 // movdqu (%esi,%edi,4),%xmm4
- .byte 102,15,111,170,171,130,0,0 // movdqa 0x82ab(%edx),%xmm5
+ .byte 102,15,111,170,139,130,0,0 // movdqa 0x828b(%edx),%xmm5
.byte 102,15,111,244 // movdqa %xmm4,%xmm6
.byte 102,15,219,245 // pand %xmm5,%xmm6
.byte 15,91,246 // cvtdq2ps %xmm6,%xmm6
- .byte 15,40,186,219,131,0,0 // movaps 0x83db(%edx),%xmm7
+ .byte 15,40,186,187,131,0,0 // movaps 0x83bb(%edx),%xmm7
.byte 15,89,247 // mulps %xmm7,%xmm6
.byte 15,41,113,16 // movaps %xmm6,0x10(%ecx)
.byte 102,15,111,244 // movdqa %xmm4,%xmm6
@@ -60466,11 +60450,11 @@ _sk_gather_8888_sse2:
.byte 102,15,98,194 // punpckldq %xmm2,%xmm0
.byte 102,15,98,217 // punpckldq %xmm1,%xmm3
.byte 102,15,108,216 // punpcklqdq %xmm0,%xmm3
- .byte 102,15,111,145,56,129,0,0 // movdqa 0x8138(%ecx),%xmm2
+ .byte 102,15,111,145,24,129,0,0 // movdqa 0x8118(%ecx),%xmm2
.byte 102,15,111,195 // movdqa %xmm3,%xmm0
.byte 102,15,219,194 // pand %xmm2,%xmm0
.byte 15,91,192 // cvtdq2ps %xmm0,%xmm0
- .byte 15,40,161,104,130,0,0 // movaps 0x8268(%ecx),%xmm4
+ .byte 15,40,161,72,130,0,0 // movaps 0x8248(%ecx),%xmm4
.byte 15,89,196 // mulps %xmm4,%xmm0
.byte 102,15,111,203 // movdqa %xmm3,%xmm1
.byte 102,15,114,209,8 // psrld $0x8,%xmm1
@@ -60514,7 +60498,7 @@ _sk_store_8888_sse2:
.byte 193,226,2 // shl $0x2,%edx
.byte 3,22 // add (%esi),%edx
.byte 139,49 // mov (%ecx),%esi
- .byte 15,40,167,205,128,0,0 // movaps 0x80cd(%edi),%xmm4
+ .byte 15,40,167,173,128,0,0 // movaps 0x80ad(%edi),%xmm4
.byte 139,89,8 // mov 0x8(%ecx),%ebx
.byte 15,40,232 // movaps %xmm0,%xmm5
.byte 15,89,236 // mulps %xmm4,%xmm5
@@ -60585,11 +60569,11 @@ _sk_load_bgra_sse2:
.byte 139,57 // mov (%ecx),%edi
.byte 117,102 // jne 4e1d <_sk_load_bgra_sse2+0x92>
.byte 243,15,111,28,190 // movdqu (%esi,%edi,4),%xmm3
- .byte 102,15,111,130,7,128,0,0 // movdqa 0x8007(%edx),%xmm0
+ .byte 102,15,111,130,231,127,0,0 // movdqa 0x7fe7(%edx),%xmm0
.byte 102,15,111,203 // movdqa %xmm3,%xmm1
.byte 102,15,219,200 // pand %xmm0,%xmm1
.byte 15,91,209 // cvtdq2ps %xmm1,%xmm2
- .byte 15,40,162,55,129,0,0 // movaps 0x8137(%edx),%xmm4
+ .byte 15,40,162,23,129,0,0 // movaps 0x8117(%edx),%xmm4
.byte 15,89,212 // mulps %xmm4,%xmm2
.byte 102,15,111,203 // movdqa %xmm3,%xmm1
.byte 102,15,114,209,8 // psrld $0x8,%xmm1
@@ -60654,11 +60638,11 @@ _sk_load_bgra_dst_sse2:
.byte 139,57 // mov (%ecx),%edi
.byte 117,118 // jne 4ef4 <_sk_load_bgra_dst_sse2+0xa2>
.byte 243,15,111,36,190 // movdqu (%esi,%edi,4),%xmm4
- .byte 102,15,111,170,64,127,0,0 // movdqa 0x7f40(%edx),%xmm5
+ .byte 102,15,111,170,32,127,0,0 // movdqa 0x7f20(%edx),%xmm5
.byte 102,15,111,244 // movdqa %xmm4,%xmm6
.byte 102,15,219,245 // pand %xmm5,%xmm6
.byte 15,91,246 // cvtdq2ps %xmm6,%xmm6
- .byte 15,40,186,112,128,0,0 // movaps 0x8070(%edx),%xmm7
+ .byte 15,40,186,80,128,0,0 // movaps 0x8050(%edx),%xmm7
.byte 15,89,247 // mulps %xmm7,%xmm6
.byte 15,41,113,48 // movaps %xmm6,0x30(%ecx)
.byte 102,15,111,244 // movdqa %xmm4,%xmm6
@@ -60753,11 +60737,11 @@ _sk_gather_bgra_sse2:
.byte 102,15,98,194 // punpckldq %xmm2,%xmm0
.byte 102,15,98,217 // punpckldq %xmm1,%xmm3
.byte 102,15,108,216 // punpcklqdq %xmm0,%xmm3
- .byte 102,15,111,129,205,125,0,0 // movdqa 0x7dcd(%ecx),%xmm0
+ .byte 102,15,111,129,173,125,0,0 // movdqa 0x7dad(%ecx),%xmm0
.byte 102,15,111,203 // movdqa %xmm3,%xmm1
.byte 102,15,219,200 // pand %xmm0,%xmm1
.byte 15,91,209 // cvtdq2ps %xmm1,%xmm2
- .byte 15,40,161,253,126,0,0 // movaps 0x7efd(%ecx),%xmm4
+ .byte 15,40,161,221,126,0,0 // movaps 0x7edd(%ecx),%xmm4
.byte 15,89,212 // mulps %xmm4,%xmm2
.byte 102,15,111,203 // movdqa %xmm3,%xmm1
.byte 102,15,114,209,8 // psrld $0x8,%xmm1
@@ -60801,7 +60785,7 @@ _sk_store_bgra_sse2:
.byte 193,226,2 // shl $0x2,%edx
.byte 3,22 // add (%esi),%edx
.byte 139,49 // mov (%ecx),%esi
- .byte 15,40,167,98,125,0,0 // movaps 0x7d62(%edi),%xmm4
+ .byte 15,40,167,66,125,0,0 // movaps 0x7d42(%edi),%xmm4
.byte 139,89,8 // mov 0x8(%ecx),%ebx
.byte 15,40,234 // movaps %xmm2,%xmm5
.byte 15,89,236 // mulps %xmm4,%xmm5
@@ -60900,11 +60884,11 @@ _sk_load_f16_sse2:
.byte 102,15,239,192 // pxor %xmm0,%xmm0
.byte 102,15,97,200 // punpcklwd %xmm0,%xmm1
.byte 102,15,239,210 // pxor %xmm2,%xmm2
- .byte 102,15,111,170,124,128,0,0 // movdqa 0x807c(%edx),%xmm5
+ .byte 102,15,111,170,92,128,0,0 // movdqa 0x805c(%edx),%xmm5
.byte 102,15,111,241 // movdqa %xmm1,%xmm6
.byte 102,15,219,245 // pand %xmm5,%xmm6
- .byte 102,15,219,138,140,128,0,0 // pand 0x808c(%edx),%xmm1
- .byte 102,15,111,130,156,128,0,0 // movdqa 0x809c(%edx),%xmm0
+ .byte 102,15,219,138,108,128,0,0 // pand 0x806c(%edx),%xmm1
+ .byte 102,15,111,130,124,128,0,0 // movdqa 0x807c(%edx),%xmm0
.byte 102,15,127,69,184 // movdqa %xmm0,-0x48(%ebp)
.byte 102,15,114,246,16 // pslld $0x10,%xmm6
.byte 102,15,111,216 // movdqa %xmm0,%xmm3
@@ -60916,7 +60900,7 @@ _sk_load_f16_sse2:
.byte 102,15,239,255 // pxor %xmm7,%xmm7
.byte 102,15,111,212 // movdqa %xmm4,%xmm2
.byte 102,15,219,213 // pand %xmm5,%xmm2
- .byte 102,15,111,154,140,128,0,0 // movdqa 0x808c(%edx),%xmm3
+ .byte 102,15,111,154,108,128,0,0 // movdqa 0x806c(%edx),%xmm3
.byte 102,15,219,227 // pand %xmm3,%xmm4
.byte 102,15,114,242,16 // pslld $0x10,%xmm2
.byte 102,15,102,196 // pcmpgtd %xmm4,%xmm0
@@ -60929,7 +60913,7 @@ _sk_load_f16_sse2:
.byte 102,15,219,253 // pand %xmm5,%xmm7
.byte 102,15,219,195 // pand %xmm3,%xmm0
.byte 102,15,114,247,16 // pslld $0x10,%xmm7
- .byte 102,15,111,146,156,128,0,0 // movdqa 0x809c(%edx),%xmm2
+ .byte 102,15,111,146,124,128,0,0 // movdqa 0x807c(%edx),%xmm2
.byte 102,15,102,208 // pcmpgtd %xmm0,%xmm2
.byte 102,15,114,240,13 // pslld $0xd,%xmm0
.byte 102,15,235,199 // por %xmm7,%xmm0
@@ -60944,7 +60928,7 @@ _sk_load_f16_sse2:
.byte 102,15,127,93,184 // movdqa %xmm3,-0x48(%ebp)
.byte 102,15,114,247,13 // pslld $0xd,%xmm7
.byte 102,15,235,253 // por %xmm5,%xmm7
- .byte 102,15,111,154,172,128,0,0 // movdqa 0x80ac(%edx),%xmm3
+ .byte 102,15,111,154,140,128,0,0 // movdqa 0x808c(%edx),%xmm3
.byte 102,15,254,203 // paddd %xmm3,%xmm1
.byte 102,15,254,227 // paddd %xmm3,%xmm4
.byte 102,15,254,195 // paddd %xmm3,%xmm0
@@ -61033,18 +61017,18 @@ _sk_load_f16_dst_sse2:
.byte 102,15,126,85,232 // movd %xmm2,-0x18(%ebp)
.byte 102,15,239,210 // pxor %xmm2,%xmm2
.byte 102,15,97,202 // punpcklwd %xmm2,%xmm1
- .byte 102,15,111,186,95,126,0,0 // movdqa 0x7e5f(%edx),%xmm7
+ .byte 102,15,111,186,63,126,0,0 // movdqa 0x7e3f(%edx),%xmm7
.byte 102,15,111,209 // movdqa %xmm1,%xmm2
.byte 102,15,219,215 // pand %xmm7,%xmm2
- .byte 102,15,111,154,111,126,0,0 // movdqa 0x7e6f(%edx),%xmm3
+ .byte 102,15,111,154,79,126,0,0 // movdqa 0x7e4f(%edx),%xmm3
.byte 102,15,219,203 // pand %xmm3,%xmm1
- .byte 102,15,111,162,127,126,0,0 // movdqa 0x7e7f(%edx),%xmm4
+ .byte 102,15,111,162,95,126,0,0 // movdqa 0x7e5f(%edx),%xmm4
.byte 102,15,114,242,16 // pslld $0x10,%xmm2
.byte 102,15,111,236 // movdqa %xmm4,%xmm5
.byte 102,15,102,233 // pcmpgtd %xmm1,%xmm5
.byte 102,15,114,241,13 // pslld $0xd,%xmm1
.byte 102,15,235,202 // por %xmm2,%xmm1
- .byte 102,15,111,146,143,126,0,0 // movdqa 0x7e8f(%edx),%xmm2
+ .byte 102,15,111,146,111,126,0,0 // movdqa 0x7e6f(%edx),%xmm2
.byte 102,15,127,85,184 // movdqa %xmm2,-0x48(%ebp)
.byte 102,15,254,202 // paddd %xmm2,%xmm1
.byte 102,15,223,233 // pandn %xmm1,%xmm5
@@ -61190,11 +61174,11 @@ _sk_gather_f16_sse2:
.byte 102,15,126,69,248 // movd %xmm0,-0x8(%ebp)
.byte 102,15,97,206 // punpcklwd %xmm6,%xmm1
.byte 102,15,239,210 // pxor %xmm2,%xmm2
- .byte 102,15,111,177,195,123,0,0 // movdqa 0x7bc3(%ecx),%xmm6
+ .byte 102,15,111,177,163,123,0,0 // movdqa 0x7ba3(%ecx),%xmm6
.byte 102,15,111,225 // movdqa %xmm1,%xmm4
.byte 102,15,219,230 // pand %xmm6,%xmm4
- .byte 102,15,219,137,211,123,0,0 // pand 0x7bd3(%ecx),%xmm1
- .byte 102,15,111,129,227,123,0,0 // movdqa 0x7be3(%ecx),%xmm0
+ .byte 102,15,219,137,179,123,0,0 // pand 0x7bb3(%ecx),%xmm1
+ .byte 102,15,111,129,195,123,0,0 // movdqa 0x7bc3(%ecx),%xmm0
.byte 102,15,114,244,16 // pslld $0x10,%xmm4
.byte 102,15,111,216 // movdqa %xmm0,%xmm3
.byte 102,15,102,217 // pcmpgtd %xmm1,%xmm3
@@ -61205,7 +61189,7 @@ _sk_gather_f16_sse2:
.byte 102,15,239,255 // pxor %xmm7,%xmm7
.byte 102,15,111,213 // movdqa %xmm5,%xmm2
.byte 102,15,219,214 // pand %xmm6,%xmm2
- .byte 102,15,111,153,211,123,0,0 // movdqa 0x7bd3(%ecx),%xmm3
+ .byte 102,15,111,153,179,123,0,0 // movdqa 0x7bb3(%ecx),%xmm3
.byte 102,15,219,235 // pand %xmm3,%xmm5
.byte 102,15,114,242,16 // pslld $0x10,%xmm2
.byte 102,15,111,224 // movdqa %xmm0,%xmm4
@@ -61219,7 +61203,7 @@ _sk_gather_f16_sse2:
.byte 102,15,219,254 // pand %xmm6,%xmm7
.byte 102,15,219,195 // pand %xmm3,%xmm0
.byte 102,15,114,247,16 // pslld $0x10,%xmm7
- .byte 102,15,111,145,227,123,0,0 // movdqa 0x7be3(%ecx),%xmm2
+ .byte 102,15,111,145,195,123,0,0 // movdqa 0x7bc3(%ecx),%xmm2
.byte 102,15,111,218 // movdqa %xmm2,%xmm3
.byte 102,15,102,216 // pcmpgtd %xmm0,%xmm3
.byte 102,15,114,240,13 // pslld $0xd,%xmm0
@@ -61228,12 +61212,12 @@ _sk_gather_f16_sse2:
.byte 102,15,239,228 // pxor %xmm4,%xmm4
.byte 102,15,97,252 // punpcklwd %xmm4,%xmm7
.byte 102,15,219,247 // pand %xmm7,%xmm6
- .byte 102,15,219,185,211,123,0,0 // pand 0x7bd3(%ecx),%xmm7
+ .byte 102,15,219,185,179,123,0,0 // pand 0x7bb3(%ecx),%xmm7
.byte 102,15,114,246,16 // pslld $0x10,%xmm6
.byte 102,15,102,215 // pcmpgtd %xmm7,%xmm2
.byte 102,15,114,247,13 // pslld $0xd,%xmm7
.byte 102,15,235,254 // por %xmm6,%xmm7
- .byte 102,15,111,161,243,123,0,0 // movdqa 0x7bf3(%ecx),%xmm4
+ .byte 102,15,111,161,211,123,0,0 // movdqa 0x7bd3(%ecx),%xmm4
.byte 102,15,254,204 // paddd %xmm4,%xmm1
.byte 102,15,254,236 // paddd %xmm4,%xmm5
.byte 102,15,254,196 // paddd %xmm4,%xmm0
@@ -61272,22 +61256,22 @@ _sk_store_f16_sse2:
.byte 102,15,111,209 // movdqa %xmm1,%xmm2
.byte 232,0,0,0,0 // call 5781 <_sk_store_f16_sse2+0x19>
.byte 88 // pop %eax
- .byte 102,15,111,152,63,122,0,0 // movdqa 0x7a3f(%eax),%xmm3
+ .byte 102,15,111,152,31,122,0,0 // movdqa 0x7a1f(%eax),%xmm3
.byte 102,15,111,224 // movdqa %xmm0,%xmm4
.byte 102,15,219,227 // pand %xmm3,%xmm4
- .byte 102,15,111,136,111,122,0,0 // movdqa 0x7a6f(%eax),%xmm1
+ .byte 102,15,111,136,79,122,0,0 // movdqa 0x7a4f(%eax),%xmm1
.byte 102,15,127,77,232 // movdqa %xmm1,-0x18(%ebp)
.byte 102,15,111,240 // movdqa %xmm0,%xmm6
.byte 102,15,114,246,3 // pslld $0x3,%xmm6
.byte 102,15,219,241 // pand %xmm1,%xmm6
.byte 102,15,254,244 // paddd %xmm4,%xmm6
- .byte 102,15,111,184,79,122,0,0 // movdqa 0x7a4f(%eax),%xmm7
+ .byte 102,15,111,184,47,122,0,0 // movdqa 0x7a2f(%eax),%xmm7
.byte 102,15,127,69,168 // movdqa %xmm0,-0x58(%ebp)
.byte 102,15,219,199 // pand %xmm7,%xmm0
- .byte 102,15,111,168,95,122,0,0 // movdqa 0x7a5f(%eax),%xmm5
+ .byte 102,15,111,168,63,122,0,0 // movdqa 0x7a3f(%eax),%xmm5
.byte 102,15,111,205 // movdqa %xmm5,%xmm1
.byte 102,15,102,200 // pcmpgtd %xmm0,%xmm1
- .byte 102,15,111,128,239,118,0,0 // movdqa 0x76ef(%eax),%xmm0
+ .byte 102,15,111,128,207,118,0,0 // movdqa 0x76cf(%eax),%xmm0
.byte 102,15,127,69,216 // movdqa %xmm0,-0x28(%ebp)
.byte 102,15,254,240 // paddd %xmm0,%xmm6
.byte 102,15,114,230,16 // psrad $0x10,%xmm6
@@ -61339,8 +61323,8 @@ _sk_store_f16_sse2:
.byte 102,15,97,245 // punpcklwd %xmm5,%xmm6
.byte 139,69,12 // mov 0xc(%ebp),%eax
.byte 139,77,8 // mov 0x8(%ebp),%ecx
- .byte 139,17 // mov (%ecx),%edx
.byte 139,56 // mov (%eax),%edi
+ .byte 139,17 // mov (%ecx),%edx
.byte 139,119,4 // mov 0x4(%edi),%esi
.byte 15,175,113,4 // imul 0x4(%ecx),%esi
.byte 193,230,3 // shl $0x3,%esi
@@ -61389,8 +61373,8 @@ _sk_load_u16_be_sse2:
.byte 131,236,44 // sub $0x2c,%esp
.byte 139,69,12 // mov 0xc(%ebp),%eax
.byte 139,77,8 // mov 0x8(%ebp),%ecx
- .byte 139,49 // mov (%ecx),%esi
.byte 139,16 // mov (%eax),%edx
+ .byte 139,49 // mov (%ecx),%esi
.byte 139,122,4 // mov 0x4(%edx),%edi
.byte 15,175,121,4 // imul 0x4(%ecx),%edi
.byte 1,255 // add %edi,%edi
@@ -61421,7 +61405,7 @@ _sk_load_u16_be_sse2:
.byte 102,15,239,219 // pxor %xmm3,%xmm3
.byte 102,15,97,195 // punpcklwd %xmm3,%xmm0
.byte 15,91,192 // cvtdq2ps %xmm0,%xmm0
- .byte 15,40,162,2,118,0,0 // movaps 0x7602(%edx),%xmm4
+ .byte 15,40,162,226,117,0,0 // movaps 0x75e2(%edx),%xmm4
.byte 15,89,196 // mulps %xmm4,%xmm0
.byte 102,15,111,205 // movdqa %xmm5,%xmm1
.byte 102,15,113,241,8 // psllw $0x8,%xmm1
@@ -61490,8 +61474,8 @@ _sk_load_rgb_u16_be_sse2:
.byte 131,236,28 // sub $0x1c,%esp
.byte 139,69,12 // mov 0xc(%ebp),%eax
.byte 139,77,8 // mov 0x8(%ebp),%ecx
- .byte 139,121,8 // mov 0x8(%ecx),%edi
.byte 139,16 // mov (%eax),%edx
+ .byte 139,121,8 // mov 0x8(%ecx),%edi
.byte 139,114,4 // mov 0x4(%edx),%esi
.byte 15,175,113,4 // imul 0x4(%ecx),%esi
.byte 1,246 // add %esi,%esi
@@ -61525,7 +61509,7 @@ _sk_load_rgb_u16_be_sse2:
.byte 102,15,239,219 // pxor %xmm3,%xmm3
.byte 102,15,97,195 // punpcklwd %xmm3,%xmm0
.byte 15,91,192 // cvtdq2ps %xmm0,%xmm0
- .byte 15,40,170,155,116,0,0 // movaps 0x749b(%edx),%xmm5
+ .byte 15,40,170,123,116,0,0 // movaps 0x747b(%edx),%xmm5
.byte 15,89,197 // mulps %xmm5,%xmm0
.byte 102,15,111,204 // movdqa %xmm4,%xmm1
.byte 102,15,113,241,8 // psllw $0x8,%xmm1
@@ -61551,7 +61535,7 @@ _sk_load_rgb_u16_be_sse2:
.byte 15,89,213 // mulps %xmm5,%xmm2
.byte 141,112,8 // lea 0x8(%eax),%esi
.byte 131,236,8 // sub $0x8,%esp
- .byte 15,40,154,43,114,0,0 // movaps 0x722b(%edx),%xmm3
+ .byte 15,40,154,11,114,0,0 // movaps 0x720b(%edx),%xmm3
.byte 86 // push %esi
.byte 81 // push %ecx
.byte 255,80,4 // call *0x4(%eax)
@@ -61598,7 +61582,7 @@ _sk_store_u16_be_sse2:
.byte 1,210 // add %edx,%edx
.byte 3,22 // add (%esi),%edx
.byte 139,49 // mov (%ecx),%esi
- .byte 15,40,183,247,117,0,0 // movaps 0x75f7(%edi),%xmm6
+ .byte 15,40,183,215,117,0,0 // movaps 0x75d7(%edi),%xmm6
.byte 139,121,8 // mov 0x8(%ecx),%edi
.byte 193,230,2 // shl $0x2,%esi
.byte 15,40,224 // movaps %xmm0,%xmm4
@@ -61679,8 +61663,8 @@ _sk_load_f32_sse2:
.byte 86 // push %esi
.byte 139,69,12 // mov 0xc(%ebp),%eax
.byte 139,77,8 // mov 0x8(%ebp),%ecx
- .byte 139,57 // mov (%ecx),%edi
.byte 139,48 // mov (%eax),%esi
+ .byte 139,57 // mov (%ecx),%edi
.byte 139,86,4 // mov 0x4(%esi),%edx
.byte 15,175,81,4 // imul 0x4(%ecx),%edx
.byte 193,226,2 // shl $0x2,%edx
@@ -61743,8 +61727,8 @@ _sk_load_f32_dst_sse2:
.byte 15,41,85,232 // movaps %xmm2,-0x18(%ebp)
.byte 139,69,12 // mov 0xc(%ebp),%eax
.byte 139,77,8 // mov 0x8(%ebp),%ecx
- .byte 139,57 // mov (%ecx),%edi
.byte 139,48 // mov (%eax),%esi
+ .byte 139,57 // mov (%ecx),%edi
.byte 139,86,4 // mov 0x4(%esi),%edx
.byte 15,175,81,4 // imul 0x4(%ecx),%edx
.byte 193,226,2 // shl $0x2,%edx
@@ -61812,8 +61796,8 @@ _sk_store_f32_sse2:
.byte 131,236,12 // sub $0xc,%esp
.byte 139,69,12 // mov 0xc(%ebp),%eax
.byte 139,77,8 // mov 0x8(%ebp),%ecx
- .byte 139,25 // mov (%ecx),%ebx
.byte 139,48 // mov (%eax),%esi
+ .byte 139,25 // mov (%ecx),%ebx
.byte 139,86,4 // mov 0x4(%esi),%edx
.byte 15,175,81,4 // imul 0x4(%ecx),%edx
.byte 193,226,2 // shl $0x2,%edx
@@ -61878,7 +61862,7 @@ _sk_repeat_x_sse2:
.byte 243,15,91,245 // cvttps2dq %xmm5,%xmm6
.byte 15,91,246 // cvtdq2ps %xmm6,%xmm6
.byte 15,194,238,1 // cmpltps %xmm6,%xmm5
- .byte 15,84,168,179,109,0,0 // andps 0x6db3(%eax),%xmm5
+ .byte 15,84,168,147,109,0,0 // andps 0x6d93(%eax),%xmm5
.byte 15,92,245 // subps %xmm5,%xmm6
.byte 15,198,228,0 // shufps $0x0,%xmm4,%xmm4
.byte 15,89,230 // mulps %xmm6,%xmm4
@@ -61910,7 +61894,7 @@ _sk_repeat_y_sse2:
.byte 243,15,91,245 // cvttps2dq %xmm5,%xmm6
.byte 15,91,246 // cvtdq2ps %xmm6,%xmm6
.byte 15,194,238,1 // cmpltps %xmm6,%xmm5
- .byte 15,84,168,97,109,0,0 // andps 0x6d61(%eax),%xmm5
+ .byte 15,84,168,65,109,0,0 // andps 0x6d41(%eax),%xmm5
.byte 15,92,245 // subps %xmm5,%xmm6
.byte 15,198,228,0 // shufps $0x0,%xmm4,%xmm4
.byte 15,89,230 // mulps %xmm6,%xmm4
@@ -61940,13 +61924,13 @@ _sk_mirror_x_sse2:
.byte 15,40,244 // movaps %xmm4,%xmm6
.byte 15,198,246,0 // shufps $0x0,%xmm6,%xmm6
.byte 15,92,198 // subps %xmm6,%xmm0
- .byte 243,15,89,169,159,116,0,0 // mulss 0x749f(%ecx),%xmm5
+ .byte 243,15,89,169,127,116,0,0 // mulss 0x747f(%ecx),%xmm5
.byte 15,198,237,0 // shufps $0x0,%xmm5,%xmm5
.byte 15,89,232 // mulps %xmm0,%xmm5
.byte 243,15,91,253 // cvttps2dq %xmm5,%xmm7
.byte 15,91,255 // cvtdq2ps %xmm7,%xmm7
.byte 15,194,239,1 // cmpltps %xmm7,%xmm5
- .byte 15,84,169,15,109,0,0 // andps 0x6d0f(%ecx),%xmm5
+ .byte 15,84,169,239,108,0,0 // andps 0x6cef(%ecx),%xmm5
.byte 15,92,253 // subps %xmm5,%xmm7
.byte 243,15,88,228 // addss %xmm4,%xmm4
.byte 15,198,228,0 // shufps $0x0,%xmm4,%xmm4
@@ -61981,13 +61965,13 @@ _sk_mirror_y_sse2:
.byte 15,40,244 // movaps %xmm4,%xmm6
.byte 15,198,246,0 // shufps $0x0,%xmm6,%xmm6
.byte 15,92,206 // subps %xmm6,%xmm1
- .byte 243,15,89,169,43,116,0,0 // mulss 0x742b(%ecx),%xmm5
+ .byte 243,15,89,169,11,116,0,0 // mulss 0x740b(%ecx),%xmm5
.byte 15,198,237,0 // shufps $0x0,%xmm5,%xmm5
.byte 15,89,233 // mulps %xmm1,%xmm5
.byte 243,15,91,253 // cvttps2dq %xmm5,%xmm7
.byte 15,91,255 // cvtdq2ps %xmm7,%xmm7
.byte 15,194,239,1 // cmpltps %xmm7,%xmm5
- .byte 15,84,169,155,108,0,0 // andps 0x6c9b(%ecx),%xmm5
+ .byte 15,84,169,123,108,0,0 // andps 0x6c7b(%ecx),%xmm5
.byte 15,92,253 // subps %xmm5,%xmm7
.byte 243,15,88,228 // addss %xmm4,%xmm4
.byte 15,198,228,0 // shufps $0x0,%xmm4,%xmm4
@@ -62018,7 +62002,7 @@ _sk_clamp_x_1_sse2:
.byte 139,77,12 // mov 0xc(%ebp),%ecx
.byte 15,87,228 // xorps %xmm4,%xmm4
.byte 15,95,224 // maxps %xmm0,%xmm4
- .byte 15,93,160,39,108,0,0 // minps 0x6c27(%eax),%xmm4
+ .byte 15,93,160,7,108,0,0 // minps 0x6c07(%eax),%xmm4
.byte 141,65,4 // lea 0x4(%ecx),%eax
.byte 131,236,8 // sub $0x8,%esp
.byte 15,40,196 // movaps %xmm4,%xmm0
@@ -62043,7 +62027,7 @@ _sk_repeat_x_1_sse2:
.byte 15,91,228 // cvtdq2ps %xmm4,%xmm4
.byte 15,40,232 // movaps %xmm0,%xmm5
.byte 15,194,236,1 // cmpltps %xmm4,%xmm5
- .byte 15,84,168,247,107,0,0 // andps 0x6bf7(%eax),%xmm5
+ .byte 15,84,168,215,107,0,0 // andps 0x6bd7(%eax),%xmm5
.byte 15,92,229 // subps %xmm5,%xmm4
.byte 15,92,196 // subps %xmm4,%xmm0
.byte 141,65,4 // lea 0x4(%ecx),%eax
@@ -62065,14 +62049,14 @@ _sk_mirror_x_1_sse2:
.byte 232,0,0,0,0 // call 6124 <_sk_mirror_x_1_sse2+0xb>
.byte 89 // pop %ecx
.byte 139,69,12 // mov 0xc(%ebp),%eax
- .byte 15,40,161,44,108,0,0 // movaps 0x6c2c(%ecx),%xmm4
+ .byte 15,40,161,12,108,0,0 // movaps 0x6c0c(%ecx),%xmm4
.byte 15,88,196 // addps %xmm4,%xmm0
- .byte 15,40,169,172,107,0,0 // movaps 0x6bac(%ecx),%xmm5
+ .byte 15,40,169,140,107,0,0 // movaps 0x6b8c(%ecx),%xmm5
.byte 15,89,232 // mulps %xmm0,%xmm5
.byte 243,15,91,245 // cvttps2dq %xmm5,%xmm6
.byte 15,91,246 // cvtdq2ps %xmm6,%xmm6
.byte 15,194,238,1 // cmpltps %xmm6,%xmm5
- .byte 15,84,169,188,107,0,0 // andps 0x6bbc(%ecx),%xmm5
+ .byte 15,84,169,156,107,0,0 // andps 0x6b9c(%ecx),%xmm5
.byte 15,87,255 // xorps %xmm7,%xmm7
.byte 15,92,245 // subps %xmm5,%xmm6
.byte 15,88,246 // addps %xmm6,%xmm6
@@ -62100,10 +62084,10 @@ _sk_luminance_to_alpha_sse2:
.byte 232,0,0,0,0 // call 6182 <_sk_luminance_to_alpha_sse2+0xe>
.byte 88 // pop %eax
.byte 139,77,12 // mov 0xc(%ebp),%ecx
- .byte 15,89,128,142,112,0,0 // mulps 0x708e(%eax),%xmm0
- .byte 15,89,136,158,112,0,0 // mulps 0x709e(%eax),%xmm1
+ .byte 15,89,128,110,112,0,0 // mulps 0x706e(%eax),%xmm0
+ .byte 15,89,136,126,112,0,0 // mulps 0x707e(%eax),%xmm1
.byte 15,88,200 // addps %xmm0,%xmm1
- .byte 15,89,152,174,112,0,0 // mulps 0x70ae(%eax),%xmm3
+ .byte 15,89,152,142,112,0,0 // mulps 0x708e(%eax),%xmm3
.byte 15,88,217 // addps %xmm1,%xmm3
.byte 141,65,4 // lea 0x4(%ecx),%eax
.byte 131,236,8 // sub $0x8,%esp
@@ -62281,13 +62265,12 @@ _sk_matrix_4x5_sse2:
.byte 137,229 // mov %esp,%ebp
.byte 131,236,8 // sub $0x8,%esp
.byte 15,40,233 // movaps %xmm1,%xmm5
+ .byte 15,40,224 // movaps %xmm0,%xmm4
.byte 139,69,12 // mov 0xc(%ebp),%eax
- .byte 141,72,4 // lea 0x4(%eax),%ecx
- .byte 137,77,252 // mov %ecx,-0x4(%ebp)
.byte 139,8 // mov (%eax),%ecx
- .byte 243,15,16,33 // movss (%ecx),%xmm4
+ .byte 243,15,16,1 // movss (%ecx),%xmm0
.byte 243,15,16,73,4 // movss 0x4(%ecx),%xmm1
- .byte 15,198,228,0 // shufps $0x0,%xmm4,%xmm4
+ .byte 15,198,192,0 // shufps $0x0,%xmm0,%xmm0
.byte 243,15,16,113,48 // movss 0x30(%ecx),%xmm6
.byte 15,198,246,0 // shufps $0x0,%xmm6,%xmm6
.byte 243,15,16,121,64 // movss 0x40(%ecx),%xmm7
@@ -62302,8 +62285,8 @@ _sk_matrix_4x5_sse2:
.byte 15,198,246,0 // shufps $0x0,%xmm6,%xmm6
.byte 15,89,245 // mulps %xmm5,%xmm6
.byte 15,88,247 // addps %xmm7,%xmm6
- .byte 15,89,224 // mulps %xmm0,%xmm4
- .byte 15,88,230 // addps %xmm6,%xmm4
+ .byte 15,89,196 // mulps %xmm4,%xmm0
+ .byte 15,88,198 // addps %xmm6,%xmm0
.byte 15,198,201,0 // shufps $0x0,%xmm1,%xmm1
.byte 243,15,16,113,52 // movss 0x34(%ecx),%xmm6
.byte 15,198,246,0 // shufps $0x0,%xmm6,%xmm6
@@ -62319,7 +62302,7 @@ _sk_matrix_4x5_sse2:
.byte 15,198,246,0 // shufps $0x0,%xmm6,%xmm6
.byte 15,89,245 // mulps %xmm5,%xmm6
.byte 15,88,247 // addps %xmm7,%xmm6
- .byte 15,89,200 // mulps %xmm0,%xmm1
+ .byte 15,89,204 // mulps %xmm4,%xmm1
.byte 15,88,206 // addps %xmm6,%xmm1
.byte 243,15,16,113,56 // movss 0x38(%ecx),%xmm6
.byte 15,198,246,0 // shufps $0x0,%xmm6,%xmm6
@@ -62337,7 +62320,7 @@ _sk_matrix_4x5_sse2:
.byte 15,88,247 // addps %xmm7,%xmm6
.byte 243,15,16,121,8 // movss 0x8(%ecx),%xmm7
.byte 15,198,255,0 // shufps $0x0,%xmm7,%xmm7
- .byte 15,89,248 // mulps %xmm0,%xmm7
+ .byte 15,89,252 // mulps %xmm4,%xmm7
.byte 15,88,254 // addps %xmm6,%xmm7
.byte 243,15,16,113,60 // movss 0x3c(%ecx),%xmm6
.byte 15,198,246,0 // shufps $0x0,%xmm6,%xmm6
@@ -62355,15 +62338,13 @@ _sk_matrix_4x5_sse2:
.byte 15,88,211 // addps %xmm3,%xmm2
.byte 243,15,16,89,12 // movss 0xc(%ecx),%xmm3
.byte 15,198,219,0 // shufps $0x0,%xmm3,%xmm3
- .byte 15,89,216 // mulps %xmm0,%xmm3
+ .byte 15,89,220 // mulps %xmm4,%xmm3
.byte 15,88,218 // addps %xmm2,%xmm3
- .byte 139,77,8 // mov 0x8(%ebp),%ecx
- .byte 141,80,8 // lea 0x8(%eax),%edx
+ .byte 141,72,8 // lea 0x8(%eax),%ecx
.byte 131,236,8 // sub $0x8,%esp
- .byte 15,40,196 // movaps %xmm4,%xmm0
.byte 15,40,215 // movaps %xmm7,%xmm2
- .byte 82 // push %edx
.byte 81 // push %ecx
+ .byte 255,117,8 // pushl 0x8(%ebp)
.byte 255,80,4 // call *0x4(%eax)
.byte 131,196,24 // add $0x18,%esp
.byte 93 // pop %ebp
@@ -62493,23 +62474,21 @@ _sk_evenly_spaced_gradient_sse2:
.byte 86 // push %esi
.byte 131,236,60 // sub $0x3c,%esp
.byte 15,41,69,184 // movaps %xmm0,-0x48(%ebp)
- .byte 232,0,0,0,0 // call 661f <_sk_evenly_spaced_gradient_sse2+0x12>
+ .byte 232,0,0,0,0 // call 6618 <_sk_evenly_spaced_gradient_sse2+0x12>
.byte 90 // pop %edx
- .byte 139,77,12 // mov 0xc(%ebp),%ecx
- .byte 141,65,4 // lea 0x4(%ecx),%eax
- .byte 137,69,240 // mov %eax,-0x10(%ebp)
- .byte 139,9 // mov (%ecx),%ecx
+ .byte 139,69,12 // mov 0xc(%ebp),%eax
+ .byte 139,8 // mov (%eax),%ecx
.byte 139,49 // mov (%ecx),%esi
.byte 139,65,4 // mov 0x4(%ecx),%eax
.byte 78 // dec %esi
.byte 102,15,110,206 // movd %esi,%xmm1
.byte 102,15,112,201,0 // pshufd $0x0,%xmm1,%xmm1
- .byte 102,15,111,146,33,108,0,0 // movdqa 0x6c21(%edx),%xmm2
+ .byte 102,15,111,146,8,108,0,0 // movdqa 0x6c08(%edx),%xmm2
.byte 102,15,219,209 // pand %xmm1,%xmm2
- .byte 102,15,235,146,225,105,0,0 // por 0x69e1(%edx),%xmm2
+ .byte 102,15,235,146,200,105,0,0 // por 0x69c8(%edx),%xmm2
.byte 102,15,114,209,16 // psrld $0x10,%xmm1
- .byte 102,15,235,138,49,108,0,0 // por 0x6c31(%edx),%xmm1
- .byte 15,88,138,65,108,0,0 // addps 0x6c41(%edx),%xmm1
+ .byte 102,15,235,138,24,108,0,0 // por 0x6c18(%edx),%xmm1
+ .byte 15,88,138,40,108,0,0 // addps 0x6c28(%edx),%xmm1
.byte 15,88,202 // addps %xmm2,%xmm1
.byte 15,89,200 // mulps %xmm0,%xmm1
.byte 243,15,91,201 // cvttps2dq %xmm1,%xmm1
@@ -62594,14 +62573,13 @@ _sk_evenly_spaced_gradient_sse2:
.byte 15,88,215 // addps %xmm7,%xmm2
.byte 15,89,221 // mulps %xmm5,%xmm3
.byte 15,88,216 // addps %xmm0,%xmm3
- .byte 139,69,8 // mov 0x8(%ebp),%eax
- .byte 139,85,12 // mov 0xc(%ebp),%edx
- .byte 141,74,8 // lea 0x8(%edx),%ecx
+ .byte 139,77,12 // mov 0xc(%ebp),%ecx
+ .byte 141,65,8 // lea 0x8(%ecx),%eax
.byte 131,236,8 // sub $0x8,%esp
.byte 15,40,196 // movaps %xmm4,%xmm0
- .byte 81 // push %ecx
.byte 80 // push %eax
- .byte 255,82,4 // call *0x4(%edx)
+ .byte 255,117,8 // pushl 0x8(%ebp)
+ .byte 255,81,4 // call *0x4(%ecx)
.byte 131,196,76 // add $0x4c,%esp
.byte 94 // pop %esi
.byte 95 // pop %edi
@@ -62616,18 +62594,18 @@ _sk_gauss_a_to_rgba_sse2:
.byte 85 // push %ebp
.byte 137,229 // mov %esp,%ebp
.byte 131,236,8 // sub $0x8,%esp
- .byte 232,0,0,0,0 // call 67df <_sk_gauss_a_to_rgba_sse2+0xb>
+ .byte 232,0,0,0,0 // call 67d1 <_sk_gauss_a_to_rgba_sse2+0xb>
.byte 88 // pop %eax
.byte 139,77,12 // mov 0xc(%ebp),%ecx
- .byte 15,40,128,145,106,0,0 // movaps 0x6a91(%eax),%xmm0
+ .byte 15,40,128,127,106,0,0 // movaps 0x6a7f(%eax),%xmm0
.byte 15,89,195 // mulps %xmm3,%xmm0
- .byte 15,88,128,161,106,0,0 // addps 0x6aa1(%eax),%xmm0
+ .byte 15,88,128,143,106,0,0 // addps 0x6a8f(%eax),%xmm0
.byte 15,89,195 // mulps %xmm3,%xmm0
- .byte 15,88,128,177,106,0,0 // addps 0x6ab1(%eax),%xmm0
+ .byte 15,88,128,159,106,0,0 // addps 0x6a9f(%eax),%xmm0
.byte 15,89,195 // mulps %xmm3,%xmm0
- .byte 15,88,128,193,106,0,0 // addps 0x6ac1(%eax),%xmm0
+ .byte 15,88,128,175,106,0,0 // addps 0x6aaf(%eax),%xmm0
.byte 15,89,195 // mulps %xmm3,%xmm0
- .byte 15,88,128,209,106,0,0 // addps 0x6ad1(%eax),%xmm0
+ .byte 15,88,128,191,106,0,0 // addps 0x6abf(%eax),%xmm0
.byte 141,65,4 // lea 0x4(%ecx),%eax
.byte 131,236,8 // sub $0x8,%esp
.byte 15,40,200 // movaps %xmm0,%xmm1
@@ -62650,16 +62628,14 @@ _sk_gradient_sse2:
.byte 87 // push %edi
.byte 86 // push %esi
.byte 131,236,60 // sub $0x3c,%esp
- .byte 139,77,12 // mov 0xc(%ebp),%ecx
- .byte 141,81,4 // lea 0x4(%ecx),%edx
- .byte 137,85,240 // mov %edx,-0x10(%ebp)
- .byte 139,9 // mov (%ecx),%ecx
- .byte 139,17 // mov (%ecx),%edx
+ .byte 139,69,12 // mov 0xc(%ebp),%eax
+ .byte 139,16 // mov (%eax),%edx
+ .byte 139,10 // mov (%edx),%ecx
.byte 102,15,239,201 // pxor %xmm1,%xmm1
- .byte 131,250,2 // cmp $0x2,%edx
- .byte 114,33 // jb 686c <_sk_gradient_sse2+0x40>
- .byte 139,113,36 // mov 0x24(%ecx),%esi
- .byte 74 // dec %edx
+ .byte 131,249,2 // cmp $0x2,%ecx
+ .byte 114,33 // jb 6858 <_sk_gradient_sse2+0x3a>
+ .byte 139,114,36 // mov 0x24(%edx),%esi
+ .byte 73 // dec %ecx
.byte 131,198,4 // add $0x4,%esi
.byte 102,15,239,201 // pxor %xmm1,%xmm1
.byte 243,15,16,22 // movss (%esi),%xmm2
@@ -62667,80 +62643,80 @@ _sk_gradient_sse2:
.byte 15,194,208,2 // cmpleps %xmm0,%xmm2
.byte 102,15,250,202 // psubd %xmm2,%xmm1
.byte 131,198,4 // add $0x4,%esi
- .byte 74 // dec %edx
- .byte 117,234 // jne 6856 <_sk_gradient_sse2+0x2a>
- .byte 102,15,126,202 // movd %xmm1,%edx
+ .byte 73 // dec %ecx
+ .byte 117,234 // jne 6842 <_sk_gradient_sse2+0x24>
+ .byte 102,15,126,206 // movd %xmm1,%esi
.byte 102,15,112,209,229 // pshufd $0xe5,%xmm1,%xmm2
.byte 102,15,112,217,78 // pshufd $0x4e,%xmm1,%xmm3
- .byte 102,15,126,222 // movd %xmm3,%esi
+ .byte 102,15,126,223 // movd %xmm3,%edi
.byte 102,15,112,201,231 // pshufd $0xe7,%xmm1,%xmm1
- .byte 102,15,126,207 // movd %xmm1,%edi
- .byte 139,65,4 // mov 0x4(%ecx),%eax
- .byte 243,15,16,12,184 // movss (%eax,%edi,4),%xmm1
- .byte 243,15,16,28,176 // movss (%eax,%esi,4),%xmm3
- .byte 243,15,16,36,144 // movss (%eax,%edx,4),%xmm4
- .byte 102,15,126,211 // movd %xmm2,%ebx
- .byte 243,15,16,20,152 // movss (%eax,%ebx,4),%xmm2
+ .byte 102,15,126,203 // movd %xmm1,%ebx
+ .byte 139,66,4 // mov 0x4(%edx),%eax
+ .byte 243,15,16,12,152 // movss (%eax,%ebx,4),%xmm1
+ .byte 243,15,16,28,184 // movss (%eax,%edi,4),%xmm3
+ .byte 243,15,16,36,176 // movss (%eax,%esi,4),%xmm4
+ .byte 102,15,126,209 // movd %xmm2,%ecx
+ .byte 243,15,16,20,136 // movss (%eax,%ecx,4),%xmm2
.byte 15,20,217 // unpcklps %xmm1,%xmm3
- .byte 139,65,20 // mov 0x14(%ecx),%eax
- .byte 243,15,16,12,184 // movss (%eax,%edi,4),%xmm1
- .byte 243,15,16,52,176 // movss (%eax,%esi,4),%xmm6
- .byte 243,15,16,44,144 // movss (%eax,%edx,4),%xmm5
- .byte 243,15,16,60,152 // movss (%eax,%ebx,4),%xmm7
+ .byte 139,66,20 // mov 0x14(%edx),%eax
+ .byte 243,15,16,12,152 // movss (%eax,%ebx,4),%xmm1
+ .byte 243,15,16,52,184 // movss (%eax,%edi,4),%xmm6
+ .byte 243,15,16,44,176 // movss (%eax,%esi,4),%xmm5
+ .byte 243,15,16,60,136 // movss (%eax,%ecx,4),%xmm7
.byte 15,20,226 // unpcklps %xmm2,%xmm4
.byte 102,15,20,227 // unpcklpd %xmm3,%xmm4
.byte 102,15,41,101,184 // movapd %xmm4,-0x48(%ebp)
.byte 15,20,241 // unpcklps %xmm1,%xmm6
.byte 15,20,239 // unpcklps %xmm7,%xmm5
- .byte 139,65,8 // mov 0x8(%ecx),%eax
- .byte 243,15,16,20,184 // movss (%eax,%edi,4),%xmm2
- .byte 243,15,16,28,176 // movss (%eax,%esi,4),%xmm3
- .byte 243,15,16,12,144 // movss (%eax,%edx,4),%xmm1
- .byte 243,15,16,60,152 // movss (%eax,%ebx,4),%xmm7
+ .byte 139,66,8 // mov 0x8(%edx),%eax
+ .byte 243,15,16,20,152 // movss (%eax,%ebx,4),%xmm2
+ .byte 243,15,16,28,184 // movss (%eax,%edi,4),%xmm3
+ .byte 243,15,16,12,176 // movss (%eax,%esi,4),%xmm1
+ .byte 243,15,16,60,136 // movss (%eax,%ecx,4),%xmm7
.byte 102,15,20,238 // unpcklpd %xmm6,%xmm5
.byte 102,15,41,109,200 // movapd %xmm5,-0x38(%ebp)
.byte 15,20,218 // unpcklps %xmm2,%xmm3
.byte 15,20,207 // unpcklps %xmm7,%xmm1
.byte 102,15,20,203 // unpcklpd %xmm3,%xmm1
- .byte 139,65,24 // mov 0x18(%ecx),%eax
- .byte 243,15,16,20,184 // movss (%eax,%edi,4),%xmm2
- .byte 243,15,16,28,176 // movss (%eax,%esi,4),%xmm3
- .byte 243,15,16,36,144 // movss (%eax,%edx,4),%xmm4
- .byte 243,15,16,60,152 // movss (%eax,%ebx,4),%xmm7
+ .byte 139,66,24 // mov 0x18(%edx),%eax
+ .byte 243,15,16,20,152 // movss (%eax,%ebx,4),%xmm2
+ .byte 243,15,16,28,184 // movss (%eax,%edi,4),%xmm3
+ .byte 243,15,16,36,176 // movss (%eax,%esi,4),%xmm4
+ .byte 243,15,16,60,136 // movss (%eax,%ecx,4),%xmm7
.byte 15,20,218 // unpcklps %xmm2,%xmm3
.byte 15,20,231 // unpcklps %xmm7,%xmm4
.byte 102,15,20,227 // unpcklpd %xmm3,%xmm4
.byte 102,15,41,101,216 // movapd %xmm4,-0x28(%ebp)
- .byte 139,65,12 // mov 0xc(%ecx),%eax
- .byte 243,15,16,20,184 // movss (%eax,%edi,4),%xmm2
- .byte 243,15,16,28,176 // movss (%eax,%esi,4),%xmm3
+ .byte 139,66,12 // mov 0xc(%edx),%eax
+ .byte 243,15,16,20,152 // movss (%eax,%ebx,4),%xmm2
+ .byte 243,15,16,28,184 // movss (%eax,%edi,4),%xmm3
.byte 15,20,218 // unpcklps %xmm2,%xmm3
- .byte 243,15,16,20,144 // movss (%eax,%edx,4),%xmm2
- .byte 243,15,16,60,152 // movss (%eax,%ebx,4),%xmm7
+ .byte 243,15,16,20,176 // movss (%eax,%esi,4),%xmm2
+ .byte 243,15,16,60,136 // movss (%eax,%ecx,4),%xmm7
.byte 15,20,215 // unpcklps %xmm7,%xmm2
.byte 102,15,20,211 // unpcklpd %xmm3,%xmm2
- .byte 139,65,28 // mov 0x1c(%ecx),%eax
- .byte 243,15,16,60,184 // movss (%eax,%edi,4),%xmm7
- .byte 243,15,16,28,176 // movss (%eax,%esi,4),%xmm3
+ .byte 139,66,28 // mov 0x1c(%edx),%eax
+ .byte 243,15,16,60,152 // movss (%eax,%ebx,4),%xmm7
+ .byte 243,15,16,28,184 // movss (%eax,%edi,4),%xmm3
.byte 15,20,223 // unpcklps %xmm7,%xmm3
- .byte 243,15,16,60,144 // movss (%eax,%edx,4),%xmm7
- .byte 243,15,16,44,152 // movss (%eax,%ebx,4),%xmm5
+ .byte 243,15,16,60,176 // movss (%eax,%esi,4),%xmm7
+ .byte 243,15,16,44,136 // movss (%eax,%ecx,4),%xmm5
.byte 15,20,253 // unpcklps %xmm5,%xmm7
.byte 102,15,20,251 // unpcklpd %xmm3,%xmm7
- .byte 139,65,16 // mov 0x10(%ecx),%eax
- .byte 243,15,16,28,184 // movss (%eax,%edi,4),%xmm3
- .byte 243,15,16,44,176 // movss (%eax,%esi,4),%xmm5
+ .byte 139,66,16 // mov 0x10(%edx),%eax
+ .byte 243,15,16,28,152 // movss (%eax,%ebx,4),%xmm3
+ .byte 243,15,16,44,184 // movss (%eax,%edi,4),%xmm5
.byte 15,20,235 // unpcklps %xmm3,%xmm5
- .byte 243,15,16,28,144 // movss (%eax,%edx,4),%xmm3
- .byte 243,15,16,52,152 // movss (%eax,%ebx,4),%xmm6
+ .byte 243,15,16,28,176 // movss (%eax,%esi,4),%xmm3
+ .byte 243,15,16,52,136 // movss (%eax,%ecx,4),%xmm6
.byte 15,20,222 // unpcklps %xmm6,%xmm3
.byte 102,15,20,221 // unpcklpd %xmm5,%xmm3
- .byte 139,65,32 // mov 0x20(%ecx),%eax
- .byte 243,15,16,44,184 // movss (%eax,%edi,4),%xmm5
- .byte 243,15,16,52,176 // movss (%eax,%esi,4),%xmm6
+ .byte 139,66,32 // mov 0x20(%edx),%eax
+ .byte 243,15,16,44,152 // movss (%eax,%ebx,4),%xmm5
+ .byte 243,15,16,52,184 // movss (%eax,%edi,4),%xmm6
.byte 15,20,245 // unpcklps %xmm5,%xmm6
- .byte 243,15,16,44,144 // movss (%eax,%edx,4),%xmm5
- .byte 243,15,16,36,152 // movss (%eax,%ebx,4),%xmm4
+ .byte 243,15,16,44,176 // movss (%eax,%esi,4),%xmm5
+ .byte 243,15,16,36,136 // movss (%eax,%ecx,4),%xmm4
.byte 15,20,236 // unpcklps %xmm4,%xmm5
.byte 102,15,20,238 // unpcklpd %xmm6,%xmm5
.byte 15,40,101,184 // movaps -0x48(%ebp),%xmm4
@@ -62752,13 +62728,14 @@ _sk_gradient_sse2:
.byte 15,88,215 // addps %xmm7,%xmm2
.byte 15,89,216 // mulps %xmm0,%xmm3
.byte 15,88,221 // addps %xmm5,%xmm3
- .byte 139,69,240 // mov -0x10(%ebp),%eax
- .byte 141,72,4 // lea 0x4(%eax),%ecx
+ .byte 139,69,12 // mov 0xc(%ebp),%eax
+ .byte 137,193 // mov %eax,%ecx
+ .byte 141,65,8 // lea 0x8(%ecx),%eax
.byte 131,236,8 // sub $0x8,%esp
.byte 15,40,196 // movaps %xmm4,%xmm0
- .byte 81 // push %ecx
+ .byte 80 // push %eax
.byte 255,117,8 // pushl 0x8(%ebp)
- .byte 255,16 // call *(%eax)
+ .byte 255,81,4 // call *0x4(%ecx)
.byte 131,196,76 // add $0x4c,%esp
.byte 94 // pop %esi
.byte 95 // pop %edi
@@ -62820,7 +62797,7 @@ _sk_xy_to_unit_angle_sse2:
.byte 15,40,218 // movaps %xmm2,%xmm3
.byte 15,40,209 // movaps %xmm1,%xmm2
.byte 15,40,200 // movaps %xmm0,%xmm1
- .byte 232,0,0,0,0 // call 6a71 <_sk_xy_to_unit_angle_sse2+0x18>
+ .byte 232,0,0,0,0 // call 6a60 <_sk_xy_to_unit_angle_sse2+0x18>
.byte 88 // pop %eax
.byte 15,87,237 // xorps %xmm5,%xmm5
.byte 15,92,233 // subps %xmm1,%xmm5
@@ -62835,30 +62812,30 @@ _sk_xy_to_unit_angle_sse2:
.byte 15,94,247 // divps %xmm7,%xmm6
.byte 15,40,254 // movaps %xmm6,%xmm7
.byte 15,89,255 // mulps %xmm7,%xmm7
- .byte 15,40,128,79,104,0,0 // movaps 0x684f(%eax),%xmm0
+ .byte 15,40,128,64,104,0,0 // movaps 0x6840(%eax),%xmm0
.byte 15,89,199 // mulps %xmm7,%xmm0
- .byte 15,88,128,95,104,0,0 // addps 0x685f(%eax),%xmm0
+ .byte 15,88,128,80,104,0,0 // addps 0x6850(%eax),%xmm0
.byte 15,89,199 // mulps %xmm7,%xmm0
- .byte 15,88,128,111,104,0,0 // addps 0x686f(%eax),%xmm0
+ .byte 15,88,128,96,104,0,0 // addps 0x6860(%eax),%xmm0
.byte 15,89,199 // mulps %xmm7,%xmm0
- .byte 15,88,128,127,104,0,0 // addps 0x687f(%eax),%xmm0
+ .byte 15,88,128,112,104,0,0 // addps 0x6870(%eax),%xmm0
.byte 15,89,198 // mulps %xmm6,%xmm0
.byte 15,194,236,1 // cmpltps %xmm4,%xmm5
- .byte 15,40,176,143,104,0,0 // movaps 0x688f(%eax),%xmm6
+ .byte 15,40,176,128,104,0,0 // movaps 0x6880(%eax),%xmm6
.byte 15,92,240 // subps %xmm0,%xmm6
.byte 15,84,245 // andps %xmm5,%xmm6
.byte 15,85,232 // andnps %xmm0,%xmm5
.byte 15,87,228 // xorps %xmm4,%xmm4
.byte 15,86,238 // orps %xmm6,%xmm5
.byte 15,194,204,1 // cmpltps %xmm4,%xmm1
- .byte 15,40,128,95,98,0,0 // movaps 0x625f(%eax),%xmm0
+ .byte 15,40,128,80,98,0,0 // movaps 0x6250(%eax),%xmm0
.byte 15,92,197 // subps %xmm5,%xmm0
.byte 15,84,193 // andps %xmm1,%xmm0
.byte 15,85,205 // andnps %xmm5,%xmm1
.byte 15,86,200 // orps %xmm0,%xmm1
.byte 15,40,194 // movaps %xmm2,%xmm0
.byte 15,194,196,1 // cmpltps %xmm4,%xmm0
- .byte 15,40,168,111,98,0,0 // movaps 0x626f(%eax),%xmm5
+ .byte 15,40,168,96,98,0,0 // movaps 0x6260(%eax),%xmm5
.byte 15,92,233 // subps %xmm1,%xmm5
.byte 15,84,232 // andps %xmm0,%xmm5
.byte 15,85,193 // andnps %xmm1,%xmm0
@@ -62919,15 +62896,15 @@ _sk_xy_to_2pt_conical_quadratic_max_sse2:
.byte 15,40,241 // movaps %xmm1,%xmm6
.byte 15,89,246 // mulps %xmm6,%xmm6
.byte 15,88,240 // addps %xmm0,%xmm6
- .byte 232,0,0,0,0 // call 6b8e <_sk_xy_to_2pt_conical_quadratic_max_sse2+0x31>
+ .byte 232,0,0,0,0 // call 6b7d <_sk_xy_to_2pt_conical_quadratic_max_sse2+0x31>
.byte 90 // pop %edx
.byte 243,15,89,237 // mulss %xmm5,%xmm5
.byte 15,198,237,0 // shufps $0x0,%xmm5,%xmm5
.byte 15,92,245 // subps %xmm5,%xmm6
.byte 243,15,16,65,32 // movss 0x20(%ecx),%xmm0
.byte 15,198,192,0 // shufps $0x0,%xmm0,%xmm0
- .byte 15,89,162,130,103,0,0 // mulps 0x6782(%edx),%xmm4
- .byte 15,89,130,146,103,0,0 // mulps 0x6792(%edx),%xmm0
+ .byte 15,89,162,115,103,0,0 // mulps 0x6773(%edx),%xmm4
+ .byte 15,89,130,131,103,0,0 // mulps 0x6783(%edx),%xmm0
.byte 15,89,198 // mulps %xmm6,%xmm0
.byte 15,40,236 // movaps %xmm4,%xmm5
.byte 15,89,237 // mulps %xmm5,%xmm5
@@ -62935,11 +62912,11 @@ _sk_xy_to_2pt_conical_quadratic_max_sse2:
.byte 15,81,237 // sqrtps %xmm5,%xmm5
.byte 15,40,197 // movaps %xmm5,%xmm0
.byte 15,92,196 // subps %xmm4,%xmm0
- .byte 15,87,162,50,102,0,0 // xorps 0x6632(%edx),%xmm4
+ .byte 15,87,162,35,102,0,0 // xorps 0x6623(%edx),%xmm4
.byte 15,92,229 // subps %xmm5,%xmm4
.byte 243,15,16,105,36 // movss 0x24(%ecx),%xmm5
.byte 15,198,237,0 // shufps $0x0,%xmm5,%xmm5
- .byte 15,89,170,66,97,0,0 // mulps 0x6142(%edx),%xmm5
+ .byte 15,89,170,51,97,0,0 // mulps 0x6133(%edx),%xmm5
.byte 15,89,197 // mulps %xmm5,%xmm0
.byte 15,89,229 // mulps %xmm5,%xmm4
.byte 15,95,196 // maxps %xmm4,%xmm0
@@ -62970,15 +62947,15 @@ _sk_xy_to_2pt_conical_quadratic_min_sse2:
.byte 15,40,241 // movaps %xmm1,%xmm6
.byte 15,89,246 // mulps %xmm6,%xmm6
.byte 15,88,240 // addps %xmm0,%xmm6
- .byte 232,0,0,0,0 // call 6c2c <_sk_xy_to_2pt_conical_quadratic_min_sse2+0x31>
+ .byte 232,0,0,0,0 // call 6c1b <_sk_xy_to_2pt_conical_quadratic_min_sse2+0x31>
.byte 90 // pop %edx
.byte 243,15,89,237 // mulss %xmm5,%xmm5
.byte 15,198,237,0 // shufps $0x0,%xmm5,%xmm5
.byte 15,92,245 // subps %xmm5,%xmm6
.byte 243,15,16,65,32 // movss 0x20(%ecx),%xmm0
.byte 15,198,192,0 // shufps $0x0,%xmm0,%xmm0
- .byte 15,89,162,228,102,0,0 // mulps 0x66e4(%edx),%xmm4
- .byte 15,89,130,244,102,0,0 // mulps 0x66f4(%edx),%xmm0
+ .byte 15,89,162,213,102,0,0 // mulps 0x66d5(%edx),%xmm4
+ .byte 15,89,130,229,102,0,0 // mulps 0x66e5(%edx),%xmm0
.byte 15,89,198 // mulps %xmm6,%xmm0
.byte 15,40,236 // movaps %xmm4,%xmm5
.byte 15,89,237 // mulps %xmm5,%xmm5
@@ -62986,11 +62963,11 @@ _sk_xy_to_2pt_conical_quadratic_min_sse2:
.byte 15,81,237 // sqrtps %xmm5,%xmm5
.byte 15,40,197 // movaps %xmm5,%xmm0
.byte 15,92,196 // subps %xmm4,%xmm0
- .byte 15,87,162,148,101,0,0 // xorps 0x6594(%edx),%xmm4
+ .byte 15,87,162,133,101,0,0 // xorps 0x6585(%edx),%xmm4
.byte 15,92,229 // subps %xmm5,%xmm4
.byte 243,15,16,105,36 // movss 0x24(%ecx),%xmm5
.byte 15,198,237,0 // shufps $0x0,%xmm5,%xmm5
- .byte 15,89,170,164,96,0,0 // mulps 0x60a4(%edx),%xmm5
+ .byte 15,89,170,149,96,0,0 // mulps 0x6095(%edx),%xmm5
.byte 15,89,197 // mulps %xmm5,%xmm0
.byte 15,89,229 // mulps %xmm5,%xmm4
.byte 15,93,196 // minps %xmm4,%xmm0
@@ -63010,7 +62987,7 @@ _sk_xy_to_2pt_conical_linear_sse2:
.byte 85 // push %ebp
.byte 137,229 // mov %esp,%ebp
.byte 131,236,8 // sub $0x8,%esp
- .byte 232,0,0,0,0 // call 6ca4 <_sk_xy_to_2pt_conical_linear_sse2+0xb>
+ .byte 232,0,0,0,0 // call 6c93 <_sk_xy_to_2pt_conical_linear_sse2+0xb>
.byte 89 // pop %ecx
.byte 139,69,12 // mov 0xc(%ebp),%eax
.byte 139,16 // mov (%eax),%edx
@@ -63019,7 +62996,7 @@ _sk_xy_to_2pt_conical_linear_sse2:
.byte 243,15,89,236 // mulss %xmm4,%xmm5
.byte 15,198,237,0 // shufps $0x0,%xmm5,%xmm5
.byte 15,88,232 // addps %xmm0,%xmm5
- .byte 15,89,169,108,102,0,0 // mulps 0x666c(%ecx),%xmm5
+ .byte 15,89,169,93,102,0,0 // mulps 0x665d(%ecx),%xmm5
.byte 15,89,192 // mulps %xmm0,%xmm0
.byte 15,40,241 // movaps %xmm1,%xmm6
.byte 15,89,246 // mulps %xmm6,%xmm6
@@ -63027,7 +63004,7 @@ _sk_xy_to_2pt_conical_linear_sse2:
.byte 243,15,89,228 // mulss %xmm4,%xmm4
.byte 15,198,228,0 // shufps $0x0,%xmm4,%xmm4
.byte 15,92,196 // subps %xmm4,%xmm0
- .byte 15,87,129,28,101,0,0 // xorps 0x651c(%ecx),%xmm0
+ .byte 15,87,129,13,101,0,0 // xorps 0x650d(%ecx),%xmm0
.byte 15,94,197 // divps %xmm5,%xmm0
.byte 141,72,8 // lea 0x8(%eax),%ecx
.byte 131,236,8 // sub $0x8,%esp
@@ -63104,16 +63081,16 @@ _sk_save_xy_sse2:
.byte 131,236,24 // sub $0x18,%esp
.byte 15,41,93,232 // movaps %xmm3,-0x18(%ebp)
.byte 15,40,218 // movaps %xmm2,%xmm3
- .byte 232,0,0,0,0 // call 6d8d <_sk_save_xy_sse2+0x12>
+ .byte 232,0,0,0,0 // call 6d7c <_sk_save_xy_sse2+0x12>
.byte 88 // pop %eax
- .byte 15,40,160,67,95,0,0 // movaps 0x5f43(%eax),%xmm4
+ .byte 15,40,160,52,95,0,0 // movaps 0x5f34(%eax),%xmm4
.byte 15,40,232 // movaps %xmm0,%xmm5
.byte 15,88,236 // addps %xmm4,%xmm5
.byte 243,15,91,245 // cvttps2dq %xmm5,%xmm6
.byte 15,91,246 // cvtdq2ps %xmm6,%xmm6
.byte 15,40,253 // movaps %xmm5,%xmm7
.byte 15,194,254,1 // cmpltps %xmm6,%xmm7
- .byte 15,40,144,83,95,0,0 // movaps 0x5f53(%eax),%xmm2
+ .byte 15,40,144,68,95,0,0 // movaps 0x5f44(%eax),%xmm2
.byte 15,84,250 // andps %xmm2,%xmm7
.byte 15,92,247 // subps %xmm7,%xmm6
.byte 15,92,238 // subps %xmm6,%xmm5
@@ -63188,15 +63165,15 @@ _sk_bilinear_nx_sse2:
.byte 137,229 // mov %esp,%ebp
.byte 86 // push %esi
.byte 80 // push %eax
- .byte 232,0,0,0,0 // call 6e6f <_sk_bilinear_nx_sse2+0xa>
+ .byte 232,0,0,0,0 // call 6e5e <_sk_bilinear_nx_sse2+0xa>
.byte 88 // pop %eax
.byte 139,77,8 // mov 0x8(%ebp),%ecx
.byte 139,85,12 // mov 0xc(%ebp),%edx
.byte 139,50 // mov (%edx),%esi
.byte 15,16,6 // movups (%esi),%xmm0
.byte 15,16,102,64 // movups 0x40(%esi),%xmm4
- .byte 15,88,128,193,100,0,0 // addps 0x64c1(%eax),%xmm0
- .byte 15,40,168,113,94,0,0 // movaps 0x5e71(%eax),%xmm5
+ .byte 15,88,128,178,100,0,0 // addps 0x64b2(%eax),%xmm0
+ .byte 15,40,168,98,94,0,0 // movaps 0x5e62(%eax),%xmm5
.byte 15,92,236 // subps %xmm4,%xmm5
.byte 15,17,174,128,0,0,0 // movups %xmm5,0x80(%esi)
.byte 141,66,8 // lea 0x8(%edx),%eax
@@ -63217,14 +63194,14 @@ _sk_bilinear_px_sse2:
.byte 137,229 // mov %esp,%ebp
.byte 86 // push %esi
.byte 80 // push %eax
- .byte 232,0,0,0,0 // call 6eb2 <_sk_bilinear_px_sse2+0xa>
+ .byte 232,0,0,0,0 // call 6ea1 <_sk_bilinear_px_sse2+0xa>
.byte 88 // pop %eax
.byte 139,77,8 // mov 0x8(%ebp),%ecx
.byte 139,85,12 // mov 0xc(%ebp),%edx
.byte 139,50 // mov (%edx),%esi
.byte 15,16,6 // movups (%esi),%xmm0
.byte 15,16,102,64 // movups 0x40(%esi),%xmm4
- .byte 15,88,128,30,94,0,0 // addps 0x5e1e(%eax),%xmm0
+ .byte 15,88,128,15,94,0,0 // addps 0x5e0f(%eax),%xmm0
.byte 15,17,166,128,0,0,0 // movups %xmm4,0x80(%esi)
.byte 141,66,8 // lea 0x8(%edx),%eax
.byte 131,236,8 // sub $0x8,%esp
@@ -63244,15 +63221,15 @@ _sk_bilinear_ny_sse2:
.byte 137,229 // mov %esp,%ebp
.byte 86 // push %esi
.byte 80 // push %eax
- .byte 232,0,0,0,0 // call 6eeb <_sk_bilinear_ny_sse2+0xa>
+ .byte 232,0,0,0,0 // call 6eda <_sk_bilinear_ny_sse2+0xa>
.byte 88 // pop %eax
.byte 139,77,8 // mov 0x8(%ebp),%ecx
.byte 139,85,12 // mov 0xc(%ebp),%edx
.byte 139,50 // mov (%edx),%esi
.byte 15,16,78,32 // movups 0x20(%esi),%xmm1
.byte 15,16,102,96 // movups 0x60(%esi),%xmm4
- .byte 15,88,136,69,100,0,0 // addps 0x6445(%eax),%xmm1
- .byte 15,40,168,245,93,0,0 // movaps 0x5df5(%eax),%xmm5
+ .byte 15,88,136,54,100,0,0 // addps 0x6436(%eax),%xmm1
+ .byte 15,40,168,230,93,0,0 // movaps 0x5de6(%eax),%xmm5
.byte 15,92,236 // subps %xmm4,%xmm5
.byte 15,17,174,160,0,0,0 // movups %xmm5,0xa0(%esi)
.byte 141,66,8 // lea 0x8(%edx),%eax
@@ -63273,14 +63250,14 @@ _sk_bilinear_py_sse2:
.byte 137,229 // mov %esp,%ebp
.byte 86 // push %esi
.byte 80 // push %eax
- .byte 232,0,0,0,0 // call 6f2f <_sk_bilinear_py_sse2+0xa>
+ .byte 232,0,0,0,0 // call 6f1e <_sk_bilinear_py_sse2+0xa>
.byte 88 // pop %eax
.byte 139,77,8 // mov 0x8(%ebp),%ecx
.byte 139,85,12 // mov 0xc(%ebp),%edx
.byte 139,50 // mov (%edx),%esi
.byte 15,16,78,32 // movups 0x20(%esi),%xmm1
.byte 15,16,102,96 // movups 0x60(%esi),%xmm4
- .byte 15,88,136,161,93,0,0 // addps 0x5da1(%eax),%xmm1
+ .byte 15,88,136,146,93,0,0 // addps 0x5d92(%eax),%xmm1
.byte 15,17,166,160,0,0,0 // movups %xmm4,0xa0(%esi)
.byte 141,66,8 // lea 0x8(%edx),%eax
.byte 131,236,8 // sub $0x8,%esp
@@ -63300,20 +63277,20 @@ _sk_bicubic_n3x_sse2:
.byte 137,229 // mov %esp,%ebp
.byte 86 // push %esi
.byte 80 // push %eax
- .byte 232,0,0,0,0 // call 6f69 <_sk_bicubic_n3x_sse2+0xa>
+ .byte 232,0,0,0,0 // call 6f58 <_sk_bicubic_n3x_sse2+0xa>
.byte 88 // pop %eax
.byte 139,77,8 // mov 0x8(%ebp),%ecx
.byte 139,85,12 // mov 0xc(%ebp),%edx
.byte 139,50 // mov (%edx),%esi
.byte 15,16,6 // movups (%esi),%xmm0
.byte 15,16,102,64 // movups 0x40(%esi),%xmm4
- .byte 15,88,128,215,99,0,0 // addps 0x63d7(%eax),%xmm0
- .byte 15,40,168,119,93,0,0 // movaps 0x5d77(%eax),%xmm5
+ .byte 15,88,128,200,99,0,0 // addps 0x63c8(%eax),%xmm0
+ .byte 15,40,168,104,93,0,0 // movaps 0x5d68(%eax),%xmm5
.byte 15,92,236 // subps %xmm4,%xmm5
.byte 15,40,229 // movaps %xmm5,%xmm4
.byte 15,89,228 // mulps %xmm4,%xmm4
- .byte 15,89,168,231,99,0,0 // mulps 0x63e7(%eax),%xmm5
- .byte 15,88,168,87,95,0,0 // addps 0x5f57(%eax),%xmm5
+ .byte 15,89,168,216,99,0,0 // mulps 0x63d8(%eax),%xmm5
+ .byte 15,88,168,72,95,0,0 // addps 0x5f48(%eax),%xmm5
.byte 15,89,236 // mulps %xmm4,%xmm5
.byte 15,17,174,128,0,0,0 // movups %xmm5,0x80(%esi)
.byte 141,66,8 // lea 0x8(%edx),%eax
@@ -63334,23 +63311,23 @@ _sk_bicubic_n1x_sse2:
.byte 137,229 // mov %esp,%ebp
.byte 86 // push %esi
.byte 80 // push %eax
- .byte 232,0,0,0,0 // call 6fc3 <_sk_bicubic_n1x_sse2+0xa>
+ .byte 232,0,0,0,0 // call 6fb2 <_sk_bicubic_n1x_sse2+0xa>
.byte 88 // pop %eax
.byte 139,77,8 // mov 0x8(%ebp),%ecx
.byte 139,85,12 // mov 0xc(%ebp),%edx
.byte 139,50 // mov (%edx),%esi
.byte 15,16,6 // movups (%esi),%xmm0
.byte 15,16,102,64 // movups 0x40(%esi),%xmm4
- .byte 15,88,128,109,99,0,0 // addps 0x636d(%eax),%xmm0
- .byte 15,40,168,29,93,0,0 // movaps 0x5d1d(%eax),%xmm5
+ .byte 15,88,128,94,99,0,0 // addps 0x635e(%eax),%xmm0
+ .byte 15,40,168,14,93,0,0 // movaps 0x5d0e(%eax),%xmm5
.byte 15,92,236 // subps %xmm4,%xmm5
- .byte 15,40,160,157,99,0,0 // movaps 0x639d(%eax),%xmm4
+ .byte 15,40,160,142,99,0,0 // movaps 0x638e(%eax),%xmm4
.byte 15,89,229 // mulps %xmm5,%xmm4
- .byte 15,88,160,173,99,0,0 // addps 0x63ad(%eax),%xmm4
+ .byte 15,88,160,158,99,0,0 // addps 0x639e(%eax),%xmm4
.byte 15,89,229 // mulps %xmm5,%xmm4
- .byte 15,88,160,13,93,0,0 // addps 0x5d0d(%eax),%xmm4
+ .byte 15,88,160,254,92,0,0 // addps 0x5cfe(%eax),%xmm4
.byte 15,89,229 // mulps %xmm5,%xmm4
- .byte 15,88,160,189,99,0,0 // addps 0x63bd(%eax),%xmm4
+ .byte 15,88,160,174,99,0,0 // addps 0x63ae(%eax),%xmm4
.byte 15,17,166,128,0,0,0 // movups %xmm4,0x80(%esi)
.byte 141,66,8 // lea 0x8(%edx),%eax
.byte 131,236,8 // sub $0x8,%esp
@@ -63370,22 +63347,22 @@ _sk_bicubic_p1x_sse2:
.byte 137,229 // mov %esp,%ebp
.byte 86 // push %esi
.byte 80 // push %eax
- .byte 232,0,0,0,0 // call 702b <_sk_bicubic_p1x_sse2+0xa>
+ .byte 232,0,0,0,0 // call 701a <_sk_bicubic_p1x_sse2+0xa>
.byte 88 // pop %eax
.byte 139,77,8 // mov 0x8(%ebp),%ecx
.byte 139,85,12 // mov 0xc(%ebp),%edx
.byte 139,50 // mov (%edx),%esi
- .byte 15,40,160,165,92,0,0 // movaps 0x5ca5(%eax),%xmm4
+ .byte 15,40,160,150,92,0,0 // movaps 0x5c96(%eax),%xmm4
.byte 15,16,6 // movups (%esi),%xmm0
.byte 15,16,110,64 // movups 0x40(%esi),%xmm5
.byte 15,88,196 // addps %xmm4,%xmm0
- .byte 15,40,176,53,99,0,0 // movaps 0x6335(%eax),%xmm6
+ .byte 15,40,176,38,99,0,0 // movaps 0x6326(%eax),%xmm6
.byte 15,89,245 // mulps %xmm5,%xmm6
- .byte 15,88,176,69,99,0,0 // addps 0x6345(%eax),%xmm6
+ .byte 15,88,176,54,99,0,0 // addps 0x6336(%eax),%xmm6
.byte 15,89,245 // mulps %xmm5,%xmm6
.byte 15,88,244 // addps %xmm4,%xmm6
.byte 15,89,245 // mulps %xmm5,%xmm6
- .byte 15,88,176,85,99,0,0 // addps 0x6355(%eax),%xmm6
+ .byte 15,88,176,70,99,0,0 // addps 0x6346(%eax),%xmm6
.byte 15,17,182,128,0,0,0 // movups %xmm6,0x80(%esi)
.byte 141,66,8 // lea 0x8(%edx),%eax
.byte 131,236,8 // sub $0x8,%esp
@@ -63405,18 +63382,18 @@ _sk_bicubic_p3x_sse2:
.byte 137,229 // mov %esp,%ebp
.byte 86 // push %esi
.byte 80 // push %eax
- .byte 232,0,0,0,0 // call 7088 <_sk_bicubic_p3x_sse2+0xa>
+ .byte 232,0,0,0,0 // call 7077 <_sk_bicubic_p3x_sse2+0xa>
.byte 88 // pop %eax
.byte 139,77,8 // mov 0x8(%ebp),%ecx
.byte 139,85,12 // mov 0xc(%ebp),%edx
.byte 139,50 // mov (%edx),%esi
.byte 15,16,6 // movups (%esi),%xmm0
.byte 15,16,102,64 // movups 0x40(%esi),%xmm4
- .byte 15,88,128,232,98,0,0 // addps 0x62e8(%eax),%xmm0
+ .byte 15,88,128,217,98,0,0 // addps 0x62d9(%eax),%xmm0
.byte 15,40,236 // movaps %xmm4,%xmm5
.byte 15,89,237 // mulps %xmm5,%xmm5
- .byte 15,89,160,200,98,0,0 // mulps 0x62c8(%eax),%xmm4
- .byte 15,88,160,56,94,0,0 // addps 0x5e38(%eax),%xmm4
+ .byte 15,89,160,185,98,0,0 // mulps 0x62b9(%eax),%xmm4
+ .byte 15,88,160,41,94,0,0 // addps 0x5e29(%eax),%xmm4
.byte 15,89,229 // mulps %xmm5,%xmm4
.byte 15,17,166,128,0,0,0 // movups %xmm4,0x80(%esi)
.byte 141,66,8 // lea 0x8(%edx),%eax
@@ -63437,20 +63414,20 @@ _sk_bicubic_n3y_sse2:
.byte 137,229 // mov %esp,%ebp
.byte 86 // push %esi
.byte 80 // push %eax
- .byte 232,0,0,0,0 // call 70d8 <_sk_bicubic_n3y_sse2+0xa>
+ .byte 232,0,0,0,0 // call 70c7 <_sk_bicubic_n3y_sse2+0xa>
.byte 88 // pop %eax
.byte 139,77,8 // mov 0x8(%ebp),%ecx
.byte 139,85,12 // mov 0xc(%ebp),%edx
.byte 139,50 // mov (%edx),%esi
.byte 15,16,78,32 // movups 0x20(%esi),%xmm1
.byte 15,16,102,96 // movups 0x60(%esi),%xmm4
- .byte 15,88,136,104,98,0,0 // addps 0x6268(%eax),%xmm1
- .byte 15,40,168,8,92,0,0 // movaps 0x5c08(%eax),%xmm5
+ .byte 15,88,136,89,98,0,0 // addps 0x6259(%eax),%xmm1
+ .byte 15,40,168,249,91,0,0 // movaps 0x5bf9(%eax),%xmm5
.byte 15,92,236 // subps %xmm4,%xmm5
.byte 15,40,229 // movaps %xmm5,%xmm4
.byte 15,89,228 // mulps %xmm4,%xmm4
- .byte 15,89,168,120,98,0,0 // mulps 0x6278(%eax),%xmm5
- .byte 15,88,168,232,93,0,0 // addps 0x5de8(%eax),%xmm5
+ .byte 15,89,168,105,98,0,0 // mulps 0x6269(%eax),%xmm5
+ .byte 15,88,168,217,93,0,0 // addps 0x5dd9(%eax),%xmm5
.byte 15,89,236 // mulps %xmm4,%xmm5
.byte 15,17,174,160,0,0,0 // movups %xmm5,0xa0(%esi)
.byte 141,66,8 // lea 0x8(%edx),%eax
@@ -63471,23 +63448,23 @@ _sk_bicubic_n1y_sse2:
.byte 137,229 // mov %esp,%ebp
.byte 86 // push %esi
.byte 80 // push %eax
- .byte 232,0,0,0,0 // call 7133 <_sk_bicubic_n1y_sse2+0xa>
+ .byte 232,0,0,0,0 // call 7122 <_sk_bicubic_n1y_sse2+0xa>
.byte 88 // pop %eax
.byte 139,77,8 // mov 0x8(%ebp),%ecx
.byte 139,85,12 // mov 0xc(%ebp),%edx
.byte 139,50 // mov (%edx),%esi
.byte 15,16,78,32 // movups 0x20(%esi),%xmm1
.byte 15,16,102,96 // movups 0x60(%esi),%xmm4
- .byte 15,88,136,253,97,0,0 // addps 0x61fd(%eax),%xmm1
- .byte 15,40,168,173,91,0,0 // movaps 0x5bad(%eax),%xmm5
+ .byte 15,88,136,238,97,0,0 // addps 0x61ee(%eax),%xmm1
+ .byte 15,40,168,158,91,0,0 // movaps 0x5b9e(%eax),%xmm5
.byte 15,92,236 // subps %xmm4,%xmm5
- .byte 15,40,160,45,98,0,0 // movaps 0x622d(%eax),%xmm4
+ .byte 15,40,160,30,98,0,0 // movaps 0x621e(%eax),%xmm4
.byte 15,89,229 // mulps %xmm5,%xmm4
- .byte 15,88,160,61,98,0,0 // addps 0x623d(%eax),%xmm4
+ .byte 15,88,160,46,98,0,0 // addps 0x622e(%eax),%xmm4
.byte 15,89,229 // mulps %xmm5,%xmm4
- .byte 15,88,160,157,91,0,0 // addps 0x5b9d(%eax),%xmm4
+ .byte 15,88,160,142,91,0,0 // addps 0x5b8e(%eax),%xmm4
.byte 15,89,229 // mulps %xmm5,%xmm4
- .byte 15,88,160,77,98,0,0 // addps 0x624d(%eax),%xmm4
+ .byte 15,88,160,62,98,0,0 // addps 0x623e(%eax),%xmm4
.byte 15,17,166,160,0,0,0 // movups %xmm4,0xa0(%esi)
.byte 141,66,8 // lea 0x8(%edx),%eax
.byte 131,236,8 // sub $0x8,%esp
@@ -63507,22 +63484,22 @@ _sk_bicubic_p1y_sse2:
.byte 137,229 // mov %esp,%ebp
.byte 86 // push %esi
.byte 80 // push %eax
- .byte 232,0,0,0,0 // call 719c <_sk_bicubic_p1y_sse2+0xa>
+ .byte 232,0,0,0,0 // call 718b <_sk_bicubic_p1y_sse2+0xa>
.byte 88 // pop %eax
.byte 139,77,8 // mov 0x8(%ebp),%ecx
.byte 139,85,12 // mov 0xc(%ebp),%edx
.byte 139,50 // mov (%edx),%esi
- .byte 15,40,160,52,91,0,0 // movaps 0x5b34(%eax),%xmm4
+ .byte 15,40,160,37,91,0,0 // movaps 0x5b25(%eax),%xmm4
.byte 15,16,78,32 // movups 0x20(%esi),%xmm1
.byte 15,16,110,96 // movups 0x60(%esi),%xmm5
.byte 15,88,204 // addps %xmm4,%xmm1
- .byte 15,40,176,196,97,0,0 // movaps 0x61c4(%eax),%xmm6
+ .byte 15,40,176,181,97,0,0 // movaps 0x61b5(%eax),%xmm6
.byte 15,89,245 // mulps %xmm5,%xmm6
- .byte 15,88,176,212,97,0,0 // addps 0x61d4(%eax),%xmm6
+ .byte 15,88,176,197,97,0,0 // addps 0x61c5(%eax),%xmm6
.byte 15,89,245 // mulps %xmm5,%xmm6
.byte 15,88,244 // addps %xmm4,%xmm6
.byte 15,89,245 // mulps %xmm5,%xmm6
- .byte 15,88,176,228,97,0,0 // addps 0x61e4(%eax),%xmm6
+ .byte 15,88,176,213,97,0,0 // addps 0x61d5(%eax),%xmm6
.byte 15,17,182,160,0,0,0 // movups %xmm6,0xa0(%esi)
.byte 141,66,8 // lea 0x8(%edx),%eax
.byte 131,236,8 // sub $0x8,%esp
@@ -63542,18 +63519,18 @@ _sk_bicubic_p3y_sse2:
.byte 137,229 // mov %esp,%ebp
.byte 86 // push %esi
.byte 80 // push %eax
- .byte 232,0,0,0,0 // call 71fa <_sk_bicubic_p3y_sse2+0xa>
+ .byte 232,0,0,0,0 // call 71e9 <_sk_bicubic_p3y_sse2+0xa>
.byte 88 // pop %eax
.byte 139,77,8 // mov 0x8(%ebp),%ecx
.byte 139,85,12 // mov 0xc(%ebp),%edx
.byte 139,50 // mov (%edx),%esi
.byte 15,16,78,32 // movups 0x20(%esi),%xmm1
.byte 15,16,102,96 // movups 0x60(%esi),%xmm4
- .byte 15,88,136,118,97,0,0 // addps 0x6176(%eax),%xmm1
+ .byte 15,88,136,103,97,0,0 // addps 0x6167(%eax),%xmm1
.byte 15,40,236 // movaps %xmm4,%xmm5
.byte 15,89,237 // mulps %xmm5,%xmm5
- .byte 15,89,160,86,97,0,0 // mulps 0x6156(%eax),%xmm4
- .byte 15,88,160,198,92,0,0 // addps 0x5cc6(%eax),%xmm4
+ .byte 15,89,160,71,97,0,0 // mulps 0x6147(%eax),%xmm4
+ .byte 15,88,160,183,92,0,0 // addps 0x5cb7(%eax),%xmm4
.byte 15,89,229 // mulps %xmm5,%xmm4
.byte 15,17,166,160,0,0,0 // movups %xmm4,0xa0(%esi)
.byte 141,66,8 // lea 0x8(%edx),%eax
@@ -63576,10 +63553,10 @@ _sk_callback_sse2:
.byte 87 // push %edi
.byte 86 // push %esi
.byte 131,236,12 // sub $0xc,%esp
- .byte 139,117,12 // mov 0xc(%ebp),%esi
- .byte 139,125,8 // mov 0x8(%ebp),%edi
- .byte 139,71,8 // mov 0x8(%edi),%eax
- .byte 139,30 // mov (%esi),%ebx
+ .byte 139,117,8 // mov 0x8(%ebp),%esi
+ .byte 139,125,12 // mov 0xc(%ebp),%edi
+ .byte 139,31 // mov (%edi),%ebx
+ .byte 139,70,8 // mov 0x8(%esi),%eax
.byte 15,40,224 // movaps %xmm0,%xmm4
.byte 15,20,225 // unpcklps %xmm1,%xmm4
.byte 15,40,234 // movaps %xmm2,%xmm5
@@ -63621,11 +63598,11 @@ _sk_callback_sse2:
.byte 15,40,212 // movaps %xmm4,%xmm2
.byte 102,15,20,211 // unpcklpd %xmm3,%xmm2
.byte 15,18,220 // movhlps %xmm4,%xmm3
- .byte 141,70,8 // lea 0x8(%esi),%eax
+ .byte 141,71,8 // lea 0x8(%edi),%eax
.byte 131,236,8 // sub $0x8,%esp
.byte 80 // push %eax
- .byte 87 // push %edi
- .byte 255,86,4 // call *0x4(%esi)
+ .byte 86 // push %esi
+ .byte 255,87,4 // call *0x4(%edi)
.byte 131,196,28 // add $0x1c,%esp
.byte 94 // pop %esi
.byte 95 // pop %edi
@@ -63642,12 +63619,10 @@ _sk_clut_3D_sse2:
.byte 83 // push %ebx
.byte 87 // push %edi
.byte 86 // push %esi
- .byte 129,236,44,1,0,0 // sub $0x12c,%esp
- .byte 15,41,157,200,254,255,255 // movaps %xmm3,-0x138(%ebp)
+ .byte 129,236,28,1,0,0 // sub $0x11c,%esp
+ .byte 15,41,157,216,254,255,255 // movaps %xmm3,-0x128(%ebp)
.byte 15,40,216 // movaps %xmm0,%xmm3
.byte 139,69,12 // mov 0xc(%ebp),%eax
- .byte 141,72,4 // lea 0x4(%eax),%ecx
- .byte 137,141,20,255,255,255 // mov %ecx,-0xec(%ebp)
.byte 139,8 // mov (%eax),%ecx
.byte 139,81,12 // mov 0xc(%ecx),%edx
.byte 141,114,255 // lea -0x1(%edx),%esi
@@ -63656,7 +63631,7 @@ _sk_clut_3D_sse2:
.byte 15,91,192 // cvtdq2ps %xmm0,%xmm0
.byte 15,89,194 // mulps %xmm2,%xmm0
.byte 15,40,224 // movaps %xmm0,%xmm4
- .byte 15,41,165,232,254,255,255 // movaps %xmm4,-0x118(%ebp)
+ .byte 15,41,165,248,254,255,255 // movaps %xmm4,-0x108(%ebp)
.byte 102,15,110,194 // movd %edx,%xmm0
.byte 102,15,112,240,0 // pshufd $0x0,%xmm0,%xmm6
.byte 102,15,127,117,152 // movdqa %xmm6,-0x68(%ebp)
@@ -63698,15 +63673,15 @@ _sk_clut_3D_sse2:
.byte 102,15,112,192,232 // pshufd $0xe8,%xmm0,%xmm0
.byte 102,15,98,200 // punpckldq %xmm0,%xmm1
.byte 102,15,127,77,136 // movdqa %xmm1,-0x78(%ebp)
- .byte 232,0,0,0,0 // call 73e6 <_sk_clut_3D_sse2+0xf7>
+ .byte 232,0,0,0,0 // call 73cc <_sk_clut_3D_sse2+0xee>
.byte 90 // pop %edx
.byte 243,15,91,196 // cvttps2dq %xmm4,%xmm0
- .byte 102,15,127,133,248,254,255,255 // movdqa %xmm0,-0x108(%ebp)
+ .byte 102,15,127,133,8,255,255,255 // movdqa %xmm0,-0xf8(%ebp)
.byte 102,15,111,221 // movdqa %xmm5,%xmm3
.byte 102,15,254,216 // paddd %xmm0,%xmm3
.byte 102,15,111,193 // movdqa %xmm1,%xmm0
.byte 102,15,254,195 // paddd %xmm3,%xmm0
- .byte 102,15,111,162,186,95,0,0 // movdqa 0x5fba(%edx),%xmm4
+ .byte 102,15,111,162,180,95,0,0 // movdqa 0x5fb4(%edx),%xmm4
.byte 102,15,127,165,120,255,255,255 // movdqa %xmm4,-0x88(%ebp)
.byte 102,15,112,200,245 // pshufd $0xf5,%xmm0,%xmm1
.byte 102,15,244,196 // pmuludq %xmm4,%xmm0
@@ -63746,7 +63721,7 @@ _sk_clut_3D_sse2:
.byte 243,15,16,4,129 // movss (%ecx,%eax,4),%xmm0
.byte 15,20,248 // unpcklps %xmm0,%xmm7
.byte 102,15,20,252 // unpcklpd %xmm4,%xmm7
- .byte 102,15,111,130,58,89,0,0 // movdqa 0x593a(%edx),%xmm0
+ .byte 102,15,111,130,52,89,0,0 // movdqa 0x5934(%edx),%xmm0
.byte 102,15,127,133,104,255,255,255 // movdqa %xmm0,-0x98(%ebp)
.byte 102,15,254,200 // paddd %xmm0,%xmm1
.byte 102,15,112,193,229 // pshufd $0xe5,%xmm1,%xmm0
@@ -63763,8 +63738,8 @@ _sk_clut_3D_sse2:
.byte 243,15,16,4,129 // movss (%ecx,%eax,4),%xmm0
.byte 15,20,240 // unpcklps %xmm0,%xmm6
.byte 102,15,20,241 // unpcklpd %xmm1,%xmm6
- .byte 15,40,130,170,95,0,0 // movaps 0x5faa(%edx),%xmm0
- .byte 15,40,141,232,254,255,255 // movaps -0x118(%ebp),%xmm1
+ .byte 15,40,130,164,95,0,0 // movaps 0x5fa4(%edx),%xmm0
+ .byte 15,40,141,248,254,255,255 // movaps -0x108(%ebp),%xmm1
.byte 15,88,200 // addps %xmm0,%xmm1
.byte 15,41,77,200 // movaps %xmm1,-0x38(%ebp)
.byte 15,40,141,88,255,255,255 // movaps -0xa8(%ebp),%xmm1
@@ -63848,7 +63823,7 @@ _sk_clut_3D_sse2:
.byte 15,92,206 // subps %xmm6,%xmm1
.byte 15,89,204 // mulps %xmm4,%xmm1
.byte 15,88,206 // addps %xmm6,%xmm1
- .byte 15,41,141,216,254,255,255 // movaps %xmm1,-0x128(%ebp)
+ .byte 15,41,141,232,254,255,255 // movaps %xmm1,-0x118(%ebp)
.byte 243,15,91,133,72,255,255,255 // cvttps2dq -0xb8(%ebp),%xmm0
.byte 102,15,112,224,245 // pshufd $0xf5,%xmm0,%xmm4
.byte 102,15,111,77,152 // movdqa -0x68(%ebp),%xmm1
@@ -63859,7 +63834,7 @@ _sk_clut_3D_sse2:
.byte 102,15,112,196,232 // pshufd $0xe8,%xmm4,%xmm0
.byte 102,15,98,248 // punpckldq %xmm0,%xmm7
.byte 102,15,127,125,152 // movdqa %xmm7,-0x68(%ebp)
- .byte 102,15,254,189,248,254,255,255 // paddd -0x108(%ebp),%xmm7
+ .byte 102,15,254,189,8,255,255,255 // paddd -0xf8(%ebp),%xmm7
.byte 102,15,111,199 // movdqa %xmm7,%xmm0
.byte 102,15,254,69,136 // paddd -0x78(%ebp),%xmm0
.byte 102,15,112,224,245 // pshufd $0xf5,%xmm0,%xmm4
@@ -63996,7 +63971,7 @@ _sk_clut_3D_sse2:
.byte 15,89,212 // mulps %xmm4,%xmm2
.byte 15,88,208 // addps %xmm0,%xmm2
.byte 15,41,149,56,255,255,255 // movaps %xmm2,-0xc8(%ebp)
- .byte 15,40,133,216,254,255,255 // movaps -0x128(%ebp),%xmm0
+ .byte 15,40,133,232,254,255,255 // movaps -0x118(%ebp),%xmm0
.byte 15,92,216 // subps %xmm0,%xmm3
.byte 15,89,220 // mulps %xmm4,%xmm3
.byte 15,88,216 // addps %xmm0,%xmm3
@@ -64267,8 +64242,8 @@ _sk_clut_3D_sse2:
.byte 15,92,214 // subps %xmm6,%xmm2
.byte 15,89,211 // mulps %xmm3,%xmm2
.byte 15,88,214 // addps %xmm6,%xmm2
- .byte 15,91,157,248,254,255,255 // cvtdq2ps -0x108(%ebp),%xmm3
- .byte 15,40,165,232,254,255,255 // movaps -0x118(%ebp),%xmm4
+ .byte 15,91,157,8,255,255,255 // cvtdq2ps -0xf8(%ebp),%xmm3
+ .byte 15,40,165,248,254,255,255 // movaps -0x108(%ebp),%xmm4
.byte 15,92,227 // subps %xmm3,%xmm4
.byte 15,40,93,184 // movaps -0x48(%ebp),%xmm3
.byte 15,92,195 // subps %xmm3,%xmm0
@@ -64282,15 +64257,14 @@ _sk_clut_3D_sse2:
.byte 15,92,211 // subps %xmm3,%xmm2
.byte 15,89,212 // mulps %xmm4,%xmm2
.byte 15,88,211 // addps %xmm3,%xmm2
- .byte 139,69,8 // mov 0x8(%ebp),%eax
- .byte 139,85,12 // mov 0xc(%ebp),%edx
- .byte 141,74,8 // lea 0x8(%edx),%ecx
+ .byte 139,77,12 // mov 0xc(%ebp),%ecx
+ .byte 141,65,8 // lea 0x8(%ecx),%eax
.byte 131,236,8 // sub $0x8,%esp
- .byte 15,40,157,200,254,255,255 // movaps -0x138(%ebp),%xmm3
- .byte 81 // push %ecx
+ .byte 15,40,157,216,254,255,255 // movaps -0x128(%ebp),%xmm3
.byte 80 // push %eax
- .byte 255,82,4 // call *0x4(%edx)
- .byte 129,196,60,1,0,0 // add $0x13c,%esp
+ .byte 255,117,8 // pushl 0x8(%ebp)
+ .byte 255,81,4 // call *0x4(%ecx)
+ .byte 129,196,44,1,0,0 // add $0x12c,%esp
.byte 94 // pop %esi
.byte 95 // pop %edi
.byte 91 // pop %ebx
@@ -64306,10 +64280,8 @@ _sk_clut_4D_sse2:
.byte 83 // push %ebx
.byte 87 // push %edi
.byte 86 // push %esi
- .byte 129,236,92,1,0,0 // sub $0x15c,%esp
+ .byte 129,236,76,1,0,0 // sub $0x14c,%esp
.byte 139,69,12 // mov 0xc(%ebp),%eax
- .byte 141,72,4 // lea 0x4(%eax),%ecx
- .byte 137,141,212,254,255,255 // mov %ecx,-0x12c(%ebp)
.byte 139,16 // mov (%eax),%edx
.byte 139,74,16 // mov 0x10(%edx),%ecx
.byte 141,113,255 // lea -0x1(%ecx),%esi
@@ -64386,18 +64358,18 @@ _sk_clut_4D_sse2:
.byte 102,15,112,201,232 // pshufd $0xe8,%xmm1,%xmm1
.byte 102,15,98,217 // punpckldq %xmm1,%xmm3
.byte 102,15,127,93,152 // movdqa %xmm3,-0x68(%ebp)
- .byte 232,0,0,0,0 // call 7f7c <_sk_clut_4D_sse2+0x16e>
+ .byte 232,0,0,0,0 // call 7f58 <_sk_clut_4D_sse2+0x165>
.byte 89 // pop %ecx
.byte 15,40,197 // movaps %xmm5,%xmm0
- .byte 15,41,133,152,254,255,255 // movaps %xmm0,-0x168(%ebp)
+ .byte 15,41,133,168,254,255,255 // movaps %xmm0,-0x158(%ebp)
.byte 243,15,91,200 // cvttps2dq %xmm0,%xmm1
- .byte 102,15,127,141,184,254,255,255 // movdqa %xmm1,-0x148(%ebp)
+ .byte 102,15,127,141,200,254,255,255 // movdqa %xmm1,-0x138(%ebp)
.byte 102,15,254,241 // paddd %xmm1,%xmm6
.byte 102,15,127,117,200 // movdqa %xmm6,-0x38(%ebp)
.byte 102,15,111,212 // movdqa %xmm4,%xmm2
.byte 102,15,254,214 // paddd %xmm6,%xmm2
.byte 102,15,254,218 // paddd %xmm2,%xmm3
- .byte 102,15,111,161,36,84,0,0 // movdqa 0x5424(%ecx),%xmm4
+ .byte 102,15,111,161,40,84,0,0 // movdqa 0x5428(%ecx),%xmm4
.byte 102,15,112,203,245 // pshufd $0xf5,%xmm3,%xmm1
.byte 102,15,244,220 // pmuludq %xmm4,%xmm3
.byte 102,15,244,204 // pmuludq %xmm4,%xmm1
@@ -64439,7 +64411,7 @@ _sk_clut_4D_sse2:
.byte 15,20,223 // unpcklps %xmm7,%xmm3
.byte 102,15,20,222 // unpcklpd %xmm6,%xmm3
.byte 102,15,41,157,232,254,255,255 // movapd %xmm3,-0x118(%ebp)
- .byte 102,15,254,137,164,77,0,0 // paddd 0x4da4(%ecx),%xmm1
+ .byte 102,15,254,137,168,77,0,0 // paddd 0x4da8(%ecx),%xmm1
.byte 102,15,112,241,229 // pshufd $0xe5,%xmm1,%xmm6
.byte 102,15,126,240 // movd %xmm6,%eax
.byte 102,15,112,241,78 // pshufd $0x4e,%xmm1,%xmm6
@@ -64454,7 +64426,7 @@ _sk_clut_4D_sse2:
.byte 243,15,16,60,130 // movss (%edx,%eax,4),%xmm7
.byte 15,20,223 // unpcklps %xmm7,%xmm3
.byte 102,15,20,222 // unpcklpd %xmm6,%xmm3
- .byte 15,40,185,20,84,0,0 // movaps 0x5414(%ecx),%xmm7
+ .byte 15,40,185,24,84,0,0 // movaps 0x5418(%ecx),%xmm7
.byte 15,88,199 // addps %xmm7,%xmm0
.byte 15,41,133,120,255,255,255 // movaps %xmm0,-0x88(%ebp)
.byte 15,40,133,248,254,255,255 // movaps -0x108(%ebp),%xmm0
@@ -64462,7 +64434,7 @@ _sk_clut_4D_sse2:
.byte 15,41,69,136 // movaps %xmm0,-0x78(%ebp)
.byte 15,40,133,56,255,255,255 // movaps -0xc8(%ebp),%xmm0
.byte 15,88,199 // addps %xmm7,%xmm0
- .byte 15,41,133,168,254,255,255 // movaps %xmm0,-0x158(%ebp)
+ .byte 15,41,133,184,254,255,255 // movaps %xmm0,-0x148(%ebp)
.byte 15,88,125,216 // addps -0x28(%ebp),%xmm7
.byte 243,15,91,255 // cvttps2dq %xmm7,%xmm7
.byte 102,15,112,199,245 // pshufd $0xf5,%xmm7,%xmm0
@@ -64475,7 +64447,7 @@ _sk_clut_4D_sse2:
.byte 102,15,127,101,168 // movdqa %xmm4,-0x58(%ebp)
.byte 102,15,254,212 // paddd %xmm4,%xmm2
.byte 102,15,112,194,245 // pshufd $0xf5,%xmm2,%xmm0
- .byte 102,15,111,161,36,84,0,0 // movdqa 0x5424(%ecx),%xmm4
+ .byte 102,15,111,161,40,84,0,0 // movdqa 0x5428(%ecx),%xmm4
.byte 102,15,244,212 // pmuludq %xmm4,%xmm2
.byte 102,15,244,196 // pmuludq %xmm4,%xmm0
.byte 102,15,112,240,232 // pshufd $0xe8,%xmm0,%xmm6
@@ -64511,7 +64483,7 @@ _sk_clut_4D_sse2:
.byte 243,15,16,44,130 // movss (%edx,%eax,4),%xmm5
.byte 15,20,213 // unpcklps %xmm5,%xmm2
.byte 102,15,20,214 // unpcklpd %xmm6,%xmm2
- .byte 102,15,254,129,164,77,0,0 // paddd 0x4da4(%ecx),%xmm0
+ .byte 102,15,254,129,168,77,0,0 // paddd 0x4da8(%ecx),%xmm0
.byte 102,15,112,232,229 // pshufd $0xe5,%xmm0,%xmm5
.byte 102,15,126,232 // movd %xmm5,%eax
.byte 102,15,112,232,78 // pshufd $0x4e,%xmm0,%xmm5
@@ -64543,7 +64515,7 @@ _sk_clut_4D_sse2:
.byte 15,92,251 // subps %xmm3,%xmm7
.byte 15,89,248 // mulps %xmm0,%xmm7
.byte 15,88,251 // addps %xmm3,%xmm7
- .byte 243,15,91,141,168,254,255,255 // cvttps2dq -0x158(%ebp),%xmm1
+ .byte 243,15,91,141,184,254,255,255 // cvttps2dq -0x148(%ebp),%xmm1
.byte 102,15,112,217,245 // pshufd $0xf5,%xmm1,%xmm3
.byte 102,15,111,133,88,255,255,255 // movdqa -0xa8(%ebp),%xmm0
.byte 102,15,244,216 // pmuludq %xmm0,%xmm3
@@ -64595,7 +64567,7 @@ _sk_clut_4D_sse2:
.byte 243,15,16,44,130 // movss (%edx,%eax,4),%xmm5
.byte 15,20,245 // unpcklps %xmm5,%xmm6
.byte 102,15,20,240 // unpcklpd %xmm0,%xmm6
- .byte 102,15,254,137,164,77,0,0 // paddd 0x4da4(%ecx),%xmm1
+ .byte 102,15,254,137,168,77,0,0 // paddd 0x4da8(%ecx),%xmm1
.byte 102,15,112,193,229 // pshufd $0xe5,%xmm1,%xmm0
.byte 102,15,126,192 // movd %xmm0,%eax
.byte 102,15,112,193,78 // pshufd $0x4e,%xmm1,%xmm0
@@ -64613,7 +64585,7 @@ _sk_clut_4D_sse2:
.byte 102,15,111,202 // movdqa %xmm2,%xmm1
.byte 102,15,254,77,168 // paddd -0x58(%ebp),%xmm1
.byte 102,15,112,193,245 // pshufd $0xf5,%xmm1,%xmm0
- .byte 102,15,111,145,36,84,0,0 // movdqa 0x5424(%ecx),%xmm2
+ .byte 102,15,111,145,40,84,0,0 // movdqa 0x5428(%ecx),%xmm2
.byte 102,15,244,202 // pmuludq %xmm2,%xmm1
.byte 102,15,244,194 // pmuludq %xmm2,%xmm0
.byte 102,15,112,192,232 // pshufd $0xe8,%xmm0,%xmm0
@@ -64649,7 +64621,7 @@ _sk_clut_4D_sse2:
.byte 243,15,16,4,130 // movss (%edx,%eax,4),%xmm0
.byte 15,20,216 // unpcklps %xmm0,%xmm3
.byte 102,15,20,217 // unpcklpd %xmm1,%xmm3
- .byte 102,15,254,169,164,77,0,0 // paddd 0x4da4(%ecx),%xmm5
+ .byte 102,15,254,169,168,77,0,0 // paddd 0x4da8(%ecx),%xmm5
.byte 102,15,112,197,229 // pshufd $0xe5,%xmm5,%xmm0
.byte 102,15,126,192 // movd %xmm0,%eax
.byte 102,15,112,197,78 // pshufd $0x4e,%xmm5,%xmm0
@@ -64702,14 +64674,14 @@ _sk_clut_4D_sse2:
.byte 102,15,112,193,232 // pshufd $0xe8,%xmm1,%xmm0
.byte 102,15,98,224 // punpckldq %xmm0,%xmm4
.byte 102,15,127,165,24,255,255,255 // movdqa %xmm4,-0xe8(%ebp)
- .byte 102,15,254,165,184,254,255,255 // paddd -0x148(%ebp),%xmm4
+ .byte 102,15,254,165,200,254,255,255 // paddd -0x138(%ebp),%xmm4
.byte 102,15,127,101,200 // movdqa %xmm4,-0x38(%ebp)
.byte 102,15,111,204 // movdqa %xmm4,%xmm1
.byte 102,15,254,141,72,255,255,255 // paddd -0xb8(%ebp),%xmm1
.byte 102,15,111,209 // movdqa %xmm1,%xmm2
.byte 102,15,254,85,152 // paddd -0x68(%ebp),%xmm2
.byte 102,15,112,194,245 // pshufd $0xf5,%xmm2,%xmm0
- .byte 102,15,111,153,36,84,0,0 // movdqa 0x5424(%ecx),%xmm3
+ .byte 102,15,111,153,40,84,0,0 // movdqa 0x5428(%ecx),%xmm3
.byte 102,15,244,211 // pmuludq %xmm3,%xmm2
.byte 102,15,244,195 // pmuludq %xmm3,%xmm0
.byte 102,15,111,251 // movdqa %xmm3,%xmm7
@@ -64748,7 +64720,7 @@ _sk_clut_4D_sse2:
.byte 243,15,16,44,130 // movss (%edx,%eax,4),%xmm5
.byte 15,20,229 // unpcklps %xmm5,%xmm4
.byte 102,15,20,227 // unpcklpd %xmm3,%xmm4
- .byte 102,15,254,129,164,77,0,0 // paddd 0x4da4(%ecx),%xmm0
+ .byte 102,15,254,129,168,77,0,0 // paddd 0x4da8(%ecx),%xmm0
.byte 102,15,112,216,229 // pshufd $0xe5,%xmm0,%xmm3
.byte 102,15,126,216 // movd %xmm3,%eax
.byte 102,15,112,216,78 // pshufd $0x4e,%xmm0,%xmm3
@@ -64800,7 +64772,7 @@ _sk_clut_4D_sse2:
.byte 243,15,16,52,130 // movss (%edx,%eax,4),%xmm6
.byte 15,20,238 // unpcklps %xmm6,%xmm5
.byte 102,15,20,235 // unpcklpd %xmm3,%xmm5
- .byte 102,15,111,137,164,77,0,0 // movdqa 0x4da4(%ecx),%xmm1
+ .byte 102,15,111,137,168,77,0,0 // movdqa 0x4da8(%ecx),%xmm1
.byte 102,15,254,249 // paddd %xmm1,%xmm7
.byte 102,15,112,223,229 // pshufd $0xe5,%xmm7,%xmm3
.byte 102,15,126,216 // movd %xmm3,%eax
@@ -64834,7 +64806,7 @@ _sk_clut_4D_sse2:
.byte 102,15,111,226 // movdqa %xmm2,%xmm4
.byte 102,15,254,69,152 // paddd -0x68(%ebp),%xmm0
.byte 102,15,112,208,245 // pshufd $0xf5,%xmm0,%xmm2
- .byte 102,15,111,153,36,84,0,0 // movdqa 0x5424(%ecx),%xmm3
+ .byte 102,15,111,153,40,84,0,0 // movdqa 0x5428(%ecx),%xmm3
.byte 102,15,244,195 // pmuludq %xmm3,%xmm0
.byte 102,15,244,211 // pmuludq %xmm3,%xmm2
.byte 102,15,112,218,232 // pshufd $0xe8,%xmm2,%xmm3
@@ -64891,7 +64863,7 @@ _sk_clut_4D_sse2:
.byte 102,15,111,212 // movdqa %xmm4,%xmm2
.byte 102,15,254,85,168 // paddd -0x58(%ebp),%xmm2
.byte 102,15,112,194,245 // pshufd $0xf5,%xmm2,%xmm0
- .byte 102,15,111,137,36,84,0,0 // movdqa 0x5424(%ecx),%xmm1
+ .byte 102,15,111,137,40,84,0,0 // movdqa 0x5428(%ecx),%xmm1
.byte 102,15,244,209 // pmuludq %xmm1,%xmm2
.byte 102,15,244,193 // pmuludq %xmm1,%xmm0
.byte 102,15,112,240,232 // pshufd $0xe8,%xmm0,%xmm6
@@ -64928,7 +64900,7 @@ _sk_clut_4D_sse2:
.byte 243,15,16,36,130 // movss (%edx,%eax,4),%xmm4
.byte 15,20,212 // unpcklps %xmm4,%xmm2
.byte 102,15,20,214 // unpcklpd %xmm6,%xmm2
- .byte 102,15,254,129,164,77,0,0 // paddd 0x4da4(%ecx),%xmm0
+ .byte 102,15,254,129,168,77,0,0 // paddd 0x4da8(%ecx),%xmm0
.byte 102,15,112,224,229 // pshufd $0xe5,%xmm0,%xmm4
.byte 102,15,126,224 // movd %xmm4,%eax
.byte 102,15,112,224,78 // pshufd $0x4e,%xmm0,%xmm4
@@ -64996,7 +64968,7 @@ _sk_clut_4D_sse2:
.byte 102,15,111,93,152 // movdqa -0x68(%ebp),%xmm3
.byte 102,15,254,217 // paddd %xmm1,%xmm3
.byte 102,15,112,211,245 // pshufd $0xf5,%xmm3,%xmm2
- .byte 102,15,111,129,36,84,0,0 // movdqa 0x5424(%ecx),%xmm0
+ .byte 102,15,111,129,40,84,0,0 // movdqa 0x5428(%ecx),%xmm0
.byte 102,15,244,216 // pmuludq %xmm0,%xmm3
.byte 102,15,244,208 // pmuludq %xmm0,%xmm2
.byte 102,15,111,248 // movdqa %xmm0,%xmm7
@@ -65035,7 +65007,7 @@ _sk_clut_4D_sse2:
.byte 243,15,16,28,130 // movss (%edx,%eax,4),%xmm3
.byte 15,20,235 // unpcklps %xmm3,%xmm5
.byte 102,15,20,238 // unpcklpd %xmm6,%xmm5
- .byte 102,15,254,145,164,77,0,0 // paddd 0x4da4(%ecx),%xmm2
+ .byte 102,15,254,145,168,77,0,0 // paddd 0x4da8(%ecx),%xmm2
.byte 102,15,112,218,229 // pshufd $0xe5,%xmm2,%xmm3
.byte 102,15,126,216 // movd %xmm3,%eax
.byte 102,15,112,218,78 // pshufd $0x4e,%xmm2,%xmm3
@@ -65087,7 +65059,7 @@ _sk_clut_4D_sse2:
.byte 243,15,16,4,130 // movss (%edx,%eax,4),%xmm0
.byte 15,20,208 // unpcklps %xmm0,%xmm2
.byte 102,15,20,215 // unpcklpd %xmm7,%xmm2
- .byte 102,15,111,137,164,77,0,0 // movdqa 0x4da4(%ecx),%xmm1
+ .byte 102,15,111,137,168,77,0,0 // movdqa 0x4da8(%ecx),%xmm1
.byte 102,15,254,217 // paddd %xmm1,%xmm3
.byte 102,15,112,195,229 // pshufd $0xe5,%xmm3,%xmm0
.byte 102,15,126,192 // movd %xmm0,%eax
@@ -65122,7 +65094,7 @@ _sk_clut_4D_sse2:
.byte 102,15,111,194 // movdqa %xmm2,%xmm0
.byte 102,15,254,69,152 // paddd -0x68(%ebp),%xmm0
.byte 102,15,112,224,245 // pshufd $0xf5,%xmm0,%xmm4
- .byte 102,15,111,169,36,84,0,0 // movdqa 0x5424(%ecx),%xmm5
+ .byte 102,15,111,169,40,84,0,0 // movdqa 0x5428(%ecx),%xmm5
.byte 102,15,111,221 // movdqa %xmm5,%xmm3
.byte 102,15,244,195 // pmuludq %xmm3,%xmm0
.byte 102,15,244,227 // pmuludq %xmm3,%xmm4
@@ -65178,7 +65150,7 @@ _sk_clut_4D_sse2:
.byte 102,15,111,202 // movdqa %xmm2,%xmm1
.byte 102,15,254,77,168 // paddd -0x58(%ebp),%xmm1
.byte 102,15,112,193,245 // pshufd $0xf5,%xmm1,%xmm0
- .byte 102,15,111,145,36,84,0,0 // movdqa 0x5424(%ecx),%xmm2
+ .byte 102,15,111,145,40,84,0,0 // movdqa 0x5428(%ecx),%xmm2
.byte 102,15,244,202 // pmuludq %xmm2,%xmm1
.byte 102,15,244,194 // pmuludq %xmm2,%xmm0
.byte 102,15,112,192,232 // pshufd $0xe8,%xmm0,%xmm0
@@ -65214,7 +65186,7 @@ _sk_clut_4D_sse2:
.byte 243,15,16,4,130 // movss (%edx,%eax,4),%xmm0
.byte 15,20,216 // unpcklps %xmm0,%xmm3
.byte 102,15,20,217 // unpcklpd %xmm1,%xmm3
- .byte 102,15,254,185,164,77,0,0 // paddd 0x4da4(%ecx),%xmm7
+ .byte 102,15,254,185,168,77,0,0 // paddd 0x4da8(%ecx),%xmm7
.byte 102,15,112,199,229 // pshufd $0xe5,%xmm7,%xmm0
.byte 102,15,126,192 // movd %xmm0,%eax
.byte 102,15,112,199,78 // pshufd $0x4e,%xmm7,%xmm0
@@ -65264,7 +65236,7 @@ _sk_clut_4D_sse2:
.byte 102,15,111,233 // movdqa %xmm1,%xmm5
.byte 102,15,254,69,152 // paddd -0x68(%ebp),%xmm0
.byte 102,15,112,200,245 // pshufd $0xf5,%xmm0,%xmm1
- .byte 102,15,111,145,36,84,0,0 // movdqa 0x5424(%ecx),%xmm2
+ .byte 102,15,111,145,40,84,0,0 // movdqa 0x5428(%ecx),%xmm2
.byte 102,15,244,194 // pmuludq %xmm2,%xmm0
.byte 102,15,244,202 // pmuludq %xmm2,%xmm1
.byte 102,15,111,250 // movdqa %xmm2,%xmm7
@@ -65303,7 +65275,7 @@ _sk_clut_4D_sse2:
.byte 243,15,16,36,130 // movss (%edx,%eax,4),%xmm4
.byte 15,20,204 // unpcklps %xmm4,%xmm1
.byte 102,15,20,203 // unpcklpd %xmm3,%xmm1
- .byte 102,15,254,145,164,77,0,0 // paddd 0x4da4(%ecx),%xmm2
+ .byte 102,15,254,145,168,77,0,0 // paddd 0x4da8(%ecx),%xmm2
.byte 102,15,112,218,229 // pshufd $0xe5,%xmm2,%xmm3
.byte 102,15,126,216 // movd %xmm3,%eax
.byte 102,15,112,218,78 // pshufd $0x4e,%xmm2,%xmm3
@@ -65357,7 +65329,7 @@ _sk_clut_4D_sse2:
.byte 243,15,16,36,130 // movss (%edx,%eax,4),%xmm4
.byte 15,20,252 // unpcklps %xmm4,%xmm7
.byte 102,15,20,254 // unpcklpd %xmm6,%xmm7
- .byte 102,15,254,153,164,77,0,0 // paddd 0x4da4(%ecx),%xmm3
+ .byte 102,15,254,153,168,77,0,0 // paddd 0x4da8(%ecx),%xmm3
.byte 102,15,112,227,229 // pshufd $0xe5,%xmm3,%xmm4
.byte 102,15,126,224 // movd %xmm4,%eax
.byte 102,15,112,227,78 // pshufd $0x4e,%xmm3,%xmm4
@@ -65390,7 +65362,7 @@ _sk_clut_4D_sse2:
.byte 102,15,254,208 // paddd %xmm0,%xmm2
.byte 102,15,111,216 // movdqa %xmm0,%xmm3
.byte 102,15,112,194,245 // pshufd $0xf5,%xmm2,%xmm0
- .byte 102,15,111,137,36,84,0,0 // movdqa 0x5424(%ecx),%xmm1
+ .byte 102,15,111,137,40,84,0,0 // movdqa 0x5428(%ecx),%xmm1
.byte 102,15,244,209 // pmuludq %xmm1,%xmm2
.byte 102,15,244,193 // pmuludq %xmm1,%xmm0
.byte 102,15,111,241 // movdqa %xmm1,%xmm6
@@ -65430,7 +65402,7 @@ _sk_clut_4D_sse2:
.byte 15,20,225 // unpcklps %xmm1,%xmm4
.byte 102,15,20,226 // unpcklpd %xmm2,%xmm4
.byte 102,15,41,165,88,255,255,255 // movapd %xmm4,-0xa8(%ebp)
- .byte 102,15,254,129,164,77,0,0 // paddd 0x4da4(%ecx),%xmm0
+ .byte 102,15,254,129,168,77,0,0 // paddd 0x4da8(%ecx),%xmm0
.byte 102,15,112,200,229 // pshufd $0xe5,%xmm0,%xmm1
.byte 102,15,126,200 // movd %xmm1,%eax
.byte 102,15,112,200,78 // pshufd $0x4e,%xmm0,%xmm1
@@ -65484,7 +65456,7 @@ _sk_clut_4D_sse2:
.byte 243,15,16,52,130 // movss (%edx,%eax,4),%xmm6
.byte 15,20,206 // unpcklps %xmm6,%xmm1
.byte 102,15,20,203 // unpcklpd %xmm3,%xmm1
- .byte 102,15,254,145,164,77,0,0 // paddd 0x4da4(%ecx),%xmm2
+ .byte 102,15,254,145,168,77,0,0 // paddd 0x4da8(%ecx),%xmm2
.byte 102,15,112,218,229 // pshufd $0xe5,%xmm2,%xmm3
.byte 102,15,126,216 // movd %xmm3,%eax
.byte 102,15,112,218,78 // pshufd $0x4e,%xmm2,%xmm3
@@ -65535,8 +65507,8 @@ _sk_clut_4D_sse2:
.byte 15,92,212 // subps %xmm4,%xmm2
.byte 15,89,211 // mulps %xmm3,%xmm2
.byte 15,88,212 // addps %xmm4,%xmm2
- .byte 15,91,157,184,254,255,255 // cvtdq2ps -0x148(%ebp),%xmm3
- .byte 15,40,165,152,254,255,255 // movaps -0x168(%ebp),%xmm4
+ .byte 15,91,157,200,254,255,255 // cvtdq2ps -0x138(%ebp),%xmm3
+ .byte 15,40,165,168,254,255,255 // movaps -0x158(%ebp),%xmm4
.byte 15,92,227 // subps %xmm3,%xmm4
.byte 15,40,157,40,255,255,255 // movaps -0xd8(%ebp),%xmm3
.byte 15,92,195 // subps %xmm3,%xmm0
@@ -65550,21 +65522,21 @@ _sk_clut_4D_sse2:
.byte 15,92,211 // subps %xmm3,%xmm2
.byte 15,89,212 // mulps %xmm4,%xmm2
.byte 15,88,211 // addps %xmm3,%xmm2
- .byte 139,69,8 // mov 0x8(%ebp),%eax
- .byte 139,117,12 // mov 0xc(%ebp),%esi
- .byte 141,86,8 // lea 0x8(%esi),%edx
+ .byte 139,85,12 // mov 0xc(%ebp),%edx
+ .byte 141,66,8 // lea 0x8(%edx),%eax
.byte 131,236,8 // sub $0x8,%esp
- .byte 15,40,153,100,77,0,0 // movaps 0x4d64(%ecx),%xmm3
- .byte 82 // push %edx
+ .byte 15,40,153,104,77,0,0 // movaps 0x4d68(%ecx),%xmm3
.byte 80 // push %eax
- .byte 255,86,4 // call *0x4(%esi)
- .byte 129,196,108,1,0,0 // add $0x16c,%esp
+ .byte 255,117,8 // pushl 0x8(%ebp)
+ .byte 255,82,4 // call *0x4(%edx)
+ .byte 129,196,92,1,0,0 // add $0x15c,%esp
.byte 94 // pop %esi
.byte 95 // pop %edi
.byte 91 // pop %ebx
.byte 93 // pop %ebp
.byte 195 // ret
.byte 144 // nop
+ .byte 144 // nop
HIDDEN _sk_start_pipeline_sse2_lowp
.globl _sk_start_pipeline_sse2_lowp
@@ -65578,7 +65550,7 @@ _sk_start_pipeline_sse2_lowp:
.byte 131,236,92 // sub $0x5c,%esp
.byte 139,125,12 // mov 0xc(%ebp),%edi
.byte 59,125,20 // cmp 0x14(%ebp),%edi
- .byte 15,131,193,0,0,0 // jae 949e <_sk_start_pipeline_sse2_lowp+0xd6>
+ .byte 15,131,193,0,0,0 // jae 947a <_sk_start_pipeline_sse2_lowp+0xd6>
.byte 139,85,16 // mov 0x10(%ebp),%edx
.byte 139,69,8 // mov 0x8(%ebp),%eax
.byte 139,117,24 // mov 0x18(%ebp),%esi
@@ -65592,7 +65564,7 @@ _sk_start_pipeline_sse2_lowp:
.byte 139,69,8 // mov 0x8(%ebp),%eax
.byte 137,223 // mov %ebx,%edi
.byte 137,243 // mov %esi,%ebx
- .byte 119,77 // ja 9450 <_sk_start_pipeline_sse2_lowp+0x88>
+ .byte 119,77 // ja 942c <_sk_start_pipeline_sse2_lowp+0x88>
.byte 139,117,8 // mov 0x8(%ebp),%esi
.byte 15,41,68,36,64 // movaps %xmm0,0x40(%esp)
.byte 15,41,68,36,48 // movaps %xmm0,0x30(%esp)
@@ -65614,13 +65586,13 @@ _sk_start_pipeline_sse2_lowp:
.byte 131,198,16 // add $0x10,%esi
.byte 57,214 // cmp %edx,%esi
.byte 137,198 // mov %eax,%esi
- .byte 118,182 // jbe 9406 <_sk_start_pipeline_sse2_lowp+0x3e>
+ .byte 118,182 // jbe 93e2 <_sk_start_pipeline_sse2_lowp+0x3e>
.byte 137,209 // mov %edx,%ecx
.byte 41,193 // sub %eax,%ecx
.byte 137,222 // mov %ebx,%esi
.byte 137,251 // mov %edi,%ebx
.byte 139,125,240 // mov -0x10(%ebp),%edi
- .byte 116,55 // je 9494 <_sk_start_pipeline_sse2_lowp+0xcc>
+ .byte 116,55 // je 9470 <_sk_start_pipeline_sse2_lowp+0xcc>
.byte 15,41,68,36,64 // movaps %xmm0,0x40(%esp)
.byte 15,41,68,36,48 // movaps %xmm0,0x30(%esp)
.byte 15,41,68,36,32 // movaps %xmm0,0x20(%esp)
@@ -65638,7 +65610,7 @@ _sk_start_pipeline_sse2_lowp:
.byte 139,85,16 // mov 0x10(%ebp),%edx
.byte 71 // inc %edi
.byte 59,125,20 // cmp 0x14(%ebp),%edi
- .byte 15,133,86,255,255,255 // jne 93f4 <_sk_start_pipeline_sse2_lowp+0x2c>
+ .byte 15,133,86,255,255,255 // jne 93d0 <_sk_start_pipeline_sse2_lowp+0x2c>
.byte 131,196,92 // add $0x5c,%esp
.byte 94 // pop %esi
.byte 95 // pop %edi
@@ -65710,7 +65682,7 @@ _sk_black_color_sse2_lowp:
.byte 87 // push %edi
.byte 86 // push %esi
.byte 131,236,92 // sub $0x5c,%esp
- .byte 232,0,0,0,0 // call 954d <_sk_black_color_sse2_lowp+0xe>
+ .byte 232,0,0,0,0 // call 9529 <_sk_black_color_sse2_lowp+0xe>
.byte 88 // pop %eax
.byte 139,77,8 // mov 0x8(%ebp),%ecx
.byte 139,85,16 // mov 0x10(%ebp),%edx
@@ -65729,7 +65701,7 @@ _sk_black_color_sse2_lowp:
.byte 137,84,36,8 // mov %edx,0x8(%esp)
.byte 137,92,36,4 // mov %ebx,0x4(%esp)
.byte 137,12,36 // mov %ecx,(%esp)
- .byte 15,40,152,99,62,0,0 // movaps 0x3e63(%eax),%xmm3
+ .byte 15,40,152,103,62,0,0 // movaps 0x3e67(%eax),%xmm3
.byte 15,87,192 // xorps %xmm0,%xmm0
.byte 15,87,201 // xorps %xmm1,%xmm1
.byte 15,87,210 // xorps %xmm2,%xmm2
@@ -65751,7 +65723,7 @@ _sk_white_color_sse2_lowp:
.byte 87 // push %edi
.byte 86 // push %esi
.byte 131,236,92 // sub $0x5c,%esp
- .byte 232,0,0,0,0 // call 95b8 <_sk_white_color_sse2_lowp+0xe>
+ .byte 232,0,0,0,0 // call 9594 <_sk_white_color_sse2_lowp+0xe>
.byte 88 // pop %eax
.byte 139,77,8 // mov 0x8(%ebp),%ecx
.byte 139,85,16 // mov 0x10(%ebp),%edx
@@ -65770,7 +65742,7 @@ _sk_white_color_sse2_lowp:
.byte 137,84,36,8 // mov %edx,0x8(%esp)
.byte 137,92,36,4 // mov %ebx,0x4(%esp)
.byte 137,12,36 // mov %ecx,(%esp)
- .byte 15,40,128,248,61,0,0 // movaps 0x3df8(%eax),%xmm0
+ .byte 15,40,128,252,61,0,0 // movaps 0x3dfc(%eax),%xmm0
.byte 15,40,200 // movaps %xmm0,%xmm1
.byte 15,40,208 // movaps %xmm0,%xmm2
.byte 15,40,216 // movaps %xmm0,%xmm3
@@ -65791,16 +65763,16 @@ _sk_set_rgb_sse2_lowp:
.byte 87 // push %edi
.byte 86 // push %esi
.byte 131,236,80 // sub $0x50,%esp
- .byte 232,0,0,0,0 // call 9622 <_sk_set_rgb_sse2_lowp+0xd>
+ .byte 232,0,0,0,0 // call 95fe <_sk_set_rgb_sse2_lowp+0xd>
.byte 94 // pop %esi
.byte 139,69,8 // mov 0x8(%ebp),%eax
.byte 139,85,16 // mov 0x10(%ebp),%edx
.byte 139,77,12 // mov 0xc(%ebp),%ecx
.byte 139,57 // mov (%ecx),%edi
- .byte 243,15,16,150,82,62,0,0 // movss 0x3e52(%esi),%xmm2
+ .byte 243,15,16,150,86,62,0,0 // movss 0x3e56(%esi),%xmm2
.byte 243,15,16,7 // movss (%edi),%xmm0
.byte 243,15,89,194 // mulss %xmm2,%xmm0
- .byte 243,15,16,142,78,62,0,0 // movss 0x3e4e(%esi),%xmm1
+ .byte 243,15,16,142,82,62,0,0 // movss 0x3e52(%esi),%xmm1
.byte 243,15,88,193 // addss %xmm1,%xmm0
.byte 243,15,44,240 // cvttss2si %xmm0,%esi
.byte 102,15,110,198 // movd %esi,%xmm0
@@ -65849,7 +65821,7 @@ _sk_premul_sse2_lowp:
.byte 87 // push %edi
.byte 86 // push %esi
.byte 131,236,80 // sub $0x50,%esp
- .byte 232,0,0,0,0 // call 96e6 <_sk_premul_sse2_lowp+0xd>
+ .byte 232,0,0,0,0 // call 96c2 <_sk_premul_sse2_lowp+0xd>
.byte 90 // pop %edx
.byte 139,69,8 // mov 0x8(%ebp),%eax
.byte 139,77,16 // mov 0x10(%ebp),%ecx
@@ -65858,7 +65830,7 @@ _sk_premul_sse2_lowp:
.byte 15,40,109,40 // movaps 0x28(%ebp),%xmm5
.byte 15,40,117,56 // movaps 0x38(%ebp),%xmm6
.byte 102,15,213,195 // pmullw %xmm3,%xmm0
- .byte 102,15,111,186,202,60,0,0 // movdqa 0x3cca(%edx),%xmm7
+ .byte 102,15,111,186,206,60,0,0 // movdqa 0x3cce(%edx),%xmm7
.byte 102,15,253,199 // paddw %xmm7,%xmm0
.byte 102,15,213,203 // pmullw %xmm3,%xmm1
.byte 102,15,253,207 // paddw %xmm7,%xmm1
@@ -65992,12 +65964,12 @@ _sk_invert_sse2_lowp:
.byte 87 // push %edi
.byte 86 // push %esi
.byte 131,236,80 // sub $0x50,%esp
- .byte 232,0,0,0,0 // call 9860 <_sk_invert_sse2_lowp+0xd>
+ .byte 232,0,0,0,0 // call 983c <_sk_invert_sse2_lowp+0xd>
.byte 88 // pop %eax
.byte 139,77,8 // mov 0x8(%ebp),%ecx
.byte 139,85,16 // mov 0x10(%ebp),%edx
.byte 139,117,20 // mov 0x14(%ebp),%esi
- .byte 102,15,111,160,80,59,0,0 // movdqa 0x3b50(%eax),%xmm4
+ .byte 102,15,111,160,84,59,0,0 // movdqa 0x3b54(%eax),%xmm4
.byte 102,15,111,236 // movdqa %xmm4,%xmm5
.byte 102,15,249,232 // psubw %xmm0,%xmm5
.byte 102,15,111,244 // movdqa %xmm4,%xmm6
@@ -66079,11 +66051,11 @@ _sk_srcatop_sse2_lowp:
.byte 102,15,111,234 // movdqa %xmm2,%xmm5
.byte 102,15,111,209 // movdqa %xmm1,%xmm2
.byte 102,15,111,200 // movdqa %xmm0,%xmm1
- .byte 232,0,0,0,0 // call 9958 <_sk_srcatop_sse2_lowp+0x19>
+ .byte 232,0,0,0,0 // call 9934 <_sk_srcatop_sse2_lowp+0x19>
.byte 88 // pop %eax
.byte 102,15,111,117,72 // movdqa 0x48(%ebp),%xmm6
.byte 102,15,213,206 // pmullw %xmm6,%xmm1
- .byte 102,15,111,128,88,58,0,0 // movdqa 0x3a58(%eax),%xmm0
+ .byte 102,15,111,128,92,58,0,0 // movdqa 0x3a5c(%eax),%xmm0
.byte 102,15,253,200 // paddw %xmm0,%xmm1
.byte 102,15,213,214 // pmullw %xmm6,%xmm2
.byte 102,15,253,208 // paddw %xmm0,%xmm2
@@ -66141,12 +66113,12 @@ _sk_dstatop_sse2_lowp:
.byte 87 // push %edi
.byte 86 // push %esi
.byte 131,236,80 // sub $0x50,%esp
- .byte 232,0,0,0,0 // call 9a2c <_sk_dstatop_sse2_lowp+0xd>
+ .byte 232,0,0,0,0 // call 9a08 <_sk_dstatop_sse2_lowp+0xd>
.byte 88 // pop %eax
.byte 102,15,111,101,40 // movdqa 0x28(%ebp),%xmm4
.byte 102,15,111,117,24 // movdqa 0x18(%ebp),%xmm6
.byte 102,15,213,243 // pmullw %xmm3,%xmm6
- .byte 102,15,111,184,132,57,0,0 // movdqa 0x3984(%eax),%xmm7
+ .byte 102,15,111,184,136,57,0,0 // movdqa 0x3988(%eax),%xmm7
.byte 102,15,253,247 // paddw %xmm7,%xmm6
.byte 102,15,213,227 // pmullw %xmm3,%xmm4
.byte 102,15,253,231 // paddw %xmm7,%xmm4
@@ -66199,7 +66171,7 @@ _sk_srcin_sse2_lowp:
.byte 87 // push %edi
.byte 86 // push %esi
.byte 131,236,80 // sub $0x50,%esp
- .byte 232,0,0,0,0 // call 9aed <_sk_srcin_sse2_lowp+0xd>
+ .byte 232,0,0,0,0 // call 9ac9 <_sk_srcin_sse2_lowp+0xd>
.byte 94 // pop %esi
.byte 139,69,8 // mov 0x8(%ebp),%eax
.byte 139,77,16 // mov 0x10(%ebp),%ecx
@@ -66208,7 +66180,7 @@ _sk_srcin_sse2_lowp:
.byte 15,40,109,40 // movaps 0x28(%ebp),%xmm5
.byte 102,15,111,117,72 // movdqa 0x48(%ebp),%xmm6
.byte 102,15,213,198 // pmullw %xmm6,%xmm0
- .byte 102,15,111,190,195,56,0,0 // movdqa 0x38c3(%esi),%xmm7
+ .byte 102,15,111,190,199,56,0,0 // movdqa 0x38c7(%esi),%xmm7
.byte 102,15,253,199 // paddw %xmm7,%xmm0
.byte 102,15,213,206 // pmullw %xmm6,%xmm1
.byte 102,15,253,207 // paddw %xmm7,%xmm1
@@ -66247,14 +66219,14 @@ _sk_dstin_sse2_lowp:
.byte 87 // push %edi
.byte 86 // push %esi
.byte 131,236,80 // sub $0x50,%esp
- .byte 232,0,0,0,0 // call 9b84 <_sk_dstin_sse2_lowp+0xd>
+ .byte 232,0,0,0,0 // call 9b60 <_sk_dstin_sse2_lowp+0xd>
.byte 88 // pop %eax
.byte 102,15,111,85,56 // movdqa 0x38(%ebp),%xmm2
.byte 102,15,111,109,40 // movdqa 0x28(%ebp),%xmm5
.byte 102,15,111,117,24 // movdqa 0x18(%ebp),%xmm6
.byte 102,15,111,198 // movdqa %xmm6,%xmm0
.byte 102,15,213,195 // pmullw %xmm3,%xmm0
- .byte 102,15,111,184,44,56,0,0 // movdqa 0x382c(%eax),%xmm7
+ .byte 102,15,111,184,48,56,0,0 // movdqa 0x3830(%eax),%xmm7
.byte 102,15,253,199 // paddw %xmm7,%xmm0
.byte 102,15,111,205 // movdqa %xmm5,%xmm1
.byte 102,15,213,203 // pmullw %xmm3,%xmm1
@@ -66298,14 +66270,14 @@ _sk_srcout_sse2_lowp:
.byte 87 // push %edi
.byte 86 // push %esi
.byte 131,236,80 // sub $0x50,%esp
- .byte 232,0,0,0,0 // call 9c2c <_sk_srcout_sse2_lowp+0xd>
+ .byte 232,0,0,0,0 // call 9c08 <_sk_srcout_sse2_lowp+0xd>
.byte 94 // pop %esi
.byte 139,69,8 // mov 0x8(%ebp),%eax
.byte 139,77,16 // mov 0x10(%ebp),%ecx
.byte 139,85,20 // mov 0x14(%ebp),%edx
.byte 15,40,101,24 // movaps 0x18(%ebp),%xmm4
.byte 102,15,111,109,72 // movdqa 0x48(%ebp),%xmm5
- .byte 102,15,111,182,132,55,0,0 // movdqa 0x3784(%esi),%xmm6
+ .byte 102,15,111,182,136,55,0,0 // movdqa 0x3788(%esi),%xmm6
.byte 102,15,111,254 // movdqa %xmm6,%xmm7
.byte 102,15,249,253 // psubw %xmm5,%xmm7
.byte 102,15,213,199 // pmullw %xmm7,%xmm0
@@ -66349,11 +66321,11 @@ _sk_dstout_sse2_lowp:
.byte 86 // push %esi
.byte 131,236,80 // sub $0x50,%esp
.byte 102,15,111,195 // movdqa %xmm3,%xmm0
- .byte 232,0,0,0,0 // call 9ccf <_sk_dstout_sse2_lowp+0x11>
+ .byte 232,0,0,0,0 // call 9cab <_sk_dstout_sse2_lowp+0x11>
.byte 88 // pop %eax
.byte 102,15,111,109,56 // movdqa 0x38(%ebp),%xmm5
.byte 102,15,111,117,24 // movdqa 0x18(%ebp),%xmm6
- .byte 102,15,111,184,225,54,0,0 // movdqa 0x36e1(%eax),%xmm7
+ .byte 102,15,111,184,229,54,0,0 // movdqa 0x36e5(%eax),%xmm7
.byte 102,15,111,223 // movdqa %xmm7,%xmm3
.byte 102,15,249,216 // psubw %xmm0,%xmm3
.byte 102,15,111,195 // movdqa %xmm3,%xmm0
@@ -66405,9 +66377,9 @@ _sk_srcover_sse2_lowp:
.byte 15,41,85,232 // movaps %xmm2,-0x18(%ebp)
.byte 102,15,111,209 // movdqa %xmm1,%xmm2
.byte 102,15,111,224 // movdqa %xmm0,%xmm4
- .byte 232,0,0,0,0 // call 9d8b <_sk_srcover_sse2_lowp+0x19>
+ .byte 232,0,0,0,0 // call 9d67 <_sk_srcover_sse2_lowp+0x19>
.byte 88 // pop %eax
- .byte 102,15,111,136,37,54,0,0 // movdqa 0x3625(%eax),%xmm1
+ .byte 102,15,111,136,41,54,0,0 // movdqa 0x3629(%eax),%xmm1
.byte 102,15,111,193 // movdqa %xmm1,%xmm0
.byte 102,15,249,195 // psubw %xmm3,%xmm0
.byte 102,15,111,248 // movdqa %xmm0,%xmm7
@@ -66466,7 +66438,7 @@ _sk_dstover_sse2_lowp:
.byte 87 // push %edi
.byte 86 // push %esi
.byte 131,236,80 // sub $0x50,%esp
- .byte 232,0,0,0,0 // call 9e5b <_sk_dstover_sse2_lowp+0xd>
+ .byte 232,0,0,0,0 // call 9e37 <_sk_dstover_sse2_lowp+0xd>
.byte 95 // pop %edi
.byte 139,77,8 // mov 0x8(%ebp),%ecx
.byte 139,85,16 // mov 0x10(%ebp),%edx
@@ -66474,7 +66446,7 @@ _sk_dstover_sse2_lowp:
.byte 139,69,12 // mov 0xc(%ebp),%eax
.byte 102,15,111,101,56 // movdqa 0x38(%ebp),%xmm4
.byte 102,15,111,109,72 // movdqa 0x48(%ebp),%xmm5
- .byte 102,15,111,183,85,53,0,0 // movdqa 0x3555(%edi),%xmm6
+ .byte 102,15,111,183,89,53,0,0 // movdqa 0x3559(%edi),%xmm6
.byte 102,15,111,254 // movdqa %xmm6,%xmm7
.byte 102,15,249,253 // psubw %xmm5,%xmm7
.byte 102,15,213,199 // pmullw %xmm7,%xmm0
@@ -66520,12 +66492,12 @@ _sk_modulate_sse2_lowp:
.byte 87 // push %edi
.byte 86 // push %esi
.byte 131,236,80 // sub $0x50,%esp
- .byte 232,0,0,0,0 // call 9f10 <_sk_modulate_sse2_lowp+0xd>
+ .byte 232,0,0,0,0 // call 9eec <_sk_modulate_sse2_lowp+0xd>
.byte 88 // pop %eax
.byte 102,15,111,109,40 // movdqa 0x28(%ebp),%xmm5
.byte 102,15,111,117,24 // movdqa 0x18(%ebp),%xmm6
.byte 102,15,213,198 // pmullw %xmm6,%xmm0
- .byte 102,15,111,184,160,52,0,0 // movdqa 0x34a0(%eax),%xmm7
+ .byte 102,15,111,184,164,52,0,0 // movdqa 0x34a4(%eax),%xmm7
.byte 102,15,253,199 // paddw %xmm7,%xmm0
.byte 102,15,213,205 // pmullw %xmm5,%xmm1
.byte 102,15,253,207 // paddw %xmm7,%xmm1
@@ -66568,10 +66540,10 @@ _sk_multiply_sse2_lowp:
.byte 87 // push %edi
.byte 86 // push %esi
.byte 131,236,80 // sub $0x50,%esp
- .byte 232,0,0,0,0 // call 9fac <_sk_multiply_sse2_lowp+0xd>
+ .byte 232,0,0,0,0 // call 9f88 <_sk_multiply_sse2_lowp+0xd>
.byte 88 // pop %eax
.byte 102,15,111,109,24 // movdqa 0x18(%ebp),%xmm5
- .byte 102,15,111,160,4,52,0,0 // movdqa 0x3404(%eax),%xmm4
+ .byte 102,15,111,160,8,52,0,0 // movdqa 0x3408(%eax),%xmm4
.byte 102,15,111,245 // movdqa %xmm5,%xmm6
.byte 102,15,253,244 // paddw %xmm4,%xmm6
.byte 102,15,249,117,72 // psubw 0x48(%ebp),%xmm6
@@ -66641,17 +66613,17 @@ _sk_plus__sse2_lowp:
.byte 131,236,96 // sub $0x60,%esp
.byte 102,15,111,225 // movdqa %xmm1,%xmm4
.byte 102,15,111,200 // movdqa %xmm0,%xmm1
- .byte 232,0,0,0,0 // call a0ad <_sk_plus__sse2_lowp+0x15>
+ .byte 232,0,0,0,0 // call a089 <_sk_plus__sse2_lowp+0x15>
.byte 88 // pop %eax
.byte 102,15,253,77,24 // paddw 0x18(%ebp),%xmm1
- .byte 102,15,111,168,19,51,0,0 // movdqa 0x3313(%eax),%xmm5
+ .byte 102,15,111,168,23,51,0,0 // movdqa 0x3317(%eax),%xmm5
.byte 102,15,111,193 // movdqa %xmm1,%xmm0
.byte 102,15,217,197 // psubusw %xmm5,%xmm0
.byte 102,15,127,109,232 // movdqa %xmm5,-0x18(%ebp)
.byte 102,15,239,255 // pxor %xmm7,%xmm7
.byte 102,15,117,199 // pcmpeqw %xmm7,%xmm0
.byte 102,15,219,200 // pand %xmm0,%xmm1
- .byte 102,15,111,176,3,51,0,0 // movdqa 0x3303(%eax),%xmm6
+ .byte 102,15,111,176,7,51,0,0 // movdqa 0x3307(%eax),%xmm6
.byte 102,15,223,198 // pandn %xmm6,%xmm0
.byte 102,15,235,193 // por %xmm1,%xmm0
.byte 102,15,253,101,40 // paddw 0x28(%ebp),%xmm4
@@ -66712,14 +66684,14 @@ _sk_screen_sse2_lowp:
.byte 131,236,80 // sub $0x50,%esp
.byte 102,15,111,225 // movdqa %xmm1,%xmm4
.byte 102,15,111,200 // movdqa %xmm0,%xmm1
- .byte 232,0,0,0,0 // call a1a5 <_sk_screen_sse2_lowp+0x15>
+ .byte 232,0,0,0,0 // call a181 <_sk_screen_sse2_lowp+0x15>
.byte 88 // pop %eax
.byte 102,15,111,109,40 // movdqa 0x28(%ebp),%xmm5
.byte 102,15,111,117,24 // movdqa 0x18(%ebp),%xmm6
.byte 102,15,111,198 // movdqa %xmm6,%xmm0
.byte 102,15,253,193 // paddw %xmm1,%xmm0
.byte 102,15,213,206 // pmullw %xmm6,%xmm1
- .byte 102,15,111,176,11,50,0,0 // movdqa 0x320b(%eax),%xmm6
+ .byte 102,15,111,176,15,50,0,0 // movdqa 0x320f(%eax),%xmm6
.byte 102,15,253,206 // paddw %xmm6,%xmm1
.byte 102,15,113,209,8 // psrlw $0x8,%xmm1
.byte 102,15,249,193 // psubw %xmm1,%xmm0
@@ -66777,9 +66749,9 @@ _sk_xor__sse2_lowp:
.byte 86 // push %esi
.byte 131,236,96 // sub $0x60,%esp
.byte 102,15,127,93,232 // movdqa %xmm3,-0x18(%ebp)
- .byte 232,0,0,0,0 // call a285 <_sk_xor__sse2_lowp+0x12>
+ .byte 232,0,0,0,0 // call a261 <_sk_xor__sse2_lowp+0x12>
.byte 88 // pop %eax
- .byte 102,15,111,176,43,49,0,0 // movdqa 0x312b(%eax),%xmm6
+ .byte 102,15,111,176,47,49,0,0 // movdqa 0x312f(%eax),%xmm6
.byte 102,15,111,254 // movdqa %xmm6,%xmm7
.byte 102,15,249,125,72 // psubw 0x48(%ebp),%xmm7
.byte 102,15,213,199 // pmullw %xmm7,%xmm0
@@ -66846,7 +66818,7 @@ _sk_darken_sse2_lowp:
.byte 15,41,85,200 // movaps %xmm2,-0x38(%ebp)
.byte 102,15,111,225 // movdqa %xmm1,%xmm4
.byte 102,15,111,200 // movdqa %xmm0,%xmm1
- .byte 232,0,0,0,0 // call a37a <_sk_darken_sse2_lowp+0x25>
+ .byte 232,0,0,0,0 // call a356 <_sk_darken_sse2_lowp+0x25>
.byte 88 // pop %eax
.byte 102,15,111,117,72 // movdqa 0x48(%ebp),%xmm6
.byte 102,15,111,109,24 // movdqa 0x18(%ebp),%xmm5
@@ -66857,7 +66829,7 @@ _sk_darken_sse2_lowp:
.byte 102,15,111,222 // movdqa %xmm6,%xmm3
.byte 102,15,111,197 // movdqa %xmm5,%xmm0
.byte 102,15,213,199 // pmullw %xmm7,%xmm0
- .byte 102,15,111,184,86,48,0,0 // movdqa 0x3056(%eax),%xmm7
+ .byte 102,15,111,184,90,48,0,0 // movdqa 0x305a(%eax),%xmm7
.byte 102,15,111,241 // movdqa %xmm1,%xmm6
.byte 102,15,239,247 // pxor %xmm7,%xmm6
.byte 102,15,111,232 // movdqa %xmm0,%xmm5
@@ -66866,7 +66838,7 @@ _sk_darken_sse2_lowp:
.byte 102,15,219,197 // pand %xmm5,%xmm0
.byte 102,15,223,233 // pandn %xmm1,%xmm5
.byte 102,15,235,232 // por %xmm0,%xmm5
- .byte 102,15,111,128,54,48,0,0 // movdqa 0x3036(%eax),%xmm0
+ .byte 102,15,111,128,58,48,0,0 // movdqa 0x303a(%eax),%xmm0
.byte 102,15,127,69,232 // movdqa %xmm0,-0x18(%ebp)
.byte 102,15,253,232 // paddw %xmm0,%xmm5
.byte 102,15,113,213,8 // psrlw $0x8,%xmm5
@@ -66957,7 +66929,7 @@ _sk_lighten_sse2_lowp:
.byte 15,41,85,200 // movaps %xmm2,-0x38(%ebp)
.byte 102,15,111,225 // movdqa %xmm1,%xmm4
.byte 102,15,111,200 // movdqa %xmm0,%xmm1
- .byte 232,0,0,0,0 // call a523 <_sk_lighten_sse2_lowp+0x25>
+ .byte 232,0,0,0,0 // call a4ff <_sk_lighten_sse2_lowp+0x25>
.byte 88 // pop %eax
.byte 102,15,111,109,24 // movdqa 0x18(%ebp),%xmm5
.byte 102,15,111,197 // movdqa %xmm5,%xmm0
@@ -66966,7 +66938,7 @@ _sk_lighten_sse2_lowp:
.byte 102,15,213,77,72 // pmullw 0x48(%ebp),%xmm1
.byte 102,15,111,197 // movdqa %xmm5,%xmm0
.byte 102,15,213,198 // pmullw %xmm6,%xmm0
- .byte 102,15,111,184,173,46,0,0 // movdqa 0x2ead(%eax),%xmm7
+ .byte 102,15,111,184,177,46,0,0 // movdqa 0x2eb1(%eax),%xmm7
.byte 102,15,111,241 // movdqa %xmm1,%xmm6
.byte 102,15,239,247 // pxor %xmm7,%xmm6
.byte 102,15,111,232 // movdqa %xmm0,%xmm5
@@ -66975,7 +66947,7 @@ _sk_lighten_sse2_lowp:
.byte 102,15,219,205 // pand %xmm5,%xmm1
.byte 102,15,223,232 // pandn %xmm0,%xmm5
.byte 102,15,235,233 // por %xmm1,%xmm5
- .byte 102,15,111,128,141,46,0,0 // movdqa 0x2e8d(%eax),%xmm0
+ .byte 102,15,111,128,145,46,0,0 // movdqa 0x2e91(%eax),%xmm0
.byte 102,15,253,232 // paddw %xmm0,%xmm5
.byte 102,15,111,208 // movdqa %xmm0,%xmm2
.byte 102,15,127,85,232 // movdqa %xmm2,-0x18(%ebp)
@@ -67065,7 +67037,7 @@ _sk_difference_sse2_lowp:
.byte 15,41,85,184 // movaps %xmm2,-0x48(%ebp)
.byte 102,15,111,225 // movdqa %xmm1,%xmm4
.byte 102,15,111,200 // movdqa %xmm0,%xmm1
- .byte 232,0,0,0,0 // call a6c1 <_sk_difference_sse2_lowp+0x25>
+ .byte 232,0,0,0,0 // call a69d <_sk_difference_sse2_lowp+0x25>
.byte 88 // pop %eax
.byte 102,15,111,117,72 // movdqa 0x48(%ebp),%xmm6
.byte 102,15,111,109,24 // movdqa 0x18(%ebp),%xmm5
@@ -67076,7 +67048,7 @@ _sk_difference_sse2_lowp:
.byte 102,15,111,222 // movdqa %xmm6,%xmm3
.byte 102,15,111,197 // movdqa %xmm5,%xmm0
.byte 102,15,213,199 // pmullw %xmm7,%xmm0
- .byte 102,15,111,184,15,45,0,0 // movdqa 0x2d0f(%eax),%xmm7
+ .byte 102,15,111,184,19,45,0,0 // movdqa 0x2d13(%eax),%xmm7
.byte 102,15,111,241 // movdqa %xmm1,%xmm6
.byte 102,15,239,247 // pxor %xmm7,%xmm6
.byte 102,15,111,232 // movdqa %xmm0,%xmm5
@@ -67085,11 +67057,11 @@ _sk_difference_sse2_lowp:
.byte 102,15,219,205 // pand %xmm5,%xmm1
.byte 102,15,223,232 // pandn %xmm0,%xmm5
.byte 102,15,235,233 // por %xmm1,%xmm5
- .byte 102,15,111,128,239,44,0,0 // movdqa 0x2cef(%eax),%xmm0
+ .byte 102,15,111,128,243,44,0,0 // movdqa 0x2cf3(%eax),%xmm0
.byte 102,15,127,69,216 // movdqa %xmm0,-0x28(%ebp)
.byte 102,15,253,232 // paddw %xmm0,%xmm5
.byte 102,15,113,213,7 // psrlw $0x7,%xmm5
- .byte 102,15,111,128,31,45,0,0 // movdqa 0x2d1f(%eax),%xmm0
+ .byte 102,15,111,128,35,45,0,0 // movdqa 0x2d23(%eax),%xmm0
.byte 102,15,127,69,232 // movdqa %xmm0,-0x18(%ebp)
.byte 102,15,219,232 // pand %xmm0,%xmm5
.byte 102,15,249,213 // psubw %xmm5,%xmm2
@@ -67178,16 +67150,16 @@ _sk_exclusion_sse2_lowp:
.byte 131,236,80 // sub $0x50,%esp
.byte 102,15,111,225 // movdqa %xmm1,%xmm4
.byte 102,15,111,200 // movdqa %xmm0,%xmm1
- .byte 232,0,0,0,0 // call a875 <_sk_exclusion_sse2_lowp+0x15>
+ .byte 232,0,0,0,0 // call a851 <_sk_exclusion_sse2_lowp+0x15>
.byte 88 // pop %eax
.byte 102,15,111,109,24 // movdqa 0x18(%ebp),%xmm5
.byte 102,15,111,197 // movdqa %xmm5,%xmm0
.byte 102,15,253,193 // paddw %xmm1,%xmm0
.byte 102,15,213,205 // pmullw %xmm5,%xmm1
- .byte 102,15,111,184,59,43,0,0 // movdqa 0x2b3b(%eax),%xmm7
+ .byte 102,15,111,184,63,43,0,0 // movdqa 0x2b3f(%eax),%xmm7
.byte 102,15,253,207 // paddw %xmm7,%xmm1
.byte 102,15,113,209,7 // psrlw $0x7,%xmm1
- .byte 102,15,111,176,107,43,0,0 // movdqa 0x2b6b(%eax),%xmm6
+ .byte 102,15,111,176,111,43,0,0 // movdqa 0x2b6f(%eax),%xmm6
.byte 102,15,219,206 // pand %xmm6,%xmm1
.byte 102,15,249,193 // psubw %xmm1,%xmm0
.byte 102,15,111,109,40 // movdqa 0x28(%ebp),%xmm5
@@ -67248,9 +67220,9 @@ _sk_hardlight_sse2_lowp:
.byte 15,41,85,152 // movaps %xmm2,-0x68(%ebp)
.byte 102,15,111,233 // movdqa %xmm1,%xmm5
.byte 102,15,111,224 // movdqa %xmm0,%xmm4
- .byte 232,0,0,0,0 // call a96f <_sk_hardlight_sse2_lowp+0x1c>
+ .byte 232,0,0,0,0 // call a94b <_sk_hardlight_sse2_lowp+0x1c>
.byte 88 // pop %eax
- .byte 102,15,111,184,65,42,0,0 // movdqa 0x2a41(%eax),%xmm7
+ .byte 102,15,111,184,69,42,0,0 // movdqa 0x2a45(%eax),%xmm7
.byte 102,15,127,125,200 // movdqa %xmm7,-0x38(%ebp)
.byte 102,15,111,215 // movdqa %xmm7,%xmm2
.byte 102,15,249,85,72 // psubw 0x48(%ebp),%xmm2
@@ -67277,7 +67249,7 @@ _sk_hardlight_sse2_lowp:
.byte 102,15,111,214 // movdqa %xmm6,%xmm2
.byte 102,15,249,209 // psubw %xmm1,%xmm2
.byte 102,15,253,228 // paddw %xmm4,%xmm4
- .byte 102,15,111,128,97,42,0,0 // movdqa 0x2a61(%eax),%xmm0
+ .byte 102,15,111,128,101,42,0,0 // movdqa 0x2a65(%eax),%xmm0
.byte 102,15,239,216 // pxor %xmm0,%xmm3
.byte 102,15,127,93,184 // movdqa %xmm3,-0x48(%ebp)
.byte 102,15,111,204 // movdqa %xmm4,%xmm1
@@ -67384,10 +67356,10 @@ _sk_overlay_sse2_lowp:
.byte 15,41,85,152 // movaps %xmm2,-0x68(%ebp)
.byte 15,41,141,120,255,255,255 // movaps %xmm1,-0x88(%ebp)
.byte 102,15,111,200 // movdqa %xmm0,%xmm1
- .byte 232,0,0,0,0 // call ab91 <_sk_overlay_sse2_lowp+0x1f>
+ .byte 232,0,0,0,0 // call ab6d <_sk_overlay_sse2_lowp+0x1f>
.byte 88 // pop %eax
.byte 102,15,111,69,72 // movdqa 0x48(%ebp),%xmm0
- .byte 102,15,111,184,31,40,0,0 // movdqa 0x281f(%eax),%xmm7
+ .byte 102,15,111,184,35,40,0,0 // movdqa 0x2823(%eax),%xmm7
.byte 102,15,127,125,232 // movdqa %xmm7,-0x18(%ebp)
.byte 102,15,111,215 // movdqa %xmm7,%xmm2
.byte 102,15,249,208 // psubw %xmm0,%xmm2
@@ -67414,7 +67386,7 @@ _sk_overlay_sse2_lowp:
.byte 102,15,249,234 // psubw %xmm2,%xmm5
.byte 102,15,111,195 // movdqa %xmm3,%xmm0
.byte 102,15,253,192 // paddw %xmm0,%xmm0
- .byte 102,15,111,144,63,40,0,0 // movdqa 0x283f(%eax),%xmm2
+ .byte 102,15,111,144,67,40,0,0 // movdqa 0x2843(%eax),%xmm2
.byte 102,15,127,85,184 // movdqa %xmm2,-0x48(%ebp)
.byte 102,15,239,226 // pxor %xmm2,%xmm4
.byte 102,15,239,194 // pxor %xmm2,%xmm0
@@ -67544,10 +67516,10 @@ _sk_load_8888_sse2_lowp:
.byte 128,225,7 // and $0x7,%cl
.byte 254,201 // dec %cl
.byte 128,249,6 // cmp $0x6,%cl
- .byte 232,0,0,0,0 // call ae00 <_sk_load_8888_sse2_lowp+0x30>
+ .byte 232,0,0,0,0 // call addc <_sk_load_8888_sse2_lowp+0x30>
.byte 95 // pop %edi
.byte 139,117,16 // mov 0x10(%ebp),%esi
- .byte 119,32 // ja ae26 <_sk_load_8888_sse2_lowp+0x56>
+ .byte 119,32 // ja ae02 <_sk_load_8888_sse2_lowp+0x56>
.byte 102,15,239,246 // pxor %xmm6,%xmm6
.byte 15,182,201 // movzbl %cl,%ecx
.byte 139,140,143,52,1,0,0 // mov 0x134(%edi,%ecx,4),%ecx
@@ -67556,14 +67528,14 @@ _sk_load_8888_sse2_lowp:
.byte 255,225 // jmp *%ecx
.byte 243,15,16,28,179 // movss (%ebx,%esi,4),%xmm3
.byte 15,87,246 // xorps %xmm6,%xmm6
- .byte 235,73 // jmp ae6f <_sk_load_8888_sse2_lowp+0x9f>
+ .byte 235,73 // jmp ae4b <_sk_load_8888_sse2_lowp+0x9f>
.byte 102,15,16,28,179 // movupd (%ebx,%esi,4),%xmm3
.byte 15,16,116,179,16 // movups 0x10(%ebx,%esi,4),%xmm6
- .byte 235,61 // jmp ae6f <_sk_load_8888_sse2_lowp+0x9f>
+ .byte 235,61 // jmp ae4b <_sk_load_8888_sse2_lowp+0x9f>
.byte 102,15,110,68,179,8 // movd 0x8(%ebx,%esi,4),%xmm0
.byte 102,15,112,216,69 // pshufd $0x45,%xmm0,%xmm3
.byte 102,15,18,28,179 // movlpd (%ebx,%esi,4),%xmm3
- .byte 235,43 // jmp ae6f <_sk_load_8888_sse2_lowp+0x9f>
+ .byte 235,43 // jmp ae4b <_sk_load_8888_sse2_lowp+0x9f>
.byte 102,15,110,68,179,24 // movd 0x18(%ebx,%esi,4),%xmm0
.byte 102,15,112,240,69 // pshufd $0x45,%xmm0,%xmm6
.byte 243,15,16,68,179,20 // movss 0x14(%ebx,%esi,4),%xmm0
@@ -67580,7 +67552,7 @@ _sk_load_8888_sse2_lowp:
.byte 102,15,114,240,16 // pslld $0x10,%xmm0
.byte 102,15,114,224,16 // psrad $0x10,%xmm0
.byte 102,15,107,200 // packssdw %xmm0,%xmm1
- .byte 102,15,111,175,176,37,0,0 // movdqa 0x25b0(%edi),%xmm5
+ .byte 102,15,111,175,180,37,0,0 // movdqa 0x25b4(%edi),%xmm5
.byte 102,15,111,193 // movdqa %xmm1,%xmm0
.byte 102,15,219,197 // pand %xmm5,%xmm0
.byte 102,15,113,209,8 // psrlw $0x8,%xmm1
@@ -67660,10 +67632,10 @@ _sk_load_8888_dst_sse2_lowp:
.byte 128,225,7 // and $0x7,%cl
.byte 254,201 // dec %cl
.byte 128,249,6 // cmp $0x6,%cl
- .byte 232,0,0,0,0 // call af8d <_sk_load_8888_dst_sse2_lowp+0x3d>
+ .byte 232,0,0,0,0 // call af69 <_sk_load_8888_dst_sse2_lowp+0x3d>
.byte 95 // pop %edi
.byte 139,117,16 // mov 0x10(%ebp),%esi
- .byte 119,32 // ja afb3 <_sk_load_8888_dst_sse2_lowp+0x63>
+ .byte 119,32 // ja af8f <_sk_load_8888_dst_sse2_lowp+0x63>
.byte 102,15,239,219 // pxor %xmm3,%xmm3
.byte 15,182,201 // movzbl %cl,%ecx
.byte 139,140,143,59,1,0,0 // mov 0x13b(%edi,%ecx,4),%ecx
@@ -67672,14 +67644,14 @@ _sk_load_8888_dst_sse2_lowp:
.byte 255,225 // jmp *%ecx
.byte 243,15,16,60,179 // movss (%ebx,%esi,4),%xmm7
.byte 15,87,219 // xorps %xmm3,%xmm3
- .byte 235,73 // jmp affc <_sk_load_8888_dst_sse2_lowp+0xac>
+ .byte 235,73 // jmp afd8 <_sk_load_8888_dst_sse2_lowp+0xac>
.byte 102,15,16,60,179 // movupd (%ebx,%esi,4),%xmm7
.byte 15,16,92,179,16 // movups 0x10(%ebx,%esi,4),%xmm3
- .byte 235,61 // jmp affc <_sk_load_8888_dst_sse2_lowp+0xac>
+ .byte 235,61 // jmp afd8 <_sk_load_8888_dst_sse2_lowp+0xac>
.byte 102,15,110,84,179,8 // movd 0x8(%ebx,%esi,4),%xmm2
.byte 102,15,112,250,69 // pshufd $0x45,%xmm2,%xmm7
.byte 102,15,18,60,179 // movlpd (%ebx,%esi,4),%xmm7
- .byte 235,43 // jmp affc <_sk_load_8888_dst_sse2_lowp+0xac>
+ .byte 235,43 // jmp afd8 <_sk_load_8888_dst_sse2_lowp+0xac>
.byte 102,15,110,84,179,24 // movd 0x18(%ebx,%esi,4),%xmm2
.byte 102,15,112,218,69 // pshufd $0x45,%xmm2,%xmm3
.byte 243,15,16,84,179,20 // movss 0x14(%ebx,%esi,4),%xmm2
@@ -67696,7 +67668,7 @@ _sk_load_8888_dst_sse2_lowp:
.byte 102,15,114,242,16 // pslld $0x10,%xmm2
.byte 102,15,114,226,16 // psrad $0x10,%xmm2
.byte 102,15,107,242 // packssdw %xmm2,%xmm6
- .byte 102,15,111,151,35,36,0,0 // movdqa 0x2423(%edi),%xmm2
+ .byte 102,15,111,151,39,36,0,0 // movdqa 0x2427(%edi),%xmm2
.byte 102,15,111,206 // movdqa %xmm6,%xmm1
.byte 102,15,219,202 // pand %xmm2,%xmm1
.byte 102,15,113,214,8 // psrlw $0x8,%xmm6
@@ -67790,19 +67762,19 @@ _sk_store_8888_sse2_lowp:
.byte 128,227,7 // and $0x7,%bl
.byte 254,203 // dec %bl
.byte 128,251,6 // cmp $0x6,%bl
- .byte 232,0,0,0,0 // call b158 <_sk_store_8888_sse2_lowp+0x74>
+ .byte 232,0,0,0,0 // call b134 <_sk_store_8888_sse2_lowp+0x74>
.byte 89 // pop %ecx
.byte 139,117,16 // mov 0x10(%ebp),%esi
.byte 15,40,109,40 // movaps 0x28(%ebp),%xmm5
- .byte 119,19 // ja b175 <_sk_store_8888_sse2_lowp+0x91>
+ .byte 119,19 // ja b151 <_sk_store_8888_sse2_lowp+0x91>
.byte 15,182,219 // movzbl %bl,%ebx
.byte 3,140,153,184,0,0,0 // add 0xb8(%ecx,%ebx,4),%ecx
.byte 255,225 // jmp *%ecx
.byte 102,15,126,60,183 // movd %xmm7,(%edi,%esi,4)
- .byte 235,93 // jmp b1d2 <_sk_store_8888_sse2_lowp+0xee>
+ .byte 235,93 // jmp b1ae <_sk_store_8888_sse2_lowp+0xee>
.byte 243,15,127,60,183 // movdqu %xmm7,(%edi,%esi,4)
.byte 243,15,127,116,183,16 // movdqu %xmm6,0x10(%edi,%esi,4)
- .byte 235,80 // jmp b1d2 <_sk_store_8888_sse2_lowp+0xee>
+ .byte 235,80 // jmp b1ae <_sk_store_8888_sse2_lowp+0xee>
.byte 102,15,111,244 // movdqa %xmm4,%xmm6
.byte 15,40,227 // movaps %xmm3,%xmm4
.byte 102,15,112,223,78 // pshufd $0x4e,%xmm7,%xmm3
@@ -67810,7 +67782,7 @@ _sk_store_8888_sse2_lowp:
.byte 15,40,220 // movaps %xmm4,%xmm3
.byte 102,15,111,230 // movdqa %xmm6,%xmm4
.byte 102,15,214,60,183 // movq %xmm7,(%edi,%esi,4)
- .byte 235,48 // jmp b1d2 <_sk_store_8888_sse2_lowp+0xee>
+ .byte 235,48 // jmp b1ae <_sk_store_8888_sse2_lowp+0xee>
.byte 102,15,112,222,78 // pshufd $0x4e,%xmm6,%xmm3
.byte 102,15,126,92,183,24 // movd %xmm3,0x18(%edi,%esi,4)
.byte 15,40,93,72 // movaps 0x48(%ebp),%xmm3
@@ -67847,7 +67819,7 @@ _sk_store_8888_sse2_lowp:
.byte 0,0 // add %al,(%eax)
.byte 42,0 // sub (%eax),%al
.byte 0,0 // add %al,(%eax)
- .byte 117,0 // jne b21e <_sk_store_8888_sse2_lowp+0x13a>
+ .byte 117,0 // jne b1fa <_sk_store_8888_sse2_lowp+0x13a>
.byte 0,0 // add %al,(%eax)
.byte 111 // outsl %ds:(%esi),(%dx)
.byte 0,0 // add %al,(%eax)
@@ -67879,10 +67851,10 @@ _sk_load_bgra_sse2_lowp:
.byte 128,225,7 // and $0x7,%cl
.byte 254,201 // dec %cl
.byte 128,249,6 // cmp $0x6,%cl
- .byte 232,0,0,0,0 // call b25c <_sk_load_bgra_sse2_lowp+0x30>
+ .byte 232,0,0,0,0 // call b238 <_sk_load_bgra_sse2_lowp+0x30>
.byte 95 // pop %edi
.byte 139,117,16 // mov 0x10(%ebp),%esi
- .byte 119,32 // ja b282 <_sk_load_bgra_sse2_lowp+0x56>
+ .byte 119,32 // ja b25e <_sk_load_bgra_sse2_lowp+0x56>
.byte 102,15,239,246 // pxor %xmm6,%xmm6
.byte 15,182,201 // movzbl %cl,%ecx
.byte 139,140,143,52,1,0,0 // mov 0x134(%edi,%ecx,4),%ecx
@@ -67891,14 +67863,14 @@ _sk_load_bgra_sse2_lowp:
.byte 255,225 // jmp *%ecx
.byte 243,15,16,28,179 // movss (%ebx,%esi,4),%xmm3
.byte 15,87,246 // xorps %xmm6,%xmm6
- .byte 235,73 // jmp b2cb <_sk_load_bgra_sse2_lowp+0x9f>
+ .byte 235,73 // jmp b2a7 <_sk_load_bgra_sse2_lowp+0x9f>
.byte 102,15,16,28,179 // movupd (%ebx,%esi,4),%xmm3
.byte 15,16,116,179,16 // movups 0x10(%ebx,%esi,4),%xmm6
- .byte 235,61 // jmp b2cb <_sk_load_bgra_sse2_lowp+0x9f>
+ .byte 235,61 // jmp b2a7 <_sk_load_bgra_sse2_lowp+0x9f>
.byte 102,15,110,68,179,8 // movd 0x8(%ebx,%esi,4),%xmm0
.byte 102,15,112,216,69 // pshufd $0x45,%xmm0,%xmm3
.byte 102,15,18,28,179 // movlpd (%ebx,%esi,4),%xmm3
- .byte 235,43 // jmp b2cb <_sk_load_bgra_sse2_lowp+0x9f>
+ .byte 235,43 // jmp b2a7 <_sk_load_bgra_sse2_lowp+0x9f>
.byte 102,15,110,68,179,24 // movd 0x18(%ebx,%esi,4),%xmm0
.byte 102,15,112,240,69 // pshufd $0x45,%xmm0,%xmm6
.byte 243,15,16,68,179,20 // movss 0x14(%ebx,%esi,4),%xmm0
@@ -67915,7 +67887,7 @@ _sk_load_bgra_sse2_lowp:
.byte 102,15,114,240,16 // pslld $0x10,%xmm0
.byte 102,15,114,224,16 // psrad $0x10,%xmm0
.byte 102,15,107,200 // packssdw %xmm0,%xmm1
- .byte 102,15,111,175,84,33,0,0 // movdqa 0x2154(%edi),%xmm5
+ .byte 102,15,111,175,88,33,0,0 // movdqa 0x2158(%edi),%xmm5
.byte 102,15,111,209 // movdqa %xmm1,%xmm2
.byte 102,15,219,213 // pand %xmm5,%xmm2
.byte 102,15,113,209,8 // psrlw $0x8,%xmm1
@@ -67995,10 +67967,10 @@ _sk_load_bgra_dst_sse2_lowp:
.byte 128,225,7 // and $0x7,%cl
.byte 254,201 // dec %cl
.byte 128,249,6 // cmp $0x6,%cl
- .byte 232,0,0,0,0 // call b3e9 <_sk_load_bgra_dst_sse2_lowp+0x3d>
+ .byte 232,0,0,0,0 // call b3c5 <_sk_load_bgra_dst_sse2_lowp+0x3d>
.byte 95 // pop %edi
.byte 139,117,16 // mov 0x10(%ebp),%esi
- .byte 119,32 // ja b40f <_sk_load_bgra_dst_sse2_lowp+0x63>
+ .byte 119,32 // ja b3eb <_sk_load_bgra_dst_sse2_lowp+0x63>
.byte 102,15,239,219 // pxor %xmm3,%xmm3
.byte 15,182,201 // movzbl %cl,%ecx
.byte 139,140,143,59,1,0,0 // mov 0x13b(%edi,%ecx,4),%ecx
@@ -68007,14 +67979,14 @@ _sk_load_bgra_dst_sse2_lowp:
.byte 255,225 // jmp *%ecx
.byte 243,15,16,60,179 // movss (%ebx,%esi,4),%xmm7
.byte 15,87,219 // xorps %xmm3,%xmm3
- .byte 235,73 // jmp b458 <_sk_load_bgra_dst_sse2_lowp+0xac>
+ .byte 235,73 // jmp b434 <_sk_load_bgra_dst_sse2_lowp+0xac>
.byte 102,15,16,60,179 // movupd (%ebx,%esi,4),%xmm7
.byte 15,16,92,179,16 // movups 0x10(%ebx,%esi,4),%xmm3
- .byte 235,61 // jmp b458 <_sk_load_bgra_dst_sse2_lowp+0xac>
+ .byte 235,61 // jmp b434 <_sk_load_bgra_dst_sse2_lowp+0xac>
.byte 102,15,110,84,179,8 // movd 0x8(%ebx,%esi,4),%xmm2
.byte 102,15,112,250,69 // pshufd $0x45,%xmm2,%xmm7
.byte 102,15,18,60,179 // movlpd (%ebx,%esi,4),%xmm7
- .byte 235,43 // jmp b458 <_sk_load_bgra_dst_sse2_lowp+0xac>
+ .byte 235,43 // jmp b434 <_sk_load_bgra_dst_sse2_lowp+0xac>
.byte 102,15,110,84,179,24 // movd 0x18(%ebx,%esi,4),%xmm2
.byte 102,15,112,218,69 // pshufd $0x45,%xmm2,%xmm3
.byte 243,15,16,84,179,20 // movss 0x14(%ebx,%esi,4),%xmm2
@@ -68031,7 +68003,7 @@ _sk_load_bgra_dst_sse2_lowp:
.byte 102,15,114,242,16 // pslld $0x10,%xmm2
.byte 102,15,114,226,16 // psrad $0x10,%xmm2
.byte 102,15,107,242 // packssdw %xmm2,%xmm6
- .byte 102,15,111,151,199,31,0,0 // movdqa 0x1fc7(%edi),%xmm2
+ .byte 102,15,111,151,203,31,0,0 // movdqa 0x1fcb(%edi),%xmm2
.byte 102,15,111,206 // movdqa %xmm6,%xmm1
.byte 102,15,219,202 // pand %xmm2,%xmm1
.byte 102,15,113,214,8 // psrlw $0x8,%xmm6
@@ -68125,19 +68097,19 @@ _sk_store_bgra_sse2_lowp:
.byte 128,227,7 // and $0x7,%bl
.byte 254,203 // dec %bl
.byte 128,251,6 // cmp $0x6,%bl
- .byte 232,0,0,0,0 // call b5b4 <_sk_store_bgra_sse2_lowp+0x74>
+ .byte 232,0,0,0,0 // call b590 <_sk_store_bgra_sse2_lowp+0x74>
.byte 89 // pop %ecx
.byte 139,117,16 // mov 0x10(%ebp),%esi
.byte 15,40,109,40 // movaps 0x28(%ebp),%xmm5
- .byte 119,19 // ja b5d1 <_sk_store_bgra_sse2_lowp+0x91>
+ .byte 119,19 // ja b5ad <_sk_store_bgra_sse2_lowp+0x91>
.byte 15,182,219 // movzbl %bl,%ebx
.byte 3,140,153,184,0,0,0 // add 0xb8(%ecx,%ebx,4),%ecx
.byte 255,225 // jmp *%ecx
.byte 102,15,126,60,183 // movd %xmm7,(%edi,%esi,4)
- .byte 235,93 // jmp b62e <_sk_store_bgra_sse2_lowp+0xee>
+ .byte 235,93 // jmp b60a <_sk_store_bgra_sse2_lowp+0xee>
.byte 243,15,127,60,183 // movdqu %xmm7,(%edi,%esi,4)
.byte 243,15,127,116,183,16 // movdqu %xmm6,0x10(%edi,%esi,4)
- .byte 235,80 // jmp b62e <_sk_store_bgra_sse2_lowp+0xee>
+ .byte 235,80 // jmp b60a <_sk_store_bgra_sse2_lowp+0xee>
.byte 102,15,111,244 // movdqa %xmm4,%xmm6
.byte 15,40,227 // movaps %xmm3,%xmm4
.byte 102,15,112,223,78 // pshufd $0x4e,%xmm7,%xmm3
@@ -68145,7 +68117,7 @@ _sk_store_bgra_sse2_lowp:
.byte 15,40,220 // movaps %xmm4,%xmm3
.byte 102,15,111,230 // movdqa %xmm6,%xmm4
.byte 102,15,214,60,183 // movq %xmm7,(%edi,%esi,4)
- .byte 235,48 // jmp b62e <_sk_store_bgra_sse2_lowp+0xee>
+ .byte 235,48 // jmp b60a <_sk_store_bgra_sse2_lowp+0xee>
.byte 102,15,112,222,78 // pshufd $0x4e,%xmm6,%xmm3
.byte 102,15,126,92,183,24 // movd %xmm3,0x18(%edi,%esi,4)
.byte 15,40,93,72 // movaps 0x48(%ebp),%xmm3
@@ -68182,7 +68154,7 @@ _sk_store_bgra_sse2_lowp:
.byte 0,0 // add %al,(%eax)
.byte 42,0 // sub (%eax),%al
.byte 0,0 // add %al,(%eax)
- .byte 117,0 // jne b67a <_sk_store_bgra_sse2_lowp+0x13a>
+ .byte 117,0 // jne b656 <_sk_store_bgra_sse2_lowp+0x13a>
.byte 0,0 // add %al,(%eax)
.byte 111 // outsl %ds:(%esi),(%dx)
.byte 0,0 // add %al,(%eax)
@@ -68217,10 +68189,10 @@ _sk_load_565_sse2_lowp:
.byte 128,225,7 // and $0x7,%cl
.byte 254,201 // dec %cl
.byte 128,249,6 // cmp $0x6,%cl
- .byte 232,0,0,0,0 // call b6c3 <_sk_load_565_sse2_lowp+0x3b>
+ .byte 232,0,0,0,0 // call b69f <_sk_load_565_sse2_lowp+0x3b>
.byte 94 // pop %esi
.byte 139,125,16 // mov 0x10(%ebp),%edi
- .byte 119,28 // ja b6e5 <_sk_load_565_sse2_lowp+0x5d>
+ .byte 119,28 // ja b6c1 <_sk_load_565_sse2_lowp+0x5d>
.byte 102,15,239,192 // pxor %xmm0,%xmm0
.byte 15,182,201 // movzbl %cl,%ecx
.byte 139,140,142,245,0,0,0 // mov 0xf5(%esi,%ecx,4),%ecx
@@ -68228,14 +68200,14 @@ _sk_load_565_sse2_lowp:
.byte 255,225 // jmp *%ecx
.byte 15,183,12,123 // movzwl (%ebx,%edi,2),%ecx
.byte 102,15,110,193 // movd %ecx,%xmm0
- .byte 235,59 // jmp b720 <_sk_load_565_sse2_lowp+0x98>
+ .byte 235,59 // jmp b6fc <_sk_load_565_sse2_lowp+0x98>
.byte 243,15,111,4,123 // movdqu (%ebx,%edi,2),%xmm0
- .byte 235,52 // jmp b720 <_sk_load_565_sse2_lowp+0x98>
+ .byte 235,52 // jmp b6fc <_sk_load_565_sse2_lowp+0x98>
.byte 102,15,239,192 // pxor %xmm0,%xmm0
.byte 102,15,196,68,123,4,2 // pinsrw $0x2,0x4(%ebx,%edi,2),%xmm0
.byte 243,15,16,12,123 // movss (%ebx,%edi,2),%xmm1
.byte 243,15,16,193 // movss %xmm1,%xmm0
- .byte 235,30 // jmp b720 <_sk_load_565_sse2_lowp+0x98>
+ .byte 235,30 // jmp b6fc <_sk_load_565_sse2_lowp+0x98>
.byte 102,15,239,192 // pxor %xmm0,%xmm0
.byte 102,15,196,68,123,12,6 // pinsrw $0x6,0xc(%ebx,%edi,2),%xmm0
.byte 102,15,196,68,123,10,5 // pinsrw $0x5,0xa(%ebx,%edi,2),%xmm0
@@ -68243,11 +68215,11 @@ _sk_load_565_sse2_lowp:
.byte 102,15,18,4,123 // movlpd (%ebx,%edi,2),%xmm0
.byte 102,15,111,248 // movdqa %xmm0,%xmm7
.byte 102,15,113,215,8 // psrlw $0x8,%xmm7
- .byte 102,15,219,190,45,29,0,0 // pand 0x1d2d(%esi),%xmm7
+ .byte 102,15,219,190,49,29,0,0 // pand 0x1d31(%esi),%xmm7
.byte 102,15,111,200 // movdqa %xmm0,%xmm1
.byte 102,15,113,209,5 // psrlw $0x5,%xmm1
- .byte 102,15,219,142,61,29,0,0 // pand 0x1d3d(%esi),%xmm1
- .byte 102,15,111,150,77,29,0,0 // movdqa 0x1d4d(%esi),%xmm2
+ .byte 102,15,219,142,65,29,0,0 // pand 0x1d41(%esi),%xmm1
+ .byte 102,15,111,150,81,29,0,0 // movdqa 0x1d51(%esi),%xmm2
.byte 102,15,219,208 // pand %xmm0,%xmm2
.byte 102,15,113,208,13 // psrlw $0xd,%xmm0
.byte 102,15,235,199 // por %xmm7,%xmm0
@@ -68269,7 +68241,7 @@ _sk_load_565_sse2_lowp:
.byte 137,124,36,8 // mov %edi,0x8(%esp)
.byte 137,76,36,4 // mov %ecx,0x4(%esp)
.byte 137,20,36 // mov %edx,(%esp)
- .byte 15,40,158,237,28,0,0 // movaps 0x1ced(%esi),%xmm3
+ .byte 15,40,158,241,28,0,0 // movaps 0x1cf1(%esi),%xmm3
.byte 255,80,4 // call *0x4(%eax)
.byte 131,196,92 // add $0x5c,%esp
.byte 94 // pop %esi
@@ -68315,10 +68287,10 @@ _sk_load_565_dst_sse2_lowp:
.byte 128,225,7 // and $0x7,%cl
.byte 254,201 // dec %cl
.byte 128,249,6 // cmp $0x6,%cl
- .byte 232,0,0,0,0 // call b7ff <_sk_load_565_dst_sse2_lowp+0x2b>
+ .byte 232,0,0,0,0 // call b7db <_sk_load_565_dst_sse2_lowp+0x2b>
.byte 95 // pop %edi
.byte 139,117,16 // mov 0x10(%ebp),%esi
- .byte 119,28 // ja b821 <_sk_load_565_dst_sse2_lowp+0x4d>
+ .byte 119,28 // ja b7fd <_sk_load_565_dst_sse2_lowp+0x4d>
.byte 102,15,239,228 // pxor %xmm4,%xmm4
.byte 15,182,201 // movzbl %cl,%ecx
.byte 139,140,143,249,0,0,0 // mov 0xf9(%edi,%ecx,4),%ecx
@@ -68326,14 +68298,14 @@ _sk_load_565_dst_sse2_lowp:
.byte 255,225 // jmp *%ecx
.byte 15,183,12,115 // movzwl (%ebx,%esi,2),%ecx
.byte 102,15,110,225 // movd %ecx,%xmm4
- .byte 235,59 // jmp b85c <_sk_load_565_dst_sse2_lowp+0x88>
+ .byte 235,59 // jmp b838 <_sk_load_565_dst_sse2_lowp+0x88>
.byte 243,15,111,36,115 // movdqu (%ebx,%esi,2),%xmm4
- .byte 235,52 // jmp b85c <_sk_load_565_dst_sse2_lowp+0x88>
+ .byte 235,52 // jmp b838 <_sk_load_565_dst_sse2_lowp+0x88>
.byte 102,15,239,228 // pxor %xmm4,%xmm4
.byte 102,15,196,100,115,4,2 // pinsrw $0x2,0x4(%ebx,%esi,2),%xmm4
.byte 243,15,16,44,115 // movss (%ebx,%esi,2),%xmm5
.byte 243,15,16,229 // movss %xmm5,%xmm4
- .byte 235,30 // jmp b85c <_sk_load_565_dst_sse2_lowp+0x88>
+ .byte 235,30 // jmp b838 <_sk_load_565_dst_sse2_lowp+0x88>
.byte 102,15,239,228 // pxor %xmm4,%xmm4
.byte 102,15,196,100,115,12,6 // pinsrw $0x6,0xc(%ebx,%esi,2),%xmm4
.byte 102,15,196,100,115,10,5 // pinsrw $0x5,0xa(%ebx,%esi,2),%xmm4
@@ -68341,11 +68313,11 @@ _sk_load_565_dst_sse2_lowp:
.byte 102,15,18,36,115 // movlpd (%ebx,%esi,2),%xmm4
.byte 102,15,111,244 // movdqa %xmm4,%xmm6
.byte 102,15,113,214,8 // psrlw $0x8,%xmm6
- .byte 102,15,219,183,241,27,0,0 // pand 0x1bf1(%edi),%xmm6
+ .byte 102,15,219,183,245,27,0,0 // pand 0x1bf5(%edi),%xmm6
.byte 102,15,111,236 // movdqa %xmm4,%xmm5
.byte 102,15,113,213,5 // psrlw $0x5,%xmm5
- .byte 102,15,219,175,1,28,0,0 // pand 0x1c01(%edi),%xmm5
- .byte 102,15,111,191,17,28,0,0 // movdqa 0x1c11(%edi),%xmm7
+ .byte 102,15,219,175,5,28,0,0 // pand 0x1c05(%edi),%xmm5
+ .byte 102,15,111,191,21,28,0,0 // movdqa 0x1c15(%edi),%xmm7
.byte 102,15,219,252 // pand %xmm4,%xmm7
.byte 102,15,113,212,13 // psrlw $0xd,%xmm4
.byte 102,15,235,230 // por %xmm6,%xmm4
@@ -68358,7 +68330,7 @@ _sk_load_565_dst_sse2_lowp:
.byte 102,15,113,215,2 // psrlw $0x2,%xmm7
.byte 102,15,235,254 // por %xmm6,%xmm7
.byte 141,72,8 // lea 0x8(%eax),%ecx
- .byte 15,40,183,177,27,0,0 // movaps 0x1bb1(%edi),%xmm6
+ .byte 15,40,183,181,27,0,0 // movaps 0x1bb5(%edi),%xmm6
.byte 15,41,116,36,64 // movaps %xmm6,0x40(%esp)
.byte 139,125,20 // mov 0x14(%ebp),%edi
.byte 137,124,36,12 // mov %edi,0xc(%esp)
@@ -68403,15 +68375,15 @@ _sk_store_565_sse2_lowp:
.byte 86 // push %esi
.byte 131,236,92 // sub $0x5c,%esp
.byte 102,15,111,226 // movdqa %xmm2,%xmm4
- .byte 232,0,0,0,0 // call b926 <_sk_store_565_sse2_lowp+0x12>
+ .byte 232,0,0,0,0 // call b902 <_sk_store_565_sse2_lowp+0x12>
.byte 95 // pop %edi
.byte 15,40,109,72 // movaps 0x48(%ebp),%xmm5
.byte 102,15,111,208 // movdqa %xmm0,%xmm2
.byte 102,15,113,242,8 // psllw $0x8,%xmm2
- .byte 102,15,219,151,250,26,0,0 // pand 0x1afa(%edi),%xmm2
+ .byte 102,15,219,151,254,26,0,0 // pand 0x1afe(%edi),%xmm2
.byte 102,15,111,241 // movdqa %xmm1,%xmm6
.byte 102,15,113,246,3 // psllw $0x3,%xmm6
- .byte 102,15,219,183,10,27,0,0 // pand 0x1b0a(%edi),%xmm6
+ .byte 102,15,219,183,14,27,0,0 // pand 0x1b0e(%edi),%xmm6
.byte 102,15,235,242 // por %xmm2,%xmm6
.byte 102,15,111,212 // movdqa %xmm4,%xmm2
.byte 102,15,113,210,3 // psrlw $0x3,%xmm2
@@ -68430,19 +68402,19 @@ _sk_store_565_sse2_lowp:
.byte 128,249,6 // cmp $0x6,%cl
.byte 139,117,16 // mov 0x10(%ebp),%esi
.byte 15,40,125,24 // movaps 0x18(%ebp),%xmm7
- .byte 119,22 // ja b99e <_sk_store_565_sse2_lowp+0x8a>
+ .byte 119,22 // ja b97a <_sk_store_565_sse2_lowp+0x8a>
.byte 15,182,201 // movzbl %cl,%ecx
.byte 3,188,143,242,0,0,0 // add 0xf2(%edi,%ecx,4),%edi
.byte 255,231 // jmp *%edi
.byte 102,15,126,209 // movd %xmm2,%ecx
.byte 102,137,12,115 // mov %cx,(%ebx,%esi,2)
- .byte 235,59 // jmp b9d9 <_sk_store_565_sse2_lowp+0xc5>
+ .byte 235,59 // jmp b9b5 <_sk_store_565_sse2_lowp+0xc5>
.byte 243,15,127,20,115 // movdqu %xmm2,(%ebx,%esi,2)
- .byte 235,52 // jmp b9d9 <_sk_store_565_sse2_lowp+0xc5>
+ .byte 235,52 // jmp b9b5 <_sk_store_565_sse2_lowp+0xc5>
.byte 102,15,197,202,2 // pextrw $0x2,%xmm2,%ecx
.byte 102,137,76,115,4 // mov %cx,0x4(%ebx,%esi,2)
.byte 102,15,126,20,115 // movd %xmm2,(%ebx,%esi,2)
- .byte 235,35 // jmp b9d9 <_sk_store_565_sse2_lowp+0xc5>
+ .byte 235,35 // jmp b9b5 <_sk_store_565_sse2_lowp+0xc5>
.byte 102,15,197,202,6 // pextrw $0x6,%xmm2,%ecx
.byte 102,137,76,115,12 // mov %cx,0xc(%ebx,%esi,2)
.byte 102,15,197,202,5 // pextrw $0x5,%xmm2,%ecx
@@ -68504,10 +68476,10 @@ _sk_load_a8_sse2_lowp:
.byte 128,225,7 // and $0x7,%cl
.byte 254,201 // dec %cl
.byte 128,249,6 // cmp $0x6,%cl
- .byte 232,0,0,0,0 // call ba6e <_sk_load_a8_sse2_lowp+0x3a>
+ .byte 232,0,0,0,0 // call ba4a <_sk_load_a8_sse2_lowp+0x3a>
.byte 95 // pop %edi
.byte 139,117,16 // mov 0x10(%ebp),%esi
- .byte 119,28 // ja ba90 <_sk_load_a8_sse2_lowp+0x5c>
+ .byte 119,28 // ja ba6c <_sk_load_a8_sse2_lowp+0x5c>
.byte 102,15,239,219 // pxor %xmm3,%xmm3
.byte 15,182,201 // movzbl %cl,%ecx
.byte 139,140,143,198,0,0,0 // mov 0xc6(%edi,%ecx,4),%ecx
@@ -68515,10 +68487,10 @@ _sk_load_a8_sse2_lowp:
.byte 255,225 // jmp *%ecx
.byte 15,182,12,51 // movzbl (%ebx,%esi,1),%ecx
.byte 102,15,110,217 // movd %ecx,%xmm3
- .byte 235,90 // jmp baea <_sk_load_a8_sse2_lowp+0xb6>
+ .byte 235,90 // jmp bac6 <_sk_load_a8_sse2_lowp+0xb6>
.byte 243,15,126,28,51 // movq (%ebx,%esi,1),%xmm3
.byte 102,15,96,216 // punpcklbw %xmm0,%xmm3
- .byte 235,79 // jmp baea <_sk_load_a8_sse2_lowp+0xb6>
+ .byte 235,79 // jmp bac6 <_sk_load_a8_sse2_lowp+0xb6>
.byte 15,182,76,51,2 // movzbl 0x2(%ebx,%esi,1),%ecx
.byte 102,15,239,219 // pxor %xmm3,%xmm3
.byte 102,15,196,217,2 // pinsrw $0x2,%ecx,%xmm3
@@ -68526,7 +68498,7 @@ _sk_load_a8_sse2_lowp:
.byte 102,15,110,233 // movd %ecx,%xmm5
.byte 102,15,96,232 // punpcklbw %xmm0,%xmm5
.byte 243,15,16,221 // movss %xmm5,%xmm3
- .byte 235,47 // jmp baea <_sk_load_a8_sse2_lowp+0xb6>
+ .byte 235,47 // jmp bac6 <_sk_load_a8_sse2_lowp+0xb6>
.byte 15,182,76,51,6 // movzbl 0x6(%ebx,%esi,1),%ecx
.byte 102,15,239,219 // pxor %xmm3,%xmm3
.byte 102,15,196,217,6 // pinsrw $0x6,%ecx,%xmm3
@@ -68537,7 +68509,7 @@ _sk_load_a8_sse2_lowp:
.byte 102,15,110,44,51 // movd (%ebx,%esi,1),%xmm5
.byte 102,15,96,232 // punpcklbw %xmm0,%xmm5
.byte 242,15,16,221 // movsd %xmm5,%xmm3
- .byte 102,15,219,159,66,25,0,0 // pand 0x1942(%edi),%xmm3
+ .byte 102,15,219,159,70,25,0,0 // pand 0x1946(%edi),%xmm3
.byte 141,72,8 // lea 0x8(%eax),%ecx
.byte 15,41,100,36,64 // movaps %xmm4,0x40(%esp)
.byte 15,41,84,36,48 // movaps %xmm2,0x30(%esp)
@@ -68592,10 +68564,10 @@ _sk_load_a8_dst_sse2_lowp:
.byte 128,225,7 // and $0x7,%cl
.byte 254,201 // dec %cl
.byte 128,249,6 // cmp $0x6,%cl
- .byte 232,0,0,0,0 // call bb79 <_sk_load_a8_dst_sse2_lowp+0x29>
+ .byte 232,0,0,0,0 // call bb55 <_sk_load_a8_dst_sse2_lowp+0x29>
.byte 95 // pop %edi
.byte 139,117,16 // mov 0x10(%ebp),%esi
- .byte 119,28 // ja bb9b <_sk_load_a8_dst_sse2_lowp+0x4b>
+ .byte 119,28 // ja bb77 <_sk_load_a8_dst_sse2_lowp+0x4b>
.byte 102,15,239,228 // pxor %xmm4,%xmm4
.byte 15,182,201 // movzbl %cl,%ecx
.byte 139,140,143,195,0,0,0 // mov 0xc3(%edi,%ecx,4),%ecx
@@ -68603,10 +68575,10 @@ _sk_load_a8_dst_sse2_lowp:
.byte 255,225 // jmp *%ecx
.byte 15,182,12,51 // movzbl (%ebx,%esi,1),%ecx
.byte 102,15,110,225 // movd %ecx,%xmm4
- .byte 235,90 // jmp bbf5 <_sk_load_a8_dst_sse2_lowp+0xa5>
+ .byte 235,90 // jmp bbd1 <_sk_load_a8_dst_sse2_lowp+0xa5>
.byte 243,15,126,36,51 // movq (%ebx,%esi,1),%xmm4
.byte 102,15,96,224 // punpcklbw %xmm0,%xmm4
- .byte 235,79 // jmp bbf5 <_sk_load_a8_dst_sse2_lowp+0xa5>
+ .byte 235,79 // jmp bbd1 <_sk_load_a8_dst_sse2_lowp+0xa5>
.byte 15,182,76,51,2 // movzbl 0x2(%ebx,%esi,1),%ecx
.byte 102,15,239,228 // pxor %xmm4,%xmm4
.byte 102,15,196,225,2 // pinsrw $0x2,%ecx,%xmm4
@@ -68614,7 +68586,7 @@ _sk_load_a8_dst_sse2_lowp:
.byte 102,15,110,233 // movd %ecx,%xmm5
.byte 102,15,96,232 // punpcklbw %xmm0,%xmm5
.byte 243,15,16,229 // movss %xmm5,%xmm4
- .byte 235,47 // jmp bbf5 <_sk_load_a8_dst_sse2_lowp+0xa5>
+ .byte 235,47 // jmp bbd1 <_sk_load_a8_dst_sse2_lowp+0xa5>
.byte 15,182,76,51,6 // movzbl 0x6(%ebx,%esi,1),%ecx
.byte 102,15,239,228 // pxor %xmm4,%xmm4
.byte 102,15,196,225,6 // pinsrw $0x6,%ecx,%xmm4
@@ -68625,7 +68597,7 @@ _sk_load_a8_dst_sse2_lowp:
.byte 102,15,110,44,51 // movd (%ebx,%esi,1),%xmm5
.byte 102,15,96,232 // punpcklbw %xmm0,%xmm5
.byte 242,15,16,229 // movsd %xmm5,%xmm4
- .byte 102,15,219,167,55,24,0,0 // pand 0x1837(%edi),%xmm4
+ .byte 102,15,219,167,59,24,0,0 // pand 0x183b(%edi),%xmm4
.byte 141,72,8 // lea 0x8(%eax),%ecx
.byte 102,15,127,100,36,64 // movdqa %xmm4,0x40(%esp)
.byte 102,15,239,228 // pxor %xmm4,%xmm4
@@ -68682,32 +68654,32 @@ _sk_store_a8_sse2_lowp:
.byte 128,225,7 // and $0x7,%cl
.byte 254,201 // dec %cl
.byte 128,249,6 // cmp $0x6,%cl
- .byte 232,0,0,0,0 // call bc91 <_sk_store_a8_sse2_lowp+0x39>
+ .byte 232,0,0,0,0 // call bc6d <_sk_store_a8_sse2_lowp+0x39>
.byte 91 // pop %ebx
.byte 139,117,16 // mov 0x10(%ebp),%esi
- .byte 119,26 // ja bcb1 <_sk_store_a8_sse2_lowp+0x59>
+ .byte 119,26 // ja bc8d <_sk_store_a8_sse2_lowp+0x59>
.byte 15,182,201 // movzbl %cl,%ecx
.byte 139,140,139,223,0,0,0 // mov 0xdf(%ebx,%ecx,4),%ecx
.byte 1,217 // add %ebx,%ecx
.byte 255,225 // jmp *%ecx
.byte 102,15,126,217 // movd %xmm3,%ecx
.byte 136,12,55 // mov %cl,(%edi,%esi,1)
- .byte 233,136,0,0,0 // jmp bd39 <_sk_store_a8_sse2_lowp+0xe1>
- .byte 102,15,111,163,31,23,0,0 // movdqa 0x171f(%ebx),%xmm4
+ .byte 233,136,0,0,0 // jmp bd15 <_sk_store_a8_sse2_lowp+0xe1>
+ .byte 102,15,111,163,35,23,0,0 // movdqa 0x1723(%ebx),%xmm4
.byte 102,15,219,227 // pand %xmm3,%xmm4
.byte 102,15,103,228 // packuswb %xmm4,%xmm4
.byte 102,15,214,36,55 // movq %xmm4,(%edi,%esi,1)
.byte 15,40,101,24 // movaps 0x18(%ebp),%xmm4
- .byte 235,109 // jmp bd39 <_sk_store_a8_sse2_lowp+0xe1>
+ .byte 235,109 // jmp bd15 <_sk_store_a8_sse2_lowp+0xe1>
.byte 102,15,197,203,2 // pextrw $0x2,%xmm3,%ecx
.byte 136,76,55,2 // mov %cl,0x2(%edi,%esi,1)
- .byte 102,15,111,163,31,23,0,0 // movdqa 0x171f(%ebx),%xmm4
+ .byte 102,15,111,163,35,23,0,0 // movdqa 0x1723(%ebx),%xmm4
.byte 102,15,219,227 // pand %xmm3,%xmm4
.byte 102,15,103,228 // packuswb %xmm4,%xmm4
.byte 102,15,126,225 // movd %xmm4,%ecx
.byte 15,40,101,24 // movaps 0x18(%ebp),%xmm4
.byte 102,137,12,55 // mov %cx,(%edi,%esi,1)
- .byte 235,70 // jmp bd39 <_sk_store_a8_sse2_lowp+0xe1>
+ .byte 235,70 // jmp bd15 <_sk_store_a8_sse2_lowp+0xe1>
.byte 102,15,197,203,6 // pextrw $0x6,%xmm3,%ecx
.byte 136,76,55,6 // mov %cl,0x6(%edi,%esi,1)
.byte 102,15,197,203,5 // pextrw $0x5,%xmm3,%ecx
@@ -68717,7 +68689,7 @@ _sk_store_a8_sse2_lowp:
.byte 15,40,254 // movaps %xmm6,%xmm7
.byte 15,40,245 // movaps %xmm5,%xmm6
.byte 15,40,236 // movaps %xmm4,%xmm5
- .byte 102,15,111,163,31,23,0,0 // movdqa 0x171f(%ebx),%xmm4
+ .byte 102,15,111,163,35,23,0,0 // movdqa 0x1723(%ebx),%xmm4
.byte 102,15,219,227 // pand %xmm3,%xmm4
.byte 102,15,103,228 // packuswb %xmm4,%xmm4
.byte 102,15,126,36,55 // movd %xmm4,(%edi,%esi,1)
@@ -68751,7 +68723,7 @@ _sk_store_a8_sse2_lowp:
.byte 0,0 // add %al,(%eax)
.byte 0,125,0 // add %bh,0x0(%ebp)
.byte 0,0 // add %al,(%eax)
- .byte 116,0 // je bd82 <_sk_store_a8_sse2_lowp+0x12a>
+ .byte 116,0 // je bd5e <_sk_store_a8_sse2_lowp+0x12a>
.byte 0,0 // add %al,(%eax)
.byte 107,0,0 // imul $0x0,(%eax),%eax
.byte 0,98,0 // add %ah,0x0(%edx)
@@ -68781,10 +68753,10 @@ _sk_load_g8_sse2_lowp:
.byte 128,225,7 // and $0x7,%cl
.byte 254,201 // dec %cl
.byte 128,249,6 // cmp $0x6,%cl
- .byte 232,0,0,0,0 // call bdc5 <_sk_load_g8_sse2_lowp+0x39>
+ .byte 232,0,0,0,0 // call bda1 <_sk_load_g8_sse2_lowp+0x39>
.byte 94 // pop %esi
.byte 139,125,16 // mov 0x10(%ebp),%edi
- .byte 119,28 // ja bde7 <_sk_load_g8_sse2_lowp+0x5b>
+ .byte 119,28 // ja bdc3 <_sk_load_g8_sse2_lowp+0x5b>
.byte 102,15,239,192 // pxor %xmm0,%xmm0
.byte 15,182,201 // movzbl %cl,%ecx
.byte 139,140,142,199,0,0,0 // mov 0xc7(%esi,%ecx,4),%ecx
@@ -68792,10 +68764,10 @@ _sk_load_g8_sse2_lowp:
.byte 255,225 // jmp *%ecx
.byte 15,182,12,59 // movzbl (%ebx,%edi,1),%ecx
.byte 102,15,110,193 // movd %ecx,%xmm0
- .byte 235,90 // jmp be41 <_sk_load_g8_sse2_lowp+0xb5>
+ .byte 235,90 // jmp be1d <_sk_load_g8_sse2_lowp+0xb5>
.byte 243,15,126,4,59 // movq (%ebx,%edi,1),%xmm0
.byte 102,15,96,192 // punpcklbw %xmm0,%xmm0
- .byte 235,79 // jmp be41 <_sk_load_g8_sse2_lowp+0xb5>
+ .byte 235,79 // jmp be1d <_sk_load_g8_sse2_lowp+0xb5>
.byte 15,182,76,59,2 // movzbl 0x2(%ebx,%edi,1),%ecx
.byte 102,15,239,192 // pxor %xmm0,%xmm0
.byte 102,15,196,193,2 // pinsrw $0x2,%ecx,%xmm0
@@ -68803,7 +68775,7 @@ _sk_load_g8_sse2_lowp:
.byte 102,15,110,233 // movd %ecx,%xmm5
.byte 102,15,96,232 // punpcklbw %xmm0,%xmm5
.byte 243,15,16,197 // movss %xmm5,%xmm0
- .byte 235,47 // jmp be41 <_sk_load_g8_sse2_lowp+0xb5>
+ .byte 235,47 // jmp be1d <_sk_load_g8_sse2_lowp+0xb5>
.byte 15,182,76,59,6 // movzbl 0x6(%ebx,%edi,1),%ecx
.byte 102,15,239,192 // pxor %xmm0,%xmm0
.byte 102,15,196,193,6 // pinsrw $0x6,%ecx,%xmm0
@@ -68814,7 +68786,7 @@ _sk_load_g8_sse2_lowp:
.byte 102,15,110,44,59 // movd (%ebx,%edi,1),%xmm5
.byte 102,15,96,232 // punpcklbw %xmm0,%xmm5
.byte 242,15,16,197 // movsd %xmm5,%xmm0
- .byte 102,15,219,134,235,21,0,0 // pand 0x15eb(%esi),%xmm0
+ .byte 102,15,219,134,239,21,0,0 // pand 0x15ef(%esi),%xmm0
.byte 141,72,8 // lea 0x8(%eax),%ecx
.byte 15,41,100,36,64 // movaps %xmm4,0x40(%esp)
.byte 15,41,92,36,48 // movaps %xmm3,0x30(%esp)
@@ -68825,7 +68797,7 @@ _sk_load_g8_sse2_lowp:
.byte 137,124,36,8 // mov %edi,0x8(%esp)
.byte 137,76,36,4 // mov %ecx,0x4(%esp)
.byte 137,20,36 // mov %edx,(%esp)
- .byte 15,40,158,235,21,0,0 // movaps 0x15eb(%esi),%xmm3
+ .byte 15,40,158,239,21,0,0 // movaps 0x15ef(%esi),%xmm3
.byte 102,15,111,200 // movdqa %xmm0,%xmm1
.byte 102,15,111,208 // movdqa %xmm0,%xmm2
.byte 255,80,4 // call *0x4(%eax)
@@ -68868,10 +68840,10 @@ _sk_load_g8_dst_sse2_lowp:
.byte 128,225,7 // and $0x7,%cl
.byte 254,201 // dec %cl
.byte 128,249,6 // cmp $0x6,%cl
- .byte 232,0,0,0,0 // call bed1 <_sk_load_g8_dst_sse2_lowp+0x29>
+ .byte 232,0,0,0,0 // call bead <_sk_load_g8_dst_sse2_lowp+0x29>
.byte 95 // pop %edi
.byte 139,117,16 // mov 0x10(%ebp),%esi
- .byte 119,28 // ja bef3 <_sk_load_g8_dst_sse2_lowp+0x4b>
+ .byte 119,28 // ja becf <_sk_load_g8_dst_sse2_lowp+0x4b>
.byte 102,15,239,228 // pxor %xmm4,%xmm4
.byte 15,182,201 // movzbl %cl,%ecx
.byte 139,140,143,195,0,0,0 // mov 0xc3(%edi,%ecx,4),%ecx
@@ -68879,10 +68851,10 @@ _sk_load_g8_dst_sse2_lowp:
.byte 255,225 // jmp *%ecx
.byte 15,182,12,51 // movzbl (%ebx,%esi,1),%ecx
.byte 102,15,110,225 // movd %ecx,%xmm4
- .byte 235,90 // jmp bf4d <_sk_load_g8_dst_sse2_lowp+0xa5>
+ .byte 235,90 // jmp bf29 <_sk_load_g8_dst_sse2_lowp+0xa5>
.byte 243,15,126,36,51 // movq (%ebx,%esi,1),%xmm4
.byte 102,15,96,224 // punpcklbw %xmm0,%xmm4
- .byte 235,79 // jmp bf4d <_sk_load_g8_dst_sse2_lowp+0xa5>
+ .byte 235,79 // jmp bf29 <_sk_load_g8_dst_sse2_lowp+0xa5>
.byte 15,182,76,51,2 // movzbl 0x2(%ebx,%esi,1),%ecx
.byte 102,15,239,228 // pxor %xmm4,%xmm4
.byte 102,15,196,225,2 // pinsrw $0x2,%ecx,%xmm4
@@ -68890,7 +68862,7 @@ _sk_load_g8_dst_sse2_lowp:
.byte 102,15,110,233 // movd %ecx,%xmm5
.byte 102,15,96,232 // punpcklbw %xmm0,%xmm5
.byte 243,15,16,229 // movss %xmm5,%xmm4
- .byte 235,47 // jmp bf4d <_sk_load_g8_dst_sse2_lowp+0xa5>
+ .byte 235,47 // jmp bf29 <_sk_load_g8_dst_sse2_lowp+0xa5>
.byte 15,182,76,51,6 // movzbl 0x6(%ebx,%esi,1),%ecx
.byte 102,15,239,228 // pxor %xmm4,%xmm4
.byte 102,15,196,225,6 // pinsrw $0x6,%ecx,%xmm4
@@ -68901,9 +68873,9 @@ _sk_load_g8_dst_sse2_lowp:
.byte 102,15,110,44,51 // movd (%ebx,%esi,1),%xmm5
.byte 102,15,96,232 // punpcklbw %xmm0,%xmm5
.byte 242,15,16,229 // movsd %xmm5,%xmm4
- .byte 102,15,219,167,223,20,0,0 // pand 0x14df(%edi),%xmm4
+ .byte 102,15,219,167,227,20,0,0 // pand 0x14e3(%edi),%xmm4
.byte 141,72,8 // lea 0x8(%eax),%ecx
- .byte 15,40,175,223,20,0,0 // movaps 0x14df(%edi),%xmm5
+ .byte 15,40,175,227,20,0,0 // movaps 0x14e3(%edi),%xmm5
.byte 15,41,108,36,64 // movaps %xmm5,0x40(%esp)
.byte 102,15,127,100,36,48 // movdqa %xmm4,0x30(%esp)
.byte 102,15,127,100,36,32 // movdqa %xmm4,0x20(%esp)
@@ -68944,7 +68916,7 @@ _sk_luminance_to_alpha_sse2_lowp:
.byte 86 // push %esi
.byte 131,236,80 // sub $0x50,%esp
.byte 102,15,111,218 // movdqa %xmm2,%xmm3
- .byte 232,0,0,0,0 // call bfc1 <_sk_luminance_to_alpha_sse2_lowp+0x11>
+ .byte 232,0,0,0,0 // call bf9d <_sk_luminance_to_alpha_sse2_lowp+0x11>
.byte 88 // pop %eax
.byte 139,77,8 // mov 0x8(%ebp),%ecx
.byte 139,85,16 // mov 0x10(%ebp),%edx
@@ -68954,10 +68926,10 @@ _sk_luminance_to_alpha_sse2_lowp:
.byte 15,40,109,56 // movaps 0x38(%ebp),%xmm5
.byte 15,40,117,72 // movaps 0x48(%ebp),%xmm6
.byte 139,125,12 // mov 0xc(%ebp),%edi
- .byte 102,15,213,128,127,20,0,0 // pmullw 0x147f(%eax),%xmm0
- .byte 102,15,213,136,143,20,0,0 // pmullw 0x148f(%eax),%xmm1
+ .byte 102,15,213,128,131,20,0,0 // pmullw 0x1483(%eax),%xmm0
+ .byte 102,15,213,136,147,20,0,0 // pmullw 0x1493(%eax),%xmm1
.byte 102,15,253,200 // paddw %xmm0,%xmm1
- .byte 102,15,213,152,159,20,0,0 // pmullw 0x149f(%eax),%xmm3
+ .byte 102,15,213,152,163,20,0,0 // pmullw 0x14a3(%eax),%xmm3
.byte 102,15,253,217 // paddw %xmm1,%xmm3
.byte 102,15,113,211,8 // psrlw $0x8,%xmm3
.byte 141,71,4 // lea 0x4(%edi),%eax
@@ -68988,15 +68960,15 @@ _sk_scale_1_float_sse2_lowp:
.byte 87 // push %edi
.byte 86 // push %esi
.byte 131,236,80 // sub $0x50,%esp
- .byte 232,0,0,0,0 // call c04a <_sk_scale_1_float_sse2_lowp+0xd>
+ .byte 232,0,0,0,0 // call c026 <_sk_scale_1_float_sse2_lowp+0xd>
.byte 94 // pop %esi
.byte 139,69,8 // mov 0x8(%ebp),%eax
.byte 139,85,16 // mov 0x10(%ebp),%edx
.byte 139,77,12 // mov 0xc(%ebp),%ecx
.byte 139,57 // mov (%ecx),%edi
.byte 243,15,16,39 // movss (%edi),%xmm4
- .byte 243,15,89,166,42,20,0,0 // mulss 0x142a(%esi),%xmm4
- .byte 243,15,88,166,38,20,0,0 // addss 0x1426(%esi),%xmm4
+ .byte 243,15,89,166,46,20,0,0 // mulss 0x142e(%esi),%xmm4
+ .byte 243,15,88,166,42,20,0,0 // addss 0x142a(%esi),%xmm4
.byte 243,15,44,252 // cvttss2si %xmm4,%edi
.byte 102,15,110,239 // movd %edi,%xmm5
.byte 139,125,20 // mov 0x14(%ebp),%edi
@@ -69009,7 +68981,7 @@ _sk_scale_1_float_sse2_lowp:
.byte 102,15,213,205 // pmullw %xmm5,%xmm1
.byte 102,15,213,213 // pmullw %xmm5,%xmm2
.byte 102,15,213,221 // pmullw %xmm5,%xmm3
- .byte 102,15,111,174,102,19,0,0 // movdqa 0x1366(%esi),%xmm5
+ .byte 102,15,111,174,106,19,0,0 // movdqa 0x136a(%esi),%xmm5
.byte 102,15,253,197 // paddw %xmm5,%xmm0
.byte 102,15,253,205 // paddw %xmm5,%xmm1
.byte 102,15,253,213 // paddw %xmm5,%xmm2
@@ -69048,19 +69020,19 @@ _sk_lerp_1_float_sse2_lowp:
.byte 102,15,111,218 // movdqa %xmm2,%xmm3
.byte 102,15,111,209 // movdqa %xmm1,%xmm2
.byte 102,15,111,200 // movdqa %xmm0,%xmm1
- .byte 232,0,0,0,0 // call c118 <_sk_lerp_1_float_sse2_lowp+0x1d>
+ .byte 232,0,0,0,0 // call c0f4 <_sk_lerp_1_float_sse2_lowp+0x1d>
.byte 89 // pop %ecx
.byte 102,15,111,109,24 // movdqa 0x18(%ebp),%xmm5
.byte 139,69,12 // mov 0xc(%ebp),%eax
.byte 139,16 // mov (%eax),%edx
.byte 243,15,16,50 // movss (%edx),%xmm6
- .byte 243,15,89,177,92,19,0,0 // mulss 0x135c(%ecx),%xmm6
- .byte 243,15,88,177,88,19,0,0 // addss 0x1358(%ecx),%xmm6
+ .byte 243,15,89,177,96,19,0,0 // mulss 0x1360(%ecx),%xmm6
+ .byte 243,15,88,177,92,19,0,0 // addss 0x135c(%ecx),%xmm6
.byte 243,15,44,214 // cvttss2si %xmm6,%edx
.byte 102,15,110,242 // movd %edx,%xmm6
.byte 242,15,112,246,0 // pshuflw $0x0,%xmm6,%xmm6
.byte 102,15,112,246,80 // pshufd $0x50,%xmm6,%xmm6
- .byte 102,15,111,129,152,18,0,0 // movdqa 0x1298(%ecx),%xmm0
+ .byte 102,15,111,129,156,18,0,0 // movdqa 0x129c(%ecx),%xmm0
.byte 102,15,213,206 // pmullw %xmm6,%xmm1
.byte 102,15,253,200 // paddw %xmm0,%xmm1
.byte 102,15,213,214 // pmullw %xmm6,%xmm2
@@ -69133,10 +69105,10 @@ _sk_scale_u8_sse2_lowp:
.byte 128,225,7 // and $0x7,%cl
.byte 254,201 // dec %cl
.byte 128,249,6 // cmp $0x6,%cl
- .byte 232,0,0,0,0 // call c241 <_sk_scale_u8_sse2_lowp+0x31>
+ .byte 232,0,0,0,0 // call c21d <_sk_scale_u8_sse2_lowp+0x31>
.byte 95 // pop %edi
.byte 139,117,16 // mov 0x10(%ebp),%esi
- .byte 119,28 // ja c263 <_sk_scale_u8_sse2_lowp+0x53>
+ .byte 119,28 // ja c23f <_sk_scale_u8_sse2_lowp+0x53>
.byte 102,15,239,228 // pxor %xmm4,%xmm4
.byte 15,182,201 // movzbl %cl,%ecx
.byte 139,140,143,3,1,0,0 // mov 0x103(%edi,%ecx,4),%ecx
@@ -69144,10 +69116,10 @@ _sk_scale_u8_sse2_lowp:
.byte 255,225 // jmp *%ecx
.byte 15,182,12,51 // movzbl (%ebx,%esi,1),%ecx
.byte 102,15,110,225 // movd %ecx,%xmm4
- .byte 235,90 // jmp c2bd <_sk_scale_u8_sse2_lowp+0xad>
+ .byte 235,90 // jmp c299 <_sk_scale_u8_sse2_lowp+0xad>
.byte 243,15,126,36,51 // movq (%ebx,%esi,1),%xmm4
.byte 102,15,96,224 // punpcklbw %xmm0,%xmm4
- .byte 235,79 // jmp c2bd <_sk_scale_u8_sse2_lowp+0xad>
+ .byte 235,79 // jmp c299 <_sk_scale_u8_sse2_lowp+0xad>
.byte 15,182,76,51,2 // movzbl 0x2(%ebx,%esi,1),%ecx
.byte 102,15,239,228 // pxor %xmm4,%xmm4
.byte 102,15,196,225,2 // pinsrw $0x2,%ecx,%xmm4
@@ -69155,7 +69127,7 @@ _sk_scale_u8_sse2_lowp:
.byte 102,15,110,233 // movd %ecx,%xmm5
.byte 102,15,96,232 // punpcklbw %xmm0,%xmm5
.byte 243,15,16,229 // movss %xmm5,%xmm4
- .byte 235,47 // jmp c2bd <_sk_scale_u8_sse2_lowp+0xad>
+ .byte 235,47 // jmp c299 <_sk_scale_u8_sse2_lowp+0xad>
.byte 15,182,76,51,6 // movzbl 0x6(%ebx,%esi,1),%ecx
.byte 102,15,239,228 // pxor %xmm4,%xmm4
.byte 102,15,196,225,6 // pinsrw $0x6,%ecx,%xmm4
@@ -69166,9 +69138,9 @@ _sk_scale_u8_sse2_lowp:
.byte 102,15,110,44,51 // movd (%ebx,%esi,1),%xmm5
.byte 102,15,96,232 // punpcklbw %xmm0,%xmm5
.byte 242,15,16,229 // movsd %xmm5,%xmm4
- .byte 102,15,219,167,111,17,0,0 // pand 0x116f(%edi),%xmm4
+ .byte 102,15,219,167,115,17,0,0 // pand 0x1173(%edi),%xmm4
.byte 102,15,213,196 // pmullw %xmm4,%xmm0
- .byte 102,15,111,175,111,17,0,0 // movdqa 0x116f(%edi),%xmm5
+ .byte 102,15,111,175,115,17,0,0 // movdqa 0x1173(%edi),%xmm5
.byte 102,15,253,197 // paddw %xmm5,%xmm0
.byte 102,15,113,208,8 // psrlw $0x8,%xmm0
.byte 102,15,213,204 // pmullw %xmm4,%xmm1
@@ -69235,10 +69207,10 @@ _sk_lerp_u8_sse2_lowp:
.byte 128,225,7 // and $0x7,%cl
.byte 254,201 // dec %cl
.byte 128,249,6 // cmp $0x6,%cl
- .byte 232,0,0,0,0 // call c38e <_sk_lerp_u8_sse2_lowp+0x2e>
+ .byte 232,0,0,0,0 // call c36a <_sk_lerp_u8_sse2_lowp+0x2e>
.byte 95 // pop %edi
.byte 139,117,16 // mov 0x10(%ebp),%esi
- .byte 119,28 // ja c3b0 <_sk_lerp_u8_sse2_lowp+0x50>
+ .byte 119,28 // ja c38c <_sk_lerp_u8_sse2_lowp+0x50>
.byte 102,15,239,219 // pxor %xmm3,%xmm3
.byte 15,182,201 // movzbl %cl,%ecx
.byte 139,140,143,74,1,0,0 // mov 0x14a(%edi,%ecx,4),%ecx
@@ -69246,10 +69218,10 @@ _sk_lerp_u8_sse2_lowp:
.byte 255,225 // jmp *%ecx
.byte 15,182,12,51 // movzbl (%ebx,%esi,1),%ecx
.byte 102,15,110,217 // movd %ecx,%xmm3
- .byte 235,90 // jmp c40a <_sk_lerp_u8_sse2_lowp+0xaa>
+ .byte 235,90 // jmp c3e6 <_sk_lerp_u8_sse2_lowp+0xaa>
.byte 243,15,126,28,51 // movq (%ebx,%esi,1),%xmm3
.byte 102,15,96,216 // punpcklbw %xmm0,%xmm3
- .byte 235,79 // jmp c40a <_sk_lerp_u8_sse2_lowp+0xaa>
+ .byte 235,79 // jmp c3e6 <_sk_lerp_u8_sse2_lowp+0xaa>
.byte 15,182,76,51,2 // movzbl 0x2(%ebx,%esi,1),%ecx
.byte 102,15,239,219 // pxor %xmm3,%xmm3
.byte 102,15,196,217,2 // pinsrw $0x2,%ecx,%xmm3
@@ -69257,7 +69229,7 @@ _sk_lerp_u8_sse2_lowp:
.byte 102,15,110,225 // movd %ecx,%xmm4
.byte 102,15,96,224 // punpcklbw %xmm0,%xmm4
.byte 243,15,16,220 // movss %xmm4,%xmm3
- .byte 235,47 // jmp c40a <_sk_lerp_u8_sse2_lowp+0xaa>
+ .byte 235,47 // jmp c3e6 <_sk_lerp_u8_sse2_lowp+0xaa>
.byte 15,182,76,51,6 // movzbl 0x6(%ebx,%esi,1),%ecx
.byte 102,15,239,219 // pxor %xmm3,%xmm3
.byte 102,15,196,217,6 // pinsrw $0x6,%ecx,%xmm3
@@ -69268,8 +69240,8 @@ _sk_lerp_u8_sse2_lowp:
.byte 102,15,110,36,51 // movd (%ebx,%esi,1),%xmm4
.byte 102,15,96,224 // punpcklbw %xmm0,%xmm4
.byte 242,15,16,220 // movsd %xmm4,%xmm3
- .byte 102,15,219,159,34,16,0,0 // pand 0x1022(%edi),%xmm3
- .byte 102,15,111,183,34,16,0,0 // movdqa 0x1022(%edi),%xmm6
+ .byte 102,15,219,159,38,16,0,0 // pand 0x1026(%edi),%xmm3
+ .byte 102,15,111,183,38,16,0,0 // movdqa 0x1026(%edi),%xmm6
.byte 102,15,111,227 // movdqa %xmm3,%xmm4
.byte 102,15,239,230 // pxor %xmm6,%xmm4
.byte 102,15,111,252 // movdqa %xmm4,%xmm7
@@ -69358,10 +69330,10 @@ _sk_scale_565_sse2_lowp:
.byte 128,225,7 // and $0x7,%cl
.byte 254,201 // dec %cl
.byte 128,249,6 // cmp $0x6,%cl
- .byte 232,0,0,0,0 // call c537 <_sk_scale_565_sse2_lowp+0x43>
+ .byte 232,0,0,0,0 // call c513 <_sk_scale_565_sse2_lowp+0x43>
.byte 95 // pop %edi
.byte 139,117,16 // mov 0x10(%ebp),%esi
- .byte 119,28 // ja c559 <_sk_scale_565_sse2_lowp+0x65>
+ .byte 119,28 // ja c535 <_sk_scale_565_sse2_lowp+0x65>
.byte 102,15,239,219 // pxor %xmm3,%xmm3
.byte 15,182,201 // movzbl %cl,%ecx
.byte 139,140,143,249,1,0,0 // mov 0x1f9(%edi,%ecx,4),%ecx
@@ -69369,14 +69341,14 @@ _sk_scale_565_sse2_lowp:
.byte 255,225 // jmp *%ecx
.byte 15,183,12,115 // movzwl (%ebx,%esi,2),%ecx
.byte 102,15,110,217 // movd %ecx,%xmm3
- .byte 235,59 // jmp c594 <_sk_scale_565_sse2_lowp+0xa0>
+ .byte 235,59 // jmp c570 <_sk_scale_565_sse2_lowp+0xa0>
.byte 243,15,111,28,115 // movdqu (%ebx,%esi,2),%xmm3
- .byte 235,52 // jmp c594 <_sk_scale_565_sse2_lowp+0xa0>
+ .byte 235,52 // jmp c570 <_sk_scale_565_sse2_lowp+0xa0>
.byte 102,15,239,219 // pxor %xmm3,%xmm3
.byte 102,15,196,92,115,4,2 // pinsrw $0x2,0x4(%ebx,%esi,2),%xmm3
.byte 243,15,16,12,115 // movss (%ebx,%esi,2),%xmm1
.byte 243,15,16,217 // movss %xmm1,%xmm3
- .byte 235,30 // jmp c594 <_sk_scale_565_sse2_lowp+0xa0>
+ .byte 235,30 // jmp c570 <_sk_scale_565_sse2_lowp+0xa0>
.byte 102,15,239,219 // pxor %xmm3,%xmm3
.byte 102,15,196,92,115,12,6 // pinsrw $0x6,0xc(%ebx,%esi,2),%xmm3
.byte 102,15,196,92,115,10,5 // pinsrw $0x5,0xa(%ebx,%esi,2),%xmm3
@@ -69384,11 +69356,11 @@ _sk_scale_565_sse2_lowp:
.byte 102,15,18,28,115 // movlpd (%ebx,%esi,2),%xmm3
.byte 102,15,111,203 // movdqa %xmm3,%xmm1
.byte 102,15,113,209,8 // psrlw $0x8,%xmm1
- .byte 102,15,219,143,185,14,0,0 // pand 0xeb9(%edi),%xmm1
+ .byte 102,15,219,143,189,14,0,0 // pand 0xebd(%edi),%xmm1
.byte 102,15,111,211 // movdqa %xmm3,%xmm2
.byte 102,15,113,210,5 // psrlw $0x5,%xmm2
- .byte 102,15,219,151,201,14,0,0 // pand 0xec9(%edi),%xmm2
- .byte 102,15,111,135,217,14,0,0 // movdqa 0xed9(%edi),%xmm0
+ .byte 102,15,219,151,205,14,0,0 // pand 0xecd(%edi),%xmm2
+ .byte 102,15,111,135,221,14,0,0 // movdqa 0xedd(%edi),%xmm0
.byte 102,15,219,195 // pand %xmm3,%xmm0
.byte 102,15,113,211,13 // psrlw $0xd,%xmm3
.byte 102,15,235,217 // por %xmm1,%xmm3
@@ -69401,7 +69373,7 @@ _sk_scale_565_sse2_lowp:
.byte 102,15,113,208,2 // psrlw $0x2,%xmm0
.byte 102,15,235,193 // por %xmm1,%xmm0
.byte 102,15,127,69,200 // movdqa %xmm0,-0x38(%ebp)
- .byte 102,15,111,167,153,14,0,0 // movdqa 0xe99(%edi),%xmm4
+ .byte 102,15,111,167,157,14,0,0 // movdqa 0xe9d(%edi),%xmm4
.byte 15,41,117,184 // movaps %xmm6,-0x48(%ebp)
.byte 102,15,239,244 // pxor %xmm4,%xmm6
.byte 102,15,239,252 // pxor %xmm4,%xmm7
@@ -69444,7 +69416,7 @@ _sk_scale_565_sse2_lowp:
.byte 102,15,111,229 // movdqa %xmm5,%xmm4
.byte 102,15,213,101,136 // pmullw -0x78(%ebp),%xmm4
.byte 102,15,213,125,184 // pmullw -0x48(%ebp),%xmm7
- .byte 102,15,111,135,121,14,0,0 // movdqa 0xe79(%edi),%xmm0
+ .byte 102,15,111,135,125,14,0,0 // movdqa 0xe7d(%edi),%xmm0
.byte 102,15,253,216 // paddw %xmm0,%xmm3
.byte 102,15,253,208 // paddw %xmm0,%xmm2
.byte 102,15,253,224 // paddw %xmm0,%xmm4
@@ -69521,10 +69493,10 @@ _sk_lerp_565_sse2_lowp:
.byte 128,225,7 // and $0x7,%cl
.byte 254,201 // dec %cl
.byte 128,249,6 // cmp $0x6,%cl
- .byte 232,0,0,0,0 // call c78f <_sk_lerp_565_sse2_lowp+0x43>
+ .byte 232,0,0,0,0 // call c76b <_sk_lerp_565_sse2_lowp+0x43>
.byte 95 // pop %edi
.byte 139,117,16 // mov 0x10(%ebp),%esi
- .byte 119,28 // ja c7b1 <_sk_lerp_565_sse2_lowp+0x65>
+ .byte 119,28 // ja c78d <_sk_lerp_565_sse2_lowp+0x65>
.byte 102,15,239,219 // pxor %xmm3,%xmm3
.byte 15,182,201 // movzbl %cl,%ecx
.byte 139,140,143,73,2,0,0 // mov 0x249(%edi,%ecx,4),%ecx
@@ -69532,14 +69504,14 @@ _sk_lerp_565_sse2_lowp:
.byte 255,225 // jmp *%ecx
.byte 15,183,12,115 // movzwl (%ebx,%esi,2),%ecx
.byte 102,15,110,217 // movd %ecx,%xmm3
- .byte 235,59 // jmp c7ec <_sk_lerp_565_sse2_lowp+0xa0>
+ .byte 235,59 // jmp c7c8 <_sk_lerp_565_sse2_lowp+0xa0>
.byte 243,15,111,28,115 // movdqu (%ebx,%esi,2),%xmm3
- .byte 235,52 // jmp c7ec <_sk_lerp_565_sse2_lowp+0xa0>
+ .byte 235,52 // jmp c7c8 <_sk_lerp_565_sse2_lowp+0xa0>
.byte 102,15,239,219 // pxor %xmm3,%xmm3
.byte 102,15,196,92,115,4,2 // pinsrw $0x2,0x4(%ebx,%esi,2),%xmm3
.byte 243,15,16,12,115 // movss (%ebx,%esi,2),%xmm1
.byte 243,15,16,217 // movss %xmm1,%xmm3
- .byte 235,30 // jmp c7ec <_sk_lerp_565_sse2_lowp+0xa0>
+ .byte 235,30 // jmp c7c8 <_sk_lerp_565_sse2_lowp+0xa0>
.byte 102,15,239,219 // pxor %xmm3,%xmm3
.byte 102,15,196,92,115,12,6 // pinsrw $0x6,0xc(%ebx,%esi,2),%xmm3
.byte 102,15,196,92,115,10,5 // pinsrw $0x5,0xa(%ebx,%esi,2),%xmm3
@@ -69547,11 +69519,11 @@ _sk_lerp_565_sse2_lowp:
.byte 102,15,18,28,115 // movlpd (%ebx,%esi,2),%xmm3
.byte 102,15,111,203 // movdqa %xmm3,%xmm1
.byte 102,15,113,209,8 // psrlw $0x8,%xmm1
- .byte 102,15,219,143,97,12,0,0 // pand 0xc61(%edi),%xmm1
+ .byte 102,15,219,143,101,12,0,0 // pand 0xc65(%edi),%xmm1
.byte 102,15,111,211 // movdqa %xmm3,%xmm2
.byte 102,15,113,210,5 // psrlw $0x5,%xmm2
- .byte 102,15,219,151,113,12,0,0 // pand 0xc71(%edi),%xmm2
- .byte 102,15,111,175,129,12,0,0 // movdqa 0xc81(%edi),%xmm5
+ .byte 102,15,219,151,117,12,0,0 // pand 0xc75(%edi),%xmm2
+ .byte 102,15,111,175,133,12,0,0 // movdqa 0xc85(%edi),%xmm5
.byte 102,15,219,235 // pand %xmm3,%xmm5
.byte 102,15,113,211,13 // psrlw $0xd,%xmm3
.byte 102,15,235,217 // por %xmm1,%xmm3
@@ -69564,7 +69536,7 @@ _sk_lerp_565_sse2_lowp:
.byte 102,15,113,213,2 // psrlw $0x2,%xmm5
.byte 102,15,235,233 // por %xmm1,%xmm5
.byte 102,15,127,109,216 // movdqa %xmm5,-0x28(%ebp)
- .byte 102,15,111,167,65,12,0,0 // movdqa 0xc41(%edi),%xmm4
+ .byte 102,15,111,167,69,12,0,0 // movdqa 0xc45(%edi),%xmm4
.byte 102,15,111,198 // movdqa %xmm6,%xmm0
.byte 102,15,111,200 // movdqa %xmm0,%xmm1
.byte 102,15,239,204 // pxor %xmm4,%xmm1
@@ -69605,7 +69577,7 @@ _sk_lerp_565_sse2_lowp:
.byte 102,15,235,249 // por %xmm1,%xmm7
.byte 102,15,111,195 // movdqa %xmm3,%xmm0
.byte 102,15,213,93,168 // pmullw -0x58(%ebp),%xmm3
- .byte 102,15,111,143,33,12,0,0 // movdqa 0xc21(%edi),%xmm1
+ .byte 102,15,111,143,37,12,0,0 // movdqa 0xc25(%edi),%xmm1
.byte 102,15,239,193 // pxor %xmm1,%xmm0
.byte 102,15,111,101,24 // movdqa 0x18(%ebp),%xmm4
.byte 102,15,213,196 // pmullw %xmm4,%xmm0
@@ -69701,11 +69673,11 @@ _sk_srcover_rgba_8888_sse2_lowp:
.byte 128,227,7 // and $0x7,%bl
.byte 254,203 // dec %bl
.byte 128,251,6 // cmp $0x6,%bl
- .byte 232,0,0,0,0 // call ca33 <_sk_srcover_rgba_8888_sse2_lowp+0x3f>
+ .byte 232,0,0,0,0 // call ca0f <_sk_srcover_rgba_8888_sse2_lowp+0x3f>
.byte 89 // pop %ecx
.byte 139,117,16 // mov 0x10(%ebp),%esi
.byte 15,182,211 // movzbl %bl,%edx
- .byte 119,29 // ja ca59 <_sk_srcover_rgba_8888_sse2_lowp+0x65>
+ .byte 119,29 // ja ca35 <_sk_srcover_rgba_8888_sse2_lowp+0x65>
.byte 102,15,239,219 // pxor %xmm3,%xmm3
.byte 139,132,145,77,2,0,0 // mov 0x24d(%ecx,%edx,4),%eax
.byte 1,200 // add %ecx,%eax
@@ -69713,14 +69685,14 @@ _sk_srcover_rgba_8888_sse2_lowp:
.byte 255,224 // jmp *%eax
.byte 243,15,16,52,183 // movss (%edi,%esi,4),%xmm6
.byte 15,87,219 // xorps %xmm3,%xmm3
- .byte 235,73 // jmp caa2 <_sk_srcover_rgba_8888_sse2_lowp+0xae>
+ .byte 235,73 // jmp ca7e <_sk_srcover_rgba_8888_sse2_lowp+0xae>
.byte 102,15,16,52,183 // movupd (%edi,%esi,4),%xmm6
.byte 15,16,92,183,16 // movups 0x10(%edi,%esi,4),%xmm3
- .byte 235,61 // jmp caa2 <_sk_srcover_rgba_8888_sse2_lowp+0xae>
+ .byte 235,61 // jmp ca7e <_sk_srcover_rgba_8888_sse2_lowp+0xae>
.byte 102,15,110,68,183,8 // movd 0x8(%edi,%esi,4),%xmm0
.byte 102,15,112,240,69 // pshufd $0x45,%xmm0,%xmm6
.byte 102,15,18,52,183 // movlpd (%edi,%esi,4),%xmm6
- .byte 235,43 // jmp caa2 <_sk_srcover_rgba_8888_sse2_lowp+0xae>
+ .byte 235,43 // jmp ca7e <_sk_srcover_rgba_8888_sse2_lowp+0xae>
.byte 102,15,110,68,183,24 // movd 0x18(%edi,%esi,4),%xmm0
.byte 102,15,112,216,69 // pshufd $0x45,%xmm0,%xmm3
.byte 243,15,16,68,183,20 // movss 0x14(%edi,%esi,4),%xmm0
@@ -69746,7 +69718,7 @@ _sk_srcover_rgba_8888_sse2_lowp:
.byte 102,15,114,243,16 // pslld $0x10,%xmm3
.byte 102,15,114,227,16 // psrad $0x10,%xmm3
.byte 102,15,107,243 // packssdw %xmm3,%xmm6
- .byte 102,15,111,153,125,9,0,0 // movdqa 0x97d(%ecx),%xmm3
+ .byte 102,15,111,153,129,9,0,0 // movdqa 0x981(%ecx),%xmm3
.byte 102,15,114,208,16 // psrld $0x10,%xmm0
.byte 102,15,114,210,16 // psrld $0x10,%xmm2
.byte 102,15,114,242,16 // pslld $0x10,%xmm2
@@ -69798,18 +69770,18 @@ _sk_srcover_rgba_8888_sse2_lowp:
.byte 102,15,105,220 // punpckhwd %xmm4,%xmm3
.byte 102,15,235,222 // por %xmm6,%xmm3
.byte 128,251,6 // cmp $0x6,%bl
- .byte 119,16 // ja cbe3 <_sk_srcover_rgba_8888_sse2_lowp+0x1ef>
+ .byte 119,16 // ja cbbf <_sk_srcover_rgba_8888_sse2_lowp+0x1ef>
.byte 3,140,145,105,2,0,0 // add 0x269(%ecx,%edx,4),%ecx
.byte 255,225 // jmp *%ecx
.byte 102,15,126,4,183 // movd %xmm0,(%edi,%esi,4)
- .byte 235,64 // jmp cc23 <_sk_srcover_rgba_8888_sse2_lowp+0x22f>
+ .byte 235,64 // jmp cbff <_sk_srcover_rgba_8888_sse2_lowp+0x22f>
.byte 243,15,127,4,183 // movdqu %xmm0,(%edi,%esi,4)
.byte 243,15,127,92,183,16 // movdqu %xmm3,0x10(%edi,%esi,4)
- .byte 235,51 // jmp cc23 <_sk_srcover_rgba_8888_sse2_lowp+0x22f>
+ .byte 235,51 // jmp cbff <_sk_srcover_rgba_8888_sse2_lowp+0x22f>
.byte 102,15,112,208,78 // pshufd $0x4e,%xmm0,%xmm2
.byte 102,15,126,84,183,8 // movd %xmm2,0x8(%edi,%esi,4)
.byte 102,15,214,4,183 // movq %xmm0,(%edi,%esi,4)
- .byte 235,33 // jmp cc23 <_sk_srcover_rgba_8888_sse2_lowp+0x22f>
+ .byte 235,33 // jmp cbff <_sk_srcover_rgba_8888_sse2_lowp+0x22f>
.byte 102,15,112,211,78 // pshufd $0x4e,%xmm3,%xmm2
.byte 102,15,126,84,183,24 // movd %xmm2,0x18(%edi,%esi,4)
.byte 102,15,112,211,229 // pshufd $0xe5,%xmm3,%xmm2
@@ -69938,11 +69910,11 @@ BALIGN16
.byte 0,128,191,0,0,128 // add %al,-0x7fffff41(%eax)
.byte 191,0,0,224,64 // mov $0x40e00000,%edi
.byte 0,0 // add %al,(%eax)
- .byte 224,64 // loopne cda8 <.literal16+0xe8>
+ .byte 224,64 // loopne cd88 <.literal16+0xe8>
.byte 0,0 // add %al,(%eax)
- .byte 224,64 // loopne cdac <.literal16+0xec>
+ .byte 224,64 // loopne cd8c <.literal16+0xec>
.byte 0,0 // add %al,(%eax)
- .byte 224,64 // loopne cdb0 <.literal16+0xf0>
+ .byte 224,64 // loopne cd90 <.literal16+0xf0>
.byte 154,153,153,62,154,153,153 // lcall $0x9999,$0x9a3e9999
.byte 62,154,153,153,62,154,153,153 // ds lcall $0x9999,$0x9a3e9999
.byte 62,61,10,23,63,61 // ds cmp $0x3d3f170a,%eax
@@ -69953,16 +69925,16 @@ BALIGN16
.byte 63 // aas
.byte 174 // scas %es:(%edi),%al
.byte 71 // inc %edi
- .byte 225,61 // loope cdd1 <.literal16+0x111>
+ .byte 225,61 // loope cdb1 <.literal16+0x111>
.byte 174 // scas %es:(%edi),%al
.byte 71 // inc %edi
- .byte 225,61 // loope cdd5 <.literal16+0x115>
+ .byte 225,61 // loope cdb5 <.literal16+0x115>
.byte 174 // scas %es:(%edi),%al
.byte 71 // inc %edi
- .byte 225,61 // loope cdd9 <.literal16+0x119>
+ .byte 225,61 // loope cdb9 <.literal16+0x119>
.byte 174 // scas %es:(%edi),%al
.byte 71 // inc %edi
- .byte 225,61 // loope cddd <.literal16+0x11d>
+ .byte 225,61 // loope cdbd <.literal16+0x11d>
.byte 255,0 // incl (%eax)
.byte 0,0 // add %al,(%eax)
.byte 255,0 // incl (%eax)
@@ -69972,13 +69944,13 @@ BALIGN16
.byte 255,0 // incl (%eax)
.byte 0,0 // add %al,(%eax)
.byte 0,0 // add %al,(%eax)
- .byte 127,67 // jg cdf7 <.literal16+0x137>
+ .byte 127,67 // jg cdd7 <.literal16+0x137>
.byte 0,0 // add %al,(%eax)
- .byte 127,67 // jg cdfb <.literal16+0x13b>
+ .byte 127,67 // jg cddb <.literal16+0x13b>
.byte 0,0 // add %al,(%eax)
- .byte 127,67 // jg cdff <.literal16+0x13f>
+ .byte 127,67 // jg cddf <.literal16+0x13f>
.byte 0,0 // add %al,(%eax)
- .byte 127,67 // jg ce03 <.literal16+0x143>
+ .byte 127,67 // jg cde3 <.literal16+0x143>
.byte 145 // xchg %eax,%ecx
.byte 131,158,61,145,131,158,61 // sbbl $0x3d,-0x617c6ec3(%esi)
.byte 145 // xchg %eax,%ecx
@@ -70129,13 +70101,13 @@ BALIGN16
.byte 132,55 // test %dh,(%edi)
.byte 8,33 // or %ah,(%ecx)
.byte 132,55 // test %dh,(%edi)
- .byte 224,7 // loopne cf09 <.literal16+0x249>
+ .byte 224,7 // loopne cee9 <.literal16+0x249>
.byte 0,0 // add %al,(%eax)
- .byte 224,7 // loopne cf0d <.literal16+0x24d>
+ .byte 224,7 // loopne ceed <.literal16+0x24d>
.byte 0,0 // add %al,(%eax)
- .byte 224,7 // loopne cf11 <.literal16+0x251>
+ .byte 224,7 // loopne cef1 <.literal16+0x251>
.byte 0,0 // add %al,(%eax)
- .byte 224,7 // loopne cf15 <.literal16+0x255>
+ .byte 224,7 // loopne cef5 <.literal16+0x255>
.byte 0,0 // add %al,(%eax)
.byte 33,8 // and %ecx,(%eax)
.byte 2,58 // add (%edx),%bh
@@ -70184,17 +70156,17 @@ BALIGN16
.byte 0,0 // add %al,(%eax)
.byte 52,255 // xor $0xff,%al
.byte 255 // (bad)
- .byte 127,0 // jg cf74 <.literal16+0x2b4>
+ .byte 127,0 // jg cf54 <.literal16+0x2b4>
.byte 255 // (bad)
.byte 255 // (bad)
- .byte 127,0 // jg cf78 <.literal16+0x2b8>
+ .byte 127,0 // jg cf58 <.literal16+0x2b8>
.byte 255 // (bad)
.byte 255 // (bad)
- .byte 127,0 // jg cf7c <.literal16+0x2bc>
+ .byte 127,0 // jg cf5c <.literal16+0x2bc>
.byte 255 // (bad)
.byte 255 // (bad)
- .byte 127,0 // jg cf80 <.literal16+0x2c0>
- .byte 119,115 // ja cff5 <.literal16+0x335>
+ .byte 127,0 // jg cf60 <.literal16+0x2c0>
+ .byte 119,115 // ja cfd5 <.literal16+0x335>
.byte 248 // clc
.byte 194,119,115 // ret $0x7377
.byte 248 // clc
@@ -70205,7 +70177,7 @@ BALIGN16
.byte 194,117,191 // ret $0xbf75
.byte 191,63,117,191,191 // mov $0xbfbf753f,%edi
.byte 63 // aas
- .byte 117,191 // jne cf59 <.literal16+0x299>
+ .byte 117,191 // jne cf39 <.literal16+0x299>
.byte 191,63,117,191,191 // mov $0xbfbf753f,%edi
.byte 63 // aas
.byte 249 // stc
@@ -70221,7 +70193,7 @@ BALIGN16
.byte 68 // inc %esp
.byte 180,62 // mov $0x3e,%ah
.byte 163,233,220,63,163 // mov %eax,0xa33fdce9
- .byte 233,220,63,163,233 // jmp e9a40f96 <_sk_srcover_rgba_8888_sse2_lowp+0xe9a345a2>
+ .byte 233,220,63,163,233 // jmp e9a40f76 <_sk_srcover_rgba_8888_sse2_lowp+0xe9a345a6>
.byte 220,63 // fdivrl (%edi)
.byte 163,233,220,63,81 // mov %eax,0x513fdce9
.byte 140,242 // mov %?,%edx
@@ -70317,16 +70289,16 @@ BALIGN16
.byte 128,3,62 // addb $0x3e,(%ebx)
.byte 31 // pop %ds
.byte 215 // xlat %ds:(%ebx)
- .byte 118,63 // jbe d0e3 <.literal16+0x423>
+ .byte 118,63 // jbe d0c3 <.literal16+0x423>
.byte 31 // pop %ds
.byte 215 // xlat %ds:(%ebx)
- .byte 118,63 // jbe d0e7 <.literal16+0x427>
+ .byte 118,63 // jbe d0c7 <.literal16+0x427>
.byte 31 // pop %ds
.byte 215 // xlat %ds:(%ebx)
- .byte 118,63 // jbe d0eb <.literal16+0x42b>
+ .byte 118,63 // jbe d0cb <.literal16+0x42b>
.byte 31 // pop %ds
.byte 215 // xlat %ds:(%ebx)
- .byte 118,63 // jbe d0ef <.literal16+0x42f>
+ .byte 118,63 // jbe d0cf <.literal16+0x42f>
.byte 246,64,83,63 // testb $0x3f,0x53(%eax)
.byte 246,64,83,63 // testb $0x3f,0x53(%eax)
.byte 246,64,83,63 // testb $0x3f,0x53(%eax)
@@ -70352,13 +70324,13 @@ BALIGN16
.byte 248 // clc
.byte 65 // inc %ecx
.byte 0,0 // add %al,(%eax)
- .byte 124,66 // jl d126 <.literal16+0x466>
+ .byte 124,66 // jl d106 <.literal16+0x466>
.byte 0,0 // add %al,(%eax)
- .byte 124,66 // jl d12a <.literal16+0x46a>
+ .byte 124,66 // jl d10a <.literal16+0x46a>
.byte 0,0 // add %al,(%eax)
- .byte 124,66 // jl d12e <.literal16+0x46e>
+ .byte 124,66 // jl d10e <.literal16+0x46e>
.byte 0,0 // add %al,(%eax)
- .byte 124,66 // jl d132 <.literal16+0x472>
+ .byte 124,66 // jl d112 <.literal16+0x472>
.byte 0,240 // add %dh,%al
.byte 0,0 // add %al,(%eax)
.byte 0,240 // add %dh,%al
@@ -70404,25 +70376,25 @@ BALIGN16
.byte 136,136,61,137,136,136 // mov %cl,-0x777776c3(%eax)
.byte 61,137,136,136,61 // cmp $0x3d888889,%eax
.byte 0,0 // add %al,(%eax)
- .byte 112,65 // jo d1b5 <.literal16+0x4f5>
+ .byte 112,65 // jo d195 <.literal16+0x4f5>
.byte 0,0 // add %al,(%eax)
- .byte 112,65 // jo d1b9 <.literal16+0x4f9>
+ .byte 112,65 // jo d199 <.literal16+0x4f9>
.byte 0,0 // add %al,(%eax)
- .byte 112,65 // jo d1bd <.literal16+0x4fd>
+ .byte 112,65 // jo d19d <.literal16+0x4fd>
.byte 0,0 // add %al,(%eax)
- .byte 112,65 // jo d1c1 <.literal16+0x501>
+ .byte 112,65 // jo d1a1 <.literal16+0x501>
.byte 0,128,0,0,0,128 // add %al,-0x80000000(%eax)
.byte 0,0 // add %al,(%eax)
.byte 0,128,0,0,0,128 // add %al,-0x80000000(%eax)
.byte 0,0 // add %al,(%eax)
.byte 255 // (bad)
- .byte 127,0 // jg d193 <.literal16+0x4d3>
+ .byte 127,0 // jg d173 <.literal16+0x4d3>
.byte 0,255 // add %bh,%bh
- .byte 127,0 // jg d197 <.literal16+0x4d7>
+ .byte 127,0 // jg d177 <.literal16+0x4d7>
.byte 0,255 // add %bh,%bh
- .byte 127,0 // jg d19b <.literal16+0x4db>
+ .byte 127,0 // jg d17b <.literal16+0x4db>
.byte 0,255 // add %bh,%bh
- .byte 127,0 // jg d19f <.literal16+0x4df>
+ .byte 127,0 // jg d17f <.literal16+0x4df>
.byte 0,0 // add %al,(%eax)
.byte 4,0 // add $0x0,%al
.byte 0,0 // add %al,(%eax)
@@ -70448,13 +70420,13 @@ BALIGN16
.byte 255 // (bad)
.byte 255 // (bad)
.byte 255 // (bad)
- .byte 127,255 // jg d1d8 <.literal16+0x518>
+ .byte 127,255 // jg d1b8 <.literal16+0x518>
.byte 255 // (bad)
.byte 255 // (bad)
- .byte 127,255 // jg d1dc <.literal16+0x51c>
+ .byte 127,255 // jg d1bc <.literal16+0x51c>
.byte 255 // (bad)
.byte 255 // (bad)
- .byte 127,0 // jg d1e1 <.literal16+0x521>
+ .byte 127,0 // jg d1c1 <.literal16+0x521>
.byte 0,128,56,0,0,128 // add %al,-0x7fffffc8(%eax)
.byte 56,0 // cmp %al,(%eax)
.byte 0,128,56,0,0,128 // add %al,-0x7fffffc8(%eax)
@@ -70468,13 +70440,13 @@ BALIGN16
.byte 0,255 // add %bh,%bh
.byte 255,0 // incl (%eax)
.byte 255 // (bad)
- .byte 127,71 // jg d24b <.literal16+0x58b>
+ .byte 127,71 // jg d22b <.literal16+0x58b>
.byte 0,255 // add %bh,%bh
- .byte 127,71 // jg d24f <.literal16+0x58f>
+ .byte 127,71 // jg d22f <.literal16+0x58f>
.byte 0,255 // add %bh,%bh
- .byte 127,71 // jg d253 <.literal16+0x593>
+ .byte 127,71 // jg d233 <.literal16+0x593>
.byte 0,255 // add %bh,%bh
- .byte 127,71 // jg d257 <.literal16+0x597>
+ .byte 127,71 // jg d237 <.literal16+0x597>
.byte 208 // (bad)
.byte 179,89 // mov $0x59,%bl
.byte 62,208 // ds (bad)
@@ -70527,7 +70499,7 @@ BALIGN16
.byte 192,45,16,17,192,45,16 // shrb $0x10,0x2dc01110
.byte 17,192 // adc %eax,%eax
.byte 45,16,17,192,18 // sub $0x12c01110,%eax
- .byte 120,57 // js d2bc <.literal16+0x5fc>
+ .byte 120,57 // js d29c <.literal16+0x5fc>
.byte 64 // inc %eax
.byte 18,120,57 // adc 0x39(%eax),%bh
.byte 64 // inc %eax
@@ -70598,13 +70570,13 @@ BALIGN16
.byte 192,191,0,0,192,191,0 // sarb $0x0,-0x40400000(%edi)
.byte 0,192 // add %al,%al
.byte 191,0,0,192,191 // mov $0xbfc00000,%edi
- .byte 114,28 // jb d36e <.literal16+0x6ae>
+ .byte 114,28 // jb d34e <.literal16+0x6ae>
.byte 199 // (bad)
- .byte 62,114,28 // jb,pt d372 <.literal16+0x6b2>
+ .byte 62,114,28 // jb,pt d352 <.literal16+0x6b2>
.byte 199 // (bad)
- .byte 62,114,28 // jb,pt d376 <.literal16+0x6b6>
+ .byte 62,114,28 // jb,pt d356 <.literal16+0x6b6>
.byte 199 // (bad)
- .byte 62,114,28 // jb,pt d37a <.literal16+0x6ba>
+ .byte 62,114,28 // jb,pt d35a <.literal16+0x6ba>
.byte 199 // (bad)
.byte 62,85 // ds push %ebp
.byte 85 // push %ebp
@@ -70625,13 +70597,13 @@ BALIGN16
.byte 57,142,99,61,57,142 // cmp %ecx,-0x71c6c29d(%esi)
.byte 99,61,57,142,99,61 // arpl %di,0x3d638e39
.byte 57,142,99,61,114,249 // cmp %ecx,-0x68dc29d(%esi)
- .byte 127,63 // jg d3d3 <.literal16+0x713>
- .byte 114,249 // jb d38f <.literal16+0x6cf>
- .byte 127,63 // jg d3d7 <.literal16+0x717>
- .byte 114,249 // jb d393 <.literal16+0x6d3>
- .byte 127,63 // jg d3db <.literal16+0x71b>
- .byte 114,249 // jb d397 <.literal16+0x6d7>
- .byte 127,63 // jg d3df <.literal16+0x71f>
+ .byte 127,63 // jg d3b3 <.literal16+0x713>
+ .byte 114,249 // jb d36f <.literal16+0x6cf>
+ .byte 127,63 // jg d3b7 <.literal16+0x717>
+ .byte 114,249 // jb d373 <.literal16+0x6d3>
+ .byte 127,63 // jg d3bb <.literal16+0x71b>
+ .byte 114,249 // jb d377 <.literal16+0x6d7>
+ .byte 127,63 // jg d3bf <.literal16+0x71f>
.byte 3,0 // add (%eax),%eax
.byte 0,0 // add %al,(%eax)
.byte 3,0 // add (%eax),%eax
@@ -70699,14 +70671,14 @@ BALIGN16
.byte 0,248 // add %bh,%al
.byte 0,248 // add %bh,%al
.byte 0,248 // add %bh,%al
- .byte 224,255 // loopne d431 <.literal16+0x771>
- .byte 224,255 // loopne d433 <.literal16+0x773>
- .byte 224,255 // loopne d435 <.literal16+0x775>
- .byte 224,255 // loopne d437 <.literal16+0x777>
- .byte 224,255 // loopne d439 <.literal16+0x779>
- .byte 224,255 // loopne d43b <.literal16+0x77b>
- .byte 224,255 // loopne d43d <.literal16+0x77d>
- .byte 224,255 // loopne d43f <.literal16+0x77f>
+ .byte 224,255 // loopne d411 <.literal16+0x771>
+ .byte 224,255 // loopne d413 <.literal16+0x773>
+ .byte 224,255 // loopne d415 <.literal16+0x775>
+ .byte 224,255 // loopne d417 <.literal16+0x777>
+ .byte 224,255 // loopne d419 <.literal16+0x779>
+ .byte 224,255 // loopne d41b <.literal16+0x77b>
+ .byte 224,255 // loopne d41d <.literal16+0x77d>
+ .byte 224,255 // loopne d41f <.literal16+0x77f>
.byte 54,0,54 // add %dh,%ss:(%esi)
.byte 0,54 // add %dh,(%esi)
.byte 0,54 // add %dh,(%esi)
@@ -70730,5 +70702,5 @@ BALIGN4
.byte 0,0 // add %al,(%eax)
.byte 0,63 // add %bh,(%edi)
.byte 0,0 // add %al,(%eax)
- .byte 127,67 // jg d4bb <_sk_srcover_rgba_8888_sse2_lowp+0xac7>
+ .byte 127,67 // jg d49b <_sk_srcover_rgba_8888_sse2_lowp+0xacb>
#endif
diff --git a/src/jumper/SkJumper_generated_win.S b/src/jumper/SkJumper_generated_win.S
index fe43ec82ae..5dc6f3a640 100644
--- a/src/jumper/SkJumper_generated_win.S
+++ b/src/jumper/SkJumper_generated_win.S
@@ -43575,11 +43575,11 @@ _sk_seed_shader_sse2 LABEL PROC
DB 102,15,110,2 ; movd (%edx),%xmm0
DB 102,15,112,192,0 ; pshufd $0x0,%xmm0,%xmm0
DB 15,91,192 ; cvtdq2ps %xmm0,%xmm0
- DB 15,88,128,247,203,0,0 ; addps 0xcbf7(%eax),%xmm0
+ DB 15,88,128,215,203,0,0 ; addps 0xcbd7(%eax),%xmm0
DB 102,15,110,74,4 ; movd 0x4(%edx),%xmm1
DB 102,15,112,201,0 ; pshufd $0x0,%xmm1,%xmm1
DB 15,91,201 ; cvtdq2ps %xmm1,%xmm1
- DB 15,88,136,7,204,0,0 ; addps 0xcc07(%eax),%xmm1
+ DB 15,88,136,231,203,0,0 ; addps 0xcbe7(%eax),%xmm1
DB 141,113,4 ; lea 0x4(%ecx),%esi
DB 15,87,210 ; xorps %xmm2,%xmm2
DB 15,41,82,64 ; movaps %xmm2,0x40(%edx)
@@ -43587,7 +43587,7 @@ _sk_seed_shader_sse2 LABEL PROC
DB 15,41,82,32 ; movaps %xmm2,0x20(%edx)
DB 15,41,82,16 ; movaps %xmm2,0x10(%edx)
DB 131,236,8 ; sub $0x8,%esp
- DB 15,40,144,23,204,0,0 ; movaps 0xcc17(%eax),%xmm2
+ DB 15,40,144,247,203,0,0 ; movaps 0xcbf7(%eax),%xmm2
DB 15,87,219 ; xorps %xmm3,%xmm3
DB 86 ; push %esi
DB 82 ; push %edx
@@ -43612,15 +43612,15 @@ _sk_dither_sse2 LABEL PROC
DB 139,69,8 ; mov 0x8(%ebp),%eax
DB 102,15,110,32 ; movd (%eax),%xmm4
DB 102,15,112,228,0 ; pshufd $0x0,%xmm4,%xmm4
- DB 102,15,254,161,178,203,0,0 ; paddd 0xcbb2(%ecx),%xmm4
+ DB 102,15,254,161,146,203,0,0 ; paddd 0xcb92(%ecx),%xmm4
DB 102,15,110,104,4 ; movd 0x4(%eax),%xmm5
DB 102,15,112,253,0 ; pshufd $0x0,%xmm5,%xmm7
DB 102,15,239,252 ; pxor %xmm4,%xmm7
- DB 102,15,111,177,194,203,0,0 ; movdqa 0xcbc2(%ecx),%xmm6
+ DB 102,15,111,177,162,203,0,0 ; movdqa 0xcba2(%ecx),%xmm6
DB 102,15,111,207 ; movdqa %xmm7,%xmm1
DB 102,15,219,206 ; pand %xmm6,%xmm1
DB 102,15,114,241,5 ; pslld $0x5,%xmm1
- DB 102,15,111,129,226,203,0,0 ; movdqa 0xcbe2(%ecx),%xmm0
+ DB 102,15,111,129,194,203,0,0 ; movdqa 0xcbc2(%ecx),%xmm0
DB 102,15,111,239 ; movdqa %xmm7,%xmm5
DB 102,15,219,232 ; pand %xmm0,%xmm5
DB 102,15,114,245,2 ; pslld $0x2,%xmm5
@@ -43630,7 +43630,7 @@ _sk_dither_sse2 LABEL PROC
DB 102,15,219,196 ; pand %xmm4,%xmm0
DB 102,15,254,192 ; paddd %xmm0,%xmm0
DB 102,15,235,198 ; por %xmm6,%xmm0
- DB 102,15,111,137,210,203,0,0 ; movdqa 0xcbd2(%ecx),%xmm1
+ DB 102,15,111,137,178,203,0,0 ; movdqa 0xcbb2(%ecx),%xmm1
DB 102,15,219,249 ; pand %xmm1,%xmm7
DB 102,15,219,225 ; pand %xmm1,%xmm4
DB 102,15,114,212,2 ; psrld $0x2,%xmm4
@@ -43641,8 +43641,8 @@ _sk_dither_sse2 LABEL PROC
DB 102,15,114,215,1 ; psrld $0x1,%xmm7
DB 102,15,235,231 ; por %xmm7,%xmm4
DB 15,91,196 ; cvtdq2ps %xmm4,%xmm0
- DB 15,89,129,242,203,0,0 ; mulps 0xcbf2(%ecx),%xmm0
- DB 15,88,129,2,204,0,0 ; addps 0xcc02(%ecx),%xmm0
+ DB 15,89,129,210,203,0,0 ; mulps 0xcbd2(%ecx),%xmm0
+ DB 15,88,129,226,203,0,0 ; addps 0xcbe2(%ecx),%xmm0
DB 243,15,16,14 ; movss (%esi),%xmm1
DB 15,198,201,0 ; shufps $0x0,%xmm1,%xmm1
DB 15,89,200 ; mulps %xmm0,%xmm1
@@ -43706,7 +43706,7 @@ _sk_black_color_sse2 LABEL PROC
DB 139,77,12 ; mov 0xc(%ebp),%ecx
DB 141,81,4 ; lea 0x4(%ecx),%edx
DB 131,236,8 ; sub $0x8,%esp
- DB 15,40,152,102,202,0,0 ; movaps 0xca66(%eax),%xmm3
+ DB 15,40,152,70,202,0,0 ; movaps 0xca46(%eax),%xmm3
DB 15,87,192 ; xorps %xmm0,%xmm0
DB 15,87,201 ; xorps %xmm1,%xmm1
DB 15,87,210 ; xorps %xmm2,%xmm2
@@ -43727,7 +43727,7 @@ _sk_white_color_sse2 LABEL PROC
DB 139,77,12 ; mov 0xc(%ebp),%ecx
DB 141,81,4 ; lea 0x4(%ecx),%edx
DB 131,236,8 ; sub $0x8,%esp
- DB 15,40,128,54,202,0,0 ; movaps 0xca36(%eax),%xmm0
+ DB 15,40,128,22,202,0,0 ; movaps 0xca16(%eax),%xmm0
DB 15,40,200 ; movaps %xmm0,%xmm1
DB 15,40,208 ; movaps %xmm0,%xmm2
DB 15,40,216 ; movaps %xmm0,%xmm3
@@ -43809,7 +43809,7 @@ _sk_srcatop_sse2 LABEL PROC
DB 139,77,8 ; mov 0x8(%ebp),%ecx
DB 15,40,97,64 ; movaps 0x40(%ecx),%xmm4
DB 15,89,196 ; mulps %xmm4,%xmm0
- DB 15,40,170,135,201,0,0 ; movaps 0xc987(%edx),%xmm5
+ DB 15,40,170,103,201,0,0 ; movaps 0xc967(%edx),%xmm5
DB 15,92,235 ; subps %xmm3,%xmm5
DB 15,40,113,16 ; movaps 0x10(%ecx),%xmm6
DB 15,89,245 ; mulps %xmm5,%xmm6
@@ -43846,7 +43846,7 @@ _sk_dstatop_sse2 LABEL PROC
DB 15,40,105,64 ; movaps 0x40(%ecx),%xmm5
DB 15,40,113,16 ; movaps 0x10(%ecx),%xmm6
DB 15,89,243 ; mulps %xmm3,%xmm6
- DB 15,40,162,40,201,0,0 ; movaps 0xc928(%edx),%xmm4
+ DB 15,40,162,8,201,0,0 ; movaps 0xc908(%edx),%xmm4
DB 15,92,229 ; subps %xmm5,%xmm4
DB 15,89,196 ; mulps %xmm4,%xmm0
DB 15,88,198 ; addps %xmm6,%xmm0
@@ -43924,7 +43924,7 @@ _sk_srcout_sse2 LABEL PROC
DB 88 ; pop %eax
DB 139,77,12 ; mov 0xc(%ebp),%ecx
DB 139,85,8 ; mov 0x8(%ebp),%edx
- DB 15,40,160,103,200,0,0 ; movaps 0xc867(%eax),%xmm4
+ DB 15,40,160,71,200,0,0 ; movaps 0xc847(%eax),%xmm4
DB 15,92,98,64 ; subps 0x40(%edx),%xmm4
DB 15,89,196 ; mulps %xmm4,%xmm0
DB 15,89,204 ; mulps %xmm4,%xmm1
@@ -43948,7 +43948,7 @@ _sk_dstout_sse2 LABEL PROC
DB 88 ; pop %eax
DB 139,77,12 ; mov 0xc(%ebp),%ecx
DB 139,85,8 ; mov 0x8(%ebp),%edx
- DB 15,40,160,47,200,0,0 ; movaps 0xc82f(%eax),%xmm4
+ DB 15,40,160,15,200,0,0 ; movaps 0xc80f(%eax),%xmm4
DB 15,92,227 ; subps %xmm3,%xmm4
DB 15,40,66,16 ; movaps 0x10(%edx),%xmm0
DB 15,89,196 ; mulps %xmm4,%xmm0
@@ -43976,7 +43976,7 @@ _sk_srcover_sse2 LABEL PROC
DB 88 ; pop %eax
DB 139,77,12 ; mov 0xc(%ebp),%ecx
DB 139,85,8 ; mov 0x8(%ebp),%edx
- DB 15,40,160,232,199,0,0 ; movaps 0xc7e8(%eax),%xmm4
+ DB 15,40,160,200,199,0,0 ; movaps 0xc7c8(%eax),%xmm4
DB 15,92,227 ; subps %xmm3,%xmm4
DB 15,40,106,16 ; movaps 0x10(%edx),%xmm5
DB 15,89,236 ; mulps %xmm4,%xmm5
@@ -44008,7 +44008,7 @@ _sk_dstover_sse2 LABEL PROC
DB 139,77,12 ; mov 0xc(%ebp),%ecx
DB 139,85,8 ; mov 0x8(%ebp),%edx
DB 15,40,106,64 ; movaps 0x40(%edx),%xmm5
- DB 15,40,160,152,199,0,0 ; movaps 0xc798(%eax),%xmm4
+ DB 15,40,160,120,199,0,0 ; movaps 0xc778(%eax),%xmm4
DB 15,92,229 ; subps %xmm5,%xmm4
DB 15,89,196 ; mulps %xmm4,%xmm0
DB 15,88,66,16 ; addps 0x10(%edx),%xmm0
@@ -44060,7 +44060,7 @@ _sk_multiply_sse2 LABEL PROC
DB 139,69,8 ; mov 0x8(%ebp),%eax
DB 15,40,80,64 ; movaps 0x40(%eax),%xmm2
DB 15,41,85,200 ; movaps %xmm2,-0x38(%ebp)
- DB 15,40,129,25,199,0,0 ; movaps 0xc719(%ecx),%xmm0
+ DB 15,40,129,249,198,0,0 ; movaps 0xc6f9(%ecx),%xmm0
DB 15,40,240 ; movaps %xmm0,%xmm6
DB 15,92,242 ; subps %xmm2,%xmm6
DB 15,40,254 ; movaps %xmm6,%xmm7
@@ -44118,7 +44118,7 @@ _sk_plus__sse2 LABEL PROC
DB 139,77,12 ; mov 0xc(%ebp),%ecx
DB 139,85,8 ; mov 0x8(%ebp),%edx
DB 15,88,66,16 ; addps 0x10(%edx),%xmm0
- DB 15,40,160,115,198,0,0 ; movaps 0xc673(%eax),%xmm4
+ DB 15,40,160,83,198,0,0 ; movaps 0xc653(%eax),%xmm4
DB 15,93,196 ; minps %xmm4,%xmm0
DB 15,88,74,32 ; addps 0x20(%edx),%xmm1
DB 15,93,204 ; minps %xmm4,%xmm1
@@ -44186,7 +44186,7 @@ _sk_xor__sse2 LABEL PROC
DB 139,69,12 ; mov 0xc(%ebp),%eax
DB 139,77,8 ; mov 0x8(%ebp),%ecx
DB 15,40,105,64 ; movaps 0x40(%ecx),%xmm5
- DB 15,40,154,197,197,0,0 ; movaps 0xc5c5(%edx),%xmm3
+ DB 15,40,154,165,197,0,0 ; movaps 0xc5a5(%edx),%xmm3
DB 15,40,243 ; movaps %xmm3,%xmm6
DB 15,92,245 ; subps %xmm5,%xmm6
DB 15,89,198 ; mulps %xmm6,%xmm0
@@ -44246,7 +44246,7 @@ _sk_darken_sse2 LABEL PROC
DB 15,89,203 ; mulps %xmm3,%xmm1
DB 15,95,209 ; maxps %xmm1,%xmm2
DB 15,92,234 ; subps %xmm2,%xmm5
- DB 15,40,138,93,197,0,0 ; movaps 0xc55d(%edx),%xmm1
+ DB 15,40,138,61,197,0,0 ; movaps 0xc53d(%edx),%xmm1
DB 15,92,203 ; subps %xmm3,%xmm1
DB 15,89,206 ; mulps %xmm6,%xmm1
DB 15,88,217 ; addps %xmm1,%xmm3
@@ -44293,7 +44293,7 @@ _sk_lighten_sse2 LABEL PROC
DB 15,89,203 ; mulps %xmm3,%xmm1
DB 15,93,209 ; minps %xmm1,%xmm2
DB 15,92,234 ; subps %xmm2,%xmm5
- DB 15,40,138,221,196,0,0 ; movaps 0xc4dd(%edx),%xmm1
+ DB 15,40,138,189,196,0,0 ; movaps 0xc4bd(%edx),%xmm1
DB 15,92,203 ; subps %xmm3,%xmm1
DB 15,89,206 ; mulps %xmm6,%xmm1
DB 15,88,217 ; addps %xmm1,%xmm3
@@ -44344,7 +44344,7 @@ _sk_difference_sse2 LABEL PROC
DB 15,93,214 ; minps %xmm6,%xmm2
DB 15,88,210 ; addps %xmm2,%xmm2
DB 15,92,226 ; subps %xmm2,%xmm4
- DB 15,40,146,90,196,0,0 ; movaps 0xc45a(%edx),%xmm2
+ DB 15,40,146,58,196,0,0 ; movaps 0xc43a(%edx),%xmm2
DB 15,92,211 ; subps %xmm3,%xmm2
DB 15,89,213 ; mulps %xmm5,%xmm2
DB 15,88,218 ; addps %xmm2,%xmm3
@@ -44386,7 +44386,7 @@ _sk_exclusion_sse2 LABEL PROC
DB 15,89,202 ; mulps %xmm2,%xmm1
DB 15,88,201 ; addps %xmm1,%xmm1
DB 15,92,233 ; subps %xmm1,%xmm5
- DB 15,40,138,212,195,0,0 ; movaps 0xc3d4(%edx),%xmm1
+ DB 15,40,138,180,195,0,0 ; movaps 0xc3b4(%edx),%xmm1
DB 15,92,203 ; subps %xmm3,%xmm1
DB 15,89,73,64 ; mulps 0x40(%ecx),%xmm1
DB 15,88,217 ; addps %xmm1,%xmm3
@@ -44425,7 +44425,7 @@ _sk_colorburn_sse2 LABEL PROC
DB 15,93,198 ; minps %xmm6,%xmm0
DB 15,40,233 ; movaps %xmm1,%xmm5
DB 15,92,232 ; subps %xmm0,%xmm5
- DB 15,40,177,85,195,0,0 ; movaps 0xc355(%ecx),%xmm6
+ DB 15,40,177,53,195,0,0 ; movaps 0xc335(%ecx),%xmm6
DB 15,40,198 ; movaps %xmm6,%xmm0
DB 15,92,193 ; subps %xmm1,%xmm0
DB 15,41,69,200 ; movaps %xmm0,-0x38(%ebp)
@@ -44540,7 +44540,7 @@ _sk_colordodge_sse2 LABEL PROC
DB 89 ; pop %ecx
DB 139,69,8 ; mov 0x8(%ebp),%eax
DB 15,40,72,16 ; movaps 0x10(%eax),%xmm1
- DB 15,40,145,204,193,0,0 ; movaps 0xc1cc(%ecx),%xmm2
+ DB 15,40,145,172,193,0,0 ; movaps 0xc1ac(%ecx),%xmm2
DB 15,40,226 ; movaps %xmm2,%xmm4
DB 15,92,214 ; subps %xmm6,%xmm2
DB 15,40,250 ; movaps %xmm2,%xmm7
@@ -44655,7 +44655,7 @@ _sk_hardlight_sse2 LABEL PROC
DB 89 ; pop %ecx
DB 139,69,8 ; mov 0x8(%ebp),%eax
DB 15,40,72,64 ; movaps 0x40(%eax),%xmm1
- DB 15,40,145,107,192,0,0 ; movaps 0xc06b(%ecx),%xmm2
+ DB 15,40,145,75,192,0,0 ; movaps 0xc04b(%ecx),%xmm2
DB 15,40,234 ; movaps %xmm2,%xmm5
DB 15,92,233 ; subps %xmm1,%xmm5
DB 15,40,225 ; movaps %xmm1,%xmm4
@@ -44763,7 +44763,7 @@ _sk_overlay_sse2 LABEL PROC
DB 89 ; pop %ecx
DB 139,69,8 ; mov 0x8(%ebp),%eax
DB 15,40,80,64 ; movaps 0x40(%eax),%xmm2
- DB 15,40,161,32,191,0,0 ; movaps 0xbf20(%ecx),%xmm4
+ DB 15,40,161,0,191,0,0 ; movaps 0xbf00(%ecx),%xmm4
DB 15,40,244 ; movaps %xmm4,%xmm6
DB 15,92,242 ; subps %xmm2,%xmm6
DB 15,40,206 ; movaps %xmm6,%xmm1
@@ -44889,17 +44889,17 @@ _sk_softlight_sse2 LABEL PROC
DB 232,0,0,0,0 ; call f60 <_sk_softlight_sse2+0x52>
DB 89 ; pop %ecx
DB 15,40,194 ; movaps %xmm2,%xmm0
- DB 15,40,137,0,190,0,0 ; movaps 0xbe00(%ecx),%xmm1
+ DB 15,40,137,224,189,0,0 ; movaps 0xbde0(%ecx),%xmm1
DB 15,41,141,104,255,255,255 ; movaps %xmm1,-0x98(%ebp)
DB 15,88,193 ; addps %xmm1,%xmm0
DB 15,89,198 ; mulps %xmm6,%xmm0
- DB 15,40,185,144,189,0,0 ; movaps 0xbd90(%ecx),%xmm7
+ DB 15,40,185,112,189,0,0 ; movaps 0xbd70(%ecx),%xmm7
DB 15,41,125,232 ; movaps %xmm7,-0x18(%ebp)
DB 15,92,250 ; subps %xmm2,%xmm7
DB 15,82,242 ; rsqrtps %xmm2,%xmm6
DB 15,83,206 ; rcpps %xmm6,%xmm1
DB 15,92,202 ; subps %xmm2,%xmm1
- DB 15,40,161,16,190,0,0 ; movaps 0xbe10(%ecx),%xmm4
+ DB 15,40,161,240,189,0,0 ; movaps 0xbdf0(%ecx),%xmm4
DB 15,41,101,152 ; movaps %xmm4,-0x68(%ebp)
DB 15,89,212 ; mulps %xmm4,%xmm2
DB 15,88,208 ; addps %xmm0,%xmm2
@@ -45103,7 +45103,7 @@ _sk_hue_sse2 LABEL PROC
DB 15,40,226 ; movaps %xmm2,%xmm4
DB 15,40,72,64 ; movaps 0x40(%eax),%xmm1
DB 15,41,77,216 ; movaps %xmm1,-0x28(%ebp)
- DB 15,40,169,207,186,0,0 ; movaps 0xbacf(%ecx),%xmm5
+ DB 15,40,169,175,186,0,0 ; movaps 0xbaaf(%ecx),%xmm5
DB 15,92,233 ; subps %xmm1,%xmm5
DB 15,89,197 ; mulps %xmm5,%xmm0
DB 15,41,133,72,255,255,255 ; movaps %xmm0,-0xb8(%ebp)
@@ -45136,17 +45136,17 @@ _sk_hue_sse2 LABEL PROC
DB 15,89,233 ; mulps %xmm1,%xmm5
DB 15,41,173,120,255,255,255 ; movaps %xmm5,-0x88(%ebp)
DB 15,89,193 ; mulps %xmm1,%xmm0
- DB 15,40,153,95,187,0,0 ; movaps 0xbb5f(%ecx),%xmm3
+ DB 15,40,153,63,187,0,0 ; movaps 0xbb3f(%ecx),%xmm3
DB 15,41,93,232 ; movaps %xmm3,-0x18(%ebp)
DB 15,40,117,152 ; movaps -0x68(%ebp),%xmm6
DB 15,40,206 ; movaps %xmm6,%xmm1
DB 15,89,203 ; mulps %xmm3,%xmm1
- DB 15,40,153,111,187,0,0 ; movaps 0xbb6f(%ecx),%xmm3
+ DB 15,40,153,79,187,0,0 ; movaps 0xbb4f(%ecx),%xmm3
DB 15,40,109,136 ; movaps -0x78(%ebp),%xmm5
DB 15,40,253 ; movaps %xmm5,%xmm7
DB 15,89,251 ; mulps %xmm3,%xmm7
DB 15,88,249 ; addps %xmm1,%xmm7
- DB 15,40,137,207,186,0,0 ; movaps 0xbacf(%ecx),%xmm1
+ DB 15,40,137,175,186,0,0 ; movaps 0xbaaf(%ecx),%xmm1
DB 15,92,77,184 ; subps -0x48(%ebp),%xmm1
DB 15,89,241 ; mulps %xmm1,%xmm6
DB 15,41,117,152 ; movaps %xmm6,-0x68(%ebp)
@@ -45156,7 +45156,7 @@ _sk_hue_sse2 LABEL PROC
DB 15,40,77,200 ; movaps -0x38(%ebp),%xmm1
DB 15,89,241 ; mulps %xmm1,%xmm6
DB 15,41,117,168 ; movaps %xmm6,-0x58(%ebp)
- DB 15,40,169,127,187,0,0 ; movaps 0xbb7f(%ecx),%xmm5
+ DB 15,40,169,95,187,0,0 ; movaps 0xbb5f(%ecx),%xmm5
DB 15,89,205 ; mulps %xmm5,%xmm1
DB 15,88,207 ; addps %xmm7,%xmm1
DB 15,94,212 ; divps %xmm4,%xmm2
@@ -45347,17 +45347,17 @@ _sk_saturation_sse2 LABEL PROC
DB 15,89,253 ; mulps %xmm5,%xmm7
DB 232,0,0,0,0 ; call 1575 <_sk_saturation_sse2+0xb0>
DB 89 ; pop %ecx
- DB 15,40,153,11,184,0,0 ; movaps 0xb80b(%ecx),%xmm3
+ DB 15,40,153,235,183,0,0 ; movaps 0xb7eb(%ecx),%xmm3
DB 15,41,157,88,255,255,255 ; movaps %xmm3,-0xa8(%ebp)
DB 15,40,77,184 ; movaps -0x48(%ebp),%xmm1
DB 15,40,193 ; movaps %xmm1,%xmm0
DB 15,89,195 ; mulps %xmm3,%xmm0
- DB 15,40,153,27,184,0,0 ; movaps 0xb81b(%ecx),%xmm3
+ DB 15,40,153,251,183,0,0 ; movaps 0xb7fb(%ecx),%xmm3
DB 15,41,93,232 ; movaps %xmm3,-0x18(%ebp)
DB 15,40,238 ; movaps %xmm6,%xmm5
DB 15,89,235 ; mulps %xmm3,%xmm5
DB 15,88,232 ; addps %xmm0,%xmm5
- DB 15,40,129,123,183,0,0 ; movaps 0xb77b(%ecx),%xmm0
+ DB 15,40,129,91,183,0,0 ; movaps 0xb75b(%ecx),%xmm0
DB 15,41,133,104,255,255,255 ; movaps %xmm0,-0x98(%ebp)
DB 15,92,69,216 ; subps -0x28(%ebp),%xmm0
DB 15,89,200 ; mulps %xmm0,%xmm1
@@ -45369,7 +45369,7 @@ _sk_saturation_sse2 LABEL PROC
DB 15,89,200 ; mulps %xmm0,%xmm1
DB 15,41,141,120,255,255,255 ; movaps %xmm1,-0x88(%ebp)
DB 15,40,200 ; movaps %xmm0,%xmm1
- DB 15,40,129,43,184,0,0 ; movaps 0xb82b(%ecx),%xmm0
+ DB 15,40,129,11,184,0,0 ; movaps 0xb80b(%ecx),%xmm0
DB 15,89,200 ; mulps %xmm0,%xmm1
DB 15,88,205 ; addps %xmm5,%xmm1
DB 15,40,109,168 ; movaps -0x58(%ebp),%xmm5
@@ -45526,16 +45526,16 @@ _sk_color_sse2 LABEL PROC
DB 139,69,8 ; mov 0x8(%ebp),%eax
DB 15,40,80,16 ; movaps 0x10(%eax),%xmm2
DB 15,40,72,32 ; movaps 0x20(%eax),%xmm1
- DB 15,40,177,176,181,0,0 ; movaps 0xb5b0(%ecx),%xmm6
+ DB 15,40,177,144,181,0,0 ; movaps 0xb590(%ecx),%xmm6
DB 15,41,117,216 ; movaps %xmm6,-0x28(%ebp)
DB 15,40,194 ; movaps %xmm2,%xmm0
DB 15,89,198 ; mulps %xmm6,%xmm0
- DB 15,40,153,192,181,0,0 ; movaps 0xb5c0(%ecx),%xmm3
+ DB 15,40,153,160,181,0,0 ; movaps 0xb5a0(%ecx),%xmm3
DB 15,41,93,184 ; movaps %xmm3,-0x48(%ebp)
DB 15,40,241 ; movaps %xmm1,%xmm6
DB 15,89,243 ; mulps %xmm3,%xmm6
DB 15,88,240 ; addps %xmm0,%xmm6
- DB 15,40,129,32,181,0,0 ; movaps 0xb520(%ecx),%xmm0
+ DB 15,40,129,0,181,0,0 ; movaps 0xb500(%ecx),%xmm0
DB 15,41,69,168 ; movaps %xmm0,-0x58(%ebp)
DB 15,92,69,200 ; subps -0x38(%ebp),%xmm0
DB 15,89,208 ; mulps %xmm0,%xmm2
@@ -45545,7 +45545,7 @@ _sk_color_sse2 LABEL PROC
DB 15,40,80,48 ; movaps 0x30(%eax),%xmm2
DB 15,89,194 ; mulps %xmm2,%xmm0
DB 15,41,133,72,255,255,255 ; movaps %xmm0,-0xb8(%ebp)
- DB 15,40,137,208,181,0,0 ; movaps 0xb5d0(%ecx),%xmm1
+ DB 15,40,137,176,181,0,0 ; movaps 0xb5b0(%ecx),%xmm1
DB 15,89,209 ; mulps %xmm1,%xmm2
DB 15,88,214 ; addps %xmm6,%xmm2
DB 15,40,88,64 ; movaps 0x40(%eax),%xmm3
@@ -45702,18 +45702,18 @@ _sk_luminosity_sse2 LABEL PROC
DB 232,0,0,0,0 ; call 1a33 <_sk_luminosity_sse2+0x11>
DB 89 ; pop %ecx
DB 139,69,8 ; mov 0x8(%ebp),%eax
- DB 15,40,161,77,179,0,0 ; movaps 0xb34d(%ecx),%xmm4
+ DB 15,40,161,45,179,0,0 ; movaps 0xb32d(%ecx),%xmm4
DB 15,41,101,232 ; movaps %xmm4,-0x18(%ebp)
DB 15,40,208 ; movaps %xmm0,%xmm2
DB 15,89,212 ; mulps %xmm4,%xmm2
- DB 15,40,161,93,179,0,0 ; movaps 0xb35d(%ecx),%xmm4
+ DB 15,40,161,61,179,0,0 ; movaps 0xb33d(%ecx),%xmm4
DB 15,41,101,216 ; movaps %xmm4,-0x28(%ebp)
DB 15,40,233 ; movaps %xmm1,%xmm5
DB 15,89,236 ; mulps %xmm4,%xmm5
DB 15,88,234 ; addps %xmm2,%xmm5
DB 15,40,80,64 ; movaps 0x40(%eax),%xmm2
DB 15,41,85,184 ; movaps %xmm2,-0x48(%ebp)
- DB 15,40,161,189,178,0,0 ; movaps 0xb2bd(%ecx),%xmm4
+ DB 15,40,161,157,178,0,0 ; movaps 0xb29d(%ecx),%xmm4
DB 15,40,252 ; movaps %xmm4,%xmm7
DB 15,92,250 ; subps %xmm2,%xmm7
DB 15,89,199 ; mulps %xmm7,%xmm0
@@ -45723,7 +45723,7 @@ _sk_luminosity_sse2 LABEL PROC
DB 15,89,254 ; mulps %xmm6,%xmm7
DB 15,41,189,104,255,255,255 ; movaps %xmm7,-0x98(%ebp)
DB 15,40,214 ; movaps %xmm6,%xmm2
- DB 15,40,137,109,179,0,0 ; movaps 0xb36d(%ecx),%xmm1
+ DB 15,40,137,77,179,0,0 ; movaps 0xb34d(%ecx),%xmm1
DB 15,89,209 ; mulps %xmm1,%xmm2
DB 15,88,213 ; addps %xmm5,%xmm2
DB 15,40,104,16 ; movaps 0x10(%eax),%xmm5
@@ -45897,7 +45897,7 @@ _sk_srcover_rgba_8888_sse2 LABEL PROC
DB 139,49 ; mov (%ecx),%esi
DB 15,133,224,0,0,0 ; jne 1da0 <_sk_srcover_rgba_8888_sse2+0x119>
DB 243,15,111,20,178 ; movdqu (%edx,%esi,4),%xmm2
- DB 102,15,111,167,18,177,0,0 ; movdqa 0xb112(%edi),%xmm4
+ DB 102,15,111,167,242,176,0,0 ; movdqa 0xb0f2(%edi),%xmm4
DB 102,15,111,234 ; movdqa %xmm2,%xmm5
DB 102,15,219,236 ; pand %xmm4,%xmm5
DB 102,15,111,242 ; movdqa %xmm2,%xmm6
@@ -45908,9 +45908,9 @@ _sk_srcover_rgba_8888_sse2 LABEL PROC
DB 102,15,219,252 ; pand %xmm4,%xmm7
DB 15,91,229 ; cvtdq2ps %xmm5,%xmm4
DB 15,41,97,16 ; movaps %xmm4,0x10(%ecx)
- DB 15,40,175,82,176,0,0 ; movaps 0xb052(%edi),%xmm5
+ DB 15,40,175,50,176,0,0 ; movaps 0xb032(%edi),%xmm5
DB 15,92,235 ; subps %xmm3,%xmm5
- DB 15,40,143,34,177,0,0 ; movaps 0xb122(%edi),%xmm1
+ DB 15,40,143,2,177,0,0 ; movaps 0xb102(%edi),%xmm1
DB 15,89,193 ; mulps %xmm1,%xmm0
DB 15,89,229 ; mulps %xmm5,%xmm4
DB 15,88,224 ; addps %xmm0,%xmm4
@@ -46020,7 +46020,7 @@ _sk_clamp_1_sse2 LABEL PROC
DB 232,0,0,0,0 ; call 1e4a <_sk_clamp_1_sse2+0xb>
DB 88 ; pop %eax
DB 139,77,12 ; mov 0xc(%ebp),%ecx
- DB 15,40,160,166,174,0,0 ; movaps 0xaea6(%eax),%xmm4
+ DB 15,40,160,134,174,0,0 ; movaps 0xae86(%eax),%xmm4
DB 15,93,196 ; minps %xmm4,%xmm0
DB 15,93,204 ; minps %xmm4,%xmm1
DB 15,93,212 ; minps %xmm4,%xmm2
@@ -46042,7 +46042,7 @@ _sk_clamp_a_sse2 LABEL PROC
DB 232,0,0,0,0 ; call 1e7d <_sk_clamp_a_sse2+0xb>
DB 88 ; pop %eax
DB 139,77,12 ; mov 0xc(%ebp),%ecx
- DB 15,93,152,115,174,0,0 ; minps 0xae73(%eax),%xmm3
+ DB 15,93,152,83,174,0,0 ; minps 0xae53(%eax),%xmm3
DB 15,93,195 ; minps %xmm3,%xmm0
DB 15,93,203 ; minps %xmm3,%xmm1
DB 15,93,211 ; minps %xmm3,%xmm2
@@ -46065,7 +46065,7 @@ _sk_clamp_a_dst_sse2 LABEL PROC
DB 139,77,12 ; mov 0xc(%ebp),%ecx
DB 139,85,8 ; mov 0x8(%ebp),%edx
DB 15,40,98,64 ; movaps 0x40(%edx),%xmm4
- DB 15,93,160,67,174,0,0 ; minps 0xae43(%eax),%xmm4
+ DB 15,93,160,35,174,0,0 ; minps 0xae23(%eax),%xmm4
DB 15,41,98,64 ; movaps %xmm4,0x40(%edx)
DB 15,40,106,16 ; movaps 0x10(%edx),%xmm5
DB 15,40,114,32 ; movaps 0x20(%edx),%xmm6
@@ -46133,7 +46133,7 @@ _sk_invert_sse2 LABEL PROC
DB 232,0,0,0,0 ; call 1f58 <_sk_invert_sse2+0xb>
DB 88 ; pop %eax
DB 139,77,12 ; mov 0xc(%ebp),%ecx
- DB 15,40,160,152,173,0,0 ; movaps 0xad98(%eax),%xmm4
+ DB 15,40,160,120,173,0,0 ; movaps 0xad78(%eax),%xmm4
DB 15,40,236 ; movaps %xmm4,%xmm5
DB 15,92,232 ; subps %xmm0,%xmm5
DB 15,40,244 ; movaps %xmm4,%xmm6
@@ -46246,7 +46246,7 @@ _sk_unpremul_sse2 LABEL PROC
DB 88 ; pop %eax
DB 139,77,12 ; mov 0xc(%ebp),%ecx
DB 15,87,228 ; xorps %xmm4,%xmm4
- DB 15,40,168,154,172,0,0 ; movaps 0xac9a(%eax),%xmm5
+ DB 15,40,168,122,172,0,0 ; movaps 0xac7a(%eax),%xmm5
DB 15,94,235 ; divps %xmm3,%xmm5
DB 15,194,227,4 ; cmpneqps %xmm3,%xmm4
DB 15,84,229 ; andps %xmm5,%xmm4
@@ -46275,19 +46275,19 @@ _sk_from_srgb_sse2 LABEL PROC
DB 88 ; pop %eax
DB 15,40,202 ; movaps %xmm2,%xmm1
DB 15,89,201 ; mulps %xmm1,%xmm1
- DB 15,40,160,224,172,0,0 ; movaps 0xace0(%eax),%xmm4
+ DB 15,40,160,192,172,0,0 ; movaps 0xacc0(%eax),%xmm4
DB 15,89,196 ; mulps %xmm4,%xmm0
- DB 15,40,176,64,173,0,0 ; movaps 0xad40(%eax),%xmm6
+ DB 15,40,176,32,173,0,0 ; movaps 0xad20(%eax),%xmm6
DB 15,41,117,216 ; movaps %xmm6,-0x28(%ebp)
DB 15,88,198 ; addps %xmm6,%xmm0
DB 15,89,193 ; mulps %xmm1,%xmm0
- DB 15,40,176,48,173,0,0 ; movaps 0xad30(%eax),%xmm6
+ DB 15,40,176,16,173,0,0 ; movaps 0xad10(%eax),%xmm6
DB 15,40,202 ; movaps %xmm2,%xmm1
DB 15,89,206 ; mulps %xmm6,%xmm1
- DB 15,40,184,80,173,0,0 ; movaps 0xad50(%eax),%xmm7
+ DB 15,40,184,48,173,0,0 ; movaps 0xad30(%eax),%xmm7
DB 15,41,125,232 ; movaps %xmm7,-0x18(%ebp)
DB 15,88,199 ; addps %xmm7,%xmm0
- DB 15,40,184,96,173,0,0 ; movaps 0xad60(%eax),%xmm7
+ DB 15,40,184,64,173,0,0 ; movaps 0xad40(%eax),%xmm7
DB 15,194,215,1 ; cmpltps %xmm7,%xmm2
DB 15,84,202 ; andps %xmm2,%xmm1
DB 15,85,208 ; andnps %xmm0,%xmm2
@@ -46345,18 +46345,18 @@ _sk_from_srgb_dst_sse2 LABEL PROC
DB 15,40,72,16 ; movaps 0x10(%eax),%xmm1
DB 15,40,233 ; movaps %xmm1,%xmm5
DB 15,89,237 ; mulps %xmm5,%xmm5
- DB 15,40,161,5,172,0,0 ; movaps 0xac05(%ecx),%xmm4
+ DB 15,40,161,229,171,0,0 ; movaps 0xabe5(%ecx),%xmm4
DB 15,40,193 ; movaps %xmm1,%xmm0
DB 15,89,196 ; mulps %xmm4,%xmm0
- DB 15,40,177,101,172,0,0 ; movaps 0xac65(%ecx),%xmm6
+ DB 15,40,177,69,172,0,0 ; movaps 0xac45(%ecx),%xmm6
DB 15,88,198 ; addps %xmm6,%xmm0
DB 15,89,197 ; mulps %xmm5,%xmm0
- DB 15,40,169,85,172,0,0 ; movaps 0xac55(%ecx),%xmm5
+ DB 15,40,169,53,172,0,0 ; movaps 0xac35(%ecx),%xmm5
DB 15,40,209 ; movaps %xmm1,%xmm2
DB 15,89,213 ; mulps %xmm5,%xmm2
- DB 15,40,185,117,172,0,0 ; movaps 0xac75(%ecx),%xmm7
+ DB 15,40,185,85,172,0,0 ; movaps 0xac55(%ecx),%xmm7
DB 15,88,199 ; addps %xmm7,%xmm0
- DB 15,40,153,133,172,0,0 ; movaps 0xac85(%ecx),%xmm3
+ DB 15,40,153,101,172,0,0 ; movaps 0xac65(%ecx),%xmm3
DB 15,194,203,1 ; cmpltps %xmm3,%xmm1
DB 15,84,209 ; andps %xmm1,%xmm2
DB 15,85,200 ; andnps %xmm0,%xmm1
@@ -46416,25 +46416,25 @@ _sk_to_srgb_sse2 LABEL PROC
DB 232,0,0,0,0 ; call 2266 <_sk_to_srgb_sse2+0x18>
DB 88 ; pop %eax
DB 15,82,218 ; rsqrtps %xmm2,%xmm3
- DB 15,40,160,186,171,0,0 ; movaps 0xabba(%eax),%xmm4
+ DB 15,40,160,154,171,0,0 ; movaps 0xab9a(%eax),%xmm4
DB 15,40,235 ; movaps %xmm3,%xmm5
DB 15,89,236 ; mulps %xmm4,%xmm5
- DB 15,40,128,202,171,0,0 ; movaps 0xabca(%eax),%xmm0
+ DB 15,40,128,170,171,0,0 ; movaps 0xabaa(%eax),%xmm0
DB 15,41,69,232 ; movaps %xmm0,-0x18(%ebp)
DB 15,88,232 ; addps %xmm0,%xmm5
DB 15,89,235 ; mulps %xmm3,%xmm5
- DB 15,40,128,218,171,0,0 ; movaps 0xabda(%eax),%xmm0
+ DB 15,40,128,186,171,0,0 ; movaps 0xabba(%eax),%xmm0
DB 15,41,69,200 ; movaps %xmm0,-0x38(%ebp)
DB 15,88,232 ; addps %xmm0,%xmm5
- DB 15,40,128,234,171,0,0 ; movaps 0xabea(%eax),%xmm0
+ DB 15,40,128,202,171,0,0 ; movaps 0xabca(%eax),%xmm0
DB 15,41,69,216 ; movaps %xmm0,-0x28(%ebp)
DB 15,88,216 ; addps %xmm0,%xmm3
DB 15,83,195 ; rcpps %xmm3,%xmm0
DB 15,89,197 ; mulps %xmm5,%xmm0
- DB 15,40,168,170,171,0,0 ; movaps 0xabaa(%eax),%xmm5
+ DB 15,40,168,138,171,0,0 ; movaps 0xab8a(%eax),%xmm5
DB 15,40,202 ; movaps %xmm2,%xmm1
DB 15,89,205 ; mulps %xmm5,%xmm1
- DB 15,40,152,250,171,0,0 ; movaps 0xabfa(%eax),%xmm3
+ DB 15,40,152,218,171,0,0 ; movaps 0xabda(%eax),%xmm3
DB 15,194,211,1 ; cmpltps %xmm3,%xmm2
DB 15,84,202 ; andps %xmm2,%xmm1
DB 15,85,208 ; andnps %xmm0,%xmm2
@@ -46503,14 +46503,14 @@ _sk_rgb_to_hsl_sse2 LABEL PROC
DB 15,40,195 ; movaps %xmm3,%xmm0
DB 15,92,193 ; subps %xmm1,%xmm0
DB 15,41,69,216 ; movaps %xmm0,-0x28(%ebp)
- DB 15,40,136,147,169,0,0 ; movaps 0xa993(%eax),%xmm1
+ DB 15,40,136,115,169,0,0 ; movaps 0xa973(%eax),%xmm1
DB 15,94,200 ; divps %xmm0,%xmm1
DB 15,40,199 ; movaps %xmm7,%xmm0
DB 15,92,194 ; subps %xmm2,%xmm0
DB 15,89,193 ; mulps %xmm1,%xmm0
DB 15,40,239 ; movaps %xmm7,%xmm5
DB 15,194,234,1 ; cmpltps %xmm2,%xmm5
- DB 15,84,168,19,171,0,0 ; andps 0xab13(%eax),%xmm5
+ DB 15,84,168,243,170,0,0 ; andps 0xaaf3(%eax),%xmm5
DB 15,88,232 ; addps %xmm0,%xmm5
DB 15,40,195 ; movaps %xmm3,%xmm0
DB 15,194,196,0 ; cmpeqps %xmm4,%xmm0
@@ -46520,9 +46520,9 @@ _sk_rgb_to_hsl_sse2 LABEL PROC
DB 15,92,231 ; subps %xmm7,%xmm4
DB 15,89,209 ; mulps %xmm1,%xmm2
DB 15,89,225 ; mulps %xmm1,%xmm4
- DB 15,40,136,35,171,0,0 ; movaps 0xab23(%eax),%xmm1
+ DB 15,40,136,3,171,0,0 ; movaps 0xab03(%eax),%xmm1
DB 15,88,209 ; addps %xmm1,%xmm2
- DB 15,88,160,51,171,0,0 ; addps 0xab33(%eax),%xmm4
+ DB 15,88,160,19,171,0,0 ; addps 0xab13(%eax),%xmm4
DB 15,84,214 ; andps %xmm6,%xmm2
DB 15,85,244 ; andnps %xmm4,%xmm6
DB 15,86,242 ; orps %xmm2,%xmm6
@@ -46534,7 +46534,7 @@ _sk_rgb_to_hsl_sse2 LABEL PROC
DB 15,194,226,4 ; cmpneqps %xmm2,%xmm4
DB 15,92,203 ; subps %xmm3,%xmm1
DB 15,88,218 ; addps %xmm2,%xmm3
- DB 15,40,168,131,169,0,0 ; movaps 0xa983(%eax),%xmm5
+ DB 15,40,168,99,169,0,0 ; movaps 0xa963(%eax),%xmm5
DB 15,92,202 ; subps %xmm2,%xmm1
DB 15,40,211 ; movaps %xmm3,%xmm2
DB 15,89,213 ; mulps %xmm5,%xmm2
@@ -46544,7 +46544,7 @@ _sk_rgb_to_hsl_sse2 LABEL PROC
DB 15,86,233 ; orps %xmm1,%xmm5
DB 15,40,77,216 ; movaps -0x28(%ebp),%xmm1
DB 15,94,205 ; divps %xmm5,%xmm1
- DB 15,89,128,67,171,0,0 ; mulps 0xab43(%eax),%xmm0
+ DB 15,89,128,35,171,0,0 ; mulps 0xab23(%eax),%xmm0
DB 15,84,196 ; andps %xmm4,%xmm0
DB 15,84,204 ; andps %xmm4,%xmm1
DB 139,69,12 ; mov 0xc(%ebp),%eax
@@ -46567,7 +46567,7 @@ _sk_hsl_to_rgb_sse2 LABEL PROC
DB 15,41,69,184 ; movaps %xmm0,-0x48(%ebp)
DB 232,0,0,0,0 ; call 2458 <_sk_hsl_to_rgb_sse2+0x19>
DB 88 ; pop %eax
- DB 15,40,160,136,168,0,0 ; movaps 0xa888(%eax),%xmm4
+ DB 15,40,160,104,168,0,0 ; movaps 0xa868(%eax),%xmm4
DB 15,40,220 ; movaps %xmm4,%xmm3
DB 15,41,165,104,255,255,255 ; movaps %xmm4,-0x98(%ebp)
DB 15,194,218,2 ; cmpleps %xmm2,%xmm3
@@ -46580,13 +46580,13 @@ _sk_hsl_to_rgb_sse2 LABEL PROC
DB 15,84,243 ; andps %xmm3,%xmm6
DB 15,85,217 ; andnps %xmm1,%xmm3
DB 15,86,222 ; orps %xmm6,%xmm3
- DB 15,40,168,88,170,0,0 ; movaps 0xaa58(%eax),%xmm5
+ DB 15,40,168,56,170,0,0 ; movaps 0xaa38(%eax),%xmm5
DB 15,88,232 ; addps %xmm0,%xmm5
DB 243,15,91,205 ; cvttps2dq %xmm5,%xmm1
DB 15,91,201 ; cvtdq2ps %xmm1,%xmm1
DB 15,40,197 ; movaps %xmm5,%xmm0
DB 15,194,193,1 ; cmpltps %xmm1,%xmm0
- DB 15,40,176,152,168,0,0 ; movaps 0xa898(%eax),%xmm6
+ DB 15,40,176,120,168,0,0 ; movaps 0xa878(%eax),%xmm6
DB 15,41,117,136 ; movaps %xmm6,-0x78(%ebp)
DB 15,84,198 ; andps %xmm6,%xmm0
DB 15,92,200 ; subps %xmm0,%xmm1
@@ -46596,19 +46596,19 @@ _sk_hsl_to_rgb_sse2 LABEL PROC
DB 15,41,93,216 ; movaps %xmm3,-0x28(%ebp)
DB 15,88,210 ; addps %xmm2,%xmm2
DB 15,92,211 ; subps %xmm3,%xmm2
- DB 15,40,184,104,170,0,0 ; movaps 0xaa68(%eax),%xmm7
+ DB 15,40,184,72,170,0,0 ; movaps 0xaa48(%eax),%xmm7
DB 15,41,189,88,255,255,255 ; movaps %xmm7,-0xa8(%ebp)
DB 15,194,253,2 ; cmpleps %xmm5,%xmm7
DB 15,92,218 ; subps %xmm2,%xmm3
DB 15,41,93,200 ; movaps %xmm3,-0x38(%ebp)
DB 15,40,204 ; movaps %xmm4,%xmm1
DB 15,194,205,2 ; cmpleps %xmm5,%xmm1
- DB 15,40,160,72,170,0,0 ; movaps 0xaa48(%eax),%xmm4
+ DB 15,40,160,40,170,0,0 ; movaps 0xaa28(%eax),%xmm4
DB 15,41,165,120,255,255,255 ; movaps %xmm4,-0x88(%ebp)
DB 15,194,229,2 ; cmpleps %xmm5,%xmm4
- DB 15,40,176,24,170,0,0 ; movaps 0xaa18(%eax),%xmm6
+ DB 15,40,176,248,169,0,0 ; movaps 0xa9f8(%eax),%xmm6
DB 15,89,238 ; mulps %xmm6,%xmm5
- DB 15,40,128,56,170,0,0 ; movaps 0xaa38(%eax),%xmm0
+ DB 15,40,128,24,170,0,0 ; movaps 0xaa18(%eax),%xmm0
DB 15,41,69,168 ; movaps %xmm0,-0x58(%ebp)
DB 15,92,197 ; subps %xmm5,%xmm0
DB 15,89,195 ; mulps %xmm3,%xmm0
@@ -46634,18 +46634,18 @@ _sk_hsl_to_rgb_sse2 LABEL PROC
DB 15,91,192 ; cvtdq2ps %xmm0,%xmm0
DB 15,40,203 ; movaps %xmm3,%xmm1
DB 15,194,200,1 ; cmpltps %xmm0,%xmm1
- DB 15,84,136,152,168,0,0 ; andps 0xa898(%eax),%xmm1
+ DB 15,84,136,120,168,0,0 ; andps 0xa878(%eax),%xmm1
DB 15,92,193 ; subps %xmm1,%xmm0
DB 15,40,203 ; movaps %xmm3,%xmm1
DB 15,92,200 ; subps %xmm0,%xmm1
- DB 15,40,128,104,170,0,0 ; movaps 0xaa68(%eax),%xmm0
+ DB 15,40,128,72,170,0,0 ; movaps 0xaa48(%eax),%xmm0
DB 15,194,193,2 ; cmpleps %xmm1,%xmm0
- DB 15,40,152,136,168,0,0 ; movaps 0xa888(%eax),%xmm3
+ DB 15,40,152,104,168,0,0 ; movaps 0xa868(%eax),%xmm3
DB 15,194,217,2 ; cmpleps %xmm1,%xmm3
- DB 15,40,160,72,170,0,0 ; movaps 0xaa48(%eax),%xmm4
+ DB 15,40,160,40,170,0,0 ; movaps 0xaa28(%eax),%xmm4
DB 15,194,225,2 ; cmpleps %xmm1,%xmm4
DB 15,89,206 ; mulps %xmm6,%xmm1
- DB 15,40,168,56,170,0,0 ; movaps 0xaa38(%eax),%xmm5
+ DB 15,40,168,24,170,0,0 ; movaps 0xaa18(%eax),%xmm5
DB 15,92,233 ; subps %xmm1,%xmm5
DB 15,89,239 ; mulps %xmm7,%xmm5
DB 15,88,234 ; addps %xmm2,%xmm5
@@ -46665,7 +46665,7 @@ _sk_hsl_to_rgb_sse2 LABEL PROC
DB 15,40,125,232 ; movaps -0x18(%ebp),%xmm7
DB 15,85,252 ; andnps %xmm4,%xmm7
DB 15,40,93,184 ; movaps -0x48(%ebp),%xmm3
- DB 15,88,152,120,170,0,0 ; addps 0xaa78(%eax),%xmm3
+ DB 15,88,152,88,170,0,0 ; addps 0xaa58(%eax),%xmm3
DB 243,15,91,195 ; cvttps2dq %xmm3,%xmm0
DB 15,91,192 ; cvtdq2ps %xmm0,%xmm0
DB 15,40,203 ; movaps %xmm3,%xmm1
@@ -46763,9 +46763,9 @@ _sk_scale_u8_sse2 LABEL PROC
DB 102,15,110,36,62 ; movd (%esi,%edi,1),%xmm4
DB 102,15,96,224 ; punpcklbw %xmm0,%xmm4
DB 102,15,97,224 ; punpcklwd %xmm0,%xmm4
- DB 102,15,219,162,222,166,0,0 ; pand 0xa6de(%edx),%xmm4
+ DB 102,15,219,162,190,166,0,0 ; pand 0xa6be(%edx),%xmm4
DB 15,91,228 ; cvtdq2ps %xmm4,%xmm4
- DB 15,89,162,14,168,0,0 ; mulps 0xa80e(%edx),%xmm4
+ DB 15,89,162,238,167,0,0 ; mulps 0xa7ee(%edx),%xmm4
DB 15,89,196 ; mulps %xmm4,%xmm0
DB 15,89,204 ; mulps %xmm4,%xmm1
DB 15,89,212 ; mulps %xmm4,%xmm2
@@ -46829,17 +46829,17 @@ _sk_scale_565_sse2 LABEL PROC
DB 15,133,157,0,0,0 ; jne 284a <_sk_scale_565_sse2+0xd8>
DB 243,15,126,52,126 ; movq (%esi,%edi,2),%xmm6
DB 102,15,97,240 ; punpcklwd %xmm0,%xmm6
- DB 102,15,111,162,100,167,0,0 ; movdqa 0xa764(%edx),%xmm4
+ DB 102,15,111,162,68,167,0,0 ; movdqa 0xa744(%edx),%xmm4
DB 102,15,219,230 ; pand %xmm6,%xmm4
DB 15,91,212 ; cvtdq2ps %xmm4,%xmm2
- DB 15,89,146,116,167,0,0 ; mulps 0xa774(%edx),%xmm2
- DB 102,15,111,170,132,167,0,0 ; movdqa 0xa784(%edx),%xmm5
+ DB 15,89,146,84,167,0,0 ; mulps 0xa754(%edx),%xmm2
+ DB 102,15,111,170,100,167,0,0 ; movdqa 0xa764(%edx),%xmm5
DB 102,15,219,238 ; pand %xmm6,%xmm5
DB 15,91,237 ; cvtdq2ps %xmm5,%xmm5
- DB 15,89,170,148,167,0,0 ; mulps 0xa794(%edx),%xmm5
- DB 102,15,219,178,164,167,0,0 ; pand 0xa7a4(%edx),%xmm6
+ DB 15,89,170,116,167,0,0 ; mulps 0xa774(%edx),%xmm5
+ DB 102,15,219,178,132,167,0,0 ; pand 0xa784(%edx),%xmm6
DB 15,91,246 ; cvtdq2ps %xmm6,%xmm6
- DB 15,89,178,180,167,0,0 ; mulps 0xa7b4(%edx),%xmm6
+ DB 15,89,178,148,167,0,0 ; mulps 0xa794(%edx),%xmm6
DB 15,40,253 ; movaps %xmm5,%xmm7
DB 15,93,254 ; minps %xmm6,%xmm7
DB 15,40,226 ; movaps %xmm2,%xmm4
@@ -46949,9 +46949,9 @@ _sk_lerp_u8_sse2 LABEL PROC
DB 102,15,110,36,62 ; movd (%esi,%edi,1),%xmm4
DB 102,15,96,224 ; punpcklbw %xmm0,%xmm4
DB 102,15,97,224 ; punpcklwd %xmm0,%xmm4
- DB 102,15,219,162,182,164,0,0 ; pand 0xa4b6(%edx),%xmm4
+ DB 102,15,219,162,150,164,0,0 ; pand 0xa496(%edx),%xmm4
DB 15,91,228 ; cvtdq2ps %xmm4,%xmm4
- DB 15,89,162,230,165,0,0 ; mulps 0xa5e6(%edx),%xmm4
+ DB 15,89,162,198,165,0,0 ; mulps 0xa5c6(%edx),%xmm4
DB 15,40,105,16 ; movaps 0x10(%ecx),%xmm5
DB 15,40,113,32 ; movaps 0x20(%ecx),%xmm6
DB 15,92,197 ; subps %xmm5,%xmm0
@@ -47027,17 +47027,17 @@ _sk_lerp_565_sse2 LABEL PROC
DB 15,133,211,0,0,0 ; jne 2ad8 <_sk_lerp_565_sse2+0x113>
DB 243,15,126,44,126 ; movq (%esi,%edi,2),%xmm5
DB 102,15,97,232 ; punpcklwd %xmm0,%xmm5
- DB 102,15,111,162,12,165,0,0 ; movdqa 0xa50c(%edx),%xmm4
+ DB 102,15,111,162,236,164,0,0 ; movdqa 0xa4ec(%edx),%xmm4
DB 102,15,219,229 ; pand %xmm5,%xmm4
DB 15,91,204 ; cvtdq2ps %xmm4,%xmm1
- DB 15,89,138,28,165,0,0 ; mulps 0xa51c(%edx),%xmm1
- DB 102,15,111,178,44,165,0,0 ; movdqa 0xa52c(%edx),%xmm6
+ DB 15,89,138,252,164,0,0 ; mulps 0xa4fc(%edx),%xmm1
+ DB 102,15,111,178,12,165,0,0 ; movdqa 0xa50c(%edx),%xmm6
DB 102,15,219,245 ; pand %xmm5,%xmm6
DB 15,91,246 ; cvtdq2ps %xmm6,%xmm6
- DB 15,89,178,60,165,0,0 ; mulps 0xa53c(%edx),%xmm6
- DB 102,15,219,170,76,165,0,0 ; pand 0xa54c(%edx),%xmm5
+ DB 15,89,178,28,165,0,0 ; mulps 0xa51c(%edx),%xmm6
+ DB 102,15,219,170,44,165,0,0 ; pand 0xa52c(%edx),%xmm5
DB 15,91,213 ; cvtdq2ps %xmm5,%xmm2
- DB 15,89,146,92,165,0,0 ; mulps 0xa55c(%edx),%xmm2
+ DB 15,89,146,60,165,0,0 ; mulps 0xa53c(%edx),%xmm2
DB 15,40,218 ; movaps %xmm2,%xmm3
DB 15,41,93,200 ; movaps %xmm3,-0x38(%ebp)
DB 15,40,254 ; movaps %xmm6,%xmm7
@@ -47114,16 +47114,16 @@ _sk_load_tables_sse2 LABEL PROC
DB 131,236,12 ; sub $0xc,%esp
DB 232,0,0,0,0 ; call 2b2e <_sk_load_tables_sse2+0xe>
DB 90 ; pop %edx
- DB 139,117,12 ; mov 0xc(%ebp),%esi
+ DB 139,69,12 ; mov 0xc(%ebp),%eax
DB 139,77,8 ; mov 0x8(%ebp),%ecx
- DB 139,57 ; mov (%ecx),%edi
+ DB 139,48 ; mov (%eax),%esi
DB 139,65,8 ; mov 0x8(%ecx),%eax
DB 133,192 ; test %eax,%eax
- DB 139,54 ; mov (%esi),%esi
+ DB 139,57 ; mov (%ecx),%edi
DB 139,30 ; mov (%esi),%ebx
DB 15,133,22,1,0,0 ; jne 2c5c <_sk_load_tables_sse2+0x13c>
DB 243,15,111,28,187 ; movdqu (%ebx,%edi,4),%xmm3
- DB 102,15,111,146,130,162,0,0 ; movdqa 0xa282(%edx),%xmm2
+ DB 102,15,111,146,98,162,0,0 ; movdqa 0xa262(%edx),%xmm2
DB 102,15,111,195 ; movdqa %xmm3,%xmm0
DB 102,15,219,194 ; pand %xmm2,%xmm0
DB 102,15,112,200,78 ; pshufd $0x4e,%xmm0,%xmm1
@@ -47179,7 +47179,7 @@ _sk_load_tables_sse2 LABEL PROC
DB 102,15,20,215 ; unpcklpd %xmm7,%xmm2
DB 102,15,114,211,24 ; psrld $0x18,%xmm3
DB 15,91,219 ; cvtdq2ps %xmm3,%xmm3
- DB 15,89,154,178,163,0,0 ; mulps 0xa3b2(%edx),%xmm3
+ DB 15,89,154,146,163,0,0 ; mulps 0xa392(%edx),%xmm3
DB 139,69,12 ; mov 0xc(%ebp),%eax
DB 137,194 ; mov %eax,%edx
DB 141,66,8 ; lea 0x8(%edx),%eax
@@ -47218,17 +47218,17 @@ _sk_load_tables_u16_be_sse2 LABEL PROC
DB 131,236,44 ; sub $0x2c,%esp
DB 232,0,0,0,0 ; call 2c9f <_sk_load_tables_u16_be_sse2+0xe>
DB 90 ; pop %edx
- DB 139,69,12 ; mov 0xc(%ebp),%eax
+ DB 139,117,12 ; mov 0xc(%ebp),%esi
DB 139,77,8 ; mov 0x8(%ebp),%ecx
DB 139,57 ; mov (%ecx),%edi
- DB 139,89,8 ; mov 0x8(%ecx),%ebx
+ DB 139,65,8 ; mov 0x8(%ecx),%eax
DB 193,231,2 ; shl $0x2,%edi
- DB 133,219 ; test %ebx,%ebx
- DB 139,48 ; mov (%eax),%esi
- DB 139,6 ; mov (%esi),%eax
+ DB 133,192 ; test %eax,%eax
+ DB 139,54 ; mov (%esi),%esi
+ DB 139,30 ; mov (%esi),%ebx
DB 15,133,210,1,0,0 ; jne 2e8c <_sk_load_tables_u16_be_sse2+0x1fb>
- DB 102,15,16,4,120 ; movupd (%eax,%edi,2),%xmm0
- DB 243,15,111,76,120,16 ; movdqu 0x10(%eax,%edi,2),%xmm1
+ DB 102,15,16,4,123 ; movupd (%ebx,%edi,2),%xmm0
+ DB 243,15,111,76,123,16 ; movdqu 0x10(%ebx,%edi,2),%xmm1
DB 102,15,40,216 ; movapd %xmm0,%xmm3
DB 102,15,97,217 ; punpcklwd %xmm1,%xmm3
DB 102,15,105,193 ; punpckhwd %xmm1,%xmm0
@@ -47252,7 +47252,7 @@ _sk_load_tables_u16_be_sse2 LABEL PROC
DB 242,15,112,192,232 ; pshuflw $0xe8,%xmm0,%xmm0
DB 243,15,112,192,232 ; pshufhw $0xe8,%xmm0,%xmm0
DB 102,15,112,192,232 ; pshufd $0xe8,%xmm0,%xmm0
- DB 102,15,111,146,177,162,0,0 ; movdqa 0xa2b1(%edx),%xmm2
+ DB 102,15,111,146,145,162,0,0 ; movdqa 0xa291(%edx),%xmm2
DB 102,15,219,194 ; pand %xmm2,%xmm0
DB 102,15,239,228 ; pxor %xmm4,%xmm4
DB 102,15,97,196 ; punpcklwd %xmm4,%xmm0
@@ -47324,7 +47324,7 @@ _sk_load_tables_u16_be_sse2 LABEL PROC
DB 243,15,126,93,232 ; movq -0x18(%ebp),%xmm3
DB 102,15,97,220 ; punpcklwd %xmm4,%xmm3
DB 15,91,219 ; cvtdq2ps %xmm3,%xmm3
- DB 15,89,154,193,162,0,0 ; mulps 0xa2c1(%edx),%xmm3
+ DB 15,89,154,161,162,0,0 ; mulps 0xa2a1(%edx),%xmm3
DB 139,69,12 ; mov 0xc(%ebp),%eax
DB 137,194 ; mov %eax,%edx
DB 141,66,8 ; lea 0x8(%edx),%eax
@@ -47338,14 +47338,14 @@ _sk_load_tables_u16_be_sse2 LABEL PROC
DB 91 ; pop %ebx
DB 93 ; pop %ebp
DB 195 ; ret
- DB 242,15,16,4,120 ; movsd (%eax,%edi,2),%xmm0
+ DB 242,15,16,4,123 ; movsd (%ebx,%edi,2),%xmm0
DB 102,15,239,201 ; pxor %xmm1,%xmm1
- DB 131,251,1 ; cmp $0x1,%ebx
+ DB 131,248,1 ; cmp $0x1,%eax
DB 15,132,39,254,255,255 ; je 2cc5 <_sk_load_tables_u16_be_sse2+0x34>
- DB 102,15,22,68,120,8 ; movhpd 0x8(%eax,%edi,2),%xmm0
- DB 131,251,3 ; cmp $0x3,%ebx
+ DB 102,15,22,68,123,8 ; movhpd 0x8(%ebx,%edi,2),%xmm0
+ DB 131,248,3 ; cmp $0x3,%eax
DB 15,130,24,254,255,255 ; jb 2cc5 <_sk_load_tables_u16_be_sse2+0x34>
- DB 243,15,126,76,120,16 ; movq 0x10(%eax,%edi,2),%xmm1
+ DB 243,15,126,76,123,16 ; movq 0x10(%ebx,%edi,2),%xmm1
DB 233,13,254,255,255 ; jmp 2cc5 <_sk_load_tables_u16_be_sse2+0x34>
PUBLIC _sk_load_tables_rgb_u16_be_sse2
@@ -47395,7 +47395,7 @@ _sk_load_tables_rgb_u16_be_sse2 LABEL PROC
DB 242,15,112,194,232 ; pshuflw $0xe8,%xmm2,%xmm0
DB 243,15,112,192,232 ; pshufhw $0xe8,%xmm0,%xmm0
DB 102,15,112,192,232 ; pshufd $0xe8,%xmm0,%xmm0
- DB 102,15,111,146,138,160,0,0 ; movdqa 0xa08a(%edx),%xmm2
+ DB 102,15,111,146,106,160,0,0 ; movdqa 0xa06a(%edx),%xmm2
DB 102,15,219,194 ; pand %xmm2,%xmm0
DB 102,15,239,219 ; pxor %xmm3,%xmm3
DB 102,15,97,195 ; punpcklwd %xmm3,%xmm0
@@ -47460,7 +47460,7 @@ _sk_load_tables_rgb_u16_be_sse2 LABEL PROC
DB 137,198 ; mov %eax,%esi
DB 141,70,8 ; lea 0x8(%esi),%eax
DB 131,236,8 ; sub $0x8,%esp
- DB 15,40,154,42,158,0,0 ; movaps 0x9e2a(%edx),%xmm3
+ DB 15,40,154,10,158,0,0 ; movaps 0x9e0a(%edx),%xmm3
DB 80 ; push %eax
DB 81 ; push %ecx
DB 255,86,4 ; call *0x4(%esi)
@@ -47501,7 +47501,7 @@ _sk_byte_tables_sse2 LABEL PROC
DB 90 ; pop %edx
DB 139,69,12 ; mov 0xc(%ebp),%eax
DB 139,8 ; mov (%eax),%ecx
- DB 15,40,162,205,156,0,0 ; movaps 0x9ccd(%edx),%xmm4
+ DB 15,40,162,173,156,0,0 ; movaps 0x9cad(%edx),%xmm4
DB 15,89,196 ; mulps %xmm4,%xmm0
DB 102,15,91,192 ; cvtps2dq %xmm0,%xmm0
DB 102,15,112,232,78 ; pshufd $0x4e,%xmm0,%xmm5
@@ -47523,7 +47523,7 @@ _sk_byte_tables_sse2 LABEL PROC
DB 102,15,110,192 ; movd %eax,%xmm0
DB 139,65,4 ; mov 0x4(%ecx),%eax
DB 102,15,196,195,1 ; pinsrw $0x1,%ebx,%xmm0
- DB 15,40,170,237,157,0,0 ; movaps 0x9ded(%edx),%xmm5
+ DB 15,40,170,205,157,0,0 ; movaps 0x9dcd(%edx),%xmm5
DB 15,89,204 ; mulps %xmm4,%xmm1
DB 102,15,91,201 ; cvtps2dq %xmm1,%xmm1
DB 102,15,112,241,78 ; pshufd $0x4e,%xmm1,%xmm6
@@ -47651,7 +47651,7 @@ _sk_byte_tables_rgb_sse2 LABEL PROC
DB 102,15,110,199 ; movd %edi,%xmm0
DB 139,121,4 ; mov 0x4(%ecx),%edi
DB 102,15,196,198,1 ; pinsrw $0x1,%esi,%xmm0
- DB 15,40,170,241,155,0,0 ; movaps 0x9bf1(%edx),%xmm5
+ DB 15,40,170,209,155,0,0 ; movaps 0x9bd1(%edx),%xmm5
DB 15,89,204 ; mulps %xmm4,%xmm1
DB 102,15,91,201 ; cvtps2dq %xmm1,%xmm1
DB 102,15,112,241,78 ; pshufd $0x4e,%xmm1,%xmm6
@@ -47897,15 +47897,15 @@ _sk_parametric_r_sse2 LABEL PROC
DB 15,198,237,0 ; shufps $0x0,%xmm5,%xmm5
DB 15,88,245 ; addps %xmm5,%xmm6
DB 15,91,238 ; cvtdq2ps %xmm6,%xmm5
- DB 15,89,170,177,153,0,0 ; mulps 0x99b1(%edx),%xmm5
- DB 15,84,178,193,153,0,0 ; andps 0x99c1(%edx),%xmm6
- DB 15,86,178,33,151,0,0 ; orps 0x9721(%edx),%xmm6
- DB 15,88,170,209,153,0,0 ; addps 0x99d1(%edx),%xmm5
- DB 15,40,186,225,153,0,0 ; movaps 0x99e1(%edx),%xmm7
+ DB 15,89,170,145,153,0,0 ; mulps 0x9991(%edx),%xmm5
+ DB 15,84,178,161,153,0,0 ; andps 0x99a1(%edx),%xmm6
+ DB 15,86,178,1,151,0,0 ; orps 0x9701(%edx),%xmm6
+ DB 15,88,170,177,153,0,0 ; addps 0x99b1(%edx),%xmm5
+ DB 15,40,186,193,153,0,0 ; movaps 0x99c1(%edx),%xmm7
DB 15,89,254 ; mulps %xmm6,%xmm7
DB 15,92,239 ; subps %xmm7,%xmm5
- DB 15,88,178,241,153,0,0 ; addps 0x99f1(%edx),%xmm6
- DB 15,40,186,1,154,0,0 ; movaps 0x9a01(%edx),%xmm7
+ DB 15,88,178,209,153,0,0 ; addps 0x99d1(%edx),%xmm6
+ DB 15,40,186,225,153,0,0 ; movaps 0x99e1(%edx),%xmm7
DB 15,94,254 ; divps %xmm6,%xmm7
DB 243,15,16,49 ; movss (%ecx),%xmm6
DB 15,198,246,0 ; shufps $0x0,%xmm6,%xmm6
@@ -47915,21 +47915,21 @@ _sk_parametric_r_sse2 LABEL PROC
DB 15,91,254 ; cvtdq2ps %xmm6,%xmm7
DB 15,40,197 ; movaps %xmm5,%xmm0
DB 15,194,199,1 ; cmpltps %xmm7,%xmm0
- DB 15,40,178,49,151,0,0 ; movaps 0x9731(%edx),%xmm6
+ DB 15,40,178,17,151,0,0 ; movaps 0x9711(%edx),%xmm6
DB 15,84,198 ; andps %xmm6,%xmm0
DB 15,92,248 ; subps %xmm0,%xmm7
DB 15,40,197 ; movaps %xmm5,%xmm0
DB 15,92,199 ; subps %xmm7,%xmm0
- DB 15,88,170,17,154,0,0 ; addps 0x9a11(%edx),%xmm5
- DB 15,40,186,33,154,0,0 ; movaps 0x9a21(%edx),%xmm7
+ DB 15,88,170,241,153,0,0 ; addps 0x99f1(%edx),%xmm5
+ DB 15,40,186,1,154,0,0 ; movaps 0x9a01(%edx),%xmm7
DB 15,89,248 ; mulps %xmm0,%xmm7
DB 15,92,239 ; subps %xmm7,%xmm5
- DB 15,40,186,49,154,0,0 ; movaps 0x9a31(%edx),%xmm7
+ DB 15,40,186,17,154,0,0 ; movaps 0x9a11(%edx),%xmm7
DB 15,92,248 ; subps %xmm0,%xmm7
- DB 15,40,130,65,154,0,0 ; movaps 0x9a41(%edx),%xmm0
+ DB 15,40,130,33,154,0,0 ; movaps 0x9a21(%edx),%xmm0
DB 15,94,199 ; divps %xmm7,%xmm0
DB 15,88,197 ; addps %xmm5,%xmm0
- DB 15,89,130,81,154,0,0 ; mulps 0x9a51(%edx),%xmm0
+ DB 15,89,130,49,154,0,0 ; mulps 0x9a31(%edx),%xmm0
DB 102,15,91,192 ; cvtps2dq %xmm0,%xmm0
DB 243,15,16,105,20 ; movss 0x14(%ecx),%xmm5
DB 15,198,237,0 ; shufps $0x0,%xmm5,%xmm5
@@ -47981,15 +47981,15 @@ _sk_parametric_g_sse2 LABEL PROC
DB 15,198,237,0 ; shufps $0x0,%xmm5,%xmm5
DB 15,88,245 ; addps %xmm5,%xmm6
DB 15,91,238 ; cvtdq2ps %xmm6,%xmm5
- DB 15,89,170,122,152,0,0 ; mulps 0x987a(%edx),%xmm5
- DB 15,84,178,138,152,0,0 ; andps 0x988a(%edx),%xmm6
- DB 15,86,178,234,149,0,0 ; orps 0x95ea(%edx),%xmm6
- DB 15,88,170,154,152,0,0 ; addps 0x989a(%edx),%xmm5
- DB 15,40,186,170,152,0,0 ; movaps 0x98aa(%edx),%xmm7
+ DB 15,89,170,90,152,0,0 ; mulps 0x985a(%edx),%xmm5
+ DB 15,84,178,106,152,0,0 ; andps 0x986a(%edx),%xmm6
+ DB 15,86,178,202,149,0,0 ; orps 0x95ca(%edx),%xmm6
+ DB 15,88,170,122,152,0,0 ; addps 0x987a(%edx),%xmm5
+ DB 15,40,186,138,152,0,0 ; movaps 0x988a(%edx),%xmm7
DB 15,89,254 ; mulps %xmm6,%xmm7
DB 15,92,239 ; subps %xmm7,%xmm5
- DB 15,88,178,186,152,0,0 ; addps 0x98ba(%edx),%xmm6
- DB 15,40,186,202,152,0,0 ; movaps 0x98ca(%edx),%xmm7
+ DB 15,88,178,154,152,0,0 ; addps 0x989a(%edx),%xmm6
+ DB 15,40,186,170,152,0,0 ; movaps 0x98aa(%edx),%xmm7
DB 15,94,254 ; divps %xmm6,%xmm7
DB 243,15,16,49 ; movss (%ecx),%xmm6
DB 15,198,246,0 ; shufps $0x0,%xmm6,%xmm6
@@ -47999,21 +47999,21 @@ _sk_parametric_g_sse2 LABEL PROC
DB 15,91,254 ; cvtdq2ps %xmm6,%xmm7
DB 15,40,197 ; movaps %xmm5,%xmm0
DB 15,194,199,1 ; cmpltps %xmm7,%xmm0
- DB 15,40,178,250,149,0,0 ; movaps 0x95fa(%edx),%xmm6
+ DB 15,40,178,218,149,0,0 ; movaps 0x95da(%edx),%xmm6
DB 15,84,198 ; andps %xmm6,%xmm0
DB 15,92,248 ; subps %xmm0,%xmm7
DB 15,40,197 ; movaps %xmm5,%xmm0
DB 15,92,199 ; subps %xmm7,%xmm0
- DB 15,88,170,218,152,0,0 ; addps 0x98da(%edx),%xmm5
- DB 15,40,186,234,152,0,0 ; movaps 0x98ea(%edx),%xmm7
+ DB 15,88,170,186,152,0,0 ; addps 0x98ba(%edx),%xmm5
+ DB 15,40,186,202,152,0,0 ; movaps 0x98ca(%edx),%xmm7
DB 15,89,248 ; mulps %xmm0,%xmm7
DB 15,92,239 ; subps %xmm7,%xmm5
- DB 15,40,186,250,152,0,0 ; movaps 0x98fa(%edx),%xmm7
+ DB 15,40,186,218,152,0,0 ; movaps 0x98da(%edx),%xmm7
DB 15,92,248 ; subps %xmm0,%xmm7
- DB 15,40,130,10,153,0,0 ; movaps 0x990a(%edx),%xmm0
+ DB 15,40,130,234,152,0,0 ; movaps 0x98ea(%edx),%xmm0
DB 15,94,199 ; divps %xmm7,%xmm0
DB 15,88,197 ; addps %xmm5,%xmm0
- DB 15,89,130,26,153,0,0 ; mulps 0x991a(%edx),%xmm0
+ DB 15,89,130,250,152,0,0 ; mulps 0x98fa(%edx),%xmm0
DB 102,15,91,192 ; cvtps2dq %xmm0,%xmm0
DB 243,15,16,105,20 ; movss 0x14(%ecx),%xmm5
DB 15,198,237,0 ; shufps $0x0,%xmm5,%xmm5
@@ -48064,15 +48064,15 @@ _sk_parametric_b_sse2 LABEL PROC
DB 15,198,237,0 ; shufps $0x0,%xmm5,%xmm5
DB 15,88,245 ; addps %xmm5,%xmm6
DB 15,91,238 ; cvtdq2ps %xmm6,%xmm5
- DB 15,89,170,70,151,0,0 ; mulps 0x9746(%edx),%xmm5
- DB 15,84,178,86,151,0,0 ; andps 0x9756(%edx),%xmm6
- DB 15,86,178,182,148,0,0 ; orps 0x94b6(%edx),%xmm6
- DB 15,88,170,102,151,0,0 ; addps 0x9766(%edx),%xmm5
- DB 15,40,186,118,151,0,0 ; movaps 0x9776(%edx),%xmm7
+ DB 15,89,170,38,151,0,0 ; mulps 0x9726(%edx),%xmm5
+ DB 15,84,178,54,151,0,0 ; andps 0x9736(%edx),%xmm6
+ DB 15,86,178,150,148,0,0 ; orps 0x9496(%edx),%xmm6
+ DB 15,88,170,70,151,0,0 ; addps 0x9746(%edx),%xmm5
+ DB 15,40,186,86,151,0,0 ; movaps 0x9756(%edx),%xmm7
DB 15,89,254 ; mulps %xmm6,%xmm7
DB 15,92,239 ; subps %xmm7,%xmm5
- DB 15,88,178,134,151,0,0 ; addps 0x9786(%edx),%xmm6
- DB 15,40,186,150,151,0,0 ; movaps 0x9796(%edx),%xmm7
+ DB 15,88,178,102,151,0,0 ; addps 0x9766(%edx),%xmm6
+ DB 15,40,186,118,151,0,0 ; movaps 0x9776(%edx),%xmm7
DB 15,94,254 ; divps %xmm6,%xmm7
DB 243,15,16,49 ; movss (%ecx),%xmm6
DB 15,198,246,0 ; shufps $0x0,%xmm6,%xmm6
@@ -48082,21 +48082,21 @@ _sk_parametric_b_sse2 LABEL PROC
DB 15,91,254 ; cvtdq2ps %xmm6,%xmm7
DB 15,40,197 ; movaps %xmm5,%xmm0
DB 15,194,199,1 ; cmpltps %xmm7,%xmm0
- DB 15,40,178,198,148,0,0 ; movaps 0x94c6(%edx),%xmm6
+ DB 15,40,178,166,148,0,0 ; movaps 0x94a6(%edx),%xmm6
DB 15,84,198 ; andps %xmm6,%xmm0
DB 15,92,248 ; subps %xmm0,%xmm7
DB 15,40,197 ; movaps %xmm5,%xmm0
DB 15,92,199 ; subps %xmm7,%xmm0
- DB 15,88,170,166,151,0,0 ; addps 0x97a6(%edx),%xmm5
- DB 15,40,186,182,151,0,0 ; movaps 0x97b6(%edx),%xmm7
+ DB 15,88,170,134,151,0,0 ; addps 0x9786(%edx),%xmm5
+ DB 15,40,186,150,151,0,0 ; movaps 0x9796(%edx),%xmm7
DB 15,89,248 ; mulps %xmm0,%xmm7
DB 15,92,239 ; subps %xmm7,%xmm5
- DB 15,40,186,198,151,0,0 ; movaps 0x97c6(%edx),%xmm7
+ DB 15,40,186,166,151,0,0 ; movaps 0x97a6(%edx),%xmm7
DB 15,92,248 ; subps %xmm0,%xmm7
- DB 15,40,130,214,151,0,0 ; movaps 0x97d6(%edx),%xmm0
+ DB 15,40,130,182,151,0,0 ; movaps 0x97b6(%edx),%xmm0
DB 15,94,199 ; divps %xmm7,%xmm0
DB 15,88,197 ; addps %xmm5,%xmm0
- DB 15,89,130,230,151,0,0 ; mulps 0x97e6(%edx),%xmm0
+ DB 15,89,130,198,151,0,0 ; mulps 0x97c6(%edx),%xmm0
DB 102,15,91,192 ; cvtps2dq %xmm0,%xmm0
DB 243,15,16,105,20 ; movss 0x14(%ecx),%xmm5
DB 15,198,237,0 ; shufps $0x0,%xmm5,%xmm5
@@ -48147,15 +48147,15 @@ _sk_parametric_a_sse2 LABEL PROC
DB 15,198,237,0 ; shufps $0x0,%xmm5,%xmm5
DB 15,88,245 ; addps %xmm5,%xmm6
DB 15,91,238 ; cvtdq2ps %xmm6,%xmm5
- DB 15,89,170,18,150,0,0 ; mulps 0x9612(%edx),%xmm5
- DB 15,84,178,34,150,0,0 ; andps 0x9622(%edx),%xmm6
- DB 15,86,178,130,147,0,0 ; orps 0x9382(%edx),%xmm6
- DB 15,88,170,50,150,0,0 ; addps 0x9632(%edx),%xmm5
- DB 15,40,186,66,150,0,0 ; movaps 0x9642(%edx),%xmm7
+ DB 15,89,170,242,149,0,0 ; mulps 0x95f2(%edx),%xmm5
+ DB 15,84,178,2,150,0,0 ; andps 0x9602(%edx),%xmm6
+ DB 15,86,178,98,147,0,0 ; orps 0x9362(%edx),%xmm6
+ DB 15,88,170,18,150,0,0 ; addps 0x9612(%edx),%xmm5
+ DB 15,40,186,34,150,0,0 ; movaps 0x9622(%edx),%xmm7
DB 15,89,254 ; mulps %xmm6,%xmm7
DB 15,92,239 ; subps %xmm7,%xmm5
- DB 15,88,178,82,150,0,0 ; addps 0x9652(%edx),%xmm6
- DB 15,40,186,98,150,0,0 ; movaps 0x9662(%edx),%xmm7
+ DB 15,88,178,50,150,0,0 ; addps 0x9632(%edx),%xmm6
+ DB 15,40,186,66,150,0,0 ; movaps 0x9642(%edx),%xmm7
DB 15,94,254 ; divps %xmm6,%xmm7
DB 243,15,16,49 ; movss (%ecx),%xmm6
DB 15,198,246,0 ; shufps $0x0,%xmm6,%xmm6
@@ -48165,21 +48165,21 @@ _sk_parametric_a_sse2 LABEL PROC
DB 15,91,254 ; cvtdq2ps %xmm6,%xmm7
DB 15,40,197 ; movaps %xmm5,%xmm0
DB 15,194,199,1 ; cmpltps %xmm7,%xmm0
- DB 15,40,178,146,147,0,0 ; movaps 0x9392(%edx),%xmm6
+ DB 15,40,178,114,147,0,0 ; movaps 0x9372(%edx),%xmm6
DB 15,84,198 ; andps %xmm6,%xmm0
DB 15,92,248 ; subps %xmm0,%xmm7
DB 15,40,197 ; movaps %xmm5,%xmm0
DB 15,92,199 ; subps %xmm7,%xmm0
- DB 15,88,170,114,150,0,0 ; addps 0x9672(%edx),%xmm5
- DB 15,40,186,130,150,0,0 ; movaps 0x9682(%edx),%xmm7
+ DB 15,88,170,82,150,0,0 ; addps 0x9652(%edx),%xmm5
+ DB 15,40,186,98,150,0,0 ; movaps 0x9662(%edx),%xmm7
DB 15,89,248 ; mulps %xmm0,%xmm7
DB 15,92,239 ; subps %xmm7,%xmm5
- DB 15,40,186,146,150,0,0 ; movaps 0x9692(%edx),%xmm7
+ DB 15,40,186,114,150,0,0 ; movaps 0x9672(%edx),%xmm7
DB 15,92,248 ; subps %xmm0,%xmm7
- DB 15,40,130,162,150,0,0 ; movaps 0x96a2(%edx),%xmm0
+ DB 15,40,130,130,150,0,0 ; movaps 0x9682(%edx),%xmm0
DB 15,94,199 ; divps %xmm7,%xmm0
DB 15,88,197 ; addps %xmm5,%xmm0
- DB 15,89,130,178,150,0,0 ; mulps 0x96b2(%edx),%xmm0
+ DB 15,89,130,146,150,0,0 ; mulps 0x9692(%edx),%xmm0
DB 102,15,91,192 ; cvtps2dq %xmm0,%xmm0
DB 243,15,16,105,20 ; movss 0x14(%ecx),%xmm5
DB 15,198,237,0 ; shufps $0x0,%xmm5,%xmm5
@@ -48212,15 +48212,15 @@ _sk_gamma_sse2 LABEL PROC
DB 232,0,0,0,0 ; call 3a8f <_sk_gamma_sse2+0x12>
DB 88 ; pop %eax
DB 15,91,195 ; cvtdq2ps %xmm3,%xmm0
- DB 15,89,128,225,148,0,0 ; mulps 0x94e1(%eax),%xmm0
- DB 15,84,152,241,148,0,0 ; andps 0x94f1(%eax),%xmm3
- DB 15,86,152,81,146,0,0 ; orps 0x9251(%eax),%xmm3
- DB 15,88,128,1,149,0,0 ; addps 0x9501(%eax),%xmm0
+ DB 15,89,128,193,148,0,0 ; mulps 0x94c1(%eax),%xmm0
+ DB 15,84,152,209,148,0,0 ; andps 0x94d1(%eax),%xmm3
+ DB 15,86,152,49,146,0,0 ; orps 0x9231(%eax),%xmm3
+ DB 15,88,128,225,148,0,0 ; addps 0x94e1(%eax),%xmm0
DB 15,40,227 ; movaps %xmm3,%xmm4
- DB 15,89,160,17,149,0,0 ; mulps 0x9511(%eax),%xmm4
+ DB 15,89,160,241,148,0,0 ; mulps 0x94f1(%eax),%xmm4
DB 15,92,196 ; subps %xmm4,%xmm0
- DB 15,88,152,33,149,0,0 ; addps 0x9521(%eax),%xmm3
- DB 15,40,160,49,149,0,0 ; movaps 0x9531(%eax),%xmm4
+ DB 15,88,152,1,149,0,0 ; addps 0x9501(%eax),%xmm3
+ DB 15,40,160,17,149,0,0 ; movaps 0x9511(%eax),%xmm4
DB 15,94,227 ; divps %xmm3,%xmm4
DB 15,92,196 ; subps %xmm4,%xmm0
DB 139,77,12 ; mov 0xc(%ebp),%ecx
@@ -48233,30 +48233,30 @@ _sk_gamma_sse2 LABEL PROC
DB 15,91,219 ; cvtdq2ps %xmm3,%xmm3
DB 15,40,224 ; movaps %xmm0,%xmm4
DB 15,194,227,1 ; cmpltps %xmm3,%xmm4
- DB 15,84,160,97,146,0,0 ; andps 0x9261(%eax),%xmm4
+ DB 15,84,160,65,146,0,0 ; andps 0x9241(%eax),%xmm4
DB 15,92,220 ; subps %xmm4,%xmm3
DB 15,40,224 ; movaps %xmm0,%xmm4
DB 15,92,227 ; subps %xmm3,%xmm4
- DB 15,88,128,65,149,0,0 ; addps 0x9541(%eax),%xmm0
- DB 15,40,176,97,149,0,0 ; movaps 0x9561(%eax),%xmm6
+ DB 15,88,128,33,149,0,0 ; addps 0x9521(%eax),%xmm0
+ DB 15,40,176,65,149,0,0 ; movaps 0x9541(%eax),%xmm6
DB 15,92,244 ; subps %xmm4,%xmm6
- DB 15,40,168,81,149,0,0 ; movaps 0x9551(%eax),%xmm5
+ DB 15,40,168,49,149,0,0 ; movaps 0x9531(%eax),%xmm5
DB 15,89,229 ; mulps %xmm5,%xmm4
DB 15,92,196 ; subps %xmm4,%xmm0
- DB 15,40,152,113,149,0,0 ; movaps 0x9571(%eax),%xmm3
+ DB 15,40,152,81,149,0,0 ; movaps 0x9551(%eax),%xmm3
DB 15,40,227 ; movaps %xmm3,%xmm4
DB 15,94,230 ; divps %xmm6,%xmm4
DB 15,88,224 ; addps %xmm0,%xmm4
DB 15,91,193 ; cvtdq2ps %xmm1,%xmm0
- DB 15,89,128,225,148,0,0 ; mulps 0x94e1(%eax),%xmm0
- DB 15,84,136,241,148,0,0 ; andps 0x94f1(%eax),%xmm1
- DB 15,86,136,81,146,0,0 ; orps 0x9251(%eax),%xmm1
- DB 15,88,128,1,149,0,0 ; addps 0x9501(%eax),%xmm0
+ DB 15,89,128,193,148,0,0 ; mulps 0x94c1(%eax),%xmm0
+ DB 15,84,136,209,148,0,0 ; andps 0x94d1(%eax),%xmm1
+ DB 15,86,136,49,146,0,0 ; orps 0x9231(%eax),%xmm1
+ DB 15,88,128,225,148,0,0 ; addps 0x94e1(%eax),%xmm0
DB 15,40,241 ; movaps %xmm1,%xmm6
- DB 15,89,176,17,149,0,0 ; mulps 0x9511(%eax),%xmm6
+ DB 15,89,176,241,148,0,0 ; mulps 0x94f1(%eax),%xmm6
DB 15,92,198 ; subps %xmm6,%xmm0
- DB 15,88,136,33,149,0,0 ; addps 0x9521(%eax),%xmm1
- DB 15,40,176,49,149,0,0 ; movaps 0x9531(%eax),%xmm6
+ DB 15,88,136,1,149,0,0 ; addps 0x9501(%eax),%xmm1
+ DB 15,40,176,17,149,0,0 ; movaps 0x9511(%eax),%xmm6
DB 15,94,241 ; divps %xmm1,%xmm6
DB 15,92,198 ; subps %xmm6,%xmm0
DB 15,89,199 ; mulps %xmm7,%xmm0
@@ -48264,12 +48264,12 @@ _sk_gamma_sse2 LABEL PROC
DB 15,91,201 ; cvtdq2ps %xmm1,%xmm1
DB 15,40,240 ; movaps %xmm0,%xmm6
DB 15,194,241,1 ; cmpltps %xmm1,%xmm6
- DB 15,84,176,97,146,0,0 ; andps 0x9261(%eax),%xmm6
+ DB 15,84,176,65,146,0,0 ; andps 0x9241(%eax),%xmm6
DB 15,92,206 ; subps %xmm6,%xmm1
DB 15,40,240 ; movaps %xmm0,%xmm6
DB 15,92,241 ; subps %xmm1,%xmm6
- DB 15,88,128,65,149,0,0 ; addps 0x9541(%eax),%xmm0
- DB 15,40,184,97,149,0,0 ; movaps 0x9561(%eax),%xmm7
+ DB 15,88,128,33,149,0,0 ; addps 0x9521(%eax),%xmm0
+ DB 15,40,184,65,149,0,0 ; movaps 0x9541(%eax),%xmm7
DB 15,92,254 ; subps %xmm6,%xmm7
DB 15,89,245 ; mulps %xmm5,%xmm6
DB 15,92,198 ; subps %xmm6,%xmm0
@@ -48277,15 +48277,15 @@ _sk_gamma_sse2 LABEL PROC
DB 15,94,207 ; divps %xmm7,%xmm1
DB 15,88,200 ; addps %xmm0,%xmm1
DB 15,91,194 ; cvtdq2ps %xmm2,%xmm0
- DB 15,89,128,225,148,0,0 ; mulps 0x94e1(%eax),%xmm0
- DB 15,84,144,241,148,0,0 ; andps 0x94f1(%eax),%xmm2
- DB 15,86,144,81,146,0,0 ; orps 0x9251(%eax),%xmm2
- DB 15,88,128,1,149,0,0 ; addps 0x9501(%eax),%xmm0
- DB 15,40,176,17,149,0,0 ; movaps 0x9511(%eax),%xmm6
+ DB 15,89,128,193,148,0,0 ; mulps 0x94c1(%eax),%xmm0
+ DB 15,84,144,209,148,0,0 ; andps 0x94d1(%eax),%xmm2
+ DB 15,86,144,49,146,0,0 ; orps 0x9231(%eax),%xmm2
+ DB 15,88,128,225,148,0,0 ; addps 0x94e1(%eax),%xmm0
+ DB 15,40,176,241,148,0,0 ; movaps 0x94f1(%eax),%xmm6
DB 15,89,242 ; mulps %xmm2,%xmm6
DB 15,92,198 ; subps %xmm6,%xmm0
- DB 15,88,144,33,149,0,0 ; addps 0x9521(%eax),%xmm2
- DB 15,40,176,49,149,0,0 ; movaps 0x9531(%eax),%xmm6
+ DB 15,88,144,1,149,0,0 ; addps 0x9501(%eax),%xmm2
+ DB 15,40,176,17,149,0,0 ; movaps 0x9511(%eax),%xmm6
DB 15,94,242 ; divps %xmm2,%xmm6
DB 15,92,198 ; subps %xmm6,%xmm0
DB 15,89,69,232 ; mulps -0x18(%ebp),%xmm0
@@ -48293,18 +48293,18 @@ _sk_gamma_sse2 LABEL PROC
DB 15,91,210 ; cvtdq2ps %xmm2,%xmm2
DB 15,40,240 ; movaps %xmm0,%xmm6
DB 15,194,242,1 ; cmpltps %xmm2,%xmm6
- DB 15,84,176,97,146,0,0 ; andps 0x9261(%eax),%xmm6
+ DB 15,84,176,65,146,0,0 ; andps 0x9241(%eax),%xmm6
DB 15,92,214 ; subps %xmm6,%xmm2
DB 15,40,240 ; movaps %xmm0,%xmm6
DB 15,92,242 ; subps %xmm2,%xmm6
- DB 15,88,128,65,149,0,0 ; addps 0x9541(%eax),%xmm0
+ DB 15,88,128,33,149,0,0 ; addps 0x9521(%eax),%xmm0
DB 15,89,238 ; mulps %xmm6,%xmm5
DB 15,92,197 ; subps %xmm5,%xmm0
- DB 15,40,144,97,149,0,0 ; movaps 0x9561(%eax),%xmm2
+ DB 15,40,144,65,149,0,0 ; movaps 0x9541(%eax),%xmm2
DB 15,92,214 ; subps %xmm6,%xmm2
DB 15,94,218 ; divps %xmm2,%xmm3
DB 15,88,216 ; addps %xmm0,%xmm3
- DB 15,40,128,129,149,0,0 ; movaps 0x9581(%eax),%xmm0
+ DB 15,40,128,97,149,0,0 ; movaps 0x9561(%eax),%xmm0
DB 15,89,224 ; mulps %xmm0,%xmm4
DB 15,89,200 ; mulps %xmm0,%xmm1
DB 15,89,216 ; mulps %xmm0,%xmm3
@@ -48331,29 +48331,29 @@ _sk_lab_to_xyz_sse2 LABEL PROC
DB 15,40,208 ; movaps %xmm0,%xmm2
DB 232,0,0,0,0 ; call 3c77 <_sk_lab_to_xyz_sse2+0x15>
DB 88 ; pop %eax
- DB 15,89,144,169,147,0,0 ; mulps 0x93a9(%eax),%xmm2
- DB 15,40,160,73,145,0,0 ; movaps 0x9149(%eax),%xmm4
+ DB 15,89,144,137,147,0,0 ; mulps 0x9389(%eax),%xmm2
+ DB 15,40,160,41,145,0,0 ; movaps 0x9129(%eax),%xmm4
DB 15,89,204 ; mulps %xmm4,%xmm1
- DB 15,40,168,185,147,0,0 ; movaps 0x93b9(%eax),%xmm5
+ DB 15,40,168,153,147,0,0 ; movaps 0x9399(%eax),%xmm5
DB 15,88,205 ; addps %xmm5,%xmm1
DB 15,89,220 ; mulps %xmm4,%xmm3
DB 15,88,221 ; addps %xmm5,%xmm3
- DB 15,88,144,201,147,0,0 ; addps 0x93c9(%eax),%xmm2
- DB 15,89,144,217,147,0,0 ; mulps 0x93d9(%eax),%xmm2
- DB 15,89,136,233,147,0,0 ; mulps 0x93e9(%eax),%xmm1
+ DB 15,88,144,169,147,0,0 ; addps 0x93a9(%eax),%xmm2
+ DB 15,89,144,185,147,0,0 ; mulps 0x93b9(%eax),%xmm2
+ DB 15,89,136,201,147,0,0 ; mulps 0x93c9(%eax),%xmm1
DB 15,88,202 ; addps %xmm2,%xmm1
- DB 15,89,152,249,147,0,0 ; mulps 0x93f9(%eax),%xmm3
+ DB 15,89,152,217,147,0,0 ; mulps 0x93d9(%eax),%xmm3
DB 15,40,234 ; movaps %xmm2,%xmm5
DB 15,92,235 ; subps %xmm3,%xmm5
DB 15,40,193 ; movaps %xmm1,%xmm0
DB 15,89,192 ; mulps %xmm0,%xmm0
DB 15,89,193 ; mulps %xmm1,%xmm0
- DB 15,40,152,9,148,0,0 ; movaps 0x9409(%eax),%xmm3
+ DB 15,40,152,233,147,0,0 ; movaps 0x93e9(%eax),%xmm3
DB 15,40,227 ; movaps %xmm3,%xmm4
DB 15,194,224,1 ; cmpltps %xmm0,%xmm4
- DB 15,40,176,25,148,0,0 ; movaps 0x9419(%eax),%xmm6
+ DB 15,40,176,249,147,0,0 ; movaps 0x93f9(%eax),%xmm6
DB 15,88,206 ; addps %xmm6,%xmm1
- DB 15,40,184,41,148,0,0 ; movaps 0x9429(%eax),%xmm7
+ DB 15,40,184,9,148,0,0 ; movaps 0x9409(%eax),%xmm7
DB 15,89,207 ; mulps %xmm7,%xmm1
DB 15,84,196 ; andps %xmm4,%xmm0
DB 15,85,225 ; andnps %xmm1,%xmm4
@@ -48378,8 +48378,8 @@ _sk_lab_to_xyz_sse2 LABEL PROC
DB 15,85,221 ; andnps %xmm5,%xmm3
DB 15,86,216 ; orps %xmm0,%xmm3
DB 139,77,12 ; mov 0xc(%ebp),%ecx
- DB 15,89,160,57,148,0,0 ; mulps 0x9439(%eax),%xmm4
- DB 15,89,152,73,148,0,0 ; mulps 0x9449(%eax),%xmm3
+ DB 15,89,160,25,148,0,0 ; mulps 0x9419(%eax),%xmm4
+ DB 15,89,152,41,148,0,0 ; mulps 0x9429(%eax),%xmm3
DB 141,65,4 ; lea 0x4(%ecx),%eax
DB 131,236,8 ; sub $0x8,%esp
DB 15,40,196 ; movaps %xmm4,%xmm0
@@ -48415,9 +48415,9 @@ _sk_load_a8_sse2 LABEL PROC
DB 102,15,110,4,62 ; movd (%esi,%edi,1),%xmm0
DB 102,15,96,192 ; punpcklbw %xmm0,%xmm0
DB 102,15,97,192 ; punpcklwd %xmm0,%xmm0
- DB 102,15,219,130,73,144,0,0 ; pand 0x9049(%edx),%xmm0
+ DB 102,15,219,130,41,144,0,0 ; pand 0x9029(%edx),%xmm0
DB 15,91,216 ; cvtdq2ps %xmm0,%xmm3
- DB 15,89,154,121,145,0,0 ; mulps 0x9179(%edx),%xmm3
+ DB 15,89,154,89,145,0,0 ; mulps 0x9159(%edx),%xmm3
DB 141,80,8 ; lea 0x8(%eax),%edx
DB 131,236,8 ; sub $0x8,%esp
DB 15,87,192 ; xorps %xmm0,%xmm0
@@ -48463,8 +48463,8 @@ _sk_load_a8_dst_sse2 LABEL PROC
DB 131,236,12 ; sub $0xc,%esp
DB 139,69,12 ; mov 0xc(%ebp),%eax
DB 139,77,8 ; mov 0x8(%ebp),%ecx
- DB 139,49 ; mov (%ecx),%esi
DB 139,16 ; mov (%eax),%edx
+ DB 139,49 ; mov (%ecx),%esi
DB 139,122,4 ; mov 0x4(%edx),%edi
DB 15,175,121,4 ; imul 0x4(%ecx),%edi
DB 3,58 ; add (%edx),%edi
@@ -48480,9 +48480,9 @@ _sk_load_a8_dst_sse2 LABEL PROC
DB 102,15,110,36,55 ; movd (%edi,%esi,1),%xmm4
DB 102,15,96,224 ; punpcklbw %xmm0,%xmm4
DB 102,15,97,224 ; punpcklwd %xmm0,%xmm4
- DB 102,15,219,162,117,143,0,0 ; pand 0x8f75(%edx),%xmm4
+ DB 102,15,219,162,85,143,0,0 ; pand 0x8f55(%edx),%xmm4
DB 15,91,228 ; cvtdq2ps %xmm4,%xmm4
- DB 15,89,162,165,144,0,0 ; mulps 0x90a5(%edx),%xmm4
+ DB 15,89,162,133,144,0,0 ; mulps 0x9085(%edx),%xmm4
DB 15,41,97,64 ; movaps %xmm4,0x40(%ecx)
DB 141,80,8 ; lea 0x8(%eax),%edx
DB 131,236,8 ; sub $0x8,%esp
@@ -48571,7 +48571,7 @@ _sk_gather_a8_sse2 LABEL PROC
DB 102,15,96,193 ; punpcklbw %xmm1,%xmm0
DB 102,15,97,193 ; punpcklwd %xmm1,%xmm0
DB 15,91,216 ; cvtdq2ps %xmm0,%xmm3
- DB 15,89,153,120,143,0,0 ; mulps 0x8f78(%ecx),%xmm3
+ DB 15,89,153,88,143,0,0 ; mulps 0x8f58(%ecx),%xmm3
DB 141,72,8 ; lea 0x8(%eax),%ecx
DB 131,236,8 ; sub $0x8,%esp
DB 15,87,192 ; xorps %xmm0,%xmm0
@@ -48603,7 +48603,7 @@ _sk_store_a8_sse2 LABEL PROC
DB 15,175,81,4 ; imul 0x4(%ecx),%edx
DB 3,23 ; add (%edi),%edx
DB 139,89,8 ; mov 0x8(%ecx),%ebx
- DB 15,40,166,20,142,0,0 ; movaps 0x8e14(%esi),%xmm4
+ DB 15,40,166,244,141,0,0 ; movaps 0x8df4(%esi),%xmm4
DB 15,89,227 ; mulps %xmm3,%xmm4
DB 102,15,91,228 ; cvtps2dq %xmm4,%xmm4
DB 102,15,114,244,16 ; pslld $0x10,%xmm4
@@ -48638,7 +48638,7 @@ _sk_store_a8_sse2 LABEL PROC
DB 102,15,197,220,4 ; pextrw $0x4,%xmm4,%ebx
DB 136,92,58,2 ; mov %bl,0x2(%edx,%edi,1)
DB 102,15,112,228,212 ; pshufd $0xd4,%xmm4,%xmm4
- DB 102,15,219,166,36,145,0,0 ; pand 0x9124(%esi),%xmm4
+ DB 102,15,219,166,4,145,0,0 ; pand 0x9104(%esi),%xmm4
DB 102,15,103,228 ; packuswb %xmm4,%xmm4
DB 102,15,103,228 ; packuswb %xmm4,%xmm4
DB 102,15,103,228 ; packuswb %xmm4,%xmm4
@@ -48672,12 +48672,12 @@ _sk_load_g8_sse2 LABEL PROC
DB 102,15,110,4,62 ; movd (%esi,%edi,1),%xmm0
DB 102,15,96,192 ; punpcklbw %xmm0,%xmm0
DB 102,15,97,192 ; punpcklwd %xmm0,%xmm0
- DB 102,15,219,130,82,141,0,0 ; pand 0x8d52(%edx),%xmm0
+ DB 102,15,219,130,50,141,0,0 ; pand 0x8d32(%edx),%xmm0
DB 15,91,192 ; cvtdq2ps %xmm0,%xmm0
- DB 15,89,130,130,142,0,0 ; mulps 0x8e82(%edx),%xmm0
+ DB 15,89,130,98,142,0,0 ; mulps 0x8e62(%edx),%xmm0
DB 141,112,8 ; lea 0x8(%eax),%esi
DB 131,236,8 ; sub $0x8,%esp
- DB 15,40,154,146,140,0,0 ; movaps 0x8c92(%edx),%xmm3
+ DB 15,40,154,114,140,0,0 ; movaps 0x8c72(%edx),%xmm3
DB 15,40,200 ; movaps %xmm0,%xmm1
DB 15,40,208 ; movaps %xmm0,%xmm2
DB 86 ; push %esi
@@ -48733,13 +48733,13 @@ _sk_load_g8_dst_sse2 LABEL PROC
DB 102,15,110,36,62 ; movd (%esi,%edi,1),%xmm4
DB 102,15,96,224 ; punpcklbw %xmm0,%xmm4
DB 102,15,97,224 ; punpcklwd %xmm0,%xmm4
- DB 102,15,219,162,166,140,0,0 ; pand 0x8ca6(%edx),%xmm4
+ DB 102,15,219,162,134,140,0,0 ; pand 0x8c86(%edx),%xmm4
DB 15,91,228 ; cvtdq2ps %xmm4,%xmm4
- DB 15,89,162,214,141,0,0 ; mulps 0x8dd6(%edx),%xmm4
+ DB 15,89,162,182,141,0,0 ; mulps 0x8db6(%edx),%xmm4
DB 15,41,97,48 ; movaps %xmm4,0x30(%ecx)
DB 15,41,97,32 ; movaps %xmm4,0x20(%ecx)
DB 15,41,97,16 ; movaps %xmm4,0x10(%ecx)
- DB 15,40,162,230,139,0,0 ; movaps 0x8be6(%edx),%xmm4
+ DB 15,40,162,198,139,0,0 ; movaps 0x8bc6(%edx),%xmm4
DB 15,41,97,64 ; movaps %xmm4,0x40(%ecx)
DB 141,80,8 ; lea 0x8(%eax),%edx
DB 131,236,8 ; sub $0x8,%esp
@@ -48829,10 +48829,10 @@ _sk_gather_g8_sse2 LABEL PROC
DB 102,15,96,193 ; punpcklbw %xmm1,%xmm0
DB 102,15,97,193 ; punpcklwd %xmm1,%xmm0
DB 15,91,192 ; cvtdq2ps %xmm0,%xmm0
- DB 15,89,129,127,140,0,0 ; mulps 0x8c7f(%ecx),%xmm0
+ DB 15,89,129,95,140,0,0 ; mulps 0x8c5f(%ecx),%xmm0
DB 141,80,8 ; lea 0x8(%eax),%edx
DB 131,236,8 ; sub $0x8,%esp
- DB 15,40,153,143,138,0,0 ; movaps 0x8a8f(%ecx),%xmm3
+ DB 15,40,153,111,138,0,0 ; movaps 0x8a6f(%ecx),%xmm3
DB 15,40,200 ; movaps %xmm0,%xmm1
DB 15,40,208 ; movaps %xmm0,%xmm2
DB 82 ; push %edx
@@ -48867,20 +48867,20 @@ _sk_load_565_sse2 LABEL PROC
DB 117,97 ; jne 432a <_sk_load_565_sse2+0x8c>
DB 243,15,126,20,126 ; movq (%esi,%edi,2),%xmm2
DB 102,15,97,208 ; punpcklwd %xmm0,%xmm2
- DB 102,15,111,130,68,140,0,0 ; movdqa 0x8c44(%edx),%xmm0
+ DB 102,15,111,130,36,140,0,0 ; movdqa 0x8c24(%edx),%xmm0
DB 102,15,219,194 ; pand %xmm2,%xmm0
DB 15,91,192 ; cvtdq2ps %xmm0,%xmm0
- DB 15,89,130,84,140,0,0 ; mulps 0x8c54(%edx),%xmm0
- DB 102,15,111,138,100,140,0,0 ; movdqa 0x8c64(%edx),%xmm1
+ DB 15,89,130,52,140,0,0 ; mulps 0x8c34(%edx),%xmm0
+ DB 102,15,111,138,68,140,0,0 ; movdqa 0x8c44(%edx),%xmm1
DB 102,15,219,202 ; pand %xmm2,%xmm1
DB 15,91,201 ; cvtdq2ps %xmm1,%xmm1
- DB 15,89,138,116,140,0,0 ; mulps 0x8c74(%edx),%xmm1
- DB 102,15,219,146,132,140,0,0 ; pand 0x8c84(%edx),%xmm2
+ DB 15,89,138,84,140,0,0 ; mulps 0x8c54(%edx),%xmm1
+ DB 102,15,219,146,100,140,0,0 ; pand 0x8c64(%edx),%xmm2
DB 15,91,210 ; cvtdq2ps %xmm2,%xmm2
- DB 15,89,146,148,140,0,0 ; mulps 0x8c94(%edx),%xmm2
+ DB 15,89,146,116,140,0,0 ; mulps 0x8c74(%edx),%xmm2
DB 141,112,8 ; lea 0x8(%eax),%esi
DB 131,236,8 ; sub $0x8,%esp
- DB 15,40,154,68,138,0,0 ; movaps 0x8a44(%edx),%xmm3
+ DB 15,40,154,36,138,0,0 ; movaps 0x8a24(%edx),%xmm3
DB 86 ; push %esi
DB 81 ; push %ecx
DB 255,80,4 ; call *0x4(%eax)
@@ -48932,21 +48932,21 @@ _sk_load_565_dst_sse2 LABEL PROC
DB 117,113 ; jne 440a <_sk_load_565_dst_sse2+0x9c>
DB 243,15,126,36,126 ; movq (%esi,%edi,2),%xmm4
DB 102,15,97,224 ; punpcklwd %xmm0,%xmm4
- DB 102,15,111,170,116,139,0,0 ; movdqa 0x8b74(%edx),%xmm5
+ DB 102,15,111,170,84,139,0,0 ; movdqa 0x8b54(%edx),%xmm5
DB 102,15,219,236 ; pand %xmm4,%xmm5
DB 15,91,237 ; cvtdq2ps %xmm5,%xmm5
- DB 15,89,170,132,139,0,0 ; mulps 0x8b84(%edx),%xmm5
+ DB 15,89,170,100,139,0,0 ; mulps 0x8b64(%edx),%xmm5
DB 15,41,105,16 ; movaps %xmm5,0x10(%ecx)
- DB 102,15,111,170,148,139,0,0 ; movdqa 0x8b94(%edx),%xmm5
+ DB 102,15,111,170,116,139,0,0 ; movdqa 0x8b74(%edx),%xmm5
DB 102,15,219,236 ; pand %xmm4,%xmm5
DB 15,91,237 ; cvtdq2ps %xmm5,%xmm5
- DB 15,89,170,164,139,0,0 ; mulps 0x8ba4(%edx),%xmm5
+ DB 15,89,170,132,139,0,0 ; mulps 0x8b84(%edx),%xmm5
DB 15,41,105,32 ; movaps %xmm5,0x20(%ecx)
- DB 102,15,219,162,180,139,0,0 ; pand 0x8bb4(%edx),%xmm4
+ DB 102,15,219,162,148,139,0,0 ; pand 0x8b94(%edx),%xmm4
DB 15,91,228 ; cvtdq2ps %xmm4,%xmm4
- DB 15,89,162,196,139,0,0 ; mulps 0x8bc4(%edx),%xmm4
+ DB 15,89,162,164,139,0,0 ; mulps 0x8ba4(%edx),%xmm4
DB 15,41,97,48 ; movaps %xmm4,0x30(%ecx)
- DB 15,40,162,116,137,0,0 ; movaps 0x8974(%edx),%xmm4
+ DB 15,40,162,84,137,0,0 ; movaps 0x8954(%edx),%xmm4
DB 15,41,97,64 ; movaps %xmm4,0x40(%ecx)
DB 141,80,8 ; lea 0x8(%eax),%edx
DB 131,236,8 ; sub $0x8,%esp
@@ -49029,20 +49029,20 @@ _sk_gather_565_sse2 LABEL PROC
DB 102,15,239,192 ; pxor %xmm0,%xmm0
DB 102,15,196,209,3 ; pinsrw $0x3,%ecx,%xmm2
DB 102,15,97,208 ; punpcklwd %xmm0,%xmm2
- DB 102,15,111,130,242,137,0,0 ; movdqa 0x89f2(%edx),%xmm0
+ DB 102,15,111,130,210,137,0,0 ; movdqa 0x89d2(%edx),%xmm0
DB 102,15,219,194 ; pand %xmm2,%xmm0
DB 15,91,192 ; cvtdq2ps %xmm0,%xmm0
- DB 15,89,130,2,138,0,0 ; mulps 0x8a02(%edx),%xmm0
- DB 102,15,111,138,18,138,0,0 ; movdqa 0x8a12(%edx),%xmm1
+ DB 15,89,130,226,137,0,0 ; mulps 0x89e2(%edx),%xmm0
+ DB 102,15,111,138,242,137,0,0 ; movdqa 0x89f2(%edx),%xmm1
DB 102,15,219,202 ; pand %xmm2,%xmm1
DB 15,91,201 ; cvtdq2ps %xmm1,%xmm1
- DB 15,89,138,34,138,0,0 ; mulps 0x8a22(%edx),%xmm1
- DB 102,15,219,146,50,138,0,0 ; pand 0x8a32(%edx),%xmm2
+ DB 15,89,138,2,138,0,0 ; mulps 0x8a02(%edx),%xmm1
+ DB 102,15,219,146,18,138,0,0 ; pand 0x8a12(%edx),%xmm2
DB 15,91,210 ; cvtdq2ps %xmm2,%xmm2
- DB 15,89,146,66,138,0,0 ; mulps 0x8a42(%edx),%xmm2
+ DB 15,89,146,34,138,0,0 ; mulps 0x8a22(%edx),%xmm2
DB 141,72,8 ; lea 0x8(%eax),%ecx
DB 131,236,8 ; sub $0x8,%esp
- DB 15,40,154,242,135,0,0 ; movaps 0x87f2(%edx),%xmm3
+ DB 15,40,154,210,135,0,0 ; movaps 0x87d2(%edx),%xmm3
DB 81 ; push %ecx
DB 255,117,8 ; pushl 0x8(%ebp)
DB 255,80,4 ; call *0x4(%eax)
@@ -49068,8 +49068,8 @@ _sk_store_565_sse2 LABEL PROC
DB 1,210 ; add %edx,%edx
DB 3,22 ; add (%esi),%edx
DB 139,49 ; mov (%ecx),%esi
- DB 15,40,167,111,139,0,0 ; movaps 0x8b6f(%edi),%xmm4
- DB 15,40,175,127,139,0,0 ; movaps 0x8b7f(%edi),%xmm5
+ DB 15,40,167,79,139,0,0 ; movaps 0x8b4f(%edi),%xmm4
+ DB 15,40,175,95,139,0,0 ; movaps 0x8b5f(%edi),%xmm5
DB 139,89,8 ; mov 0x8(%ecx),%ebx
DB 15,40,240 ; movaps %xmm0,%xmm6
DB 15,89,244 ; mulps %xmm4,%xmm6
@@ -49147,21 +49147,21 @@ _sk_load_4444_sse2 LABEL PROC
DB 117,112 ; jne 46e0 <_sk_load_4444_sse2+0x9b>
DB 243,15,126,28,126 ; movq (%esi,%edi,2),%xmm3
DB 102,15,97,216 ; punpcklwd %xmm0,%xmm3
- DB 102,15,111,130,173,138,0,0 ; movdqa 0x8aad(%edx),%xmm0
+ DB 102,15,111,130,141,138,0,0 ; movdqa 0x8a8d(%edx),%xmm0
DB 102,15,219,195 ; pand %xmm3,%xmm0
DB 15,91,192 ; cvtdq2ps %xmm0,%xmm0
- DB 15,89,130,189,138,0,0 ; mulps 0x8abd(%edx),%xmm0
- DB 102,15,111,138,205,138,0,0 ; movdqa 0x8acd(%edx),%xmm1
+ DB 15,89,130,157,138,0,0 ; mulps 0x8a9d(%edx),%xmm0
+ DB 102,15,111,138,173,138,0,0 ; movdqa 0x8aad(%edx),%xmm1
DB 102,15,219,203 ; pand %xmm3,%xmm1
DB 15,91,201 ; cvtdq2ps %xmm1,%xmm1
- DB 15,89,138,221,138,0,0 ; mulps 0x8add(%edx),%xmm1
- DB 102,15,111,146,237,138,0,0 ; movdqa 0x8aed(%edx),%xmm2
+ DB 15,89,138,189,138,0,0 ; mulps 0x8abd(%edx),%xmm1
+ DB 102,15,111,146,205,138,0,0 ; movdqa 0x8acd(%edx),%xmm2
DB 102,15,219,211 ; pand %xmm3,%xmm2
DB 15,91,210 ; cvtdq2ps %xmm2,%xmm2
- DB 15,89,146,253,138,0,0 ; mulps 0x8afd(%edx),%xmm2
- DB 102,15,219,154,13,139,0,0 ; pand 0x8b0d(%edx),%xmm3
+ DB 15,89,146,221,138,0,0 ; mulps 0x8add(%edx),%xmm2
+ DB 102,15,219,154,237,138,0,0 ; pand 0x8aed(%edx),%xmm3
DB 15,91,219 ; cvtdq2ps %xmm3,%xmm3
- DB 15,89,154,29,139,0,0 ; mulps 0x8b1d(%edx),%xmm3
+ DB 15,89,154,253,138,0,0 ; mulps 0x8afd(%edx),%xmm3
DB 141,80,8 ; lea 0x8(%eax),%edx
DB 131,236,8 ; sub $0x8,%esp
DB 82 ; push %edx
@@ -49215,24 +49215,24 @@ _sk_load_4444_dst_sse2 LABEL PROC
DB 15,133,128,0,0,0 ; jne 47d3 <_sk_load_4444_dst_sse2+0xaf>
DB 243,15,126,36,126 ; movq (%esi,%edi,2),%xmm4
DB 102,15,97,224 ; punpcklwd %xmm0,%xmm4
- DB 102,15,111,170,206,137,0,0 ; movdqa 0x89ce(%edx),%xmm5
+ DB 102,15,111,170,174,137,0,0 ; movdqa 0x89ae(%edx),%xmm5
DB 102,15,219,236 ; pand %xmm4,%xmm5
DB 15,91,237 ; cvtdq2ps %xmm5,%xmm5
- DB 15,89,170,222,137,0,0 ; mulps 0x89de(%edx),%xmm5
+ DB 15,89,170,190,137,0,0 ; mulps 0x89be(%edx),%xmm5
DB 15,41,105,16 ; movaps %xmm5,0x10(%ecx)
- DB 102,15,111,170,238,137,0,0 ; movdqa 0x89ee(%edx),%xmm5
+ DB 102,15,111,170,206,137,0,0 ; movdqa 0x89ce(%edx),%xmm5
DB 102,15,219,236 ; pand %xmm4,%xmm5
DB 15,91,237 ; cvtdq2ps %xmm5,%xmm5
- DB 15,89,170,254,137,0,0 ; mulps 0x89fe(%edx),%xmm5
+ DB 15,89,170,222,137,0,0 ; mulps 0x89de(%edx),%xmm5
DB 15,41,105,32 ; movaps %xmm5,0x20(%ecx)
- DB 102,15,111,170,14,138,0,0 ; movdqa 0x8a0e(%edx),%xmm5
+ DB 102,15,111,170,238,137,0,0 ; movdqa 0x89ee(%edx),%xmm5
DB 102,15,219,236 ; pand %xmm4,%xmm5
DB 15,91,237 ; cvtdq2ps %xmm5,%xmm5
- DB 15,89,170,30,138,0,0 ; mulps 0x8a1e(%edx),%xmm5
+ DB 15,89,170,254,137,0,0 ; mulps 0x89fe(%edx),%xmm5
DB 15,41,105,48 ; movaps %xmm5,0x30(%ecx)
- DB 102,15,219,162,46,138,0,0 ; pand 0x8a2e(%edx),%xmm4
+ DB 102,15,219,162,14,138,0,0 ; pand 0x8a0e(%edx),%xmm4
DB 15,91,228 ; cvtdq2ps %xmm4,%xmm4
- DB 15,89,162,62,138,0,0 ; mulps 0x8a3e(%edx),%xmm4
+ DB 15,89,162,30,138,0,0 ; mulps 0x8a1e(%edx),%xmm4
DB 15,41,97,64 ; movaps %xmm4,0x40(%ecx)
DB 141,80,8 ; lea 0x8(%eax),%edx
DB 131,236,8 ; sub $0x8,%esp
@@ -49315,21 +49315,21 @@ _sk_gather_4444_sse2 LABEL PROC
DB 89 ; pop %ecx
DB 102,15,239,192 ; pxor %xmm0,%xmm0
DB 102,15,97,216 ; punpcklwd %xmm0,%xmm3
- DB 102,15,111,129,48,136,0,0 ; movdqa 0x8830(%ecx),%xmm0
+ DB 102,15,111,129,16,136,0,0 ; movdqa 0x8810(%ecx),%xmm0
DB 102,15,219,195 ; pand %xmm3,%xmm0
DB 15,91,192 ; cvtdq2ps %xmm0,%xmm0
- DB 15,89,129,64,136,0,0 ; mulps 0x8840(%ecx),%xmm0
- DB 102,15,111,137,80,136,0,0 ; movdqa 0x8850(%ecx),%xmm1
+ DB 15,89,129,32,136,0,0 ; mulps 0x8820(%ecx),%xmm0
+ DB 102,15,111,137,48,136,0,0 ; movdqa 0x8830(%ecx),%xmm1
DB 102,15,219,203 ; pand %xmm3,%xmm1
DB 15,91,201 ; cvtdq2ps %xmm1,%xmm1
- DB 15,89,137,96,136,0,0 ; mulps 0x8860(%ecx),%xmm1
- DB 102,15,111,145,112,136,0,0 ; movdqa 0x8870(%ecx),%xmm2
+ DB 15,89,137,64,136,0,0 ; mulps 0x8840(%ecx),%xmm1
+ DB 102,15,111,145,80,136,0,0 ; movdqa 0x8850(%ecx),%xmm2
DB 102,15,219,211 ; pand %xmm3,%xmm2
DB 15,91,210 ; cvtdq2ps %xmm2,%xmm2
- DB 15,89,145,128,136,0,0 ; mulps 0x8880(%ecx),%xmm2
- DB 102,15,219,153,144,136,0,0 ; pand 0x8890(%ecx),%xmm3
+ DB 15,89,145,96,136,0,0 ; mulps 0x8860(%ecx),%xmm2
+ DB 102,15,219,153,112,136,0,0 ; pand 0x8870(%ecx),%xmm3
DB 15,91,219 ; cvtdq2ps %xmm3,%xmm3
- DB 15,89,153,160,136,0,0 ; mulps 0x88a0(%ecx),%xmm3
+ DB 15,89,153,128,136,0,0 ; mulps 0x8880(%ecx),%xmm3
DB 141,72,8 ; lea 0x8(%eax),%ecx
DB 131,236,8 ; sub $0x8,%esp
DB 81 ; push %ecx
@@ -49357,7 +49357,7 @@ _sk_store_4444_sse2 LABEL PROC
DB 1,210 ; add %edx,%edx
DB 3,22 ; add (%esi),%edx
DB 139,49 ; mov (%ecx),%esi
- DB 15,40,167,51,136,0,0 ; movaps 0x8833(%edi),%xmm4
+ DB 15,40,167,19,136,0,0 ; movaps 0x8813(%edi),%xmm4
DB 139,89,8 ; mov 0x8(%ecx),%ebx
DB 15,40,232 ; movaps %xmm0,%xmm5
DB 15,89,236 ; mulps %xmm4,%xmm5
@@ -49440,11 +49440,11 @@ _sk_load_8888_sse2 LABEL PROC
DB 139,57 ; mov (%ecx),%edi
DB 117,102 ; jne 4ac2 <_sk_load_8888_sse2+0x92>
DB 243,15,111,28,190 ; movdqu (%esi,%edi,4),%xmm3
- DB 102,15,111,146,114,131,0,0 ; movdqa 0x8372(%edx),%xmm2
+ DB 102,15,111,146,82,131,0,0 ; movdqa 0x8352(%edx),%xmm2
DB 102,15,111,195 ; movdqa %xmm3,%xmm0
DB 102,15,219,194 ; pand %xmm2,%xmm0
DB 15,91,192 ; cvtdq2ps %xmm0,%xmm0
- DB 15,40,162,162,132,0,0 ; movaps 0x84a2(%edx),%xmm4
+ DB 15,40,162,130,132,0,0 ; movaps 0x8482(%edx),%xmm4
DB 15,89,196 ; mulps %xmm4,%xmm0
DB 102,15,111,203 ; movdqa %xmm3,%xmm1
DB 102,15,114,209,8 ; psrld $0x8,%xmm1
@@ -49507,11 +49507,11 @@ _sk_load_8888_dst_sse2 LABEL PROC
DB 139,57 ; mov (%ecx),%edi
DB 117,118 ; jne 4b99 <_sk_load_8888_dst_sse2+0xa2>
DB 243,15,111,36,190 ; movdqu (%esi,%edi,4),%xmm4
- DB 102,15,111,170,171,130,0,0 ; movdqa 0x82ab(%edx),%xmm5
+ DB 102,15,111,170,139,130,0,0 ; movdqa 0x828b(%edx),%xmm5
DB 102,15,111,244 ; movdqa %xmm4,%xmm6
DB 102,15,219,245 ; pand %xmm5,%xmm6
DB 15,91,246 ; cvtdq2ps %xmm6,%xmm6
- DB 15,40,186,219,131,0,0 ; movaps 0x83db(%edx),%xmm7
+ DB 15,40,186,187,131,0,0 ; movaps 0x83bb(%edx),%xmm7
DB 15,89,247 ; mulps %xmm7,%xmm6
DB 15,41,113,16 ; movaps %xmm6,0x10(%ecx)
DB 102,15,111,244 ; movdqa %xmm4,%xmm6
@@ -49604,11 +49604,11 @@ _sk_gather_8888_sse2 LABEL PROC
DB 102,15,98,194 ; punpckldq %xmm2,%xmm0
DB 102,15,98,217 ; punpckldq %xmm1,%xmm3
DB 102,15,108,216 ; punpcklqdq %xmm0,%xmm3
- DB 102,15,111,145,56,129,0,0 ; movdqa 0x8138(%ecx),%xmm2
+ DB 102,15,111,145,24,129,0,0 ; movdqa 0x8118(%ecx),%xmm2
DB 102,15,111,195 ; movdqa %xmm3,%xmm0
DB 102,15,219,194 ; pand %xmm2,%xmm0
DB 15,91,192 ; cvtdq2ps %xmm0,%xmm0
- DB 15,40,161,104,130,0,0 ; movaps 0x8268(%ecx),%xmm4
+ DB 15,40,161,72,130,0,0 ; movaps 0x8248(%ecx),%xmm4
DB 15,89,196 ; mulps %xmm4,%xmm0
DB 102,15,111,203 ; movdqa %xmm3,%xmm1
DB 102,15,114,209,8 ; psrld $0x8,%xmm1
@@ -49650,7 +49650,7 @@ _sk_store_8888_sse2 LABEL PROC
DB 193,226,2 ; shl $0x2,%edx
DB 3,22 ; add (%esi),%edx
DB 139,49 ; mov (%ecx),%esi
- DB 15,40,167,205,128,0,0 ; movaps 0x80cd(%edi),%xmm4
+ DB 15,40,167,173,128,0,0 ; movaps 0x80ad(%edi),%xmm4
DB 139,89,8 ; mov 0x8(%ecx),%ebx
DB 15,40,232 ; movaps %xmm0,%xmm5
DB 15,89,236 ; mulps %xmm4,%xmm5
@@ -49719,11 +49719,11 @@ _sk_load_bgra_sse2 LABEL PROC
DB 139,57 ; mov (%ecx),%edi
DB 117,102 ; jne 4e2d <_sk_load_bgra_sse2+0x92>
DB 243,15,111,28,190 ; movdqu (%esi,%edi,4),%xmm3
- DB 102,15,111,130,7,128,0,0 ; movdqa 0x8007(%edx),%xmm0
+ DB 102,15,111,130,231,127,0,0 ; movdqa 0x7fe7(%edx),%xmm0
DB 102,15,111,203 ; movdqa %xmm3,%xmm1
DB 102,15,219,200 ; pand %xmm0,%xmm1
DB 15,91,209 ; cvtdq2ps %xmm1,%xmm2
- DB 15,40,162,55,129,0,0 ; movaps 0x8137(%edx),%xmm4
+ DB 15,40,162,23,129,0,0 ; movaps 0x8117(%edx),%xmm4
DB 15,89,212 ; mulps %xmm4,%xmm2
DB 102,15,111,203 ; movdqa %xmm3,%xmm1
DB 102,15,114,209,8 ; psrld $0x8,%xmm1
@@ -49786,11 +49786,11 @@ _sk_load_bgra_dst_sse2 LABEL PROC
DB 139,57 ; mov (%ecx),%edi
DB 117,118 ; jne 4f04 <_sk_load_bgra_dst_sse2+0xa2>
DB 243,15,111,36,190 ; movdqu (%esi,%edi,4),%xmm4
- DB 102,15,111,170,64,127,0,0 ; movdqa 0x7f40(%edx),%xmm5
+ DB 102,15,111,170,32,127,0,0 ; movdqa 0x7f20(%edx),%xmm5
DB 102,15,111,244 ; movdqa %xmm4,%xmm6
DB 102,15,219,245 ; pand %xmm5,%xmm6
DB 15,91,246 ; cvtdq2ps %xmm6,%xmm6
- DB 15,40,186,112,128,0,0 ; movaps 0x8070(%edx),%xmm7
+ DB 15,40,186,80,128,0,0 ; movaps 0x8050(%edx),%xmm7
DB 15,89,247 ; mulps %xmm7,%xmm6
DB 15,41,113,48 ; movaps %xmm6,0x30(%ecx)
DB 102,15,111,244 ; movdqa %xmm4,%xmm6
@@ -49883,11 +49883,11 @@ _sk_gather_bgra_sse2 LABEL PROC
DB 102,15,98,194 ; punpckldq %xmm2,%xmm0
DB 102,15,98,217 ; punpckldq %xmm1,%xmm3
DB 102,15,108,216 ; punpcklqdq %xmm0,%xmm3
- DB 102,15,111,129,205,125,0,0 ; movdqa 0x7dcd(%ecx),%xmm0
+ DB 102,15,111,129,173,125,0,0 ; movdqa 0x7dad(%ecx),%xmm0
DB 102,15,111,203 ; movdqa %xmm3,%xmm1
DB 102,15,219,200 ; pand %xmm0,%xmm1
DB 15,91,209 ; cvtdq2ps %xmm1,%xmm2
- DB 15,40,161,253,126,0,0 ; movaps 0x7efd(%ecx),%xmm4
+ DB 15,40,161,221,126,0,0 ; movaps 0x7edd(%ecx),%xmm4
DB 15,89,212 ; mulps %xmm4,%xmm2
DB 102,15,111,203 ; movdqa %xmm3,%xmm1
DB 102,15,114,209,8 ; psrld $0x8,%xmm1
@@ -49929,7 +49929,7 @@ _sk_store_bgra_sse2 LABEL PROC
DB 193,226,2 ; shl $0x2,%edx
DB 3,22 ; add (%esi),%edx
DB 139,49 ; mov (%ecx),%esi
- DB 15,40,167,98,125,0,0 ; movaps 0x7d62(%edi),%xmm4
+ DB 15,40,167,66,125,0,0 ; movaps 0x7d42(%edi),%xmm4
DB 139,89,8 ; mov 0x8(%ecx),%ebx
DB 15,40,234 ; movaps %xmm2,%xmm5
DB 15,89,236 ; mulps %xmm4,%xmm5
@@ -50026,11 +50026,11 @@ _sk_load_f16_sse2 LABEL PROC
DB 102,15,239,192 ; pxor %xmm0,%xmm0
DB 102,15,97,200 ; punpcklwd %xmm0,%xmm1
DB 102,15,239,210 ; pxor %xmm2,%xmm2
- DB 102,15,111,170,124,128,0,0 ; movdqa 0x807c(%edx),%xmm5
+ DB 102,15,111,170,92,128,0,0 ; movdqa 0x805c(%edx),%xmm5
DB 102,15,111,241 ; movdqa %xmm1,%xmm6
DB 102,15,219,245 ; pand %xmm5,%xmm6
- DB 102,15,219,138,140,128,0,0 ; pand 0x808c(%edx),%xmm1
- DB 102,15,111,130,156,128,0,0 ; movdqa 0x809c(%edx),%xmm0
+ DB 102,15,219,138,108,128,0,0 ; pand 0x806c(%edx),%xmm1
+ DB 102,15,111,130,124,128,0,0 ; movdqa 0x807c(%edx),%xmm0
DB 102,15,127,69,184 ; movdqa %xmm0,-0x48(%ebp)
DB 102,15,114,246,16 ; pslld $0x10,%xmm6
DB 102,15,111,216 ; movdqa %xmm0,%xmm3
@@ -50042,7 +50042,7 @@ _sk_load_f16_sse2 LABEL PROC
DB 102,15,239,255 ; pxor %xmm7,%xmm7
DB 102,15,111,212 ; movdqa %xmm4,%xmm2
DB 102,15,219,213 ; pand %xmm5,%xmm2
- DB 102,15,111,154,140,128,0,0 ; movdqa 0x808c(%edx),%xmm3
+ DB 102,15,111,154,108,128,0,0 ; movdqa 0x806c(%edx),%xmm3
DB 102,15,219,227 ; pand %xmm3,%xmm4
DB 102,15,114,242,16 ; pslld $0x10,%xmm2
DB 102,15,102,196 ; pcmpgtd %xmm4,%xmm0
@@ -50055,7 +50055,7 @@ _sk_load_f16_sse2 LABEL PROC
DB 102,15,219,253 ; pand %xmm5,%xmm7
DB 102,15,219,195 ; pand %xmm3,%xmm0
DB 102,15,114,247,16 ; pslld $0x10,%xmm7
- DB 102,15,111,146,156,128,0,0 ; movdqa 0x809c(%edx),%xmm2
+ DB 102,15,111,146,124,128,0,0 ; movdqa 0x807c(%edx),%xmm2
DB 102,15,102,208 ; pcmpgtd %xmm0,%xmm2
DB 102,15,114,240,13 ; pslld $0xd,%xmm0
DB 102,15,235,199 ; por %xmm7,%xmm0
@@ -50070,7 +50070,7 @@ _sk_load_f16_sse2 LABEL PROC
DB 102,15,127,93,184 ; movdqa %xmm3,-0x48(%ebp)
DB 102,15,114,247,13 ; pslld $0xd,%xmm7
DB 102,15,235,253 ; por %xmm5,%xmm7
- DB 102,15,111,154,172,128,0,0 ; movdqa 0x80ac(%edx),%xmm3
+ DB 102,15,111,154,140,128,0,0 ; movdqa 0x808c(%edx),%xmm3
DB 102,15,254,203 ; paddd %xmm3,%xmm1
DB 102,15,254,227 ; paddd %xmm3,%xmm4
DB 102,15,254,195 ; paddd %xmm3,%xmm0
@@ -50157,18 +50157,18 @@ _sk_load_f16_dst_sse2 LABEL PROC
DB 102,15,126,85,232 ; movd %xmm2,-0x18(%ebp)
DB 102,15,239,210 ; pxor %xmm2,%xmm2
DB 102,15,97,202 ; punpcklwd %xmm2,%xmm1
- DB 102,15,111,186,95,126,0,0 ; movdqa 0x7e5f(%edx),%xmm7
+ DB 102,15,111,186,63,126,0,0 ; movdqa 0x7e3f(%edx),%xmm7
DB 102,15,111,209 ; movdqa %xmm1,%xmm2
DB 102,15,219,215 ; pand %xmm7,%xmm2
- DB 102,15,111,154,111,126,0,0 ; movdqa 0x7e6f(%edx),%xmm3
+ DB 102,15,111,154,79,126,0,0 ; movdqa 0x7e4f(%edx),%xmm3
DB 102,15,219,203 ; pand %xmm3,%xmm1
- DB 102,15,111,162,127,126,0,0 ; movdqa 0x7e7f(%edx),%xmm4
+ DB 102,15,111,162,95,126,0,0 ; movdqa 0x7e5f(%edx),%xmm4
DB 102,15,114,242,16 ; pslld $0x10,%xmm2
DB 102,15,111,236 ; movdqa %xmm4,%xmm5
DB 102,15,102,233 ; pcmpgtd %xmm1,%xmm5
DB 102,15,114,241,13 ; pslld $0xd,%xmm1
DB 102,15,235,202 ; por %xmm2,%xmm1
- DB 102,15,111,146,143,126,0,0 ; movdqa 0x7e8f(%edx),%xmm2
+ DB 102,15,111,146,111,126,0,0 ; movdqa 0x7e6f(%edx),%xmm2
DB 102,15,127,85,184 ; movdqa %xmm2,-0x48(%ebp)
DB 102,15,254,202 ; paddd %xmm2,%xmm1
DB 102,15,223,233 ; pandn %xmm1,%xmm5
@@ -50312,11 +50312,11 @@ _sk_gather_f16_sse2 LABEL PROC
DB 102,15,126,69,248 ; movd %xmm0,-0x8(%ebp)
DB 102,15,97,206 ; punpcklwd %xmm6,%xmm1
DB 102,15,239,210 ; pxor %xmm2,%xmm2
- DB 102,15,111,177,195,123,0,0 ; movdqa 0x7bc3(%ecx),%xmm6
+ DB 102,15,111,177,163,123,0,0 ; movdqa 0x7ba3(%ecx),%xmm6
DB 102,15,111,225 ; movdqa %xmm1,%xmm4
DB 102,15,219,230 ; pand %xmm6,%xmm4
- DB 102,15,219,137,211,123,0,0 ; pand 0x7bd3(%ecx),%xmm1
- DB 102,15,111,129,227,123,0,0 ; movdqa 0x7be3(%ecx),%xmm0
+ DB 102,15,219,137,179,123,0,0 ; pand 0x7bb3(%ecx),%xmm1
+ DB 102,15,111,129,195,123,0,0 ; movdqa 0x7bc3(%ecx),%xmm0
DB 102,15,114,244,16 ; pslld $0x10,%xmm4
DB 102,15,111,216 ; movdqa %xmm0,%xmm3
DB 102,15,102,217 ; pcmpgtd %xmm1,%xmm3
@@ -50327,7 +50327,7 @@ _sk_gather_f16_sse2 LABEL PROC
DB 102,15,239,255 ; pxor %xmm7,%xmm7
DB 102,15,111,213 ; movdqa %xmm5,%xmm2
DB 102,15,219,214 ; pand %xmm6,%xmm2
- DB 102,15,111,153,211,123,0,0 ; movdqa 0x7bd3(%ecx),%xmm3
+ DB 102,15,111,153,179,123,0,0 ; movdqa 0x7bb3(%ecx),%xmm3
DB 102,15,219,235 ; pand %xmm3,%xmm5
DB 102,15,114,242,16 ; pslld $0x10,%xmm2
DB 102,15,111,224 ; movdqa %xmm0,%xmm4
@@ -50341,7 +50341,7 @@ _sk_gather_f16_sse2 LABEL PROC
DB 102,15,219,254 ; pand %xmm6,%xmm7
DB 102,15,219,195 ; pand %xmm3,%xmm0
DB 102,15,114,247,16 ; pslld $0x10,%xmm7
- DB 102,15,111,145,227,123,0,0 ; movdqa 0x7be3(%ecx),%xmm2
+ DB 102,15,111,145,195,123,0,0 ; movdqa 0x7bc3(%ecx),%xmm2
DB 102,15,111,218 ; movdqa %xmm2,%xmm3
DB 102,15,102,216 ; pcmpgtd %xmm0,%xmm3
DB 102,15,114,240,13 ; pslld $0xd,%xmm0
@@ -50350,12 +50350,12 @@ _sk_gather_f16_sse2 LABEL PROC
DB 102,15,239,228 ; pxor %xmm4,%xmm4
DB 102,15,97,252 ; punpcklwd %xmm4,%xmm7
DB 102,15,219,247 ; pand %xmm7,%xmm6
- DB 102,15,219,185,211,123,0,0 ; pand 0x7bd3(%ecx),%xmm7
+ DB 102,15,219,185,179,123,0,0 ; pand 0x7bb3(%ecx),%xmm7
DB 102,15,114,246,16 ; pslld $0x10,%xmm6
DB 102,15,102,215 ; pcmpgtd %xmm7,%xmm2
DB 102,15,114,247,13 ; pslld $0xd,%xmm7
DB 102,15,235,254 ; por %xmm6,%xmm7
- DB 102,15,111,161,243,123,0,0 ; movdqa 0x7bf3(%ecx),%xmm4
+ DB 102,15,111,161,211,123,0,0 ; movdqa 0x7bd3(%ecx),%xmm4
DB 102,15,254,204 ; paddd %xmm4,%xmm1
DB 102,15,254,236 ; paddd %xmm4,%xmm5
DB 102,15,254,196 ; paddd %xmm4,%xmm0
@@ -50392,22 +50392,22 @@ _sk_store_f16_sse2 LABEL PROC
DB 102,15,111,209 ; movdqa %xmm1,%xmm2
DB 232,0,0,0,0 ; call 5791 <_sk_store_f16_sse2+0x19>
DB 88 ; pop %eax
- DB 102,15,111,152,63,122,0,0 ; movdqa 0x7a3f(%eax),%xmm3
+ DB 102,15,111,152,31,122,0,0 ; movdqa 0x7a1f(%eax),%xmm3
DB 102,15,111,224 ; movdqa %xmm0,%xmm4
DB 102,15,219,227 ; pand %xmm3,%xmm4
- DB 102,15,111,136,111,122,0,0 ; movdqa 0x7a6f(%eax),%xmm1
+ DB 102,15,111,136,79,122,0,0 ; movdqa 0x7a4f(%eax),%xmm1
DB 102,15,127,77,232 ; movdqa %xmm1,-0x18(%ebp)
DB 102,15,111,240 ; movdqa %xmm0,%xmm6
DB 102,15,114,246,3 ; pslld $0x3,%xmm6
DB 102,15,219,241 ; pand %xmm1,%xmm6
DB 102,15,254,244 ; paddd %xmm4,%xmm6
- DB 102,15,111,184,79,122,0,0 ; movdqa 0x7a4f(%eax),%xmm7
+ DB 102,15,111,184,47,122,0,0 ; movdqa 0x7a2f(%eax),%xmm7
DB 102,15,127,69,168 ; movdqa %xmm0,-0x58(%ebp)
DB 102,15,219,199 ; pand %xmm7,%xmm0
- DB 102,15,111,168,95,122,0,0 ; movdqa 0x7a5f(%eax),%xmm5
+ DB 102,15,111,168,63,122,0,0 ; movdqa 0x7a3f(%eax),%xmm5
DB 102,15,111,205 ; movdqa %xmm5,%xmm1
DB 102,15,102,200 ; pcmpgtd %xmm0,%xmm1
- DB 102,15,111,128,239,118,0,0 ; movdqa 0x76ef(%eax),%xmm0
+ DB 102,15,111,128,207,118,0,0 ; movdqa 0x76cf(%eax),%xmm0
DB 102,15,127,69,216 ; movdqa %xmm0,-0x28(%ebp)
DB 102,15,254,240 ; paddd %xmm0,%xmm6
DB 102,15,114,230,16 ; psrad $0x10,%xmm6
@@ -50459,8 +50459,8 @@ _sk_store_f16_sse2 LABEL PROC
DB 102,15,97,245 ; punpcklwd %xmm5,%xmm6
DB 139,69,12 ; mov 0xc(%ebp),%eax
DB 139,77,8 ; mov 0x8(%ebp),%ecx
- DB 139,17 ; mov (%ecx),%edx
DB 139,56 ; mov (%eax),%edi
+ DB 139,17 ; mov (%ecx),%edx
DB 139,119,4 ; mov 0x4(%edi),%esi
DB 15,175,113,4 ; imul 0x4(%ecx),%esi
DB 193,230,3 ; shl $0x3,%esi
@@ -50507,8 +50507,8 @@ _sk_load_u16_be_sse2 LABEL PROC
DB 131,236,44 ; sub $0x2c,%esp
DB 139,69,12 ; mov 0xc(%ebp),%eax
DB 139,77,8 ; mov 0x8(%ebp),%ecx
- DB 139,49 ; mov (%ecx),%esi
DB 139,16 ; mov (%eax),%edx
+ DB 139,49 ; mov (%ecx),%esi
DB 139,122,4 ; mov 0x4(%edx),%edi
DB 15,175,121,4 ; imul 0x4(%ecx),%edi
DB 1,255 ; add %edi,%edi
@@ -50539,7 +50539,7 @@ _sk_load_u16_be_sse2 LABEL PROC
DB 102,15,239,219 ; pxor %xmm3,%xmm3
DB 102,15,97,195 ; punpcklwd %xmm3,%xmm0
DB 15,91,192 ; cvtdq2ps %xmm0,%xmm0
- DB 15,40,162,2,118,0,0 ; movaps 0x7602(%edx),%xmm4
+ DB 15,40,162,226,117,0,0 ; movaps 0x75e2(%edx),%xmm4
DB 15,89,196 ; mulps %xmm4,%xmm0
DB 102,15,111,205 ; movdqa %xmm5,%xmm1
DB 102,15,113,241,8 ; psllw $0x8,%xmm1
@@ -50606,8 +50606,8 @@ _sk_load_rgb_u16_be_sse2 LABEL PROC
DB 131,236,28 ; sub $0x1c,%esp
DB 139,69,12 ; mov 0xc(%ebp),%eax
DB 139,77,8 ; mov 0x8(%ebp),%ecx
- DB 139,121,8 ; mov 0x8(%ecx),%edi
DB 139,16 ; mov (%eax),%edx
+ DB 139,121,8 ; mov 0x8(%ecx),%edi
DB 139,114,4 ; mov 0x4(%edx),%esi
DB 15,175,113,4 ; imul 0x4(%ecx),%esi
DB 1,246 ; add %esi,%esi
@@ -50641,7 +50641,7 @@ _sk_load_rgb_u16_be_sse2 LABEL PROC
DB 102,15,239,219 ; pxor %xmm3,%xmm3
DB 102,15,97,195 ; punpcklwd %xmm3,%xmm0
DB 15,91,192 ; cvtdq2ps %xmm0,%xmm0
- DB 15,40,170,155,116,0,0 ; movaps 0x749b(%edx),%xmm5
+ DB 15,40,170,123,116,0,0 ; movaps 0x747b(%edx),%xmm5
DB 15,89,197 ; mulps %xmm5,%xmm0
DB 102,15,111,204 ; movdqa %xmm4,%xmm1
DB 102,15,113,241,8 ; psllw $0x8,%xmm1
@@ -50667,7 +50667,7 @@ _sk_load_rgb_u16_be_sse2 LABEL PROC
DB 15,89,213 ; mulps %xmm5,%xmm2
DB 141,112,8 ; lea 0x8(%eax),%esi
DB 131,236,8 ; sub $0x8,%esp
- DB 15,40,154,43,114,0,0 ; movaps 0x722b(%edx),%xmm3
+ DB 15,40,154,11,114,0,0 ; movaps 0x720b(%edx),%xmm3
DB 86 ; push %esi
DB 81 ; push %ecx
DB 255,80,4 ; call *0x4(%eax)
@@ -50712,7 +50712,7 @@ _sk_store_u16_be_sse2 LABEL PROC
DB 1,210 ; add %edx,%edx
DB 3,22 ; add (%esi),%edx
DB 139,49 ; mov (%ecx),%esi
- DB 15,40,183,247,117,0,0 ; movaps 0x75f7(%edi),%xmm6
+ DB 15,40,183,215,117,0,0 ; movaps 0x75d7(%edi),%xmm6
DB 139,121,8 ; mov 0x8(%ecx),%edi
DB 193,230,2 ; shl $0x2,%esi
DB 15,40,224 ; movaps %xmm0,%xmm4
@@ -50791,8 +50791,8 @@ _sk_load_f32_sse2 LABEL PROC
DB 86 ; push %esi
DB 139,69,12 ; mov 0xc(%ebp),%eax
DB 139,77,8 ; mov 0x8(%ebp),%ecx
- DB 139,57 ; mov (%ecx),%edi
DB 139,48 ; mov (%eax),%esi
+ DB 139,57 ; mov (%ecx),%edi
DB 139,86,4 ; mov 0x4(%esi),%edx
DB 15,175,81,4 ; imul 0x4(%ecx),%edx
DB 193,226,2 ; shl $0x2,%edx
@@ -50853,8 +50853,8 @@ _sk_load_f32_dst_sse2 LABEL PROC
DB 15,41,85,232 ; movaps %xmm2,-0x18(%ebp)
DB 139,69,12 ; mov 0xc(%ebp),%eax
DB 139,77,8 ; mov 0x8(%ebp),%ecx
- DB 139,57 ; mov (%ecx),%edi
DB 139,48 ; mov (%eax),%esi
+ DB 139,57 ; mov (%ecx),%edi
DB 139,86,4 ; mov 0x4(%esi),%edx
DB 15,175,81,4 ; imul 0x4(%ecx),%edx
DB 193,226,2 ; shl $0x2,%edx
@@ -50920,8 +50920,8 @@ _sk_store_f32_sse2 LABEL PROC
DB 131,236,12 ; sub $0xc,%esp
DB 139,69,12 ; mov 0xc(%ebp),%eax
DB 139,77,8 ; mov 0x8(%ebp),%ecx
- DB 139,25 ; mov (%ecx),%ebx
DB 139,48 ; mov (%eax),%esi
+ DB 139,25 ; mov (%ecx),%ebx
DB 139,86,4 ; mov 0x4(%esi),%edx
DB 15,175,81,4 ; imul 0x4(%ecx),%edx
DB 193,226,2 ; shl $0x2,%edx
@@ -50984,7 +50984,7 @@ _sk_repeat_x_sse2 LABEL PROC
DB 243,15,91,245 ; cvttps2dq %xmm5,%xmm6
DB 15,91,246 ; cvtdq2ps %xmm6,%xmm6
DB 15,194,238,1 ; cmpltps %xmm6,%xmm5
- DB 15,84,168,179,109,0,0 ; andps 0x6db3(%eax),%xmm5
+ DB 15,84,168,147,109,0,0 ; andps 0x6d93(%eax),%xmm5
DB 15,92,245 ; subps %xmm5,%xmm6
DB 15,198,228,0 ; shufps $0x0,%xmm4,%xmm4
DB 15,89,230 ; mulps %xmm6,%xmm4
@@ -51014,7 +51014,7 @@ _sk_repeat_y_sse2 LABEL PROC
DB 243,15,91,245 ; cvttps2dq %xmm5,%xmm6
DB 15,91,246 ; cvtdq2ps %xmm6,%xmm6
DB 15,194,238,1 ; cmpltps %xmm6,%xmm5
- DB 15,84,168,97,109,0,0 ; andps 0x6d61(%eax),%xmm5
+ DB 15,84,168,65,109,0,0 ; andps 0x6d41(%eax),%xmm5
DB 15,92,245 ; subps %xmm5,%xmm6
DB 15,198,228,0 ; shufps $0x0,%xmm4,%xmm4
DB 15,89,230 ; mulps %xmm6,%xmm4
@@ -51042,13 +51042,13 @@ _sk_mirror_x_sse2 LABEL PROC
DB 15,40,244 ; movaps %xmm4,%xmm6
DB 15,198,246,0 ; shufps $0x0,%xmm6,%xmm6
DB 15,92,198 ; subps %xmm6,%xmm0
- DB 243,15,89,169,159,116,0,0 ; mulss 0x749f(%ecx),%xmm5
+ DB 243,15,89,169,127,116,0,0 ; mulss 0x747f(%ecx),%xmm5
DB 15,198,237,0 ; shufps $0x0,%xmm5,%xmm5
DB 15,89,232 ; mulps %xmm0,%xmm5
DB 243,15,91,253 ; cvttps2dq %xmm5,%xmm7
DB 15,91,255 ; cvtdq2ps %xmm7,%xmm7
DB 15,194,239,1 ; cmpltps %xmm7,%xmm5
- DB 15,84,169,15,109,0,0 ; andps 0x6d0f(%ecx),%xmm5
+ DB 15,84,169,239,108,0,0 ; andps 0x6cef(%ecx),%xmm5
DB 15,92,253 ; subps %xmm5,%xmm7
DB 243,15,88,228 ; addss %xmm4,%xmm4
DB 15,198,228,0 ; shufps $0x0,%xmm4,%xmm4
@@ -51081,13 +51081,13 @@ _sk_mirror_y_sse2 LABEL PROC
DB 15,40,244 ; movaps %xmm4,%xmm6
DB 15,198,246,0 ; shufps $0x0,%xmm6,%xmm6
DB 15,92,206 ; subps %xmm6,%xmm1
- DB 243,15,89,169,43,116,0,0 ; mulss 0x742b(%ecx),%xmm5
+ DB 243,15,89,169,11,116,0,0 ; mulss 0x740b(%ecx),%xmm5
DB 15,198,237,0 ; shufps $0x0,%xmm5,%xmm5
DB 15,89,233 ; mulps %xmm1,%xmm5
DB 243,15,91,253 ; cvttps2dq %xmm5,%xmm7
DB 15,91,255 ; cvtdq2ps %xmm7,%xmm7
DB 15,194,239,1 ; cmpltps %xmm7,%xmm5
- DB 15,84,169,155,108,0,0 ; andps 0x6c9b(%ecx),%xmm5
+ DB 15,84,169,123,108,0,0 ; andps 0x6c7b(%ecx),%xmm5
DB 15,92,253 ; subps %xmm5,%xmm7
DB 243,15,88,228 ; addss %xmm4,%xmm4
DB 15,198,228,0 ; shufps $0x0,%xmm4,%xmm4
@@ -51116,7 +51116,7 @@ _sk_clamp_x_1_sse2 LABEL PROC
DB 139,77,12 ; mov 0xc(%ebp),%ecx
DB 15,87,228 ; xorps %xmm4,%xmm4
DB 15,95,224 ; maxps %xmm0,%xmm4
- DB 15,93,160,39,108,0,0 ; minps 0x6c27(%eax),%xmm4
+ DB 15,93,160,7,108,0,0 ; minps 0x6c07(%eax),%xmm4
DB 141,65,4 ; lea 0x4(%ecx),%eax
DB 131,236,8 ; sub $0x8,%esp
DB 15,40,196 ; movaps %xmm4,%xmm0
@@ -51139,7 +51139,7 @@ _sk_repeat_x_1_sse2 LABEL PROC
DB 15,91,228 ; cvtdq2ps %xmm4,%xmm4
DB 15,40,232 ; movaps %xmm0,%xmm5
DB 15,194,236,1 ; cmpltps %xmm4,%xmm5
- DB 15,84,168,247,107,0,0 ; andps 0x6bf7(%eax),%xmm5
+ DB 15,84,168,215,107,0,0 ; andps 0x6bd7(%eax),%xmm5
DB 15,92,229 ; subps %xmm5,%xmm4
DB 15,92,196 ; subps %xmm4,%xmm0
DB 141,65,4 ; lea 0x4(%ecx),%eax
@@ -51159,14 +51159,14 @@ _sk_mirror_x_1_sse2 LABEL PROC
DB 232,0,0,0,0 ; call 6134 <_sk_mirror_x_1_sse2+0xb>
DB 89 ; pop %ecx
DB 139,69,12 ; mov 0xc(%ebp),%eax
- DB 15,40,161,44,108,0,0 ; movaps 0x6c2c(%ecx),%xmm4
+ DB 15,40,161,12,108,0,0 ; movaps 0x6c0c(%ecx),%xmm4
DB 15,88,196 ; addps %xmm4,%xmm0
- DB 15,40,169,172,107,0,0 ; movaps 0x6bac(%ecx),%xmm5
+ DB 15,40,169,140,107,0,0 ; movaps 0x6b8c(%ecx),%xmm5
DB 15,89,232 ; mulps %xmm0,%xmm5
DB 243,15,91,245 ; cvttps2dq %xmm5,%xmm6
DB 15,91,246 ; cvtdq2ps %xmm6,%xmm6
DB 15,194,238,1 ; cmpltps %xmm6,%xmm5
- DB 15,84,169,188,107,0,0 ; andps 0x6bbc(%ecx),%xmm5
+ DB 15,84,169,156,107,0,0 ; andps 0x6b9c(%ecx),%xmm5
DB 15,87,255 ; xorps %xmm7,%xmm7
DB 15,92,245 ; subps %xmm5,%xmm6
DB 15,88,246 ; addps %xmm6,%xmm6
@@ -51192,10 +51192,10 @@ _sk_luminance_to_alpha_sse2 LABEL PROC
DB 232,0,0,0,0 ; call 6192 <_sk_luminance_to_alpha_sse2+0xe>
DB 88 ; pop %eax
DB 139,77,12 ; mov 0xc(%ebp),%ecx
- DB 15,89,128,142,112,0,0 ; mulps 0x708e(%eax),%xmm0
- DB 15,89,136,158,112,0,0 ; mulps 0x709e(%eax),%xmm1
+ DB 15,89,128,110,112,0,0 ; mulps 0x706e(%eax),%xmm0
+ DB 15,89,136,126,112,0,0 ; mulps 0x707e(%eax),%xmm1
DB 15,88,200 ; addps %xmm0,%xmm1
- DB 15,89,152,174,112,0,0 ; mulps 0x70ae(%eax),%xmm3
+ DB 15,89,152,142,112,0,0 ; mulps 0x708e(%eax),%xmm3
DB 15,88,217 ; addps %xmm1,%xmm3
DB 141,65,4 ; lea 0x4(%ecx),%eax
DB 131,236,8 ; sub $0x8,%esp
@@ -51363,13 +51363,12 @@ _sk_matrix_4x5_sse2 LABEL PROC
DB 137,229 ; mov %esp,%ebp
DB 131,236,8 ; sub $0x8,%esp
DB 15,40,233 ; movaps %xmm1,%xmm5
+ DB 15,40,224 ; movaps %xmm0,%xmm4
DB 139,69,12 ; mov 0xc(%ebp),%eax
- DB 141,72,4 ; lea 0x4(%eax),%ecx
- DB 137,77,252 ; mov %ecx,-0x4(%ebp)
DB 139,8 ; mov (%eax),%ecx
- DB 243,15,16,33 ; movss (%ecx),%xmm4
+ DB 243,15,16,1 ; movss (%ecx),%xmm0
DB 243,15,16,73,4 ; movss 0x4(%ecx),%xmm1
- DB 15,198,228,0 ; shufps $0x0,%xmm4,%xmm4
+ DB 15,198,192,0 ; shufps $0x0,%xmm0,%xmm0
DB 243,15,16,113,48 ; movss 0x30(%ecx),%xmm6
DB 15,198,246,0 ; shufps $0x0,%xmm6,%xmm6
DB 243,15,16,121,64 ; movss 0x40(%ecx),%xmm7
@@ -51384,8 +51383,8 @@ _sk_matrix_4x5_sse2 LABEL PROC
DB 15,198,246,0 ; shufps $0x0,%xmm6,%xmm6
DB 15,89,245 ; mulps %xmm5,%xmm6
DB 15,88,247 ; addps %xmm7,%xmm6
- DB 15,89,224 ; mulps %xmm0,%xmm4
- DB 15,88,230 ; addps %xmm6,%xmm4
+ DB 15,89,196 ; mulps %xmm4,%xmm0
+ DB 15,88,198 ; addps %xmm6,%xmm0
DB 15,198,201,0 ; shufps $0x0,%xmm1,%xmm1
DB 243,15,16,113,52 ; movss 0x34(%ecx),%xmm6
DB 15,198,246,0 ; shufps $0x0,%xmm6,%xmm6
@@ -51401,7 +51400,7 @@ _sk_matrix_4x5_sse2 LABEL PROC
DB 15,198,246,0 ; shufps $0x0,%xmm6,%xmm6
DB 15,89,245 ; mulps %xmm5,%xmm6
DB 15,88,247 ; addps %xmm7,%xmm6
- DB 15,89,200 ; mulps %xmm0,%xmm1
+ DB 15,89,204 ; mulps %xmm4,%xmm1
DB 15,88,206 ; addps %xmm6,%xmm1
DB 243,15,16,113,56 ; movss 0x38(%ecx),%xmm6
DB 15,198,246,0 ; shufps $0x0,%xmm6,%xmm6
@@ -51419,7 +51418,7 @@ _sk_matrix_4x5_sse2 LABEL PROC
DB 15,88,247 ; addps %xmm7,%xmm6
DB 243,15,16,121,8 ; movss 0x8(%ecx),%xmm7
DB 15,198,255,0 ; shufps $0x0,%xmm7,%xmm7
- DB 15,89,248 ; mulps %xmm0,%xmm7
+ DB 15,89,252 ; mulps %xmm4,%xmm7
DB 15,88,254 ; addps %xmm6,%xmm7
DB 243,15,16,113,60 ; movss 0x3c(%ecx),%xmm6
DB 15,198,246,0 ; shufps $0x0,%xmm6,%xmm6
@@ -51437,15 +51436,13 @@ _sk_matrix_4x5_sse2 LABEL PROC
DB 15,88,211 ; addps %xmm3,%xmm2
DB 243,15,16,89,12 ; movss 0xc(%ecx),%xmm3
DB 15,198,219,0 ; shufps $0x0,%xmm3,%xmm3
- DB 15,89,216 ; mulps %xmm0,%xmm3
+ DB 15,89,220 ; mulps %xmm4,%xmm3
DB 15,88,218 ; addps %xmm2,%xmm3
- DB 139,77,8 ; mov 0x8(%ebp),%ecx
- DB 141,80,8 ; lea 0x8(%eax),%edx
+ DB 141,72,8 ; lea 0x8(%eax),%ecx
DB 131,236,8 ; sub $0x8,%esp
- DB 15,40,196 ; movaps %xmm4,%xmm0
DB 15,40,215 ; movaps %xmm7,%xmm2
- DB 82 ; push %edx
DB 81 ; push %ecx
+ DB 255,117,8 ; pushl 0x8(%ebp)
DB 255,80,4 ; call *0x4(%eax)
DB 131,196,24 ; add $0x18,%esp
DB 93 ; pop %ebp
@@ -51569,23 +51566,21 @@ _sk_evenly_spaced_gradient_sse2 LABEL PROC
DB 86 ; push %esi
DB 131,236,60 ; sub $0x3c,%esp
DB 15,41,69,184 ; movaps %xmm0,-0x48(%ebp)
- DB 232,0,0,0,0 ; call 662f <_sk_evenly_spaced_gradient_sse2+0x12>
+ DB 232,0,0,0,0 ; call 6628 <_sk_evenly_spaced_gradient_sse2+0x12>
DB 90 ; pop %edx
- DB 139,77,12 ; mov 0xc(%ebp),%ecx
- DB 141,65,4 ; lea 0x4(%ecx),%eax
- DB 137,69,240 ; mov %eax,-0x10(%ebp)
- DB 139,9 ; mov (%ecx),%ecx
+ DB 139,69,12 ; mov 0xc(%ebp),%eax
+ DB 139,8 ; mov (%eax),%ecx
DB 139,49 ; mov (%ecx),%esi
DB 139,65,4 ; mov 0x4(%ecx),%eax
DB 78 ; dec %esi
DB 102,15,110,206 ; movd %esi,%xmm1
DB 102,15,112,201,0 ; pshufd $0x0,%xmm1,%xmm1
- DB 102,15,111,146,33,108,0,0 ; movdqa 0x6c21(%edx),%xmm2
+ DB 102,15,111,146,8,108,0,0 ; movdqa 0x6c08(%edx),%xmm2
DB 102,15,219,209 ; pand %xmm1,%xmm2
- DB 102,15,235,146,225,105,0,0 ; por 0x69e1(%edx),%xmm2
+ DB 102,15,235,146,200,105,0,0 ; por 0x69c8(%edx),%xmm2
DB 102,15,114,209,16 ; psrld $0x10,%xmm1
- DB 102,15,235,138,49,108,0,0 ; por 0x6c31(%edx),%xmm1
- DB 15,88,138,65,108,0,0 ; addps 0x6c41(%edx),%xmm1
+ DB 102,15,235,138,24,108,0,0 ; por 0x6c18(%edx),%xmm1
+ DB 15,88,138,40,108,0,0 ; addps 0x6c28(%edx),%xmm1
DB 15,88,202 ; addps %xmm2,%xmm1
DB 15,89,200 ; mulps %xmm0,%xmm1
DB 243,15,91,201 ; cvttps2dq %xmm1,%xmm1
@@ -51670,14 +51665,13 @@ _sk_evenly_spaced_gradient_sse2 LABEL PROC
DB 15,88,215 ; addps %xmm7,%xmm2
DB 15,89,221 ; mulps %xmm5,%xmm3
DB 15,88,216 ; addps %xmm0,%xmm3
- DB 139,69,8 ; mov 0x8(%ebp),%eax
- DB 139,85,12 ; mov 0xc(%ebp),%edx
- DB 141,74,8 ; lea 0x8(%edx),%ecx
+ DB 139,77,12 ; mov 0xc(%ebp),%ecx
+ DB 141,65,8 ; lea 0x8(%ecx),%eax
DB 131,236,8 ; sub $0x8,%esp
DB 15,40,196 ; movaps %xmm4,%xmm0
- DB 81 ; push %ecx
DB 80 ; push %eax
- DB 255,82,4 ; call *0x4(%edx)
+ DB 255,117,8 ; pushl 0x8(%ebp)
+ DB 255,81,4 ; call *0x4(%ecx)
DB 131,196,76 ; add $0x4c,%esp
DB 94 ; pop %esi
DB 95 ; pop %edi
@@ -51690,18 +51684,18 @@ _sk_gauss_a_to_rgba_sse2 LABEL PROC
DB 85 ; push %ebp
DB 137,229 ; mov %esp,%ebp
DB 131,236,8 ; sub $0x8,%esp
- DB 232,0,0,0,0 ; call 67ef <_sk_gauss_a_to_rgba_sse2+0xb>
+ DB 232,0,0,0,0 ; call 67e1 <_sk_gauss_a_to_rgba_sse2+0xb>
DB 88 ; pop %eax
DB 139,77,12 ; mov 0xc(%ebp),%ecx
- DB 15,40,128,145,106,0,0 ; movaps 0x6a91(%eax),%xmm0
+ DB 15,40,128,127,106,0,0 ; movaps 0x6a7f(%eax),%xmm0
DB 15,89,195 ; mulps %xmm3,%xmm0
- DB 15,88,128,161,106,0,0 ; addps 0x6aa1(%eax),%xmm0
+ DB 15,88,128,143,106,0,0 ; addps 0x6a8f(%eax),%xmm0
DB 15,89,195 ; mulps %xmm3,%xmm0
- DB 15,88,128,177,106,0,0 ; addps 0x6ab1(%eax),%xmm0
+ DB 15,88,128,159,106,0,0 ; addps 0x6a9f(%eax),%xmm0
DB 15,89,195 ; mulps %xmm3,%xmm0
- DB 15,88,128,193,106,0,0 ; addps 0x6ac1(%eax),%xmm0
+ DB 15,88,128,175,106,0,0 ; addps 0x6aaf(%eax),%xmm0
DB 15,89,195 ; mulps %xmm3,%xmm0
- DB 15,88,128,209,106,0,0 ; addps 0x6ad1(%eax),%xmm0
+ DB 15,88,128,191,106,0,0 ; addps 0x6abf(%eax),%xmm0
DB 141,65,4 ; lea 0x4(%ecx),%eax
DB 131,236,8 ; sub $0x8,%esp
DB 15,40,200 ; movaps %xmm0,%xmm1
@@ -51722,16 +51716,14 @@ _sk_gradient_sse2 LABEL PROC
DB 87 ; push %edi
DB 86 ; push %esi
DB 131,236,60 ; sub $0x3c,%esp
- DB 139,77,12 ; mov 0xc(%ebp),%ecx
- DB 141,81,4 ; lea 0x4(%ecx),%edx
- DB 137,85,240 ; mov %edx,-0x10(%ebp)
- DB 139,9 ; mov (%ecx),%ecx
- DB 139,17 ; mov (%ecx),%edx
+ DB 139,69,12 ; mov 0xc(%ebp),%eax
+ DB 139,16 ; mov (%eax),%edx
+ DB 139,10 ; mov (%edx),%ecx
DB 102,15,239,201 ; pxor %xmm1,%xmm1
- DB 131,250,2 ; cmp $0x2,%edx
- DB 114,33 ; jb 687c <_sk_gradient_sse2+0x40>
- DB 139,113,36 ; mov 0x24(%ecx),%esi
- DB 74 ; dec %edx
+ DB 131,249,2 ; cmp $0x2,%ecx
+ DB 114,33 ; jb 6868 <_sk_gradient_sse2+0x3a>
+ DB 139,114,36 ; mov 0x24(%edx),%esi
+ DB 73 ; dec %ecx
DB 131,198,4 ; add $0x4,%esi
DB 102,15,239,201 ; pxor %xmm1,%xmm1
DB 243,15,16,22 ; movss (%esi),%xmm2
@@ -51739,80 +51731,80 @@ _sk_gradient_sse2 LABEL PROC
DB 15,194,208,2 ; cmpleps %xmm0,%xmm2
DB 102,15,250,202 ; psubd %xmm2,%xmm1
DB 131,198,4 ; add $0x4,%esi
- DB 74 ; dec %edx
- DB 117,234 ; jne 6866 <_sk_gradient_sse2+0x2a>
- DB 102,15,126,202 ; movd %xmm1,%edx
+ DB 73 ; dec %ecx
+ DB 117,234 ; jne 6852 <_sk_gradient_sse2+0x24>
+ DB 102,15,126,206 ; movd %xmm1,%esi
DB 102,15,112,209,229 ; pshufd $0xe5,%xmm1,%xmm2
DB 102,15,112,217,78 ; pshufd $0x4e,%xmm1,%xmm3
- DB 102,15,126,222 ; movd %xmm3,%esi
+ DB 102,15,126,223 ; movd %xmm3,%edi
DB 102,15,112,201,231 ; pshufd $0xe7,%xmm1,%xmm1
- DB 102,15,126,207 ; movd %xmm1,%edi
- DB 139,65,4 ; mov 0x4(%ecx),%eax
- DB 243,15,16,12,184 ; movss (%eax,%edi,4),%xmm1
- DB 243,15,16,28,176 ; movss (%eax,%esi,4),%xmm3
- DB 243,15,16,36,144 ; movss (%eax,%edx,4),%xmm4
- DB 102,15,126,211 ; movd %xmm2,%ebx
- DB 243,15,16,20,152 ; movss (%eax,%ebx,4),%xmm2
+ DB 102,15,126,203 ; movd %xmm1,%ebx
+ DB 139,66,4 ; mov 0x4(%edx),%eax
+ DB 243,15,16,12,152 ; movss (%eax,%ebx,4),%xmm1
+ DB 243,15,16,28,184 ; movss (%eax,%edi,4),%xmm3
+ DB 243,15,16,36,176 ; movss (%eax,%esi,4),%xmm4
+ DB 102,15,126,209 ; movd %xmm2,%ecx
+ DB 243,15,16,20,136 ; movss (%eax,%ecx,4),%xmm2
DB 15,20,217 ; unpcklps %xmm1,%xmm3
- DB 139,65,20 ; mov 0x14(%ecx),%eax
- DB 243,15,16,12,184 ; movss (%eax,%edi,4),%xmm1
- DB 243,15,16,52,176 ; movss (%eax,%esi,4),%xmm6
- DB 243,15,16,44,144 ; movss (%eax,%edx,4),%xmm5
- DB 243,15,16,60,152 ; movss (%eax,%ebx,4),%xmm7
+ DB 139,66,20 ; mov 0x14(%edx),%eax
+ DB 243,15,16,12,152 ; movss (%eax,%ebx,4),%xmm1
+ DB 243,15,16,52,184 ; movss (%eax,%edi,4),%xmm6
+ DB 243,15,16,44,176 ; movss (%eax,%esi,4),%xmm5
+ DB 243,15,16,60,136 ; movss (%eax,%ecx,4),%xmm7
DB 15,20,226 ; unpcklps %xmm2,%xmm4
DB 102,15,20,227 ; unpcklpd %xmm3,%xmm4
DB 102,15,41,101,184 ; movapd %xmm4,-0x48(%ebp)
DB 15,20,241 ; unpcklps %xmm1,%xmm6
DB 15,20,239 ; unpcklps %xmm7,%xmm5
- DB 139,65,8 ; mov 0x8(%ecx),%eax
- DB 243,15,16,20,184 ; movss (%eax,%edi,4),%xmm2
- DB 243,15,16,28,176 ; movss (%eax,%esi,4),%xmm3
- DB 243,15,16,12,144 ; movss (%eax,%edx,4),%xmm1
- DB 243,15,16,60,152 ; movss (%eax,%ebx,4),%xmm7
+ DB 139,66,8 ; mov 0x8(%edx),%eax
+ DB 243,15,16,20,152 ; movss (%eax,%ebx,4),%xmm2
+ DB 243,15,16,28,184 ; movss (%eax,%edi,4),%xmm3
+ DB 243,15,16,12,176 ; movss (%eax,%esi,4),%xmm1
+ DB 243,15,16,60,136 ; movss (%eax,%ecx,4),%xmm7
DB 102,15,20,238 ; unpcklpd %xmm6,%xmm5
DB 102,15,41,109,200 ; movapd %xmm5,-0x38(%ebp)
DB 15,20,218 ; unpcklps %xmm2,%xmm3
DB 15,20,207 ; unpcklps %xmm7,%xmm1
DB 102,15,20,203 ; unpcklpd %xmm3,%xmm1
- DB 139,65,24 ; mov 0x18(%ecx),%eax
- DB 243,15,16,20,184 ; movss (%eax,%edi,4),%xmm2
- DB 243,15,16,28,176 ; movss (%eax,%esi,4),%xmm3
- DB 243,15,16,36,144 ; movss (%eax,%edx,4),%xmm4
- DB 243,15,16,60,152 ; movss (%eax,%ebx,4),%xmm7
+ DB 139,66,24 ; mov 0x18(%edx),%eax
+ DB 243,15,16,20,152 ; movss (%eax,%ebx,4),%xmm2
+ DB 243,15,16,28,184 ; movss (%eax,%edi,4),%xmm3
+ DB 243,15,16,36,176 ; movss (%eax,%esi,4),%xmm4
+ DB 243,15,16,60,136 ; movss (%eax,%ecx,4),%xmm7
DB 15,20,218 ; unpcklps %xmm2,%xmm3
DB 15,20,231 ; unpcklps %xmm7,%xmm4
DB 102,15,20,227 ; unpcklpd %xmm3,%xmm4
DB 102,15,41,101,216 ; movapd %xmm4,-0x28(%ebp)
- DB 139,65,12 ; mov 0xc(%ecx),%eax
- DB 243,15,16,20,184 ; movss (%eax,%edi,4),%xmm2
- DB 243,15,16,28,176 ; movss (%eax,%esi,4),%xmm3
+ DB 139,66,12 ; mov 0xc(%edx),%eax
+ DB 243,15,16,20,152 ; movss (%eax,%ebx,4),%xmm2
+ DB 243,15,16,28,184 ; movss (%eax,%edi,4),%xmm3
DB 15,20,218 ; unpcklps %xmm2,%xmm3
- DB 243,15,16,20,144 ; movss (%eax,%edx,4),%xmm2
- DB 243,15,16,60,152 ; movss (%eax,%ebx,4),%xmm7
+ DB 243,15,16,20,176 ; movss (%eax,%esi,4),%xmm2
+ DB 243,15,16,60,136 ; movss (%eax,%ecx,4),%xmm7
DB 15,20,215 ; unpcklps %xmm7,%xmm2
DB 102,15,20,211 ; unpcklpd %xmm3,%xmm2
- DB 139,65,28 ; mov 0x1c(%ecx),%eax
- DB 243,15,16,60,184 ; movss (%eax,%edi,4),%xmm7
- DB 243,15,16,28,176 ; movss (%eax,%esi,4),%xmm3
+ DB 139,66,28 ; mov 0x1c(%edx),%eax
+ DB 243,15,16,60,152 ; movss (%eax,%ebx,4),%xmm7
+ DB 243,15,16,28,184 ; movss (%eax,%edi,4),%xmm3
DB 15,20,223 ; unpcklps %xmm7,%xmm3
- DB 243,15,16,60,144 ; movss (%eax,%edx,4),%xmm7
- DB 243,15,16,44,152 ; movss (%eax,%ebx,4),%xmm5
+ DB 243,15,16,60,176 ; movss (%eax,%esi,4),%xmm7
+ DB 243,15,16,44,136 ; movss (%eax,%ecx,4),%xmm5
DB 15,20,253 ; unpcklps %xmm5,%xmm7
DB 102,15,20,251 ; unpcklpd %xmm3,%xmm7
- DB 139,65,16 ; mov 0x10(%ecx),%eax
- DB 243,15,16,28,184 ; movss (%eax,%edi,4),%xmm3
- DB 243,15,16,44,176 ; movss (%eax,%esi,4),%xmm5
+ DB 139,66,16 ; mov 0x10(%edx),%eax
+ DB 243,15,16,28,152 ; movss (%eax,%ebx,4),%xmm3
+ DB 243,15,16,44,184 ; movss (%eax,%edi,4),%xmm5
DB 15,20,235 ; unpcklps %xmm3,%xmm5
- DB 243,15,16,28,144 ; movss (%eax,%edx,4),%xmm3
- DB 243,15,16,52,152 ; movss (%eax,%ebx,4),%xmm6
+ DB 243,15,16,28,176 ; movss (%eax,%esi,4),%xmm3
+ DB 243,15,16,52,136 ; movss (%eax,%ecx,4),%xmm6
DB 15,20,222 ; unpcklps %xmm6,%xmm3
DB 102,15,20,221 ; unpcklpd %xmm5,%xmm3
- DB 139,65,32 ; mov 0x20(%ecx),%eax
- DB 243,15,16,44,184 ; movss (%eax,%edi,4),%xmm5
- DB 243,15,16,52,176 ; movss (%eax,%esi,4),%xmm6
+ DB 139,66,32 ; mov 0x20(%edx),%eax
+ DB 243,15,16,44,152 ; movss (%eax,%ebx,4),%xmm5
+ DB 243,15,16,52,184 ; movss (%eax,%edi,4),%xmm6
DB 15,20,245 ; unpcklps %xmm5,%xmm6
- DB 243,15,16,44,144 ; movss (%eax,%edx,4),%xmm5
- DB 243,15,16,36,152 ; movss (%eax,%ebx,4),%xmm4
+ DB 243,15,16,44,176 ; movss (%eax,%esi,4),%xmm5
+ DB 243,15,16,36,136 ; movss (%eax,%ecx,4),%xmm4
DB 15,20,236 ; unpcklps %xmm4,%xmm5
DB 102,15,20,238 ; unpcklpd %xmm6,%xmm5
DB 15,40,101,184 ; movaps -0x48(%ebp),%xmm4
@@ -51824,13 +51816,14 @@ _sk_gradient_sse2 LABEL PROC
DB 15,88,215 ; addps %xmm7,%xmm2
DB 15,89,216 ; mulps %xmm0,%xmm3
DB 15,88,221 ; addps %xmm5,%xmm3
- DB 139,69,240 ; mov -0x10(%ebp),%eax
- DB 141,72,4 ; lea 0x4(%eax),%ecx
+ DB 139,69,12 ; mov 0xc(%ebp),%eax
+ DB 137,193 ; mov %eax,%ecx
+ DB 141,65,8 ; lea 0x8(%ecx),%eax
DB 131,236,8 ; sub $0x8,%esp
DB 15,40,196 ; movaps %xmm4,%xmm0
- DB 81 ; push %ecx
+ DB 80 ; push %eax
DB 255,117,8 ; pushl 0x8(%ebp)
- DB 255,16 ; call *(%eax)
+ DB 255,81,4 ; call *0x4(%ecx)
DB 131,196,76 ; add $0x4c,%esp
DB 94 ; pop %esi
DB 95 ; pop %edi
@@ -51888,7 +51881,7 @@ _sk_xy_to_unit_angle_sse2 LABEL PROC
DB 15,40,218 ; movaps %xmm2,%xmm3
DB 15,40,209 ; movaps %xmm1,%xmm2
DB 15,40,200 ; movaps %xmm0,%xmm1
- DB 232,0,0,0,0 ; call 6a81 <_sk_xy_to_unit_angle_sse2+0x18>
+ DB 232,0,0,0,0 ; call 6a70 <_sk_xy_to_unit_angle_sse2+0x18>
DB 88 ; pop %eax
DB 15,87,237 ; xorps %xmm5,%xmm5
DB 15,92,233 ; subps %xmm1,%xmm5
@@ -51903,30 +51896,30 @@ _sk_xy_to_unit_angle_sse2 LABEL PROC
DB 15,94,247 ; divps %xmm7,%xmm6
DB 15,40,254 ; movaps %xmm6,%xmm7
DB 15,89,255 ; mulps %xmm7,%xmm7
- DB 15,40,128,79,104,0,0 ; movaps 0x684f(%eax),%xmm0
+ DB 15,40,128,64,104,0,0 ; movaps 0x6840(%eax),%xmm0
DB 15,89,199 ; mulps %xmm7,%xmm0
- DB 15,88,128,95,104,0,0 ; addps 0x685f(%eax),%xmm0
+ DB 15,88,128,80,104,0,0 ; addps 0x6850(%eax),%xmm0
DB 15,89,199 ; mulps %xmm7,%xmm0
- DB 15,88,128,111,104,0,0 ; addps 0x686f(%eax),%xmm0
+ DB 15,88,128,96,104,0,0 ; addps 0x6860(%eax),%xmm0
DB 15,89,199 ; mulps %xmm7,%xmm0
- DB 15,88,128,127,104,0,0 ; addps 0x687f(%eax),%xmm0
+ DB 15,88,128,112,104,0,0 ; addps 0x6870(%eax),%xmm0
DB 15,89,198 ; mulps %xmm6,%xmm0
DB 15,194,236,1 ; cmpltps %xmm4,%xmm5
- DB 15,40,176,143,104,0,0 ; movaps 0x688f(%eax),%xmm6
+ DB 15,40,176,128,104,0,0 ; movaps 0x6880(%eax),%xmm6
DB 15,92,240 ; subps %xmm0,%xmm6
DB 15,84,245 ; andps %xmm5,%xmm6
DB 15,85,232 ; andnps %xmm0,%xmm5
DB 15,87,228 ; xorps %xmm4,%xmm4
DB 15,86,238 ; orps %xmm6,%xmm5
DB 15,194,204,1 ; cmpltps %xmm4,%xmm1
- DB 15,40,128,95,98,0,0 ; movaps 0x625f(%eax),%xmm0
+ DB 15,40,128,80,98,0,0 ; movaps 0x6250(%eax),%xmm0
DB 15,92,197 ; subps %xmm5,%xmm0
DB 15,84,193 ; andps %xmm1,%xmm0
DB 15,85,205 ; andnps %xmm5,%xmm1
DB 15,86,200 ; orps %xmm0,%xmm1
DB 15,40,194 ; movaps %xmm2,%xmm0
DB 15,194,196,1 ; cmpltps %xmm4,%xmm0
- DB 15,40,168,111,98,0,0 ; movaps 0x626f(%eax),%xmm5
+ DB 15,40,168,96,98,0,0 ; movaps 0x6260(%eax),%xmm5
DB 15,92,233 ; subps %xmm1,%xmm5
DB 15,84,232 ; andps %xmm0,%xmm5
DB 15,85,193 ; andnps %xmm1,%xmm0
@@ -51983,15 +51976,15 @@ _sk_xy_to_2pt_conical_quadratic_max_sse2 LABEL PROC
DB 15,40,241 ; movaps %xmm1,%xmm6
DB 15,89,246 ; mulps %xmm6,%xmm6
DB 15,88,240 ; addps %xmm0,%xmm6
- DB 232,0,0,0,0 ; call 6b9e <_sk_xy_to_2pt_conical_quadratic_max_sse2+0x31>
+ DB 232,0,0,0,0 ; call 6b8d <_sk_xy_to_2pt_conical_quadratic_max_sse2+0x31>
DB 90 ; pop %edx
DB 243,15,89,237 ; mulss %xmm5,%xmm5
DB 15,198,237,0 ; shufps $0x0,%xmm5,%xmm5
DB 15,92,245 ; subps %xmm5,%xmm6
DB 243,15,16,65,32 ; movss 0x20(%ecx),%xmm0
DB 15,198,192,0 ; shufps $0x0,%xmm0,%xmm0
- DB 15,89,162,130,103,0,0 ; mulps 0x6782(%edx),%xmm4
- DB 15,89,130,146,103,0,0 ; mulps 0x6792(%edx),%xmm0
+ DB 15,89,162,115,103,0,0 ; mulps 0x6773(%edx),%xmm4
+ DB 15,89,130,131,103,0,0 ; mulps 0x6783(%edx),%xmm0
DB 15,89,198 ; mulps %xmm6,%xmm0
DB 15,40,236 ; movaps %xmm4,%xmm5
DB 15,89,237 ; mulps %xmm5,%xmm5
@@ -51999,11 +51992,11 @@ _sk_xy_to_2pt_conical_quadratic_max_sse2 LABEL PROC
DB 15,81,237 ; sqrtps %xmm5,%xmm5
DB 15,40,197 ; movaps %xmm5,%xmm0
DB 15,92,196 ; subps %xmm4,%xmm0
- DB 15,87,162,50,102,0,0 ; xorps 0x6632(%edx),%xmm4
+ DB 15,87,162,35,102,0,0 ; xorps 0x6623(%edx),%xmm4
DB 15,92,229 ; subps %xmm5,%xmm4
DB 243,15,16,105,36 ; movss 0x24(%ecx),%xmm5
DB 15,198,237,0 ; shufps $0x0,%xmm5,%xmm5
- DB 15,89,170,66,97,0,0 ; mulps 0x6142(%edx),%xmm5
+ DB 15,89,170,51,97,0,0 ; mulps 0x6133(%edx),%xmm5
DB 15,89,197 ; mulps %xmm5,%xmm0
DB 15,89,229 ; mulps %xmm5,%xmm4
DB 15,95,196 ; maxps %xmm4,%xmm0
@@ -52032,15 +52025,15 @@ _sk_xy_to_2pt_conical_quadratic_min_sse2 LABEL PROC
DB 15,40,241 ; movaps %xmm1,%xmm6
DB 15,89,246 ; mulps %xmm6,%xmm6
DB 15,88,240 ; addps %xmm0,%xmm6
- DB 232,0,0,0,0 ; call 6c3c <_sk_xy_to_2pt_conical_quadratic_min_sse2+0x31>
+ DB 232,0,0,0,0 ; call 6c2b <_sk_xy_to_2pt_conical_quadratic_min_sse2+0x31>
DB 90 ; pop %edx
DB 243,15,89,237 ; mulss %xmm5,%xmm5
DB 15,198,237,0 ; shufps $0x0,%xmm5,%xmm5
DB 15,92,245 ; subps %xmm5,%xmm6
DB 243,15,16,65,32 ; movss 0x20(%ecx),%xmm0
DB 15,198,192,0 ; shufps $0x0,%xmm0,%xmm0
- DB 15,89,162,228,102,0,0 ; mulps 0x66e4(%edx),%xmm4
- DB 15,89,130,244,102,0,0 ; mulps 0x66f4(%edx),%xmm0
+ DB 15,89,162,213,102,0,0 ; mulps 0x66d5(%edx),%xmm4
+ DB 15,89,130,229,102,0,0 ; mulps 0x66e5(%edx),%xmm0
DB 15,89,198 ; mulps %xmm6,%xmm0
DB 15,40,236 ; movaps %xmm4,%xmm5
DB 15,89,237 ; mulps %xmm5,%xmm5
@@ -52048,11 +52041,11 @@ _sk_xy_to_2pt_conical_quadratic_min_sse2 LABEL PROC
DB 15,81,237 ; sqrtps %xmm5,%xmm5
DB 15,40,197 ; movaps %xmm5,%xmm0
DB 15,92,196 ; subps %xmm4,%xmm0
- DB 15,87,162,148,101,0,0 ; xorps 0x6594(%edx),%xmm4
+ DB 15,87,162,133,101,0,0 ; xorps 0x6585(%edx),%xmm4
DB 15,92,229 ; subps %xmm5,%xmm4
DB 243,15,16,105,36 ; movss 0x24(%ecx),%xmm5
DB 15,198,237,0 ; shufps $0x0,%xmm5,%xmm5
- DB 15,89,170,164,96,0,0 ; mulps 0x60a4(%edx),%xmm5
+ DB 15,89,170,149,96,0,0 ; mulps 0x6095(%edx),%xmm5
DB 15,89,197 ; mulps %xmm5,%xmm0
DB 15,89,229 ; mulps %xmm5,%xmm4
DB 15,93,196 ; minps %xmm4,%xmm0
@@ -52070,7 +52063,7 @@ _sk_xy_to_2pt_conical_linear_sse2 LABEL PROC
DB 85 ; push %ebp
DB 137,229 ; mov %esp,%ebp
DB 131,236,8 ; sub $0x8,%esp
- DB 232,0,0,0,0 ; call 6cb4 <_sk_xy_to_2pt_conical_linear_sse2+0xb>
+ DB 232,0,0,0,0 ; call 6ca3 <_sk_xy_to_2pt_conical_linear_sse2+0xb>
DB 89 ; pop %ecx
DB 139,69,12 ; mov 0xc(%ebp),%eax
DB 139,16 ; mov (%eax),%edx
@@ -52079,7 +52072,7 @@ _sk_xy_to_2pt_conical_linear_sse2 LABEL PROC
DB 243,15,89,236 ; mulss %xmm4,%xmm5
DB 15,198,237,0 ; shufps $0x0,%xmm5,%xmm5
DB 15,88,232 ; addps %xmm0,%xmm5
- DB 15,89,169,108,102,0,0 ; mulps 0x666c(%ecx),%xmm5
+ DB 15,89,169,93,102,0,0 ; mulps 0x665d(%ecx),%xmm5
DB 15,89,192 ; mulps %xmm0,%xmm0
DB 15,40,241 ; movaps %xmm1,%xmm6
DB 15,89,246 ; mulps %xmm6,%xmm6
@@ -52087,7 +52080,7 @@ _sk_xy_to_2pt_conical_linear_sse2 LABEL PROC
DB 243,15,89,228 ; mulss %xmm4,%xmm4
DB 15,198,228,0 ; shufps $0x0,%xmm4,%xmm4
DB 15,92,196 ; subps %xmm4,%xmm0
- DB 15,87,129,28,101,0,0 ; xorps 0x651c(%ecx),%xmm0
+ DB 15,87,129,13,101,0,0 ; xorps 0x650d(%ecx),%xmm0
DB 15,94,197 ; divps %xmm5,%xmm0
DB 141,72,8 ; lea 0x8(%eax),%ecx
DB 131,236,8 ; sub $0x8,%esp
@@ -52158,16 +52151,16 @@ _sk_save_xy_sse2 LABEL PROC
DB 131,236,24 ; sub $0x18,%esp
DB 15,41,93,232 ; movaps %xmm3,-0x18(%ebp)
DB 15,40,218 ; movaps %xmm2,%xmm3
- DB 232,0,0,0,0 ; call 6d9d <_sk_save_xy_sse2+0x12>
+ DB 232,0,0,0,0 ; call 6d8c <_sk_save_xy_sse2+0x12>
DB 88 ; pop %eax
- DB 15,40,160,67,95,0,0 ; movaps 0x5f43(%eax),%xmm4
+ DB 15,40,160,52,95,0,0 ; movaps 0x5f34(%eax),%xmm4
DB 15,40,232 ; movaps %xmm0,%xmm5
DB 15,88,236 ; addps %xmm4,%xmm5
DB 243,15,91,245 ; cvttps2dq %xmm5,%xmm6
DB 15,91,246 ; cvtdq2ps %xmm6,%xmm6
DB 15,40,253 ; movaps %xmm5,%xmm7
DB 15,194,254,1 ; cmpltps %xmm6,%xmm7
- DB 15,40,144,83,95,0,0 ; movaps 0x5f53(%eax),%xmm2
+ DB 15,40,144,68,95,0,0 ; movaps 0x5f44(%eax),%xmm2
DB 15,84,250 ; andps %xmm2,%xmm7
DB 15,92,247 ; subps %xmm7,%xmm6
DB 15,92,238 ; subps %xmm6,%xmm5
@@ -52238,15 +52231,15 @@ _sk_bilinear_nx_sse2 LABEL PROC
DB 137,229 ; mov %esp,%ebp
DB 86 ; push %esi
DB 80 ; push %eax
- DB 232,0,0,0,0 ; call 6e7f <_sk_bilinear_nx_sse2+0xa>
+ DB 232,0,0,0,0 ; call 6e6e <_sk_bilinear_nx_sse2+0xa>
DB 88 ; pop %eax
DB 139,77,8 ; mov 0x8(%ebp),%ecx
DB 139,85,12 ; mov 0xc(%ebp),%edx
DB 139,50 ; mov (%edx),%esi
DB 15,16,6 ; movups (%esi),%xmm0
DB 15,16,102,64 ; movups 0x40(%esi),%xmm4
- DB 15,88,128,193,100,0,0 ; addps 0x64c1(%eax),%xmm0
- DB 15,40,168,113,94,0,0 ; movaps 0x5e71(%eax),%xmm5
+ DB 15,88,128,178,100,0,0 ; addps 0x64b2(%eax),%xmm0
+ DB 15,40,168,98,94,0,0 ; movaps 0x5e62(%eax),%xmm5
DB 15,92,236 ; subps %xmm4,%xmm5
DB 15,17,174,128,0,0,0 ; movups %xmm5,0x80(%esi)
DB 141,66,8 ; lea 0x8(%edx),%eax
@@ -52265,14 +52258,14 @@ _sk_bilinear_px_sse2 LABEL PROC
DB 137,229 ; mov %esp,%ebp
DB 86 ; push %esi
DB 80 ; push %eax
- DB 232,0,0,0,0 ; call 6ec2 <_sk_bilinear_px_sse2+0xa>
+ DB 232,0,0,0,0 ; call 6eb1 <_sk_bilinear_px_sse2+0xa>
DB 88 ; pop %eax
DB 139,77,8 ; mov 0x8(%ebp),%ecx
DB 139,85,12 ; mov 0xc(%ebp),%edx
DB 139,50 ; mov (%edx),%esi
DB 15,16,6 ; movups (%esi),%xmm0
DB 15,16,102,64 ; movups 0x40(%esi),%xmm4
- DB 15,88,128,30,94,0,0 ; addps 0x5e1e(%eax),%xmm0
+ DB 15,88,128,15,94,0,0 ; addps 0x5e0f(%eax),%xmm0
DB 15,17,166,128,0,0,0 ; movups %xmm4,0x80(%esi)
DB 141,66,8 ; lea 0x8(%edx),%eax
DB 131,236,8 ; sub $0x8,%esp
@@ -52290,15 +52283,15 @@ _sk_bilinear_ny_sse2 LABEL PROC
DB 137,229 ; mov %esp,%ebp
DB 86 ; push %esi
DB 80 ; push %eax
- DB 232,0,0,0,0 ; call 6efb <_sk_bilinear_ny_sse2+0xa>
+ DB 232,0,0,0,0 ; call 6eea <_sk_bilinear_ny_sse2+0xa>
DB 88 ; pop %eax
DB 139,77,8 ; mov 0x8(%ebp),%ecx
DB 139,85,12 ; mov 0xc(%ebp),%edx
DB 139,50 ; mov (%edx),%esi
DB 15,16,78,32 ; movups 0x20(%esi),%xmm1
DB 15,16,102,96 ; movups 0x60(%esi),%xmm4
- DB 15,88,136,69,100,0,0 ; addps 0x6445(%eax),%xmm1
- DB 15,40,168,245,93,0,0 ; movaps 0x5df5(%eax),%xmm5
+ DB 15,88,136,54,100,0,0 ; addps 0x6436(%eax),%xmm1
+ DB 15,40,168,230,93,0,0 ; movaps 0x5de6(%eax),%xmm5
DB 15,92,236 ; subps %xmm4,%xmm5
DB 15,17,174,160,0,0,0 ; movups %xmm5,0xa0(%esi)
DB 141,66,8 ; lea 0x8(%edx),%eax
@@ -52317,14 +52310,14 @@ _sk_bilinear_py_sse2 LABEL PROC
DB 137,229 ; mov %esp,%ebp
DB 86 ; push %esi
DB 80 ; push %eax
- DB 232,0,0,0,0 ; call 6f3f <_sk_bilinear_py_sse2+0xa>
+ DB 232,0,0,0,0 ; call 6f2e <_sk_bilinear_py_sse2+0xa>
DB 88 ; pop %eax
DB 139,77,8 ; mov 0x8(%ebp),%ecx
DB 139,85,12 ; mov 0xc(%ebp),%edx
DB 139,50 ; mov (%edx),%esi
DB 15,16,78,32 ; movups 0x20(%esi),%xmm1
DB 15,16,102,96 ; movups 0x60(%esi),%xmm4
- DB 15,88,136,161,93,0,0 ; addps 0x5da1(%eax),%xmm1
+ DB 15,88,136,146,93,0,0 ; addps 0x5d92(%eax),%xmm1
DB 15,17,166,160,0,0,0 ; movups %xmm4,0xa0(%esi)
DB 141,66,8 ; lea 0x8(%edx),%eax
DB 131,236,8 ; sub $0x8,%esp
@@ -52342,20 +52335,20 @@ _sk_bicubic_n3x_sse2 LABEL PROC
DB 137,229 ; mov %esp,%ebp
DB 86 ; push %esi
DB 80 ; push %eax
- DB 232,0,0,0,0 ; call 6f79 <_sk_bicubic_n3x_sse2+0xa>
+ DB 232,0,0,0,0 ; call 6f68 <_sk_bicubic_n3x_sse2+0xa>
DB 88 ; pop %eax
DB 139,77,8 ; mov 0x8(%ebp),%ecx
DB 139,85,12 ; mov 0xc(%ebp),%edx
DB 139,50 ; mov (%edx),%esi
DB 15,16,6 ; movups (%esi),%xmm0
DB 15,16,102,64 ; movups 0x40(%esi),%xmm4
- DB 15,88,128,215,99,0,0 ; addps 0x63d7(%eax),%xmm0
- DB 15,40,168,119,93,0,0 ; movaps 0x5d77(%eax),%xmm5
+ DB 15,88,128,200,99,0,0 ; addps 0x63c8(%eax),%xmm0
+ DB 15,40,168,104,93,0,0 ; movaps 0x5d68(%eax),%xmm5
DB 15,92,236 ; subps %xmm4,%xmm5
DB 15,40,229 ; movaps %xmm5,%xmm4
DB 15,89,228 ; mulps %xmm4,%xmm4
- DB 15,89,168,231,99,0,0 ; mulps 0x63e7(%eax),%xmm5
- DB 15,88,168,87,95,0,0 ; addps 0x5f57(%eax),%xmm5
+ DB 15,89,168,216,99,0,0 ; mulps 0x63d8(%eax),%xmm5
+ DB 15,88,168,72,95,0,0 ; addps 0x5f48(%eax),%xmm5
DB 15,89,236 ; mulps %xmm4,%xmm5
DB 15,17,174,128,0,0,0 ; movups %xmm5,0x80(%esi)
DB 141,66,8 ; lea 0x8(%edx),%eax
@@ -52374,23 +52367,23 @@ _sk_bicubic_n1x_sse2 LABEL PROC
DB 137,229 ; mov %esp,%ebp
DB 86 ; push %esi
DB 80 ; push %eax
- DB 232,0,0,0,0 ; call 6fd3 <_sk_bicubic_n1x_sse2+0xa>
+ DB 232,0,0,0,0 ; call 6fc2 <_sk_bicubic_n1x_sse2+0xa>
DB 88 ; pop %eax
DB 139,77,8 ; mov 0x8(%ebp),%ecx
DB 139,85,12 ; mov 0xc(%ebp),%edx
DB 139,50 ; mov (%edx),%esi
DB 15,16,6 ; movups (%esi),%xmm0
DB 15,16,102,64 ; movups 0x40(%esi),%xmm4
- DB 15,88,128,109,99,0,0 ; addps 0x636d(%eax),%xmm0
- DB 15,40,168,29,93,0,0 ; movaps 0x5d1d(%eax),%xmm5
+ DB 15,88,128,94,99,0,0 ; addps 0x635e(%eax),%xmm0
+ DB 15,40,168,14,93,0,0 ; movaps 0x5d0e(%eax),%xmm5
DB 15,92,236 ; subps %xmm4,%xmm5
- DB 15,40,160,157,99,0,0 ; movaps 0x639d(%eax),%xmm4
+ DB 15,40,160,142,99,0,0 ; movaps 0x638e(%eax),%xmm4
DB 15,89,229 ; mulps %xmm5,%xmm4
- DB 15,88,160,173,99,0,0 ; addps 0x63ad(%eax),%xmm4
+ DB 15,88,160,158,99,0,0 ; addps 0x639e(%eax),%xmm4
DB 15,89,229 ; mulps %xmm5,%xmm4
- DB 15,88,160,13,93,0,0 ; addps 0x5d0d(%eax),%xmm4
+ DB 15,88,160,254,92,0,0 ; addps 0x5cfe(%eax),%xmm4
DB 15,89,229 ; mulps %xmm5,%xmm4
- DB 15,88,160,189,99,0,0 ; addps 0x63bd(%eax),%xmm4
+ DB 15,88,160,174,99,0,0 ; addps 0x63ae(%eax),%xmm4
DB 15,17,166,128,0,0,0 ; movups %xmm4,0x80(%esi)
DB 141,66,8 ; lea 0x8(%edx),%eax
DB 131,236,8 ; sub $0x8,%esp
@@ -52408,22 +52401,22 @@ _sk_bicubic_p1x_sse2 LABEL PROC
DB 137,229 ; mov %esp,%ebp
DB 86 ; push %esi
DB 80 ; push %eax
- DB 232,0,0,0,0 ; call 703b <_sk_bicubic_p1x_sse2+0xa>
+ DB 232,0,0,0,0 ; call 702a <_sk_bicubic_p1x_sse2+0xa>
DB 88 ; pop %eax
DB 139,77,8 ; mov 0x8(%ebp),%ecx
DB 139,85,12 ; mov 0xc(%ebp),%edx
DB 139,50 ; mov (%edx),%esi
- DB 15,40,160,165,92,0,0 ; movaps 0x5ca5(%eax),%xmm4
+ DB 15,40,160,150,92,0,0 ; movaps 0x5c96(%eax),%xmm4
DB 15,16,6 ; movups (%esi),%xmm0
DB 15,16,110,64 ; movups 0x40(%esi),%xmm5
DB 15,88,196 ; addps %xmm4,%xmm0
- DB 15,40,176,53,99,0,0 ; movaps 0x6335(%eax),%xmm6
+ DB 15,40,176,38,99,0,0 ; movaps 0x6326(%eax),%xmm6
DB 15,89,245 ; mulps %xmm5,%xmm6
- DB 15,88,176,69,99,0,0 ; addps 0x6345(%eax),%xmm6
+ DB 15,88,176,54,99,0,0 ; addps 0x6336(%eax),%xmm6
DB 15,89,245 ; mulps %xmm5,%xmm6
DB 15,88,244 ; addps %xmm4,%xmm6
DB 15,89,245 ; mulps %xmm5,%xmm6
- DB 15,88,176,85,99,0,0 ; addps 0x6355(%eax),%xmm6
+ DB 15,88,176,70,99,0,0 ; addps 0x6346(%eax),%xmm6
DB 15,17,182,128,0,0,0 ; movups %xmm6,0x80(%esi)
DB 141,66,8 ; lea 0x8(%edx),%eax
DB 131,236,8 ; sub $0x8,%esp
@@ -52441,18 +52434,18 @@ _sk_bicubic_p3x_sse2 LABEL PROC
DB 137,229 ; mov %esp,%ebp
DB 86 ; push %esi
DB 80 ; push %eax
- DB 232,0,0,0,0 ; call 7098 <_sk_bicubic_p3x_sse2+0xa>
+ DB 232,0,0,0,0 ; call 7087 <_sk_bicubic_p3x_sse2+0xa>
DB 88 ; pop %eax
DB 139,77,8 ; mov 0x8(%ebp),%ecx
DB 139,85,12 ; mov 0xc(%ebp),%edx
DB 139,50 ; mov (%edx),%esi
DB 15,16,6 ; movups (%esi),%xmm0
DB 15,16,102,64 ; movups 0x40(%esi),%xmm4
- DB 15,88,128,232,98,0,0 ; addps 0x62e8(%eax),%xmm0
+ DB 15,88,128,217,98,0,0 ; addps 0x62d9(%eax),%xmm0
DB 15,40,236 ; movaps %xmm4,%xmm5
DB 15,89,237 ; mulps %xmm5,%xmm5
- DB 15,89,160,200,98,0,0 ; mulps 0x62c8(%eax),%xmm4
- DB 15,88,160,56,94,0,0 ; addps 0x5e38(%eax),%xmm4
+ DB 15,89,160,185,98,0,0 ; mulps 0x62b9(%eax),%xmm4
+ DB 15,88,160,41,94,0,0 ; addps 0x5e29(%eax),%xmm4
DB 15,89,229 ; mulps %xmm5,%xmm4
DB 15,17,166,128,0,0,0 ; movups %xmm4,0x80(%esi)
DB 141,66,8 ; lea 0x8(%edx),%eax
@@ -52471,20 +52464,20 @@ _sk_bicubic_n3y_sse2 LABEL PROC
DB 137,229 ; mov %esp,%ebp
DB 86 ; push %esi
DB 80 ; push %eax
- DB 232,0,0,0,0 ; call 70e8 <_sk_bicubic_n3y_sse2+0xa>
+ DB 232,0,0,0,0 ; call 70d7 <_sk_bicubic_n3y_sse2+0xa>
DB 88 ; pop %eax
DB 139,77,8 ; mov 0x8(%ebp),%ecx
DB 139,85,12 ; mov 0xc(%ebp),%edx
DB 139,50 ; mov (%edx),%esi
DB 15,16,78,32 ; movups 0x20(%esi),%xmm1
DB 15,16,102,96 ; movups 0x60(%esi),%xmm4
- DB 15,88,136,104,98,0,0 ; addps 0x6268(%eax),%xmm1
- DB 15,40,168,8,92,0,0 ; movaps 0x5c08(%eax),%xmm5
+ DB 15,88,136,89,98,0,0 ; addps 0x6259(%eax),%xmm1
+ DB 15,40,168,249,91,0,0 ; movaps 0x5bf9(%eax),%xmm5
DB 15,92,236 ; subps %xmm4,%xmm5
DB 15,40,229 ; movaps %xmm5,%xmm4
DB 15,89,228 ; mulps %xmm4,%xmm4
- DB 15,89,168,120,98,0,0 ; mulps 0x6278(%eax),%xmm5
- DB 15,88,168,232,93,0,0 ; addps 0x5de8(%eax),%xmm5
+ DB 15,89,168,105,98,0,0 ; mulps 0x6269(%eax),%xmm5
+ DB 15,88,168,217,93,0,0 ; addps 0x5dd9(%eax),%xmm5
DB 15,89,236 ; mulps %xmm4,%xmm5
DB 15,17,174,160,0,0,0 ; movups %xmm5,0xa0(%esi)
DB 141,66,8 ; lea 0x8(%edx),%eax
@@ -52503,23 +52496,23 @@ _sk_bicubic_n1y_sse2 LABEL PROC
DB 137,229 ; mov %esp,%ebp
DB 86 ; push %esi
DB 80 ; push %eax
- DB 232,0,0,0,0 ; call 7143 <_sk_bicubic_n1y_sse2+0xa>
+ DB 232,0,0,0,0 ; call 7132 <_sk_bicubic_n1y_sse2+0xa>
DB 88 ; pop %eax
DB 139,77,8 ; mov 0x8(%ebp),%ecx
DB 139,85,12 ; mov 0xc(%ebp),%edx
DB 139,50 ; mov (%edx),%esi
DB 15,16,78,32 ; movups 0x20(%esi),%xmm1
DB 15,16,102,96 ; movups 0x60(%esi),%xmm4
- DB 15,88,136,253,97,0,0 ; addps 0x61fd(%eax),%xmm1
- DB 15,40,168,173,91,0,0 ; movaps 0x5bad(%eax),%xmm5
+ DB 15,88,136,238,97,0,0 ; addps 0x61ee(%eax),%xmm1
+ DB 15,40,168,158,91,0,0 ; movaps 0x5b9e(%eax),%xmm5
DB 15,92,236 ; subps %xmm4,%xmm5
- DB 15,40,160,45,98,0,0 ; movaps 0x622d(%eax),%xmm4
+ DB 15,40,160,30,98,0,0 ; movaps 0x621e(%eax),%xmm4
DB 15,89,229 ; mulps %xmm5,%xmm4
- DB 15,88,160,61,98,0,0 ; addps 0x623d(%eax),%xmm4
+ DB 15,88,160,46,98,0,0 ; addps 0x622e(%eax),%xmm4
DB 15,89,229 ; mulps %xmm5,%xmm4
- DB 15,88,160,157,91,0,0 ; addps 0x5b9d(%eax),%xmm4
+ DB 15,88,160,142,91,0,0 ; addps 0x5b8e(%eax),%xmm4
DB 15,89,229 ; mulps %xmm5,%xmm4
- DB 15,88,160,77,98,0,0 ; addps 0x624d(%eax),%xmm4
+ DB 15,88,160,62,98,0,0 ; addps 0x623e(%eax),%xmm4
DB 15,17,166,160,0,0,0 ; movups %xmm4,0xa0(%esi)
DB 141,66,8 ; lea 0x8(%edx),%eax
DB 131,236,8 ; sub $0x8,%esp
@@ -52537,22 +52530,22 @@ _sk_bicubic_p1y_sse2 LABEL PROC
DB 137,229 ; mov %esp,%ebp
DB 86 ; push %esi
DB 80 ; push %eax
- DB 232,0,0,0,0 ; call 71ac <_sk_bicubic_p1y_sse2+0xa>
+ DB 232,0,0,0,0 ; call 719b <_sk_bicubic_p1y_sse2+0xa>
DB 88 ; pop %eax
DB 139,77,8 ; mov 0x8(%ebp),%ecx
DB 139,85,12 ; mov 0xc(%ebp),%edx
DB 139,50 ; mov (%edx),%esi
- DB 15,40,160,52,91,0,0 ; movaps 0x5b34(%eax),%xmm4
+ DB 15,40,160,37,91,0,0 ; movaps 0x5b25(%eax),%xmm4
DB 15,16,78,32 ; movups 0x20(%esi),%xmm1
DB 15,16,110,96 ; movups 0x60(%esi),%xmm5
DB 15,88,204 ; addps %xmm4,%xmm1
- DB 15,40,176,196,97,0,0 ; movaps 0x61c4(%eax),%xmm6
+ DB 15,40,176,181,97,0,0 ; movaps 0x61b5(%eax),%xmm6
DB 15,89,245 ; mulps %xmm5,%xmm6
- DB 15,88,176,212,97,0,0 ; addps 0x61d4(%eax),%xmm6
+ DB 15,88,176,197,97,0,0 ; addps 0x61c5(%eax),%xmm6
DB 15,89,245 ; mulps %xmm5,%xmm6
DB 15,88,244 ; addps %xmm4,%xmm6
DB 15,89,245 ; mulps %xmm5,%xmm6
- DB 15,88,176,228,97,0,0 ; addps 0x61e4(%eax),%xmm6
+ DB 15,88,176,213,97,0,0 ; addps 0x61d5(%eax),%xmm6
DB 15,17,182,160,0,0,0 ; movups %xmm6,0xa0(%esi)
DB 141,66,8 ; lea 0x8(%edx),%eax
DB 131,236,8 ; sub $0x8,%esp
@@ -52570,18 +52563,18 @@ _sk_bicubic_p3y_sse2 LABEL PROC
DB 137,229 ; mov %esp,%ebp
DB 86 ; push %esi
DB 80 ; push %eax
- DB 232,0,0,0,0 ; call 720a <_sk_bicubic_p3y_sse2+0xa>
+ DB 232,0,0,0,0 ; call 71f9 <_sk_bicubic_p3y_sse2+0xa>
DB 88 ; pop %eax
DB 139,77,8 ; mov 0x8(%ebp),%ecx
DB 139,85,12 ; mov 0xc(%ebp),%edx
DB 139,50 ; mov (%edx),%esi
DB 15,16,78,32 ; movups 0x20(%esi),%xmm1
DB 15,16,102,96 ; movups 0x60(%esi),%xmm4
- DB 15,88,136,118,97,0,0 ; addps 0x6176(%eax),%xmm1
+ DB 15,88,136,103,97,0,0 ; addps 0x6167(%eax),%xmm1
DB 15,40,236 ; movaps %xmm4,%xmm5
DB 15,89,237 ; mulps %xmm5,%xmm5
- DB 15,89,160,86,97,0,0 ; mulps 0x6156(%eax),%xmm4
- DB 15,88,160,198,92,0,0 ; addps 0x5cc6(%eax),%xmm4
+ DB 15,89,160,71,97,0,0 ; mulps 0x6147(%eax),%xmm4
+ DB 15,88,160,183,92,0,0 ; addps 0x5cb7(%eax),%xmm4
DB 15,89,229 ; mulps %xmm5,%xmm4
DB 15,17,166,160,0,0,0 ; movups %xmm4,0xa0(%esi)
DB 141,66,8 ; lea 0x8(%edx),%eax
@@ -52602,10 +52595,10 @@ _sk_callback_sse2 LABEL PROC
DB 87 ; push %edi
DB 86 ; push %esi
DB 131,236,12 ; sub $0xc,%esp
- DB 139,117,12 ; mov 0xc(%ebp),%esi
- DB 139,125,8 ; mov 0x8(%ebp),%edi
- DB 139,71,8 ; mov 0x8(%edi),%eax
- DB 139,30 ; mov (%esi),%ebx
+ DB 139,117,8 ; mov 0x8(%ebp),%esi
+ DB 139,125,12 ; mov 0xc(%ebp),%edi
+ DB 139,31 ; mov (%edi),%ebx
+ DB 139,70,8 ; mov 0x8(%esi),%eax
DB 15,40,224 ; movaps %xmm0,%xmm4
DB 15,20,225 ; unpcklps %xmm1,%xmm4
DB 15,40,234 ; movaps %xmm2,%xmm5
@@ -52647,11 +52640,11 @@ _sk_callback_sse2 LABEL PROC
DB 15,40,212 ; movaps %xmm4,%xmm2
DB 102,15,20,211 ; unpcklpd %xmm3,%xmm2
DB 15,18,220 ; movhlps %xmm4,%xmm3
- DB 141,70,8 ; lea 0x8(%esi),%eax
+ DB 141,71,8 ; lea 0x8(%edi),%eax
DB 131,236,8 ; sub $0x8,%esp
DB 80 ; push %eax
- DB 87 ; push %edi
- DB 255,86,4 ; call *0x4(%esi)
+ DB 86 ; push %esi
+ DB 255,87,4 ; call *0x4(%edi)
DB 131,196,28 ; add $0x1c,%esp
DB 94 ; pop %esi
DB 95 ; pop %edi
@@ -52666,12 +52659,10 @@ _sk_clut_3D_sse2 LABEL PROC
DB 83 ; push %ebx
DB 87 ; push %edi
DB 86 ; push %esi
- DB 129,236,44,1,0,0 ; sub $0x12c,%esp
- DB 15,41,157,200,254,255,255 ; movaps %xmm3,-0x138(%ebp)
+ DB 129,236,28,1,0,0 ; sub $0x11c,%esp
+ DB 15,41,157,216,254,255,255 ; movaps %xmm3,-0x128(%ebp)
DB 15,40,216 ; movaps %xmm0,%xmm3
DB 139,69,12 ; mov 0xc(%ebp),%eax
- DB 141,72,4 ; lea 0x4(%eax),%ecx
- DB 137,141,20,255,255,255 ; mov %ecx,-0xec(%ebp)
DB 139,8 ; mov (%eax),%ecx
DB 139,81,12 ; mov 0xc(%ecx),%edx
DB 141,114,255 ; lea -0x1(%edx),%esi
@@ -52680,7 +52671,7 @@ _sk_clut_3D_sse2 LABEL PROC
DB 15,91,192 ; cvtdq2ps %xmm0,%xmm0
DB 15,89,194 ; mulps %xmm2,%xmm0
DB 15,40,224 ; movaps %xmm0,%xmm4
- DB 15,41,165,232,254,255,255 ; movaps %xmm4,-0x118(%ebp)
+ DB 15,41,165,248,254,255,255 ; movaps %xmm4,-0x108(%ebp)
DB 102,15,110,194 ; movd %edx,%xmm0
DB 102,15,112,240,0 ; pshufd $0x0,%xmm0,%xmm6
DB 102,15,127,117,152 ; movdqa %xmm6,-0x68(%ebp)
@@ -52722,15 +52713,15 @@ _sk_clut_3D_sse2 LABEL PROC
DB 102,15,112,192,232 ; pshufd $0xe8,%xmm0,%xmm0
DB 102,15,98,200 ; punpckldq %xmm0,%xmm1
DB 102,15,127,77,136 ; movdqa %xmm1,-0x78(%ebp)
- DB 232,0,0,0,0 ; call 73f6 <_sk_clut_3D_sse2+0xf7>
+ DB 232,0,0,0,0 ; call 73dc <_sk_clut_3D_sse2+0xee>
DB 90 ; pop %edx
DB 243,15,91,196 ; cvttps2dq %xmm4,%xmm0
- DB 102,15,127,133,248,254,255,255 ; movdqa %xmm0,-0x108(%ebp)
+ DB 102,15,127,133,8,255,255,255 ; movdqa %xmm0,-0xf8(%ebp)
DB 102,15,111,221 ; movdqa %xmm5,%xmm3
DB 102,15,254,216 ; paddd %xmm0,%xmm3
DB 102,15,111,193 ; movdqa %xmm1,%xmm0
DB 102,15,254,195 ; paddd %xmm3,%xmm0
- DB 102,15,111,162,186,95,0,0 ; movdqa 0x5fba(%edx),%xmm4
+ DB 102,15,111,162,180,95,0,0 ; movdqa 0x5fb4(%edx),%xmm4
DB 102,15,127,165,120,255,255,255 ; movdqa %xmm4,-0x88(%ebp)
DB 102,15,112,200,245 ; pshufd $0xf5,%xmm0,%xmm1
DB 102,15,244,196 ; pmuludq %xmm4,%xmm0
@@ -52770,7 +52761,7 @@ _sk_clut_3D_sse2 LABEL PROC
DB 243,15,16,4,129 ; movss (%ecx,%eax,4),%xmm0
DB 15,20,248 ; unpcklps %xmm0,%xmm7
DB 102,15,20,252 ; unpcklpd %xmm4,%xmm7
- DB 102,15,111,130,58,89,0,0 ; movdqa 0x593a(%edx),%xmm0
+ DB 102,15,111,130,52,89,0,0 ; movdqa 0x5934(%edx),%xmm0
DB 102,15,127,133,104,255,255,255 ; movdqa %xmm0,-0x98(%ebp)
DB 102,15,254,200 ; paddd %xmm0,%xmm1
DB 102,15,112,193,229 ; pshufd $0xe5,%xmm1,%xmm0
@@ -52787,8 +52778,8 @@ _sk_clut_3D_sse2 LABEL PROC
DB 243,15,16,4,129 ; movss (%ecx,%eax,4),%xmm0
DB 15,20,240 ; unpcklps %xmm0,%xmm6
DB 102,15,20,241 ; unpcklpd %xmm1,%xmm6
- DB 15,40,130,170,95,0,0 ; movaps 0x5faa(%edx),%xmm0
- DB 15,40,141,232,254,255,255 ; movaps -0x118(%ebp),%xmm1
+ DB 15,40,130,164,95,0,0 ; movaps 0x5fa4(%edx),%xmm0
+ DB 15,40,141,248,254,255,255 ; movaps -0x108(%ebp),%xmm1
DB 15,88,200 ; addps %xmm0,%xmm1
DB 15,41,77,200 ; movaps %xmm1,-0x38(%ebp)
DB 15,40,141,88,255,255,255 ; movaps -0xa8(%ebp),%xmm1
@@ -52872,7 +52863,7 @@ _sk_clut_3D_sse2 LABEL PROC
DB 15,92,206 ; subps %xmm6,%xmm1
DB 15,89,204 ; mulps %xmm4,%xmm1
DB 15,88,206 ; addps %xmm6,%xmm1
- DB 15,41,141,216,254,255,255 ; movaps %xmm1,-0x128(%ebp)
+ DB 15,41,141,232,254,255,255 ; movaps %xmm1,-0x118(%ebp)
DB 243,15,91,133,72,255,255,255 ; cvttps2dq -0xb8(%ebp),%xmm0
DB 102,15,112,224,245 ; pshufd $0xf5,%xmm0,%xmm4
DB 102,15,111,77,152 ; movdqa -0x68(%ebp),%xmm1
@@ -52883,7 +52874,7 @@ _sk_clut_3D_sse2 LABEL PROC
DB 102,15,112,196,232 ; pshufd $0xe8,%xmm4,%xmm0
DB 102,15,98,248 ; punpckldq %xmm0,%xmm7
DB 102,15,127,125,152 ; movdqa %xmm7,-0x68(%ebp)
- DB 102,15,254,189,248,254,255,255 ; paddd -0x108(%ebp),%xmm7
+ DB 102,15,254,189,8,255,255,255 ; paddd -0xf8(%ebp),%xmm7
DB 102,15,111,199 ; movdqa %xmm7,%xmm0
DB 102,15,254,69,136 ; paddd -0x78(%ebp),%xmm0
DB 102,15,112,224,245 ; pshufd $0xf5,%xmm0,%xmm4
@@ -53020,7 +53011,7 @@ _sk_clut_3D_sse2 LABEL PROC
DB 15,89,212 ; mulps %xmm4,%xmm2
DB 15,88,208 ; addps %xmm0,%xmm2
DB 15,41,149,56,255,255,255 ; movaps %xmm2,-0xc8(%ebp)
- DB 15,40,133,216,254,255,255 ; movaps -0x128(%ebp),%xmm0
+ DB 15,40,133,232,254,255,255 ; movaps -0x118(%ebp),%xmm0
DB 15,92,216 ; subps %xmm0,%xmm3
DB 15,89,220 ; mulps %xmm4,%xmm3
DB 15,88,216 ; addps %xmm0,%xmm3
@@ -53291,8 +53282,8 @@ _sk_clut_3D_sse2 LABEL PROC
DB 15,92,214 ; subps %xmm6,%xmm2
DB 15,89,211 ; mulps %xmm3,%xmm2
DB 15,88,214 ; addps %xmm6,%xmm2
- DB 15,91,157,248,254,255,255 ; cvtdq2ps -0x108(%ebp),%xmm3
- DB 15,40,165,232,254,255,255 ; movaps -0x118(%ebp),%xmm4
+ DB 15,91,157,8,255,255,255 ; cvtdq2ps -0xf8(%ebp),%xmm3
+ DB 15,40,165,248,254,255,255 ; movaps -0x108(%ebp),%xmm4
DB 15,92,227 ; subps %xmm3,%xmm4
DB 15,40,93,184 ; movaps -0x48(%ebp),%xmm3
DB 15,92,195 ; subps %xmm3,%xmm0
@@ -53306,15 +53297,14 @@ _sk_clut_3D_sse2 LABEL PROC
DB 15,92,211 ; subps %xmm3,%xmm2
DB 15,89,212 ; mulps %xmm4,%xmm2
DB 15,88,211 ; addps %xmm3,%xmm2
- DB 139,69,8 ; mov 0x8(%ebp),%eax
- DB 139,85,12 ; mov 0xc(%ebp),%edx
- DB 141,74,8 ; lea 0x8(%edx),%ecx
+ DB 139,77,12 ; mov 0xc(%ebp),%ecx
+ DB 141,65,8 ; lea 0x8(%ecx),%eax
DB 131,236,8 ; sub $0x8,%esp
- DB 15,40,157,200,254,255,255 ; movaps -0x138(%ebp),%xmm3
- DB 81 ; push %ecx
+ DB 15,40,157,216,254,255,255 ; movaps -0x128(%ebp),%xmm3
DB 80 ; push %eax
- DB 255,82,4 ; call *0x4(%edx)
- DB 129,196,60,1,0,0 ; add $0x13c,%esp
+ DB 255,117,8 ; pushl 0x8(%ebp)
+ DB 255,81,4 ; call *0x4(%ecx)
+ DB 129,196,44,1,0,0 ; add $0x12c,%esp
DB 94 ; pop %esi
DB 95 ; pop %edi
DB 91 ; pop %ebx
@@ -53328,10 +53318,8 @@ _sk_clut_4D_sse2 LABEL PROC
DB 83 ; push %ebx
DB 87 ; push %edi
DB 86 ; push %esi
- DB 129,236,92,1,0,0 ; sub $0x15c,%esp
+ DB 129,236,76,1,0,0 ; sub $0x14c,%esp
DB 139,69,12 ; mov 0xc(%ebp),%eax
- DB 141,72,4 ; lea 0x4(%eax),%ecx
- DB 137,141,212,254,255,255 ; mov %ecx,-0x12c(%ebp)
DB 139,16 ; mov (%eax),%edx
DB 139,74,16 ; mov 0x10(%edx),%ecx
DB 141,113,255 ; lea -0x1(%ecx),%esi
@@ -53408,18 +53396,18 @@ _sk_clut_4D_sse2 LABEL PROC
DB 102,15,112,201,232 ; pshufd $0xe8,%xmm1,%xmm1
DB 102,15,98,217 ; punpckldq %xmm1,%xmm3
DB 102,15,127,93,152 ; movdqa %xmm3,-0x68(%ebp)
- DB 232,0,0,0,0 ; call 7f8c <_sk_clut_4D_sse2+0x16e>
+ DB 232,0,0,0,0 ; call 7f68 <_sk_clut_4D_sse2+0x165>
DB 89 ; pop %ecx
DB 15,40,197 ; movaps %xmm5,%xmm0
- DB 15,41,133,152,254,255,255 ; movaps %xmm0,-0x168(%ebp)
+ DB 15,41,133,168,254,255,255 ; movaps %xmm0,-0x158(%ebp)
DB 243,15,91,200 ; cvttps2dq %xmm0,%xmm1
- DB 102,15,127,141,184,254,255,255 ; movdqa %xmm1,-0x148(%ebp)
+ DB 102,15,127,141,200,254,255,255 ; movdqa %xmm1,-0x138(%ebp)
DB 102,15,254,241 ; paddd %xmm1,%xmm6
DB 102,15,127,117,200 ; movdqa %xmm6,-0x38(%ebp)
DB 102,15,111,212 ; movdqa %xmm4,%xmm2
DB 102,15,254,214 ; paddd %xmm6,%xmm2
DB 102,15,254,218 ; paddd %xmm2,%xmm3
- DB 102,15,111,161,36,84,0,0 ; movdqa 0x5424(%ecx),%xmm4
+ DB 102,15,111,161,40,84,0,0 ; movdqa 0x5428(%ecx),%xmm4
DB 102,15,112,203,245 ; pshufd $0xf5,%xmm3,%xmm1
DB 102,15,244,220 ; pmuludq %xmm4,%xmm3
DB 102,15,244,204 ; pmuludq %xmm4,%xmm1
@@ -53461,7 +53449,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 15,20,223 ; unpcklps %xmm7,%xmm3
DB 102,15,20,222 ; unpcklpd %xmm6,%xmm3
DB 102,15,41,157,232,254,255,255 ; movapd %xmm3,-0x118(%ebp)
- DB 102,15,254,137,164,77,0,0 ; paddd 0x4da4(%ecx),%xmm1
+ DB 102,15,254,137,168,77,0,0 ; paddd 0x4da8(%ecx),%xmm1
DB 102,15,112,241,229 ; pshufd $0xe5,%xmm1,%xmm6
DB 102,15,126,240 ; movd %xmm6,%eax
DB 102,15,112,241,78 ; pshufd $0x4e,%xmm1,%xmm6
@@ -53476,7 +53464,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 243,15,16,60,130 ; movss (%edx,%eax,4),%xmm7
DB 15,20,223 ; unpcklps %xmm7,%xmm3
DB 102,15,20,222 ; unpcklpd %xmm6,%xmm3
- DB 15,40,185,20,84,0,0 ; movaps 0x5414(%ecx),%xmm7
+ DB 15,40,185,24,84,0,0 ; movaps 0x5418(%ecx),%xmm7
DB 15,88,199 ; addps %xmm7,%xmm0
DB 15,41,133,120,255,255,255 ; movaps %xmm0,-0x88(%ebp)
DB 15,40,133,248,254,255,255 ; movaps -0x108(%ebp),%xmm0
@@ -53484,7 +53472,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 15,41,69,136 ; movaps %xmm0,-0x78(%ebp)
DB 15,40,133,56,255,255,255 ; movaps -0xc8(%ebp),%xmm0
DB 15,88,199 ; addps %xmm7,%xmm0
- DB 15,41,133,168,254,255,255 ; movaps %xmm0,-0x158(%ebp)
+ DB 15,41,133,184,254,255,255 ; movaps %xmm0,-0x148(%ebp)
DB 15,88,125,216 ; addps -0x28(%ebp),%xmm7
DB 243,15,91,255 ; cvttps2dq %xmm7,%xmm7
DB 102,15,112,199,245 ; pshufd $0xf5,%xmm7,%xmm0
@@ -53497,7 +53485,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 102,15,127,101,168 ; movdqa %xmm4,-0x58(%ebp)
DB 102,15,254,212 ; paddd %xmm4,%xmm2
DB 102,15,112,194,245 ; pshufd $0xf5,%xmm2,%xmm0
- DB 102,15,111,161,36,84,0,0 ; movdqa 0x5424(%ecx),%xmm4
+ DB 102,15,111,161,40,84,0,0 ; movdqa 0x5428(%ecx),%xmm4
DB 102,15,244,212 ; pmuludq %xmm4,%xmm2
DB 102,15,244,196 ; pmuludq %xmm4,%xmm0
DB 102,15,112,240,232 ; pshufd $0xe8,%xmm0,%xmm6
@@ -53533,7 +53521,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 243,15,16,44,130 ; movss (%edx,%eax,4),%xmm5
DB 15,20,213 ; unpcklps %xmm5,%xmm2
DB 102,15,20,214 ; unpcklpd %xmm6,%xmm2
- DB 102,15,254,129,164,77,0,0 ; paddd 0x4da4(%ecx),%xmm0
+ DB 102,15,254,129,168,77,0,0 ; paddd 0x4da8(%ecx),%xmm0
DB 102,15,112,232,229 ; pshufd $0xe5,%xmm0,%xmm5
DB 102,15,126,232 ; movd %xmm5,%eax
DB 102,15,112,232,78 ; pshufd $0x4e,%xmm0,%xmm5
@@ -53565,7 +53553,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 15,92,251 ; subps %xmm3,%xmm7
DB 15,89,248 ; mulps %xmm0,%xmm7
DB 15,88,251 ; addps %xmm3,%xmm7
- DB 243,15,91,141,168,254,255,255 ; cvttps2dq -0x158(%ebp),%xmm1
+ DB 243,15,91,141,184,254,255,255 ; cvttps2dq -0x148(%ebp),%xmm1
DB 102,15,112,217,245 ; pshufd $0xf5,%xmm1,%xmm3
DB 102,15,111,133,88,255,255,255 ; movdqa -0xa8(%ebp),%xmm0
DB 102,15,244,216 ; pmuludq %xmm0,%xmm3
@@ -53617,7 +53605,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 243,15,16,44,130 ; movss (%edx,%eax,4),%xmm5
DB 15,20,245 ; unpcklps %xmm5,%xmm6
DB 102,15,20,240 ; unpcklpd %xmm0,%xmm6
- DB 102,15,254,137,164,77,0,0 ; paddd 0x4da4(%ecx),%xmm1
+ DB 102,15,254,137,168,77,0,0 ; paddd 0x4da8(%ecx),%xmm1
DB 102,15,112,193,229 ; pshufd $0xe5,%xmm1,%xmm0
DB 102,15,126,192 ; movd %xmm0,%eax
DB 102,15,112,193,78 ; pshufd $0x4e,%xmm1,%xmm0
@@ -53635,7 +53623,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 102,15,111,202 ; movdqa %xmm2,%xmm1
DB 102,15,254,77,168 ; paddd -0x58(%ebp),%xmm1
DB 102,15,112,193,245 ; pshufd $0xf5,%xmm1,%xmm0
- DB 102,15,111,145,36,84,0,0 ; movdqa 0x5424(%ecx),%xmm2
+ DB 102,15,111,145,40,84,0,0 ; movdqa 0x5428(%ecx),%xmm2
DB 102,15,244,202 ; pmuludq %xmm2,%xmm1
DB 102,15,244,194 ; pmuludq %xmm2,%xmm0
DB 102,15,112,192,232 ; pshufd $0xe8,%xmm0,%xmm0
@@ -53671,7 +53659,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 243,15,16,4,130 ; movss (%edx,%eax,4),%xmm0
DB 15,20,216 ; unpcklps %xmm0,%xmm3
DB 102,15,20,217 ; unpcklpd %xmm1,%xmm3
- DB 102,15,254,169,164,77,0,0 ; paddd 0x4da4(%ecx),%xmm5
+ DB 102,15,254,169,168,77,0,0 ; paddd 0x4da8(%ecx),%xmm5
DB 102,15,112,197,229 ; pshufd $0xe5,%xmm5,%xmm0
DB 102,15,126,192 ; movd %xmm0,%eax
DB 102,15,112,197,78 ; pshufd $0x4e,%xmm5,%xmm0
@@ -53724,14 +53712,14 @@ _sk_clut_4D_sse2 LABEL PROC
DB 102,15,112,193,232 ; pshufd $0xe8,%xmm1,%xmm0
DB 102,15,98,224 ; punpckldq %xmm0,%xmm4
DB 102,15,127,165,24,255,255,255 ; movdqa %xmm4,-0xe8(%ebp)
- DB 102,15,254,165,184,254,255,255 ; paddd -0x148(%ebp),%xmm4
+ DB 102,15,254,165,200,254,255,255 ; paddd -0x138(%ebp),%xmm4
DB 102,15,127,101,200 ; movdqa %xmm4,-0x38(%ebp)
DB 102,15,111,204 ; movdqa %xmm4,%xmm1
DB 102,15,254,141,72,255,255,255 ; paddd -0xb8(%ebp),%xmm1
DB 102,15,111,209 ; movdqa %xmm1,%xmm2
DB 102,15,254,85,152 ; paddd -0x68(%ebp),%xmm2
DB 102,15,112,194,245 ; pshufd $0xf5,%xmm2,%xmm0
- DB 102,15,111,153,36,84,0,0 ; movdqa 0x5424(%ecx),%xmm3
+ DB 102,15,111,153,40,84,0,0 ; movdqa 0x5428(%ecx),%xmm3
DB 102,15,244,211 ; pmuludq %xmm3,%xmm2
DB 102,15,244,195 ; pmuludq %xmm3,%xmm0
DB 102,15,111,251 ; movdqa %xmm3,%xmm7
@@ -53770,7 +53758,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 243,15,16,44,130 ; movss (%edx,%eax,4),%xmm5
DB 15,20,229 ; unpcklps %xmm5,%xmm4
DB 102,15,20,227 ; unpcklpd %xmm3,%xmm4
- DB 102,15,254,129,164,77,0,0 ; paddd 0x4da4(%ecx),%xmm0
+ DB 102,15,254,129,168,77,0,0 ; paddd 0x4da8(%ecx),%xmm0
DB 102,15,112,216,229 ; pshufd $0xe5,%xmm0,%xmm3
DB 102,15,126,216 ; movd %xmm3,%eax
DB 102,15,112,216,78 ; pshufd $0x4e,%xmm0,%xmm3
@@ -53822,7 +53810,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 243,15,16,52,130 ; movss (%edx,%eax,4),%xmm6
DB 15,20,238 ; unpcklps %xmm6,%xmm5
DB 102,15,20,235 ; unpcklpd %xmm3,%xmm5
- DB 102,15,111,137,164,77,0,0 ; movdqa 0x4da4(%ecx),%xmm1
+ DB 102,15,111,137,168,77,0,0 ; movdqa 0x4da8(%ecx),%xmm1
DB 102,15,254,249 ; paddd %xmm1,%xmm7
DB 102,15,112,223,229 ; pshufd $0xe5,%xmm7,%xmm3
DB 102,15,126,216 ; movd %xmm3,%eax
@@ -53856,7 +53844,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 102,15,111,226 ; movdqa %xmm2,%xmm4
DB 102,15,254,69,152 ; paddd -0x68(%ebp),%xmm0
DB 102,15,112,208,245 ; pshufd $0xf5,%xmm0,%xmm2
- DB 102,15,111,153,36,84,0,0 ; movdqa 0x5424(%ecx),%xmm3
+ DB 102,15,111,153,40,84,0,0 ; movdqa 0x5428(%ecx),%xmm3
DB 102,15,244,195 ; pmuludq %xmm3,%xmm0
DB 102,15,244,211 ; pmuludq %xmm3,%xmm2
DB 102,15,112,218,232 ; pshufd $0xe8,%xmm2,%xmm3
@@ -53913,7 +53901,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 102,15,111,212 ; movdqa %xmm4,%xmm2
DB 102,15,254,85,168 ; paddd -0x58(%ebp),%xmm2
DB 102,15,112,194,245 ; pshufd $0xf5,%xmm2,%xmm0
- DB 102,15,111,137,36,84,0,0 ; movdqa 0x5424(%ecx),%xmm1
+ DB 102,15,111,137,40,84,0,0 ; movdqa 0x5428(%ecx),%xmm1
DB 102,15,244,209 ; pmuludq %xmm1,%xmm2
DB 102,15,244,193 ; pmuludq %xmm1,%xmm0
DB 102,15,112,240,232 ; pshufd $0xe8,%xmm0,%xmm6
@@ -53950,7 +53938,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 243,15,16,36,130 ; movss (%edx,%eax,4),%xmm4
DB 15,20,212 ; unpcklps %xmm4,%xmm2
DB 102,15,20,214 ; unpcklpd %xmm6,%xmm2
- DB 102,15,254,129,164,77,0,0 ; paddd 0x4da4(%ecx),%xmm0
+ DB 102,15,254,129,168,77,0,0 ; paddd 0x4da8(%ecx),%xmm0
DB 102,15,112,224,229 ; pshufd $0xe5,%xmm0,%xmm4
DB 102,15,126,224 ; movd %xmm4,%eax
DB 102,15,112,224,78 ; pshufd $0x4e,%xmm0,%xmm4
@@ -54018,7 +54006,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 102,15,111,93,152 ; movdqa -0x68(%ebp),%xmm3
DB 102,15,254,217 ; paddd %xmm1,%xmm3
DB 102,15,112,211,245 ; pshufd $0xf5,%xmm3,%xmm2
- DB 102,15,111,129,36,84,0,0 ; movdqa 0x5424(%ecx),%xmm0
+ DB 102,15,111,129,40,84,0,0 ; movdqa 0x5428(%ecx),%xmm0
DB 102,15,244,216 ; pmuludq %xmm0,%xmm3
DB 102,15,244,208 ; pmuludq %xmm0,%xmm2
DB 102,15,111,248 ; movdqa %xmm0,%xmm7
@@ -54057,7 +54045,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 243,15,16,28,130 ; movss (%edx,%eax,4),%xmm3
DB 15,20,235 ; unpcklps %xmm3,%xmm5
DB 102,15,20,238 ; unpcklpd %xmm6,%xmm5
- DB 102,15,254,145,164,77,0,0 ; paddd 0x4da4(%ecx),%xmm2
+ DB 102,15,254,145,168,77,0,0 ; paddd 0x4da8(%ecx),%xmm2
DB 102,15,112,218,229 ; pshufd $0xe5,%xmm2,%xmm3
DB 102,15,126,216 ; movd %xmm3,%eax
DB 102,15,112,218,78 ; pshufd $0x4e,%xmm2,%xmm3
@@ -54109,7 +54097,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 243,15,16,4,130 ; movss (%edx,%eax,4),%xmm0
DB 15,20,208 ; unpcklps %xmm0,%xmm2
DB 102,15,20,215 ; unpcklpd %xmm7,%xmm2
- DB 102,15,111,137,164,77,0,0 ; movdqa 0x4da4(%ecx),%xmm1
+ DB 102,15,111,137,168,77,0,0 ; movdqa 0x4da8(%ecx),%xmm1
DB 102,15,254,217 ; paddd %xmm1,%xmm3
DB 102,15,112,195,229 ; pshufd $0xe5,%xmm3,%xmm0
DB 102,15,126,192 ; movd %xmm0,%eax
@@ -54144,7 +54132,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 102,15,111,194 ; movdqa %xmm2,%xmm0
DB 102,15,254,69,152 ; paddd -0x68(%ebp),%xmm0
DB 102,15,112,224,245 ; pshufd $0xf5,%xmm0,%xmm4
- DB 102,15,111,169,36,84,0,0 ; movdqa 0x5424(%ecx),%xmm5
+ DB 102,15,111,169,40,84,0,0 ; movdqa 0x5428(%ecx),%xmm5
DB 102,15,111,221 ; movdqa %xmm5,%xmm3
DB 102,15,244,195 ; pmuludq %xmm3,%xmm0
DB 102,15,244,227 ; pmuludq %xmm3,%xmm4
@@ -54200,7 +54188,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 102,15,111,202 ; movdqa %xmm2,%xmm1
DB 102,15,254,77,168 ; paddd -0x58(%ebp),%xmm1
DB 102,15,112,193,245 ; pshufd $0xf5,%xmm1,%xmm0
- DB 102,15,111,145,36,84,0,0 ; movdqa 0x5424(%ecx),%xmm2
+ DB 102,15,111,145,40,84,0,0 ; movdqa 0x5428(%ecx),%xmm2
DB 102,15,244,202 ; pmuludq %xmm2,%xmm1
DB 102,15,244,194 ; pmuludq %xmm2,%xmm0
DB 102,15,112,192,232 ; pshufd $0xe8,%xmm0,%xmm0
@@ -54236,7 +54224,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 243,15,16,4,130 ; movss (%edx,%eax,4),%xmm0
DB 15,20,216 ; unpcklps %xmm0,%xmm3
DB 102,15,20,217 ; unpcklpd %xmm1,%xmm3
- DB 102,15,254,185,164,77,0,0 ; paddd 0x4da4(%ecx),%xmm7
+ DB 102,15,254,185,168,77,0,0 ; paddd 0x4da8(%ecx),%xmm7
DB 102,15,112,199,229 ; pshufd $0xe5,%xmm7,%xmm0
DB 102,15,126,192 ; movd %xmm0,%eax
DB 102,15,112,199,78 ; pshufd $0x4e,%xmm7,%xmm0
@@ -54286,7 +54274,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 102,15,111,233 ; movdqa %xmm1,%xmm5
DB 102,15,254,69,152 ; paddd -0x68(%ebp),%xmm0
DB 102,15,112,200,245 ; pshufd $0xf5,%xmm0,%xmm1
- DB 102,15,111,145,36,84,0,0 ; movdqa 0x5424(%ecx),%xmm2
+ DB 102,15,111,145,40,84,0,0 ; movdqa 0x5428(%ecx),%xmm2
DB 102,15,244,194 ; pmuludq %xmm2,%xmm0
DB 102,15,244,202 ; pmuludq %xmm2,%xmm1
DB 102,15,111,250 ; movdqa %xmm2,%xmm7
@@ -54325,7 +54313,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 243,15,16,36,130 ; movss (%edx,%eax,4),%xmm4
DB 15,20,204 ; unpcklps %xmm4,%xmm1
DB 102,15,20,203 ; unpcklpd %xmm3,%xmm1
- DB 102,15,254,145,164,77,0,0 ; paddd 0x4da4(%ecx),%xmm2
+ DB 102,15,254,145,168,77,0,0 ; paddd 0x4da8(%ecx),%xmm2
DB 102,15,112,218,229 ; pshufd $0xe5,%xmm2,%xmm3
DB 102,15,126,216 ; movd %xmm3,%eax
DB 102,15,112,218,78 ; pshufd $0x4e,%xmm2,%xmm3
@@ -54379,7 +54367,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 243,15,16,36,130 ; movss (%edx,%eax,4),%xmm4
DB 15,20,252 ; unpcklps %xmm4,%xmm7
DB 102,15,20,254 ; unpcklpd %xmm6,%xmm7
- DB 102,15,254,153,164,77,0,0 ; paddd 0x4da4(%ecx),%xmm3
+ DB 102,15,254,153,168,77,0,0 ; paddd 0x4da8(%ecx),%xmm3
DB 102,15,112,227,229 ; pshufd $0xe5,%xmm3,%xmm4
DB 102,15,126,224 ; movd %xmm4,%eax
DB 102,15,112,227,78 ; pshufd $0x4e,%xmm3,%xmm4
@@ -54412,7 +54400,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 102,15,254,208 ; paddd %xmm0,%xmm2
DB 102,15,111,216 ; movdqa %xmm0,%xmm3
DB 102,15,112,194,245 ; pshufd $0xf5,%xmm2,%xmm0
- DB 102,15,111,137,36,84,0,0 ; movdqa 0x5424(%ecx),%xmm1
+ DB 102,15,111,137,40,84,0,0 ; movdqa 0x5428(%ecx),%xmm1
DB 102,15,244,209 ; pmuludq %xmm1,%xmm2
DB 102,15,244,193 ; pmuludq %xmm1,%xmm0
DB 102,15,111,241 ; movdqa %xmm1,%xmm6
@@ -54452,7 +54440,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 15,20,225 ; unpcklps %xmm1,%xmm4
DB 102,15,20,226 ; unpcklpd %xmm2,%xmm4
DB 102,15,41,165,88,255,255,255 ; movapd %xmm4,-0xa8(%ebp)
- DB 102,15,254,129,164,77,0,0 ; paddd 0x4da4(%ecx),%xmm0
+ DB 102,15,254,129,168,77,0,0 ; paddd 0x4da8(%ecx),%xmm0
DB 102,15,112,200,229 ; pshufd $0xe5,%xmm0,%xmm1
DB 102,15,126,200 ; movd %xmm1,%eax
DB 102,15,112,200,78 ; pshufd $0x4e,%xmm0,%xmm1
@@ -54506,7 +54494,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 243,15,16,52,130 ; movss (%edx,%eax,4),%xmm6
DB 15,20,206 ; unpcklps %xmm6,%xmm1
DB 102,15,20,203 ; unpcklpd %xmm3,%xmm1
- DB 102,15,254,145,164,77,0,0 ; paddd 0x4da4(%ecx),%xmm2
+ DB 102,15,254,145,168,77,0,0 ; paddd 0x4da8(%ecx),%xmm2
DB 102,15,112,218,229 ; pshufd $0xe5,%xmm2,%xmm3
DB 102,15,126,216 ; movd %xmm3,%eax
DB 102,15,112,218,78 ; pshufd $0x4e,%xmm2,%xmm3
@@ -54557,8 +54545,8 @@ _sk_clut_4D_sse2 LABEL PROC
DB 15,92,212 ; subps %xmm4,%xmm2
DB 15,89,211 ; mulps %xmm3,%xmm2
DB 15,88,212 ; addps %xmm4,%xmm2
- DB 15,91,157,184,254,255,255 ; cvtdq2ps -0x148(%ebp),%xmm3
- DB 15,40,165,152,254,255,255 ; movaps -0x168(%ebp),%xmm4
+ DB 15,91,157,200,254,255,255 ; cvtdq2ps -0x138(%ebp),%xmm3
+ DB 15,40,165,168,254,255,255 ; movaps -0x158(%ebp),%xmm4
DB 15,92,227 ; subps %xmm3,%xmm4
DB 15,40,157,40,255,255,255 ; movaps -0xd8(%ebp),%xmm3
DB 15,92,195 ; subps %xmm3,%xmm0
@@ -54572,21 +54560,21 @@ _sk_clut_4D_sse2 LABEL PROC
DB 15,92,211 ; subps %xmm3,%xmm2
DB 15,89,212 ; mulps %xmm4,%xmm2
DB 15,88,211 ; addps %xmm3,%xmm2
- DB 139,69,8 ; mov 0x8(%ebp),%eax
- DB 139,117,12 ; mov 0xc(%ebp),%esi
- DB 141,86,8 ; lea 0x8(%esi),%edx
+ DB 139,85,12 ; mov 0xc(%ebp),%edx
+ DB 141,66,8 ; lea 0x8(%edx),%eax
DB 131,236,8 ; sub $0x8,%esp
- DB 15,40,153,100,77,0,0 ; movaps 0x4d64(%ecx),%xmm3
- DB 82 ; push %edx
+ DB 15,40,153,104,77,0,0 ; movaps 0x4d68(%ecx),%xmm3
DB 80 ; push %eax
- DB 255,86,4 ; call *0x4(%esi)
- DB 129,196,108,1,0,0 ; add $0x16c,%esp
+ DB 255,117,8 ; pushl 0x8(%ebp)
+ DB 255,82,4 ; call *0x4(%edx)
+ DB 129,196,92,1,0,0 ; add $0x15c,%esp
DB 94 ; pop %esi
DB 95 ; pop %edi
DB 91 ; pop %ebx
DB 93 ; pop %ebp
DB 195 ; ret
DB 144 ; nop
+ DB 144 ; nop
PUBLIC _sk_start_pipeline_sse2_lowp
_sk_start_pipeline_sse2_lowp LABEL PROC
@@ -54599,7 +54587,7 @@ _sk_start_pipeline_sse2_lowp LABEL PROC
DB 131,236,96 ; sub $0x60,%esp
DB 139,125,12 ; mov 0xc(%ebp),%edi
DB 59,125,20 ; cmp 0x14(%ebp),%edi
- DB 15,131,198,0,0,0 ; jae 94b6 <_sk_start_pipeline_sse2_lowp+0xde>
+ DB 15,131,198,0,0,0 ; jae 9492 <_sk_start_pipeline_sse2_lowp+0xde>
DB 139,85,16 ; mov 0x10(%ebp),%edx
DB 139,69,8 ; mov 0x8(%ebp),%eax
DB 139,117,24 ; mov 0x18(%ebp),%esi
@@ -54613,7 +54601,7 @@ _sk_start_pipeline_sse2_lowp LABEL PROC
DB 139,69,8 ; mov 0x8(%ebp),%eax
DB 137,223 ; mov %ebx,%edi
DB 137,243 ; mov %esi,%ebx
- DB 119,78 ; ja 9467 <_sk_start_pipeline_sse2_lowp+0x8f>
+ DB 119,78 ; ja 9443 <_sk_start_pipeline_sse2_lowp+0x8f>
DB 139,117,8 ; mov 0x8(%ebp),%esi
DB 15,41,68,36,64 ; movaps %xmm0,0x40(%esp)
DB 15,41,68,36,48 ; movaps %xmm0,0x30(%esp)
@@ -54635,13 +54623,13 @@ _sk_start_pipeline_sse2_lowp LABEL PROC
DB 131,198,16 ; add $0x10,%esi
DB 57,214 ; cmp %edx,%esi
DB 137,198 ; mov %eax,%esi
- DB 118,181 ; jbe 941c <_sk_start_pipeline_sse2_lowp+0x44>
+ DB 118,181 ; jbe 93f8 <_sk_start_pipeline_sse2_lowp+0x44>
DB 137,209 ; mov %edx,%ecx
DB 41,193 ; sub %eax,%ecx
DB 137,222 ; mov %ebx,%esi
DB 137,251 ; mov %edi,%ebx
DB 139,124,36,84 ; mov 0x54(%esp),%edi
- DB 116,55 ; je 94ac <_sk_start_pipeline_sse2_lowp+0xd4>
+ DB 116,55 ; je 9488 <_sk_start_pipeline_sse2_lowp+0xd4>
DB 15,41,68,36,64 ; movaps %xmm0,0x40(%esp)
DB 15,41,68,36,48 ; movaps %xmm0,0x30(%esp)
DB 15,41,68,36,32 ; movaps %xmm0,0x20(%esp)
@@ -54659,7 +54647,7 @@ _sk_start_pipeline_sse2_lowp LABEL PROC
DB 139,85,16 ; mov 0x10(%ebp),%edx
DB 71 ; inc %edi
DB 59,125,20 ; cmp 0x14(%ebp),%edi
- DB 15,133,82,255,255,255 ; jne 9408 <_sk_start_pipeline_sse2_lowp+0x30>
+ DB 15,133,82,255,255,255 ; jne 93e4 <_sk_start_pipeline_sse2_lowp+0x30>
DB 141,101,244 ; lea -0xc(%ebp),%esp
DB 94 ; pop %esi
DB 95 ; pop %edi
@@ -54725,7 +54713,7 @@ _sk_black_color_sse2_lowp LABEL PROC
DB 87 ; push %edi
DB 86 ; push %esi
DB 131,236,92 ; sub $0x5c,%esp
- DB 232,0,0,0,0 ; call 9565 <_sk_black_color_sse2_lowp+0xe>
+ DB 232,0,0,0,0 ; call 9541 <_sk_black_color_sse2_lowp+0xe>
DB 88 ; pop %eax
DB 139,77,8 ; mov 0x8(%ebp),%ecx
DB 139,85,16 ; mov 0x10(%ebp),%edx
@@ -54744,7 +54732,7 @@ _sk_black_color_sse2_lowp LABEL PROC
DB 137,84,36,8 ; mov %edx,0x8(%esp)
DB 137,92,36,4 ; mov %ebx,0x4(%esp)
DB 137,12,36 ; mov %ecx,(%esp)
- DB 15,40,152,91,62,0,0 ; movaps 0x3e5b(%eax),%xmm3
+ DB 15,40,152,95,62,0,0 ; movaps 0x3e5f(%eax),%xmm3
DB 15,87,192 ; xorps %xmm0,%xmm0
DB 15,87,201 ; xorps %xmm1,%xmm1
DB 15,87,210 ; xorps %xmm2,%xmm2
@@ -54764,7 +54752,7 @@ _sk_white_color_sse2_lowp LABEL PROC
DB 87 ; push %edi
DB 86 ; push %esi
DB 131,236,92 ; sub $0x5c,%esp
- DB 232,0,0,0,0 ; call 95d0 <_sk_white_color_sse2_lowp+0xe>
+ DB 232,0,0,0,0 ; call 95ac <_sk_white_color_sse2_lowp+0xe>
DB 88 ; pop %eax
DB 139,77,8 ; mov 0x8(%ebp),%ecx
DB 139,85,16 ; mov 0x10(%ebp),%edx
@@ -54783,7 +54771,7 @@ _sk_white_color_sse2_lowp LABEL PROC
DB 137,84,36,8 ; mov %edx,0x8(%esp)
DB 137,92,36,4 ; mov %ebx,0x4(%esp)
DB 137,12,36 ; mov %ecx,(%esp)
- DB 15,40,128,240,61,0,0 ; movaps 0x3df0(%eax),%xmm0
+ DB 15,40,128,244,61,0,0 ; movaps 0x3df4(%eax),%xmm0
DB 15,40,200 ; movaps %xmm0,%xmm1
DB 15,40,208 ; movaps %xmm0,%xmm2
DB 15,40,216 ; movaps %xmm0,%xmm3
@@ -54802,16 +54790,16 @@ _sk_set_rgb_sse2_lowp LABEL PROC
DB 87 ; push %edi
DB 86 ; push %esi
DB 131,236,80 ; sub $0x50,%esp
- DB 232,0,0,0,0 ; call 963a <_sk_set_rgb_sse2_lowp+0xd>
+ DB 232,0,0,0,0 ; call 9616 <_sk_set_rgb_sse2_lowp+0xd>
DB 94 ; pop %esi
DB 139,69,8 ; mov 0x8(%ebp),%eax
DB 139,85,16 ; mov 0x10(%ebp),%edx
DB 139,77,12 ; mov 0xc(%ebp),%ecx
DB 139,57 ; mov (%ecx),%edi
- DB 243,15,16,150,74,62,0,0 ; movss 0x3e4a(%esi),%xmm2
+ DB 243,15,16,150,78,62,0,0 ; movss 0x3e4e(%esi),%xmm2
DB 243,15,16,7 ; movss (%edi),%xmm0
DB 243,15,89,194 ; mulss %xmm2,%xmm0
- DB 243,15,16,142,70,62,0,0 ; movss 0x3e46(%esi),%xmm1
+ DB 243,15,16,142,74,62,0,0 ; movss 0x3e4a(%esi),%xmm1
DB 243,15,88,193 ; addss %xmm1,%xmm0
DB 243,15,44,240 ; cvttss2si %xmm0,%esi
DB 102,15,110,198 ; movd %esi,%xmm0
@@ -54858,7 +54846,7 @@ _sk_premul_sse2_lowp LABEL PROC
DB 87 ; push %edi
DB 86 ; push %esi
DB 131,236,80 ; sub $0x50,%esp
- DB 232,0,0,0,0 ; call 96fe <_sk_premul_sse2_lowp+0xd>
+ DB 232,0,0,0,0 ; call 96da <_sk_premul_sse2_lowp+0xd>
DB 90 ; pop %edx
DB 139,69,8 ; mov 0x8(%ebp),%eax
DB 139,77,16 ; mov 0x10(%ebp),%ecx
@@ -54867,7 +54855,7 @@ _sk_premul_sse2_lowp LABEL PROC
DB 15,40,109,40 ; movaps 0x28(%ebp),%xmm5
DB 15,40,117,56 ; movaps 0x38(%ebp),%xmm6
DB 102,15,213,195 ; pmullw %xmm3,%xmm0
- DB 102,15,111,186,194,60,0,0 ; movdqa 0x3cc2(%edx),%xmm7
+ DB 102,15,111,186,198,60,0,0 ; movdqa 0x3cc6(%edx),%xmm7
DB 102,15,253,199 ; paddw %xmm7,%xmm0
DB 102,15,213,203 ; pmullw %xmm3,%xmm1
DB 102,15,253,207 ; paddw %xmm7,%xmm1
@@ -54993,12 +54981,12 @@ _sk_invert_sse2_lowp LABEL PROC
DB 87 ; push %edi
DB 86 ; push %esi
DB 131,236,80 ; sub $0x50,%esp
- DB 232,0,0,0,0 ; call 9878 <_sk_invert_sse2_lowp+0xd>
+ DB 232,0,0,0,0 ; call 9854 <_sk_invert_sse2_lowp+0xd>
DB 88 ; pop %eax
DB 139,77,8 ; mov 0x8(%ebp),%ecx
DB 139,85,16 ; mov 0x10(%ebp),%edx
DB 139,117,20 ; mov 0x14(%ebp),%esi
- DB 102,15,111,160,72,59,0,0 ; movdqa 0x3b48(%eax),%xmm4
+ DB 102,15,111,160,76,59,0,0 ; movdqa 0x3b4c(%eax),%xmm4
DB 102,15,111,236 ; movdqa %xmm4,%xmm5
DB 102,15,249,232 ; psubw %xmm0,%xmm5
DB 102,15,111,244 ; movdqa %xmm4,%xmm6
@@ -55076,11 +55064,11 @@ _sk_srcatop_sse2_lowp LABEL PROC
DB 102,15,111,234 ; movdqa %xmm2,%xmm5
DB 102,15,111,209 ; movdqa %xmm1,%xmm2
DB 102,15,111,200 ; movdqa %xmm0,%xmm1
- DB 232,0,0,0,0 ; call 9970 <_sk_srcatop_sse2_lowp+0x19>
+ DB 232,0,0,0,0 ; call 994c <_sk_srcatop_sse2_lowp+0x19>
DB 88 ; pop %eax
DB 102,15,111,117,72 ; movdqa 0x48(%ebp),%xmm6
DB 102,15,213,206 ; pmullw %xmm6,%xmm1
- DB 102,15,111,128,80,58,0,0 ; movdqa 0x3a50(%eax),%xmm0
+ DB 102,15,111,128,84,58,0,0 ; movdqa 0x3a54(%eax),%xmm0
DB 102,15,253,200 ; paddw %xmm0,%xmm1
DB 102,15,213,214 ; pmullw %xmm6,%xmm2
DB 102,15,253,208 ; paddw %xmm0,%xmm2
@@ -55136,12 +55124,12 @@ _sk_dstatop_sse2_lowp LABEL PROC
DB 87 ; push %edi
DB 86 ; push %esi
DB 131,236,80 ; sub $0x50,%esp
- DB 232,0,0,0,0 ; call 9a44 <_sk_dstatop_sse2_lowp+0xd>
+ DB 232,0,0,0,0 ; call 9a20 <_sk_dstatop_sse2_lowp+0xd>
DB 88 ; pop %eax
DB 102,15,111,101,40 ; movdqa 0x28(%ebp),%xmm4
DB 102,15,111,117,24 ; movdqa 0x18(%ebp),%xmm6
DB 102,15,213,243 ; pmullw %xmm3,%xmm6
- DB 102,15,111,184,124,57,0,0 ; movdqa 0x397c(%eax),%xmm7
+ DB 102,15,111,184,128,57,0,0 ; movdqa 0x3980(%eax),%xmm7
DB 102,15,253,247 ; paddw %xmm7,%xmm6
DB 102,15,213,227 ; pmullw %xmm3,%xmm4
DB 102,15,253,231 ; paddw %xmm7,%xmm4
@@ -55192,7 +55180,7 @@ _sk_srcin_sse2_lowp LABEL PROC
DB 87 ; push %edi
DB 86 ; push %esi
DB 131,236,80 ; sub $0x50,%esp
- DB 232,0,0,0,0 ; call 9b05 <_sk_srcin_sse2_lowp+0xd>
+ DB 232,0,0,0,0 ; call 9ae1 <_sk_srcin_sse2_lowp+0xd>
DB 94 ; pop %esi
DB 139,69,8 ; mov 0x8(%ebp),%eax
DB 139,77,16 ; mov 0x10(%ebp),%ecx
@@ -55201,7 +55189,7 @@ _sk_srcin_sse2_lowp LABEL PROC
DB 15,40,109,40 ; movaps 0x28(%ebp),%xmm5
DB 102,15,111,117,72 ; movdqa 0x48(%ebp),%xmm6
DB 102,15,213,198 ; pmullw %xmm6,%xmm0
- DB 102,15,111,190,187,56,0,0 ; movdqa 0x38bb(%esi),%xmm7
+ DB 102,15,111,190,191,56,0,0 ; movdqa 0x38bf(%esi),%xmm7
DB 102,15,253,199 ; paddw %xmm7,%xmm0
DB 102,15,213,206 ; pmullw %xmm6,%xmm1
DB 102,15,253,207 ; paddw %xmm7,%xmm1
@@ -55238,14 +55226,14 @@ _sk_dstin_sse2_lowp LABEL PROC
DB 87 ; push %edi
DB 86 ; push %esi
DB 131,236,80 ; sub $0x50,%esp
- DB 232,0,0,0,0 ; call 9b9c <_sk_dstin_sse2_lowp+0xd>
+ DB 232,0,0,0,0 ; call 9b78 <_sk_dstin_sse2_lowp+0xd>
DB 88 ; pop %eax
DB 102,15,111,85,56 ; movdqa 0x38(%ebp),%xmm2
DB 102,15,111,109,40 ; movdqa 0x28(%ebp),%xmm5
DB 102,15,111,117,24 ; movdqa 0x18(%ebp),%xmm6
DB 102,15,111,198 ; movdqa %xmm6,%xmm0
DB 102,15,213,195 ; pmullw %xmm3,%xmm0
- DB 102,15,111,184,36,56,0,0 ; movdqa 0x3824(%eax),%xmm7
+ DB 102,15,111,184,40,56,0,0 ; movdqa 0x3828(%eax),%xmm7
DB 102,15,253,199 ; paddw %xmm7,%xmm0
DB 102,15,111,205 ; movdqa %xmm5,%xmm1
DB 102,15,213,203 ; pmullw %xmm3,%xmm1
@@ -55287,14 +55275,14 @@ _sk_srcout_sse2_lowp LABEL PROC
DB 87 ; push %edi
DB 86 ; push %esi
DB 131,236,80 ; sub $0x50,%esp
- DB 232,0,0,0,0 ; call 9c44 <_sk_srcout_sse2_lowp+0xd>
+ DB 232,0,0,0,0 ; call 9c20 <_sk_srcout_sse2_lowp+0xd>
DB 94 ; pop %esi
DB 139,69,8 ; mov 0x8(%ebp),%eax
DB 139,77,16 ; mov 0x10(%ebp),%ecx
DB 139,85,20 ; mov 0x14(%ebp),%edx
DB 15,40,101,24 ; movaps 0x18(%ebp),%xmm4
DB 102,15,111,109,72 ; movdqa 0x48(%ebp),%xmm5
- DB 102,15,111,182,124,55,0,0 ; movdqa 0x377c(%esi),%xmm6
+ DB 102,15,111,182,128,55,0,0 ; movdqa 0x3780(%esi),%xmm6
DB 102,15,111,254 ; movdqa %xmm6,%xmm7
DB 102,15,249,253 ; psubw %xmm5,%xmm7
DB 102,15,213,199 ; pmullw %xmm7,%xmm0
@@ -55336,11 +55324,11 @@ _sk_dstout_sse2_lowp LABEL PROC
DB 86 ; push %esi
DB 131,236,80 ; sub $0x50,%esp
DB 102,15,111,195 ; movdqa %xmm3,%xmm0
- DB 232,0,0,0,0 ; call 9ce7 <_sk_dstout_sse2_lowp+0x11>
+ DB 232,0,0,0,0 ; call 9cc3 <_sk_dstout_sse2_lowp+0x11>
DB 88 ; pop %eax
DB 102,15,111,109,56 ; movdqa 0x38(%ebp),%xmm5
DB 102,15,111,117,24 ; movdqa 0x18(%ebp),%xmm6
- DB 102,15,111,184,217,54,0,0 ; movdqa 0x36d9(%eax),%xmm7
+ DB 102,15,111,184,221,54,0,0 ; movdqa 0x36dd(%eax),%xmm7
DB 102,15,111,223 ; movdqa %xmm7,%xmm3
DB 102,15,249,216 ; psubw %xmm0,%xmm3
DB 102,15,111,195 ; movdqa %xmm3,%xmm0
@@ -55390,9 +55378,9 @@ _sk_srcover_sse2_lowp LABEL PROC
DB 15,41,85,232 ; movaps %xmm2,-0x18(%ebp)
DB 102,15,111,209 ; movdqa %xmm1,%xmm2
DB 102,15,111,224 ; movdqa %xmm0,%xmm4
- DB 232,0,0,0,0 ; call 9da3 <_sk_srcover_sse2_lowp+0x19>
+ DB 232,0,0,0,0 ; call 9d7f <_sk_srcover_sse2_lowp+0x19>
DB 88 ; pop %eax
- DB 102,15,111,136,29,54,0,0 ; movdqa 0x361d(%eax),%xmm1
+ DB 102,15,111,136,33,54,0,0 ; movdqa 0x3621(%eax),%xmm1
DB 102,15,111,193 ; movdqa %xmm1,%xmm0
DB 102,15,249,195 ; psubw %xmm3,%xmm0
DB 102,15,111,248 ; movdqa %xmm0,%xmm7
@@ -55449,7 +55437,7 @@ _sk_dstover_sse2_lowp LABEL PROC
DB 87 ; push %edi
DB 86 ; push %esi
DB 131,236,80 ; sub $0x50,%esp
- DB 232,0,0,0,0 ; call 9e73 <_sk_dstover_sse2_lowp+0xd>
+ DB 232,0,0,0,0 ; call 9e4f <_sk_dstover_sse2_lowp+0xd>
DB 95 ; pop %edi
DB 139,77,8 ; mov 0x8(%ebp),%ecx
DB 139,85,16 ; mov 0x10(%ebp),%edx
@@ -55457,7 +55445,7 @@ _sk_dstover_sse2_lowp LABEL PROC
DB 139,69,12 ; mov 0xc(%ebp),%eax
DB 102,15,111,101,56 ; movdqa 0x38(%ebp),%xmm4
DB 102,15,111,109,72 ; movdqa 0x48(%ebp),%xmm5
- DB 102,15,111,183,77,53,0,0 ; movdqa 0x354d(%edi),%xmm6
+ DB 102,15,111,183,81,53,0,0 ; movdqa 0x3551(%edi),%xmm6
DB 102,15,111,254 ; movdqa %xmm6,%xmm7
DB 102,15,249,253 ; psubw %xmm5,%xmm7
DB 102,15,213,199 ; pmullw %xmm7,%xmm0
@@ -55501,12 +55489,12 @@ _sk_modulate_sse2_lowp LABEL PROC
DB 87 ; push %edi
DB 86 ; push %esi
DB 131,236,80 ; sub $0x50,%esp
- DB 232,0,0,0,0 ; call 9f28 <_sk_modulate_sse2_lowp+0xd>
+ DB 232,0,0,0,0 ; call 9f04 <_sk_modulate_sse2_lowp+0xd>
DB 88 ; pop %eax
DB 102,15,111,109,40 ; movdqa 0x28(%ebp),%xmm5
DB 102,15,111,117,24 ; movdqa 0x18(%ebp),%xmm6
DB 102,15,213,198 ; pmullw %xmm6,%xmm0
- DB 102,15,111,184,152,52,0,0 ; movdqa 0x3498(%eax),%xmm7
+ DB 102,15,111,184,156,52,0,0 ; movdqa 0x349c(%eax),%xmm7
DB 102,15,253,199 ; paddw %xmm7,%xmm0
DB 102,15,213,205 ; pmullw %xmm5,%xmm1
DB 102,15,253,207 ; paddw %xmm7,%xmm1
@@ -55547,10 +55535,10 @@ _sk_multiply_sse2_lowp LABEL PROC
DB 87 ; push %edi
DB 86 ; push %esi
DB 131,236,80 ; sub $0x50,%esp
- DB 232,0,0,0,0 ; call 9fc4 <_sk_multiply_sse2_lowp+0xd>
+ DB 232,0,0,0,0 ; call 9fa0 <_sk_multiply_sse2_lowp+0xd>
DB 88 ; pop %eax
DB 102,15,111,109,24 ; movdqa 0x18(%ebp),%xmm5
- DB 102,15,111,160,252,51,0,0 ; movdqa 0x33fc(%eax),%xmm4
+ DB 102,15,111,160,0,52,0,0 ; movdqa 0x3400(%eax),%xmm4
DB 102,15,111,245 ; movdqa %xmm5,%xmm6
DB 102,15,253,244 ; paddw %xmm4,%xmm6
DB 102,15,249,117,72 ; psubw 0x48(%ebp),%xmm6
@@ -55618,17 +55606,17 @@ _sk_plus__sse2_lowp LABEL PROC
DB 131,236,96 ; sub $0x60,%esp
DB 102,15,111,225 ; movdqa %xmm1,%xmm4
DB 102,15,111,200 ; movdqa %xmm0,%xmm1
- DB 232,0,0,0,0 ; call a0c5 <_sk_plus__sse2_lowp+0x15>
+ DB 232,0,0,0,0 ; call a0a1 <_sk_plus__sse2_lowp+0x15>
DB 88 ; pop %eax
DB 102,15,253,77,24 ; paddw 0x18(%ebp),%xmm1
- DB 102,15,111,168,11,51,0,0 ; movdqa 0x330b(%eax),%xmm5
+ DB 102,15,111,168,15,51,0,0 ; movdqa 0x330f(%eax),%xmm5
DB 102,15,111,193 ; movdqa %xmm1,%xmm0
DB 102,15,217,197 ; psubusw %xmm5,%xmm0
DB 102,15,127,109,232 ; movdqa %xmm5,-0x18(%ebp)
DB 102,15,239,255 ; pxor %xmm7,%xmm7
DB 102,15,117,199 ; pcmpeqw %xmm7,%xmm0
DB 102,15,219,200 ; pand %xmm0,%xmm1
- DB 102,15,111,176,251,50,0,0 ; movdqa 0x32fb(%eax),%xmm6
+ DB 102,15,111,176,255,50,0,0 ; movdqa 0x32ff(%eax),%xmm6
DB 102,15,223,198 ; pandn %xmm6,%xmm0
DB 102,15,235,193 ; por %xmm1,%xmm0
DB 102,15,253,101,40 ; paddw 0x28(%ebp),%xmm4
@@ -55687,14 +55675,14 @@ _sk_screen_sse2_lowp LABEL PROC
DB 131,236,80 ; sub $0x50,%esp
DB 102,15,111,225 ; movdqa %xmm1,%xmm4
DB 102,15,111,200 ; movdqa %xmm0,%xmm1
- DB 232,0,0,0,0 ; call a1bd <_sk_screen_sse2_lowp+0x15>
+ DB 232,0,0,0,0 ; call a199 <_sk_screen_sse2_lowp+0x15>
DB 88 ; pop %eax
DB 102,15,111,109,40 ; movdqa 0x28(%ebp),%xmm5
DB 102,15,111,117,24 ; movdqa 0x18(%ebp),%xmm6
DB 102,15,111,198 ; movdqa %xmm6,%xmm0
DB 102,15,253,193 ; paddw %xmm1,%xmm0
DB 102,15,213,206 ; pmullw %xmm6,%xmm1
- DB 102,15,111,176,3,50,0,0 ; movdqa 0x3203(%eax),%xmm6
+ DB 102,15,111,176,7,50,0,0 ; movdqa 0x3207(%eax),%xmm6
DB 102,15,253,206 ; paddw %xmm6,%xmm1
DB 102,15,113,209,8 ; psrlw $0x8,%xmm1
DB 102,15,249,193 ; psubw %xmm1,%xmm0
@@ -55750,9 +55738,9 @@ _sk_xor__sse2_lowp LABEL PROC
DB 86 ; push %esi
DB 131,236,96 ; sub $0x60,%esp
DB 102,15,127,93,232 ; movdqa %xmm3,-0x18(%ebp)
- DB 232,0,0,0,0 ; call a29d <_sk_xor__sse2_lowp+0x12>
+ DB 232,0,0,0,0 ; call a279 <_sk_xor__sse2_lowp+0x12>
DB 88 ; pop %eax
- DB 102,15,111,176,35,49,0,0 ; movdqa 0x3123(%eax),%xmm6
+ DB 102,15,111,176,39,49,0,0 ; movdqa 0x3127(%eax),%xmm6
DB 102,15,111,254 ; movdqa %xmm6,%xmm7
DB 102,15,249,125,72 ; psubw 0x48(%ebp),%xmm7
DB 102,15,213,199 ; pmullw %xmm7,%xmm0
@@ -55817,7 +55805,7 @@ _sk_darken_sse2_lowp LABEL PROC
DB 15,41,85,200 ; movaps %xmm2,-0x38(%ebp)
DB 102,15,111,225 ; movdqa %xmm1,%xmm4
DB 102,15,111,200 ; movdqa %xmm0,%xmm1
- DB 232,0,0,0,0 ; call a392 <_sk_darken_sse2_lowp+0x25>
+ DB 232,0,0,0,0 ; call a36e <_sk_darken_sse2_lowp+0x25>
DB 88 ; pop %eax
DB 102,15,111,117,72 ; movdqa 0x48(%ebp),%xmm6
DB 102,15,111,109,24 ; movdqa 0x18(%ebp),%xmm5
@@ -55828,7 +55816,7 @@ _sk_darken_sse2_lowp LABEL PROC
DB 102,15,111,222 ; movdqa %xmm6,%xmm3
DB 102,15,111,197 ; movdqa %xmm5,%xmm0
DB 102,15,213,199 ; pmullw %xmm7,%xmm0
- DB 102,15,111,184,78,48,0,0 ; movdqa 0x304e(%eax),%xmm7
+ DB 102,15,111,184,82,48,0,0 ; movdqa 0x3052(%eax),%xmm7
DB 102,15,111,241 ; movdqa %xmm1,%xmm6
DB 102,15,239,247 ; pxor %xmm7,%xmm6
DB 102,15,111,232 ; movdqa %xmm0,%xmm5
@@ -55837,7 +55825,7 @@ _sk_darken_sse2_lowp LABEL PROC
DB 102,15,219,197 ; pand %xmm5,%xmm0
DB 102,15,223,233 ; pandn %xmm1,%xmm5
DB 102,15,235,232 ; por %xmm0,%xmm5
- DB 102,15,111,128,46,48,0,0 ; movdqa 0x302e(%eax),%xmm0
+ DB 102,15,111,128,50,48,0,0 ; movdqa 0x3032(%eax),%xmm0
DB 102,15,127,69,232 ; movdqa %xmm0,-0x18(%ebp)
DB 102,15,253,232 ; paddw %xmm0,%xmm5
DB 102,15,113,213,8 ; psrlw $0x8,%xmm5
@@ -55926,7 +55914,7 @@ _sk_lighten_sse2_lowp LABEL PROC
DB 15,41,85,200 ; movaps %xmm2,-0x38(%ebp)
DB 102,15,111,225 ; movdqa %xmm1,%xmm4
DB 102,15,111,200 ; movdqa %xmm0,%xmm1
- DB 232,0,0,0,0 ; call a53b <_sk_lighten_sse2_lowp+0x25>
+ DB 232,0,0,0,0 ; call a517 <_sk_lighten_sse2_lowp+0x25>
DB 88 ; pop %eax
DB 102,15,111,109,24 ; movdqa 0x18(%ebp),%xmm5
DB 102,15,111,197 ; movdqa %xmm5,%xmm0
@@ -55935,7 +55923,7 @@ _sk_lighten_sse2_lowp LABEL PROC
DB 102,15,213,77,72 ; pmullw 0x48(%ebp),%xmm1
DB 102,15,111,197 ; movdqa %xmm5,%xmm0
DB 102,15,213,198 ; pmullw %xmm6,%xmm0
- DB 102,15,111,184,165,46,0,0 ; movdqa 0x2ea5(%eax),%xmm7
+ DB 102,15,111,184,169,46,0,0 ; movdqa 0x2ea9(%eax),%xmm7
DB 102,15,111,241 ; movdqa %xmm1,%xmm6
DB 102,15,239,247 ; pxor %xmm7,%xmm6
DB 102,15,111,232 ; movdqa %xmm0,%xmm5
@@ -55944,7 +55932,7 @@ _sk_lighten_sse2_lowp LABEL PROC
DB 102,15,219,205 ; pand %xmm5,%xmm1
DB 102,15,223,232 ; pandn %xmm0,%xmm5
DB 102,15,235,233 ; por %xmm1,%xmm5
- DB 102,15,111,128,133,46,0,0 ; movdqa 0x2e85(%eax),%xmm0
+ DB 102,15,111,128,137,46,0,0 ; movdqa 0x2e89(%eax),%xmm0
DB 102,15,253,232 ; paddw %xmm0,%xmm5
DB 102,15,111,208 ; movdqa %xmm0,%xmm2
DB 102,15,127,85,232 ; movdqa %xmm2,-0x18(%ebp)
@@ -56032,7 +56020,7 @@ _sk_difference_sse2_lowp LABEL PROC
DB 15,41,85,184 ; movaps %xmm2,-0x48(%ebp)
DB 102,15,111,225 ; movdqa %xmm1,%xmm4
DB 102,15,111,200 ; movdqa %xmm0,%xmm1
- DB 232,0,0,0,0 ; call a6d9 <_sk_difference_sse2_lowp+0x25>
+ DB 232,0,0,0,0 ; call a6b5 <_sk_difference_sse2_lowp+0x25>
DB 88 ; pop %eax
DB 102,15,111,117,72 ; movdqa 0x48(%ebp),%xmm6
DB 102,15,111,109,24 ; movdqa 0x18(%ebp),%xmm5
@@ -56043,7 +56031,7 @@ _sk_difference_sse2_lowp LABEL PROC
DB 102,15,111,222 ; movdqa %xmm6,%xmm3
DB 102,15,111,197 ; movdqa %xmm5,%xmm0
DB 102,15,213,199 ; pmullw %xmm7,%xmm0
- DB 102,15,111,184,7,45,0,0 ; movdqa 0x2d07(%eax),%xmm7
+ DB 102,15,111,184,11,45,0,0 ; movdqa 0x2d0b(%eax),%xmm7
DB 102,15,111,241 ; movdqa %xmm1,%xmm6
DB 102,15,239,247 ; pxor %xmm7,%xmm6
DB 102,15,111,232 ; movdqa %xmm0,%xmm5
@@ -56052,11 +56040,11 @@ _sk_difference_sse2_lowp LABEL PROC
DB 102,15,219,205 ; pand %xmm5,%xmm1
DB 102,15,223,232 ; pandn %xmm0,%xmm5
DB 102,15,235,233 ; por %xmm1,%xmm5
- DB 102,15,111,128,231,44,0,0 ; movdqa 0x2ce7(%eax),%xmm0
+ DB 102,15,111,128,235,44,0,0 ; movdqa 0x2ceb(%eax),%xmm0
DB 102,15,127,69,216 ; movdqa %xmm0,-0x28(%ebp)
DB 102,15,253,232 ; paddw %xmm0,%xmm5
DB 102,15,113,213,7 ; psrlw $0x7,%xmm5
- DB 102,15,111,128,23,45,0,0 ; movdqa 0x2d17(%eax),%xmm0
+ DB 102,15,111,128,27,45,0,0 ; movdqa 0x2d1b(%eax),%xmm0
DB 102,15,127,69,232 ; movdqa %xmm0,-0x18(%ebp)
DB 102,15,219,232 ; pand %xmm0,%xmm5
DB 102,15,249,213 ; psubw %xmm5,%xmm2
@@ -56143,16 +56131,16 @@ _sk_exclusion_sse2_lowp LABEL PROC
DB 131,236,80 ; sub $0x50,%esp
DB 102,15,111,225 ; movdqa %xmm1,%xmm4
DB 102,15,111,200 ; movdqa %xmm0,%xmm1
- DB 232,0,0,0,0 ; call a88d <_sk_exclusion_sse2_lowp+0x15>
+ DB 232,0,0,0,0 ; call a869 <_sk_exclusion_sse2_lowp+0x15>
DB 88 ; pop %eax
DB 102,15,111,109,24 ; movdqa 0x18(%ebp),%xmm5
DB 102,15,111,197 ; movdqa %xmm5,%xmm0
DB 102,15,253,193 ; paddw %xmm1,%xmm0
DB 102,15,213,205 ; pmullw %xmm5,%xmm1
- DB 102,15,111,184,51,43,0,0 ; movdqa 0x2b33(%eax),%xmm7
+ DB 102,15,111,184,55,43,0,0 ; movdqa 0x2b37(%eax),%xmm7
DB 102,15,253,207 ; paddw %xmm7,%xmm1
DB 102,15,113,209,7 ; psrlw $0x7,%xmm1
- DB 102,15,111,176,99,43,0,0 ; movdqa 0x2b63(%eax),%xmm6
+ DB 102,15,111,176,103,43,0,0 ; movdqa 0x2b67(%eax),%xmm6
DB 102,15,219,206 ; pand %xmm6,%xmm1
DB 102,15,249,193 ; psubw %xmm1,%xmm0
DB 102,15,111,109,40 ; movdqa 0x28(%ebp),%xmm5
@@ -56211,9 +56199,9 @@ _sk_hardlight_sse2_lowp LABEL PROC
DB 15,41,85,152 ; movaps %xmm2,-0x68(%ebp)
DB 102,15,111,233 ; movdqa %xmm1,%xmm5
DB 102,15,111,224 ; movdqa %xmm0,%xmm4
- DB 232,0,0,0,0 ; call a987 <_sk_hardlight_sse2_lowp+0x1c>
+ DB 232,0,0,0,0 ; call a963 <_sk_hardlight_sse2_lowp+0x1c>
DB 88 ; pop %eax
- DB 102,15,111,184,57,42,0,0 ; movdqa 0x2a39(%eax),%xmm7
+ DB 102,15,111,184,61,42,0,0 ; movdqa 0x2a3d(%eax),%xmm7
DB 102,15,127,125,200 ; movdqa %xmm7,-0x38(%ebp)
DB 102,15,111,215 ; movdqa %xmm7,%xmm2
DB 102,15,249,85,72 ; psubw 0x48(%ebp),%xmm2
@@ -56240,7 +56228,7 @@ _sk_hardlight_sse2_lowp LABEL PROC
DB 102,15,111,214 ; movdqa %xmm6,%xmm2
DB 102,15,249,209 ; psubw %xmm1,%xmm2
DB 102,15,253,228 ; paddw %xmm4,%xmm4
- DB 102,15,111,128,89,42,0,0 ; movdqa 0x2a59(%eax),%xmm0
+ DB 102,15,111,128,93,42,0,0 ; movdqa 0x2a5d(%eax),%xmm0
DB 102,15,239,216 ; pxor %xmm0,%xmm3
DB 102,15,127,93,184 ; movdqa %xmm3,-0x48(%ebp)
DB 102,15,111,204 ; movdqa %xmm4,%xmm1
@@ -56345,10 +56333,10 @@ _sk_overlay_sse2_lowp LABEL PROC
DB 15,41,85,152 ; movaps %xmm2,-0x68(%ebp)
DB 15,41,141,120,255,255,255 ; movaps %xmm1,-0x88(%ebp)
DB 102,15,111,200 ; movdqa %xmm0,%xmm1
- DB 232,0,0,0,0 ; call aba9 <_sk_overlay_sse2_lowp+0x1f>
+ DB 232,0,0,0,0 ; call ab85 <_sk_overlay_sse2_lowp+0x1f>
DB 88 ; pop %eax
DB 102,15,111,69,72 ; movdqa 0x48(%ebp),%xmm0
- DB 102,15,111,184,23,40,0,0 ; movdqa 0x2817(%eax),%xmm7
+ DB 102,15,111,184,27,40,0,0 ; movdqa 0x281b(%eax),%xmm7
DB 102,15,127,125,232 ; movdqa %xmm7,-0x18(%ebp)
DB 102,15,111,215 ; movdqa %xmm7,%xmm2
DB 102,15,249,208 ; psubw %xmm0,%xmm2
@@ -56375,7 +56363,7 @@ _sk_overlay_sse2_lowp LABEL PROC
DB 102,15,249,234 ; psubw %xmm2,%xmm5
DB 102,15,111,195 ; movdqa %xmm3,%xmm0
DB 102,15,253,192 ; paddw %xmm0,%xmm0
- DB 102,15,111,144,55,40,0,0 ; movdqa 0x2837(%eax),%xmm2
+ DB 102,15,111,144,59,40,0,0 ; movdqa 0x283b(%eax),%xmm2
DB 102,15,127,85,184 ; movdqa %xmm2,-0x48(%ebp)
DB 102,15,239,226 ; pxor %xmm2,%xmm4
DB 102,15,239,194 ; pxor %xmm2,%xmm0
@@ -56503,10 +56491,10 @@ _sk_load_8888_sse2_lowp LABEL PROC
DB 128,225,7 ; and $0x7,%cl
DB 254,201 ; dec %cl
DB 128,249,6 ; cmp $0x6,%cl
- DB 232,0,0,0,0 ; call ae18 <_sk_load_8888_sse2_lowp+0x30>
+ DB 232,0,0,0,0 ; call adf4 <_sk_load_8888_sse2_lowp+0x30>
DB 95 ; pop %edi
DB 139,117,16 ; mov 0x10(%ebp),%esi
- DB 119,32 ; ja ae3e <_sk_load_8888_sse2_lowp+0x56>
+ DB 119,32 ; ja ae1a <_sk_load_8888_sse2_lowp+0x56>
DB 102,15,239,246 ; pxor %xmm6,%xmm6
DB 15,182,201 ; movzbl %cl,%ecx
DB 139,140,143,52,1,0,0 ; mov 0x134(%edi,%ecx,4),%ecx
@@ -56515,14 +56503,14 @@ _sk_load_8888_sse2_lowp LABEL PROC
DB 255,225 ; jmp *%ecx
DB 243,15,16,28,179 ; movss (%ebx,%esi,4),%xmm3
DB 15,87,246 ; xorps %xmm6,%xmm6
- DB 235,73 ; jmp ae87 <_sk_load_8888_sse2_lowp+0x9f>
+ DB 235,73 ; jmp ae63 <_sk_load_8888_sse2_lowp+0x9f>
DB 102,15,16,28,179 ; movupd (%ebx,%esi,4),%xmm3
DB 15,16,116,179,16 ; movups 0x10(%ebx,%esi,4),%xmm6
- DB 235,61 ; jmp ae87 <_sk_load_8888_sse2_lowp+0x9f>
+ DB 235,61 ; jmp ae63 <_sk_load_8888_sse2_lowp+0x9f>
DB 102,15,110,68,179,8 ; movd 0x8(%ebx,%esi,4),%xmm0
DB 102,15,112,216,69 ; pshufd $0x45,%xmm0,%xmm3
DB 102,15,18,28,179 ; movlpd (%ebx,%esi,4),%xmm3
- DB 235,43 ; jmp ae87 <_sk_load_8888_sse2_lowp+0x9f>
+ DB 235,43 ; jmp ae63 <_sk_load_8888_sse2_lowp+0x9f>
DB 102,15,110,68,179,24 ; movd 0x18(%ebx,%esi,4),%xmm0
DB 102,15,112,240,69 ; pshufd $0x45,%xmm0,%xmm6
DB 243,15,16,68,179,20 ; movss 0x14(%ebx,%esi,4),%xmm0
@@ -56539,7 +56527,7 @@ _sk_load_8888_sse2_lowp LABEL PROC
DB 102,15,114,240,16 ; pslld $0x10,%xmm0
DB 102,15,114,224,16 ; psrad $0x10,%xmm0
DB 102,15,107,200 ; packssdw %xmm0,%xmm1
- DB 102,15,111,175,168,37,0,0 ; movdqa 0x25a8(%edi),%xmm5
+ DB 102,15,111,175,172,37,0,0 ; movdqa 0x25ac(%edi),%xmm5
DB 102,15,111,193 ; movdqa %xmm1,%xmm0
DB 102,15,219,197 ; pand %xmm5,%xmm0
DB 102,15,113,209,8 ; psrlw $0x8,%xmm1
@@ -56617,10 +56605,10 @@ _sk_load_8888_dst_sse2_lowp LABEL PROC
DB 128,225,7 ; and $0x7,%cl
DB 254,201 ; dec %cl
DB 128,249,6 ; cmp $0x6,%cl
- DB 232,0,0,0,0 ; call afa5 <_sk_load_8888_dst_sse2_lowp+0x3d>
+ DB 232,0,0,0,0 ; call af81 <_sk_load_8888_dst_sse2_lowp+0x3d>
DB 95 ; pop %edi
DB 139,117,16 ; mov 0x10(%ebp),%esi
- DB 119,32 ; ja afcb <_sk_load_8888_dst_sse2_lowp+0x63>
+ DB 119,32 ; ja afa7 <_sk_load_8888_dst_sse2_lowp+0x63>
DB 102,15,239,219 ; pxor %xmm3,%xmm3
DB 15,182,201 ; movzbl %cl,%ecx
DB 139,140,143,59,1,0,0 ; mov 0x13b(%edi,%ecx,4),%ecx
@@ -56629,14 +56617,14 @@ _sk_load_8888_dst_sse2_lowp LABEL PROC
DB 255,225 ; jmp *%ecx
DB 243,15,16,60,179 ; movss (%ebx,%esi,4),%xmm7
DB 15,87,219 ; xorps %xmm3,%xmm3
- DB 235,73 ; jmp b014 <_sk_load_8888_dst_sse2_lowp+0xac>
+ DB 235,73 ; jmp aff0 <_sk_load_8888_dst_sse2_lowp+0xac>
DB 102,15,16,60,179 ; movupd (%ebx,%esi,4),%xmm7
DB 15,16,92,179,16 ; movups 0x10(%ebx,%esi,4),%xmm3
- DB 235,61 ; jmp b014 <_sk_load_8888_dst_sse2_lowp+0xac>
+ DB 235,61 ; jmp aff0 <_sk_load_8888_dst_sse2_lowp+0xac>
DB 102,15,110,84,179,8 ; movd 0x8(%ebx,%esi,4),%xmm2
DB 102,15,112,250,69 ; pshufd $0x45,%xmm2,%xmm7
DB 102,15,18,60,179 ; movlpd (%ebx,%esi,4),%xmm7
- DB 235,43 ; jmp b014 <_sk_load_8888_dst_sse2_lowp+0xac>
+ DB 235,43 ; jmp aff0 <_sk_load_8888_dst_sse2_lowp+0xac>
DB 102,15,110,84,179,24 ; movd 0x18(%ebx,%esi,4),%xmm2
DB 102,15,112,218,69 ; pshufd $0x45,%xmm2,%xmm3
DB 243,15,16,84,179,20 ; movss 0x14(%ebx,%esi,4),%xmm2
@@ -56653,7 +56641,7 @@ _sk_load_8888_dst_sse2_lowp LABEL PROC
DB 102,15,114,242,16 ; pslld $0x10,%xmm2
DB 102,15,114,226,16 ; psrad $0x10,%xmm2
DB 102,15,107,242 ; packssdw %xmm2,%xmm6
- DB 102,15,111,151,27,36,0,0 ; movdqa 0x241b(%edi),%xmm2
+ DB 102,15,111,151,31,36,0,0 ; movdqa 0x241f(%edi),%xmm2
DB 102,15,111,206 ; movdqa %xmm6,%xmm1
DB 102,15,219,202 ; pand %xmm2,%xmm1
DB 102,15,113,214,8 ; psrlw $0x8,%xmm6
@@ -56745,19 +56733,19 @@ _sk_store_8888_sse2_lowp LABEL PROC
DB 128,227,7 ; and $0x7,%bl
DB 254,203 ; dec %bl
DB 128,251,6 ; cmp $0x6,%bl
- DB 232,0,0,0,0 ; call b170 <_sk_store_8888_sse2_lowp+0x74>
+ DB 232,0,0,0,0 ; call b14c <_sk_store_8888_sse2_lowp+0x74>
DB 89 ; pop %ecx
DB 139,117,16 ; mov 0x10(%ebp),%esi
DB 15,40,109,40 ; movaps 0x28(%ebp),%xmm5
- DB 119,19 ; ja b18d <_sk_store_8888_sse2_lowp+0x91>
+ DB 119,19 ; ja b169 <_sk_store_8888_sse2_lowp+0x91>
DB 15,182,219 ; movzbl %bl,%ebx
DB 3,140,153,184,0,0,0 ; add 0xb8(%ecx,%ebx,4),%ecx
DB 255,225 ; jmp *%ecx
DB 102,15,126,60,183 ; movd %xmm7,(%edi,%esi,4)
- DB 235,93 ; jmp b1ea <_sk_store_8888_sse2_lowp+0xee>
+ DB 235,93 ; jmp b1c6 <_sk_store_8888_sse2_lowp+0xee>
DB 243,15,127,60,183 ; movdqu %xmm7,(%edi,%esi,4)
DB 243,15,127,116,183,16 ; movdqu %xmm6,0x10(%edi,%esi,4)
- DB 235,80 ; jmp b1ea <_sk_store_8888_sse2_lowp+0xee>
+ DB 235,80 ; jmp b1c6 <_sk_store_8888_sse2_lowp+0xee>
DB 102,15,111,244 ; movdqa %xmm4,%xmm6
DB 15,40,227 ; movaps %xmm3,%xmm4
DB 102,15,112,223,78 ; pshufd $0x4e,%xmm7,%xmm3
@@ -56765,7 +56753,7 @@ _sk_store_8888_sse2_lowp LABEL PROC
DB 15,40,220 ; movaps %xmm4,%xmm3
DB 102,15,111,230 ; movdqa %xmm6,%xmm4
DB 102,15,214,60,183 ; movq %xmm7,(%edi,%esi,4)
- DB 235,48 ; jmp b1ea <_sk_store_8888_sse2_lowp+0xee>
+ DB 235,48 ; jmp b1c6 <_sk_store_8888_sse2_lowp+0xee>
DB 102,15,112,222,78 ; pshufd $0x4e,%xmm6,%xmm3
DB 102,15,126,92,183,24 ; movd %xmm3,0x18(%edi,%esi,4)
DB 15,40,93,72 ; movaps 0x48(%ebp),%xmm3
@@ -56802,7 +56790,7 @@ _sk_store_8888_sse2_lowp LABEL PROC
DB 0,0 ; add %al,(%eax)
DB 42,0 ; sub (%eax),%al
DB 0,0 ; add %al,(%eax)
- DB 117,0 ; jne b236 <_sk_store_8888_sse2_lowp+0x13a>
+ DB 117,0 ; jne b212 <_sk_store_8888_sse2_lowp+0x13a>
DB 0,0 ; add %al,(%eax)
DB 111 ; outsl %ds:(%esi),(%dx)
DB 0,0 ; add %al,(%eax)
@@ -56832,10 +56820,10 @@ _sk_load_bgra_sse2_lowp LABEL PROC
DB 128,225,7 ; and $0x7,%cl
DB 254,201 ; dec %cl
DB 128,249,6 ; cmp $0x6,%cl
- DB 232,0,0,0,0 ; call b274 <_sk_load_bgra_sse2_lowp+0x30>
+ DB 232,0,0,0,0 ; call b250 <_sk_load_bgra_sse2_lowp+0x30>
DB 95 ; pop %edi
DB 139,117,16 ; mov 0x10(%ebp),%esi
- DB 119,32 ; ja b29a <_sk_load_bgra_sse2_lowp+0x56>
+ DB 119,32 ; ja b276 <_sk_load_bgra_sse2_lowp+0x56>
DB 102,15,239,246 ; pxor %xmm6,%xmm6
DB 15,182,201 ; movzbl %cl,%ecx
DB 139,140,143,52,1,0,0 ; mov 0x134(%edi,%ecx,4),%ecx
@@ -56844,14 +56832,14 @@ _sk_load_bgra_sse2_lowp LABEL PROC
DB 255,225 ; jmp *%ecx
DB 243,15,16,28,179 ; movss (%ebx,%esi,4),%xmm3
DB 15,87,246 ; xorps %xmm6,%xmm6
- DB 235,73 ; jmp b2e3 <_sk_load_bgra_sse2_lowp+0x9f>
+ DB 235,73 ; jmp b2bf <_sk_load_bgra_sse2_lowp+0x9f>
DB 102,15,16,28,179 ; movupd (%ebx,%esi,4),%xmm3
DB 15,16,116,179,16 ; movups 0x10(%ebx,%esi,4),%xmm6
- DB 235,61 ; jmp b2e3 <_sk_load_bgra_sse2_lowp+0x9f>
+ DB 235,61 ; jmp b2bf <_sk_load_bgra_sse2_lowp+0x9f>
DB 102,15,110,68,179,8 ; movd 0x8(%ebx,%esi,4),%xmm0
DB 102,15,112,216,69 ; pshufd $0x45,%xmm0,%xmm3
DB 102,15,18,28,179 ; movlpd (%ebx,%esi,4),%xmm3
- DB 235,43 ; jmp b2e3 <_sk_load_bgra_sse2_lowp+0x9f>
+ DB 235,43 ; jmp b2bf <_sk_load_bgra_sse2_lowp+0x9f>
DB 102,15,110,68,179,24 ; movd 0x18(%ebx,%esi,4),%xmm0
DB 102,15,112,240,69 ; pshufd $0x45,%xmm0,%xmm6
DB 243,15,16,68,179,20 ; movss 0x14(%ebx,%esi,4),%xmm0
@@ -56868,7 +56856,7 @@ _sk_load_bgra_sse2_lowp LABEL PROC
DB 102,15,114,240,16 ; pslld $0x10,%xmm0
DB 102,15,114,224,16 ; psrad $0x10,%xmm0
DB 102,15,107,200 ; packssdw %xmm0,%xmm1
- DB 102,15,111,175,76,33,0,0 ; movdqa 0x214c(%edi),%xmm5
+ DB 102,15,111,175,80,33,0,0 ; movdqa 0x2150(%edi),%xmm5
DB 102,15,111,209 ; movdqa %xmm1,%xmm2
DB 102,15,219,213 ; pand %xmm5,%xmm2
DB 102,15,113,209,8 ; psrlw $0x8,%xmm1
@@ -56946,10 +56934,10 @@ _sk_load_bgra_dst_sse2_lowp LABEL PROC
DB 128,225,7 ; and $0x7,%cl
DB 254,201 ; dec %cl
DB 128,249,6 ; cmp $0x6,%cl
- DB 232,0,0,0,0 ; call b401 <_sk_load_bgra_dst_sse2_lowp+0x3d>
+ DB 232,0,0,0,0 ; call b3dd <_sk_load_bgra_dst_sse2_lowp+0x3d>
DB 95 ; pop %edi
DB 139,117,16 ; mov 0x10(%ebp),%esi
- DB 119,32 ; ja b427 <_sk_load_bgra_dst_sse2_lowp+0x63>
+ DB 119,32 ; ja b403 <_sk_load_bgra_dst_sse2_lowp+0x63>
DB 102,15,239,219 ; pxor %xmm3,%xmm3
DB 15,182,201 ; movzbl %cl,%ecx
DB 139,140,143,59,1,0,0 ; mov 0x13b(%edi,%ecx,4),%ecx
@@ -56958,14 +56946,14 @@ _sk_load_bgra_dst_sse2_lowp LABEL PROC
DB 255,225 ; jmp *%ecx
DB 243,15,16,60,179 ; movss (%ebx,%esi,4),%xmm7
DB 15,87,219 ; xorps %xmm3,%xmm3
- DB 235,73 ; jmp b470 <_sk_load_bgra_dst_sse2_lowp+0xac>
+ DB 235,73 ; jmp b44c <_sk_load_bgra_dst_sse2_lowp+0xac>
DB 102,15,16,60,179 ; movupd (%ebx,%esi,4),%xmm7
DB 15,16,92,179,16 ; movups 0x10(%ebx,%esi,4),%xmm3
- DB 235,61 ; jmp b470 <_sk_load_bgra_dst_sse2_lowp+0xac>
+ DB 235,61 ; jmp b44c <_sk_load_bgra_dst_sse2_lowp+0xac>
DB 102,15,110,84,179,8 ; movd 0x8(%ebx,%esi,4),%xmm2
DB 102,15,112,250,69 ; pshufd $0x45,%xmm2,%xmm7
DB 102,15,18,60,179 ; movlpd (%ebx,%esi,4),%xmm7
- DB 235,43 ; jmp b470 <_sk_load_bgra_dst_sse2_lowp+0xac>
+ DB 235,43 ; jmp b44c <_sk_load_bgra_dst_sse2_lowp+0xac>
DB 102,15,110,84,179,24 ; movd 0x18(%ebx,%esi,4),%xmm2
DB 102,15,112,218,69 ; pshufd $0x45,%xmm2,%xmm3
DB 243,15,16,84,179,20 ; movss 0x14(%ebx,%esi,4),%xmm2
@@ -56982,7 +56970,7 @@ _sk_load_bgra_dst_sse2_lowp LABEL PROC
DB 102,15,114,242,16 ; pslld $0x10,%xmm2
DB 102,15,114,226,16 ; psrad $0x10,%xmm2
DB 102,15,107,242 ; packssdw %xmm2,%xmm6
- DB 102,15,111,151,191,31,0,0 ; movdqa 0x1fbf(%edi),%xmm2
+ DB 102,15,111,151,195,31,0,0 ; movdqa 0x1fc3(%edi),%xmm2
DB 102,15,111,206 ; movdqa %xmm6,%xmm1
DB 102,15,219,202 ; pand %xmm2,%xmm1
DB 102,15,113,214,8 ; psrlw $0x8,%xmm6
@@ -57074,19 +57062,19 @@ _sk_store_bgra_sse2_lowp LABEL PROC
DB 128,227,7 ; and $0x7,%bl
DB 254,203 ; dec %bl
DB 128,251,6 ; cmp $0x6,%bl
- DB 232,0,0,0,0 ; call b5cc <_sk_store_bgra_sse2_lowp+0x74>
+ DB 232,0,0,0,0 ; call b5a8 <_sk_store_bgra_sse2_lowp+0x74>
DB 89 ; pop %ecx
DB 139,117,16 ; mov 0x10(%ebp),%esi
DB 15,40,109,40 ; movaps 0x28(%ebp),%xmm5
- DB 119,19 ; ja b5e9 <_sk_store_bgra_sse2_lowp+0x91>
+ DB 119,19 ; ja b5c5 <_sk_store_bgra_sse2_lowp+0x91>
DB 15,182,219 ; movzbl %bl,%ebx
DB 3,140,153,184,0,0,0 ; add 0xb8(%ecx,%ebx,4),%ecx
DB 255,225 ; jmp *%ecx
DB 102,15,126,60,183 ; movd %xmm7,(%edi,%esi,4)
- DB 235,93 ; jmp b646 <_sk_store_bgra_sse2_lowp+0xee>
+ DB 235,93 ; jmp b622 <_sk_store_bgra_sse2_lowp+0xee>
DB 243,15,127,60,183 ; movdqu %xmm7,(%edi,%esi,4)
DB 243,15,127,116,183,16 ; movdqu %xmm6,0x10(%edi,%esi,4)
- DB 235,80 ; jmp b646 <_sk_store_bgra_sse2_lowp+0xee>
+ DB 235,80 ; jmp b622 <_sk_store_bgra_sse2_lowp+0xee>
DB 102,15,111,244 ; movdqa %xmm4,%xmm6
DB 15,40,227 ; movaps %xmm3,%xmm4
DB 102,15,112,223,78 ; pshufd $0x4e,%xmm7,%xmm3
@@ -57094,7 +57082,7 @@ _sk_store_bgra_sse2_lowp LABEL PROC
DB 15,40,220 ; movaps %xmm4,%xmm3
DB 102,15,111,230 ; movdqa %xmm6,%xmm4
DB 102,15,214,60,183 ; movq %xmm7,(%edi,%esi,4)
- DB 235,48 ; jmp b646 <_sk_store_bgra_sse2_lowp+0xee>
+ DB 235,48 ; jmp b622 <_sk_store_bgra_sse2_lowp+0xee>
DB 102,15,112,222,78 ; pshufd $0x4e,%xmm6,%xmm3
DB 102,15,126,92,183,24 ; movd %xmm3,0x18(%edi,%esi,4)
DB 15,40,93,72 ; movaps 0x48(%ebp),%xmm3
@@ -57131,7 +57119,7 @@ _sk_store_bgra_sse2_lowp LABEL PROC
DB 0,0 ; add %al,(%eax)
DB 42,0 ; sub (%eax),%al
DB 0,0 ; add %al,(%eax)
- DB 117,0 ; jne b692 <_sk_store_bgra_sse2_lowp+0x13a>
+ DB 117,0 ; jne b66e <_sk_store_bgra_sse2_lowp+0x13a>
DB 0,0 ; add %al,(%eax)
DB 111 ; outsl %ds:(%esi),(%dx)
DB 0,0 ; add %al,(%eax)
@@ -57164,10 +57152,10 @@ _sk_load_565_sse2_lowp LABEL PROC
DB 128,225,7 ; and $0x7,%cl
DB 254,201 ; dec %cl
DB 128,249,6 ; cmp $0x6,%cl
- DB 232,0,0,0,0 ; call b6db <_sk_load_565_sse2_lowp+0x3b>
+ DB 232,0,0,0,0 ; call b6b7 <_sk_load_565_sse2_lowp+0x3b>
DB 94 ; pop %esi
DB 139,125,16 ; mov 0x10(%ebp),%edi
- DB 119,28 ; ja b6fd <_sk_load_565_sse2_lowp+0x5d>
+ DB 119,28 ; ja b6d9 <_sk_load_565_sse2_lowp+0x5d>
DB 102,15,239,192 ; pxor %xmm0,%xmm0
DB 15,182,201 ; movzbl %cl,%ecx
DB 139,140,142,245,0,0,0 ; mov 0xf5(%esi,%ecx,4),%ecx
@@ -57175,14 +57163,14 @@ _sk_load_565_sse2_lowp LABEL PROC
DB 255,225 ; jmp *%ecx
DB 15,183,12,123 ; movzwl (%ebx,%edi,2),%ecx
DB 102,15,110,193 ; movd %ecx,%xmm0
- DB 235,59 ; jmp b738 <_sk_load_565_sse2_lowp+0x98>
+ DB 235,59 ; jmp b714 <_sk_load_565_sse2_lowp+0x98>
DB 243,15,111,4,123 ; movdqu (%ebx,%edi,2),%xmm0
- DB 235,52 ; jmp b738 <_sk_load_565_sse2_lowp+0x98>
+ DB 235,52 ; jmp b714 <_sk_load_565_sse2_lowp+0x98>
DB 102,15,239,192 ; pxor %xmm0,%xmm0
DB 102,15,196,68,123,4,2 ; pinsrw $0x2,0x4(%ebx,%edi,2),%xmm0
DB 243,15,16,12,123 ; movss (%ebx,%edi,2),%xmm1
DB 243,15,16,193 ; movss %xmm1,%xmm0
- DB 235,30 ; jmp b738 <_sk_load_565_sse2_lowp+0x98>
+ DB 235,30 ; jmp b714 <_sk_load_565_sse2_lowp+0x98>
DB 102,15,239,192 ; pxor %xmm0,%xmm0
DB 102,15,196,68,123,12,6 ; pinsrw $0x6,0xc(%ebx,%edi,2),%xmm0
DB 102,15,196,68,123,10,5 ; pinsrw $0x5,0xa(%ebx,%edi,2),%xmm0
@@ -57190,11 +57178,11 @@ _sk_load_565_sse2_lowp LABEL PROC
DB 102,15,18,4,123 ; movlpd (%ebx,%edi,2),%xmm0
DB 102,15,111,248 ; movdqa %xmm0,%xmm7
DB 102,15,113,215,8 ; psrlw $0x8,%xmm7
- DB 102,15,219,190,37,29,0,0 ; pand 0x1d25(%esi),%xmm7
+ DB 102,15,219,190,41,29,0,0 ; pand 0x1d29(%esi),%xmm7
DB 102,15,111,200 ; movdqa %xmm0,%xmm1
DB 102,15,113,209,5 ; psrlw $0x5,%xmm1
- DB 102,15,219,142,53,29,0,0 ; pand 0x1d35(%esi),%xmm1
- DB 102,15,111,150,69,29,0,0 ; movdqa 0x1d45(%esi),%xmm2
+ DB 102,15,219,142,57,29,0,0 ; pand 0x1d39(%esi),%xmm1
+ DB 102,15,111,150,73,29,0,0 ; movdqa 0x1d49(%esi),%xmm2
DB 102,15,219,208 ; pand %xmm0,%xmm2
DB 102,15,113,208,13 ; psrlw $0xd,%xmm0
DB 102,15,235,199 ; por %xmm7,%xmm0
@@ -57216,7 +57204,7 @@ _sk_load_565_sse2_lowp LABEL PROC
DB 137,124,36,8 ; mov %edi,0x8(%esp)
DB 137,76,36,4 ; mov %ecx,0x4(%esp)
DB 137,20,36 ; mov %edx,(%esp)
- DB 15,40,158,229,28,0,0 ; movaps 0x1ce5(%esi),%xmm3
+ DB 15,40,158,233,28,0,0 ; movaps 0x1ce9(%esi),%xmm3
DB 255,80,4 ; call *0x4(%eax)
DB 131,196,92 ; add $0x5c,%esp
DB 94 ; pop %esi
@@ -57260,10 +57248,10 @@ _sk_load_565_dst_sse2_lowp LABEL PROC
DB 128,225,7 ; and $0x7,%cl
DB 254,201 ; dec %cl
DB 128,249,6 ; cmp $0x6,%cl
- DB 232,0,0,0,0 ; call b817 <_sk_load_565_dst_sse2_lowp+0x2b>
+ DB 232,0,0,0,0 ; call b7f3 <_sk_load_565_dst_sse2_lowp+0x2b>
DB 95 ; pop %edi
DB 139,117,16 ; mov 0x10(%ebp),%esi
- DB 119,28 ; ja b839 <_sk_load_565_dst_sse2_lowp+0x4d>
+ DB 119,28 ; ja b815 <_sk_load_565_dst_sse2_lowp+0x4d>
DB 102,15,239,228 ; pxor %xmm4,%xmm4
DB 15,182,201 ; movzbl %cl,%ecx
DB 139,140,143,249,0,0,0 ; mov 0xf9(%edi,%ecx,4),%ecx
@@ -57271,14 +57259,14 @@ _sk_load_565_dst_sse2_lowp LABEL PROC
DB 255,225 ; jmp *%ecx
DB 15,183,12,115 ; movzwl (%ebx,%esi,2),%ecx
DB 102,15,110,225 ; movd %ecx,%xmm4
- DB 235,59 ; jmp b874 <_sk_load_565_dst_sse2_lowp+0x88>
+ DB 235,59 ; jmp b850 <_sk_load_565_dst_sse2_lowp+0x88>
DB 243,15,111,36,115 ; movdqu (%ebx,%esi,2),%xmm4
- DB 235,52 ; jmp b874 <_sk_load_565_dst_sse2_lowp+0x88>
+ DB 235,52 ; jmp b850 <_sk_load_565_dst_sse2_lowp+0x88>
DB 102,15,239,228 ; pxor %xmm4,%xmm4
DB 102,15,196,100,115,4,2 ; pinsrw $0x2,0x4(%ebx,%esi,2),%xmm4
DB 243,15,16,44,115 ; movss (%ebx,%esi,2),%xmm5
DB 243,15,16,229 ; movss %xmm5,%xmm4
- DB 235,30 ; jmp b874 <_sk_load_565_dst_sse2_lowp+0x88>
+ DB 235,30 ; jmp b850 <_sk_load_565_dst_sse2_lowp+0x88>
DB 102,15,239,228 ; pxor %xmm4,%xmm4
DB 102,15,196,100,115,12,6 ; pinsrw $0x6,0xc(%ebx,%esi,2),%xmm4
DB 102,15,196,100,115,10,5 ; pinsrw $0x5,0xa(%ebx,%esi,2),%xmm4
@@ -57286,11 +57274,11 @@ _sk_load_565_dst_sse2_lowp LABEL PROC
DB 102,15,18,36,115 ; movlpd (%ebx,%esi,2),%xmm4
DB 102,15,111,244 ; movdqa %xmm4,%xmm6
DB 102,15,113,214,8 ; psrlw $0x8,%xmm6
- DB 102,15,219,183,233,27,0,0 ; pand 0x1be9(%edi),%xmm6
+ DB 102,15,219,183,237,27,0,0 ; pand 0x1bed(%edi),%xmm6
DB 102,15,111,236 ; movdqa %xmm4,%xmm5
DB 102,15,113,213,5 ; psrlw $0x5,%xmm5
- DB 102,15,219,175,249,27,0,0 ; pand 0x1bf9(%edi),%xmm5
- DB 102,15,111,191,9,28,0,0 ; movdqa 0x1c09(%edi),%xmm7
+ DB 102,15,219,175,253,27,0,0 ; pand 0x1bfd(%edi),%xmm5
+ DB 102,15,111,191,13,28,0,0 ; movdqa 0x1c0d(%edi),%xmm7
DB 102,15,219,252 ; pand %xmm4,%xmm7
DB 102,15,113,212,13 ; psrlw $0xd,%xmm4
DB 102,15,235,230 ; por %xmm6,%xmm4
@@ -57303,7 +57291,7 @@ _sk_load_565_dst_sse2_lowp LABEL PROC
DB 102,15,113,215,2 ; psrlw $0x2,%xmm7
DB 102,15,235,254 ; por %xmm6,%xmm7
DB 141,72,8 ; lea 0x8(%eax),%ecx
- DB 15,40,183,169,27,0,0 ; movaps 0x1ba9(%edi),%xmm6
+ DB 15,40,183,173,27,0,0 ; movaps 0x1bad(%edi),%xmm6
DB 15,41,116,36,64 ; movaps %xmm6,0x40(%esp)
DB 139,125,20 ; mov 0x14(%ebp),%edi
DB 137,124,36,12 ; mov %edi,0xc(%esp)
@@ -57346,15 +57334,15 @@ _sk_store_565_sse2_lowp LABEL PROC
DB 86 ; push %esi
DB 131,236,92 ; sub $0x5c,%esp
DB 102,15,111,226 ; movdqa %xmm2,%xmm4
- DB 232,0,0,0,0 ; call b93e <_sk_store_565_sse2_lowp+0x12>
+ DB 232,0,0,0,0 ; call b91a <_sk_store_565_sse2_lowp+0x12>
DB 95 ; pop %edi
DB 15,40,109,72 ; movaps 0x48(%ebp),%xmm5
DB 102,15,111,208 ; movdqa %xmm0,%xmm2
DB 102,15,113,242,8 ; psllw $0x8,%xmm2
- DB 102,15,219,151,242,26,0,0 ; pand 0x1af2(%edi),%xmm2
+ DB 102,15,219,151,246,26,0,0 ; pand 0x1af6(%edi),%xmm2
DB 102,15,111,241 ; movdqa %xmm1,%xmm6
DB 102,15,113,246,3 ; psllw $0x3,%xmm6
- DB 102,15,219,183,2,27,0,0 ; pand 0x1b02(%edi),%xmm6
+ DB 102,15,219,183,6,27,0,0 ; pand 0x1b06(%edi),%xmm6
DB 102,15,235,242 ; por %xmm2,%xmm6
DB 102,15,111,212 ; movdqa %xmm4,%xmm2
DB 102,15,113,210,3 ; psrlw $0x3,%xmm2
@@ -57373,19 +57361,19 @@ _sk_store_565_sse2_lowp LABEL PROC
DB 128,249,6 ; cmp $0x6,%cl
DB 139,117,16 ; mov 0x10(%ebp),%esi
DB 15,40,125,24 ; movaps 0x18(%ebp),%xmm7
- DB 119,22 ; ja b9b6 <_sk_store_565_sse2_lowp+0x8a>
+ DB 119,22 ; ja b992 <_sk_store_565_sse2_lowp+0x8a>
DB 15,182,201 ; movzbl %cl,%ecx
DB 3,188,143,242,0,0,0 ; add 0xf2(%edi,%ecx,4),%edi
DB 255,231 ; jmp *%edi
DB 102,15,126,209 ; movd %xmm2,%ecx
DB 102,137,12,115 ; mov %cx,(%ebx,%esi,2)
- DB 235,59 ; jmp b9f1 <_sk_store_565_sse2_lowp+0xc5>
+ DB 235,59 ; jmp b9cd <_sk_store_565_sse2_lowp+0xc5>
DB 243,15,127,20,115 ; movdqu %xmm2,(%ebx,%esi,2)
- DB 235,52 ; jmp b9f1 <_sk_store_565_sse2_lowp+0xc5>
+ DB 235,52 ; jmp b9cd <_sk_store_565_sse2_lowp+0xc5>
DB 102,15,197,202,2 ; pextrw $0x2,%xmm2,%ecx
DB 102,137,76,115,4 ; mov %cx,0x4(%ebx,%esi,2)
DB 102,15,126,20,115 ; movd %xmm2,(%ebx,%esi,2)
- DB 235,35 ; jmp b9f1 <_sk_store_565_sse2_lowp+0xc5>
+ DB 235,35 ; jmp b9cd <_sk_store_565_sse2_lowp+0xc5>
DB 102,15,197,202,6 ; pextrw $0x6,%xmm2,%ecx
DB 102,137,76,115,12 ; mov %cx,0xc(%ebx,%esi,2)
DB 102,15,197,202,5 ; pextrw $0x5,%xmm2,%ecx
@@ -57445,10 +57433,10 @@ _sk_load_a8_sse2_lowp LABEL PROC
DB 128,225,7 ; and $0x7,%cl
DB 254,201 ; dec %cl
DB 128,249,6 ; cmp $0x6,%cl
- DB 232,0,0,0,0 ; call ba86 <_sk_load_a8_sse2_lowp+0x3a>
+ DB 232,0,0,0,0 ; call ba62 <_sk_load_a8_sse2_lowp+0x3a>
DB 95 ; pop %edi
DB 139,117,16 ; mov 0x10(%ebp),%esi
- DB 119,28 ; ja baa8 <_sk_load_a8_sse2_lowp+0x5c>
+ DB 119,28 ; ja ba84 <_sk_load_a8_sse2_lowp+0x5c>
DB 102,15,239,219 ; pxor %xmm3,%xmm3
DB 15,182,201 ; movzbl %cl,%ecx
DB 139,140,143,198,0,0,0 ; mov 0xc6(%edi,%ecx,4),%ecx
@@ -57456,10 +57444,10 @@ _sk_load_a8_sse2_lowp LABEL PROC
DB 255,225 ; jmp *%ecx
DB 15,182,12,51 ; movzbl (%ebx,%esi,1),%ecx
DB 102,15,110,217 ; movd %ecx,%xmm3
- DB 235,90 ; jmp bb02 <_sk_load_a8_sse2_lowp+0xb6>
+ DB 235,90 ; jmp bade <_sk_load_a8_sse2_lowp+0xb6>
DB 243,15,126,28,51 ; movq (%ebx,%esi,1),%xmm3
DB 102,15,96,216 ; punpcklbw %xmm0,%xmm3
- DB 235,79 ; jmp bb02 <_sk_load_a8_sse2_lowp+0xb6>
+ DB 235,79 ; jmp bade <_sk_load_a8_sse2_lowp+0xb6>
DB 15,182,76,51,2 ; movzbl 0x2(%ebx,%esi,1),%ecx
DB 102,15,239,219 ; pxor %xmm3,%xmm3
DB 102,15,196,217,2 ; pinsrw $0x2,%ecx,%xmm3
@@ -57467,7 +57455,7 @@ _sk_load_a8_sse2_lowp LABEL PROC
DB 102,15,110,233 ; movd %ecx,%xmm5
DB 102,15,96,232 ; punpcklbw %xmm0,%xmm5
DB 243,15,16,221 ; movss %xmm5,%xmm3
- DB 235,47 ; jmp bb02 <_sk_load_a8_sse2_lowp+0xb6>
+ DB 235,47 ; jmp bade <_sk_load_a8_sse2_lowp+0xb6>
DB 15,182,76,51,6 ; movzbl 0x6(%ebx,%esi,1),%ecx
DB 102,15,239,219 ; pxor %xmm3,%xmm3
DB 102,15,196,217,6 ; pinsrw $0x6,%ecx,%xmm3
@@ -57478,7 +57466,7 @@ _sk_load_a8_sse2_lowp LABEL PROC
DB 102,15,110,44,51 ; movd (%ebx,%esi,1),%xmm5
DB 102,15,96,232 ; punpcklbw %xmm0,%xmm5
DB 242,15,16,221 ; movsd %xmm5,%xmm3
- DB 102,15,219,159,58,25,0,0 ; pand 0x193a(%edi),%xmm3
+ DB 102,15,219,159,62,25,0,0 ; pand 0x193e(%edi),%xmm3
DB 141,72,8 ; lea 0x8(%eax),%ecx
DB 15,41,100,36,64 ; movaps %xmm4,0x40(%esp)
DB 15,41,84,36,48 ; movaps %xmm2,0x30(%esp)
@@ -57531,10 +57519,10 @@ _sk_load_a8_dst_sse2_lowp LABEL PROC
DB 128,225,7 ; and $0x7,%cl
DB 254,201 ; dec %cl
DB 128,249,6 ; cmp $0x6,%cl
- DB 232,0,0,0,0 ; call bb91 <_sk_load_a8_dst_sse2_lowp+0x29>
+ DB 232,0,0,0,0 ; call bb6d <_sk_load_a8_dst_sse2_lowp+0x29>
DB 95 ; pop %edi
DB 139,117,16 ; mov 0x10(%ebp),%esi
- DB 119,28 ; ja bbb3 <_sk_load_a8_dst_sse2_lowp+0x4b>
+ DB 119,28 ; ja bb8f <_sk_load_a8_dst_sse2_lowp+0x4b>
DB 102,15,239,228 ; pxor %xmm4,%xmm4
DB 15,182,201 ; movzbl %cl,%ecx
DB 139,140,143,195,0,0,0 ; mov 0xc3(%edi,%ecx,4),%ecx
@@ -57542,10 +57530,10 @@ _sk_load_a8_dst_sse2_lowp LABEL PROC
DB 255,225 ; jmp *%ecx
DB 15,182,12,51 ; movzbl (%ebx,%esi,1),%ecx
DB 102,15,110,225 ; movd %ecx,%xmm4
- DB 235,90 ; jmp bc0d <_sk_load_a8_dst_sse2_lowp+0xa5>
+ DB 235,90 ; jmp bbe9 <_sk_load_a8_dst_sse2_lowp+0xa5>
DB 243,15,126,36,51 ; movq (%ebx,%esi,1),%xmm4
DB 102,15,96,224 ; punpcklbw %xmm0,%xmm4
- DB 235,79 ; jmp bc0d <_sk_load_a8_dst_sse2_lowp+0xa5>
+ DB 235,79 ; jmp bbe9 <_sk_load_a8_dst_sse2_lowp+0xa5>
DB 15,182,76,51,2 ; movzbl 0x2(%ebx,%esi,1),%ecx
DB 102,15,239,228 ; pxor %xmm4,%xmm4
DB 102,15,196,225,2 ; pinsrw $0x2,%ecx,%xmm4
@@ -57553,7 +57541,7 @@ _sk_load_a8_dst_sse2_lowp LABEL PROC
DB 102,15,110,233 ; movd %ecx,%xmm5
DB 102,15,96,232 ; punpcklbw %xmm0,%xmm5
DB 243,15,16,229 ; movss %xmm5,%xmm4
- DB 235,47 ; jmp bc0d <_sk_load_a8_dst_sse2_lowp+0xa5>
+ DB 235,47 ; jmp bbe9 <_sk_load_a8_dst_sse2_lowp+0xa5>
DB 15,182,76,51,6 ; movzbl 0x6(%ebx,%esi,1),%ecx
DB 102,15,239,228 ; pxor %xmm4,%xmm4
DB 102,15,196,225,6 ; pinsrw $0x6,%ecx,%xmm4
@@ -57564,7 +57552,7 @@ _sk_load_a8_dst_sse2_lowp LABEL PROC
DB 102,15,110,44,51 ; movd (%ebx,%esi,1),%xmm5
DB 102,15,96,232 ; punpcklbw %xmm0,%xmm5
DB 242,15,16,229 ; movsd %xmm5,%xmm4
- DB 102,15,219,167,47,24,0,0 ; pand 0x182f(%edi),%xmm4
+ DB 102,15,219,167,51,24,0,0 ; pand 0x1833(%edi),%xmm4
DB 141,72,8 ; lea 0x8(%eax),%ecx
DB 102,15,127,100,36,64 ; movdqa %xmm4,0x40(%esp)
DB 102,15,239,228 ; pxor %xmm4,%xmm4
@@ -57619,32 +57607,32 @@ _sk_store_a8_sse2_lowp LABEL PROC
DB 128,225,7 ; and $0x7,%cl
DB 254,201 ; dec %cl
DB 128,249,6 ; cmp $0x6,%cl
- DB 232,0,0,0,0 ; call bca9 <_sk_store_a8_sse2_lowp+0x39>
+ DB 232,0,0,0,0 ; call bc85 <_sk_store_a8_sse2_lowp+0x39>
DB 91 ; pop %ebx
DB 139,117,16 ; mov 0x10(%ebp),%esi
- DB 119,26 ; ja bcc9 <_sk_store_a8_sse2_lowp+0x59>
+ DB 119,26 ; ja bca5 <_sk_store_a8_sse2_lowp+0x59>
DB 15,182,201 ; movzbl %cl,%ecx
DB 139,140,139,223,0,0,0 ; mov 0xdf(%ebx,%ecx,4),%ecx
DB 1,217 ; add %ebx,%ecx
DB 255,225 ; jmp *%ecx
DB 102,15,126,217 ; movd %xmm3,%ecx
DB 136,12,55 ; mov %cl,(%edi,%esi,1)
- DB 233,136,0,0,0 ; jmp bd51 <_sk_store_a8_sse2_lowp+0xe1>
- DB 102,15,111,163,23,23,0,0 ; movdqa 0x1717(%ebx),%xmm4
+ DB 233,136,0,0,0 ; jmp bd2d <_sk_store_a8_sse2_lowp+0xe1>
+ DB 102,15,111,163,27,23,0,0 ; movdqa 0x171b(%ebx),%xmm4
DB 102,15,219,227 ; pand %xmm3,%xmm4
DB 102,15,103,228 ; packuswb %xmm4,%xmm4
DB 102,15,214,36,55 ; movq %xmm4,(%edi,%esi,1)
DB 15,40,101,24 ; movaps 0x18(%ebp),%xmm4
- DB 235,109 ; jmp bd51 <_sk_store_a8_sse2_lowp+0xe1>
+ DB 235,109 ; jmp bd2d <_sk_store_a8_sse2_lowp+0xe1>
DB 102,15,197,203,2 ; pextrw $0x2,%xmm3,%ecx
DB 136,76,55,2 ; mov %cl,0x2(%edi,%esi,1)
- DB 102,15,111,163,23,23,0,0 ; movdqa 0x1717(%ebx),%xmm4
+ DB 102,15,111,163,27,23,0,0 ; movdqa 0x171b(%ebx),%xmm4
DB 102,15,219,227 ; pand %xmm3,%xmm4
DB 102,15,103,228 ; packuswb %xmm4,%xmm4
DB 102,15,126,225 ; movd %xmm4,%ecx
DB 15,40,101,24 ; movaps 0x18(%ebp),%xmm4
DB 102,137,12,55 ; mov %cx,(%edi,%esi,1)
- DB 235,70 ; jmp bd51 <_sk_store_a8_sse2_lowp+0xe1>
+ DB 235,70 ; jmp bd2d <_sk_store_a8_sse2_lowp+0xe1>
DB 102,15,197,203,6 ; pextrw $0x6,%xmm3,%ecx
DB 136,76,55,6 ; mov %cl,0x6(%edi,%esi,1)
DB 102,15,197,203,5 ; pextrw $0x5,%xmm3,%ecx
@@ -57654,7 +57642,7 @@ _sk_store_a8_sse2_lowp LABEL PROC
DB 15,40,254 ; movaps %xmm6,%xmm7
DB 15,40,245 ; movaps %xmm5,%xmm6
DB 15,40,236 ; movaps %xmm4,%xmm5
- DB 102,15,111,163,23,23,0,0 ; movdqa 0x1717(%ebx),%xmm4
+ DB 102,15,111,163,27,23,0,0 ; movdqa 0x171b(%ebx),%xmm4
DB 102,15,219,227 ; pand %xmm3,%xmm4
DB 102,15,103,228 ; packuswb %xmm4,%xmm4
DB 102,15,126,36,55 ; movd %xmm4,(%edi,%esi,1)
@@ -57688,7 +57676,7 @@ _sk_store_a8_sse2_lowp LABEL PROC
DB 0,0 ; add %al,(%eax)
DB 0,125,0 ; add %bh,0x0(%ebp)
DB 0,0 ; add %al,(%eax)
- DB 116,0 ; je bd9a <_sk_store_a8_sse2_lowp+0x12a>
+ DB 116,0 ; je bd76 <_sk_store_a8_sse2_lowp+0x12a>
DB 0,0 ; add %al,(%eax)
DB 107,0,0 ; imul $0x0,(%eax),%eax
DB 0,98,0 ; add %ah,0x0(%edx)
@@ -57716,10 +57704,10 @@ _sk_load_g8_sse2_lowp LABEL PROC
DB 128,225,7 ; and $0x7,%cl
DB 254,201 ; dec %cl
DB 128,249,6 ; cmp $0x6,%cl
- DB 232,0,0,0,0 ; call bddd <_sk_load_g8_sse2_lowp+0x39>
+ DB 232,0,0,0,0 ; call bdb9 <_sk_load_g8_sse2_lowp+0x39>
DB 94 ; pop %esi
DB 139,125,16 ; mov 0x10(%ebp),%edi
- DB 119,28 ; ja bdff <_sk_load_g8_sse2_lowp+0x5b>
+ DB 119,28 ; ja bddb <_sk_load_g8_sse2_lowp+0x5b>
DB 102,15,239,192 ; pxor %xmm0,%xmm0
DB 15,182,201 ; movzbl %cl,%ecx
DB 139,140,142,199,0,0,0 ; mov 0xc7(%esi,%ecx,4),%ecx
@@ -57727,10 +57715,10 @@ _sk_load_g8_sse2_lowp LABEL PROC
DB 255,225 ; jmp *%ecx
DB 15,182,12,59 ; movzbl (%ebx,%edi,1),%ecx
DB 102,15,110,193 ; movd %ecx,%xmm0
- DB 235,90 ; jmp be59 <_sk_load_g8_sse2_lowp+0xb5>
+ DB 235,90 ; jmp be35 <_sk_load_g8_sse2_lowp+0xb5>
DB 243,15,126,4,59 ; movq (%ebx,%edi,1),%xmm0
DB 102,15,96,192 ; punpcklbw %xmm0,%xmm0
- DB 235,79 ; jmp be59 <_sk_load_g8_sse2_lowp+0xb5>
+ DB 235,79 ; jmp be35 <_sk_load_g8_sse2_lowp+0xb5>
DB 15,182,76,59,2 ; movzbl 0x2(%ebx,%edi,1),%ecx
DB 102,15,239,192 ; pxor %xmm0,%xmm0
DB 102,15,196,193,2 ; pinsrw $0x2,%ecx,%xmm0
@@ -57738,7 +57726,7 @@ _sk_load_g8_sse2_lowp LABEL PROC
DB 102,15,110,233 ; movd %ecx,%xmm5
DB 102,15,96,232 ; punpcklbw %xmm0,%xmm5
DB 243,15,16,197 ; movss %xmm5,%xmm0
- DB 235,47 ; jmp be59 <_sk_load_g8_sse2_lowp+0xb5>
+ DB 235,47 ; jmp be35 <_sk_load_g8_sse2_lowp+0xb5>
DB 15,182,76,59,6 ; movzbl 0x6(%ebx,%edi,1),%ecx
DB 102,15,239,192 ; pxor %xmm0,%xmm0
DB 102,15,196,193,6 ; pinsrw $0x6,%ecx,%xmm0
@@ -57749,7 +57737,7 @@ _sk_load_g8_sse2_lowp LABEL PROC
DB 102,15,110,44,59 ; movd (%ebx,%edi,1),%xmm5
DB 102,15,96,232 ; punpcklbw %xmm0,%xmm5
DB 242,15,16,197 ; movsd %xmm5,%xmm0
- DB 102,15,219,134,227,21,0,0 ; pand 0x15e3(%esi),%xmm0
+ DB 102,15,219,134,231,21,0,0 ; pand 0x15e7(%esi),%xmm0
DB 141,72,8 ; lea 0x8(%eax),%ecx
DB 15,41,100,36,64 ; movaps %xmm4,0x40(%esp)
DB 15,41,92,36,48 ; movaps %xmm3,0x30(%esp)
@@ -57760,7 +57748,7 @@ _sk_load_g8_sse2_lowp LABEL PROC
DB 137,124,36,8 ; mov %edi,0x8(%esp)
DB 137,76,36,4 ; mov %ecx,0x4(%esp)
DB 137,20,36 ; mov %edx,(%esp)
- DB 15,40,158,227,21,0,0 ; movaps 0x15e3(%esi),%xmm3
+ DB 15,40,158,231,21,0,0 ; movaps 0x15e7(%esi),%xmm3
DB 102,15,111,200 ; movdqa %xmm0,%xmm1
DB 102,15,111,208 ; movdqa %xmm0,%xmm2
DB 255,80,4 ; call *0x4(%eax)
@@ -57801,10 +57789,10 @@ _sk_load_g8_dst_sse2_lowp LABEL PROC
DB 128,225,7 ; and $0x7,%cl
DB 254,201 ; dec %cl
DB 128,249,6 ; cmp $0x6,%cl
- DB 232,0,0,0,0 ; call bee9 <_sk_load_g8_dst_sse2_lowp+0x29>
+ DB 232,0,0,0,0 ; call bec5 <_sk_load_g8_dst_sse2_lowp+0x29>
DB 95 ; pop %edi
DB 139,117,16 ; mov 0x10(%ebp),%esi
- DB 119,28 ; ja bf0b <_sk_load_g8_dst_sse2_lowp+0x4b>
+ DB 119,28 ; ja bee7 <_sk_load_g8_dst_sse2_lowp+0x4b>
DB 102,15,239,228 ; pxor %xmm4,%xmm4
DB 15,182,201 ; movzbl %cl,%ecx
DB 139,140,143,195,0,0,0 ; mov 0xc3(%edi,%ecx,4),%ecx
@@ -57812,10 +57800,10 @@ _sk_load_g8_dst_sse2_lowp LABEL PROC
DB 255,225 ; jmp *%ecx
DB 15,182,12,51 ; movzbl (%ebx,%esi,1),%ecx
DB 102,15,110,225 ; movd %ecx,%xmm4
- DB 235,90 ; jmp bf65 <_sk_load_g8_dst_sse2_lowp+0xa5>
+ DB 235,90 ; jmp bf41 <_sk_load_g8_dst_sse2_lowp+0xa5>
DB 243,15,126,36,51 ; movq (%ebx,%esi,1),%xmm4
DB 102,15,96,224 ; punpcklbw %xmm0,%xmm4
- DB 235,79 ; jmp bf65 <_sk_load_g8_dst_sse2_lowp+0xa5>
+ DB 235,79 ; jmp bf41 <_sk_load_g8_dst_sse2_lowp+0xa5>
DB 15,182,76,51,2 ; movzbl 0x2(%ebx,%esi,1),%ecx
DB 102,15,239,228 ; pxor %xmm4,%xmm4
DB 102,15,196,225,2 ; pinsrw $0x2,%ecx,%xmm4
@@ -57823,7 +57811,7 @@ _sk_load_g8_dst_sse2_lowp LABEL PROC
DB 102,15,110,233 ; movd %ecx,%xmm5
DB 102,15,96,232 ; punpcklbw %xmm0,%xmm5
DB 243,15,16,229 ; movss %xmm5,%xmm4
- DB 235,47 ; jmp bf65 <_sk_load_g8_dst_sse2_lowp+0xa5>
+ DB 235,47 ; jmp bf41 <_sk_load_g8_dst_sse2_lowp+0xa5>
DB 15,182,76,51,6 ; movzbl 0x6(%ebx,%esi,1),%ecx
DB 102,15,239,228 ; pxor %xmm4,%xmm4
DB 102,15,196,225,6 ; pinsrw $0x6,%ecx,%xmm4
@@ -57834,9 +57822,9 @@ _sk_load_g8_dst_sse2_lowp LABEL PROC
DB 102,15,110,44,51 ; movd (%ebx,%esi,1),%xmm5
DB 102,15,96,232 ; punpcklbw %xmm0,%xmm5
DB 242,15,16,229 ; movsd %xmm5,%xmm4
- DB 102,15,219,167,215,20,0,0 ; pand 0x14d7(%edi),%xmm4
+ DB 102,15,219,167,219,20,0,0 ; pand 0x14db(%edi),%xmm4
DB 141,72,8 ; lea 0x8(%eax),%ecx
- DB 15,40,175,215,20,0,0 ; movaps 0x14d7(%edi),%xmm5
+ DB 15,40,175,219,20,0,0 ; movaps 0x14db(%edi),%xmm5
DB 15,41,108,36,64 ; movaps %xmm5,0x40(%esp)
DB 102,15,127,100,36,48 ; movdqa %xmm4,0x30(%esp)
DB 102,15,127,100,36,32 ; movdqa %xmm4,0x20(%esp)
@@ -57875,7 +57863,7 @@ _sk_luminance_to_alpha_sse2_lowp LABEL PROC
DB 86 ; push %esi
DB 131,236,80 ; sub $0x50,%esp
DB 102,15,111,218 ; movdqa %xmm2,%xmm3
- DB 232,0,0,0,0 ; call bfd9 <_sk_luminance_to_alpha_sse2_lowp+0x11>
+ DB 232,0,0,0,0 ; call bfb5 <_sk_luminance_to_alpha_sse2_lowp+0x11>
DB 88 ; pop %eax
DB 139,77,8 ; mov 0x8(%ebp),%ecx
DB 139,85,16 ; mov 0x10(%ebp),%edx
@@ -57885,10 +57873,10 @@ _sk_luminance_to_alpha_sse2_lowp LABEL PROC
DB 15,40,109,56 ; movaps 0x38(%ebp),%xmm5
DB 15,40,117,72 ; movaps 0x48(%ebp),%xmm6
DB 139,125,12 ; mov 0xc(%ebp),%edi
- DB 102,15,213,128,119,20,0,0 ; pmullw 0x1477(%eax),%xmm0
- DB 102,15,213,136,135,20,0,0 ; pmullw 0x1487(%eax),%xmm1
+ DB 102,15,213,128,123,20,0,0 ; pmullw 0x147b(%eax),%xmm0
+ DB 102,15,213,136,139,20,0,0 ; pmullw 0x148b(%eax),%xmm1
DB 102,15,253,200 ; paddw %xmm0,%xmm1
- DB 102,15,213,152,151,20,0,0 ; pmullw 0x1497(%eax),%xmm3
+ DB 102,15,213,152,155,20,0,0 ; pmullw 0x149b(%eax),%xmm3
DB 102,15,253,217 ; paddw %xmm1,%xmm3
DB 102,15,113,211,8 ; psrlw $0x8,%xmm3
DB 141,71,4 ; lea 0x4(%edi),%eax
@@ -57917,15 +57905,15 @@ _sk_scale_1_float_sse2_lowp LABEL PROC
DB 87 ; push %edi
DB 86 ; push %esi
DB 131,236,80 ; sub $0x50,%esp
- DB 232,0,0,0,0 ; call c062 <_sk_scale_1_float_sse2_lowp+0xd>
+ DB 232,0,0,0,0 ; call c03e <_sk_scale_1_float_sse2_lowp+0xd>
DB 94 ; pop %esi
DB 139,69,8 ; mov 0x8(%ebp),%eax
DB 139,85,16 ; mov 0x10(%ebp),%edx
DB 139,77,12 ; mov 0xc(%ebp),%ecx
DB 139,57 ; mov (%ecx),%edi
DB 243,15,16,39 ; movss (%edi),%xmm4
- DB 243,15,89,166,34,20,0,0 ; mulss 0x1422(%esi),%xmm4
- DB 243,15,88,166,30,20,0,0 ; addss 0x141e(%esi),%xmm4
+ DB 243,15,89,166,38,20,0,0 ; mulss 0x1426(%esi),%xmm4
+ DB 243,15,88,166,34,20,0,0 ; addss 0x1422(%esi),%xmm4
DB 243,15,44,252 ; cvttss2si %xmm4,%edi
DB 102,15,110,239 ; movd %edi,%xmm5
DB 139,125,20 ; mov 0x14(%ebp),%edi
@@ -57938,7 +57926,7 @@ _sk_scale_1_float_sse2_lowp LABEL PROC
DB 102,15,213,205 ; pmullw %xmm5,%xmm1
DB 102,15,213,213 ; pmullw %xmm5,%xmm2
DB 102,15,213,221 ; pmullw %xmm5,%xmm3
- DB 102,15,111,174,94,19,0,0 ; movdqa 0x135e(%esi),%xmm5
+ DB 102,15,111,174,98,19,0,0 ; movdqa 0x1362(%esi),%xmm5
DB 102,15,253,197 ; paddw %xmm5,%xmm0
DB 102,15,253,205 ; paddw %xmm5,%xmm1
DB 102,15,253,213 ; paddw %xmm5,%xmm2
@@ -57975,19 +57963,19 @@ _sk_lerp_1_float_sse2_lowp LABEL PROC
DB 102,15,111,218 ; movdqa %xmm2,%xmm3
DB 102,15,111,209 ; movdqa %xmm1,%xmm2
DB 102,15,111,200 ; movdqa %xmm0,%xmm1
- DB 232,0,0,0,0 ; call c130 <_sk_lerp_1_float_sse2_lowp+0x1d>
+ DB 232,0,0,0,0 ; call c10c <_sk_lerp_1_float_sse2_lowp+0x1d>
DB 89 ; pop %ecx
DB 102,15,111,109,24 ; movdqa 0x18(%ebp),%xmm5
DB 139,69,12 ; mov 0xc(%ebp),%eax
DB 139,16 ; mov (%eax),%edx
DB 243,15,16,50 ; movss (%edx),%xmm6
- DB 243,15,89,177,84,19,0,0 ; mulss 0x1354(%ecx),%xmm6
- DB 243,15,88,177,80,19,0,0 ; addss 0x1350(%ecx),%xmm6
+ DB 243,15,89,177,88,19,0,0 ; mulss 0x1358(%ecx),%xmm6
+ DB 243,15,88,177,84,19,0,0 ; addss 0x1354(%ecx),%xmm6
DB 243,15,44,214 ; cvttss2si %xmm6,%edx
DB 102,15,110,242 ; movd %edx,%xmm6
DB 242,15,112,246,0 ; pshuflw $0x0,%xmm6,%xmm6
DB 102,15,112,246,80 ; pshufd $0x50,%xmm6,%xmm6
- DB 102,15,111,129,144,18,0,0 ; movdqa 0x1290(%ecx),%xmm0
+ DB 102,15,111,129,148,18,0,0 ; movdqa 0x1294(%ecx),%xmm0
DB 102,15,213,206 ; pmullw %xmm6,%xmm1
DB 102,15,253,200 ; paddw %xmm0,%xmm1
DB 102,15,213,214 ; pmullw %xmm6,%xmm2
@@ -58058,10 +58046,10 @@ _sk_scale_u8_sse2_lowp LABEL PROC
DB 128,225,7 ; and $0x7,%cl
DB 254,201 ; dec %cl
DB 128,249,6 ; cmp $0x6,%cl
- DB 232,0,0,0,0 ; call c259 <_sk_scale_u8_sse2_lowp+0x31>
+ DB 232,0,0,0,0 ; call c235 <_sk_scale_u8_sse2_lowp+0x31>
DB 95 ; pop %edi
DB 139,117,16 ; mov 0x10(%ebp),%esi
- DB 119,28 ; ja c27b <_sk_scale_u8_sse2_lowp+0x53>
+ DB 119,28 ; ja c257 <_sk_scale_u8_sse2_lowp+0x53>
DB 102,15,239,228 ; pxor %xmm4,%xmm4
DB 15,182,201 ; movzbl %cl,%ecx
DB 139,140,143,3,1,0,0 ; mov 0x103(%edi,%ecx,4),%ecx
@@ -58069,10 +58057,10 @@ _sk_scale_u8_sse2_lowp LABEL PROC
DB 255,225 ; jmp *%ecx
DB 15,182,12,51 ; movzbl (%ebx,%esi,1),%ecx
DB 102,15,110,225 ; movd %ecx,%xmm4
- DB 235,90 ; jmp c2d5 <_sk_scale_u8_sse2_lowp+0xad>
+ DB 235,90 ; jmp c2b1 <_sk_scale_u8_sse2_lowp+0xad>
DB 243,15,126,36,51 ; movq (%ebx,%esi,1),%xmm4
DB 102,15,96,224 ; punpcklbw %xmm0,%xmm4
- DB 235,79 ; jmp c2d5 <_sk_scale_u8_sse2_lowp+0xad>
+ DB 235,79 ; jmp c2b1 <_sk_scale_u8_sse2_lowp+0xad>
DB 15,182,76,51,2 ; movzbl 0x2(%ebx,%esi,1),%ecx
DB 102,15,239,228 ; pxor %xmm4,%xmm4
DB 102,15,196,225,2 ; pinsrw $0x2,%ecx,%xmm4
@@ -58080,7 +58068,7 @@ _sk_scale_u8_sse2_lowp LABEL PROC
DB 102,15,110,233 ; movd %ecx,%xmm5
DB 102,15,96,232 ; punpcklbw %xmm0,%xmm5
DB 243,15,16,229 ; movss %xmm5,%xmm4
- DB 235,47 ; jmp c2d5 <_sk_scale_u8_sse2_lowp+0xad>
+ DB 235,47 ; jmp c2b1 <_sk_scale_u8_sse2_lowp+0xad>
DB 15,182,76,51,6 ; movzbl 0x6(%ebx,%esi,1),%ecx
DB 102,15,239,228 ; pxor %xmm4,%xmm4
DB 102,15,196,225,6 ; pinsrw $0x6,%ecx,%xmm4
@@ -58091,9 +58079,9 @@ _sk_scale_u8_sse2_lowp LABEL PROC
DB 102,15,110,44,51 ; movd (%ebx,%esi,1),%xmm5
DB 102,15,96,232 ; punpcklbw %xmm0,%xmm5
DB 242,15,16,229 ; movsd %xmm5,%xmm4
- DB 102,15,219,167,103,17,0,0 ; pand 0x1167(%edi),%xmm4
+ DB 102,15,219,167,107,17,0,0 ; pand 0x116b(%edi),%xmm4
DB 102,15,213,196 ; pmullw %xmm4,%xmm0
- DB 102,15,111,175,103,17,0,0 ; movdqa 0x1167(%edi),%xmm5
+ DB 102,15,111,175,107,17,0,0 ; movdqa 0x116b(%edi),%xmm5
DB 102,15,253,197 ; paddw %xmm5,%xmm0
DB 102,15,113,208,8 ; psrlw $0x8,%xmm0
DB 102,15,213,204 ; pmullw %xmm4,%xmm1
@@ -58158,10 +58146,10 @@ _sk_lerp_u8_sse2_lowp LABEL PROC
DB 128,225,7 ; and $0x7,%cl
DB 254,201 ; dec %cl
DB 128,249,6 ; cmp $0x6,%cl
- DB 232,0,0,0,0 ; call c3a6 <_sk_lerp_u8_sse2_lowp+0x2e>
+ DB 232,0,0,0,0 ; call c382 <_sk_lerp_u8_sse2_lowp+0x2e>
DB 95 ; pop %edi
DB 139,117,16 ; mov 0x10(%ebp),%esi
- DB 119,28 ; ja c3c8 <_sk_lerp_u8_sse2_lowp+0x50>
+ DB 119,28 ; ja c3a4 <_sk_lerp_u8_sse2_lowp+0x50>
DB 102,15,239,219 ; pxor %xmm3,%xmm3
DB 15,182,201 ; movzbl %cl,%ecx
DB 139,140,143,74,1,0,0 ; mov 0x14a(%edi,%ecx,4),%ecx
@@ -58169,10 +58157,10 @@ _sk_lerp_u8_sse2_lowp LABEL PROC
DB 255,225 ; jmp *%ecx
DB 15,182,12,51 ; movzbl (%ebx,%esi,1),%ecx
DB 102,15,110,217 ; movd %ecx,%xmm3
- DB 235,90 ; jmp c422 <_sk_lerp_u8_sse2_lowp+0xaa>
+ DB 235,90 ; jmp c3fe <_sk_lerp_u8_sse2_lowp+0xaa>
DB 243,15,126,28,51 ; movq (%ebx,%esi,1),%xmm3
DB 102,15,96,216 ; punpcklbw %xmm0,%xmm3
- DB 235,79 ; jmp c422 <_sk_lerp_u8_sse2_lowp+0xaa>
+ DB 235,79 ; jmp c3fe <_sk_lerp_u8_sse2_lowp+0xaa>
DB 15,182,76,51,2 ; movzbl 0x2(%ebx,%esi,1),%ecx
DB 102,15,239,219 ; pxor %xmm3,%xmm3
DB 102,15,196,217,2 ; pinsrw $0x2,%ecx,%xmm3
@@ -58180,7 +58168,7 @@ _sk_lerp_u8_sse2_lowp LABEL PROC
DB 102,15,110,225 ; movd %ecx,%xmm4
DB 102,15,96,224 ; punpcklbw %xmm0,%xmm4
DB 243,15,16,220 ; movss %xmm4,%xmm3
- DB 235,47 ; jmp c422 <_sk_lerp_u8_sse2_lowp+0xaa>
+ DB 235,47 ; jmp c3fe <_sk_lerp_u8_sse2_lowp+0xaa>
DB 15,182,76,51,6 ; movzbl 0x6(%ebx,%esi,1),%ecx
DB 102,15,239,219 ; pxor %xmm3,%xmm3
DB 102,15,196,217,6 ; pinsrw $0x6,%ecx,%xmm3
@@ -58191,8 +58179,8 @@ _sk_lerp_u8_sse2_lowp LABEL PROC
DB 102,15,110,36,51 ; movd (%ebx,%esi,1),%xmm4
DB 102,15,96,224 ; punpcklbw %xmm0,%xmm4
DB 242,15,16,220 ; movsd %xmm4,%xmm3
- DB 102,15,219,159,26,16,0,0 ; pand 0x101a(%edi),%xmm3
- DB 102,15,111,183,26,16,0,0 ; movdqa 0x101a(%edi),%xmm6
+ DB 102,15,219,159,30,16,0,0 ; pand 0x101e(%edi),%xmm3
+ DB 102,15,111,183,30,16,0,0 ; movdqa 0x101e(%edi),%xmm6
DB 102,15,111,227 ; movdqa %xmm3,%xmm4
DB 102,15,239,230 ; pxor %xmm6,%xmm4
DB 102,15,111,252 ; movdqa %xmm4,%xmm7
@@ -58279,10 +58267,10 @@ _sk_scale_565_sse2_lowp LABEL PROC
DB 128,225,7 ; and $0x7,%cl
DB 254,201 ; dec %cl
DB 128,249,6 ; cmp $0x6,%cl
- DB 232,0,0,0,0 ; call c54f <_sk_scale_565_sse2_lowp+0x43>
+ DB 232,0,0,0,0 ; call c52b <_sk_scale_565_sse2_lowp+0x43>
DB 95 ; pop %edi
DB 139,117,16 ; mov 0x10(%ebp),%esi
- DB 119,28 ; ja c571 <_sk_scale_565_sse2_lowp+0x65>
+ DB 119,28 ; ja c54d <_sk_scale_565_sse2_lowp+0x65>
DB 102,15,239,219 ; pxor %xmm3,%xmm3
DB 15,182,201 ; movzbl %cl,%ecx
DB 139,140,143,249,1,0,0 ; mov 0x1f9(%edi,%ecx,4),%ecx
@@ -58290,14 +58278,14 @@ _sk_scale_565_sse2_lowp LABEL PROC
DB 255,225 ; jmp *%ecx
DB 15,183,12,115 ; movzwl (%ebx,%esi,2),%ecx
DB 102,15,110,217 ; movd %ecx,%xmm3
- DB 235,59 ; jmp c5ac <_sk_scale_565_sse2_lowp+0xa0>
+ DB 235,59 ; jmp c588 <_sk_scale_565_sse2_lowp+0xa0>
DB 243,15,111,28,115 ; movdqu (%ebx,%esi,2),%xmm3
- DB 235,52 ; jmp c5ac <_sk_scale_565_sse2_lowp+0xa0>
+ DB 235,52 ; jmp c588 <_sk_scale_565_sse2_lowp+0xa0>
DB 102,15,239,219 ; pxor %xmm3,%xmm3
DB 102,15,196,92,115,4,2 ; pinsrw $0x2,0x4(%ebx,%esi,2),%xmm3
DB 243,15,16,12,115 ; movss (%ebx,%esi,2),%xmm1
DB 243,15,16,217 ; movss %xmm1,%xmm3
- DB 235,30 ; jmp c5ac <_sk_scale_565_sse2_lowp+0xa0>
+ DB 235,30 ; jmp c588 <_sk_scale_565_sse2_lowp+0xa0>
DB 102,15,239,219 ; pxor %xmm3,%xmm3
DB 102,15,196,92,115,12,6 ; pinsrw $0x6,0xc(%ebx,%esi,2),%xmm3
DB 102,15,196,92,115,10,5 ; pinsrw $0x5,0xa(%ebx,%esi,2),%xmm3
@@ -58305,11 +58293,11 @@ _sk_scale_565_sse2_lowp LABEL PROC
DB 102,15,18,28,115 ; movlpd (%ebx,%esi,2),%xmm3
DB 102,15,111,203 ; movdqa %xmm3,%xmm1
DB 102,15,113,209,8 ; psrlw $0x8,%xmm1
- DB 102,15,219,143,177,14,0,0 ; pand 0xeb1(%edi),%xmm1
+ DB 102,15,219,143,181,14,0,0 ; pand 0xeb5(%edi),%xmm1
DB 102,15,111,211 ; movdqa %xmm3,%xmm2
DB 102,15,113,210,5 ; psrlw $0x5,%xmm2
- DB 102,15,219,151,193,14,0,0 ; pand 0xec1(%edi),%xmm2
- DB 102,15,111,135,209,14,0,0 ; movdqa 0xed1(%edi),%xmm0
+ DB 102,15,219,151,197,14,0,0 ; pand 0xec5(%edi),%xmm2
+ DB 102,15,111,135,213,14,0,0 ; movdqa 0xed5(%edi),%xmm0
DB 102,15,219,195 ; pand %xmm3,%xmm0
DB 102,15,113,211,13 ; psrlw $0xd,%xmm3
DB 102,15,235,217 ; por %xmm1,%xmm3
@@ -58322,7 +58310,7 @@ _sk_scale_565_sse2_lowp LABEL PROC
DB 102,15,113,208,2 ; psrlw $0x2,%xmm0
DB 102,15,235,193 ; por %xmm1,%xmm0
DB 102,15,127,69,200 ; movdqa %xmm0,-0x38(%ebp)
- DB 102,15,111,167,145,14,0,0 ; movdqa 0xe91(%edi),%xmm4
+ DB 102,15,111,167,149,14,0,0 ; movdqa 0xe95(%edi),%xmm4
DB 15,41,117,184 ; movaps %xmm6,-0x48(%ebp)
DB 102,15,239,244 ; pxor %xmm4,%xmm6
DB 102,15,239,252 ; pxor %xmm4,%xmm7
@@ -58365,7 +58353,7 @@ _sk_scale_565_sse2_lowp LABEL PROC
DB 102,15,111,229 ; movdqa %xmm5,%xmm4
DB 102,15,213,101,136 ; pmullw -0x78(%ebp),%xmm4
DB 102,15,213,125,184 ; pmullw -0x48(%ebp),%xmm7
- DB 102,15,111,135,113,14,0,0 ; movdqa 0xe71(%edi),%xmm0
+ DB 102,15,111,135,117,14,0,0 ; movdqa 0xe75(%edi),%xmm0
DB 102,15,253,216 ; paddw %xmm0,%xmm3
DB 102,15,253,208 ; paddw %xmm0,%xmm2
DB 102,15,253,224 ; paddw %xmm0,%xmm4
@@ -58440,10 +58428,10 @@ _sk_lerp_565_sse2_lowp LABEL PROC
DB 128,225,7 ; and $0x7,%cl
DB 254,201 ; dec %cl
DB 128,249,6 ; cmp $0x6,%cl
- DB 232,0,0,0,0 ; call c7a7 <_sk_lerp_565_sse2_lowp+0x43>
+ DB 232,0,0,0,0 ; call c783 <_sk_lerp_565_sse2_lowp+0x43>
DB 95 ; pop %edi
DB 139,117,16 ; mov 0x10(%ebp),%esi
- DB 119,28 ; ja c7c9 <_sk_lerp_565_sse2_lowp+0x65>
+ DB 119,28 ; ja c7a5 <_sk_lerp_565_sse2_lowp+0x65>
DB 102,15,239,219 ; pxor %xmm3,%xmm3
DB 15,182,201 ; movzbl %cl,%ecx
DB 139,140,143,73,2,0,0 ; mov 0x249(%edi,%ecx,4),%ecx
@@ -58451,14 +58439,14 @@ _sk_lerp_565_sse2_lowp LABEL PROC
DB 255,225 ; jmp *%ecx
DB 15,183,12,115 ; movzwl (%ebx,%esi,2),%ecx
DB 102,15,110,217 ; movd %ecx,%xmm3
- DB 235,59 ; jmp c804 <_sk_lerp_565_sse2_lowp+0xa0>
+ DB 235,59 ; jmp c7e0 <_sk_lerp_565_sse2_lowp+0xa0>
DB 243,15,111,28,115 ; movdqu (%ebx,%esi,2),%xmm3
- DB 235,52 ; jmp c804 <_sk_lerp_565_sse2_lowp+0xa0>
+ DB 235,52 ; jmp c7e0 <_sk_lerp_565_sse2_lowp+0xa0>
DB 102,15,239,219 ; pxor %xmm3,%xmm3
DB 102,15,196,92,115,4,2 ; pinsrw $0x2,0x4(%ebx,%esi,2),%xmm3
DB 243,15,16,12,115 ; movss (%ebx,%esi,2),%xmm1
DB 243,15,16,217 ; movss %xmm1,%xmm3
- DB 235,30 ; jmp c804 <_sk_lerp_565_sse2_lowp+0xa0>
+ DB 235,30 ; jmp c7e0 <_sk_lerp_565_sse2_lowp+0xa0>
DB 102,15,239,219 ; pxor %xmm3,%xmm3
DB 102,15,196,92,115,12,6 ; pinsrw $0x6,0xc(%ebx,%esi,2),%xmm3
DB 102,15,196,92,115,10,5 ; pinsrw $0x5,0xa(%ebx,%esi,2),%xmm3
@@ -58466,11 +58454,11 @@ _sk_lerp_565_sse2_lowp LABEL PROC
DB 102,15,18,28,115 ; movlpd (%ebx,%esi,2),%xmm3
DB 102,15,111,203 ; movdqa %xmm3,%xmm1
DB 102,15,113,209,8 ; psrlw $0x8,%xmm1
- DB 102,15,219,143,89,12,0,0 ; pand 0xc59(%edi),%xmm1
+ DB 102,15,219,143,93,12,0,0 ; pand 0xc5d(%edi),%xmm1
DB 102,15,111,211 ; movdqa %xmm3,%xmm2
DB 102,15,113,210,5 ; psrlw $0x5,%xmm2
- DB 102,15,219,151,105,12,0,0 ; pand 0xc69(%edi),%xmm2
- DB 102,15,111,175,121,12,0,0 ; movdqa 0xc79(%edi),%xmm5
+ DB 102,15,219,151,109,12,0,0 ; pand 0xc6d(%edi),%xmm2
+ DB 102,15,111,175,125,12,0,0 ; movdqa 0xc7d(%edi),%xmm5
DB 102,15,219,235 ; pand %xmm3,%xmm5
DB 102,15,113,211,13 ; psrlw $0xd,%xmm3
DB 102,15,235,217 ; por %xmm1,%xmm3
@@ -58483,7 +58471,7 @@ _sk_lerp_565_sse2_lowp LABEL PROC
DB 102,15,113,213,2 ; psrlw $0x2,%xmm5
DB 102,15,235,233 ; por %xmm1,%xmm5
DB 102,15,127,109,216 ; movdqa %xmm5,-0x28(%ebp)
- DB 102,15,111,167,57,12,0,0 ; movdqa 0xc39(%edi),%xmm4
+ DB 102,15,111,167,61,12,0,0 ; movdqa 0xc3d(%edi),%xmm4
DB 102,15,111,198 ; movdqa %xmm6,%xmm0
DB 102,15,111,200 ; movdqa %xmm0,%xmm1
DB 102,15,239,204 ; pxor %xmm4,%xmm1
@@ -58524,7 +58512,7 @@ _sk_lerp_565_sse2_lowp LABEL PROC
DB 102,15,235,249 ; por %xmm1,%xmm7
DB 102,15,111,195 ; movdqa %xmm3,%xmm0
DB 102,15,213,93,168 ; pmullw -0x58(%ebp),%xmm3
- DB 102,15,111,143,25,12,0,0 ; movdqa 0xc19(%edi),%xmm1
+ DB 102,15,111,143,29,12,0,0 ; movdqa 0xc1d(%edi),%xmm1
DB 102,15,239,193 ; pxor %xmm1,%xmm0
DB 102,15,111,101,24 ; movdqa 0x18(%ebp),%xmm4
DB 102,15,213,196 ; pmullw %xmm4,%xmm0
@@ -58618,11 +58606,11 @@ _sk_srcover_rgba_8888_sse2_lowp LABEL PROC
DB 128,227,7 ; and $0x7,%bl
DB 254,203 ; dec %bl
DB 128,251,6 ; cmp $0x6,%bl
- DB 232,0,0,0,0 ; call ca4b <_sk_srcover_rgba_8888_sse2_lowp+0x3f>
+ DB 232,0,0,0,0 ; call ca27 <_sk_srcover_rgba_8888_sse2_lowp+0x3f>
DB 89 ; pop %ecx
DB 139,117,16 ; mov 0x10(%ebp),%esi
DB 15,182,211 ; movzbl %bl,%edx
- DB 119,29 ; ja ca71 <_sk_srcover_rgba_8888_sse2_lowp+0x65>
+ DB 119,29 ; ja ca4d <_sk_srcover_rgba_8888_sse2_lowp+0x65>
DB 102,15,239,219 ; pxor %xmm3,%xmm3
DB 139,132,145,77,2,0,0 ; mov 0x24d(%ecx,%edx,4),%eax
DB 1,200 ; add %ecx,%eax
@@ -58630,14 +58618,14 @@ _sk_srcover_rgba_8888_sse2_lowp LABEL PROC
DB 255,224 ; jmp *%eax
DB 243,15,16,52,183 ; movss (%edi,%esi,4),%xmm6
DB 15,87,219 ; xorps %xmm3,%xmm3
- DB 235,73 ; jmp caba <_sk_srcover_rgba_8888_sse2_lowp+0xae>
+ DB 235,73 ; jmp ca96 <_sk_srcover_rgba_8888_sse2_lowp+0xae>
DB 102,15,16,52,183 ; movupd (%edi,%esi,4),%xmm6
DB 15,16,92,183,16 ; movups 0x10(%edi,%esi,4),%xmm3
- DB 235,61 ; jmp caba <_sk_srcover_rgba_8888_sse2_lowp+0xae>
+ DB 235,61 ; jmp ca96 <_sk_srcover_rgba_8888_sse2_lowp+0xae>
DB 102,15,110,68,183,8 ; movd 0x8(%edi,%esi,4),%xmm0
DB 102,15,112,240,69 ; pshufd $0x45,%xmm0,%xmm6
DB 102,15,18,52,183 ; movlpd (%edi,%esi,4),%xmm6
- DB 235,43 ; jmp caba <_sk_srcover_rgba_8888_sse2_lowp+0xae>
+ DB 235,43 ; jmp ca96 <_sk_srcover_rgba_8888_sse2_lowp+0xae>
DB 102,15,110,68,183,24 ; movd 0x18(%edi,%esi,4),%xmm0
DB 102,15,112,216,69 ; pshufd $0x45,%xmm0,%xmm3
DB 243,15,16,68,183,20 ; movss 0x14(%edi,%esi,4),%xmm0
@@ -58663,7 +58651,7 @@ _sk_srcover_rgba_8888_sse2_lowp LABEL PROC
DB 102,15,114,243,16 ; pslld $0x10,%xmm3
DB 102,15,114,227,16 ; psrad $0x10,%xmm3
DB 102,15,107,243 ; packssdw %xmm3,%xmm6
- DB 102,15,111,153,117,9,0,0 ; movdqa 0x975(%ecx),%xmm3
+ DB 102,15,111,153,121,9,0,0 ; movdqa 0x979(%ecx),%xmm3
DB 102,15,114,208,16 ; psrld $0x10,%xmm0
DB 102,15,114,210,16 ; psrld $0x10,%xmm2
DB 102,15,114,242,16 ; pslld $0x10,%xmm2
@@ -58715,18 +58703,18 @@ _sk_srcover_rgba_8888_sse2_lowp LABEL PROC
DB 102,15,105,220 ; punpckhwd %xmm4,%xmm3
DB 102,15,235,222 ; por %xmm6,%xmm3
DB 128,251,6 ; cmp $0x6,%bl
- DB 119,16 ; ja cbfb <_sk_srcover_rgba_8888_sse2_lowp+0x1ef>
+ DB 119,16 ; ja cbd7 <_sk_srcover_rgba_8888_sse2_lowp+0x1ef>
DB 3,140,145,105,2,0,0 ; add 0x269(%ecx,%edx,4),%ecx
DB 255,225 ; jmp *%ecx
DB 102,15,126,4,183 ; movd %xmm0,(%edi,%esi,4)
- DB 235,64 ; jmp cc3b <_sk_srcover_rgba_8888_sse2_lowp+0x22f>
+ DB 235,64 ; jmp cc17 <_sk_srcover_rgba_8888_sse2_lowp+0x22f>
DB 243,15,127,4,183 ; movdqu %xmm0,(%edi,%esi,4)
DB 243,15,127,92,183,16 ; movdqu %xmm3,0x10(%edi,%esi,4)
- DB 235,51 ; jmp cc3b <_sk_srcover_rgba_8888_sse2_lowp+0x22f>
+ DB 235,51 ; jmp cc17 <_sk_srcover_rgba_8888_sse2_lowp+0x22f>
DB 102,15,112,208,78 ; pshufd $0x4e,%xmm0,%xmm2
DB 102,15,126,84,183,8 ; movd %xmm2,0x8(%edi,%esi,4)
DB 102,15,214,4,183 ; movq %xmm0,(%edi,%esi,4)
- DB 235,33 ; jmp cc3b <_sk_srcover_rgba_8888_sse2_lowp+0x22f>
+ DB 235,33 ; jmp cc17 <_sk_srcover_rgba_8888_sse2_lowp+0x22f>
DB 102,15,112,211,78 ; pshufd $0x4e,%xmm3,%xmm2
DB 102,15,126,84,183,24 ; movd %xmm2,0x18(%edi,%esi,4)
DB 102,15,112,211,229 ; pshufd $0xe5,%xmm3,%xmm2
@@ -58855,11 +58843,11 @@ ALIGN 16
DB 0,128,191,0,0,128 ; add %al,-0x7fffff41(%eax)
DB 191,0,0,224,64 ; mov $0x40e00000,%edi
DB 0,0 ; add %al,(%eax)
- DB 224,64 ; loopne cdb8 <.literal16+0xe8>
+ DB 224,64 ; loopne cd98 <.literal16+0xe8>
DB 0,0 ; add %al,(%eax)
- DB 224,64 ; loopne cdbc <.literal16+0xec>
+ DB 224,64 ; loopne cd9c <.literal16+0xec>
DB 0,0 ; add %al,(%eax)
- DB 224,64 ; loopne cdc0 <.literal16+0xf0>
+ DB 224,64 ; loopne cda0 <.literal16+0xf0>
DB 154,153,153,62,154,153,153 ; lcall $0x9999,$0x9a3e9999
DB 62,154,153,153,62,154,153,153 ; ds lcall $0x9999,$0x9a3e9999
DB 62,61,10,23,63,61 ; ds cmp $0x3d3f170a,%eax
@@ -58870,16 +58858,16 @@ ALIGN 16
DB 63 ; aas
DB 174 ; scas %es:(%edi),%al
DB 71 ; inc %edi
- DB 225,61 ; loope cde1 <.literal16+0x111>
+ DB 225,61 ; loope cdc1 <.literal16+0x111>
DB 174 ; scas %es:(%edi),%al
DB 71 ; inc %edi
- DB 225,61 ; loope cde5 <.literal16+0x115>
+ DB 225,61 ; loope cdc5 <.literal16+0x115>
DB 174 ; scas %es:(%edi),%al
DB 71 ; inc %edi
- DB 225,61 ; loope cde9 <.literal16+0x119>
+ DB 225,61 ; loope cdc9 <.literal16+0x119>
DB 174 ; scas %es:(%edi),%al
DB 71 ; inc %edi
- DB 225,61 ; loope cded <.literal16+0x11d>
+ DB 225,61 ; loope cdcd <.literal16+0x11d>
DB 255,0 ; incl (%eax)
DB 0,0 ; add %al,(%eax)
DB 255,0 ; incl (%eax)
@@ -58889,13 +58877,13 @@ ALIGN 16
DB 255,0 ; incl (%eax)
DB 0,0 ; add %al,(%eax)
DB 0,0 ; add %al,(%eax)
- DB 127,67 ; jg ce07 <.literal16+0x137>
+ DB 127,67 ; jg cde7 <.literal16+0x137>
DB 0,0 ; add %al,(%eax)
- DB 127,67 ; jg ce0b <.literal16+0x13b>
+ DB 127,67 ; jg cdeb <.literal16+0x13b>
DB 0,0 ; add %al,(%eax)
- DB 127,67 ; jg ce0f <.literal16+0x13f>
+ DB 127,67 ; jg cdef <.literal16+0x13f>
DB 0,0 ; add %al,(%eax)
- DB 127,67 ; jg ce13 <.literal16+0x143>
+ DB 127,67 ; jg cdf3 <.literal16+0x143>
DB 145 ; xchg %eax,%ecx
DB 131,158,61,145,131,158,61 ; sbbl $0x3d,-0x617c6ec3(%esi)
DB 145 ; xchg %eax,%ecx
@@ -59046,13 +59034,13 @@ ALIGN 16
DB 132,55 ; test %dh,(%edi)
DB 8,33 ; or %ah,(%ecx)
DB 132,55 ; test %dh,(%edi)
- DB 224,7 ; loopne cf19 <.literal16+0x249>
+ DB 224,7 ; loopne cef9 <.literal16+0x249>
DB 0,0 ; add %al,(%eax)
- DB 224,7 ; loopne cf1d <.literal16+0x24d>
+ DB 224,7 ; loopne cefd <.literal16+0x24d>
DB 0,0 ; add %al,(%eax)
- DB 224,7 ; loopne cf21 <.literal16+0x251>
+ DB 224,7 ; loopne cf01 <.literal16+0x251>
DB 0,0 ; add %al,(%eax)
- DB 224,7 ; loopne cf25 <.literal16+0x255>
+ DB 224,7 ; loopne cf05 <.literal16+0x255>
DB 0,0 ; add %al,(%eax)
DB 33,8 ; and %ecx,(%eax)
DB 2,58 ; add (%edx),%bh
@@ -59101,17 +59089,17 @@ ALIGN 16
DB 0,0 ; add %al,(%eax)
DB 52,255 ; xor $0xff,%al
DB 255 ; (bad)
- DB 127,0 ; jg cf84 <.literal16+0x2b4>
+ DB 127,0 ; jg cf64 <.literal16+0x2b4>
DB 255 ; (bad)
DB 255 ; (bad)
- DB 127,0 ; jg cf88 <.literal16+0x2b8>
+ DB 127,0 ; jg cf68 <.literal16+0x2b8>
DB 255 ; (bad)
DB 255 ; (bad)
- DB 127,0 ; jg cf8c <.literal16+0x2bc>
+ DB 127,0 ; jg cf6c <.literal16+0x2bc>
DB 255 ; (bad)
DB 255 ; (bad)
- DB 127,0 ; jg cf90 <.literal16+0x2c0>
- DB 119,115 ; ja d005 <.literal16+0x335>
+ DB 127,0 ; jg cf70 <.literal16+0x2c0>
+ DB 119,115 ; ja cfe5 <.literal16+0x335>
DB 248 ; clc
DB 194,119,115 ; ret $0x7377
DB 248 ; clc
@@ -59122,7 +59110,7 @@ ALIGN 16
DB 194,117,191 ; ret $0xbf75
DB 191,63,117,191,191 ; mov $0xbfbf753f,%edi
DB 63 ; aas
- DB 117,191 ; jne cf69 <.literal16+0x299>
+ DB 117,191 ; jne cf49 <.literal16+0x299>
DB 191,63,117,191,191 ; mov $0xbfbf753f,%edi
DB 63 ; aas
DB 249 ; stc
@@ -59138,7 +59126,7 @@ ALIGN 16
DB 68 ; inc %esp
DB 180,62 ; mov $0x3e,%ah
DB 163,233,220,63,163 ; mov %eax,0xa33fdce9
- DB 233,220,63,163,233 ; jmp e9a40fa6 <_sk_srcover_rgba_8888_sse2_lowp+0xe9a3459a>
+ DB 233,220,63,163,233 ; jmp e9a40f86 <_sk_srcover_rgba_8888_sse2_lowp+0xe9a3459e>
DB 220,63 ; fdivrl (%edi)
DB 163,233,220,63,81 ; mov %eax,0x513fdce9
DB 140,242 ; mov %?,%edx
@@ -59234,16 +59222,16 @@ ALIGN 16
DB 128,3,62 ; addb $0x3e,(%ebx)
DB 31 ; pop %ds
DB 215 ; xlat %ds:(%ebx)
- DB 118,63 ; jbe d0f3 <.literal16+0x423>
+ DB 118,63 ; jbe d0d3 <.literal16+0x423>
DB 31 ; pop %ds
DB 215 ; xlat %ds:(%ebx)
- DB 118,63 ; jbe d0f7 <.literal16+0x427>
+ DB 118,63 ; jbe d0d7 <.literal16+0x427>
DB 31 ; pop %ds
DB 215 ; xlat %ds:(%ebx)
- DB 118,63 ; jbe d0fb <.literal16+0x42b>
+ DB 118,63 ; jbe d0db <.literal16+0x42b>
DB 31 ; pop %ds
DB 215 ; xlat %ds:(%ebx)
- DB 118,63 ; jbe d0ff <.literal16+0x42f>
+ DB 118,63 ; jbe d0df <.literal16+0x42f>
DB 246,64,83,63 ; testb $0x3f,0x53(%eax)
DB 246,64,83,63 ; testb $0x3f,0x53(%eax)
DB 246,64,83,63 ; testb $0x3f,0x53(%eax)
@@ -59269,13 +59257,13 @@ ALIGN 16
DB 248 ; clc
DB 65 ; inc %ecx
DB 0,0 ; add %al,(%eax)
- DB 124,66 ; jl d136 <.literal16+0x466>
+ DB 124,66 ; jl d116 <.literal16+0x466>
DB 0,0 ; add %al,(%eax)
- DB 124,66 ; jl d13a <.literal16+0x46a>
+ DB 124,66 ; jl d11a <.literal16+0x46a>
DB 0,0 ; add %al,(%eax)
- DB 124,66 ; jl d13e <.literal16+0x46e>
+ DB 124,66 ; jl d11e <.literal16+0x46e>
DB 0,0 ; add %al,(%eax)
- DB 124,66 ; jl d142 <.literal16+0x472>
+ DB 124,66 ; jl d122 <.literal16+0x472>
DB 0,240 ; add %dh,%al
DB 0,0 ; add %al,(%eax)
DB 0,240 ; add %dh,%al
@@ -59321,25 +59309,25 @@ ALIGN 16
DB 136,136,61,137,136,136 ; mov %cl,-0x777776c3(%eax)
DB 61,137,136,136,61 ; cmp $0x3d888889,%eax
DB 0,0 ; add %al,(%eax)
- DB 112,65 ; jo d1c5 <.literal16+0x4f5>
+ DB 112,65 ; jo d1a5 <.literal16+0x4f5>
DB 0,0 ; add %al,(%eax)
- DB 112,65 ; jo d1c9 <.literal16+0x4f9>
+ DB 112,65 ; jo d1a9 <.literal16+0x4f9>
DB 0,0 ; add %al,(%eax)
- DB 112,65 ; jo d1cd <.literal16+0x4fd>
+ DB 112,65 ; jo d1ad <.literal16+0x4fd>
DB 0,0 ; add %al,(%eax)
- DB 112,65 ; jo d1d1 <.literal16+0x501>
+ DB 112,65 ; jo d1b1 <.literal16+0x501>
DB 0,128,0,0,0,128 ; add %al,-0x80000000(%eax)
DB 0,0 ; add %al,(%eax)
DB 0,128,0,0,0,128 ; add %al,-0x80000000(%eax)
DB 0,0 ; add %al,(%eax)
DB 255 ; (bad)
- DB 127,0 ; jg d1a3 <.literal16+0x4d3>
+ DB 127,0 ; jg d183 <.literal16+0x4d3>
DB 0,255 ; add %bh,%bh
- DB 127,0 ; jg d1a7 <.literal16+0x4d7>
+ DB 127,0 ; jg d187 <.literal16+0x4d7>
DB 0,255 ; add %bh,%bh
- DB 127,0 ; jg d1ab <.literal16+0x4db>
+ DB 127,0 ; jg d18b <.literal16+0x4db>
DB 0,255 ; add %bh,%bh
- DB 127,0 ; jg d1af <.literal16+0x4df>
+ DB 127,0 ; jg d18f <.literal16+0x4df>
DB 0,0 ; add %al,(%eax)
DB 4,0 ; add $0x0,%al
DB 0,0 ; add %al,(%eax)
@@ -59365,13 +59353,13 @@ ALIGN 16
DB 255 ; (bad)
DB 255 ; (bad)
DB 255 ; (bad)
- DB 127,255 ; jg d1e8 <.literal16+0x518>
+ DB 127,255 ; jg d1c8 <.literal16+0x518>
DB 255 ; (bad)
DB 255 ; (bad)
- DB 127,255 ; jg d1ec <.literal16+0x51c>
+ DB 127,255 ; jg d1cc <.literal16+0x51c>
DB 255 ; (bad)
DB 255 ; (bad)
- DB 127,0 ; jg d1f1 <.literal16+0x521>
+ DB 127,0 ; jg d1d1 <.literal16+0x521>
DB 0,128,56,0,0,128 ; add %al,-0x7fffffc8(%eax)
DB 56,0 ; cmp %al,(%eax)
DB 0,128,56,0,0,128 ; add %al,-0x7fffffc8(%eax)
@@ -59385,13 +59373,13 @@ ALIGN 16
DB 0,255 ; add %bh,%bh
DB 255,0 ; incl (%eax)
DB 255 ; (bad)
- DB 127,71 ; jg d25b <.literal16+0x58b>
+ DB 127,71 ; jg d23b <.literal16+0x58b>
DB 0,255 ; add %bh,%bh
- DB 127,71 ; jg d25f <.literal16+0x58f>
+ DB 127,71 ; jg d23f <.literal16+0x58f>
DB 0,255 ; add %bh,%bh
- DB 127,71 ; jg d263 <.literal16+0x593>
+ DB 127,71 ; jg d243 <.literal16+0x593>
DB 0,255 ; add %bh,%bh
- DB 127,71 ; jg d267 <.literal16+0x597>
+ DB 127,71 ; jg d247 <.literal16+0x597>
DB 208 ; (bad)
DB 179,89 ; mov $0x59,%bl
DB 62,208 ; ds (bad)
@@ -59444,7 +59432,7 @@ ALIGN 16
DB 192,45,16,17,192,45,16 ; shrb $0x10,0x2dc01110
DB 17,192 ; adc %eax,%eax
DB 45,16,17,192,18 ; sub $0x12c01110,%eax
- DB 120,57 ; js d2cc <.literal16+0x5fc>
+ DB 120,57 ; js d2ac <.literal16+0x5fc>
DB 64 ; inc %eax
DB 18,120,57 ; adc 0x39(%eax),%bh
DB 64 ; inc %eax
@@ -59515,13 +59503,13 @@ ALIGN 16
DB 192,191,0,0,192,191,0 ; sarb $0x0,-0x40400000(%edi)
DB 0,192 ; add %al,%al
DB 191,0,0,192,191 ; mov $0xbfc00000,%edi
- DB 114,28 ; jb d37e <.literal16+0x6ae>
+ DB 114,28 ; jb d35e <.literal16+0x6ae>
DB 199 ; (bad)
- DB 62,114,28 ; jb,pt d382 <.literal16+0x6b2>
+ DB 62,114,28 ; jb,pt d362 <.literal16+0x6b2>
DB 199 ; (bad)
- DB 62,114,28 ; jb,pt d386 <.literal16+0x6b6>
+ DB 62,114,28 ; jb,pt d366 <.literal16+0x6b6>
DB 199 ; (bad)
- DB 62,114,28 ; jb,pt d38a <.literal16+0x6ba>
+ DB 62,114,28 ; jb,pt d36a <.literal16+0x6ba>
DB 199 ; (bad)
DB 62,85 ; ds push %ebp
DB 85 ; push %ebp
@@ -59542,13 +59530,13 @@ ALIGN 16
DB 57,142,99,61,57,142 ; cmp %ecx,-0x71c6c29d(%esi)
DB 99,61,57,142,99,61 ; arpl %di,0x3d638e39
DB 57,142,99,61,114,249 ; cmp %ecx,-0x68dc29d(%esi)
- DB 127,63 ; jg d3e3 <.literal16+0x713>
- DB 114,249 ; jb d39f <.literal16+0x6cf>
- DB 127,63 ; jg d3e7 <.literal16+0x717>
- DB 114,249 ; jb d3a3 <.literal16+0x6d3>
- DB 127,63 ; jg d3eb <.literal16+0x71b>
- DB 114,249 ; jb d3a7 <.literal16+0x6d7>
- DB 127,63 ; jg d3ef <.literal16+0x71f>
+ DB 127,63 ; jg d3c3 <.literal16+0x713>
+ DB 114,249 ; jb d37f <.literal16+0x6cf>
+ DB 127,63 ; jg d3c7 <.literal16+0x717>
+ DB 114,249 ; jb d383 <.literal16+0x6d3>
+ DB 127,63 ; jg d3cb <.literal16+0x71b>
+ DB 114,249 ; jb d387 <.literal16+0x6d7>
+ DB 127,63 ; jg d3cf <.literal16+0x71f>
DB 3,0 ; add (%eax),%eax
DB 0,0 ; add %al,(%eax)
DB 3,0 ; add (%eax),%eax
@@ -59616,14 +59604,14 @@ ALIGN 16
DB 0,248 ; add %bh,%al
DB 0,248 ; add %bh,%al
DB 0,248 ; add %bh,%al
- DB 224,255 ; loopne d441 <.literal16+0x771>
- DB 224,255 ; loopne d443 <.literal16+0x773>
- DB 224,255 ; loopne d445 <.literal16+0x775>
- DB 224,255 ; loopne d447 <.literal16+0x777>
- DB 224,255 ; loopne d449 <.literal16+0x779>
- DB 224,255 ; loopne d44b <.literal16+0x77b>
- DB 224,255 ; loopne d44d <.literal16+0x77d>
- DB 224,255 ; loopne d44f <.literal16+0x77f>
+ DB 224,255 ; loopne d421 <.literal16+0x771>
+ DB 224,255 ; loopne d423 <.literal16+0x773>
+ DB 224,255 ; loopne d425 <.literal16+0x775>
+ DB 224,255 ; loopne d427 <.literal16+0x777>
+ DB 224,255 ; loopne d429 <.literal16+0x779>
+ DB 224,255 ; loopne d42b <.literal16+0x77b>
+ DB 224,255 ; loopne d42d <.literal16+0x77d>
+ DB 224,255 ; loopne d42f <.literal16+0x77f>
DB 54,0,54 ; add %dh,%ss:(%esi)
DB 0,54 ; add %dh,(%esi)
DB 0,54 ; add %dh,(%esi)
@@ -59647,6 +59635,6 @@ ALIGN 4
DB 0,0 ; add %al,(%eax)
DB 0,63 ; add %bh,(%edi)
DB 0,0 ; add %al,(%eax)
- DB 127,67 ; jg d4cb <_sk_srcover_rgba_8888_sse2_lowp+0xabf>
+ DB 127,67 ; jg d4ab <_sk_srcover_rgba_8888_sse2_lowp+0xac3>
ENDIF
END
diff --git a/src/jumper/SkJumper_misc.h b/src/jumper/SkJumper_misc.h
index 8f7ebb56ac..5db2709f05 100644
--- a/src/jumper/SkJumper_misc.h
+++ b/src/jumper/SkJumper_misc.h
@@ -65,7 +65,7 @@ SI void* load_and_inc(void**& program) {
// Lazily resolved on first cast. Does nothing if cast to Ctx::None.
struct Ctx {
- using None = decltype(nullptr);
+ struct None {};
void* ptr;
void**& program;
@@ -77,7 +77,7 @@ struct Ctx {
if (!ptr) { ptr = load_and_inc(program); }
return (T*)ptr;
}
- operator None() { return nullptr; }
+ operator None() { return None{}; }
};
#endif//SkJumper_misc_DEFINED
diff --git a/src/jumper/SkJumper_stages.cpp b/src/jumper/SkJumper_stages.cpp
index 4ba4a76a6b..262b9262de 100644
--- a/src/jumper/SkJumper_stages.cpp
+++ b/src/jumper/SkJumper_stages.cpp
@@ -85,31 +85,29 @@ extern "C" void WRAP(start_pipeline)(size_t x, size_t y, size_t xlimit, size_t y
}
#if defined(__i386__) || defined(_M_IX86) || defined(__arm__)
- #define STAGE(name) \
- SI void name##_k(Ctx ctx, size_t x, size_t y, size_t tail, \
+ #define STAGE(name, ...) \
+ SI void name##_k(__VA_ARGS__, size_t x, size_t y, size_t tail, \
F& r, F& g, F& b, F& a, F& dr, F& dg, F& db, F& da); \
extern "C" void WRAP(name)(Params* params, void** program, \
F r, F g, F b, F a) { \
- Ctx ctx(program); \
- name##_k(ctx,params->x,params->y,params->tail, r,g,b,a, \
+ name##_k(Ctx{program},params->x,params->y,params->tail, r,g,b,a, \
params->dr, params->dg, params->db, params->da); \
auto next = (Stage*)load_and_inc(program); \
next(params,program, r,g,b,a); \
} \
- SI void name##_k(Ctx ctx, size_t x, size_t y, size_t tail, \
+ SI void name##_k(__VA_ARGS__, size_t x, size_t y, size_t tail, \
F& r, F& g, F& b, F& a, F& dr, F& dg, F& db, F& da)
#else
- #define STAGE(name) \
- SI void name##_k(Ctx ctx, size_t x, size_t y, size_t tail, \
+ #define STAGE(name, ...) \
+ SI void name##_k(__VA_ARGS__, size_t x, size_t y, size_t tail, \
F& r, F& g, F& b, F& a, F& dr, F& dg, F& db, F& da); \
extern "C" void WRAP(name)(size_t tail, void** program, size_t x, size_t y, \
F r, F g, F b, F a, F dr, F dg, F db, F da) { \
- Ctx ctx(program); \
- name##_k(ctx,x,y,tail, r,g,b,a, dr,dg,db,da); \
+ name##_k(Ctx{program},x,y,tail, r,g,b,a, dr,dg,db,da); \
auto next = (Stage*)load_and_inc(program); \
next(tail,program,x,y, r,g,b,a, dr,dg,db,da); \
} \
- SI void name##_k(Ctx ctx, size_t x, size_t y, size_t tail, \
+ SI void name##_k(__VA_ARGS__, size_t x, size_t y, size_t tail, \
F& r, F& g, F& b, F& a, F& dr, F& dg, F& db, F& da)
#endif
@@ -214,7 +212,7 @@ SI U32 ix_and_ptr(T** ptr, const SkJumper_GatherCtx* ctx, F x, F y) {
// Now finally, normal Stages!
-STAGE(seed_shader) {
+STAGE(seed_shader, Ctx::None) {
// It's important for speed to explicitly cast(x) and cast(y),
// which has the effect of splatting them to vectors before converting to floats.
// On Intel this breaks a data dependency on previous loop iterations' registers.
@@ -226,9 +224,7 @@ STAGE(seed_shader) {
dr = dg = db = da = 0;
}
-STAGE(dither) {
- auto rate = *(const float*)ctx;
-
+STAGE(dither, const float* rate) {
// Get [(x,y), (x+1,y), (x+2,y), ...] loaded up in integer vectors.
uint32_t iota[] = {0,1,2,3,4,5,6,7};
U32 X = x + unaligned_load<U32>(iota),
@@ -251,9 +247,9 @@ STAGE(dither) {
// like 0 and 1 unchanged after rounding.
F dither = cast(M) * (2/128.0f) - (63/128.0f);
- r += rate*dither;
- g += rate*dither;
- b += rate*dither;
+ r += *rate*dither;
+ g += *rate*dither;
+ b += *rate*dither;
r = max(0, min(r, a));
g = max(0, min(g, a));
@@ -261,8 +257,7 @@ STAGE(dither) {
}
// load 4 floats from memory, and splat them into r,g,b,a
-STAGE(uniform_color) {
- auto c = (const SkJumper_UniformColorCtx*)ctx;
+STAGE(uniform_color, const SkJumper_UniformColorCtx* c) {
r = c->r;
g = c->g;
b = c->b;
@@ -270,18 +265,17 @@ STAGE(uniform_color) {
}
// splats opaque-black into r,g,b,a
-STAGE(black_color) {
+STAGE(black_color, Ctx::None) {
r = g = b = 0.0f;
a = 1.0f;
}
-STAGE(white_color) {
+STAGE(white_color, Ctx::None) {
r = g = b = a = 1.0f;
}
// load registers r,g,b,a from context (mirrors store_rgba)
-STAGE(load_rgba) {
- auto ptr = (const float*)ctx;
+STAGE(load_rgba, const float* ptr) {
r = unaligned_load<F>(ptr + 0*N);
g = unaligned_load<F>(ptr + 1*N);
b = unaligned_load<F>(ptr + 2*N);
@@ -289,8 +283,7 @@ STAGE(load_rgba) {
}
// store registers r,g,b,a into context (mirrors load_rgba)
-STAGE(store_rgba) {
- auto ptr = (float*)ctx;
+STAGE(store_rgba, float* ptr) {
unaligned_store(ptr + 0*N, r);
unaligned_store(ptr + 1*N, g);
unaligned_store(ptr + 2*N, b);
@@ -300,7 +293,7 @@ STAGE(store_rgba) {
// Most blend modes apply the same logic to each channel.
#define BLEND_MODE(name) \
SI F name##_channel(F s, F d, F sa, F da); \
- STAGE(name) { \
+ STAGE(name, Ctx::None) { \
r = name##_channel(r,dr,a,da); \
g = name##_channel(g,dg,a,da); \
b = name##_channel(b,db,a,da); \
@@ -331,7 +324,7 @@ BLEND_MODE(xor_) { return s*inv(da) + d*inv(sa); }
// Most other blend modes apply the same logic to colors, and srcover to alpha.
#define BLEND_MODE(name) \
SI F name##_channel(F s, F d, F sa, F da); \
- STAGE(name) { \
+ STAGE(name, Ctx::None) { \
r = name##_channel(r,dr,a,da); \
g = name##_channel(g,dg,a,da); \
b = name##_channel(b,db,a,da); \
@@ -429,7 +422,7 @@ SI void clip_color(F* r, F* g, F* b, F a) {
*b = clip(*b);
}
-STAGE(hue) {
+STAGE(hue, Ctx::None) {
F R = r*a,
G = g*a,
B = b*a;
@@ -443,7 +436,7 @@ STAGE(hue) {
b = b*inv(da) + db*inv(a) + B;
a = a + da - a*da;
}
-STAGE(saturation) {
+STAGE(saturation, Ctx::None) {
F R = dr*a,
G = dg*a,
B = db*a;
@@ -457,7 +450,7 @@ STAGE(saturation) {
b = b*inv(da) + db*inv(a) + B;
a = a + da - a*da;
}
-STAGE(color) {
+STAGE(color, Ctx::None) {
F R = r*da,
G = g*da,
B = b*da;
@@ -470,7 +463,7 @@ STAGE(color) {
b = b*inv(da) + db*inv(a) + B;
a = a + da - a*da;
}
-STAGE(luminosity) {
+STAGE(luminosity, Ctx::None) {
F R = dr*a,
G = dg*a,
B = db*a;
@@ -484,7 +477,7 @@ STAGE(luminosity) {
a = a + da - a*da;
}
-STAGE(srcover_rgba_8888) {
+STAGE(srcover_rgba_8888, const SkJumper_MemoryCtx* ctx) {
auto ptr = ptr_at_xy<uint32_t>(ctx, x,y);
U32 dst = load<U32>(ptr, tail);
@@ -508,76 +501,75 @@ STAGE(srcover_rgba_8888) {
store(ptr, dst, tail);
}
-STAGE(clamp_0) {
+STAGE(clamp_0, Ctx::None) {
r = max(r, 0);
g = max(g, 0);
b = max(b, 0);
a = max(a, 0);
}
-STAGE(clamp_1) {
+STAGE(clamp_1, Ctx::None) {
r = min(r, 1.0f);
g = min(g, 1.0f);
b = min(b, 1.0f);
a = min(a, 1.0f);
}
-STAGE(clamp_a) {
+STAGE(clamp_a, Ctx::None) {
a = min(a, 1.0f);
r = min(r, a);
g = min(g, a);
b = min(b, a);
}
-STAGE(clamp_a_dst) {
+STAGE(clamp_a_dst, Ctx::None) {
da = min(da, 1.0f);
dr = min(dr, da);
dg = min(dg, da);
db = min(db, da);
}
-STAGE(set_rgb) {
- auto rgb = (const float*)ctx;
+STAGE(set_rgb, const float* rgb) {
r = rgb[0];
g = rgb[1];
b = rgb[2];
}
-STAGE(swap_rb) {
+STAGE(swap_rb, Ctx::None) {
auto tmp = r;
r = b;
b = tmp;
}
-STAGE(invert) {
+STAGE(invert, Ctx::None) {
r = inv(r);
g = inv(g);
b = inv(b);
a = inv(a);
}
-STAGE(move_src_dst) {
+STAGE(move_src_dst, Ctx::None) {
dr = r;
dg = g;
db = b;
da = a;
}
-STAGE(move_dst_src) {
+STAGE(move_dst_src, Ctx::None) {
r = dr;
g = dg;
b = db;
a = da;
}
-STAGE(premul) {
+STAGE(premul, Ctx::None) {
r = r * a;
g = g * a;
b = b * a;
}
-STAGE(premul_dst) {
+STAGE(premul_dst, Ctx::None) {
dr = dr * da;
dg = dg * da;
db = db * da;
}
-STAGE(unpremul) {
+STAGE(unpremul, Ctx::None) {
auto scale = if_then_else(a == 0, 0, 1.0f / a);
r *= scale;
g *= scale;
@@ -590,17 +582,17 @@ SI F from_srgb(F s) {
return if_then_else(s < 0.055f, lo, hi);
}
-STAGE(from_srgb) {
+STAGE(from_srgb, Ctx::None) {
r = from_srgb(r);
g = from_srgb(g);
b = from_srgb(b);
}
-STAGE(from_srgb_dst) {
+STAGE(from_srgb_dst, Ctx::None) {
dr = from_srgb(dr);
dg = from_srgb(dg);
db = from_srgb(db);
}
-STAGE(to_srgb) {
+STAGE(to_srgb, Ctx::None) {
auto fn = [&](F l) {
// We tweak c and d for each instruction set to make sure fn(1) is exactly 1.
#if defined(JUMPER_IS_SSE2) || defined(JUMPER_IS_SSE41) || \
@@ -625,7 +617,7 @@ STAGE(to_srgb) {
b = fn(b);
}
-STAGE(rgb_to_hsl) {
+STAGE(rgb_to_hsl, Ctx::None) {
F mx = max(r,g,b),
mn = min(r,g,b),
d = mx - mn,
@@ -645,7 +637,7 @@ STAGE(rgb_to_hsl) {
g = s;
b = l;
}
-STAGE(hsl_to_rgb) {
+STAGE(hsl_to_rgb, Ctx::None) {
F h = r,
s = g,
l = b;
@@ -674,15 +666,13 @@ SI F alpha_coverage_from_rgb_coverage(F a, F da, F cr, F cg, F cb) {
, max(cr,cg,cb));
}
-STAGE(scale_1_float) {
- auto c = *(const float*)ctx;
-
- r = r * c;
- g = g * c;
- b = b * c;
- a = a * c;
+STAGE(scale_1_float, const float* c) {
+ r = r * *c;
+ g = g * *c;
+ b = b * *c;
+ a = a * *c;
}
-STAGE(scale_u8) {
+STAGE(scale_u8, const SkJumper_MemoryCtx* ctx) {
auto ptr = ptr_at_xy<const uint8_t>(ctx, x,y);
auto scales = load<U8>(ptr, tail);
@@ -693,7 +683,7 @@ STAGE(scale_u8) {
b = b * c;
a = a * c;
}
-STAGE(scale_565) {
+STAGE(scale_565, const SkJumper_MemoryCtx* ctx) {
auto ptr = ptr_at_xy<const uint16_t>(ctx, x,y);
F cr,cg,cb;
@@ -711,15 +701,13 @@ SI F lerp(F from, F to, F t) {
return mad(to-from, t, from);
}
-STAGE(lerp_1_float) {
- auto c = *(const float*)ctx;
-
- r = lerp(dr, r, c);
- g = lerp(dg, g, c);
- b = lerp(db, b, c);
- a = lerp(da, a, c);
+STAGE(lerp_1_float, const float* c) {
+ r = lerp(dr, r, *c);
+ g = lerp(dg, g, *c);
+ b = lerp(db, b, *c);
+ a = lerp(da, a, *c);
}
-STAGE(lerp_u8) {
+STAGE(lerp_u8, const SkJumper_MemoryCtx* ctx) {
auto ptr = ptr_at_xy<const uint8_t>(ctx, x,y);
auto scales = load<U8>(ptr, tail);
@@ -730,7 +718,7 @@ STAGE(lerp_u8) {
b = lerp(db, b, c);
a = lerp(da, a, c);
}
-STAGE(lerp_565) {
+STAGE(lerp_565, const SkJumper_MemoryCtx* ctx) {
auto ptr = ptr_at_xy<const uint16_t>(ctx, x,y);
F cr,cg,cb;
@@ -744,17 +732,14 @@ STAGE(lerp_565) {
a = lerp(da, a, ca);
}
-STAGE(load_tables) {
- auto c = (const SkJumper_LoadTablesCtx*)ctx;
-
+STAGE(load_tables, const SkJumper_LoadTablesCtx* c) {
auto px = load<U32>((const uint32_t*)c->src + x, tail);
r = gather(c->r, (px ) & 0xff);
g = gather(c->g, (px >> 8) & 0xff);
b = gather(c->b, (px >> 16) & 0xff);
a = cast( (px >> 24)) * (1/255.0f);
}
-STAGE(load_tables_u16_be) {
- auto c = (const SkJumper_LoadTablesCtx*)ctx;
+STAGE(load_tables_u16_be, const SkJumper_LoadTablesCtx* c) {
auto ptr = (const uint16_t*)c->src + 4*x;
U16 R,G,B,A;
@@ -766,8 +751,7 @@ STAGE(load_tables_u16_be) {
b = gather(c->b, expand(B) & 0xff);
a = (1/65535.0f) * cast(expand(bswap(A)));
}
-STAGE(load_tables_rgb_u16_be) {
- auto c = (const SkJumper_LoadTablesCtx*)ctx;
+STAGE(load_tables_rgb_u16_be, const SkJumper_LoadTablesCtx* c) {
auto ptr = (const uint16_t*)c->src + 3*x;
U16 R,G,B;
@@ -780,7 +764,7 @@ STAGE(load_tables_rgb_u16_be) {
a = 1.0f;
}
-STAGE(byte_tables) {
+STAGE(byte_tables, const void* ctx) { // TODO: rename Tables SkJumper_ByteTablesCtx
struct Tables { const uint8_t *r, *g, *b, *a; };
auto tables = (const Tables*)ctx;
@@ -790,7 +774,7 @@ STAGE(byte_tables) {
a = from_byte(gather(tables->a, round(a, 255.0f)));
}
-STAGE(byte_tables_rgb) {
+STAGE(byte_tables_rgb, const void* ctx) { // TODO: rename Tables SkJumper_ByteTablesRGBCtx
struct Tables { const uint8_t *r, *g, *b; int n; };
auto tables = (const Tables*)ctx;
@@ -803,29 +787,28 @@ STAGE(byte_tables_rgb) {
SI F table(F v, const SkJumper_TableCtx* ctx) {
return gather(ctx->table, round(v, ctx->size - 1));
}
-STAGE(table_r) { r = table(r, ctx); }
-STAGE(table_g) { g = table(g, ctx); }
-STAGE(table_b) { b = table(b, ctx); }
-STAGE(table_a) { a = table(a, ctx); }
+STAGE(table_r, const SkJumper_TableCtx* ctx) { r = table(r, ctx); }
+STAGE(table_g, const SkJumper_TableCtx* ctx) { g = table(g, ctx); }
+STAGE(table_b, const SkJumper_TableCtx* ctx) { b = table(b, ctx); }
+STAGE(table_a, const SkJumper_TableCtx* ctx) { a = table(a, ctx); }
SI F parametric(F v, const SkJumper_ParametricTransferFunction* ctx) {
F r = if_then_else(v <= ctx->D, mad(ctx->C, v, ctx->F)
, approx_powf(mad(ctx->A, v, ctx->B), ctx->G) + ctx->E);
return min(max(r, 0), 1.0f); // Clamp to [0,1], with argument order mattering to handle NaN.
}
-STAGE(parametric_r) { r = parametric(r, ctx); }
-STAGE(parametric_g) { g = parametric(g, ctx); }
-STAGE(parametric_b) { b = parametric(b, ctx); }
-STAGE(parametric_a) { a = parametric(a, ctx); }
+STAGE(parametric_r, const SkJumper_ParametricTransferFunction* ctx) { r = parametric(r, ctx); }
+STAGE(parametric_g, const SkJumper_ParametricTransferFunction* ctx) { g = parametric(g, ctx); }
+STAGE(parametric_b, const SkJumper_ParametricTransferFunction* ctx) { b = parametric(b, ctx); }
+STAGE(parametric_a, const SkJumper_ParametricTransferFunction* ctx) { a = parametric(a, ctx); }
-STAGE(gamma) {
- float G = *(const float*)ctx;
- r = approx_powf(r,G);
- g = approx_powf(g,G);
- b = approx_powf(b,G);
+STAGE(gamma, const float* G) {
+ r = approx_powf(r, *G);
+ g = approx_powf(g, *G);
+ b = approx_powf(b, *G);
}
-STAGE(lab_to_xyz) {
+STAGE(lab_to_xyz, Ctx::None) {
F L = r * 100.0f,
A = g * 255.0f - 128.0f,
B = b * 255.0f - 128.0f;
@@ -844,69 +827,69 @@ STAGE(lab_to_xyz) {
b = Z * 0.82521f;
}
-STAGE(load_a8) {
+STAGE(load_a8, const SkJumper_MemoryCtx* ctx) {
auto ptr = ptr_at_xy<const uint8_t>(ctx, x,y);
r = g = b = 0.0f;
a = from_byte(load<U8>(ptr, tail));
}
-STAGE(load_a8_dst) {
+STAGE(load_a8_dst, const SkJumper_MemoryCtx* ctx) {
auto ptr = ptr_at_xy<const uint8_t>(ctx, x,y);
dr = dg = db = 0.0f;
da = from_byte(load<U8>(ptr, tail));
}
-STAGE(gather_a8) {
+STAGE(gather_a8, const SkJumper_GatherCtx* ctx) {
const uint8_t* ptr;
U32 ix = ix_and_ptr(&ptr, ctx, r,g);
r = g = b = 0.0f;
a = from_byte(gather(ptr, ix));
}
-STAGE(store_a8) {
+STAGE(store_a8, const SkJumper_MemoryCtx* ctx) {
auto ptr = ptr_at_xy<uint8_t>(ctx, x,y);
U8 packed = pack(pack(round(a, 255.0f)));
store(ptr, packed, tail);
}
-STAGE(load_g8) {
+STAGE(load_g8, const SkJumper_MemoryCtx* ctx) {
auto ptr = ptr_at_xy<const uint8_t>(ctx, x,y);
r = g = b = from_byte(load<U8>(ptr, tail));
a = 1.0f;
}
-STAGE(load_g8_dst) {
+STAGE(load_g8_dst, const SkJumper_MemoryCtx* ctx) {
auto ptr = ptr_at_xy<const uint8_t>(ctx, x,y);
dr = dg = db = from_byte(load<U8>(ptr, tail));
da = 1.0f;
}
-STAGE(gather_g8) {
+STAGE(gather_g8, const SkJumper_GatherCtx* ctx) {
const uint8_t* ptr;
U32 ix = ix_and_ptr(&ptr, ctx, r,g);
r = g = b = from_byte(gather(ptr, ix));
a = 1.0f;
}
-STAGE(load_565) {
+STAGE(load_565, const SkJumper_MemoryCtx* ctx) {
auto ptr = ptr_at_xy<const uint16_t>(ctx, x,y);
from_565(load<U16>(ptr, tail), &r,&g,&b);
a = 1.0f;
}
-STAGE(load_565_dst) {
+STAGE(load_565_dst, const SkJumper_MemoryCtx* ctx) {
auto ptr = ptr_at_xy<const uint16_t>(ctx, x,y);
from_565(load<U16>(ptr, tail), &dr,&dg,&db);
da = 1.0f;
}
-STAGE(gather_565) {
+STAGE(gather_565, const SkJumper_GatherCtx* ctx) {
const uint16_t* ptr;
U32 ix = ix_and_ptr(&ptr, ctx, r,g);
from_565(gather(ptr, ix), &r,&g,&b);
a = 1.0f;
}
-STAGE(store_565) {
+STAGE(store_565, const SkJumper_MemoryCtx* ctx) {
auto ptr = ptr_at_xy<uint16_t>(ctx, x,y);
U16 px = pack( round(r, 31.0f) << 11
@@ -915,20 +898,20 @@ STAGE(store_565) {
store(ptr, px, tail);
}
-STAGE(load_4444) {
+STAGE(load_4444, const SkJumper_MemoryCtx* ctx) {
auto ptr = ptr_at_xy<const uint16_t>(ctx, x,y);
from_4444(load<U16>(ptr, tail), &r,&g,&b,&a);
}
-STAGE(load_4444_dst) {
+STAGE(load_4444_dst, const SkJumper_MemoryCtx* ctx) {
auto ptr = ptr_at_xy<const uint16_t>(ctx, x,y);
from_4444(load<U16>(ptr, tail), &dr,&dg,&db,&da);
}
-STAGE(gather_4444) {
+STAGE(gather_4444, const SkJumper_GatherCtx* ctx) {
const uint16_t* ptr;
U32 ix = ix_and_ptr(&ptr, ctx, r,g);
from_4444(gather(ptr, ix), &r,&g,&b,&a);
}
-STAGE(store_4444) {
+STAGE(store_4444, const SkJumper_MemoryCtx* ctx) {
auto ptr = ptr_at_xy<uint16_t>(ctx, x,y);
U16 px = pack( round(r, 15.0f) << 12
| round(g, 15.0f) << 8
@@ -937,20 +920,20 @@ STAGE(store_4444) {
store(ptr, px, tail);
}
-STAGE(load_8888) {
+STAGE(load_8888, const SkJumper_MemoryCtx* ctx) {
auto ptr = ptr_at_xy<const uint32_t>(ctx, x,y);
from_8888(load<U32>(ptr, tail), &r,&g,&b,&a);
}
-STAGE(load_8888_dst) {
+STAGE(load_8888_dst, const SkJumper_MemoryCtx* ctx) {
auto ptr = ptr_at_xy<const uint32_t>(ctx, x,y);
from_8888(load<U32>(ptr, tail), &dr,&dg,&db,&da);
}
-STAGE(gather_8888) {
+STAGE(gather_8888, const SkJumper_GatherCtx* ctx) {
const uint32_t* ptr;
U32 ix = ix_and_ptr(&ptr, ctx, r,g);
from_8888(gather(ptr, ix), &r,&g,&b,&a);
}
-STAGE(store_8888) {
+STAGE(store_8888, const SkJumper_MemoryCtx* ctx) {
auto ptr = ptr_at_xy<uint32_t>(ctx, x,y);
U32 px = round(r, 255.0f)
@@ -960,20 +943,20 @@ STAGE(store_8888) {
store(ptr, px, tail);
}
-STAGE(load_bgra) {
+STAGE(load_bgra, const SkJumper_MemoryCtx* ctx) {
auto ptr = ptr_at_xy<const uint32_t>(ctx, x,y);
from_8888(load<U32>(ptr, tail), &b,&g,&r,&a);
}
-STAGE(load_bgra_dst) {
+STAGE(load_bgra_dst, const SkJumper_MemoryCtx* ctx) {
auto ptr = ptr_at_xy<const uint32_t>(ctx, x,y);
from_8888(load<U32>(ptr, tail), &db,&dg,&dr,&da);
}
-STAGE(gather_bgra) {
+STAGE(gather_bgra, const SkJumper_GatherCtx* ctx) {
const uint32_t* ptr;
U32 ix = ix_and_ptr(&ptr, ctx, r,g);
from_8888(gather(ptr, ix), &b,&g,&r,&a);
}
-STAGE(store_bgra) {
+STAGE(store_bgra, const SkJumper_MemoryCtx* ctx) {
auto ptr = ptr_at_xy<uint32_t>(ctx, x,y);
U32 px = round(b, 255.0f)
@@ -983,7 +966,7 @@ STAGE(store_bgra) {
store(ptr, px, tail);
}
-STAGE(load_f16) {
+STAGE(load_f16, const SkJumper_MemoryCtx* ctx) {
auto ptr = ptr_at_xy<const uint64_t>(ctx, x,y);
U16 R,G,B,A;
@@ -993,7 +976,7 @@ STAGE(load_f16) {
b = from_half(B);
a = from_half(A);
}
-STAGE(load_f16_dst) {
+STAGE(load_f16_dst, const SkJumper_MemoryCtx* ctx) {
auto ptr = ptr_at_xy<const uint64_t>(ctx, x,y);
U16 R,G,B,A;
@@ -1003,7 +986,7 @@ STAGE(load_f16_dst) {
db = from_half(B);
da = from_half(A);
}
-STAGE(gather_f16) {
+STAGE(gather_f16, const SkJumper_GatherCtx* ctx) {
const uint64_t* ptr;
U32 ix = ix_and_ptr(&ptr, ctx, r,g);
auto px = gather(ptr, ix);
@@ -1015,7 +998,7 @@ STAGE(gather_f16) {
b = from_half(B);
a = from_half(A);
}
-STAGE(store_f16) {
+STAGE(store_f16, const SkJumper_MemoryCtx* ctx) {
auto ptr = ptr_at_xy<uint64_t>(ctx, x,y);
store4((uint16_t*)ptr,tail, to_half(r)
, to_half(g)
@@ -1023,7 +1006,7 @@ STAGE(store_f16) {
, to_half(a));
}
-STAGE(load_u16_be) {
+STAGE(load_u16_be, const SkJumper_MemoryCtx* ctx) {
auto ptr = ptr_at_xy<const uint16_t>(ctx, 4*x,y);
U16 R,G,B,A;
@@ -1034,7 +1017,7 @@ STAGE(load_u16_be) {
b = (1/65535.0f) * cast(expand(bswap(B)));
a = (1/65535.0f) * cast(expand(bswap(A)));
}
-STAGE(load_rgb_u16_be) {
+STAGE(load_rgb_u16_be, const SkJumper_MemoryCtx* ctx) {
auto ptr = ptr_at_xy<const uint16_t>(ctx, 3*x,y);
U16 R,G,B;
@@ -1045,7 +1028,7 @@ STAGE(load_rgb_u16_be) {
b = (1/65535.0f) * cast(expand(bswap(B)));
a = 1.0f;
}
-STAGE(store_u16_be) {
+STAGE(store_u16_be, const SkJumper_MemoryCtx* ctx) {
auto ptr = ptr_at_xy<uint16_t>(ctx, 4*x,y);
U16 R = bswap(pack(round(r, 65535.0f))),
@@ -1056,15 +1039,15 @@ STAGE(store_u16_be) {
store4(ptr,tail, R,G,B,A);
}
-STAGE(load_f32) {
+STAGE(load_f32, const SkJumper_MemoryCtx* ctx) {
auto ptr = ptr_at_xy<const float>(ctx, 4*x,y);
load4(ptr,tail, &r,&g,&b,&a);
}
-STAGE(load_f32_dst) {
+STAGE(load_f32_dst, const SkJumper_MemoryCtx* ctx) {
auto ptr = ptr_at_xy<const float>(ctx, 4*x,y);
load4(ptr,tail, &dr,&dg,&db,&da);
}
-STAGE(store_f32) {
+STAGE(store_f32, const SkJumper_MemoryCtx* ctx) {
auto ptr = ptr_at_xy<float>(ctx, 4*x,y);
store4(ptr,tail, r,g,b,a);
}
@@ -1080,44 +1063,36 @@ SI F exclusive_mirror(F v, const SkJumper_TileCtx* ctx) {
// Tile x or y to [0,limit) == [0,limit - 1 ulp] (think, sampling from images).
// The gather stages will hard clamp the output of these stages to [0,limit)...
// we just need to do the basic repeat or mirroring.
-STAGE(repeat_x) { r = exclusive_repeat(r, (const SkJumper_TileCtx*)ctx); }
-STAGE(repeat_y) { g = exclusive_repeat(g, (const SkJumper_TileCtx*)ctx); }
-STAGE(mirror_x) { r = exclusive_mirror(r, (const SkJumper_TileCtx*)ctx); }
-STAGE(mirror_y) { g = exclusive_mirror(g, (const SkJumper_TileCtx*)ctx); }
+STAGE(repeat_x, const SkJumper_TileCtx* ctx) { r = exclusive_repeat(r, ctx); }
+STAGE(repeat_y, const SkJumper_TileCtx* ctx) { g = exclusive_repeat(g, ctx); }
+STAGE(mirror_x, const SkJumper_TileCtx* ctx) { r = exclusive_mirror(r, ctx); }
+STAGE(mirror_y, const SkJumper_TileCtx* ctx) { g = exclusive_mirror(g, ctx); }
// Clamp x to [0,1], both sides inclusive (think, gradients).
-STAGE( clamp_x_1) { r = min(max(0, r), 1.0f); }
-STAGE(repeat_x_1) { r = r - floor_(r); }
-STAGE(mirror_x_1) { r = abs_( (r-1.0f) - two(floor_((r-1.0f)*0.5f)) - 1.0f ); }
+STAGE( clamp_x_1, Ctx::None) { r = min(max(0, r), 1.0f); }
+STAGE(repeat_x_1, Ctx::None) { r = r - floor_(r); }
+STAGE(mirror_x_1, Ctx::None) { r = abs_( (r-1.0f) - two(floor_((r-1.0f)*0.5f)) - 1.0f ); }
-STAGE(luminance_to_alpha) {
+STAGE(luminance_to_alpha, Ctx::None) {
a = r*0.2126f + g*0.7152f + b*0.0722f;
r = g = b = 0;
}
-STAGE(matrix_translate) {
- auto m = (const float*)ctx;
-
+STAGE(matrix_translate, const float* m) {
r += m[0];
g += m[1];
}
-STAGE(matrix_scale_translate) {
- auto m = (const float*)ctx;
-
+STAGE(matrix_scale_translate, const float* m) {
r = mad(r,m[2], m[0]);
g = mad(g,m[3], m[1]);
}
-STAGE(matrix_2x3) {
- auto m = (const float*)ctx;
-
+STAGE(matrix_2x3, const float* m) {
auto R = mad(r,m[0], mad(g,m[2], m[4])),
G = mad(r,m[1], mad(g,m[3], m[5]));
r = R;
g = G;
}
-STAGE(matrix_3x4) {
- auto m = (const float*)ctx;
-
+STAGE(matrix_3x4, const float* m) {
auto R = mad(r,m[0], mad(g,m[3], mad(b,m[6], m[ 9]))),
G = mad(r,m[1], mad(g,m[4], mad(b,m[7], m[10]))),
B = mad(r,m[2], mad(g,m[5], mad(b,m[8], m[11])));
@@ -1125,9 +1100,7 @@ STAGE(matrix_3x4) {
g = G;
b = B;
}
-STAGE(matrix_4x5) {
- auto m = (const float*)ctx;
-
+STAGE(matrix_4x5, const float* m) {
auto R = mad(r,m[0], mad(g,m[4], mad(b,m[ 8], mad(a,m[12], m[16])))),
G = mad(r,m[1], mad(g,m[5], mad(b,m[ 9], mad(a,m[13], m[17])))),
B = mad(r,m[2], mad(g,m[6], mad(b,m[10], mad(a,m[14], m[18])))),
@@ -1137,8 +1110,7 @@ STAGE(matrix_4x5) {
b = B;
a = A;
}
-STAGE(matrix_4x3) {
- auto m = (const float*)ctx;
+STAGE(matrix_4x3, const float* m) {
auto X = r,
Y = g;
@@ -1147,10 +1119,8 @@ STAGE(matrix_4x3) {
b = mad(X, m[2], mad(Y, m[6], m[10]));
a = mad(X, m[3], mad(Y, m[7], m[11]));
}
-STAGE(matrix_perspective) {
+STAGE(matrix_perspective, const float* m) {
// N.B. Unlike the other matrix_ stages, this matrix is row-major.
- auto m = (const float*)ctx;
-
auto R = mad(r,m[0], mad(g,m[1], m[2])),
G = mad(r,m[3], mad(g,m[4], m[5])),
Z = mad(r,m[6], mad(g,m[7], m[8]));
@@ -1190,14 +1160,14 @@ SI void gradient_lookup(const SkJumper_GradientCtx* c, U32 idx, F t,
*a = mad(t, fa, ba);
}
-STAGE(evenly_spaced_gradient) {
- auto c = (const SkJumper_GradientCtx*)ctx;
+STAGE(evenly_spaced_gradient, const SkJumper_GradientCtx* c) {
auto t = r;
auto idx = trunc_(t * (c->stopCount-1));
gradient_lookup(c, idx, t, &r, &g, &b, &a);
}
-STAGE(gauss_a_to_rgba) {
+// TODO: move this somewhere not in the middle of the gradients...
+STAGE(gauss_a_to_rgba, Ctx::None) {
// x = 1 - x;
// exp(-x * x * 4) - 0.018f;
// ... now approximate with quartic
@@ -1213,8 +1183,7 @@ STAGE(gauss_a_to_rgba) {
b = a;
}
-STAGE(gradient) {
- auto c = (const SkJumper_GradientCtx*)ctx;
+STAGE(gradient, const SkJumper_GradientCtx* c) {
auto t = r;
U32 idx = 0;
@@ -1226,7 +1195,8 @@ STAGE(gradient) {
gradient_lookup(c, idx, t, &r, &g, &b, &a);
}
-STAGE(evenly_spaced_2_stop_gradient) {
+STAGE(evenly_spaced_2_stop_gradient, const void* ctx) {
+ // TODO: Rename Ctx SkJumper_EvenlySpacedGradientCtx.
struct Ctx { float f[4], b[4]; };
auto c = (const Ctx*)ctx;
@@ -1237,7 +1207,7 @@ STAGE(evenly_spaced_2_stop_gradient) {
a = mad(t, c->f[3], c->b[3]);
}
-STAGE(xy_to_unit_angle) {
+STAGE(xy_to_unit_angle, Ctx::None) {
F X = r,
Y = g;
F xabs = abs_(X),
@@ -1263,7 +1233,7 @@ STAGE(xy_to_unit_angle) {
r = phi;
}
-STAGE(xy_to_radius) {
+STAGE(xy_to_radius, Ctx::None) {
F X2 = r * r,
Y2 = g * g;
r = sqrt_(X2 + Y2);
@@ -1302,26 +1272,22 @@ SI F solve_2pt_conical_quadratic(const SkJumper_2PtConicalCtx* c, F x, F y, F (*
(-coeffB - sqrt_disc) * (invCoeffA * 0.5f));
}
-STAGE(xy_to_2pt_conical_quadratic_max) {
+STAGE(xy_to_2pt_conical_quadratic_max, const SkJumper_2PtConicalCtx* ctx) {
r = solve_2pt_conical_quadratic(ctx, r, g, max);
}
-STAGE(xy_to_2pt_conical_quadratic_min) {
+STAGE(xy_to_2pt_conical_quadratic_min, const SkJumper_2PtConicalCtx* ctx) {
r = solve_2pt_conical_quadratic(ctx, r, g, min);
}
-STAGE(xy_to_2pt_conical_linear) {
- auto* c = (const SkJumper_2PtConicalCtx*)ctx;
-
+STAGE(xy_to_2pt_conical_linear, const SkJumper_2PtConicalCtx* c) {
const F coeffB = -2 * (r + c->fDR*c->fR0),
coeffC = r*r + g*g - c->fR0*c->fR0;
r = -coeffC / coeffB;
}
-STAGE(mask_2pt_conical_degenerates) {
- auto* c = (SkJumper_2PtConicalCtx*)ctx;
-
+STAGE(mask_2pt_conical_degenerates, SkJumper_2PtConicalCtx* c) {
// The gradient t coordinate is in the r register right now.
F& t = r;
@@ -1329,22 +1295,19 @@ STAGE(mask_2pt_conical_degenerates) {
// and save a mask to ignore those colors in apply_vector_mask.
auto is_degenerate = (mad(t, c->fDR, c->fR0) < 0) // Radius(t) < 0
| (t != t); // t == NaN
-
t = if_then_else(is_degenerate, F(0), t);
unaligned_store(&c->fMask, if_then_else(is_degenerate, U32(0), U32(0xffffffff)));
}
-STAGE(apply_vector_mask) {
- const U32 mask = unaligned_load<U32>((const uint32_t*)ctx);
+STAGE(apply_vector_mask, const uint32_t* ctx) {
+ const U32 mask = unaligned_load<U32>(ctx);
r = bit_cast<F>(bit_cast<U32>(r) & mask);
g = bit_cast<F>(bit_cast<U32>(g) & mask);
b = bit_cast<F>(bit_cast<U32>(b) & mask);
a = bit_cast<F>(bit_cast<U32>(a) & mask);
}
-STAGE(save_xy) {
- auto c = (SkJumper_SamplerCtx*)ctx;
-
+STAGE(save_xy, SkJumper_SamplerCtx* c) {
// Whether bilinear or bicubic, all sample points are at the same fractional offset (fx,fy).
// They're either the 4 corners of a logical 1x1 pixel or the 16 corners of a 3x3 grid
// surrounding (x,y) at (0.5,0.5) off-center.
@@ -1358,9 +1321,7 @@ STAGE(save_xy) {
unaligned_store(c->fy, fy);
}
-STAGE(accumulate) {
- auto c = (const SkJumper_SamplerCtx*)ctx;
-
+STAGE(accumulate, const SkJumper_SamplerCtx* c) {
// Bilinear and bicubic filters are both separable, so we produce independent contributions
// from x and y, multiplying them together here to get each pixel's total scale factor.
auto scale = unaligned_load<F>(c->scalex)
@@ -1397,10 +1358,10 @@ SI void bilinear_y(SkJumper_SamplerCtx* ctx, F* y) {
unaligned_store(ctx->scaley, scaley);
}
-STAGE(bilinear_nx) { bilinear_x<-1>(ctx, &r); }
-STAGE(bilinear_px) { bilinear_x<+1>(ctx, &r); }
-STAGE(bilinear_ny) { bilinear_y<-1>(ctx, &g); }
-STAGE(bilinear_py) { bilinear_y<+1>(ctx, &g); }
+STAGE(bilinear_nx, SkJumper_SamplerCtx* ctx) { bilinear_x<-1>(ctx, &r); }
+STAGE(bilinear_px, SkJumper_SamplerCtx* ctx) { bilinear_x<+1>(ctx, &r); }
+STAGE(bilinear_ny, SkJumper_SamplerCtx* ctx) { bilinear_y<-1>(ctx, &g); }
+STAGE(bilinear_py, SkJumper_SamplerCtx* ctx) { bilinear_y<+1>(ctx, &g); }
// In bicubic interpolation, the 16 pixels and +/- 0.5 and +/- 1.5 offsets from the sample
@@ -1443,18 +1404,17 @@ SI void bicubic_y(SkJumper_SamplerCtx* ctx, F* y) {
unaligned_store(ctx->scaley, scaley);
}
-STAGE(bicubic_n3x) { bicubic_x<-3>(ctx, &r); }
-STAGE(bicubic_n1x) { bicubic_x<-1>(ctx, &r); }
-STAGE(bicubic_p1x) { bicubic_x<+1>(ctx, &r); }
-STAGE(bicubic_p3x) { bicubic_x<+3>(ctx, &r); }
+STAGE(bicubic_n3x, SkJumper_SamplerCtx* ctx) { bicubic_x<-3>(ctx, &r); }
+STAGE(bicubic_n1x, SkJumper_SamplerCtx* ctx) { bicubic_x<-1>(ctx, &r); }
+STAGE(bicubic_p1x, SkJumper_SamplerCtx* ctx) { bicubic_x<+1>(ctx, &r); }
+STAGE(bicubic_p3x, SkJumper_SamplerCtx* ctx) { bicubic_x<+3>(ctx, &r); }
-STAGE(bicubic_n3y) { bicubic_y<-3>(ctx, &g); }
-STAGE(bicubic_n1y) { bicubic_y<-1>(ctx, &g); }
-STAGE(bicubic_p1y) { bicubic_y<+1>(ctx, &g); }
-STAGE(bicubic_p3y) { bicubic_y<+3>(ctx, &g); }
+STAGE(bicubic_n3y, SkJumper_SamplerCtx* ctx) { bicubic_y<-3>(ctx, &g); }
+STAGE(bicubic_n1y, SkJumper_SamplerCtx* ctx) { bicubic_y<-1>(ctx, &g); }
+STAGE(bicubic_p1y, SkJumper_SamplerCtx* ctx) { bicubic_y<+1>(ctx, &g); }
+STAGE(bicubic_p3y, SkJumper_SamplerCtx* ctx) { bicubic_y<+3>(ctx, &g); }
-STAGE(callback) {
- auto c = (SkJumper_CallbackCtx*)ctx;
+STAGE(callback, SkJumper_CallbackCtx* c) {
store4(c->rgba,0, r,g,b,a);
c->fn(c, tail ? tail : N);
load4(c->read_from,0, &r,&g,&b,&a);
@@ -1502,11 +1462,11 @@ inline void color_lookup_table<0>(const SkJumper_ColorLookupTableCtx* ctx,
b = gather(ctx->table, 3*index+2);
}
-STAGE(clut_3D) {
+STAGE(clut_3D, const SkJumper_ColorLookupTableCtx* ctx) {
color_lookup_table<3>(ctx, r,g,b,a, 0,1);
// This 3D color lookup table leaves alpha alone.
}
-STAGE(clut_4D) {
+STAGE(clut_4D, const SkJumper_ColorLookupTableCtx* ctx) {
color_lookup_table<4>(ctx, r,g,b,a, 0,1);
// "a" was really CMYK's K, so we just set alpha opaque.
a = 1.0f;