diff options
author | Mike Klein <mtklein@chromium.org> | 2017-09-27 11:42:30 -0400 |
---|---|---|
committer | Skia Commit-Bot <skia-commit-bot@chromium.org> | 2017-09-28 18:08:28 +0000 |
commit | f7729c262076b88b2635e7f8d09e7f3340eea79b (patch) | |
tree | 20ecc274046d229721ae9383359e4e5ff370a2a1 /src/jumper | |
parent | 6c08b7bbe47201a21d9e53a907b4baa906bb20b4 (diff) |
Move context types into STAGE() macros.
This is something I came up with while writing _lowp.cpp.
This should all be a logical no-op, but there are some code generation
changes. I'm not exactly sure why.
Change-Id: Iaad36b5298b37fe26ebd375a147a48852f98e1e4
Reviewed-on: https://skia-review.googlesource.com/52003
Commit-Queue: Mike Klein <mtklein@chromium.org>
Reviewed-by: Herb Derby <herb@google.com>
Diffstat (limited to 'src/jumper')
-rw-r--r-- | src/jumper/SkJumper_generated.S | 2008 | ||||
-rw-r--r-- | src/jumper/SkJumper_generated_win.S | 1736 | ||||
-rw-r--r-- | src/jumper/SkJumper_misc.h | 4 | ||||
-rw-r--r-- | src/jumper/SkJumper_stages.cpp | 346 |
4 files changed, 2007 insertions, 2087 deletions
diff --git a/src/jumper/SkJumper_generated.S b/src/jumper/SkJumper_generated.S index ac9aef2434..337703b096 100644 --- a/src/jumper/SkJumper_generated.S +++ b/src/jumper/SkJumper_generated.S @@ -6808,11 +6808,11 @@ _sk_evenly_spaced_gradient_vfp4: .long 0xed2d8b10 // vpush {d8-d15} .long 0xe24dd010 // sub sp, sp, #16 .long 0xe58d0008 // str r0, [sp, #8] - .long 0xe2810004 // add r0, r1, #4 - .long 0xe58d000c // str r0, [sp, #12] - .long 0xe1a0c001 // mov ip, r1 - .long 0xe49c7008 // ldr r7, [ip], #8 .long 0xf2600150 // vorr q8, q0, q0 + .long 0xe5917000 // ldr r7, [r1] + .long 0xe5910004 // ldr r0, [r1, #4] + .long 0xe2811008 // add r1, r1, #8 + .long 0xe58d000c // str r0, [sp, #12] .long 0xe8974204 // ldm r7, {r2, r9, lr} .long 0xe2422001 // sub r2, r2, #1 .long 0xe5970010 // ldr r0, [r7, #16] @@ -6848,34 +6848,31 @@ _sk_evenly_spaced_gradient_vfp4: .long 0xed90ca00 // vldr s24, [r0] .long 0xe597001c // ldr r0, [r7, #28] .long 0xe0806103 // add r6, r0, r3, lsl #2 + .long 0xe0808102 // add r8, r0, r2, lsl #2 .long 0xe080a104 // add sl, r0, r4, lsl #2 .long 0xedd65a00 // vldr s11, [r6] .long 0xe0806105 // add r6, r0, r5, lsl #2 .long 0xe58d6004 // str r6, [sp, #4] - .long 0xe0806102 // add r6, r0, r2, lsl #2 - .long 0xe58d6000 // str r6, [sp] .long 0xe5970018 // ldr r0, [r7, #24] - .long 0xed9a5a00 // vldr s10, [sl] - .long 0xe0808103 // add r8, r0, r3, lsl #2 + .long 0xe5977014 // ldr r7, [r7, #20] + .long 0xe080c103 // add ip, r0, r3, lsl #2 .long 0xe0806104 // add r6, r0, r4, lsl #2 - .long 0xedd83a00 // vldr s7, [r8] + .long 0xed9a5a00 // vldr s10, [sl] + .long 0xeddc3a00 // vldr s7, [ip] + .long 0xedd84a00 // vldr s9, [r8] .long 0xed963a00 // vldr s6, [r6] .long 0xe0806102 // add r6, r0, r2, lsl #2 .long 0xe0800105 // add r0, r0, r5, lsl #2 .long 0xedd62a00 // vldr s5, [r6] - .long 0xe5976014 // ldr r6, [r7, #20] + .long 0xe0876103 // add r6, r7, r3, lsl #2 + .long 0xedd69a00 // vldr s19, [r6] + .long 0xe0876104 // add r6, r7, r4, lsl #2 .long 0xed902a00 // vldr s4, [r0] - .long 0xe0867103 // add r7, r6, r3, lsl #2 - .long 0xe59d0000 // ldr r0, [sp] - .long 0xedd79a00 // vldr s19, [r7] - .long 0xe0867104 // add r7, r6, r4, lsl #2 - .long 0xedd04a00 // vldr s9, [r0] - .long 0xed979a00 // vldr s18, [r7] - .long 0xe08e7103 // add r7, lr, r3, lsl #2 + .long 0xed969a00 // vldr s18, [r6] + .long 0xe08e6103 // add r6, lr, r3, lsl #2 .long 0xe0893103 // add r3, r9, r3, lsl #2 .long 0xe59d0004 // ldr r0, [sp, #4] - .long 0xedd71a00 // vldr s3, [r7] - .long 0xe08e7105 // add r7, lr, r5, lsl #2 + .long 0xedd61a00 // vldr s3, [r6] .long 0xedd3fa00 // vldr s31, [r3] .long 0xe0893104 // add r3, r9, r4, lsl #2 .long 0xed904a00 // vldr s8, [r0] @@ -6888,16 +6885,16 @@ _sk_evenly_spaced_gradient_vfp4: .long 0xe0893105 // add r3, r9, r5, lsl #2 .long 0xe59d0008 // ldr r0, [sp, #8] .long 0xed93ea00 // vldr s28, [r3] - .long 0xe0863102 // add r3, r6, r2, lsl #2 + .long 0xe0873102 // add r3, r7, r2, lsl #2 .long 0xedd38a00 // vldr s17, [r3] - .long 0xe0863105 // add r3, r6, r5, lsl #2 + .long 0xe0873105 // add r3, r7, r5, lsl #2 + .long 0xe08e7105 // add r7, lr, r5, lsl #2 .long 0xed938a00 // vldr s16, [r3] .long 0xe08e3104 // add r3, lr, r4, lsl #2 .long 0xf2008cde // vfma.f32 q4, q8, q7 .long 0xed931a00 // vldr s2, [r3] .long 0xe08e3102 // add r3, lr, r2, lsl #2 - .long 0xe5912004 // ldr r2, [r1, #4] - .long 0xe1a0100c // mov r1, ip + .long 0xe59d200c // ldr r2, [sp, #12] .long 0xedd30a00 // vldr s1, [r3] .long 0xe08b3105 // add r3, fp, r5, lsl #2 .long 0xed936a00 // vldr s12, [r3] @@ -6910,7 +6907,6 @@ _sk_evenly_spaced_gradient_vfp4: .long 0xe28dd004 // add sp, sp, #4 .long 0xe8bd4ff0 // pop {r4, r5, r6, r7, r8, r9, sl, fp, lr} .long 0xe12fff12 // bx r2 - .long 0xe320f000 // nop {0} HIDDEN _sk_gauss_a_to_rgba_vfp4 .globl _sk_gauss_a_to_rgba_vfp4 @@ -6964,110 +6960,107 @@ _sk_gradient_vfp4: .long 0xe92d4ff0 // push {r4, r5, r6, r7, r8, r9, sl, fp, lr} .long 0xe24dd004 // sub sp, sp, #4 .long 0xed2d8b10 // vpush {d8-d15} - .long 0xe24dd008 // sub sp, sp, #8 - .long 0xe2812004 // add r2, r1, #4 - .long 0xe58d2004 // str r2, [sp, #4] - .long 0xe5913000 // ldr r3, [r1] + .long 0xe5912000 // ldr r2, [r1] .long 0xf2606150 // vorr q11, q0, q0 .long 0xf2c02050 // vmov.i32 q9, #0 .long 0xf2c00050 // vmov.i32 q8, #0 - .long 0xe5931000 // ldr r1, [r3] - .long 0xe3510002 // cmp r1, #2 - .long 0x3a00000a // bcc 62e8 <sk_gradient_vfp4+0x60> - .long 0xe5932024 // ldr r2, [r3, #36] + .long 0xe5923000 // ldr r3, [r2] + .long 0xe3530002 // cmp r3, #2 + .long 0x3a00000a // bcc 62cc <sk_gradient_vfp4+0x54> + .long 0xe5927024 // ldr r7, [r2, #36] .long 0xf2c04051 // vmov.i32 q10, #1 .long 0xf2c00050 // vmov.i32 q8, #0 - .long 0xe2411001 // sub r1, r1, #1 - .long 0xe2822004 // add r2, r2, #4 - .long 0xf4e28cbd // vld1.32 {d24[]-d25[]}, [r2 :32]! - .long 0xe2511001 // subs r1, r1, #1 + .long 0xe2433001 // sub r3, r3, #1 + .long 0xe2877004 // add r7, r7, #4 + .long 0xf4e78cbd // vld1.32 {d24[]-d25[]}, [r7 :32]! + .long 0xe2533001 // subs r3, r3, #1 .long 0xf3468ee8 // vcge.f32 q12, q11, q12 .long 0xf35481f2 // vbsl q12, q10, q9 .long 0xf26008e8 // vadd.i32 q8, q8, q12 - .long 0x1afffff9 // bne 62d0 <sk_gradient_vfp4+0x48> - .long 0xee317b90 // vmov.32 r7, d17[1] - .long 0xe9934400 // ldmib r3, {sl, lr} - .long 0xee111b90 // vmov.32 r1, d17[0] - .long 0xe5935010 // ldr r5, [r3, #16] - .long 0xe593c020 // ldr ip, [r3, #32] - .long 0xe593600c // ldr r6, [r3, #12] - .long 0xe593b01c // ldr fp, [r3, #28] - .long 0xe0852107 // add r2, r5, r7, lsl #2 - .long 0xedd2ba00 // vldr s23, [r2] - .long 0xe0852101 // add r2, r5, r1, lsl #2 - .long 0xed92ba00 // vldr s22, [r2] - .long 0xee302b90 // vmov.32 r2, d16[1] - .long 0xe0854102 // add r4, r5, r2, lsl #2 - .long 0xedd4aa00 // vldr s21, [r4] - .long 0xee104b90 // vmov.32 r4, d16[0] - .long 0xe0855104 // add r5, r5, r4, lsl #2 - .long 0xed95aa00 // vldr s20, [r5] - .long 0xe08c5107 // add r5, ip, r7, lsl #2 - .long 0xedd57a00 // vldr s15, [r5] - .long 0xe08c5101 // add r5, ip, r1, lsl #2 - .long 0xed957a00 // vldr s14, [r5] - .long 0xe0865107 // add r5, r6, r7, lsl #2 - .long 0xedd5da00 // vldr s27, [r5] - .long 0xe0865101 // add r5, r6, r1, lsl #2 - .long 0xed95da00 // vldr s26, [r5] - .long 0xe0865102 // add r5, r6, r2, lsl #2 - .long 0xedd5ca00 // vldr s25, [r5] - .long 0xe0865104 // add r5, r6, r4, lsl #2 - .long 0xed95ca00 // vldr s24, [r5] - .long 0xe08b5107 // add r5, fp, r7, lsl #2 - .long 0xedd55a00 // vldr s11, [r5] - .long 0xe5935018 // ldr r5, [r3, #24] - .long 0xe5933014 // ldr r3, [r3, #20] - .long 0xe0856107 // add r6, r5, r7, lsl #2 - .long 0xe0858104 // add r8, r5, r4, lsl #2 - .long 0xe0859102 // add r9, r5, r2, lsl #2 - .long 0xedd63a00 // vldr s7, [r6] - .long 0xe0856101 // add r6, r5, r1, lsl #2 - .long 0xe08e5107 // add r5, lr, r7, lsl #2 - .long 0xed963a00 // vldr s6, [r6] - .long 0xe08a6101 // add r6, sl, r1, lsl #2 - .long 0xedd5fa00 // vldr s31, [r5] - .long 0xe08e5101 // add r5, lr, r1, lsl #2 - .long 0xedd92a00 // vldr s5, [r9] - .long 0xed95fa00 // vldr s30, [r5] - .long 0xe0835107 // add r5, r3, r7, lsl #2 - .long 0xed982a00 // vldr s4, [r8] - .long 0xedd59a00 // vldr s19, [r5] - .long 0xe0835101 // add r5, r3, r1, lsl #2 - .long 0xe08b1101 // add r1, fp, r1, lsl #2 - .long 0xed959a00 // vldr s18, [r5] - .long 0xe0835102 // add r5, r3, r2, lsl #2 - .long 0xe0833104 // add r3, r3, r4, lsl #2 - .long 0xed915a00 // vldr s10, [r1] - .long 0xedd58a00 // vldr s17, [r5] - .long 0xe08a5107 // add r5, sl, r7, lsl #2 - .long 0xe08e7104 // add r7, lr, r4, lsl #2 - .long 0xe08c1102 // add r1, ip, r2, lsl #2 - .long 0xedd51a00 // vldr s3, [r5] - .long 0xe08e5102 // add r5, lr, r2, lsl #2 - .long 0xed938a00 // vldr s16, [r3] - .long 0xe08c3104 // add r3, ip, r4, lsl #2 + .long 0x1afffff9 // bne 62b4 <sk_gradient_vfp4+0x3c> + .long 0xee314b90 // vmov.32 r4, d17[1] + .long 0xe5926010 // ldr r6, [r2, #16] + .long 0xee11cb90 // vmov.32 ip, d17[0] + .long 0xe592e020 // ldr lr, [r2, #32] + .long 0xe592700c // ldr r7, [r2, #12] + .long 0xe592901c // ldr r9, [r2, #28] + .long 0xe5928008 // ldr r8, [r2, #8] + .long 0xe592b004 // ldr fp, [r2, #4] + .long 0xe0863104 // add r3, r6, r4, lsl #2 + .long 0xedd3ba00 // vldr s23, [r3] + .long 0xe086310c // add r3, r6, ip, lsl #2 + .long 0xed93ba00 // vldr s22, [r3] + .long 0xee303b90 // vmov.32 r3, d16[1] + .long 0xe0865103 // add r5, r6, r3, lsl #2 + .long 0xedd5aa00 // vldr s21, [r5] + .long 0xee105b90 // vmov.32 r5, d16[0] + .long 0xe0866105 // add r6, r6, r5, lsl #2 + .long 0xed96aa00 // vldr s20, [r6] + .long 0xe08e6104 // add r6, lr, r4, lsl #2 + .long 0xedd67a00 // vldr s15, [r6] + .long 0xe08e610c // add r6, lr, ip, lsl #2 + .long 0xed967a00 // vldr s14, [r6] + .long 0xe0876104 // add r6, r7, r4, lsl #2 + .long 0xedd6da00 // vldr s27, [r6] + .long 0xe087610c // add r6, r7, ip, lsl #2 + .long 0xed96da00 // vldr s26, [r6] + .long 0xe0876103 // add r6, r7, r3, lsl #2 + .long 0xedd6ca00 // vldr s25, [r6] + .long 0xe0876105 // add r6, r7, r5, lsl #2 + .long 0xed96ca00 // vldr s24, [r6] + .long 0xe0896104 // add r6, r9, r4, lsl #2 + .long 0xedd65a00 // vldr s11, [r6] + .long 0xe5926018 // ldr r6, [r2, #24] + .long 0xe5922014 // ldr r2, [r2, #20] + .long 0xe0867104 // add r7, r6, r4, lsl #2 + .long 0xe086a103 // add sl, r6, r3, lsl #2 + .long 0xedd73a00 // vldr s7, [r7] + .long 0xe086710c // add r7, r6, ip, lsl #2 + .long 0xed973a00 // vldr s6, [r7] + .long 0xe0867105 // add r7, r6, r5, lsl #2 + .long 0xe0886104 // add r6, r8, r4, lsl #2 + .long 0xedda2a00 // vldr s5, [sl] + .long 0xedd6fa00 // vldr s31, [r6] + .long 0xe088610c // add r6, r8, ip, lsl #2 + .long 0xed972a00 // vldr s4, [r7] + .long 0xe089710c // add r7, r9, ip, lsl #2 + .long 0xed96fa00 // vldr s30, [r6] + .long 0xe0826104 // add r6, r2, r4, lsl #2 + .long 0xe08b4104 // add r4, fp, r4, lsl #2 + .long 0xed975a00 // vldr s10, [r7] + .long 0xedd69a00 // vldr s19, [r6] + .long 0xe082610c // add r6, r2, ip, lsl #2 + .long 0xedd41a00 // vldr s3, [r4] + .long 0xe0884103 // add r4, r8, r3, lsl #2 + .long 0xed969a00 // vldr s18, [r6] + .long 0xe0826103 // add r6, r2, r3, lsl #2 + .long 0xe0822105 // add r2, r2, r5, lsl #2 + .long 0xedd4ea00 // vldr s29, [r4] + .long 0xedd68a00 // vldr s17, [r6] + .long 0xe08b610c // add r6, fp, ip, lsl #2 + .long 0xe0894105 // add r4, r9, r5, lsl #2 .long 0xed961a00 // vldr s2, [r6] - .long 0xe08a6102 // add r6, sl, r2, lsl #2 - .long 0xedd5ea00 // vldr s29, [r5] - .long 0xe08b5104 // add r5, fp, r4, lsl #2 + .long 0xe08b6103 // add r6, fp, r3, lsl #2 + .long 0xed928a00 // vldr s16, [r2] + .long 0xe08e2105 // add r2, lr, r5, lsl #2 .long 0xedd60a00 // vldr s1, [r6] - .long 0xe08a6104 // add r6, sl, r4, lsl #2 - .long 0xed97ea00 // vldr s28, [r7] - .long 0xe08b7102 // add r7, fp, r2, lsl #2 + .long 0xe08b6105 // add r6, fp, r5, lsl #2 + .long 0xe0885105 // add r5, r8, r5, lsl #2 .long 0xed960a00 // vldr s0, [r6] - .long 0xedd16a00 // vldr s13, [r1] - .long 0xf2062cde // vfma.f32 q1, q11, q7 - .long 0xedd74a00 // vldr s9, [r7] + .long 0xed95ea00 // vldr s28, [r5] + .long 0xe0895103 // add r5, r9, r3, lsl #2 .long 0xf2068cd0 // vfma.f32 q4, q11, q0 - .long 0xe59d1004 // ldr r1, [sp, #4] - .long 0xed954a00 // vldr s8, [r5] - .long 0xed936a00 // vldr s12, [r3] + .long 0xe08e3103 // add r3, lr, r3, lsl #2 + .long 0xedd54a00 // vldr s9, [r5] + .long 0xedd36a00 // vldr s13, [r3] + .long 0xf2062cde // vfma.f32 q1, q11, q7 + .long 0xed944a00 // vldr s8, [r4] + .long 0xed926a00 // vldr s12, [r2] + .long 0xe5912004 // ldr r2, [r1, #4] .long 0xf2064cdc // vfma.f32 q2, q11, q6 - .long 0xe4912004 // ldr r2, [r1], #4 + .long 0xe2811008 // add r1, r1, #8 .long 0xf2066cda // vfma.f32 q3, q11, q5 .long 0xf2280158 // vorr q0, q4, q4 - .long 0xe28dd008 // add sp, sp, #8 .long 0xecbd8b10 // vpop {d8-d15} .long 0xe28dd004 // add sp, sp, #4 .long 0xe8bd4ff0 // pop {r4, r5, r6, r7, r8, r9, sl, fp, lr} @@ -7079,31 +7072,30 @@ FUNCTION(_sk_evenly_spaced_2_stop_gradient_vfp4) _sk_evenly_spaced_2_stop_gradient_vfp4: .long 0xe92d4010 // push {r4, lr} .long 0xe8911008 // ldm r1, {r3, ip} - .long 0xe3a0e014 // mov lr, #20 + .long 0xe3a0e01c // mov lr, #28 .long 0xe2811008 // add r1, r1, #8 - .long 0xe2832004 // add r2, r3, #4 + .long 0xe283200c // add r2, r3, #12 .long 0xe1a04003 // mov r4, r3 .long 0xf4e24cbf // vld1.32 {d20[]-d21[]}, [r2 :32] - .long 0xe283200c // add r2, r3, #12 - .long 0xf4e26cbf // vld1.32 {d22[]-d23[]}, [r2 :32] .long 0xe2832008 // add r2, r3, #8 + .long 0xf4e26cbf // vld1.32 {d22[]-d23[]}, [r2 :32] + .long 0xe2832004 // add r2, r3, #4 .long 0xf4e28cbf // vld1.32 {d24[]-d25[]}, [r2 :32] .long 0xe2832010 // add r2, r3, #16 .long 0xf4e42cbe // vld1.32 {d18[]-d19[]}, [r4 :32], lr .long 0xf4e20cbf // vld1.32 {d16[]-d17[]}, [r2 :32] - .long 0xe2832018 // add r2, r3, #24 + .long 0xe2832014 // add r2, r3, #20 .long 0xf2400c72 // vfma.f32 q8, q0, q9 + .long 0xf4a22cbf // vld1.32 {d2[]-d3[]}, [r2 :32] + .long 0xe2832018 // add r2, r3, #24 + .long 0xf2002c78 // vfma.f32 q1, q0, q12 .long 0xf4a24cbf // vld1.32 {d4[]-d5[]}, [r2 :32] - .long 0xe283201c // add r2, r3, #28 - .long 0xf2004c78 // vfma.f32 q2, q0, q12 - .long 0xf4a26cbf // vld1.32 {d6[]-d7[]}, [r2 :32] - .long 0xf2006c76 // vfma.f32 q3, q0, q11 - .long 0xf4a42cbf // vld1.32 {d2[]-d3[]}, [r4 :32] - .long 0xf2002c74 // vfma.f32 q1, q0, q10 + .long 0xf2004c76 // vfma.f32 q2, q0, q11 + .long 0xf4a46cbf // vld1.32 {d6[]-d7[]}, [r4 :32] + .long 0xf2006c74 // vfma.f32 q3, q0, q10 .long 0xf22001f0 // vorr q0, q8, q8 .long 0xe8bd4010 // pop {r4, lr} .long 0xe12fff1c // bx ip - .long 0xe320f000 // nop {0} HIDDEN _sk_xy_to_unit_angle_vfp4 .globl _sk_xy_to_unit_angle_vfp4 @@ -7815,13 +7807,11 @@ FUNCTION(_sk_clut_3D_vfp4) _sk_clut_3D_vfp4: .long 0xe92d4830 // push {r4, r5, fp, lr} .long 0xed2d8b10 // vpush {d8-d15} - .long 0xe24dd0b0 // sub sp, sp, #176 + .long 0xe24dd0a0 // sub sp, sp, #160 .long 0xe28de070 // add lr, sp, #112 - .long 0xe2812004 // add r2, r1, #4 - .long 0xe1a0c001 // mov ip, r1 .long 0xec8e6b04 // vstmia lr, {d6-d7} - .long 0xe58d20ac // str r2, [sp, #172] - .long 0xe49c2008 // ldr r2, [ip], #8 + .long 0xe8911004 // ldm r1, {r2, ip} + .long 0xe2811008 // add r1, r1, #8 .long 0xe8924008 // ldm r2, {r3, lr} .long 0xe5924008 // ldr r4, [r2, #8] .long 0xe592200c // ldr r2, [r2, #12] @@ -8131,7 +8121,7 @@ _sk_clut_3D_vfp4: .long 0xe0835105 // add r5, r3, r5, lsl #2 .long 0xedd55a00 // vldr s11, [r5] .long 0xee325b90 // vmov.32 r5, d18[1] - .long 0xea000004 // b 7308 <sk_clut_3D_vfp4+0x510> + .long 0xea000004 // b 72e0 <sk_clut_3D_vfp4+0x508> .long 0xe320f000 // nop {0} .long 0x3f7ff972 // .word 0x3f7ff972 .long 0x3f7ff972 // .word 0x3f7ff972 @@ -8299,8 +8289,6 @@ _sk_clut_3D_vfp4: .long 0xe28de090 // add lr, sp, #144 .long 0xed92ea00 // vldr s28, [r2] .long 0xf3fb2662 // vcvt.f32.s32 q9, q9 - .long 0xe5912004 // ldr r2, [r1, #4] - .long 0xe1a0100c // mov r1, ip .long 0xf26e0d44 // vsub.f32 q8, q7, q2 .long 0xf2004cf4 // vfma.f32 q2, q8, q10 .long 0xf2684d42 // vsub.f32 q10, q4, q1 @@ -8316,10 +8304,10 @@ _sk_clut_3D_vfp4: .long 0xf2020cf0 // vfma.f32 q0, q9, q8 .long 0xf206ccf0 // vfma.f32 q6, q11, q8 .long 0xf22c415c // vorr q2, q6, q6 - .long 0xe28dd0b0 // add sp, sp, #176 + .long 0xe28dd0a0 // add sp, sp, #160 .long 0xecbd8b10 // vpop {d8-d15} .long 0xe8bd4830 // pop {r4, r5, fp, lr} - .long 0xe12fff12 // bx r2 + .long 0xe12fff1c // bx ip .long 0xe320f000 // nop {0} HIDDEN _sk_clut_4D_vfp4 @@ -8329,11 +8317,9 @@ _sk_clut_4D_vfp4: .long 0xe92d41f0 // push {r4, r5, r6, r7, r8, lr} .long 0xed2d8b10 // vpush {d8-d15} .long 0xe24ddf6a // sub sp, sp, #424 - .long 0xe2812004 // add r2, r1, #4 - .long 0xe58d21a4 // str r2, [sp, #420] - .long 0xe1a0c001 // mov ip, r1 + .long 0xe8911004 // ldm r1, {r2, ip} .long 0xf2c0c052 // vmov.i32 q14, #2 - .long 0xe49c2008 // ldr r2, [ip], #8 + .long 0xe2811008 // add r1, r1, #8 .long 0xe8924008 // ldm r2, {r3, lr} .long 0xe592500c // ldr r5, [r2, #12] .long 0xe5924008 // ldr r4, [r2, #8] @@ -8652,7 +8638,7 @@ _sk_clut_4D_vfp4: .long 0xf2802051 // vmov.i32 q1, #1 .long 0xf22e29e0 // vmla.i32 q1, q15, q8 .long 0xedd20a00 // vldr s1, [r2] - .long 0xea000004 // b 7b18 <sk_clut_4D_vfp4+0x530> + .long 0xea000004 // b 7ae0 <sk_clut_4D_vfp4+0x528> .long 0xe320f000 // nop {0} .long 0x3f7ff972 // .word 0x3f7ff972 .long 0x3f7ff972 // .word 0x3f7ff972 @@ -9357,12 +9343,10 @@ _sk_clut_4D_vfp4: .long 0xe28de0e0 // add lr, sp, #224 .long 0xf2600de2 // vsub.f32 q8, q8, q9 .long 0xecde8b04 // vldmia lr, {d24-d25} - .long 0xe28f203c // add r2, pc, #60 + .long 0xe28f2034 // add r2, pc, #52 .long 0xf26c4d6a // vsub.f32 q10, q6, q13 .long 0xf4226acf // vld1.64 {d6-d7}, [r2] .long 0xf2642d40 // vsub.f32 q9, q2, q0 - .long 0xe5912004 // ldr r2, [r1, #4] - .long 0xe1a0100c // mov r1, ip .long 0xf26a6d68 // vsub.f32 q11, q5, q12 .long 0xf244acf0 // vfma.f32 q13, q10, q8 .long 0xf2020cf0 // vfma.f32 q0, q9, q8 @@ -9372,7 +9356,7 @@ _sk_clut_4D_vfp4: .long 0xe28ddf6a // add sp, sp, #424 .long 0xecbd8b10 // vpop {d8-d15} .long 0xe8bd41f0 // pop {r4, r5, r6, r7, r8, lr} - .long 0xe12fff12 // bx r2 + .long 0xe12fff1c // bx ip .long 0xe320f000 // nop {0} .long 0x3f800000 // .word 0x3f800000 .long 0x3f800000 // .word 0x3f800000 @@ -54257,11 +54241,11 @@ _sk_seed_shader_sse2: .byte 102,15,110,2 // movd (%edx),%xmm0 .byte 102,15,112,192,0 // pshufd $0x0,%xmm0,%xmm0 .byte 15,91,192 // cvtdq2ps %xmm0,%xmm0 - .byte 15,88,128,247,203,0,0 // addps 0xcbf7(%eax),%xmm0 + .byte 15,88,128,215,203,0,0 // addps 0xcbd7(%eax),%xmm0 .byte 102,15,110,74,4 // movd 0x4(%edx),%xmm1 .byte 102,15,112,201,0 // pshufd $0x0,%xmm1,%xmm1 .byte 15,91,201 // cvtdq2ps %xmm1,%xmm1 - .byte 15,88,136,7,204,0,0 // addps 0xcc07(%eax),%xmm1 + .byte 15,88,136,231,203,0,0 // addps 0xcbe7(%eax),%xmm1 .byte 141,113,4 // lea 0x4(%ecx),%esi .byte 15,87,210 // xorps %xmm2,%xmm2 .byte 15,41,82,64 // movaps %xmm2,0x40(%edx) @@ -54269,7 +54253,7 @@ _sk_seed_shader_sse2: .byte 15,41,82,32 // movaps %xmm2,0x20(%edx) .byte 15,41,82,16 // movaps %xmm2,0x10(%edx) .byte 131,236,8 // sub $0x8,%esp - .byte 15,40,144,23,204,0,0 // movaps 0xcc17(%eax),%xmm2 + .byte 15,40,144,247,203,0,0 // movaps 0xcbf7(%eax),%xmm2 .byte 15,87,219 // xorps %xmm3,%xmm3 .byte 86 // push %esi .byte 82 // push %edx @@ -54296,15 +54280,15 @@ _sk_dither_sse2: .byte 139,69,8 // mov 0x8(%ebp),%eax .byte 102,15,110,32 // movd (%eax),%xmm4 .byte 102,15,112,228,0 // pshufd $0x0,%xmm4,%xmm4 - .byte 102,15,254,161,178,203,0,0 // paddd 0xcbb2(%ecx),%xmm4 + .byte 102,15,254,161,146,203,0,0 // paddd 0xcb92(%ecx),%xmm4 .byte 102,15,110,104,4 // movd 0x4(%eax),%xmm5 .byte 102,15,112,253,0 // pshufd $0x0,%xmm5,%xmm7 .byte 102,15,239,252 // pxor %xmm4,%xmm7 - .byte 102,15,111,177,194,203,0,0 // movdqa 0xcbc2(%ecx),%xmm6 + .byte 102,15,111,177,162,203,0,0 // movdqa 0xcba2(%ecx),%xmm6 .byte 102,15,111,207 // movdqa %xmm7,%xmm1 .byte 102,15,219,206 // pand %xmm6,%xmm1 .byte 102,15,114,241,5 // pslld $0x5,%xmm1 - .byte 102,15,111,129,226,203,0,0 // movdqa 0xcbe2(%ecx),%xmm0 + .byte 102,15,111,129,194,203,0,0 // movdqa 0xcbc2(%ecx),%xmm0 .byte 102,15,111,239 // movdqa %xmm7,%xmm5 .byte 102,15,219,232 // pand %xmm0,%xmm5 .byte 102,15,114,245,2 // pslld $0x2,%xmm5 @@ -54314,7 +54298,7 @@ _sk_dither_sse2: .byte 102,15,219,196 // pand %xmm4,%xmm0 .byte 102,15,254,192 // paddd %xmm0,%xmm0 .byte 102,15,235,198 // por %xmm6,%xmm0 - .byte 102,15,111,137,210,203,0,0 // movdqa 0xcbd2(%ecx),%xmm1 + .byte 102,15,111,137,178,203,0,0 // movdqa 0xcbb2(%ecx),%xmm1 .byte 102,15,219,249 // pand %xmm1,%xmm7 .byte 102,15,219,225 // pand %xmm1,%xmm4 .byte 102,15,114,212,2 // psrld $0x2,%xmm4 @@ -54325,8 +54309,8 @@ _sk_dither_sse2: .byte 102,15,114,215,1 // psrld $0x1,%xmm7 .byte 102,15,235,231 // por %xmm7,%xmm4 .byte 15,91,196 // cvtdq2ps %xmm4,%xmm0 - .byte 15,89,129,242,203,0,0 // mulps 0xcbf2(%ecx),%xmm0 - .byte 15,88,129,2,204,0,0 // addps 0xcc02(%ecx),%xmm0 + .byte 15,89,129,210,203,0,0 // mulps 0xcbd2(%ecx),%xmm0 + .byte 15,88,129,226,203,0,0 // addps 0xcbe2(%ecx),%xmm0 .byte 243,15,16,14 // movss (%esi),%xmm1 .byte 15,198,201,0 // shufps $0x0,%xmm1,%xmm1 .byte 15,89,200 // mulps %xmm0,%xmm1 @@ -54394,7 +54378,7 @@ _sk_black_color_sse2: .byte 139,77,12 // mov 0xc(%ebp),%ecx .byte 141,81,4 // lea 0x4(%ecx),%edx .byte 131,236,8 // sub $0x8,%esp - .byte 15,40,152,102,202,0,0 // movaps 0xca66(%eax),%xmm3 + .byte 15,40,152,70,202,0,0 // movaps 0xca46(%eax),%xmm3 .byte 15,87,192 // xorps %xmm0,%xmm0 .byte 15,87,201 // xorps %xmm1,%xmm1 .byte 15,87,210 // xorps %xmm2,%xmm2 @@ -54417,7 +54401,7 @@ _sk_white_color_sse2: .byte 139,77,12 // mov 0xc(%ebp),%ecx .byte 141,81,4 // lea 0x4(%ecx),%edx .byte 131,236,8 // sub $0x8,%esp - .byte 15,40,128,54,202,0,0 // movaps 0xca36(%eax),%xmm0 + .byte 15,40,128,22,202,0,0 // movaps 0xca16(%eax),%xmm0 .byte 15,40,200 // movaps %xmm0,%xmm1 .byte 15,40,208 // movaps %xmm0,%xmm2 .byte 15,40,216 // movaps %xmm0,%xmm3 @@ -54507,7 +54491,7 @@ _sk_srcatop_sse2: .byte 139,77,8 // mov 0x8(%ebp),%ecx .byte 15,40,97,64 // movaps 0x40(%ecx),%xmm4 .byte 15,89,196 // mulps %xmm4,%xmm0 - .byte 15,40,170,135,201,0,0 // movaps 0xc987(%edx),%xmm5 + .byte 15,40,170,103,201,0,0 // movaps 0xc967(%edx),%xmm5 .byte 15,92,235 // subps %xmm3,%xmm5 .byte 15,40,113,16 // movaps 0x10(%ecx),%xmm6 .byte 15,89,245 // mulps %xmm5,%xmm6 @@ -54546,7 +54530,7 @@ _sk_dstatop_sse2: .byte 15,40,105,64 // movaps 0x40(%ecx),%xmm5 .byte 15,40,113,16 // movaps 0x10(%ecx),%xmm6 .byte 15,89,243 // mulps %xmm3,%xmm6 - .byte 15,40,162,40,201,0,0 // movaps 0xc928(%edx),%xmm4 + .byte 15,40,162,8,201,0,0 // movaps 0xc908(%edx),%xmm4 .byte 15,92,229 // subps %xmm5,%xmm4 .byte 15,89,196 // mulps %xmm4,%xmm0 .byte 15,88,198 // addps %xmm6,%xmm0 @@ -54630,7 +54614,7 @@ _sk_srcout_sse2: .byte 88 // pop %eax .byte 139,77,12 // mov 0xc(%ebp),%ecx .byte 139,85,8 // mov 0x8(%ebp),%edx - .byte 15,40,160,103,200,0,0 // movaps 0xc867(%eax),%xmm4 + .byte 15,40,160,71,200,0,0 // movaps 0xc847(%eax),%xmm4 .byte 15,92,98,64 // subps 0x40(%edx),%xmm4 .byte 15,89,196 // mulps %xmm4,%xmm0 .byte 15,89,204 // mulps %xmm4,%xmm1 @@ -54656,7 +54640,7 @@ _sk_dstout_sse2: .byte 88 // pop %eax .byte 139,77,12 // mov 0xc(%ebp),%ecx .byte 139,85,8 // mov 0x8(%ebp),%edx - .byte 15,40,160,47,200,0,0 // movaps 0xc82f(%eax),%xmm4 + .byte 15,40,160,15,200,0,0 // movaps 0xc80f(%eax),%xmm4 .byte 15,92,227 // subps %xmm3,%xmm4 .byte 15,40,66,16 // movaps 0x10(%edx),%xmm0 .byte 15,89,196 // mulps %xmm4,%xmm0 @@ -54686,7 +54670,7 @@ _sk_srcover_sse2: .byte 88 // pop %eax .byte 139,77,12 // mov 0xc(%ebp),%ecx .byte 139,85,8 // mov 0x8(%ebp),%edx - .byte 15,40,160,232,199,0,0 // movaps 0xc7e8(%eax),%xmm4 + .byte 15,40,160,200,199,0,0 // movaps 0xc7c8(%eax),%xmm4 .byte 15,92,227 // subps %xmm3,%xmm4 .byte 15,40,106,16 // movaps 0x10(%edx),%xmm5 .byte 15,89,236 // mulps %xmm4,%xmm5 @@ -54720,7 +54704,7 @@ _sk_dstover_sse2: .byte 139,77,12 // mov 0xc(%ebp),%ecx .byte 139,85,8 // mov 0x8(%ebp),%edx .byte 15,40,106,64 // movaps 0x40(%edx),%xmm5 - .byte 15,40,160,152,199,0,0 // movaps 0xc798(%eax),%xmm4 + .byte 15,40,160,120,199,0,0 // movaps 0xc778(%eax),%xmm4 .byte 15,92,229 // subps %xmm5,%xmm4 .byte 15,89,196 // mulps %xmm4,%xmm0 .byte 15,88,66,16 // addps 0x10(%edx),%xmm0 @@ -54776,7 +54760,7 @@ _sk_multiply_sse2: .byte 139,69,8 // mov 0x8(%ebp),%eax .byte 15,40,80,64 // movaps 0x40(%eax),%xmm2 .byte 15,41,85,200 // movaps %xmm2,-0x38(%ebp) - .byte 15,40,129,25,199,0,0 // movaps 0xc719(%ecx),%xmm0 + .byte 15,40,129,249,198,0,0 // movaps 0xc6f9(%ecx),%xmm0 .byte 15,40,240 // movaps %xmm0,%xmm6 .byte 15,92,242 // subps %xmm2,%xmm6 .byte 15,40,254 // movaps %xmm6,%xmm7 @@ -54836,7 +54820,7 @@ _sk_plus__sse2: .byte 139,77,12 // mov 0xc(%ebp),%ecx .byte 139,85,8 // mov 0x8(%ebp),%edx .byte 15,88,66,16 // addps 0x10(%edx),%xmm0 - .byte 15,40,160,115,198,0,0 // movaps 0xc673(%eax),%xmm4 + .byte 15,40,160,83,198,0,0 // movaps 0xc653(%eax),%xmm4 .byte 15,93,196 // minps %xmm4,%xmm0 .byte 15,88,74,32 // addps 0x20(%edx),%xmm1 .byte 15,93,204 // minps %xmm4,%xmm1 @@ -54908,7 +54892,7 @@ _sk_xor__sse2: .byte 139,69,12 // mov 0xc(%ebp),%eax .byte 139,77,8 // mov 0x8(%ebp),%ecx .byte 15,40,105,64 // movaps 0x40(%ecx),%xmm5 - .byte 15,40,154,197,197,0,0 // movaps 0xc5c5(%edx),%xmm3 + .byte 15,40,154,165,197,0,0 // movaps 0xc5a5(%edx),%xmm3 .byte 15,40,243 // movaps %xmm3,%xmm6 .byte 15,92,245 // subps %xmm5,%xmm6 .byte 15,89,198 // mulps %xmm6,%xmm0 @@ -54970,7 +54954,7 @@ _sk_darken_sse2: .byte 15,89,203 // mulps %xmm3,%xmm1 .byte 15,95,209 // maxps %xmm1,%xmm2 .byte 15,92,234 // subps %xmm2,%xmm5 - .byte 15,40,138,93,197,0,0 // movaps 0xc55d(%edx),%xmm1 + .byte 15,40,138,61,197,0,0 // movaps 0xc53d(%edx),%xmm1 .byte 15,92,203 // subps %xmm3,%xmm1 .byte 15,89,206 // mulps %xmm6,%xmm1 .byte 15,88,217 // addps %xmm1,%xmm3 @@ -55019,7 +55003,7 @@ _sk_lighten_sse2: .byte 15,89,203 // mulps %xmm3,%xmm1 .byte 15,93,209 // minps %xmm1,%xmm2 .byte 15,92,234 // subps %xmm2,%xmm5 - .byte 15,40,138,221,196,0,0 // movaps 0xc4dd(%edx),%xmm1 + .byte 15,40,138,189,196,0,0 // movaps 0xc4bd(%edx),%xmm1 .byte 15,92,203 // subps %xmm3,%xmm1 .byte 15,89,206 // mulps %xmm6,%xmm1 .byte 15,88,217 // addps %xmm1,%xmm3 @@ -55072,7 +55056,7 @@ _sk_difference_sse2: .byte 15,93,214 // minps %xmm6,%xmm2 .byte 15,88,210 // addps %xmm2,%xmm2 .byte 15,92,226 // subps %xmm2,%xmm4 - .byte 15,40,146,90,196,0,0 // movaps 0xc45a(%edx),%xmm2 + .byte 15,40,146,58,196,0,0 // movaps 0xc43a(%edx),%xmm2 .byte 15,92,211 // subps %xmm3,%xmm2 .byte 15,89,213 // mulps %xmm5,%xmm2 .byte 15,88,218 // addps %xmm2,%xmm3 @@ -55116,7 +55100,7 @@ _sk_exclusion_sse2: .byte 15,89,202 // mulps %xmm2,%xmm1 .byte 15,88,201 // addps %xmm1,%xmm1 .byte 15,92,233 // subps %xmm1,%xmm5 - .byte 15,40,138,212,195,0,0 // movaps 0xc3d4(%edx),%xmm1 + .byte 15,40,138,180,195,0,0 // movaps 0xc3b4(%edx),%xmm1 .byte 15,92,203 // subps %xmm3,%xmm1 .byte 15,89,73,64 // mulps 0x40(%ecx),%xmm1 .byte 15,88,217 // addps %xmm1,%xmm3 @@ -55157,7 +55141,7 @@ _sk_colorburn_sse2: .byte 15,93,198 // minps %xmm6,%xmm0 .byte 15,40,233 // movaps %xmm1,%xmm5 .byte 15,92,232 // subps %xmm0,%xmm5 - .byte 15,40,177,85,195,0,0 // movaps 0xc355(%ecx),%xmm6 + .byte 15,40,177,53,195,0,0 // movaps 0xc335(%ecx),%xmm6 .byte 15,40,198 // movaps %xmm6,%xmm0 .byte 15,92,193 // subps %xmm1,%xmm0 .byte 15,41,69,200 // movaps %xmm0,-0x38(%ebp) @@ -55274,7 +55258,7 @@ _sk_colordodge_sse2: .byte 89 // pop %ecx .byte 139,69,8 // mov 0x8(%ebp),%eax .byte 15,40,72,16 // movaps 0x10(%eax),%xmm1 - .byte 15,40,145,204,193,0,0 // movaps 0xc1cc(%ecx),%xmm2 + .byte 15,40,145,172,193,0,0 // movaps 0xc1ac(%ecx),%xmm2 .byte 15,40,226 // movaps %xmm2,%xmm4 .byte 15,92,214 // subps %xmm6,%xmm2 .byte 15,40,250 // movaps %xmm2,%xmm7 @@ -55391,7 +55375,7 @@ _sk_hardlight_sse2: .byte 89 // pop %ecx .byte 139,69,8 // mov 0x8(%ebp),%eax .byte 15,40,72,64 // movaps 0x40(%eax),%xmm1 - .byte 15,40,145,107,192,0,0 // movaps 0xc06b(%ecx),%xmm2 + .byte 15,40,145,75,192,0,0 // movaps 0xc04b(%ecx),%xmm2 .byte 15,40,234 // movaps %xmm2,%xmm5 .byte 15,92,233 // subps %xmm1,%xmm5 .byte 15,40,225 // movaps %xmm1,%xmm4 @@ -55501,7 +55485,7 @@ _sk_overlay_sse2: .byte 89 // pop %ecx .byte 139,69,8 // mov 0x8(%ebp),%eax .byte 15,40,80,64 // movaps 0x40(%eax),%xmm2 - .byte 15,40,161,32,191,0,0 // movaps 0xbf20(%ecx),%xmm4 + .byte 15,40,161,0,191,0,0 // movaps 0xbf00(%ecx),%xmm4 .byte 15,40,244 // movaps %xmm4,%xmm6 .byte 15,92,242 // subps %xmm2,%xmm6 .byte 15,40,206 // movaps %xmm6,%xmm1 @@ -55629,17 +55613,17 @@ _sk_softlight_sse2: .byte 232,0,0,0,0 // call f50 <_sk_softlight_sse2+0x52> .byte 89 // pop %ecx .byte 15,40,194 // movaps %xmm2,%xmm0 - .byte 15,40,137,0,190,0,0 // movaps 0xbe00(%ecx),%xmm1 + .byte 15,40,137,224,189,0,0 // movaps 0xbde0(%ecx),%xmm1 .byte 15,41,141,104,255,255,255 // movaps %xmm1,-0x98(%ebp) .byte 15,88,193 // addps %xmm1,%xmm0 .byte 15,89,198 // mulps %xmm6,%xmm0 - .byte 15,40,185,144,189,0,0 // movaps 0xbd90(%ecx),%xmm7 + .byte 15,40,185,112,189,0,0 // movaps 0xbd70(%ecx),%xmm7 .byte 15,41,125,232 // movaps %xmm7,-0x18(%ebp) .byte 15,92,250 // subps %xmm2,%xmm7 .byte 15,82,242 // rsqrtps %xmm2,%xmm6 .byte 15,83,206 // rcpps %xmm6,%xmm1 .byte 15,92,202 // subps %xmm2,%xmm1 - .byte 15,40,161,16,190,0,0 // movaps 0xbe10(%ecx),%xmm4 + .byte 15,40,161,240,189,0,0 // movaps 0xbdf0(%ecx),%xmm4 .byte 15,41,101,152 // movaps %xmm4,-0x68(%ebp) .byte 15,89,212 // mulps %xmm4,%xmm2 .byte 15,88,208 // addps %xmm0,%xmm2 @@ -55845,7 +55829,7 @@ _sk_hue_sse2: .byte 15,40,226 // movaps %xmm2,%xmm4 .byte 15,40,72,64 // movaps 0x40(%eax),%xmm1 .byte 15,41,77,216 // movaps %xmm1,-0x28(%ebp) - .byte 15,40,169,207,186,0,0 // movaps 0xbacf(%ecx),%xmm5 + .byte 15,40,169,175,186,0,0 // movaps 0xbaaf(%ecx),%xmm5 .byte 15,92,233 // subps %xmm1,%xmm5 .byte 15,89,197 // mulps %xmm5,%xmm0 .byte 15,41,133,72,255,255,255 // movaps %xmm0,-0xb8(%ebp) @@ -55878,17 +55862,17 @@ _sk_hue_sse2: .byte 15,89,233 // mulps %xmm1,%xmm5 .byte 15,41,173,120,255,255,255 // movaps %xmm5,-0x88(%ebp) .byte 15,89,193 // mulps %xmm1,%xmm0 - .byte 15,40,153,95,187,0,0 // movaps 0xbb5f(%ecx),%xmm3 + .byte 15,40,153,63,187,0,0 // movaps 0xbb3f(%ecx),%xmm3 .byte 15,41,93,232 // movaps %xmm3,-0x18(%ebp) .byte 15,40,117,152 // movaps -0x68(%ebp),%xmm6 .byte 15,40,206 // movaps %xmm6,%xmm1 .byte 15,89,203 // mulps %xmm3,%xmm1 - .byte 15,40,153,111,187,0,0 // movaps 0xbb6f(%ecx),%xmm3 + .byte 15,40,153,79,187,0,0 // movaps 0xbb4f(%ecx),%xmm3 .byte 15,40,109,136 // movaps -0x78(%ebp),%xmm5 .byte 15,40,253 // movaps %xmm5,%xmm7 .byte 15,89,251 // mulps %xmm3,%xmm7 .byte 15,88,249 // addps %xmm1,%xmm7 - .byte 15,40,137,207,186,0,0 // movaps 0xbacf(%ecx),%xmm1 + .byte 15,40,137,175,186,0,0 // movaps 0xbaaf(%ecx),%xmm1 .byte 15,92,77,184 // subps -0x48(%ebp),%xmm1 .byte 15,89,241 // mulps %xmm1,%xmm6 .byte 15,41,117,152 // movaps %xmm6,-0x68(%ebp) @@ -55898,7 +55882,7 @@ _sk_hue_sse2: .byte 15,40,77,200 // movaps -0x38(%ebp),%xmm1 .byte 15,89,241 // mulps %xmm1,%xmm6 .byte 15,41,117,168 // movaps %xmm6,-0x58(%ebp) - .byte 15,40,169,127,187,0,0 // movaps 0xbb7f(%ecx),%xmm5 + .byte 15,40,169,95,187,0,0 // movaps 0xbb5f(%ecx),%xmm5 .byte 15,89,205 // mulps %xmm5,%xmm1 .byte 15,88,207 // addps %xmm7,%xmm1 .byte 15,94,212 // divps %xmm4,%xmm2 @@ -56091,17 +56075,17 @@ _sk_saturation_sse2: .byte 15,89,253 // mulps %xmm5,%xmm7 .byte 232,0,0,0,0 // call 1565 <_sk_saturation_sse2+0xb0> .byte 89 // pop %ecx - .byte 15,40,153,11,184,0,0 // movaps 0xb80b(%ecx),%xmm3 + .byte 15,40,153,235,183,0,0 // movaps 0xb7eb(%ecx),%xmm3 .byte 15,41,157,88,255,255,255 // movaps %xmm3,-0xa8(%ebp) .byte 15,40,77,184 // movaps -0x48(%ebp),%xmm1 .byte 15,40,193 // movaps %xmm1,%xmm0 .byte 15,89,195 // mulps %xmm3,%xmm0 - .byte 15,40,153,27,184,0,0 // movaps 0xb81b(%ecx),%xmm3 + .byte 15,40,153,251,183,0,0 // movaps 0xb7fb(%ecx),%xmm3 .byte 15,41,93,232 // movaps %xmm3,-0x18(%ebp) .byte 15,40,238 // movaps %xmm6,%xmm5 .byte 15,89,235 // mulps %xmm3,%xmm5 .byte 15,88,232 // addps %xmm0,%xmm5 - .byte 15,40,129,123,183,0,0 // movaps 0xb77b(%ecx),%xmm0 + .byte 15,40,129,91,183,0,0 // movaps 0xb75b(%ecx),%xmm0 .byte 15,41,133,104,255,255,255 // movaps %xmm0,-0x98(%ebp) .byte 15,92,69,216 // subps -0x28(%ebp),%xmm0 .byte 15,89,200 // mulps %xmm0,%xmm1 @@ -56113,7 +56097,7 @@ _sk_saturation_sse2: .byte 15,89,200 // mulps %xmm0,%xmm1 .byte 15,41,141,120,255,255,255 // movaps %xmm1,-0x88(%ebp) .byte 15,40,200 // movaps %xmm0,%xmm1 - .byte 15,40,129,43,184,0,0 // movaps 0xb82b(%ecx),%xmm0 + .byte 15,40,129,11,184,0,0 // movaps 0xb80b(%ecx),%xmm0 .byte 15,89,200 // mulps %xmm0,%xmm1 .byte 15,88,205 // addps %xmm5,%xmm1 .byte 15,40,109,168 // movaps -0x58(%ebp),%xmm5 @@ -56272,16 +56256,16 @@ _sk_color_sse2: .byte 139,69,8 // mov 0x8(%ebp),%eax .byte 15,40,80,16 // movaps 0x10(%eax),%xmm2 .byte 15,40,72,32 // movaps 0x20(%eax),%xmm1 - .byte 15,40,177,176,181,0,0 // movaps 0xb5b0(%ecx),%xmm6 + .byte 15,40,177,144,181,0,0 // movaps 0xb590(%ecx),%xmm6 .byte 15,41,117,216 // movaps %xmm6,-0x28(%ebp) .byte 15,40,194 // movaps %xmm2,%xmm0 .byte 15,89,198 // mulps %xmm6,%xmm0 - .byte 15,40,153,192,181,0,0 // movaps 0xb5c0(%ecx),%xmm3 + .byte 15,40,153,160,181,0,0 // movaps 0xb5a0(%ecx),%xmm3 .byte 15,41,93,184 // movaps %xmm3,-0x48(%ebp) .byte 15,40,241 // movaps %xmm1,%xmm6 .byte 15,89,243 // mulps %xmm3,%xmm6 .byte 15,88,240 // addps %xmm0,%xmm6 - .byte 15,40,129,32,181,0,0 // movaps 0xb520(%ecx),%xmm0 + .byte 15,40,129,0,181,0,0 // movaps 0xb500(%ecx),%xmm0 .byte 15,41,69,168 // movaps %xmm0,-0x58(%ebp) .byte 15,92,69,200 // subps -0x38(%ebp),%xmm0 .byte 15,89,208 // mulps %xmm0,%xmm2 @@ -56291,7 +56275,7 @@ _sk_color_sse2: .byte 15,40,80,48 // movaps 0x30(%eax),%xmm2 .byte 15,89,194 // mulps %xmm2,%xmm0 .byte 15,41,133,72,255,255,255 // movaps %xmm0,-0xb8(%ebp) - .byte 15,40,137,208,181,0,0 // movaps 0xb5d0(%ecx),%xmm1 + .byte 15,40,137,176,181,0,0 // movaps 0xb5b0(%ecx),%xmm1 .byte 15,89,209 // mulps %xmm1,%xmm2 .byte 15,88,214 // addps %xmm6,%xmm2 .byte 15,40,88,64 // movaps 0x40(%eax),%xmm3 @@ -56450,18 +56434,18 @@ _sk_luminosity_sse2: .byte 232,0,0,0,0 // call 1a23 <_sk_luminosity_sse2+0x11> .byte 89 // pop %ecx .byte 139,69,8 // mov 0x8(%ebp),%eax - .byte 15,40,161,77,179,0,0 // movaps 0xb34d(%ecx),%xmm4 + .byte 15,40,161,45,179,0,0 // movaps 0xb32d(%ecx),%xmm4 .byte 15,41,101,232 // movaps %xmm4,-0x18(%ebp) .byte 15,40,208 // movaps %xmm0,%xmm2 .byte 15,89,212 // mulps %xmm4,%xmm2 - .byte 15,40,161,93,179,0,0 // movaps 0xb35d(%ecx),%xmm4 + .byte 15,40,161,61,179,0,0 // movaps 0xb33d(%ecx),%xmm4 .byte 15,41,101,216 // movaps %xmm4,-0x28(%ebp) .byte 15,40,233 // movaps %xmm1,%xmm5 .byte 15,89,236 // mulps %xmm4,%xmm5 .byte 15,88,234 // addps %xmm2,%xmm5 .byte 15,40,80,64 // movaps 0x40(%eax),%xmm2 .byte 15,41,85,184 // movaps %xmm2,-0x48(%ebp) - .byte 15,40,161,189,178,0,0 // movaps 0xb2bd(%ecx),%xmm4 + .byte 15,40,161,157,178,0,0 // movaps 0xb29d(%ecx),%xmm4 .byte 15,40,252 // movaps %xmm4,%xmm7 .byte 15,92,250 // subps %xmm2,%xmm7 .byte 15,89,199 // mulps %xmm7,%xmm0 @@ -56471,7 +56455,7 @@ _sk_luminosity_sse2: .byte 15,89,254 // mulps %xmm6,%xmm7 .byte 15,41,189,104,255,255,255 // movaps %xmm7,-0x98(%ebp) .byte 15,40,214 // movaps %xmm6,%xmm2 - .byte 15,40,137,109,179,0,0 // movaps 0xb36d(%ecx),%xmm1 + .byte 15,40,137,77,179,0,0 // movaps 0xb34d(%ecx),%xmm1 .byte 15,89,209 // mulps %xmm1,%xmm2 .byte 15,88,213 // addps %xmm5,%xmm2 .byte 15,40,104,16 // movaps 0x10(%eax),%xmm5 @@ -56647,7 +56631,7 @@ _sk_srcover_rgba_8888_sse2: .byte 139,49 // mov (%ecx),%esi .byte 15,133,224,0,0,0 // jne 1d90 <_sk_srcover_rgba_8888_sse2+0x119> .byte 243,15,111,20,178 // movdqu (%edx,%esi,4),%xmm2 - .byte 102,15,111,167,18,177,0,0 // movdqa 0xb112(%edi),%xmm4 + .byte 102,15,111,167,242,176,0,0 // movdqa 0xb0f2(%edi),%xmm4 .byte 102,15,111,234 // movdqa %xmm2,%xmm5 .byte 102,15,219,236 // pand %xmm4,%xmm5 .byte 102,15,111,242 // movdqa %xmm2,%xmm6 @@ -56658,9 +56642,9 @@ _sk_srcover_rgba_8888_sse2: .byte 102,15,219,252 // pand %xmm4,%xmm7 .byte 15,91,229 // cvtdq2ps %xmm5,%xmm4 .byte 15,41,97,16 // movaps %xmm4,0x10(%ecx) - .byte 15,40,175,82,176,0,0 // movaps 0xb052(%edi),%xmm5 + .byte 15,40,175,50,176,0,0 // movaps 0xb032(%edi),%xmm5 .byte 15,92,235 // subps %xmm3,%xmm5 - .byte 15,40,143,34,177,0,0 // movaps 0xb122(%edi),%xmm1 + .byte 15,40,143,2,177,0,0 // movaps 0xb102(%edi),%xmm1 .byte 15,89,193 // mulps %xmm1,%xmm0 .byte 15,89,229 // mulps %xmm5,%xmm4 .byte 15,88,224 // addps %xmm0,%xmm4 @@ -56774,7 +56758,7 @@ _sk_clamp_1_sse2: .byte 232,0,0,0,0 // call 1e3a <_sk_clamp_1_sse2+0xb> .byte 88 // pop %eax .byte 139,77,12 // mov 0xc(%ebp),%ecx - .byte 15,40,160,166,174,0,0 // movaps 0xaea6(%eax),%xmm4 + .byte 15,40,160,134,174,0,0 // movaps 0xae86(%eax),%xmm4 .byte 15,93,196 // minps %xmm4,%xmm0 .byte 15,93,204 // minps %xmm4,%xmm1 .byte 15,93,212 // minps %xmm4,%xmm2 @@ -56798,7 +56782,7 @@ _sk_clamp_a_sse2: .byte 232,0,0,0,0 // call 1e6d <_sk_clamp_a_sse2+0xb> .byte 88 // pop %eax .byte 139,77,12 // mov 0xc(%ebp),%ecx - .byte 15,93,152,115,174,0,0 // minps 0xae73(%eax),%xmm3 + .byte 15,93,152,83,174,0,0 // minps 0xae53(%eax),%xmm3 .byte 15,93,195 // minps %xmm3,%xmm0 .byte 15,93,203 // minps %xmm3,%xmm1 .byte 15,93,211 // minps %xmm3,%xmm2 @@ -56823,7 +56807,7 @@ _sk_clamp_a_dst_sse2: .byte 139,77,12 // mov 0xc(%ebp),%ecx .byte 139,85,8 // mov 0x8(%ebp),%edx .byte 15,40,98,64 // movaps 0x40(%edx),%xmm4 - .byte 15,93,160,67,174,0,0 // minps 0xae43(%eax),%xmm4 + .byte 15,93,160,35,174,0,0 // minps 0xae23(%eax),%xmm4 .byte 15,41,98,64 // movaps %xmm4,0x40(%edx) .byte 15,40,106,16 // movaps 0x10(%edx),%xmm5 .byte 15,40,114,32 // movaps 0x20(%edx),%xmm6 @@ -56897,7 +56881,7 @@ _sk_invert_sse2: .byte 232,0,0,0,0 // call 1f48 <_sk_invert_sse2+0xb> .byte 88 // pop %eax .byte 139,77,12 // mov 0xc(%ebp),%ecx - .byte 15,40,160,152,173,0,0 // movaps 0xad98(%eax),%xmm4 + .byte 15,40,160,120,173,0,0 // movaps 0xad78(%eax),%xmm4 .byte 15,40,236 // movaps %xmm4,%xmm5 .byte 15,92,232 // subps %xmm0,%xmm5 .byte 15,40,244 // movaps %xmm4,%xmm6 @@ -57020,7 +57004,7 @@ _sk_unpremul_sse2: .byte 88 // pop %eax .byte 139,77,12 // mov 0xc(%ebp),%ecx .byte 15,87,228 // xorps %xmm4,%xmm4 - .byte 15,40,168,154,172,0,0 // movaps 0xac9a(%eax),%xmm5 + .byte 15,40,168,122,172,0,0 // movaps 0xac7a(%eax),%xmm5 .byte 15,94,235 // divps %xmm3,%xmm5 .byte 15,194,227,4 // cmpneqps %xmm3,%xmm4 .byte 15,84,229 // andps %xmm5,%xmm4 @@ -57051,19 +57035,19 @@ _sk_from_srgb_sse2: .byte 88 // pop %eax .byte 15,40,202 // movaps %xmm2,%xmm1 .byte 15,89,201 // mulps %xmm1,%xmm1 - .byte 15,40,160,224,172,0,0 // movaps 0xace0(%eax),%xmm4 + .byte 15,40,160,192,172,0,0 // movaps 0xacc0(%eax),%xmm4 .byte 15,89,196 // mulps %xmm4,%xmm0 - .byte 15,40,176,64,173,0,0 // movaps 0xad40(%eax),%xmm6 + .byte 15,40,176,32,173,0,0 // movaps 0xad20(%eax),%xmm6 .byte 15,41,117,216 // movaps %xmm6,-0x28(%ebp) .byte 15,88,198 // addps %xmm6,%xmm0 .byte 15,89,193 // mulps %xmm1,%xmm0 - .byte 15,40,176,48,173,0,0 // movaps 0xad30(%eax),%xmm6 + .byte 15,40,176,16,173,0,0 // movaps 0xad10(%eax),%xmm6 .byte 15,40,202 // movaps %xmm2,%xmm1 .byte 15,89,206 // mulps %xmm6,%xmm1 - .byte 15,40,184,80,173,0,0 // movaps 0xad50(%eax),%xmm7 + .byte 15,40,184,48,173,0,0 // movaps 0xad30(%eax),%xmm7 .byte 15,41,125,232 // movaps %xmm7,-0x18(%ebp) .byte 15,88,199 // addps %xmm7,%xmm0 - .byte 15,40,184,96,173,0,0 // movaps 0xad60(%eax),%xmm7 + .byte 15,40,184,64,173,0,0 // movaps 0xad40(%eax),%xmm7 .byte 15,194,215,1 // cmpltps %xmm7,%xmm2 .byte 15,84,202 // andps %xmm2,%xmm1 .byte 15,85,208 // andnps %xmm0,%xmm2 @@ -57123,18 +57107,18 @@ _sk_from_srgb_dst_sse2: .byte 15,40,72,16 // movaps 0x10(%eax),%xmm1 .byte 15,40,233 // movaps %xmm1,%xmm5 .byte 15,89,237 // mulps %xmm5,%xmm5 - .byte 15,40,161,5,172,0,0 // movaps 0xac05(%ecx),%xmm4 + .byte 15,40,161,229,171,0,0 // movaps 0xabe5(%ecx),%xmm4 .byte 15,40,193 // movaps %xmm1,%xmm0 .byte 15,89,196 // mulps %xmm4,%xmm0 - .byte 15,40,177,101,172,0,0 // movaps 0xac65(%ecx),%xmm6 + .byte 15,40,177,69,172,0,0 // movaps 0xac45(%ecx),%xmm6 .byte 15,88,198 // addps %xmm6,%xmm0 .byte 15,89,197 // mulps %xmm5,%xmm0 - .byte 15,40,169,85,172,0,0 // movaps 0xac55(%ecx),%xmm5 + .byte 15,40,169,53,172,0,0 // movaps 0xac35(%ecx),%xmm5 .byte 15,40,209 // movaps %xmm1,%xmm2 .byte 15,89,213 // mulps %xmm5,%xmm2 - .byte 15,40,185,117,172,0,0 // movaps 0xac75(%ecx),%xmm7 + .byte 15,40,185,85,172,0,0 // movaps 0xac55(%ecx),%xmm7 .byte 15,88,199 // addps %xmm7,%xmm0 - .byte 15,40,153,133,172,0,0 // movaps 0xac85(%ecx),%xmm3 + .byte 15,40,153,101,172,0,0 // movaps 0xac65(%ecx),%xmm3 .byte 15,194,203,1 // cmpltps %xmm3,%xmm1 .byte 15,84,209 // andps %xmm1,%xmm2 .byte 15,85,200 // andnps %xmm0,%xmm1 @@ -57196,25 +57180,25 @@ _sk_to_srgb_sse2: .byte 232,0,0,0,0 // call 2256 <_sk_to_srgb_sse2+0x18> .byte 88 // pop %eax .byte 15,82,218 // rsqrtps %xmm2,%xmm3 - .byte 15,40,160,186,171,0,0 // movaps 0xabba(%eax),%xmm4 + .byte 15,40,160,154,171,0,0 // movaps 0xab9a(%eax),%xmm4 .byte 15,40,235 // movaps %xmm3,%xmm5 .byte 15,89,236 // mulps %xmm4,%xmm5 - .byte 15,40,128,202,171,0,0 // movaps 0xabca(%eax),%xmm0 + .byte 15,40,128,170,171,0,0 // movaps 0xabaa(%eax),%xmm0 .byte 15,41,69,232 // movaps %xmm0,-0x18(%ebp) .byte 15,88,232 // addps %xmm0,%xmm5 .byte 15,89,235 // mulps %xmm3,%xmm5 - .byte 15,40,128,218,171,0,0 // movaps 0xabda(%eax),%xmm0 + .byte 15,40,128,186,171,0,0 // movaps 0xabba(%eax),%xmm0 .byte 15,41,69,200 // movaps %xmm0,-0x38(%ebp) .byte 15,88,232 // addps %xmm0,%xmm5 - .byte 15,40,128,234,171,0,0 // movaps 0xabea(%eax),%xmm0 + .byte 15,40,128,202,171,0,0 // movaps 0xabca(%eax),%xmm0 .byte 15,41,69,216 // movaps %xmm0,-0x28(%ebp) .byte 15,88,216 // addps %xmm0,%xmm3 .byte 15,83,195 // rcpps %xmm3,%xmm0 .byte 15,89,197 // mulps %xmm5,%xmm0 - .byte 15,40,168,170,171,0,0 // movaps 0xabaa(%eax),%xmm5 + .byte 15,40,168,138,171,0,0 // movaps 0xab8a(%eax),%xmm5 .byte 15,40,202 // movaps %xmm2,%xmm1 .byte 15,89,205 // mulps %xmm5,%xmm1 - .byte 15,40,152,250,171,0,0 // movaps 0xabfa(%eax),%xmm3 + .byte 15,40,152,218,171,0,0 // movaps 0xabda(%eax),%xmm3 .byte 15,194,211,1 // cmpltps %xmm3,%xmm2 .byte 15,84,202 // andps %xmm2,%xmm1 .byte 15,85,208 // andnps %xmm0,%xmm2 @@ -57285,14 +57269,14 @@ _sk_rgb_to_hsl_sse2: .byte 15,40,195 // movaps %xmm3,%xmm0 .byte 15,92,193 // subps %xmm1,%xmm0 .byte 15,41,69,216 // movaps %xmm0,-0x28(%ebp) - .byte 15,40,136,147,169,0,0 // movaps 0xa993(%eax),%xmm1 + .byte 15,40,136,115,169,0,0 // movaps 0xa973(%eax),%xmm1 .byte 15,94,200 // divps %xmm0,%xmm1 .byte 15,40,199 // movaps %xmm7,%xmm0 .byte 15,92,194 // subps %xmm2,%xmm0 .byte 15,89,193 // mulps %xmm1,%xmm0 .byte 15,40,239 // movaps %xmm7,%xmm5 .byte 15,194,234,1 // cmpltps %xmm2,%xmm5 - .byte 15,84,168,19,171,0,0 // andps 0xab13(%eax),%xmm5 + .byte 15,84,168,243,170,0,0 // andps 0xaaf3(%eax),%xmm5 .byte 15,88,232 // addps %xmm0,%xmm5 .byte 15,40,195 // movaps %xmm3,%xmm0 .byte 15,194,196,0 // cmpeqps %xmm4,%xmm0 @@ -57302,9 +57286,9 @@ _sk_rgb_to_hsl_sse2: .byte 15,92,231 // subps %xmm7,%xmm4 .byte 15,89,209 // mulps %xmm1,%xmm2 .byte 15,89,225 // mulps %xmm1,%xmm4 - .byte 15,40,136,35,171,0,0 // movaps 0xab23(%eax),%xmm1 + .byte 15,40,136,3,171,0,0 // movaps 0xab03(%eax),%xmm1 .byte 15,88,209 // addps %xmm1,%xmm2 - .byte 15,88,160,51,171,0,0 // addps 0xab33(%eax),%xmm4 + .byte 15,88,160,19,171,0,0 // addps 0xab13(%eax),%xmm4 .byte 15,84,214 // andps %xmm6,%xmm2 .byte 15,85,244 // andnps %xmm4,%xmm6 .byte 15,86,242 // orps %xmm2,%xmm6 @@ -57316,7 +57300,7 @@ _sk_rgb_to_hsl_sse2: .byte 15,194,226,4 // cmpneqps %xmm2,%xmm4 .byte 15,92,203 // subps %xmm3,%xmm1 .byte 15,88,218 // addps %xmm2,%xmm3 - .byte 15,40,168,131,169,0,0 // movaps 0xa983(%eax),%xmm5 + .byte 15,40,168,99,169,0,0 // movaps 0xa963(%eax),%xmm5 .byte 15,92,202 // subps %xmm2,%xmm1 .byte 15,40,211 // movaps %xmm3,%xmm2 .byte 15,89,213 // mulps %xmm5,%xmm2 @@ -57326,7 +57310,7 @@ _sk_rgb_to_hsl_sse2: .byte 15,86,233 // orps %xmm1,%xmm5 .byte 15,40,77,216 // movaps -0x28(%ebp),%xmm1 .byte 15,94,205 // divps %xmm5,%xmm1 - .byte 15,89,128,67,171,0,0 // mulps 0xab43(%eax),%xmm0 + .byte 15,89,128,35,171,0,0 // mulps 0xab23(%eax),%xmm0 .byte 15,84,196 // andps %xmm4,%xmm0 .byte 15,84,204 // andps %xmm4,%xmm1 .byte 139,69,12 // mov 0xc(%ebp),%eax @@ -57351,7 +57335,7 @@ _sk_hsl_to_rgb_sse2: .byte 15,41,69,184 // movaps %xmm0,-0x48(%ebp) .byte 232,0,0,0,0 // call 2448 <_sk_hsl_to_rgb_sse2+0x19> .byte 88 // pop %eax - .byte 15,40,160,136,168,0,0 // movaps 0xa888(%eax),%xmm4 + .byte 15,40,160,104,168,0,0 // movaps 0xa868(%eax),%xmm4 .byte 15,40,220 // movaps %xmm4,%xmm3 .byte 15,41,165,104,255,255,255 // movaps %xmm4,-0x98(%ebp) .byte 15,194,218,2 // cmpleps %xmm2,%xmm3 @@ -57364,13 +57348,13 @@ _sk_hsl_to_rgb_sse2: .byte 15,84,243 // andps %xmm3,%xmm6 .byte 15,85,217 // andnps %xmm1,%xmm3 .byte 15,86,222 // orps %xmm6,%xmm3 - .byte 15,40,168,88,170,0,0 // movaps 0xaa58(%eax),%xmm5 + .byte 15,40,168,56,170,0,0 // movaps 0xaa38(%eax),%xmm5 .byte 15,88,232 // addps %xmm0,%xmm5 .byte 243,15,91,205 // cvttps2dq %xmm5,%xmm1 .byte 15,91,201 // cvtdq2ps %xmm1,%xmm1 .byte 15,40,197 // movaps %xmm5,%xmm0 .byte 15,194,193,1 // cmpltps %xmm1,%xmm0 - .byte 15,40,176,152,168,0,0 // movaps 0xa898(%eax),%xmm6 + .byte 15,40,176,120,168,0,0 // movaps 0xa878(%eax),%xmm6 .byte 15,41,117,136 // movaps %xmm6,-0x78(%ebp) .byte 15,84,198 // andps %xmm6,%xmm0 .byte 15,92,200 // subps %xmm0,%xmm1 @@ -57380,19 +57364,19 @@ _sk_hsl_to_rgb_sse2: .byte 15,41,93,216 // movaps %xmm3,-0x28(%ebp) .byte 15,88,210 // addps %xmm2,%xmm2 .byte 15,92,211 // subps %xmm3,%xmm2 - .byte 15,40,184,104,170,0,0 // movaps 0xaa68(%eax),%xmm7 + .byte 15,40,184,72,170,0,0 // movaps 0xaa48(%eax),%xmm7 .byte 15,41,189,88,255,255,255 // movaps %xmm7,-0xa8(%ebp) .byte 15,194,253,2 // cmpleps %xmm5,%xmm7 .byte 15,92,218 // subps %xmm2,%xmm3 .byte 15,41,93,200 // movaps %xmm3,-0x38(%ebp) .byte 15,40,204 // movaps %xmm4,%xmm1 .byte 15,194,205,2 // cmpleps %xmm5,%xmm1 - .byte 15,40,160,72,170,0,0 // movaps 0xaa48(%eax),%xmm4 + .byte 15,40,160,40,170,0,0 // movaps 0xaa28(%eax),%xmm4 .byte 15,41,165,120,255,255,255 // movaps %xmm4,-0x88(%ebp) .byte 15,194,229,2 // cmpleps %xmm5,%xmm4 - .byte 15,40,176,24,170,0,0 // movaps 0xaa18(%eax),%xmm6 + .byte 15,40,176,248,169,0,0 // movaps 0xa9f8(%eax),%xmm6 .byte 15,89,238 // mulps %xmm6,%xmm5 - .byte 15,40,128,56,170,0,0 // movaps 0xaa38(%eax),%xmm0 + .byte 15,40,128,24,170,0,0 // movaps 0xaa18(%eax),%xmm0 .byte 15,41,69,168 // movaps %xmm0,-0x58(%ebp) .byte 15,92,197 // subps %xmm5,%xmm0 .byte 15,89,195 // mulps %xmm3,%xmm0 @@ -57418,18 +57402,18 @@ _sk_hsl_to_rgb_sse2: .byte 15,91,192 // cvtdq2ps %xmm0,%xmm0 .byte 15,40,203 // movaps %xmm3,%xmm1 .byte 15,194,200,1 // cmpltps %xmm0,%xmm1 - .byte 15,84,136,152,168,0,0 // andps 0xa898(%eax),%xmm1 + .byte 15,84,136,120,168,0,0 // andps 0xa878(%eax),%xmm1 .byte 15,92,193 // subps %xmm1,%xmm0 .byte 15,40,203 // movaps %xmm3,%xmm1 .byte 15,92,200 // subps %xmm0,%xmm1 - .byte 15,40,128,104,170,0,0 // movaps 0xaa68(%eax),%xmm0 + .byte 15,40,128,72,170,0,0 // movaps 0xaa48(%eax),%xmm0 .byte 15,194,193,2 // cmpleps %xmm1,%xmm0 - .byte 15,40,152,136,168,0,0 // movaps 0xa888(%eax),%xmm3 + .byte 15,40,152,104,168,0,0 // movaps 0xa868(%eax),%xmm3 .byte 15,194,217,2 // cmpleps %xmm1,%xmm3 - .byte 15,40,160,72,170,0,0 // movaps 0xaa48(%eax),%xmm4 + .byte 15,40,160,40,170,0,0 // movaps 0xaa28(%eax),%xmm4 .byte 15,194,225,2 // cmpleps %xmm1,%xmm4 .byte 15,89,206 // mulps %xmm6,%xmm1 - .byte 15,40,168,56,170,0,0 // movaps 0xaa38(%eax),%xmm5 + .byte 15,40,168,24,170,0,0 // movaps 0xaa18(%eax),%xmm5 .byte 15,92,233 // subps %xmm1,%xmm5 .byte 15,89,239 // mulps %xmm7,%xmm5 .byte 15,88,234 // addps %xmm2,%xmm5 @@ -57449,7 +57433,7 @@ _sk_hsl_to_rgb_sse2: .byte 15,40,125,232 // movaps -0x18(%ebp),%xmm7 .byte 15,85,252 // andnps %xmm4,%xmm7 .byte 15,40,93,184 // movaps -0x48(%ebp),%xmm3 - .byte 15,88,152,120,170,0,0 // addps 0xaa78(%eax),%xmm3 + .byte 15,88,152,88,170,0,0 // addps 0xaa58(%eax),%xmm3 .byte 243,15,91,195 // cvttps2dq %xmm3,%xmm0 .byte 15,91,192 // cvtdq2ps %xmm0,%xmm0 .byte 15,40,203 // movaps %xmm3,%xmm1 @@ -57551,9 +57535,9 @@ _sk_scale_u8_sse2: .byte 102,15,110,36,62 // movd (%esi,%edi,1),%xmm4 .byte 102,15,96,224 // punpcklbw %xmm0,%xmm4 .byte 102,15,97,224 // punpcklwd %xmm0,%xmm4 - .byte 102,15,219,162,222,166,0,0 // pand 0xa6de(%edx),%xmm4 + .byte 102,15,219,162,190,166,0,0 // pand 0xa6be(%edx),%xmm4 .byte 15,91,228 // cvtdq2ps %xmm4,%xmm4 - .byte 15,89,162,14,168,0,0 // mulps 0xa80e(%edx),%xmm4 + .byte 15,89,162,238,167,0,0 // mulps 0xa7ee(%edx),%xmm4 .byte 15,89,196 // mulps %xmm4,%xmm0 .byte 15,89,204 // mulps %xmm4,%xmm1 .byte 15,89,212 // mulps %xmm4,%xmm2 @@ -57619,17 +57603,17 @@ _sk_scale_565_sse2: .byte 15,133,157,0,0,0 // jne 283a <_sk_scale_565_sse2+0xd8> .byte 243,15,126,52,126 // movq (%esi,%edi,2),%xmm6 .byte 102,15,97,240 // punpcklwd %xmm0,%xmm6 - .byte 102,15,111,162,100,167,0,0 // movdqa 0xa764(%edx),%xmm4 + .byte 102,15,111,162,68,167,0,0 // movdqa 0xa744(%edx),%xmm4 .byte 102,15,219,230 // pand %xmm6,%xmm4 .byte 15,91,212 // cvtdq2ps %xmm4,%xmm2 - .byte 15,89,146,116,167,0,0 // mulps 0xa774(%edx),%xmm2 - .byte 102,15,111,170,132,167,0,0 // movdqa 0xa784(%edx),%xmm5 + .byte 15,89,146,84,167,0,0 // mulps 0xa754(%edx),%xmm2 + .byte 102,15,111,170,100,167,0,0 // movdqa 0xa764(%edx),%xmm5 .byte 102,15,219,238 // pand %xmm6,%xmm5 .byte 15,91,237 // cvtdq2ps %xmm5,%xmm5 - .byte 15,89,170,148,167,0,0 // mulps 0xa794(%edx),%xmm5 - .byte 102,15,219,178,164,167,0,0 // pand 0xa7a4(%edx),%xmm6 + .byte 15,89,170,116,167,0,0 // mulps 0xa774(%edx),%xmm5 + .byte 102,15,219,178,132,167,0,0 // pand 0xa784(%edx),%xmm6 .byte 15,91,246 // cvtdq2ps %xmm6,%xmm6 - .byte 15,89,178,180,167,0,0 // mulps 0xa7b4(%edx),%xmm6 + .byte 15,89,178,148,167,0,0 // mulps 0xa794(%edx),%xmm6 .byte 15,40,253 // movaps %xmm5,%xmm7 .byte 15,93,254 // minps %xmm6,%xmm7 .byte 15,40,226 // movaps %xmm2,%xmm4 @@ -57743,9 +57727,9 @@ _sk_lerp_u8_sse2: .byte 102,15,110,36,62 // movd (%esi,%edi,1),%xmm4 .byte 102,15,96,224 // punpcklbw %xmm0,%xmm4 .byte 102,15,97,224 // punpcklwd %xmm0,%xmm4 - .byte 102,15,219,162,182,164,0,0 // pand 0xa4b6(%edx),%xmm4 + .byte 102,15,219,162,150,164,0,0 // pand 0xa496(%edx),%xmm4 .byte 15,91,228 // cvtdq2ps %xmm4,%xmm4 - .byte 15,89,162,230,165,0,0 // mulps 0xa5e6(%edx),%xmm4 + .byte 15,89,162,198,165,0,0 // mulps 0xa5c6(%edx),%xmm4 .byte 15,40,105,16 // movaps 0x10(%ecx),%xmm5 .byte 15,40,113,32 // movaps 0x20(%ecx),%xmm6 .byte 15,92,197 // subps %xmm5,%xmm0 @@ -57823,17 +57807,17 @@ _sk_lerp_565_sse2: .byte 15,133,211,0,0,0 // jne 2ac8 <_sk_lerp_565_sse2+0x113> .byte 243,15,126,44,126 // movq (%esi,%edi,2),%xmm5 .byte 102,15,97,232 // punpcklwd %xmm0,%xmm5 - .byte 102,15,111,162,12,165,0,0 // movdqa 0xa50c(%edx),%xmm4 + .byte 102,15,111,162,236,164,0,0 // movdqa 0xa4ec(%edx),%xmm4 .byte 102,15,219,229 // pand %xmm5,%xmm4 .byte 15,91,204 // cvtdq2ps %xmm4,%xmm1 - .byte 15,89,138,28,165,0,0 // mulps 0xa51c(%edx),%xmm1 - .byte 102,15,111,178,44,165,0,0 // movdqa 0xa52c(%edx),%xmm6 + .byte 15,89,138,252,164,0,0 // mulps 0xa4fc(%edx),%xmm1 + .byte 102,15,111,178,12,165,0,0 // movdqa 0xa50c(%edx),%xmm6 .byte 102,15,219,245 // pand %xmm5,%xmm6 .byte 15,91,246 // cvtdq2ps %xmm6,%xmm6 - .byte 15,89,178,60,165,0,0 // mulps 0xa53c(%edx),%xmm6 - .byte 102,15,219,170,76,165,0,0 // pand 0xa54c(%edx),%xmm5 + .byte 15,89,178,28,165,0,0 // mulps 0xa51c(%edx),%xmm6 + .byte 102,15,219,170,44,165,0,0 // pand 0xa52c(%edx),%xmm5 .byte 15,91,213 // cvtdq2ps %xmm5,%xmm2 - .byte 15,89,146,92,165,0,0 // mulps 0xa55c(%edx),%xmm2 + .byte 15,89,146,60,165,0,0 // mulps 0xa53c(%edx),%xmm2 .byte 15,40,218 // movaps %xmm2,%xmm3 .byte 15,41,93,200 // movaps %xmm3,-0x38(%ebp) .byte 15,40,254 // movaps %xmm6,%xmm7 @@ -57912,16 +57896,16 @@ _sk_load_tables_sse2: .byte 131,236,12 // sub $0xc,%esp .byte 232,0,0,0,0 // call 2b1e <_sk_load_tables_sse2+0xe> .byte 90 // pop %edx - .byte 139,117,12 // mov 0xc(%ebp),%esi + .byte 139,69,12 // mov 0xc(%ebp),%eax .byte 139,77,8 // mov 0x8(%ebp),%ecx - .byte 139,57 // mov (%ecx),%edi + .byte 139,48 // mov (%eax),%esi .byte 139,65,8 // mov 0x8(%ecx),%eax .byte 133,192 // test %eax,%eax - .byte 139,54 // mov (%esi),%esi + .byte 139,57 // mov (%ecx),%edi .byte 139,30 // mov (%esi),%ebx .byte 15,133,22,1,0,0 // jne 2c4c <_sk_load_tables_sse2+0x13c> .byte 243,15,111,28,187 // movdqu (%ebx,%edi,4),%xmm3 - .byte 102,15,111,146,130,162,0,0 // movdqa 0xa282(%edx),%xmm2 + .byte 102,15,111,146,98,162,0,0 // movdqa 0xa262(%edx),%xmm2 .byte 102,15,111,195 // movdqa %xmm3,%xmm0 .byte 102,15,219,194 // pand %xmm2,%xmm0 .byte 102,15,112,200,78 // pshufd $0x4e,%xmm0,%xmm1 @@ -57977,7 +57961,7 @@ _sk_load_tables_sse2: .byte 102,15,20,215 // unpcklpd %xmm7,%xmm2 .byte 102,15,114,211,24 // psrld $0x18,%xmm3 .byte 15,91,219 // cvtdq2ps %xmm3,%xmm3 - .byte 15,89,154,178,163,0,0 // mulps 0xa3b2(%edx),%xmm3 + .byte 15,89,154,146,163,0,0 // mulps 0xa392(%edx),%xmm3 .byte 139,69,12 // mov 0xc(%ebp),%eax .byte 137,194 // mov %eax,%edx .byte 141,66,8 // lea 0x8(%edx),%eax @@ -58018,17 +58002,17 @@ _sk_load_tables_u16_be_sse2: .byte 131,236,44 // sub $0x2c,%esp .byte 232,0,0,0,0 // call 2c8f <_sk_load_tables_u16_be_sse2+0xe> .byte 90 // pop %edx - .byte 139,69,12 // mov 0xc(%ebp),%eax + .byte 139,117,12 // mov 0xc(%ebp),%esi .byte 139,77,8 // mov 0x8(%ebp),%ecx .byte 139,57 // mov (%ecx),%edi - .byte 139,89,8 // mov 0x8(%ecx),%ebx + .byte 139,65,8 // mov 0x8(%ecx),%eax .byte 193,231,2 // shl $0x2,%edi - .byte 133,219 // test %ebx,%ebx - .byte 139,48 // mov (%eax),%esi - .byte 139,6 // mov (%esi),%eax + .byte 133,192 // test %eax,%eax + .byte 139,54 // mov (%esi),%esi + .byte 139,30 // mov (%esi),%ebx .byte 15,133,210,1,0,0 // jne 2e7c <_sk_load_tables_u16_be_sse2+0x1fb> - .byte 102,15,16,4,120 // movupd (%eax,%edi,2),%xmm0 - .byte 243,15,111,76,120,16 // movdqu 0x10(%eax,%edi,2),%xmm1 + .byte 102,15,16,4,123 // movupd (%ebx,%edi,2),%xmm0 + .byte 243,15,111,76,123,16 // movdqu 0x10(%ebx,%edi,2),%xmm1 .byte 102,15,40,216 // movapd %xmm0,%xmm3 .byte 102,15,97,217 // punpcklwd %xmm1,%xmm3 .byte 102,15,105,193 // punpckhwd %xmm1,%xmm0 @@ -58052,7 +58036,7 @@ _sk_load_tables_u16_be_sse2: .byte 242,15,112,192,232 // pshuflw $0xe8,%xmm0,%xmm0 .byte 243,15,112,192,232 // pshufhw $0xe8,%xmm0,%xmm0 .byte 102,15,112,192,232 // pshufd $0xe8,%xmm0,%xmm0 - .byte 102,15,111,146,177,162,0,0 // movdqa 0xa2b1(%edx),%xmm2 + .byte 102,15,111,146,145,162,0,0 // movdqa 0xa291(%edx),%xmm2 .byte 102,15,219,194 // pand %xmm2,%xmm0 .byte 102,15,239,228 // pxor %xmm4,%xmm4 .byte 102,15,97,196 // punpcklwd %xmm4,%xmm0 @@ -58124,7 +58108,7 @@ _sk_load_tables_u16_be_sse2: .byte 243,15,126,93,232 // movq -0x18(%ebp),%xmm3 .byte 102,15,97,220 // punpcklwd %xmm4,%xmm3 .byte 15,91,219 // cvtdq2ps %xmm3,%xmm3 - .byte 15,89,154,193,162,0,0 // mulps 0xa2c1(%edx),%xmm3 + .byte 15,89,154,161,162,0,0 // mulps 0xa2a1(%edx),%xmm3 .byte 139,69,12 // mov 0xc(%ebp),%eax .byte 137,194 // mov %eax,%edx .byte 141,66,8 // lea 0x8(%edx),%eax @@ -58138,14 +58122,14 @@ _sk_load_tables_u16_be_sse2: .byte 91 // pop %ebx .byte 93 // pop %ebp .byte 195 // ret - .byte 242,15,16,4,120 // movsd (%eax,%edi,2),%xmm0 + .byte 242,15,16,4,123 // movsd (%ebx,%edi,2),%xmm0 .byte 102,15,239,201 // pxor %xmm1,%xmm1 - .byte 131,251,1 // cmp $0x1,%ebx + .byte 131,248,1 // cmp $0x1,%eax .byte 15,132,39,254,255,255 // je 2cb5 <_sk_load_tables_u16_be_sse2+0x34> - .byte 102,15,22,68,120,8 // movhpd 0x8(%eax,%edi,2),%xmm0 - .byte 131,251,3 // cmp $0x3,%ebx + .byte 102,15,22,68,123,8 // movhpd 0x8(%ebx,%edi,2),%xmm0 + .byte 131,248,3 // cmp $0x3,%eax .byte 15,130,24,254,255,255 // jb 2cb5 <_sk_load_tables_u16_be_sse2+0x34> - .byte 243,15,126,76,120,16 // movq 0x10(%eax,%edi,2),%xmm1 + .byte 243,15,126,76,123,16 // movq 0x10(%ebx,%edi,2),%xmm1 .byte 233,13,254,255,255 // jmp 2cb5 <_sk_load_tables_u16_be_sse2+0x34> HIDDEN _sk_load_tables_rgb_u16_be_sse2 @@ -58197,7 +58181,7 @@ _sk_load_tables_rgb_u16_be_sse2: .byte 242,15,112,194,232 // pshuflw $0xe8,%xmm2,%xmm0 .byte 243,15,112,192,232 // pshufhw $0xe8,%xmm0,%xmm0 .byte 102,15,112,192,232 // pshufd $0xe8,%xmm0,%xmm0 - .byte 102,15,111,146,138,160,0,0 // movdqa 0xa08a(%edx),%xmm2 + .byte 102,15,111,146,106,160,0,0 // movdqa 0xa06a(%edx),%xmm2 .byte 102,15,219,194 // pand %xmm2,%xmm0 .byte 102,15,239,219 // pxor %xmm3,%xmm3 .byte 102,15,97,195 // punpcklwd %xmm3,%xmm0 @@ -58262,7 +58246,7 @@ _sk_load_tables_rgb_u16_be_sse2: .byte 137,198 // mov %eax,%esi .byte 141,70,8 // lea 0x8(%esi),%eax .byte 131,236,8 // sub $0x8,%esp - .byte 15,40,154,42,158,0,0 // movaps 0x9e2a(%edx),%xmm3 + .byte 15,40,154,10,158,0,0 // movaps 0x9e0a(%edx),%xmm3 .byte 80 // push %eax .byte 81 // push %ecx .byte 255,86,4 // call *0x4(%esi) @@ -58305,7 +58289,7 @@ _sk_byte_tables_sse2: .byte 90 // pop %edx .byte 139,69,12 // mov 0xc(%ebp),%eax .byte 139,8 // mov (%eax),%ecx - .byte 15,40,162,205,156,0,0 // movaps 0x9ccd(%edx),%xmm4 + .byte 15,40,162,173,156,0,0 // movaps 0x9cad(%edx),%xmm4 .byte 15,89,196 // mulps %xmm4,%xmm0 .byte 102,15,91,192 // cvtps2dq %xmm0,%xmm0 .byte 102,15,112,232,78 // pshufd $0x4e,%xmm0,%xmm5 @@ -58327,7 +58311,7 @@ _sk_byte_tables_sse2: .byte 102,15,110,192 // movd %eax,%xmm0 .byte 139,65,4 // mov 0x4(%ecx),%eax .byte 102,15,196,195,1 // pinsrw $0x1,%ebx,%xmm0 - .byte 15,40,170,237,157,0,0 // movaps 0x9ded(%edx),%xmm5 + .byte 15,40,170,205,157,0,0 // movaps 0x9dcd(%edx),%xmm5 .byte 15,89,204 // mulps %xmm4,%xmm1 .byte 102,15,91,201 // cvtps2dq %xmm1,%xmm1 .byte 102,15,112,241,78 // pshufd $0x4e,%xmm1,%xmm6 @@ -58457,7 +58441,7 @@ _sk_byte_tables_rgb_sse2: .byte 102,15,110,199 // movd %edi,%xmm0 .byte 139,121,4 // mov 0x4(%ecx),%edi .byte 102,15,196,198,1 // pinsrw $0x1,%esi,%xmm0 - .byte 15,40,170,241,155,0,0 // movaps 0x9bf1(%edx),%xmm5 + .byte 15,40,170,209,155,0,0 // movaps 0x9bd1(%edx),%xmm5 .byte 15,89,204 // mulps %xmm4,%xmm1 .byte 102,15,91,201 // cvtps2dq %xmm1,%xmm1 .byte 102,15,112,241,78 // pshufd $0x4e,%xmm1,%xmm6 @@ -58713,15 +58697,15 @@ _sk_parametric_r_sse2: .byte 15,198,237,0 // shufps $0x0,%xmm5,%xmm5 .byte 15,88,245 // addps %xmm5,%xmm6 .byte 15,91,238 // cvtdq2ps %xmm6,%xmm5 - .byte 15,89,170,177,153,0,0 // mulps 0x99b1(%edx),%xmm5 - .byte 15,84,178,193,153,0,0 // andps 0x99c1(%edx),%xmm6 - .byte 15,86,178,33,151,0,0 // orps 0x9721(%edx),%xmm6 - .byte 15,88,170,209,153,0,0 // addps 0x99d1(%edx),%xmm5 - .byte 15,40,186,225,153,0,0 // movaps 0x99e1(%edx),%xmm7 + .byte 15,89,170,145,153,0,0 // mulps 0x9991(%edx),%xmm5 + .byte 15,84,178,161,153,0,0 // andps 0x99a1(%edx),%xmm6 + .byte 15,86,178,1,151,0,0 // orps 0x9701(%edx),%xmm6 + .byte 15,88,170,177,153,0,0 // addps 0x99b1(%edx),%xmm5 + .byte 15,40,186,193,153,0,0 // movaps 0x99c1(%edx),%xmm7 .byte 15,89,254 // mulps %xmm6,%xmm7 .byte 15,92,239 // subps %xmm7,%xmm5 - .byte 15,88,178,241,153,0,0 // addps 0x99f1(%edx),%xmm6 - .byte 15,40,186,1,154,0,0 // movaps 0x9a01(%edx),%xmm7 + .byte 15,88,178,209,153,0,0 // addps 0x99d1(%edx),%xmm6 + .byte 15,40,186,225,153,0,0 // movaps 0x99e1(%edx),%xmm7 .byte 15,94,254 // divps %xmm6,%xmm7 .byte 243,15,16,49 // movss (%ecx),%xmm6 .byte 15,198,246,0 // shufps $0x0,%xmm6,%xmm6 @@ -58731,21 +58715,21 @@ _sk_parametric_r_sse2: .byte 15,91,254 // cvtdq2ps %xmm6,%xmm7 .byte 15,40,197 // movaps %xmm5,%xmm0 .byte 15,194,199,1 // cmpltps %xmm7,%xmm0 - .byte 15,40,178,49,151,0,0 // movaps 0x9731(%edx),%xmm6 + .byte 15,40,178,17,151,0,0 // movaps 0x9711(%edx),%xmm6 .byte 15,84,198 // andps %xmm6,%xmm0 .byte 15,92,248 // subps %xmm0,%xmm7 .byte 15,40,197 // movaps %xmm5,%xmm0 .byte 15,92,199 // subps %xmm7,%xmm0 - .byte 15,88,170,17,154,0,0 // addps 0x9a11(%edx),%xmm5 - .byte 15,40,186,33,154,0,0 // movaps 0x9a21(%edx),%xmm7 + .byte 15,88,170,241,153,0,0 // addps 0x99f1(%edx),%xmm5 + .byte 15,40,186,1,154,0,0 // movaps 0x9a01(%edx),%xmm7 .byte 15,89,248 // mulps %xmm0,%xmm7 .byte 15,92,239 // subps %xmm7,%xmm5 - .byte 15,40,186,49,154,0,0 // movaps 0x9a31(%edx),%xmm7 + .byte 15,40,186,17,154,0,0 // movaps 0x9a11(%edx),%xmm7 .byte 15,92,248 // subps %xmm0,%xmm7 - .byte 15,40,130,65,154,0,0 // movaps 0x9a41(%edx),%xmm0 + .byte 15,40,130,33,154,0,0 // movaps 0x9a21(%edx),%xmm0 .byte 15,94,199 // divps %xmm7,%xmm0 .byte 15,88,197 // addps %xmm5,%xmm0 - .byte 15,89,130,81,154,0,0 // mulps 0x9a51(%edx),%xmm0 + .byte 15,89,130,49,154,0,0 // mulps 0x9a31(%edx),%xmm0 .byte 102,15,91,192 // cvtps2dq %xmm0,%xmm0 .byte 243,15,16,105,20 // movss 0x14(%ecx),%xmm5 .byte 15,198,237,0 // shufps $0x0,%xmm5,%xmm5 @@ -58799,15 +58783,15 @@ _sk_parametric_g_sse2: .byte 15,198,237,0 // shufps $0x0,%xmm5,%xmm5 .byte 15,88,245 // addps %xmm5,%xmm6 .byte 15,91,238 // cvtdq2ps %xmm6,%xmm5 - .byte 15,89,170,122,152,0,0 // mulps 0x987a(%edx),%xmm5 - .byte 15,84,178,138,152,0,0 // andps 0x988a(%edx),%xmm6 - .byte 15,86,178,234,149,0,0 // orps 0x95ea(%edx),%xmm6 - .byte 15,88,170,154,152,0,0 // addps 0x989a(%edx),%xmm5 - .byte 15,40,186,170,152,0,0 // movaps 0x98aa(%edx),%xmm7 + .byte 15,89,170,90,152,0,0 // mulps 0x985a(%edx),%xmm5 + .byte 15,84,178,106,152,0,0 // andps 0x986a(%edx),%xmm6 + .byte 15,86,178,202,149,0,0 // orps 0x95ca(%edx),%xmm6 + .byte 15,88,170,122,152,0,0 // addps 0x987a(%edx),%xmm5 + .byte 15,40,186,138,152,0,0 // movaps 0x988a(%edx),%xmm7 .byte 15,89,254 // mulps %xmm6,%xmm7 .byte 15,92,239 // subps %xmm7,%xmm5 - .byte 15,88,178,186,152,0,0 // addps 0x98ba(%edx),%xmm6 - .byte 15,40,186,202,152,0,0 // movaps 0x98ca(%edx),%xmm7 + .byte 15,88,178,154,152,0,0 // addps 0x989a(%edx),%xmm6 + .byte 15,40,186,170,152,0,0 // movaps 0x98aa(%edx),%xmm7 .byte 15,94,254 // divps %xmm6,%xmm7 .byte 243,15,16,49 // movss (%ecx),%xmm6 .byte 15,198,246,0 // shufps $0x0,%xmm6,%xmm6 @@ -58817,21 +58801,21 @@ _sk_parametric_g_sse2: .byte 15,91,254 // cvtdq2ps %xmm6,%xmm7 .byte 15,40,197 // movaps %xmm5,%xmm0 .byte 15,194,199,1 // cmpltps %xmm7,%xmm0 - .byte 15,40,178,250,149,0,0 // movaps 0x95fa(%edx),%xmm6 + .byte 15,40,178,218,149,0,0 // movaps 0x95da(%edx),%xmm6 .byte 15,84,198 // andps %xmm6,%xmm0 .byte 15,92,248 // subps %xmm0,%xmm7 .byte 15,40,197 // movaps %xmm5,%xmm0 .byte 15,92,199 // subps %xmm7,%xmm0 - .byte 15,88,170,218,152,0,0 // addps 0x98da(%edx),%xmm5 - .byte 15,40,186,234,152,0,0 // movaps 0x98ea(%edx),%xmm7 + .byte 15,88,170,186,152,0,0 // addps 0x98ba(%edx),%xmm5 + .byte 15,40,186,202,152,0,0 // movaps 0x98ca(%edx),%xmm7 .byte 15,89,248 // mulps %xmm0,%xmm7 .byte 15,92,239 // subps %xmm7,%xmm5 - .byte 15,40,186,250,152,0,0 // movaps 0x98fa(%edx),%xmm7 + .byte 15,40,186,218,152,0,0 // movaps 0x98da(%edx),%xmm7 .byte 15,92,248 // subps %xmm0,%xmm7 - .byte 15,40,130,10,153,0,0 // movaps 0x990a(%edx),%xmm0 + .byte 15,40,130,234,152,0,0 // movaps 0x98ea(%edx),%xmm0 .byte 15,94,199 // divps %xmm7,%xmm0 .byte 15,88,197 // addps %xmm5,%xmm0 - .byte 15,89,130,26,153,0,0 // mulps 0x991a(%edx),%xmm0 + .byte 15,89,130,250,152,0,0 // mulps 0x98fa(%edx),%xmm0 .byte 102,15,91,192 // cvtps2dq %xmm0,%xmm0 .byte 243,15,16,105,20 // movss 0x14(%ecx),%xmm5 .byte 15,198,237,0 // shufps $0x0,%xmm5,%xmm5 @@ -58884,15 +58868,15 @@ _sk_parametric_b_sse2: .byte 15,198,237,0 // shufps $0x0,%xmm5,%xmm5 .byte 15,88,245 // addps %xmm5,%xmm6 .byte 15,91,238 // cvtdq2ps %xmm6,%xmm5 - .byte 15,89,170,70,151,0,0 // mulps 0x9746(%edx),%xmm5 - .byte 15,84,178,86,151,0,0 // andps 0x9756(%edx),%xmm6 - .byte 15,86,178,182,148,0,0 // orps 0x94b6(%edx),%xmm6 - .byte 15,88,170,102,151,0,0 // addps 0x9766(%edx),%xmm5 - .byte 15,40,186,118,151,0,0 // movaps 0x9776(%edx),%xmm7 + .byte 15,89,170,38,151,0,0 // mulps 0x9726(%edx),%xmm5 + .byte 15,84,178,54,151,0,0 // andps 0x9736(%edx),%xmm6 + .byte 15,86,178,150,148,0,0 // orps 0x9496(%edx),%xmm6 + .byte 15,88,170,70,151,0,0 // addps 0x9746(%edx),%xmm5 + .byte 15,40,186,86,151,0,0 // movaps 0x9756(%edx),%xmm7 .byte 15,89,254 // mulps %xmm6,%xmm7 .byte 15,92,239 // subps %xmm7,%xmm5 - .byte 15,88,178,134,151,0,0 // addps 0x9786(%edx),%xmm6 - .byte 15,40,186,150,151,0,0 // movaps 0x9796(%edx),%xmm7 + .byte 15,88,178,102,151,0,0 // addps 0x9766(%edx),%xmm6 + .byte 15,40,186,118,151,0,0 // movaps 0x9776(%edx),%xmm7 .byte 15,94,254 // divps %xmm6,%xmm7 .byte 243,15,16,49 // movss (%ecx),%xmm6 .byte 15,198,246,0 // shufps $0x0,%xmm6,%xmm6 @@ -58902,21 +58886,21 @@ _sk_parametric_b_sse2: .byte 15,91,254 // cvtdq2ps %xmm6,%xmm7 .byte 15,40,197 // movaps %xmm5,%xmm0 .byte 15,194,199,1 // cmpltps %xmm7,%xmm0 - .byte 15,40,178,198,148,0,0 // movaps 0x94c6(%edx),%xmm6 + .byte 15,40,178,166,148,0,0 // movaps 0x94a6(%edx),%xmm6 .byte 15,84,198 // andps %xmm6,%xmm0 .byte 15,92,248 // subps %xmm0,%xmm7 .byte 15,40,197 // movaps %xmm5,%xmm0 .byte 15,92,199 // subps %xmm7,%xmm0 - .byte 15,88,170,166,151,0,0 // addps 0x97a6(%edx),%xmm5 - .byte 15,40,186,182,151,0,0 // movaps 0x97b6(%edx),%xmm7 + .byte 15,88,170,134,151,0,0 // addps 0x9786(%edx),%xmm5 + .byte 15,40,186,150,151,0,0 // movaps 0x9796(%edx),%xmm7 .byte 15,89,248 // mulps %xmm0,%xmm7 .byte 15,92,239 // subps %xmm7,%xmm5 - .byte 15,40,186,198,151,0,0 // movaps 0x97c6(%edx),%xmm7 + .byte 15,40,186,166,151,0,0 // movaps 0x97a6(%edx),%xmm7 .byte 15,92,248 // subps %xmm0,%xmm7 - .byte 15,40,130,214,151,0,0 // movaps 0x97d6(%edx),%xmm0 + .byte 15,40,130,182,151,0,0 // movaps 0x97b6(%edx),%xmm0 .byte 15,94,199 // divps %xmm7,%xmm0 .byte 15,88,197 // addps %xmm5,%xmm0 - .byte 15,89,130,230,151,0,0 // mulps 0x97e6(%edx),%xmm0 + .byte 15,89,130,198,151,0,0 // mulps 0x97c6(%edx),%xmm0 .byte 102,15,91,192 // cvtps2dq %xmm0,%xmm0 .byte 243,15,16,105,20 // movss 0x14(%ecx),%xmm5 .byte 15,198,237,0 // shufps $0x0,%xmm5,%xmm5 @@ -58969,15 +58953,15 @@ _sk_parametric_a_sse2: .byte 15,198,237,0 // shufps $0x0,%xmm5,%xmm5 .byte 15,88,245 // addps %xmm5,%xmm6 .byte 15,91,238 // cvtdq2ps %xmm6,%xmm5 - .byte 15,89,170,18,150,0,0 // mulps 0x9612(%edx),%xmm5 - .byte 15,84,178,34,150,0,0 // andps 0x9622(%edx),%xmm6 - .byte 15,86,178,130,147,0,0 // orps 0x9382(%edx),%xmm6 - .byte 15,88,170,50,150,0,0 // addps 0x9632(%edx),%xmm5 - .byte 15,40,186,66,150,0,0 // movaps 0x9642(%edx),%xmm7 + .byte 15,89,170,242,149,0,0 // mulps 0x95f2(%edx),%xmm5 + .byte 15,84,178,2,150,0,0 // andps 0x9602(%edx),%xmm6 + .byte 15,86,178,98,147,0,0 // orps 0x9362(%edx),%xmm6 + .byte 15,88,170,18,150,0,0 // addps 0x9612(%edx),%xmm5 + .byte 15,40,186,34,150,0,0 // movaps 0x9622(%edx),%xmm7 .byte 15,89,254 // mulps %xmm6,%xmm7 .byte 15,92,239 // subps %xmm7,%xmm5 - .byte 15,88,178,82,150,0,0 // addps 0x9652(%edx),%xmm6 - .byte 15,40,186,98,150,0,0 // movaps 0x9662(%edx),%xmm7 + .byte 15,88,178,50,150,0,0 // addps 0x9632(%edx),%xmm6 + .byte 15,40,186,66,150,0,0 // movaps 0x9642(%edx),%xmm7 .byte 15,94,254 // divps %xmm6,%xmm7 .byte 243,15,16,49 // movss (%ecx),%xmm6 .byte 15,198,246,0 // shufps $0x0,%xmm6,%xmm6 @@ -58987,21 +58971,21 @@ _sk_parametric_a_sse2: .byte 15,91,254 // cvtdq2ps %xmm6,%xmm7 .byte 15,40,197 // movaps %xmm5,%xmm0 .byte 15,194,199,1 // cmpltps %xmm7,%xmm0 - .byte 15,40,178,146,147,0,0 // movaps 0x9392(%edx),%xmm6 + .byte 15,40,178,114,147,0,0 // movaps 0x9372(%edx),%xmm6 .byte 15,84,198 // andps %xmm6,%xmm0 .byte 15,92,248 // subps %xmm0,%xmm7 .byte 15,40,197 // movaps %xmm5,%xmm0 .byte 15,92,199 // subps %xmm7,%xmm0 - .byte 15,88,170,114,150,0,0 // addps 0x9672(%edx),%xmm5 - .byte 15,40,186,130,150,0,0 // movaps 0x9682(%edx),%xmm7 + .byte 15,88,170,82,150,0,0 // addps 0x9652(%edx),%xmm5 + .byte 15,40,186,98,150,0,0 // movaps 0x9662(%edx),%xmm7 .byte 15,89,248 // mulps %xmm0,%xmm7 .byte 15,92,239 // subps %xmm7,%xmm5 - .byte 15,40,186,146,150,0,0 // movaps 0x9692(%edx),%xmm7 + .byte 15,40,186,114,150,0,0 // movaps 0x9672(%edx),%xmm7 .byte 15,92,248 // subps %xmm0,%xmm7 - .byte 15,40,130,162,150,0,0 // movaps 0x96a2(%edx),%xmm0 + .byte 15,40,130,130,150,0,0 // movaps 0x9682(%edx),%xmm0 .byte 15,94,199 // divps %xmm7,%xmm0 .byte 15,88,197 // addps %xmm5,%xmm0 - .byte 15,89,130,178,150,0,0 // mulps 0x96b2(%edx),%xmm0 + .byte 15,89,130,146,150,0,0 // mulps 0x9692(%edx),%xmm0 .byte 102,15,91,192 // cvtps2dq %xmm0,%xmm0 .byte 243,15,16,105,20 // movss 0x14(%ecx),%xmm5 .byte 15,198,237,0 // shufps $0x0,%xmm5,%xmm5 @@ -59036,15 +59020,15 @@ _sk_gamma_sse2: .byte 232,0,0,0,0 // call 3a7f <_sk_gamma_sse2+0x12> .byte 88 // pop %eax .byte 15,91,195 // cvtdq2ps %xmm3,%xmm0 - .byte 15,89,128,225,148,0,0 // mulps 0x94e1(%eax),%xmm0 - .byte 15,84,152,241,148,0,0 // andps 0x94f1(%eax),%xmm3 - .byte 15,86,152,81,146,0,0 // orps 0x9251(%eax),%xmm3 - .byte 15,88,128,1,149,0,0 // addps 0x9501(%eax),%xmm0 + .byte 15,89,128,193,148,0,0 // mulps 0x94c1(%eax),%xmm0 + .byte 15,84,152,209,148,0,0 // andps 0x94d1(%eax),%xmm3 + .byte 15,86,152,49,146,0,0 // orps 0x9231(%eax),%xmm3 + .byte 15,88,128,225,148,0,0 // addps 0x94e1(%eax),%xmm0 .byte 15,40,227 // movaps %xmm3,%xmm4 - .byte 15,89,160,17,149,0,0 // mulps 0x9511(%eax),%xmm4 + .byte 15,89,160,241,148,0,0 // mulps 0x94f1(%eax),%xmm4 .byte 15,92,196 // subps %xmm4,%xmm0 - .byte 15,88,152,33,149,0,0 // addps 0x9521(%eax),%xmm3 - .byte 15,40,160,49,149,0,0 // movaps 0x9531(%eax),%xmm4 + .byte 15,88,152,1,149,0,0 // addps 0x9501(%eax),%xmm3 + .byte 15,40,160,17,149,0,0 // movaps 0x9511(%eax),%xmm4 .byte 15,94,227 // divps %xmm3,%xmm4 .byte 15,92,196 // subps %xmm4,%xmm0 .byte 139,77,12 // mov 0xc(%ebp),%ecx @@ -59057,30 +59041,30 @@ _sk_gamma_sse2: .byte 15,91,219 // cvtdq2ps %xmm3,%xmm3 .byte 15,40,224 // movaps %xmm0,%xmm4 .byte 15,194,227,1 // cmpltps %xmm3,%xmm4 - .byte 15,84,160,97,146,0,0 // andps 0x9261(%eax),%xmm4 + .byte 15,84,160,65,146,0,0 // andps 0x9241(%eax),%xmm4 .byte 15,92,220 // subps %xmm4,%xmm3 .byte 15,40,224 // movaps %xmm0,%xmm4 .byte 15,92,227 // subps %xmm3,%xmm4 - .byte 15,88,128,65,149,0,0 // addps 0x9541(%eax),%xmm0 - .byte 15,40,176,97,149,0,0 // movaps 0x9561(%eax),%xmm6 + .byte 15,88,128,33,149,0,0 // addps 0x9521(%eax),%xmm0 + .byte 15,40,176,65,149,0,0 // movaps 0x9541(%eax),%xmm6 .byte 15,92,244 // subps %xmm4,%xmm6 - .byte 15,40,168,81,149,0,0 // movaps 0x9551(%eax),%xmm5 + .byte 15,40,168,49,149,0,0 // movaps 0x9531(%eax),%xmm5 .byte 15,89,229 // mulps %xmm5,%xmm4 .byte 15,92,196 // subps %xmm4,%xmm0 - .byte 15,40,152,113,149,0,0 // movaps 0x9571(%eax),%xmm3 + .byte 15,40,152,81,149,0,0 // movaps 0x9551(%eax),%xmm3 .byte 15,40,227 // movaps %xmm3,%xmm4 .byte 15,94,230 // divps %xmm6,%xmm4 .byte 15,88,224 // addps %xmm0,%xmm4 .byte 15,91,193 // cvtdq2ps %xmm1,%xmm0 - .byte 15,89,128,225,148,0,0 // mulps 0x94e1(%eax),%xmm0 - .byte 15,84,136,241,148,0,0 // andps 0x94f1(%eax),%xmm1 - .byte 15,86,136,81,146,0,0 // orps 0x9251(%eax),%xmm1 - .byte 15,88,128,1,149,0,0 // addps 0x9501(%eax),%xmm0 + .byte 15,89,128,193,148,0,0 // mulps 0x94c1(%eax),%xmm0 + .byte 15,84,136,209,148,0,0 // andps 0x94d1(%eax),%xmm1 + .byte 15,86,136,49,146,0,0 // orps 0x9231(%eax),%xmm1 + .byte 15,88,128,225,148,0,0 // addps 0x94e1(%eax),%xmm0 .byte 15,40,241 // movaps %xmm1,%xmm6 - .byte 15,89,176,17,149,0,0 // mulps 0x9511(%eax),%xmm6 + .byte 15,89,176,241,148,0,0 // mulps 0x94f1(%eax),%xmm6 .byte 15,92,198 // subps %xmm6,%xmm0 - .byte 15,88,136,33,149,0,0 // addps 0x9521(%eax),%xmm1 - .byte 15,40,176,49,149,0,0 // movaps 0x9531(%eax),%xmm6 + .byte 15,88,136,1,149,0,0 // addps 0x9501(%eax),%xmm1 + .byte 15,40,176,17,149,0,0 // movaps 0x9511(%eax),%xmm6 .byte 15,94,241 // divps %xmm1,%xmm6 .byte 15,92,198 // subps %xmm6,%xmm0 .byte 15,89,199 // mulps %xmm7,%xmm0 @@ -59088,12 +59072,12 @@ _sk_gamma_sse2: .byte 15,91,201 // cvtdq2ps %xmm1,%xmm1 .byte 15,40,240 // movaps %xmm0,%xmm6 .byte 15,194,241,1 // cmpltps %xmm1,%xmm6 - .byte 15,84,176,97,146,0,0 // andps 0x9261(%eax),%xmm6 + .byte 15,84,176,65,146,0,0 // andps 0x9241(%eax),%xmm6 .byte 15,92,206 // subps %xmm6,%xmm1 .byte 15,40,240 // movaps %xmm0,%xmm6 .byte 15,92,241 // subps %xmm1,%xmm6 - .byte 15,88,128,65,149,0,0 // addps 0x9541(%eax),%xmm0 - .byte 15,40,184,97,149,0,0 // movaps 0x9561(%eax),%xmm7 + .byte 15,88,128,33,149,0,0 // addps 0x9521(%eax),%xmm0 + .byte 15,40,184,65,149,0,0 // movaps 0x9541(%eax),%xmm7 .byte 15,92,254 // subps %xmm6,%xmm7 .byte 15,89,245 // mulps %xmm5,%xmm6 .byte 15,92,198 // subps %xmm6,%xmm0 @@ -59101,15 +59085,15 @@ _sk_gamma_sse2: .byte 15,94,207 // divps %xmm7,%xmm1 .byte 15,88,200 // addps %xmm0,%xmm1 .byte 15,91,194 // cvtdq2ps %xmm2,%xmm0 - .byte 15,89,128,225,148,0,0 // mulps 0x94e1(%eax),%xmm0 - .byte 15,84,144,241,148,0,0 // andps 0x94f1(%eax),%xmm2 - .byte 15,86,144,81,146,0,0 // orps 0x9251(%eax),%xmm2 - .byte 15,88,128,1,149,0,0 // addps 0x9501(%eax),%xmm0 - .byte 15,40,176,17,149,0,0 // movaps 0x9511(%eax),%xmm6 + .byte 15,89,128,193,148,0,0 // mulps 0x94c1(%eax),%xmm0 + .byte 15,84,144,209,148,0,0 // andps 0x94d1(%eax),%xmm2 + .byte 15,86,144,49,146,0,0 // orps 0x9231(%eax),%xmm2 + .byte 15,88,128,225,148,0,0 // addps 0x94e1(%eax),%xmm0 + .byte 15,40,176,241,148,0,0 // movaps 0x94f1(%eax),%xmm6 .byte 15,89,242 // mulps %xmm2,%xmm6 .byte 15,92,198 // subps %xmm6,%xmm0 - .byte 15,88,144,33,149,0,0 // addps 0x9521(%eax),%xmm2 - .byte 15,40,176,49,149,0,0 // movaps 0x9531(%eax),%xmm6 + .byte 15,88,144,1,149,0,0 // addps 0x9501(%eax),%xmm2 + .byte 15,40,176,17,149,0,0 // movaps 0x9511(%eax),%xmm6 .byte 15,94,242 // divps %xmm2,%xmm6 .byte 15,92,198 // subps %xmm6,%xmm0 .byte 15,89,69,232 // mulps -0x18(%ebp),%xmm0 @@ -59117,18 +59101,18 @@ _sk_gamma_sse2: .byte 15,91,210 // cvtdq2ps %xmm2,%xmm2 .byte 15,40,240 // movaps %xmm0,%xmm6 .byte 15,194,242,1 // cmpltps %xmm2,%xmm6 - .byte 15,84,176,97,146,0,0 // andps 0x9261(%eax),%xmm6 + .byte 15,84,176,65,146,0,0 // andps 0x9241(%eax),%xmm6 .byte 15,92,214 // subps %xmm6,%xmm2 .byte 15,40,240 // movaps %xmm0,%xmm6 .byte 15,92,242 // subps %xmm2,%xmm6 - .byte 15,88,128,65,149,0,0 // addps 0x9541(%eax),%xmm0 + .byte 15,88,128,33,149,0,0 // addps 0x9521(%eax),%xmm0 .byte 15,89,238 // mulps %xmm6,%xmm5 .byte 15,92,197 // subps %xmm5,%xmm0 - .byte 15,40,144,97,149,0,0 // movaps 0x9561(%eax),%xmm2 + .byte 15,40,144,65,149,0,0 // movaps 0x9541(%eax),%xmm2 .byte 15,92,214 // subps %xmm6,%xmm2 .byte 15,94,218 // divps %xmm2,%xmm3 .byte 15,88,216 // addps %xmm0,%xmm3 - .byte 15,40,128,129,149,0,0 // movaps 0x9581(%eax),%xmm0 + .byte 15,40,128,97,149,0,0 // movaps 0x9561(%eax),%xmm0 .byte 15,89,224 // mulps %xmm0,%xmm4 .byte 15,89,200 // mulps %xmm0,%xmm1 .byte 15,89,216 // mulps %xmm0,%xmm3 @@ -59157,29 +59141,29 @@ _sk_lab_to_xyz_sse2: .byte 15,40,208 // movaps %xmm0,%xmm2 .byte 232,0,0,0,0 // call 3c67 <_sk_lab_to_xyz_sse2+0x15> .byte 88 // pop %eax - .byte 15,89,144,169,147,0,0 // mulps 0x93a9(%eax),%xmm2 - .byte 15,40,160,73,145,0,0 // movaps 0x9149(%eax),%xmm4 + .byte 15,89,144,137,147,0,0 // mulps 0x9389(%eax),%xmm2 + .byte 15,40,160,41,145,0,0 // movaps 0x9129(%eax),%xmm4 .byte 15,89,204 // mulps %xmm4,%xmm1 - .byte 15,40,168,185,147,0,0 // movaps 0x93b9(%eax),%xmm5 + .byte 15,40,168,153,147,0,0 // movaps 0x9399(%eax),%xmm5 .byte 15,88,205 // addps %xmm5,%xmm1 .byte 15,89,220 // mulps %xmm4,%xmm3 .byte 15,88,221 // addps %xmm5,%xmm3 - .byte 15,88,144,201,147,0,0 // addps 0x93c9(%eax),%xmm2 - .byte 15,89,144,217,147,0,0 // mulps 0x93d9(%eax),%xmm2 - .byte 15,89,136,233,147,0,0 // mulps 0x93e9(%eax),%xmm1 + .byte 15,88,144,169,147,0,0 // addps 0x93a9(%eax),%xmm2 + .byte 15,89,144,185,147,0,0 // mulps 0x93b9(%eax),%xmm2 + .byte 15,89,136,201,147,0,0 // mulps 0x93c9(%eax),%xmm1 .byte 15,88,202 // addps %xmm2,%xmm1 - .byte 15,89,152,249,147,0,0 // mulps 0x93f9(%eax),%xmm3 + .byte 15,89,152,217,147,0,0 // mulps 0x93d9(%eax),%xmm3 .byte 15,40,234 // movaps %xmm2,%xmm5 .byte 15,92,235 // subps %xmm3,%xmm5 .byte 15,40,193 // movaps %xmm1,%xmm0 .byte 15,89,192 // mulps %xmm0,%xmm0 .byte 15,89,193 // mulps %xmm1,%xmm0 - .byte 15,40,152,9,148,0,0 // movaps 0x9409(%eax),%xmm3 + .byte 15,40,152,233,147,0,0 // movaps 0x93e9(%eax),%xmm3 .byte 15,40,227 // movaps %xmm3,%xmm4 .byte 15,194,224,1 // cmpltps %xmm0,%xmm4 - .byte 15,40,176,25,148,0,0 // movaps 0x9419(%eax),%xmm6 + .byte 15,40,176,249,147,0,0 // movaps 0x93f9(%eax),%xmm6 .byte 15,88,206 // addps %xmm6,%xmm1 - .byte 15,40,184,41,148,0,0 // movaps 0x9429(%eax),%xmm7 + .byte 15,40,184,9,148,0,0 // movaps 0x9409(%eax),%xmm7 .byte 15,89,207 // mulps %xmm7,%xmm1 .byte 15,84,196 // andps %xmm4,%xmm0 .byte 15,85,225 // andnps %xmm1,%xmm4 @@ -59204,8 +59188,8 @@ _sk_lab_to_xyz_sse2: .byte 15,85,221 // andnps %xmm5,%xmm3 .byte 15,86,216 // orps %xmm0,%xmm3 .byte 139,77,12 // mov 0xc(%ebp),%ecx - .byte 15,89,160,57,148,0,0 // mulps 0x9439(%eax),%xmm4 - .byte 15,89,152,73,148,0,0 // mulps 0x9449(%eax),%xmm3 + .byte 15,89,160,25,148,0,0 // mulps 0x9419(%eax),%xmm4 + .byte 15,89,152,41,148,0,0 // mulps 0x9429(%eax),%xmm3 .byte 141,65,4 // lea 0x4(%ecx),%eax .byte 131,236,8 // sub $0x8,%esp .byte 15,40,196 // movaps %xmm4,%xmm0 @@ -59243,9 +59227,9 @@ _sk_load_a8_sse2: .byte 102,15,110,4,62 // movd (%esi,%edi,1),%xmm0 .byte 102,15,96,192 // punpcklbw %xmm0,%xmm0 .byte 102,15,97,192 // punpcklwd %xmm0,%xmm0 - .byte 102,15,219,130,73,144,0,0 // pand 0x9049(%edx),%xmm0 + .byte 102,15,219,130,41,144,0,0 // pand 0x9029(%edx),%xmm0 .byte 15,91,216 // cvtdq2ps %xmm0,%xmm3 - .byte 15,89,154,121,145,0,0 // mulps 0x9179(%edx),%xmm3 + .byte 15,89,154,89,145,0,0 // mulps 0x9159(%edx),%xmm3 .byte 141,80,8 // lea 0x8(%eax),%edx .byte 131,236,8 // sub $0x8,%esp .byte 15,87,192 // xorps %xmm0,%xmm0 @@ -59293,8 +59277,8 @@ _sk_load_a8_dst_sse2: .byte 131,236,12 // sub $0xc,%esp .byte 139,69,12 // mov 0xc(%ebp),%eax .byte 139,77,8 // mov 0x8(%ebp),%ecx - .byte 139,49 // mov (%ecx),%esi .byte 139,16 // mov (%eax),%edx + .byte 139,49 // mov (%ecx),%esi .byte 139,122,4 // mov 0x4(%edx),%edi .byte 15,175,121,4 // imul 0x4(%ecx),%edi .byte 3,58 // add (%edx),%edi @@ -59310,9 +59294,9 @@ _sk_load_a8_dst_sse2: .byte 102,15,110,36,55 // movd (%edi,%esi,1),%xmm4 .byte 102,15,96,224 // punpcklbw %xmm0,%xmm4 .byte 102,15,97,224 // punpcklwd %xmm0,%xmm4 - .byte 102,15,219,162,117,143,0,0 // pand 0x8f75(%edx),%xmm4 + .byte 102,15,219,162,85,143,0,0 // pand 0x8f55(%edx),%xmm4 .byte 15,91,228 // cvtdq2ps %xmm4,%xmm4 - .byte 15,89,162,165,144,0,0 // mulps 0x90a5(%edx),%xmm4 + .byte 15,89,162,133,144,0,0 // mulps 0x9085(%edx),%xmm4 .byte 15,41,97,64 // movaps %xmm4,0x40(%ecx) .byte 141,80,8 // lea 0x8(%eax),%edx .byte 131,236,8 // sub $0x8,%esp @@ -59403,7 +59387,7 @@ _sk_gather_a8_sse2: .byte 102,15,96,193 // punpcklbw %xmm1,%xmm0 .byte 102,15,97,193 // punpcklwd %xmm1,%xmm0 .byte 15,91,216 // cvtdq2ps %xmm0,%xmm3 - .byte 15,89,153,120,143,0,0 // mulps 0x8f78(%ecx),%xmm3 + .byte 15,89,153,88,143,0,0 // mulps 0x8f58(%ecx),%xmm3 .byte 141,72,8 // lea 0x8(%eax),%ecx .byte 131,236,8 // sub $0x8,%esp .byte 15,87,192 // xorps %xmm0,%xmm0 @@ -59437,7 +59421,7 @@ _sk_store_a8_sse2: .byte 15,175,81,4 // imul 0x4(%ecx),%edx .byte 3,23 // add (%edi),%edx .byte 139,89,8 // mov 0x8(%ecx),%ebx - .byte 15,40,166,20,142,0,0 // movaps 0x8e14(%esi),%xmm4 + .byte 15,40,166,244,141,0,0 // movaps 0x8df4(%esi),%xmm4 .byte 15,89,227 // mulps %xmm3,%xmm4 .byte 102,15,91,228 // cvtps2dq %xmm4,%xmm4 .byte 102,15,114,244,16 // pslld $0x10,%xmm4 @@ -59472,7 +59456,7 @@ _sk_store_a8_sse2: .byte 102,15,197,220,4 // pextrw $0x4,%xmm4,%ebx .byte 136,92,58,2 // mov %bl,0x2(%edx,%edi,1) .byte 102,15,112,228,212 // pshufd $0xd4,%xmm4,%xmm4 - .byte 102,15,219,166,36,145,0,0 // pand 0x9124(%esi),%xmm4 + .byte 102,15,219,166,4,145,0,0 // pand 0x9104(%esi),%xmm4 .byte 102,15,103,228 // packuswb %xmm4,%xmm4 .byte 102,15,103,228 // packuswb %xmm4,%xmm4 .byte 102,15,103,228 // packuswb %xmm4,%xmm4 @@ -59508,12 +59492,12 @@ _sk_load_g8_sse2: .byte 102,15,110,4,62 // movd (%esi,%edi,1),%xmm0 .byte 102,15,96,192 // punpcklbw %xmm0,%xmm0 .byte 102,15,97,192 // punpcklwd %xmm0,%xmm0 - .byte 102,15,219,130,82,141,0,0 // pand 0x8d52(%edx),%xmm0 + .byte 102,15,219,130,50,141,0,0 // pand 0x8d32(%edx),%xmm0 .byte 15,91,192 // cvtdq2ps %xmm0,%xmm0 - .byte 15,89,130,130,142,0,0 // mulps 0x8e82(%edx),%xmm0 + .byte 15,89,130,98,142,0,0 // mulps 0x8e62(%edx),%xmm0 .byte 141,112,8 // lea 0x8(%eax),%esi .byte 131,236,8 // sub $0x8,%esp - .byte 15,40,154,146,140,0,0 // movaps 0x8c92(%edx),%xmm3 + .byte 15,40,154,114,140,0,0 // movaps 0x8c72(%edx),%xmm3 .byte 15,40,200 // movaps %xmm0,%xmm1 .byte 15,40,208 // movaps %xmm0,%xmm2 .byte 86 // push %esi @@ -59571,13 +59555,13 @@ _sk_load_g8_dst_sse2: .byte 102,15,110,36,62 // movd (%esi,%edi,1),%xmm4 .byte 102,15,96,224 // punpcklbw %xmm0,%xmm4 .byte 102,15,97,224 // punpcklwd %xmm0,%xmm4 - .byte 102,15,219,162,166,140,0,0 // pand 0x8ca6(%edx),%xmm4 + .byte 102,15,219,162,134,140,0,0 // pand 0x8c86(%edx),%xmm4 .byte 15,91,228 // cvtdq2ps %xmm4,%xmm4 - .byte 15,89,162,214,141,0,0 // mulps 0x8dd6(%edx),%xmm4 + .byte 15,89,162,182,141,0,0 // mulps 0x8db6(%edx),%xmm4 .byte 15,41,97,48 // movaps %xmm4,0x30(%ecx) .byte 15,41,97,32 // movaps %xmm4,0x20(%ecx) .byte 15,41,97,16 // movaps %xmm4,0x10(%ecx) - .byte 15,40,162,230,139,0,0 // movaps 0x8be6(%edx),%xmm4 + .byte 15,40,162,198,139,0,0 // movaps 0x8bc6(%edx),%xmm4 .byte 15,41,97,64 // movaps %xmm4,0x40(%ecx) .byte 141,80,8 // lea 0x8(%eax),%edx .byte 131,236,8 // sub $0x8,%esp @@ -59669,10 +59653,10 @@ _sk_gather_g8_sse2: .byte 102,15,96,193 // punpcklbw %xmm1,%xmm0 .byte 102,15,97,193 // punpcklwd %xmm1,%xmm0 .byte 15,91,192 // cvtdq2ps %xmm0,%xmm0 - .byte 15,89,129,127,140,0,0 // mulps 0x8c7f(%ecx),%xmm0 + .byte 15,89,129,95,140,0,0 // mulps 0x8c5f(%ecx),%xmm0 .byte 141,80,8 // lea 0x8(%eax),%edx .byte 131,236,8 // sub $0x8,%esp - .byte 15,40,153,143,138,0,0 // movaps 0x8a8f(%ecx),%xmm3 + .byte 15,40,153,111,138,0,0 // movaps 0x8a6f(%ecx),%xmm3 .byte 15,40,200 // movaps %xmm0,%xmm1 .byte 15,40,208 // movaps %xmm0,%xmm2 .byte 82 // push %edx @@ -59709,20 +59693,20 @@ _sk_load_565_sse2: .byte 117,97 // jne 431a <_sk_load_565_sse2+0x8c> .byte 243,15,126,20,126 // movq (%esi,%edi,2),%xmm2 .byte 102,15,97,208 // punpcklwd %xmm0,%xmm2 - .byte 102,15,111,130,68,140,0,0 // movdqa 0x8c44(%edx),%xmm0 + .byte 102,15,111,130,36,140,0,0 // movdqa 0x8c24(%edx),%xmm0 .byte 102,15,219,194 // pand %xmm2,%xmm0 .byte 15,91,192 // cvtdq2ps %xmm0,%xmm0 - .byte 15,89,130,84,140,0,0 // mulps 0x8c54(%edx),%xmm0 - .byte 102,15,111,138,100,140,0,0 // movdqa 0x8c64(%edx),%xmm1 + .byte 15,89,130,52,140,0,0 // mulps 0x8c34(%edx),%xmm0 + .byte 102,15,111,138,68,140,0,0 // movdqa 0x8c44(%edx),%xmm1 .byte 102,15,219,202 // pand %xmm2,%xmm1 .byte 15,91,201 // cvtdq2ps %xmm1,%xmm1 - .byte 15,89,138,116,140,0,0 // mulps 0x8c74(%edx),%xmm1 - .byte 102,15,219,146,132,140,0,0 // pand 0x8c84(%edx),%xmm2 + .byte 15,89,138,84,140,0,0 // mulps 0x8c54(%edx),%xmm1 + .byte 102,15,219,146,100,140,0,0 // pand 0x8c64(%edx),%xmm2 .byte 15,91,210 // cvtdq2ps %xmm2,%xmm2 - .byte 15,89,146,148,140,0,0 // mulps 0x8c94(%edx),%xmm2 + .byte 15,89,146,116,140,0,0 // mulps 0x8c74(%edx),%xmm2 .byte 141,112,8 // lea 0x8(%eax),%esi .byte 131,236,8 // sub $0x8,%esp - .byte 15,40,154,68,138,0,0 // movaps 0x8a44(%edx),%xmm3 + .byte 15,40,154,36,138,0,0 // movaps 0x8a24(%edx),%xmm3 .byte 86 // push %esi .byte 81 // push %ecx .byte 255,80,4 // call *0x4(%eax) @@ -59776,21 +59760,21 @@ _sk_load_565_dst_sse2: .byte 117,113 // jne 43fa <_sk_load_565_dst_sse2+0x9c> .byte 243,15,126,36,126 // movq (%esi,%edi,2),%xmm4 .byte 102,15,97,224 // punpcklwd %xmm0,%xmm4 - .byte 102,15,111,170,116,139,0,0 // movdqa 0x8b74(%edx),%xmm5 + .byte 102,15,111,170,84,139,0,0 // movdqa 0x8b54(%edx),%xmm5 .byte 102,15,219,236 // pand %xmm4,%xmm5 .byte 15,91,237 // cvtdq2ps %xmm5,%xmm5 - .byte 15,89,170,132,139,0,0 // mulps 0x8b84(%edx),%xmm5 + .byte 15,89,170,100,139,0,0 // mulps 0x8b64(%edx),%xmm5 .byte 15,41,105,16 // movaps %xmm5,0x10(%ecx) - .byte 102,15,111,170,148,139,0,0 // movdqa 0x8b94(%edx),%xmm5 + .byte 102,15,111,170,116,139,0,0 // movdqa 0x8b74(%edx),%xmm5 .byte 102,15,219,236 // pand %xmm4,%xmm5 .byte 15,91,237 // cvtdq2ps %xmm5,%xmm5 - .byte 15,89,170,164,139,0,0 // mulps 0x8ba4(%edx),%xmm5 + .byte 15,89,170,132,139,0,0 // mulps 0x8b84(%edx),%xmm5 .byte 15,41,105,32 // movaps %xmm5,0x20(%ecx) - .byte 102,15,219,162,180,139,0,0 // pand 0x8bb4(%edx),%xmm4 + .byte 102,15,219,162,148,139,0,0 // pand 0x8b94(%edx),%xmm4 .byte 15,91,228 // cvtdq2ps %xmm4,%xmm4 - .byte 15,89,162,196,139,0,0 // mulps 0x8bc4(%edx),%xmm4 + .byte 15,89,162,164,139,0,0 // mulps 0x8ba4(%edx),%xmm4 .byte 15,41,97,48 // movaps %xmm4,0x30(%ecx) - .byte 15,40,162,116,137,0,0 // movaps 0x8974(%edx),%xmm4 + .byte 15,40,162,84,137,0,0 // movaps 0x8954(%edx),%xmm4 .byte 15,41,97,64 // movaps %xmm4,0x40(%ecx) .byte 141,80,8 // lea 0x8(%eax),%edx .byte 131,236,8 // sub $0x8,%esp @@ -59875,20 +59859,20 @@ _sk_gather_565_sse2: .byte 102,15,239,192 // pxor %xmm0,%xmm0 .byte 102,15,196,209,3 // pinsrw $0x3,%ecx,%xmm2 .byte 102,15,97,208 // punpcklwd %xmm0,%xmm2 - .byte 102,15,111,130,242,137,0,0 // movdqa 0x89f2(%edx),%xmm0 + .byte 102,15,111,130,210,137,0,0 // movdqa 0x89d2(%edx),%xmm0 .byte 102,15,219,194 // pand %xmm2,%xmm0 .byte 15,91,192 // cvtdq2ps %xmm0,%xmm0 - .byte 15,89,130,2,138,0,0 // mulps 0x8a02(%edx),%xmm0 - .byte 102,15,111,138,18,138,0,0 // movdqa 0x8a12(%edx),%xmm1 + .byte 15,89,130,226,137,0,0 // mulps 0x89e2(%edx),%xmm0 + .byte 102,15,111,138,242,137,0,0 // movdqa 0x89f2(%edx),%xmm1 .byte 102,15,219,202 // pand %xmm2,%xmm1 .byte 15,91,201 // cvtdq2ps %xmm1,%xmm1 - .byte 15,89,138,34,138,0,0 // mulps 0x8a22(%edx),%xmm1 - .byte 102,15,219,146,50,138,0,0 // pand 0x8a32(%edx),%xmm2 + .byte 15,89,138,2,138,0,0 // mulps 0x8a02(%edx),%xmm1 + .byte 102,15,219,146,18,138,0,0 // pand 0x8a12(%edx),%xmm2 .byte 15,91,210 // cvtdq2ps %xmm2,%xmm2 - .byte 15,89,146,66,138,0,0 // mulps 0x8a42(%edx),%xmm2 + .byte 15,89,146,34,138,0,0 // mulps 0x8a22(%edx),%xmm2 .byte 141,72,8 // lea 0x8(%eax),%ecx .byte 131,236,8 // sub $0x8,%esp - .byte 15,40,154,242,135,0,0 // movaps 0x87f2(%edx),%xmm3 + .byte 15,40,154,210,135,0,0 // movaps 0x87d2(%edx),%xmm3 .byte 81 // push %ecx .byte 255,117,8 // pushl 0x8(%ebp) .byte 255,80,4 // call *0x4(%eax) @@ -59916,8 +59900,8 @@ _sk_store_565_sse2: .byte 1,210 // add %edx,%edx .byte 3,22 // add (%esi),%edx .byte 139,49 // mov (%ecx),%esi - .byte 15,40,167,111,139,0,0 // movaps 0x8b6f(%edi),%xmm4 - .byte 15,40,175,127,139,0,0 // movaps 0x8b7f(%edi),%xmm5 + .byte 15,40,167,79,139,0,0 // movaps 0x8b4f(%edi),%xmm4 + .byte 15,40,175,95,139,0,0 // movaps 0x8b5f(%edi),%xmm5 .byte 139,89,8 // mov 0x8(%ecx),%ebx .byte 15,40,240 // movaps %xmm0,%xmm6 .byte 15,89,244 // mulps %xmm4,%xmm6 @@ -59997,21 +59981,21 @@ _sk_load_4444_sse2: .byte 117,112 // jne 46d0 <_sk_load_4444_sse2+0x9b> .byte 243,15,126,28,126 // movq (%esi,%edi,2),%xmm3 .byte 102,15,97,216 // punpcklwd %xmm0,%xmm3 - .byte 102,15,111,130,173,138,0,0 // movdqa 0x8aad(%edx),%xmm0 + .byte 102,15,111,130,141,138,0,0 // movdqa 0x8a8d(%edx),%xmm0 .byte 102,15,219,195 // pand %xmm3,%xmm0 .byte 15,91,192 // cvtdq2ps %xmm0,%xmm0 - .byte 15,89,130,189,138,0,0 // mulps 0x8abd(%edx),%xmm0 - .byte 102,15,111,138,205,138,0,0 // movdqa 0x8acd(%edx),%xmm1 + .byte 15,89,130,157,138,0,0 // mulps 0x8a9d(%edx),%xmm0 + .byte 102,15,111,138,173,138,0,0 // movdqa 0x8aad(%edx),%xmm1 .byte 102,15,219,203 // pand %xmm3,%xmm1 .byte 15,91,201 // cvtdq2ps %xmm1,%xmm1 - .byte 15,89,138,221,138,0,0 // mulps 0x8add(%edx),%xmm1 - .byte 102,15,111,146,237,138,0,0 // movdqa 0x8aed(%edx),%xmm2 + .byte 15,89,138,189,138,0,0 // mulps 0x8abd(%edx),%xmm1 + .byte 102,15,111,146,205,138,0,0 // movdqa 0x8acd(%edx),%xmm2 .byte 102,15,219,211 // pand %xmm3,%xmm2 .byte 15,91,210 // cvtdq2ps %xmm2,%xmm2 - .byte 15,89,146,253,138,0,0 // mulps 0x8afd(%edx),%xmm2 - .byte 102,15,219,154,13,139,0,0 // pand 0x8b0d(%edx),%xmm3 + .byte 15,89,146,221,138,0,0 // mulps 0x8add(%edx),%xmm2 + .byte 102,15,219,154,237,138,0,0 // pand 0x8aed(%edx),%xmm3 .byte 15,91,219 // cvtdq2ps %xmm3,%xmm3 - .byte 15,89,154,29,139,0,0 // mulps 0x8b1d(%edx),%xmm3 + .byte 15,89,154,253,138,0,0 // mulps 0x8afd(%edx),%xmm3 .byte 141,80,8 // lea 0x8(%eax),%edx .byte 131,236,8 // sub $0x8,%esp .byte 82 // push %edx @@ -60067,24 +60051,24 @@ _sk_load_4444_dst_sse2: .byte 15,133,128,0,0,0 // jne 47c3 <_sk_load_4444_dst_sse2+0xaf> .byte 243,15,126,36,126 // movq (%esi,%edi,2),%xmm4 .byte 102,15,97,224 // punpcklwd %xmm0,%xmm4 - .byte 102,15,111,170,206,137,0,0 // movdqa 0x89ce(%edx),%xmm5 + .byte 102,15,111,170,174,137,0,0 // movdqa 0x89ae(%edx),%xmm5 .byte 102,15,219,236 // pand %xmm4,%xmm5 .byte 15,91,237 // cvtdq2ps %xmm5,%xmm5 - .byte 15,89,170,222,137,0,0 // mulps 0x89de(%edx),%xmm5 + .byte 15,89,170,190,137,0,0 // mulps 0x89be(%edx),%xmm5 .byte 15,41,105,16 // movaps %xmm5,0x10(%ecx) - .byte 102,15,111,170,238,137,0,0 // movdqa 0x89ee(%edx),%xmm5 + .byte 102,15,111,170,206,137,0,0 // movdqa 0x89ce(%edx),%xmm5 .byte 102,15,219,236 // pand %xmm4,%xmm5 .byte 15,91,237 // cvtdq2ps %xmm5,%xmm5 - .byte 15,89,170,254,137,0,0 // mulps 0x89fe(%edx),%xmm5 + .byte 15,89,170,222,137,0,0 // mulps 0x89de(%edx),%xmm5 .byte 15,41,105,32 // movaps %xmm5,0x20(%ecx) - .byte 102,15,111,170,14,138,0,0 // movdqa 0x8a0e(%edx),%xmm5 + .byte 102,15,111,170,238,137,0,0 // movdqa 0x89ee(%edx),%xmm5 .byte 102,15,219,236 // pand %xmm4,%xmm5 .byte 15,91,237 // cvtdq2ps %xmm5,%xmm5 - .byte 15,89,170,30,138,0,0 // mulps 0x8a1e(%edx),%xmm5 + .byte 15,89,170,254,137,0,0 // mulps 0x89fe(%edx),%xmm5 .byte 15,41,105,48 // movaps %xmm5,0x30(%ecx) - .byte 102,15,219,162,46,138,0,0 // pand 0x8a2e(%edx),%xmm4 + .byte 102,15,219,162,14,138,0,0 // pand 0x8a0e(%edx),%xmm4 .byte 15,91,228 // cvtdq2ps %xmm4,%xmm4 - .byte 15,89,162,62,138,0,0 // mulps 0x8a3e(%edx),%xmm4 + .byte 15,89,162,30,138,0,0 // mulps 0x8a1e(%edx),%xmm4 .byte 15,41,97,64 // movaps %xmm4,0x40(%ecx) .byte 141,80,8 // lea 0x8(%eax),%edx .byte 131,236,8 // sub $0x8,%esp @@ -60169,21 +60153,21 @@ _sk_gather_4444_sse2: .byte 89 // pop %ecx .byte 102,15,239,192 // pxor %xmm0,%xmm0 .byte 102,15,97,216 // punpcklwd %xmm0,%xmm3 - .byte 102,15,111,129,48,136,0,0 // movdqa 0x8830(%ecx),%xmm0 + .byte 102,15,111,129,16,136,0,0 // movdqa 0x8810(%ecx),%xmm0 .byte 102,15,219,195 // pand %xmm3,%xmm0 .byte 15,91,192 // cvtdq2ps %xmm0,%xmm0 - .byte 15,89,129,64,136,0,0 // mulps 0x8840(%ecx),%xmm0 - .byte 102,15,111,137,80,136,0,0 // movdqa 0x8850(%ecx),%xmm1 + .byte 15,89,129,32,136,0,0 // mulps 0x8820(%ecx),%xmm0 + .byte 102,15,111,137,48,136,0,0 // movdqa 0x8830(%ecx),%xmm1 .byte 102,15,219,203 // pand %xmm3,%xmm1 .byte 15,91,201 // cvtdq2ps %xmm1,%xmm1 - .byte 15,89,137,96,136,0,0 // mulps 0x8860(%ecx),%xmm1 - .byte 102,15,111,145,112,136,0,0 // movdqa 0x8870(%ecx),%xmm2 + .byte 15,89,137,64,136,0,0 // mulps 0x8840(%ecx),%xmm1 + .byte 102,15,111,145,80,136,0,0 // movdqa 0x8850(%ecx),%xmm2 .byte 102,15,219,211 // pand %xmm3,%xmm2 .byte 15,91,210 // cvtdq2ps %xmm2,%xmm2 - .byte 15,89,145,128,136,0,0 // mulps 0x8880(%ecx),%xmm2 - .byte 102,15,219,153,144,136,0,0 // pand 0x8890(%ecx),%xmm3 + .byte 15,89,145,96,136,0,0 // mulps 0x8860(%ecx),%xmm2 + .byte 102,15,219,153,112,136,0,0 // pand 0x8870(%ecx),%xmm3 .byte 15,91,219 // cvtdq2ps %xmm3,%xmm3 - .byte 15,89,153,160,136,0,0 // mulps 0x88a0(%ecx),%xmm3 + .byte 15,89,153,128,136,0,0 // mulps 0x8880(%ecx),%xmm3 .byte 141,72,8 // lea 0x8(%eax),%ecx .byte 131,236,8 // sub $0x8,%esp .byte 81 // push %ecx @@ -60213,7 +60197,7 @@ _sk_store_4444_sse2: .byte 1,210 // add %edx,%edx .byte 3,22 // add (%esi),%edx .byte 139,49 // mov (%ecx),%esi - .byte 15,40,167,51,136,0,0 // movaps 0x8833(%edi),%xmm4 + .byte 15,40,167,19,136,0,0 // movaps 0x8813(%edi),%xmm4 .byte 139,89,8 // mov 0x8(%ecx),%ebx .byte 15,40,232 // movaps %xmm0,%xmm5 .byte 15,89,236 // mulps %xmm4,%xmm5 @@ -60298,11 +60282,11 @@ _sk_load_8888_sse2: .byte 139,57 // mov (%ecx),%edi .byte 117,102 // jne 4ab2 <_sk_load_8888_sse2+0x92> .byte 243,15,111,28,190 // movdqu (%esi,%edi,4),%xmm3 - .byte 102,15,111,146,114,131,0,0 // movdqa 0x8372(%edx),%xmm2 + .byte 102,15,111,146,82,131,0,0 // movdqa 0x8352(%edx),%xmm2 .byte 102,15,111,195 // movdqa %xmm3,%xmm0 .byte 102,15,219,194 // pand %xmm2,%xmm0 .byte 15,91,192 // cvtdq2ps %xmm0,%xmm0 - .byte 15,40,162,162,132,0,0 // movaps 0x84a2(%edx),%xmm4 + .byte 15,40,162,130,132,0,0 // movaps 0x8482(%edx),%xmm4 .byte 15,89,196 // mulps %xmm4,%xmm0 .byte 102,15,111,203 // movdqa %xmm3,%xmm1 .byte 102,15,114,209,8 // psrld $0x8,%xmm1 @@ -60367,11 +60351,11 @@ _sk_load_8888_dst_sse2: .byte 139,57 // mov (%ecx),%edi .byte 117,118 // jne 4b89 <_sk_load_8888_dst_sse2+0xa2> .byte 243,15,111,36,190 // movdqu (%esi,%edi,4),%xmm4 - .byte 102,15,111,170,171,130,0,0 // movdqa 0x82ab(%edx),%xmm5 + .byte 102,15,111,170,139,130,0,0 // movdqa 0x828b(%edx),%xmm5 .byte 102,15,111,244 // movdqa %xmm4,%xmm6 .byte 102,15,219,245 // pand %xmm5,%xmm6 .byte 15,91,246 // cvtdq2ps %xmm6,%xmm6 - .byte 15,40,186,219,131,0,0 // movaps 0x83db(%edx),%xmm7 + .byte 15,40,186,187,131,0,0 // movaps 0x83bb(%edx),%xmm7 .byte 15,89,247 // mulps %xmm7,%xmm6 .byte 15,41,113,16 // movaps %xmm6,0x10(%ecx) .byte 102,15,111,244 // movdqa %xmm4,%xmm6 @@ -60466,11 +60450,11 @@ _sk_gather_8888_sse2: .byte 102,15,98,194 // punpckldq %xmm2,%xmm0 .byte 102,15,98,217 // punpckldq %xmm1,%xmm3 .byte 102,15,108,216 // punpcklqdq %xmm0,%xmm3 - .byte 102,15,111,145,56,129,0,0 // movdqa 0x8138(%ecx),%xmm2 + .byte 102,15,111,145,24,129,0,0 // movdqa 0x8118(%ecx),%xmm2 .byte 102,15,111,195 // movdqa %xmm3,%xmm0 .byte 102,15,219,194 // pand %xmm2,%xmm0 .byte 15,91,192 // cvtdq2ps %xmm0,%xmm0 - .byte 15,40,161,104,130,0,0 // movaps 0x8268(%ecx),%xmm4 + .byte 15,40,161,72,130,0,0 // movaps 0x8248(%ecx),%xmm4 .byte 15,89,196 // mulps %xmm4,%xmm0 .byte 102,15,111,203 // movdqa %xmm3,%xmm1 .byte 102,15,114,209,8 // psrld $0x8,%xmm1 @@ -60514,7 +60498,7 @@ _sk_store_8888_sse2: .byte 193,226,2 // shl $0x2,%edx .byte 3,22 // add (%esi),%edx .byte 139,49 // mov (%ecx),%esi - .byte 15,40,167,205,128,0,0 // movaps 0x80cd(%edi),%xmm4 + .byte 15,40,167,173,128,0,0 // movaps 0x80ad(%edi),%xmm4 .byte 139,89,8 // mov 0x8(%ecx),%ebx .byte 15,40,232 // movaps %xmm0,%xmm5 .byte 15,89,236 // mulps %xmm4,%xmm5 @@ -60585,11 +60569,11 @@ _sk_load_bgra_sse2: .byte 139,57 // mov (%ecx),%edi .byte 117,102 // jne 4e1d <_sk_load_bgra_sse2+0x92> .byte 243,15,111,28,190 // movdqu (%esi,%edi,4),%xmm3 - .byte 102,15,111,130,7,128,0,0 // movdqa 0x8007(%edx),%xmm0 + .byte 102,15,111,130,231,127,0,0 // movdqa 0x7fe7(%edx),%xmm0 .byte 102,15,111,203 // movdqa %xmm3,%xmm1 .byte 102,15,219,200 // pand %xmm0,%xmm1 .byte 15,91,209 // cvtdq2ps %xmm1,%xmm2 - .byte 15,40,162,55,129,0,0 // movaps 0x8137(%edx),%xmm4 + .byte 15,40,162,23,129,0,0 // movaps 0x8117(%edx),%xmm4 .byte 15,89,212 // mulps %xmm4,%xmm2 .byte 102,15,111,203 // movdqa %xmm3,%xmm1 .byte 102,15,114,209,8 // psrld $0x8,%xmm1 @@ -60654,11 +60638,11 @@ _sk_load_bgra_dst_sse2: .byte 139,57 // mov (%ecx),%edi .byte 117,118 // jne 4ef4 <_sk_load_bgra_dst_sse2+0xa2> .byte 243,15,111,36,190 // movdqu (%esi,%edi,4),%xmm4 - .byte 102,15,111,170,64,127,0,0 // movdqa 0x7f40(%edx),%xmm5 + .byte 102,15,111,170,32,127,0,0 // movdqa 0x7f20(%edx),%xmm5 .byte 102,15,111,244 // movdqa %xmm4,%xmm6 .byte 102,15,219,245 // pand %xmm5,%xmm6 .byte 15,91,246 // cvtdq2ps %xmm6,%xmm6 - .byte 15,40,186,112,128,0,0 // movaps 0x8070(%edx),%xmm7 + .byte 15,40,186,80,128,0,0 // movaps 0x8050(%edx),%xmm7 .byte 15,89,247 // mulps %xmm7,%xmm6 .byte 15,41,113,48 // movaps %xmm6,0x30(%ecx) .byte 102,15,111,244 // movdqa %xmm4,%xmm6 @@ -60753,11 +60737,11 @@ _sk_gather_bgra_sse2: .byte 102,15,98,194 // punpckldq %xmm2,%xmm0 .byte 102,15,98,217 // punpckldq %xmm1,%xmm3 .byte 102,15,108,216 // punpcklqdq %xmm0,%xmm3 - .byte 102,15,111,129,205,125,0,0 // movdqa 0x7dcd(%ecx),%xmm0 + .byte 102,15,111,129,173,125,0,0 // movdqa 0x7dad(%ecx),%xmm0 .byte 102,15,111,203 // movdqa %xmm3,%xmm1 .byte 102,15,219,200 // pand %xmm0,%xmm1 .byte 15,91,209 // cvtdq2ps %xmm1,%xmm2 - .byte 15,40,161,253,126,0,0 // movaps 0x7efd(%ecx),%xmm4 + .byte 15,40,161,221,126,0,0 // movaps 0x7edd(%ecx),%xmm4 .byte 15,89,212 // mulps %xmm4,%xmm2 .byte 102,15,111,203 // movdqa %xmm3,%xmm1 .byte 102,15,114,209,8 // psrld $0x8,%xmm1 @@ -60801,7 +60785,7 @@ _sk_store_bgra_sse2: .byte 193,226,2 // shl $0x2,%edx .byte 3,22 // add (%esi),%edx .byte 139,49 // mov (%ecx),%esi - .byte 15,40,167,98,125,0,0 // movaps 0x7d62(%edi),%xmm4 + .byte 15,40,167,66,125,0,0 // movaps 0x7d42(%edi),%xmm4 .byte 139,89,8 // mov 0x8(%ecx),%ebx .byte 15,40,234 // movaps %xmm2,%xmm5 .byte 15,89,236 // mulps %xmm4,%xmm5 @@ -60900,11 +60884,11 @@ _sk_load_f16_sse2: .byte 102,15,239,192 // pxor %xmm0,%xmm0 .byte 102,15,97,200 // punpcklwd %xmm0,%xmm1 .byte 102,15,239,210 // pxor %xmm2,%xmm2 - .byte 102,15,111,170,124,128,0,0 // movdqa 0x807c(%edx),%xmm5 + .byte 102,15,111,170,92,128,0,0 // movdqa 0x805c(%edx),%xmm5 .byte 102,15,111,241 // movdqa %xmm1,%xmm6 .byte 102,15,219,245 // pand %xmm5,%xmm6 - .byte 102,15,219,138,140,128,0,0 // pand 0x808c(%edx),%xmm1 - .byte 102,15,111,130,156,128,0,0 // movdqa 0x809c(%edx),%xmm0 + .byte 102,15,219,138,108,128,0,0 // pand 0x806c(%edx),%xmm1 + .byte 102,15,111,130,124,128,0,0 // movdqa 0x807c(%edx),%xmm0 .byte 102,15,127,69,184 // movdqa %xmm0,-0x48(%ebp) .byte 102,15,114,246,16 // pslld $0x10,%xmm6 .byte 102,15,111,216 // movdqa %xmm0,%xmm3 @@ -60916,7 +60900,7 @@ _sk_load_f16_sse2: .byte 102,15,239,255 // pxor %xmm7,%xmm7 .byte 102,15,111,212 // movdqa %xmm4,%xmm2 .byte 102,15,219,213 // pand %xmm5,%xmm2 - .byte 102,15,111,154,140,128,0,0 // movdqa 0x808c(%edx),%xmm3 + .byte 102,15,111,154,108,128,0,0 // movdqa 0x806c(%edx),%xmm3 .byte 102,15,219,227 // pand %xmm3,%xmm4 .byte 102,15,114,242,16 // pslld $0x10,%xmm2 .byte 102,15,102,196 // pcmpgtd %xmm4,%xmm0 @@ -60929,7 +60913,7 @@ _sk_load_f16_sse2: .byte 102,15,219,253 // pand %xmm5,%xmm7 .byte 102,15,219,195 // pand %xmm3,%xmm0 .byte 102,15,114,247,16 // pslld $0x10,%xmm7 - .byte 102,15,111,146,156,128,0,0 // movdqa 0x809c(%edx),%xmm2 + .byte 102,15,111,146,124,128,0,0 // movdqa 0x807c(%edx),%xmm2 .byte 102,15,102,208 // pcmpgtd %xmm0,%xmm2 .byte 102,15,114,240,13 // pslld $0xd,%xmm0 .byte 102,15,235,199 // por %xmm7,%xmm0 @@ -60944,7 +60928,7 @@ _sk_load_f16_sse2: .byte 102,15,127,93,184 // movdqa %xmm3,-0x48(%ebp) .byte 102,15,114,247,13 // pslld $0xd,%xmm7 .byte 102,15,235,253 // por %xmm5,%xmm7 - .byte 102,15,111,154,172,128,0,0 // movdqa 0x80ac(%edx),%xmm3 + .byte 102,15,111,154,140,128,0,0 // movdqa 0x808c(%edx),%xmm3 .byte 102,15,254,203 // paddd %xmm3,%xmm1 .byte 102,15,254,227 // paddd %xmm3,%xmm4 .byte 102,15,254,195 // paddd %xmm3,%xmm0 @@ -61033,18 +61017,18 @@ _sk_load_f16_dst_sse2: .byte 102,15,126,85,232 // movd %xmm2,-0x18(%ebp) .byte 102,15,239,210 // pxor %xmm2,%xmm2 .byte 102,15,97,202 // punpcklwd %xmm2,%xmm1 - .byte 102,15,111,186,95,126,0,0 // movdqa 0x7e5f(%edx),%xmm7 + .byte 102,15,111,186,63,126,0,0 // movdqa 0x7e3f(%edx),%xmm7 .byte 102,15,111,209 // movdqa %xmm1,%xmm2 .byte 102,15,219,215 // pand %xmm7,%xmm2 - .byte 102,15,111,154,111,126,0,0 // movdqa 0x7e6f(%edx),%xmm3 + .byte 102,15,111,154,79,126,0,0 // movdqa 0x7e4f(%edx),%xmm3 .byte 102,15,219,203 // pand %xmm3,%xmm1 - .byte 102,15,111,162,127,126,0,0 // movdqa 0x7e7f(%edx),%xmm4 + .byte 102,15,111,162,95,126,0,0 // movdqa 0x7e5f(%edx),%xmm4 .byte 102,15,114,242,16 // pslld $0x10,%xmm2 .byte 102,15,111,236 // movdqa %xmm4,%xmm5 .byte 102,15,102,233 // pcmpgtd %xmm1,%xmm5 .byte 102,15,114,241,13 // pslld $0xd,%xmm1 .byte 102,15,235,202 // por %xmm2,%xmm1 - .byte 102,15,111,146,143,126,0,0 // movdqa 0x7e8f(%edx),%xmm2 + .byte 102,15,111,146,111,126,0,0 // movdqa 0x7e6f(%edx),%xmm2 .byte 102,15,127,85,184 // movdqa %xmm2,-0x48(%ebp) .byte 102,15,254,202 // paddd %xmm2,%xmm1 .byte 102,15,223,233 // pandn %xmm1,%xmm5 @@ -61190,11 +61174,11 @@ _sk_gather_f16_sse2: .byte 102,15,126,69,248 // movd %xmm0,-0x8(%ebp) .byte 102,15,97,206 // punpcklwd %xmm6,%xmm1 .byte 102,15,239,210 // pxor %xmm2,%xmm2 - .byte 102,15,111,177,195,123,0,0 // movdqa 0x7bc3(%ecx),%xmm6 + .byte 102,15,111,177,163,123,0,0 // movdqa 0x7ba3(%ecx),%xmm6 .byte 102,15,111,225 // movdqa %xmm1,%xmm4 .byte 102,15,219,230 // pand %xmm6,%xmm4 - .byte 102,15,219,137,211,123,0,0 // pand 0x7bd3(%ecx),%xmm1 - .byte 102,15,111,129,227,123,0,0 // movdqa 0x7be3(%ecx),%xmm0 + .byte 102,15,219,137,179,123,0,0 // pand 0x7bb3(%ecx),%xmm1 + .byte 102,15,111,129,195,123,0,0 // movdqa 0x7bc3(%ecx),%xmm0 .byte 102,15,114,244,16 // pslld $0x10,%xmm4 .byte 102,15,111,216 // movdqa %xmm0,%xmm3 .byte 102,15,102,217 // pcmpgtd %xmm1,%xmm3 @@ -61205,7 +61189,7 @@ _sk_gather_f16_sse2: .byte 102,15,239,255 // pxor %xmm7,%xmm7 .byte 102,15,111,213 // movdqa %xmm5,%xmm2 .byte 102,15,219,214 // pand %xmm6,%xmm2 - .byte 102,15,111,153,211,123,0,0 // movdqa 0x7bd3(%ecx),%xmm3 + .byte 102,15,111,153,179,123,0,0 // movdqa 0x7bb3(%ecx),%xmm3 .byte 102,15,219,235 // pand %xmm3,%xmm5 .byte 102,15,114,242,16 // pslld $0x10,%xmm2 .byte 102,15,111,224 // movdqa %xmm0,%xmm4 @@ -61219,7 +61203,7 @@ _sk_gather_f16_sse2: .byte 102,15,219,254 // pand %xmm6,%xmm7 .byte 102,15,219,195 // pand %xmm3,%xmm0 .byte 102,15,114,247,16 // pslld $0x10,%xmm7 - .byte 102,15,111,145,227,123,0,0 // movdqa 0x7be3(%ecx),%xmm2 + .byte 102,15,111,145,195,123,0,0 // movdqa 0x7bc3(%ecx),%xmm2 .byte 102,15,111,218 // movdqa %xmm2,%xmm3 .byte 102,15,102,216 // pcmpgtd %xmm0,%xmm3 .byte 102,15,114,240,13 // pslld $0xd,%xmm0 @@ -61228,12 +61212,12 @@ _sk_gather_f16_sse2: .byte 102,15,239,228 // pxor %xmm4,%xmm4 .byte 102,15,97,252 // punpcklwd %xmm4,%xmm7 .byte 102,15,219,247 // pand %xmm7,%xmm6 - .byte 102,15,219,185,211,123,0,0 // pand 0x7bd3(%ecx),%xmm7 + .byte 102,15,219,185,179,123,0,0 // pand 0x7bb3(%ecx),%xmm7 .byte 102,15,114,246,16 // pslld $0x10,%xmm6 .byte 102,15,102,215 // pcmpgtd %xmm7,%xmm2 .byte 102,15,114,247,13 // pslld $0xd,%xmm7 .byte 102,15,235,254 // por %xmm6,%xmm7 - .byte 102,15,111,161,243,123,0,0 // movdqa 0x7bf3(%ecx),%xmm4 + .byte 102,15,111,161,211,123,0,0 // movdqa 0x7bd3(%ecx),%xmm4 .byte 102,15,254,204 // paddd %xmm4,%xmm1 .byte 102,15,254,236 // paddd %xmm4,%xmm5 .byte 102,15,254,196 // paddd %xmm4,%xmm0 @@ -61272,22 +61256,22 @@ _sk_store_f16_sse2: .byte 102,15,111,209 // movdqa %xmm1,%xmm2 .byte 232,0,0,0,0 // call 5781 <_sk_store_f16_sse2+0x19> .byte 88 // pop %eax - .byte 102,15,111,152,63,122,0,0 // movdqa 0x7a3f(%eax),%xmm3 + .byte 102,15,111,152,31,122,0,0 // movdqa 0x7a1f(%eax),%xmm3 .byte 102,15,111,224 // movdqa %xmm0,%xmm4 .byte 102,15,219,227 // pand %xmm3,%xmm4 - .byte 102,15,111,136,111,122,0,0 // movdqa 0x7a6f(%eax),%xmm1 + .byte 102,15,111,136,79,122,0,0 // movdqa 0x7a4f(%eax),%xmm1 .byte 102,15,127,77,232 // movdqa %xmm1,-0x18(%ebp) .byte 102,15,111,240 // movdqa %xmm0,%xmm6 .byte 102,15,114,246,3 // pslld $0x3,%xmm6 .byte 102,15,219,241 // pand %xmm1,%xmm6 .byte 102,15,254,244 // paddd %xmm4,%xmm6 - .byte 102,15,111,184,79,122,0,0 // movdqa 0x7a4f(%eax),%xmm7 + .byte 102,15,111,184,47,122,0,0 // movdqa 0x7a2f(%eax),%xmm7 .byte 102,15,127,69,168 // movdqa %xmm0,-0x58(%ebp) .byte 102,15,219,199 // pand %xmm7,%xmm0 - .byte 102,15,111,168,95,122,0,0 // movdqa 0x7a5f(%eax),%xmm5 + .byte 102,15,111,168,63,122,0,0 // movdqa 0x7a3f(%eax),%xmm5 .byte 102,15,111,205 // movdqa %xmm5,%xmm1 .byte 102,15,102,200 // pcmpgtd %xmm0,%xmm1 - .byte 102,15,111,128,239,118,0,0 // movdqa 0x76ef(%eax),%xmm0 + .byte 102,15,111,128,207,118,0,0 // movdqa 0x76cf(%eax),%xmm0 .byte 102,15,127,69,216 // movdqa %xmm0,-0x28(%ebp) .byte 102,15,254,240 // paddd %xmm0,%xmm6 .byte 102,15,114,230,16 // psrad $0x10,%xmm6 @@ -61339,8 +61323,8 @@ _sk_store_f16_sse2: .byte 102,15,97,245 // punpcklwd %xmm5,%xmm6 .byte 139,69,12 // mov 0xc(%ebp),%eax .byte 139,77,8 // mov 0x8(%ebp),%ecx - .byte 139,17 // mov (%ecx),%edx .byte 139,56 // mov (%eax),%edi + .byte 139,17 // mov (%ecx),%edx .byte 139,119,4 // mov 0x4(%edi),%esi .byte 15,175,113,4 // imul 0x4(%ecx),%esi .byte 193,230,3 // shl $0x3,%esi @@ -61389,8 +61373,8 @@ _sk_load_u16_be_sse2: .byte 131,236,44 // sub $0x2c,%esp .byte 139,69,12 // mov 0xc(%ebp),%eax .byte 139,77,8 // mov 0x8(%ebp),%ecx - .byte 139,49 // mov (%ecx),%esi .byte 139,16 // mov (%eax),%edx + .byte 139,49 // mov (%ecx),%esi .byte 139,122,4 // mov 0x4(%edx),%edi .byte 15,175,121,4 // imul 0x4(%ecx),%edi .byte 1,255 // add %edi,%edi @@ -61421,7 +61405,7 @@ _sk_load_u16_be_sse2: .byte 102,15,239,219 // pxor %xmm3,%xmm3 .byte 102,15,97,195 // punpcklwd %xmm3,%xmm0 .byte 15,91,192 // cvtdq2ps %xmm0,%xmm0 - .byte 15,40,162,2,118,0,0 // movaps 0x7602(%edx),%xmm4 + .byte 15,40,162,226,117,0,0 // movaps 0x75e2(%edx),%xmm4 .byte 15,89,196 // mulps %xmm4,%xmm0 .byte 102,15,111,205 // movdqa %xmm5,%xmm1 .byte 102,15,113,241,8 // psllw $0x8,%xmm1 @@ -61490,8 +61474,8 @@ _sk_load_rgb_u16_be_sse2: .byte 131,236,28 // sub $0x1c,%esp .byte 139,69,12 // mov 0xc(%ebp),%eax .byte 139,77,8 // mov 0x8(%ebp),%ecx - .byte 139,121,8 // mov 0x8(%ecx),%edi .byte 139,16 // mov (%eax),%edx + .byte 139,121,8 // mov 0x8(%ecx),%edi .byte 139,114,4 // mov 0x4(%edx),%esi .byte 15,175,113,4 // imul 0x4(%ecx),%esi .byte 1,246 // add %esi,%esi @@ -61525,7 +61509,7 @@ _sk_load_rgb_u16_be_sse2: .byte 102,15,239,219 // pxor %xmm3,%xmm3 .byte 102,15,97,195 // punpcklwd %xmm3,%xmm0 .byte 15,91,192 // cvtdq2ps %xmm0,%xmm0 - .byte 15,40,170,155,116,0,0 // movaps 0x749b(%edx),%xmm5 + .byte 15,40,170,123,116,0,0 // movaps 0x747b(%edx),%xmm5 .byte 15,89,197 // mulps %xmm5,%xmm0 .byte 102,15,111,204 // movdqa %xmm4,%xmm1 .byte 102,15,113,241,8 // psllw $0x8,%xmm1 @@ -61551,7 +61535,7 @@ _sk_load_rgb_u16_be_sse2: .byte 15,89,213 // mulps %xmm5,%xmm2 .byte 141,112,8 // lea 0x8(%eax),%esi .byte 131,236,8 // sub $0x8,%esp - .byte 15,40,154,43,114,0,0 // movaps 0x722b(%edx),%xmm3 + .byte 15,40,154,11,114,0,0 // movaps 0x720b(%edx),%xmm3 .byte 86 // push %esi .byte 81 // push %ecx .byte 255,80,4 // call *0x4(%eax) @@ -61598,7 +61582,7 @@ _sk_store_u16_be_sse2: .byte 1,210 // add %edx,%edx .byte 3,22 // add (%esi),%edx .byte 139,49 // mov (%ecx),%esi - .byte 15,40,183,247,117,0,0 // movaps 0x75f7(%edi),%xmm6 + .byte 15,40,183,215,117,0,0 // movaps 0x75d7(%edi),%xmm6 .byte 139,121,8 // mov 0x8(%ecx),%edi .byte 193,230,2 // shl $0x2,%esi .byte 15,40,224 // movaps %xmm0,%xmm4 @@ -61679,8 +61663,8 @@ _sk_load_f32_sse2: .byte 86 // push %esi .byte 139,69,12 // mov 0xc(%ebp),%eax .byte 139,77,8 // mov 0x8(%ebp),%ecx - .byte 139,57 // mov (%ecx),%edi .byte 139,48 // mov (%eax),%esi + .byte 139,57 // mov (%ecx),%edi .byte 139,86,4 // mov 0x4(%esi),%edx .byte 15,175,81,4 // imul 0x4(%ecx),%edx .byte 193,226,2 // shl $0x2,%edx @@ -61743,8 +61727,8 @@ _sk_load_f32_dst_sse2: .byte 15,41,85,232 // movaps %xmm2,-0x18(%ebp) .byte 139,69,12 // mov 0xc(%ebp),%eax .byte 139,77,8 // mov 0x8(%ebp),%ecx - .byte 139,57 // mov (%ecx),%edi .byte 139,48 // mov (%eax),%esi + .byte 139,57 // mov (%ecx),%edi .byte 139,86,4 // mov 0x4(%esi),%edx .byte 15,175,81,4 // imul 0x4(%ecx),%edx .byte 193,226,2 // shl $0x2,%edx @@ -61812,8 +61796,8 @@ _sk_store_f32_sse2: .byte 131,236,12 // sub $0xc,%esp .byte 139,69,12 // mov 0xc(%ebp),%eax .byte 139,77,8 // mov 0x8(%ebp),%ecx - .byte 139,25 // mov (%ecx),%ebx .byte 139,48 // mov (%eax),%esi + .byte 139,25 // mov (%ecx),%ebx .byte 139,86,4 // mov 0x4(%esi),%edx .byte 15,175,81,4 // imul 0x4(%ecx),%edx .byte 193,226,2 // shl $0x2,%edx @@ -61878,7 +61862,7 @@ _sk_repeat_x_sse2: .byte 243,15,91,245 // cvttps2dq %xmm5,%xmm6 .byte 15,91,246 // cvtdq2ps %xmm6,%xmm6 .byte 15,194,238,1 // cmpltps %xmm6,%xmm5 - .byte 15,84,168,179,109,0,0 // andps 0x6db3(%eax),%xmm5 + .byte 15,84,168,147,109,0,0 // andps 0x6d93(%eax),%xmm5 .byte 15,92,245 // subps %xmm5,%xmm6 .byte 15,198,228,0 // shufps $0x0,%xmm4,%xmm4 .byte 15,89,230 // mulps %xmm6,%xmm4 @@ -61910,7 +61894,7 @@ _sk_repeat_y_sse2: .byte 243,15,91,245 // cvttps2dq %xmm5,%xmm6 .byte 15,91,246 // cvtdq2ps %xmm6,%xmm6 .byte 15,194,238,1 // cmpltps %xmm6,%xmm5 - .byte 15,84,168,97,109,0,0 // andps 0x6d61(%eax),%xmm5 + .byte 15,84,168,65,109,0,0 // andps 0x6d41(%eax),%xmm5 .byte 15,92,245 // subps %xmm5,%xmm6 .byte 15,198,228,0 // shufps $0x0,%xmm4,%xmm4 .byte 15,89,230 // mulps %xmm6,%xmm4 @@ -61940,13 +61924,13 @@ _sk_mirror_x_sse2: .byte 15,40,244 // movaps %xmm4,%xmm6 .byte 15,198,246,0 // shufps $0x0,%xmm6,%xmm6 .byte 15,92,198 // subps %xmm6,%xmm0 - .byte 243,15,89,169,159,116,0,0 // mulss 0x749f(%ecx),%xmm5 + .byte 243,15,89,169,127,116,0,0 // mulss 0x747f(%ecx),%xmm5 .byte 15,198,237,0 // shufps $0x0,%xmm5,%xmm5 .byte 15,89,232 // mulps %xmm0,%xmm5 .byte 243,15,91,253 // cvttps2dq %xmm5,%xmm7 .byte 15,91,255 // cvtdq2ps %xmm7,%xmm7 .byte 15,194,239,1 // cmpltps %xmm7,%xmm5 - .byte 15,84,169,15,109,0,0 // andps 0x6d0f(%ecx),%xmm5 + .byte 15,84,169,239,108,0,0 // andps 0x6cef(%ecx),%xmm5 .byte 15,92,253 // subps %xmm5,%xmm7 .byte 243,15,88,228 // addss %xmm4,%xmm4 .byte 15,198,228,0 // shufps $0x0,%xmm4,%xmm4 @@ -61981,13 +61965,13 @@ _sk_mirror_y_sse2: .byte 15,40,244 // movaps %xmm4,%xmm6 .byte 15,198,246,0 // shufps $0x0,%xmm6,%xmm6 .byte 15,92,206 // subps %xmm6,%xmm1 - .byte 243,15,89,169,43,116,0,0 // mulss 0x742b(%ecx),%xmm5 + .byte 243,15,89,169,11,116,0,0 // mulss 0x740b(%ecx),%xmm5 .byte 15,198,237,0 // shufps $0x0,%xmm5,%xmm5 .byte 15,89,233 // mulps %xmm1,%xmm5 .byte 243,15,91,253 // cvttps2dq %xmm5,%xmm7 .byte 15,91,255 // cvtdq2ps %xmm7,%xmm7 .byte 15,194,239,1 // cmpltps %xmm7,%xmm5 - .byte 15,84,169,155,108,0,0 // andps 0x6c9b(%ecx),%xmm5 + .byte 15,84,169,123,108,0,0 // andps 0x6c7b(%ecx),%xmm5 .byte 15,92,253 // subps %xmm5,%xmm7 .byte 243,15,88,228 // addss %xmm4,%xmm4 .byte 15,198,228,0 // shufps $0x0,%xmm4,%xmm4 @@ -62018,7 +62002,7 @@ _sk_clamp_x_1_sse2: .byte 139,77,12 // mov 0xc(%ebp),%ecx .byte 15,87,228 // xorps %xmm4,%xmm4 .byte 15,95,224 // maxps %xmm0,%xmm4 - .byte 15,93,160,39,108,0,0 // minps 0x6c27(%eax),%xmm4 + .byte 15,93,160,7,108,0,0 // minps 0x6c07(%eax),%xmm4 .byte 141,65,4 // lea 0x4(%ecx),%eax .byte 131,236,8 // sub $0x8,%esp .byte 15,40,196 // movaps %xmm4,%xmm0 @@ -62043,7 +62027,7 @@ _sk_repeat_x_1_sse2: .byte 15,91,228 // cvtdq2ps %xmm4,%xmm4 .byte 15,40,232 // movaps %xmm0,%xmm5 .byte 15,194,236,1 // cmpltps %xmm4,%xmm5 - .byte 15,84,168,247,107,0,0 // andps 0x6bf7(%eax),%xmm5 + .byte 15,84,168,215,107,0,0 // andps 0x6bd7(%eax),%xmm5 .byte 15,92,229 // subps %xmm5,%xmm4 .byte 15,92,196 // subps %xmm4,%xmm0 .byte 141,65,4 // lea 0x4(%ecx),%eax @@ -62065,14 +62049,14 @@ _sk_mirror_x_1_sse2: .byte 232,0,0,0,0 // call 6124 <_sk_mirror_x_1_sse2+0xb> .byte 89 // pop %ecx .byte 139,69,12 // mov 0xc(%ebp),%eax - .byte 15,40,161,44,108,0,0 // movaps 0x6c2c(%ecx),%xmm4 + .byte 15,40,161,12,108,0,0 // movaps 0x6c0c(%ecx),%xmm4 .byte 15,88,196 // addps %xmm4,%xmm0 - .byte 15,40,169,172,107,0,0 // movaps 0x6bac(%ecx),%xmm5 + .byte 15,40,169,140,107,0,0 // movaps 0x6b8c(%ecx),%xmm5 .byte 15,89,232 // mulps %xmm0,%xmm5 .byte 243,15,91,245 // cvttps2dq %xmm5,%xmm6 .byte 15,91,246 // cvtdq2ps %xmm6,%xmm6 .byte 15,194,238,1 // cmpltps %xmm6,%xmm5 - .byte 15,84,169,188,107,0,0 // andps 0x6bbc(%ecx),%xmm5 + .byte 15,84,169,156,107,0,0 // andps 0x6b9c(%ecx),%xmm5 .byte 15,87,255 // xorps %xmm7,%xmm7 .byte 15,92,245 // subps %xmm5,%xmm6 .byte 15,88,246 // addps %xmm6,%xmm6 @@ -62100,10 +62084,10 @@ _sk_luminance_to_alpha_sse2: .byte 232,0,0,0,0 // call 6182 <_sk_luminance_to_alpha_sse2+0xe> .byte 88 // pop %eax .byte 139,77,12 // mov 0xc(%ebp),%ecx - .byte 15,89,128,142,112,0,0 // mulps 0x708e(%eax),%xmm0 - .byte 15,89,136,158,112,0,0 // mulps 0x709e(%eax),%xmm1 + .byte 15,89,128,110,112,0,0 // mulps 0x706e(%eax),%xmm0 + .byte 15,89,136,126,112,0,0 // mulps 0x707e(%eax),%xmm1 .byte 15,88,200 // addps %xmm0,%xmm1 - .byte 15,89,152,174,112,0,0 // mulps 0x70ae(%eax),%xmm3 + .byte 15,89,152,142,112,0,0 // mulps 0x708e(%eax),%xmm3 .byte 15,88,217 // addps %xmm1,%xmm3 .byte 141,65,4 // lea 0x4(%ecx),%eax .byte 131,236,8 // sub $0x8,%esp @@ -62281,13 +62265,12 @@ _sk_matrix_4x5_sse2: .byte 137,229 // mov %esp,%ebp .byte 131,236,8 // sub $0x8,%esp .byte 15,40,233 // movaps %xmm1,%xmm5 + .byte 15,40,224 // movaps %xmm0,%xmm4 .byte 139,69,12 // mov 0xc(%ebp),%eax - .byte 141,72,4 // lea 0x4(%eax),%ecx - .byte 137,77,252 // mov %ecx,-0x4(%ebp) .byte 139,8 // mov (%eax),%ecx - .byte 243,15,16,33 // movss (%ecx),%xmm4 + .byte 243,15,16,1 // movss (%ecx),%xmm0 .byte 243,15,16,73,4 // movss 0x4(%ecx),%xmm1 - .byte 15,198,228,0 // shufps $0x0,%xmm4,%xmm4 + .byte 15,198,192,0 // shufps $0x0,%xmm0,%xmm0 .byte 243,15,16,113,48 // movss 0x30(%ecx),%xmm6 .byte 15,198,246,0 // shufps $0x0,%xmm6,%xmm6 .byte 243,15,16,121,64 // movss 0x40(%ecx),%xmm7 @@ -62302,8 +62285,8 @@ _sk_matrix_4x5_sse2: .byte 15,198,246,0 // shufps $0x0,%xmm6,%xmm6 .byte 15,89,245 // mulps %xmm5,%xmm6 .byte 15,88,247 // addps %xmm7,%xmm6 - .byte 15,89,224 // mulps %xmm0,%xmm4 - .byte 15,88,230 // addps %xmm6,%xmm4 + .byte 15,89,196 // mulps %xmm4,%xmm0 + .byte 15,88,198 // addps %xmm6,%xmm0 .byte 15,198,201,0 // shufps $0x0,%xmm1,%xmm1 .byte 243,15,16,113,52 // movss 0x34(%ecx),%xmm6 .byte 15,198,246,0 // shufps $0x0,%xmm6,%xmm6 @@ -62319,7 +62302,7 @@ _sk_matrix_4x5_sse2: .byte 15,198,246,0 // shufps $0x0,%xmm6,%xmm6 .byte 15,89,245 // mulps %xmm5,%xmm6 .byte 15,88,247 // addps %xmm7,%xmm6 - .byte 15,89,200 // mulps %xmm0,%xmm1 + .byte 15,89,204 // mulps %xmm4,%xmm1 .byte 15,88,206 // addps %xmm6,%xmm1 .byte 243,15,16,113,56 // movss 0x38(%ecx),%xmm6 .byte 15,198,246,0 // shufps $0x0,%xmm6,%xmm6 @@ -62337,7 +62320,7 @@ _sk_matrix_4x5_sse2: .byte 15,88,247 // addps %xmm7,%xmm6 .byte 243,15,16,121,8 // movss 0x8(%ecx),%xmm7 .byte 15,198,255,0 // shufps $0x0,%xmm7,%xmm7 - .byte 15,89,248 // mulps %xmm0,%xmm7 + .byte 15,89,252 // mulps %xmm4,%xmm7 .byte 15,88,254 // addps %xmm6,%xmm7 .byte 243,15,16,113,60 // movss 0x3c(%ecx),%xmm6 .byte 15,198,246,0 // shufps $0x0,%xmm6,%xmm6 @@ -62355,15 +62338,13 @@ _sk_matrix_4x5_sse2: .byte 15,88,211 // addps %xmm3,%xmm2 .byte 243,15,16,89,12 // movss 0xc(%ecx),%xmm3 .byte 15,198,219,0 // shufps $0x0,%xmm3,%xmm3 - .byte 15,89,216 // mulps %xmm0,%xmm3 + .byte 15,89,220 // mulps %xmm4,%xmm3 .byte 15,88,218 // addps %xmm2,%xmm3 - .byte 139,77,8 // mov 0x8(%ebp),%ecx - .byte 141,80,8 // lea 0x8(%eax),%edx + .byte 141,72,8 // lea 0x8(%eax),%ecx .byte 131,236,8 // sub $0x8,%esp - .byte 15,40,196 // movaps %xmm4,%xmm0 .byte 15,40,215 // movaps %xmm7,%xmm2 - .byte 82 // push %edx .byte 81 // push %ecx + .byte 255,117,8 // pushl 0x8(%ebp) .byte 255,80,4 // call *0x4(%eax) .byte 131,196,24 // add $0x18,%esp .byte 93 // pop %ebp @@ -62493,23 +62474,21 @@ _sk_evenly_spaced_gradient_sse2: .byte 86 // push %esi .byte 131,236,60 // sub $0x3c,%esp .byte 15,41,69,184 // movaps %xmm0,-0x48(%ebp) - .byte 232,0,0,0,0 // call 661f <_sk_evenly_spaced_gradient_sse2+0x12> + .byte 232,0,0,0,0 // call 6618 <_sk_evenly_spaced_gradient_sse2+0x12> .byte 90 // pop %edx - .byte 139,77,12 // mov 0xc(%ebp),%ecx - .byte 141,65,4 // lea 0x4(%ecx),%eax - .byte 137,69,240 // mov %eax,-0x10(%ebp) - .byte 139,9 // mov (%ecx),%ecx + .byte 139,69,12 // mov 0xc(%ebp),%eax + .byte 139,8 // mov (%eax),%ecx .byte 139,49 // mov (%ecx),%esi .byte 139,65,4 // mov 0x4(%ecx),%eax .byte 78 // dec %esi .byte 102,15,110,206 // movd %esi,%xmm1 .byte 102,15,112,201,0 // pshufd $0x0,%xmm1,%xmm1 - .byte 102,15,111,146,33,108,0,0 // movdqa 0x6c21(%edx),%xmm2 + .byte 102,15,111,146,8,108,0,0 // movdqa 0x6c08(%edx),%xmm2 .byte 102,15,219,209 // pand %xmm1,%xmm2 - .byte 102,15,235,146,225,105,0,0 // por 0x69e1(%edx),%xmm2 + .byte 102,15,235,146,200,105,0,0 // por 0x69c8(%edx),%xmm2 .byte 102,15,114,209,16 // psrld $0x10,%xmm1 - .byte 102,15,235,138,49,108,0,0 // por 0x6c31(%edx),%xmm1 - .byte 15,88,138,65,108,0,0 // addps 0x6c41(%edx),%xmm1 + .byte 102,15,235,138,24,108,0,0 // por 0x6c18(%edx),%xmm1 + .byte 15,88,138,40,108,0,0 // addps 0x6c28(%edx),%xmm1 .byte 15,88,202 // addps %xmm2,%xmm1 .byte 15,89,200 // mulps %xmm0,%xmm1 .byte 243,15,91,201 // cvttps2dq %xmm1,%xmm1 @@ -62594,14 +62573,13 @@ _sk_evenly_spaced_gradient_sse2: .byte 15,88,215 // addps %xmm7,%xmm2 .byte 15,89,221 // mulps %xmm5,%xmm3 .byte 15,88,216 // addps %xmm0,%xmm3 - .byte 139,69,8 // mov 0x8(%ebp),%eax - .byte 139,85,12 // mov 0xc(%ebp),%edx - .byte 141,74,8 // lea 0x8(%edx),%ecx + .byte 139,77,12 // mov 0xc(%ebp),%ecx + .byte 141,65,8 // lea 0x8(%ecx),%eax .byte 131,236,8 // sub $0x8,%esp .byte 15,40,196 // movaps %xmm4,%xmm0 - .byte 81 // push %ecx .byte 80 // push %eax - .byte 255,82,4 // call *0x4(%edx) + .byte 255,117,8 // pushl 0x8(%ebp) + .byte 255,81,4 // call *0x4(%ecx) .byte 131,196,76 // add $0x4c,%esp .byte 94 // pop %esi .byte 95 // pop %edi @@ -62616,18 +62594,18 @@ _sk_gauss_a_to_rgba_sse2: .byte 85 // push %ebp .byte 137,229 // mov %esp,%ebp .byte 131,236,8 // sub $0x8,%esp - .byte 232,0,0,0,0 // call 67df <_sk_gauss_a_to_rgba_sse2+0xb> + .byte 232,0,0,0,0 // call 67d1 <_sk_gauss_a_to_rgba_sse2+0xb> .byte 88 // pop %eax .byte 139,77,12 // mov 0xc(%ebp),%ecx - .byte 15,40,128,145,106,0,0 // movaps 0x6a91(%eax),%xmm0 + .byte 15,40,128,127,106,0,0 // movaps 0x6a7f(%eax),%xmm0 .byte 15,89,195 // mulps %xmm3,%xmm0 - .byte 15,88,128,161,106,0,0 // addps 0x6aa1(%eax),%xmm0 + .byte 15,88,128,143,106,0,0 // addps 0x6a8f(%eax),%xmm0 .byte 15,89,195 // mulps %xmm3,%xmm0 - .byte 15,88,128,177,106,0,0 // addps 0x6ab1(%eax),%xmm0 + .byte 15,88,128,159,106,0,0 // addps 0x6a9f(%eax),%xmm0 .byte 15,89,195 // mulps %xmm3,%xmm0 - .byte 15,88,128,193,106,0,0 // addps 0x6ac1(%eax),%xmm0 + .byte 15,88,128,175,106,0,0 // addps 0x6aaf(%eax),%xmm0 .byte 15,89,195 // mulps %xmm3,%xmm0 - .byte 15,88,128,209,106,0,0 // addps 0x6ad1(%eax),%xmm0 + .byte 15,88,128,191,106,0,0 // addps 0x6abf(%eax),%xmm0 .byte 141,65,4 // lea 0x4(%ecx),%eax .byte 131,236,8 // sub $0x8,%esp .byte 15,40,200 // movaps %xmm0,%xmm1 @@ -62650,16 +62628,14 @@ _sk_gradient_sse2: .byte 87 // push %edi .byte 86 // push %esi .byte 131,236,60 // sub $0x3c,%esp - .byte 139,77,12 // mov 0xc(%ebp),%ecx - .byte 141,81,4 // lea 0x4(%ecx),%edx - .byte 137,85,240 // mov %edx,-0x10(%ebp) - .byte 139,9 // mov (%ecx),%ecx - .byte 139,17 // mov (%ecx),%edx + .byte 139,69,12 // mov 0xc(%ebp),%eax + .byte 139,16 // mov (%eax),%edx + .byte 139,10 // mov (%edx),%ecx .byte 102,15,239,201 // pxor %xmm1,%xmm1 - .byte 131,250,2 // cmp $0x2,%edx - .byte 114,33 // jb 686c <_sk_gradient_sse2+0x40> - .byte 139,113,36 // mov 0x24(%ecx),%esi - .byte 74 // dec %edx + .byte 131,249,2 // cmp $0x2,%ecx + .byte 114,33 // jb 6858 <_sk_gradient_sse2+0x3a> + .byte 139,114,36 // mov 0x24(%edx),%esi + .byte 73 // dec %ecx .byte 131,198,4 // add $0x4,%esi .byte 102,15,239,201 // pxor %xmm1,%xmm1 .byte 243,15,16,22 // movss (%esi),%xmm2 @@ -62667,80 +62643,80 @@ _sk_gradient_sse2: .byte 15,194,208,2 // cmpleps %xmm0,%xmm2 .byte 102,15,250,202 // psubd %xmm2,%xmm1 .byte 131,198,4 // add $0x4,%esi - .byte 74 // dec %edx - .byte 117,234 // jne 6856 <_sk_gradient_sse2+0x2a> - .byte 102,15,126,202 // movd %xmm1,%edx + .byte 73 // dec %ecx + .byte 117,234 // jne 6842 <_sk_gradient_sse2+0x24> + .byte 102,15,126,206 // movd %xmm1,%esi .byte 102,15,112,209,229 // pshufd $0xe5,%xmm1,%xmm2 .byte 102,15,112,217,78 // pshufd $0x4e,%xmm1,%xmm3 - .byte 102,15,126,222 // movd %xmm3,%esi + .byte 102,15,126,223 // movd %xmm3,%edi .byte 102,15,112,201,231 // pshufd $0xe7,%xmm1,%xmm1 - .byte 102,15,126,207 // movd %xmm1,%edi - .byte 139,65,4 // mov 0x4(%ecx),%eax - .byte 243,15,16,12,184 // movss (%eax,%edi,4),%xmm1 - .byte 243,15,16,28,176 // movss (%eax,%esi,4),%xmm3 - .byte 243,15,16,36,144 // movss (%eax,%edx,4),%xmm4 - .byte 102,15,126,211 // movd %xmm2,%ebx - .byte 243,15,16,20,152 // movss (%eax,%ebx,4),%xmm2 + .byte 102,15,126,203 // movd %xmm1,%ebx + .byte 139,66,4 // mov 0x4(%edx),%eax + .byte 243,15,16,12,152 // movss (%eax,%ebx,4),%xmm1 + .byte 243,15,16,28,184 // movss (%eax,%edi,4),%xmm3 + .byte 243,15,16,36,176 // movss (%eax,%esi,4),%xmm4 + .byte 102,15,126,209 // movd %xmm2,%ecx + .byte 243,15,16,20,136 // movss (%eax,%ecx,4),%xmm2 .byte 15,20,217 // unpcklps %xmm1,%xmm3 - .byte 139,65,20 // mov 0x14(%ecx),%eax - .byte 243,15,16,12,184 // movss (%eax,%edi,4),%xmm1 - .byte 243,15,16,52,176 // movss (%eax,%esi,4),%xmm6 - .byte 243,15,16,44,144 // movss (%eax,%edx,4),%xmm5 - .byte 243,15,16,60,152 // movss (%eax,%ebx,4),%xmm7 + .byte 139,66,20 // mov 0x14(%edx),%eax + .byte 243,15,16,12,152 // movss (%eax,%ebx,4),%xmm1 + .byte 243,15,16,52,184 // movss (%eax,%edi,4),%xmm6 + .byte 243,15,16,44,176 // movss (%eax,%esi,4),%xmm5 + .byte 243,15,16,60,136 // movss (%eax,%ecx,4),%xmm7 .byte 15,20,226 // unpcklps %xmm2,%xmm4 .byte 102,15,20,227 // unpcklpd %xmm3,%xmm4 .byte 102,15,41,101,184 // movapd %xmm4,-0x48(%ebp) .byte 15,20,241 // unpcklps %xmm1,%xmm6 .byte 15,20,239 // unpcklps %xmm7,%xmm5 - .byte 139,65,8 // mov 0x8(%ecx),%eax - .byte 243,15,16,20,184 // movss (%eax,%edi,4),%xmm2 - .byte 243,15,16,28,176 // movss (%eax,%esi,4),%xmm3 - .byte 243,15,16,12,144 // movss (%eax,%edx,4),%xmm1 - .byte 243,15,16,60,152 // movss (%eax,%ebx,4),%xmm7 + .byte 139,66,8 // mov 0x8(%edx),%eax + .byte 243,15,16,20,152 // movss (%eax,%ebx,4),%xmm2 + .byte 243,15,16,28,184 // movss (%eax,%edi,4),%xmm3 + .byte 243,15,16,12,176 // movss (%eax,%esi,4),%xmm1 + .byte 243,15,16,60,136 // movss (%eax,%ecx,4),%xmm7 .byte 102,15,20,238 // unpcklpd %xmm6,%xmm5 .byte 102,15,41,109,200 // movapd %xmm5,-0x38(%ebp) .byte 15,20,218 // unpcklps %xmm2,%xmm3 .byte 15,20,207 // unpcklps %xmm7,%xmm1 .byte 102,15,20,203 // unpcklpd %xmm3,%xmm1 - .byte 139,65,24 // mov 0x18(%ecx),%eax - .byte 243,15,16,20,184 // movss (%eax,%edi,4),%xmm2 - .byte 243,15,16,28,176 // movss (%eax,%esi,4),%xmm3 - .byte 243,15,16,36,144 // movss (%eax,%edx,4),%xmm4 - .byte 243,15,16,60,152 // movss (%eax,%ebx,4),%xmm7 + .byte 139,66,24 // mov 0x18(%edx),%eax + .byte 243,15,16,20,152 // movss (%eax,%ebx,4),%xmm2 + .byte 243,15,16,28,184 // movss (%eax,%edi,4),%xmm3 + .byte 243,15,16,36,176 // movss (%eax,%esi,4),%xmm4 + .byte 243,15,16,60,136 // movss (%eax,%ecx,4),%xmm7 .byte 15,20,218 // unpcklps %xmm2,%xmm3 .byte 15,20,231 // unpcklps %xmm7,%xmm4 .byte 102,15,20,227 // unpcklpd %xmm3,%xmm4 .byte 102,15,41,101,216 // movapd %xmm4,-0x28(%ebp) - .byte 139,65,12 // mov 0xc(%ecx),%eax - .byte 243,15,16,20,184 // movss (%eax,%edi,4),%xmm2 - .byte 243,15,16,28,176 // movss (%eax,%esi,4),%xmm3 + .byte 139,66,12 // mov 0xc(%edx),%eax + .byte 243,15,16,20,152 // movss (%eax,%ebx,4),%xmm2 + .byte 243,15,16,28,184 // movss (%eax,%edi,4),%xmm3 .byte 15,20,218 // unpcklps %xmm2,%xmm3 - .byte 243,15,16,20,144 // movss (%eax,%edx,4),%xmm2 - .byte 243,15,16,60,152 // movss (%eax,%ebx,4),%xmm7 + .byte 243,15,16,20,176 // movss (%eax,%esi,4),%xmm2 + .byte 243,15,16,60,136 // movss (%eax,%ecx,4),%xmm7 .byte 15,20,215 // unpcklps %xmm7,%xmm2 .byte 102,15,20,211 // unpcklpd %xmm3,%xmm2 - .byte 139,65,28 // mov 0x1c(%ecx),%eax - .byte 243,15,16,60,184 // movss (%eax,%edi,4),%xmm7 - .byte 243,15,16,28,176 // movss (%eax,%esi,4),%xmm3 + .byte 139,66,28 // mov 0x1c(%edx),%eax + .byte 243,15,16,60,152 // movss (%eax,%ebx,4),%xmm7 + .byte 243,15,16,28,184 // movss (%eax,%edi,4),%xmm3 .byte 15,20,223 // unpcklps %xmm7,%xmm3 - .byte 243,15,16,60,144 // movss (%eax,%edx,4),%xmm7 - .byte 243,15,16,44,152 // movss (%eax,%ebx,4),%xmm5 + .byte 243,15,16,60,176 // movss (%eax,%esi,4),%xmm7 + .byte 243,15,16,44,136 // movss (%eax,%ecx,4),%xmm5 .byte 15,20,253 // unpcklps %xmm5,%xmm7 .byte 102,15,20,251 // unpcklpd %xmm3,%xmm7 - .byte 139,65,16 // mov 0x10(%ecx),%eax - .byte 243,15,16,28,184 // movss (%eax,%edi,4),%xmm3 - .byte 243,15,16,44,176 // movss (%eax,%esi,4),%xmm5 + .byte 139,66,16 // mov 0x10(%edx),%eax + .byte 243,15,16,28,152 // movss (%eax,%ebx,4),%xmm3 + .byte 243,15,16,44,184 // movss (%eax,%edi,4),%xmm5 .byte 15,20,235 // unpcklps %xmm3,%xmm5 - .byte 243,15,16,28,144 // movss (%eax,%edx,4),%xmm3 - .byte 243,15,16,52,152 // movss (%eax,%ebx,4),%xmm6 + .byte 243,15,16,28,176 // movss (%eax,%esi,4),%xmm3 + .byte 243,15,16,52,136 // movss (%eax,%ecx,4),%xmm6 .byte 15,20,222 // unpcklps %xmm6,%xmm3 .byte 102,15,20,221 // unpcklpd %xmm5,%xmm3 - .byte 139,65,32 // mov 0x20(%ecx),%eax - .byte 243,15,16,44,184 // movss (%eax,%edi,4),%xmm5 - .byte 243,15,16,52,176 // movss (%eax,%esi,4),%xmm6 + .byte 139,66,32 // mov 0x20(%edx),%eax + .byte 243,15,16,44,152 // movss (%eax,%ebx,4),%xmm5 + .byte 243,15,16,52,184 // movss (%eax,%edi,4),%xmm6 .byte 15,20,245 // unpcklps %xmm5,%xmm6 - .byte 243,15,16,44,144 // movss (%eax,%edx,4),%xmm5 - .byte 243,15,16,36,152 // movss (%eax,%ebx,4),%xmm4 + .byte 243,15,16,44,176 // movss (%eax,%esi,4),%xmm5 + .byte 243,15,16,36,136 // movss (%eax,%ecx,4),%xmm4 .byte 15,20,236 // unpcklps %xmm4,%xmm5 .byte 102,15,20,238 // unpcklpd %xmm6,%xmm5 .byte 15,40,101,184 // movaps -0x48(%ebp),%xmm4 @@ -62752,13 +62728,14 @@ _sk_gradient_sse2: .byte 15,88,215 // addps %xmm7,%xmm2 .byte 15,89,216 // mulps %xmm0,%xmm3 .byte 15,88,221 // addps %xmm5,%xmm3 - .byte 139,69,240 // mov -0x10(%ebp),%eax - .byte 141,72,4 // lea 0x4(%eax),%ecx + .byte 139,69,12 // mov 0xc(%ebp),%eax + .byte 137,193 // mov %eax,%ecx + .byte 141,65,8 // lea 0x8(%ecx),%eax .byte 131,236,8 // sub $0x8,%esp .byte 15,40,196 // movaps %xmm4,%xmm0 - .byte 81 // push %ecx + .byte 80 // push %eax .byte 255,117,8 // pushl 0x8(%ebp) - .byte 255,16 // call *(%eax) + .byte 255,81,4 // call *0x4(%ecx) .byte 131,196,76 // add $0x4c,%esp .byte 94 // pop %esi .byte 95 // pop %edi @@ -62820,7 +62797,7 @@ _sk_xy_to_unit_angle_sse2: .byte 15,40,218 // movaps %xmm2,%xmm3 .byte 15,40,209 // movaps %xmm1,%xmm2 .byte 15,40,200 // movaps %xmm0,%xmm1 - .byte 232,0,0,0,0 // call 6a71 <_sk_xy_to_unit_angle_sse2+0x18> + .byte 232,0,0,0,0 // call 6a60 <_sk_xy_to_unit_angle_sse2+0x18> .byte 88 // pop %eax .byte 15,87,237 // xorps %xmm5,%xmm5 .byte 15,92,233 // subps %xmm1,%xmm5 @@ -62835,30 +62812,30 @@ _sk_xy_to_unit_angle_sse2: .byte 15,94,247 // divps %xmm7,%xmm6 .byte 15,40,254 // movaps %xmm6,%xmm7 .byte 15,89,255 // mulps %xmm7,%xmm7 - .byte 15,40,128,79,104,0,0 // movaps 0x684f(%eax),%xmm0 + .byte 15,40,128,64,104,0,0 // movaps 0x6840(%eax),%xmm0 .byte 15,89,199 // mulps %xmm7,%xmm0 - .byte 15,88,128,95,104,0,0 // addps 0x685f(%eax),%xmm0 + .byte 15,88,128,80,104,0,0 // addps 0x6850(%eax),%xmm0 .byte 15,89,199 // mulps %xmm7,%xmm0 - .byte 15,88,128,111,104,0,0 // addps 0x686f(%eax),%xmm0 + .byte 15,88,128,96,104,0,0 // addps 0x6860(%eax),%xmm0 .byte 15,89,199 // mulps %xmm7,%xmm0 - .byte 15,88,128,127,104,0,0 // addps 0x687f(%eax),%xmm0 + .byte 15,88,128,112,104,0,0 // addps 0x6870(%eax),%xmm0 .byte 15,89,198 // mulps %xmm6,%xmm0 .byte 15,194,236,1 // cmpltps %xmm4,%xmm5 - .byte 15,40,176,143,104,0,0 // movaps 0x688f(%eax),%xmm6 + .byte 15,40,176,128,104,0,0 // movaps 0x6880(%eax),%xmm6 .byte 15,92,240 // subps %xmm0,%xmm6 .byte 15,84,245 // andps %xmm5,%xmm6 .byte 15,85,232 // andnps %xmm0,%xmm5 .byte 15,87,228 // xorps %xmm4,%xmm4 .byte 15,86,238 // orps %xmm6,%xmm5 .byte 15,194,204,1 // cmpltps %xmm4,%xmm1 - .byte 15,40,128,95,98,0,0 // movaps 0x625f(%eax),%xmm0 + .byte 15,40,128,80,98,0,0 // movaps 0x6250(%eax),%xmm0 .byte 15,92,197 // subps %xmm5,%xmm0 .byte 15,84,193 // andps %xmm1,%xmm0 .byte 15,85,205 // andnps %xmm5,%xmm1 .byte 15,86,200 // orps %xmm0,%xmm1 .byte 15,40,194 // movaps %xmm2,%xmm0 .byte 15,194,196,1 // cmpltps %xmm4,%xmm0 - .byte 15,40,168,111,98,0,0 // movaps 0x626f(%eax),%xmm5 + .byte 15,40,168,96,98,0,0 // movaps 0x6260(%eax),%xmm5 .byte 15,92,233 // subps %xmm1,%xmm5 .byte 15,84,232 // andps %xmm0,%xmm5 .byte 15,85,193 // andnps %xmm1,%xmm0 @@ -62919,15 +62896,15 @@ _sk_xy_to_2pt_conical_quadratic_max_sse2: .byte 15,40,241 // movaps %xmm1,%xmm6 .byte 15,89,246 // mulps %xmm6,%xmm6 .byte 15,88,240 // addps %xmm0,%xmm6 - .byte 232,0,0,0,0 // call 6b8e <_sk_xy_to_2pt_conical_quadratic_max_sse2+0x31> + .byte 232,0,0,0,0 // call 6b7d <_sk_xy_to_2pt_conical_quadratic_max_sse2+0x31> .byte 90 // pop %edx .byte 243,15,89,237 // mulss %xmm5,%xmm5 .byte 15,198,237,0 // shufps $0x0,%xmm5,%xmm5 .byte 15,92,245 // subps %xmm5,%xmm6 .byte 243,15,16,65,32 // movss 0x20(%ecx),%xmm0 .byte 15,198,192,0 // shufps $0x0,%xmm0,%xmm0 - .byte 15,89,162,130,103,0,0 // mulps 0x6782(%edx),%xmm4 - .byte 15,89,130,146,103,0,0 // mulps 0x6792(%edx),%xmm0 + .byte 15,89,162,115,103,0,0 // mulps 0x6773(%edx),%xmm4 + .byte 15,89,130,131,103,0,0 // mulps 0x6783(%edx),%xmm0 .byte 15,89,198 // mulps %xmm6,%xmm0 .byte 15,40,236 // movaps %xmm4,%xmm5 .byte 15,89,237 // mulps %xmm5,%xmm5 @@ -62935,11 +62912,11 @@ _sk_xy_to_2pt_conical_quadratic_max_sse2: .byte 15,81,237 // sqrtps %xmm5,%xmm5 .byte 15,40,197 // movaps %xmm5,%xmm0 .byte 15,92,196 // subps %xmm4,%xmm0 - .byte 15,87,162,50,102,0,0 // xorps 0x6632(%edx),%xmm4 + .byte 15,87,162,35,102,0,0 // xorps 0x6623(%edx),%xmm4 .byte 15,92,229 // subps %xmm5,%xmm4 .byte 243,15,16,105,36 // movss 0x24(%ecx),%xmm5 .byte 15,198,237,0 // shufps $0x0,%xmm5,%xmm5 - .byte 15,89,170,66,97,0,0 // mulps 0x6142(%edx),%xmm5 + .byte 15,89,170,51,97,0,0 // mulps 0x6133(%edx),%xmm5 .byte 15,89,197 // mulps %xmm5,%xmm0 .byte 15,89,229 // mulps %xmm5,%xmm4 .byte 15,95,196 // maxps %xmm4,%xmm0 @@ -62970,15 +62947,15 @@ _sk_xy_to_2pt_conical_quadratic_min_sse2: .byte 15,40,241 // movaps %xmm1,%xmm6 .byte 15,89,246 // mulps %xmm6,%xmm6 .byte 15,88,240 // addps %xmm0,%xmm6 - .byte 232,0,0,0,0 // call 6c2c <_sk_xy_to_2pt_conical_quadratic_min_sse2+0x31> + .byte 232,0,0,0,0 // call 6c1b <_sk_xy_to_2pt_conical_quadratic_min_sse2+0x31> .byte 90 // pop %edx .byte 243,15,89,237 // mulss %xmm5,%xmm5 .byte 15,198,237,0 // shufps $0x0,%xmm5,%xmm5 .byte 15,92,245 // subps %xmm5,%xmm6 .byte 243,15,16,65,32 // movss 0x20(%ecx),%xmm0 .byte 15,198,192,0 // shufps $0x0,%xmm0,%xmm0 - .byte 15,89,162,228,102,0,0 // mulps 0x66e4(%edx),%xmm4 - .byte 15,89,130,244,102,0,0 // mulps 0x66f4(%edx),%xmm0 + .byte 15,89,162,213,102,0,0 // mulps 0x66d5(%edx),%xmm4 + .byte 15,89,130,229,102,0,0 // mulps 0x66e5(%edx),%xmm0 .byte 15,89,198 // mulps %xmm6,%xmm0 .byte 15,40,236 // movaps %xmm4,%xmm5 .byte 15,89,237 // mulps %xmm5,%xmm5 @@ -62986,11 +62963,11 @@ _sk_xy_to_2pt_conical_quadratic_min_sse2: .byte 15,81,237 // sqrtps %xmm5,%xmm5 .byte 15,40,197 // movaps %xmm5,%xmm0 .byte 15,92,196 // subps %xmm4,%xmm0 - .byte 15,87,162,148,101,0,0 // xorps 0x6594(%edx),%xmm4 + .byte 15,87,162,133,101,0,0 // xorps 0x6585(%edx),%xmm4 .byte 15,92,229 // subps %xmm5,%xmm4 .byte 243,15,16,105,36 // movss 0x24(%ecx),%xmm5 .byte 15,198,237,0 // shufps $0x0,%xmm5,%xmm5 - .byte 15,89,170,164,96,0,0 // mulps 0x60a4(%edx),%xmm5 + .byte 15,89,170,149,96,0,0 // mulps 0x6095(%edx),%xmm5 .byte 15,89,197 // mulps %xmm5,%xmm0 .byte 15,89,229 // mulps %xmm5,%xmm4 .byte 15,93,196 // minps %xmm4,%xmm0 @@ -63010,7 +62987,7 @@ _sk_xy_to_2pt_conical_linear_sse2: .byte 85 // push %ebp .byte 137,229 // mov %esp,%ebp .byte 131,236,8 // sub $0x8,%esp - .byte 232,0,0,0,0 // call 6ca4 <_sk_xy_to_2pt_conical_linear_sse2+0xb> + .byte 232,0,0,0,0 // call 6c93 <_sk_xy_to_2pt_conical_linear_sse2+0xb> .byte 89 // pop %ecx .byte 139,69,12 // mov 0xc(%ebp),%eax .byte 139,16 // mov (%eax),%edx @@ -63019,7 +62996,7 @@ _sk_xy_to_2pt_conical_linear_sse2: .byte 243,15,89,236 // mulss %xmm4,%xmm5 .byte 15,198,237,0 // shufps $0x0,%xmm5,%xmm5 .byte 15,88,232 // addps %xmm0,%xmm5 - .byte 15,89,169,108,102,0,0 // mulps 0x666c(%ecx),%xmm5 + .byte 15,89,169,93,102,0,0 // mulps 0x665d(%ecx),%xmm5 .byte 15,89,192 // mulps %xmm0,%xmm0 .byte 15,40,241 // movaps %xmm1,%xmm6 .byte 15,89,246 // mulps %xmm6,%xmm6 @@ -63027,7 +63004,7 @@ _sk_xy_to_2pt_conical_linear_sse2: .byte 243,15,89,228 // mulss %xmm4,%xmm4 .byte 15,198,228,0 // shufps $0x0,%xmm4,%xmm4 .byte 15,92,196 // subps %xmm4,%xmm0 - .byte 15,87,129,28,101,0,0 // xorps 0x651c(%ecx),%xmm0 + .byte 15,87,129,13,101,0,0 // xorps 0x650d(%ecx),%xmm0 .byte 15,94,197 // divps %xmm5,%xmm0 .byte 141,72,8 // lea 0x8(%eax),%ecx .byte 131,236,8 // sub $0x8,%esp @@ -63104,16 +63081,16 @@ _sk_save_xy_sse2: .byte 131,236,24 // sub $0x18,%esp .byte 15,41,93,232 // movaps %xmm3,-0x18(%ebp) .byte 15,40,218 // movaps %xmm2,%xmm3 - .byte 232,0,0,0,0 // call 6d8d <_sk_save_xy_sse2+0x12> + .byte 232,0,0,0,0 // call 6d7c <_sk_save_xy_sse2+0x12> .byte 88 // pop %eax - .byte 15,40,160,67,95,0,0 // movaps 0x5f43(%eax),%xmm4 + .byte 15,40,160,52,95,0,0 // movaps 0x5f34(%eax),%xmm4 .byte 15,40,232 // movaps %xmm0,%xmm5 .byte 15,88,236 // addps %xmm4,%xmm5 .byte 243,15,91,245 // cvttps2dq %xmm5,%xmm6 .byte 15,91,246 // cvtdq2ps %xmm6,%xmm6 .byte 15,40,253 // movaps %xmm5,%xmm7 .byte 15,194,254,1 // cmpltps %xmm6,%xmm7 - .byte 15,40,144,83,95,0,0 // movaps 0x5f53(%eax),%xmm2 + .byte 15,40,144,68,95,0,0 // movaps 0x5f44(%eax),%xmm2 .byte 15,84,250 // andps %xmm2,%xmm7 .byte 15,92,247 // subps %xmm7,%xmm6 .byte 15,92,238 // subps %xmm6,%xmm5 @@ -63188,15 +63165,15 @@ _sk_bilinear_nx_sse2: .byte 137,229 // mov %esp,%ebp .byte 86 // push %esi .byte 80 // push %eax - .byte 232,0,0,0,0 // call 6e6f <_sk_bilinear_nx_sse2+0xa> + .byte 232,0,0,0,0 // call 6e5e <_sk_bilinear_nx_sse2+0xa> .byte 88 // pop %eax .byte 139,77,8 // mov 0x8(%ebp),%ecx .byte 139,85,12 // mov 0xc(%ebp),%edx .byte 139,50 // mov (%edx),%esi .byte 15,16,6 // movups (%esi),%xmm0 .byte 15,16,102,64 // movups 0x40(%esi),%xmm4 - .byte 15,88,128,193,100,0,0 // addps 0x64c1(%eax),%xmm0 - .byte 15,40,168,113,94,0,0 // movaps 0x5e71(%eax),%xmm5 + .byte 15,88,128,178,100,0,0 // addps 0x64b2(%eax),%xmm0 + .byte 15,40,168,98,94,0,0 // movaps 0x5e62(%eax),%xmm5 .byte 15,92,236 // subps %xmm4,%xmm5 .byte 15,17,174,128,0,0,0 // movups %xmm5,0x80(%esi) .byte 141,66,8 // lea 0x8(%edx),%eax @@ -63217,14 +63194,14 @@ _sk_bilinear_px_sse2: .byte 137,229 // mov %esp,%ebp .byte 86 // push %esi .byte 80 // push %eax - .byte 232,0,0,0,0 // call 6eb2 <_sk_bilinear_px_sse2+0xa> + .byte 232,0,0,0,0 // call 6ea1 <_sk_bilinear_px_sse2+0xa> .byte 88 // pop %eax .byte 139,77,8 // mov 0x8(%ebp),%ecx .byte 139,85,12 // mov 0xc(%ebp),%edx .byte 139,50 // mov (%edx),%esi .byte 15,16,6 // movups (%esi),%xmm0 .byte 15,16,102,64 // movups 0x40(%esi),%xmm4 - .byte 15,88,128,30,94,0,0 // addps 0x5e1e(%eax),%xmm0 + .byte 15,88,128,15,94,0,0 // addps 0x5e0f(%eax),%xmm0 .byte 15,17,166,128,0,0,0 // movups %xmm4,0x80(%esi) .byte 141,66,8 // lea 0x8(%edx),%eax .byte 131,236,8 // sub $0x8,%esp @@ -63244,15 +63221,15 @@ _sk_bilinear_ny_sse2: .byte 137,229 // mov %esp,%ebp .byte 86 // push %esi .byte 80 // push %eax - .byte 232,0,0,0,0 // call 6eeb <_sk_bilinear_ny_sse2+0xa> + .byte 232,0,0,0,0 // call 6eda <_sk_bilinear_ny_sse2+0xa> .byte 88 // pop %eax .byte 139,77,8 // mov 0x8(%ebp),%ecx .byte 139,85,12 // mov 0xc(%ebp),%edx .byte 139,50 // mov (%edx),%esi .byte 15,16,78,32 // movups 0x20(%esi),%xmm1 .byte 15,16,102,96 // movups 0x60(%esi),%xmm4 - .byte 15,88,136,69,100,0,0 // addps 0x6445(%eax),%xmm1 - .byte 15,40,168,245,93,0,0 // movaps 0x5df5(%eax),%xmm5 + .byte 15,88,136,54,100,0,0 // addps 0x6436(%eax),%xmm1 + .byte 15,40,168,230,93,0,0 // movaps 0x5de6(%eax),%xmm5 .byte 15,92,236 // subps %xmm4,%xmm5 .byte 15,17,174,160,0,0,0 // movups %xmm5,0xa0(%esi) .byte 141,66,8 // lea 0x8(%edx),%eax @@ -63273,14 +63250,14 @@ _sk_bilinear_py_sse2: .byte 137,229 // mov %esp,%ebp .byte 86 // push %esi .byte 80 // push %eax - .byte 232,0,0,0,0 // call 6f2f <_sk_bilinear_py_sse2+0xa> + .byte 232,0,0,0,0 // call 6f1e <_sk_bilinear_py_sse2+0xa> .byte 88 // pop %eax .byte 139,77,8 // mov 0x8(%ebp),%ecx .byte 139,85,12 // mov 0xc(%ebp),%edx .byte 139,50 // mov (%edx),%esi .byte 15,16,78,32 // movups 0x20(%esi),%xmm1 .byte 15,16,102,96 // movups 0x60(%esi),%xmm4 - .byte 15,88,136,161,93,0,0 // addps 0x5da1(%eax),%xmm1 + .byte 15,88,136,146,93,0,0 // addps 0x5d92(%eax),%xmm1 .byte 15,17,166,160,0,0,0 // movups %xmm4,0xa0(%esi) .byte 141,66,8 // lea 0x8(%edx),%eax .byte 131,236,8 // sub $0x8,%esp @@ -63300,20 +63277,20 @@ _sk_bicubic_n3x_sse2: .byte 137,229 // mov %esp,%ebp .byte 86 // push %esi .byte 80 // push %eax - .byte 232,0,0,0,0 // call 6f69 <_sk_bicubic_n3x_sse2+0xa> + .byte 232,0,0,0,0 // call 6f58 <_sk_bicubic_n3x_sse2+0xa> .byte 88 // pop %eax .byte 139,77,8 // mov 0x8(%ebp),%ecx .byte 139,85,12 // mov 0xc(%ebp),%edx .byte 139,50 // mov (%edx),%esi .byte 15,16,6 // movups (%esi),%xmm0 .byte 15,16,102,64 // movups 0x40(%esi),%xmm4 - .byte 15,88,128,215,99,0,0 // addps 0x63d7(%eax),%xmm0 - .byte 15,40,168,119,93,0,0 // movaps 0x5d77(%eax),%xmm5 + .byte 15,88,128,200,99,0,0 // addps 0x63c8(%eax),%xmm0 + .byte 15,40,168,104,93,0,0 // movaps 0x5d68(%eax),%xmm5 .byte 15,92,236 // subps %xmm4,%xmm5 .byte 15,40,229 // movaps %xmm5,%xmm4 .byte 15,89,228 // mulps %xmm4,%xmm4 - .byte 15,89,168,231,99,0,0 // mulps 0x63e7(%eax),%xmm5 - .byte 15,88,168,87,95,0,0 // addps 0x5f57(%eax),%xmm5 + .byte 15,89,168,216,99,0,0 // mulps 0x63d8(%eax),%xmm5 + .byte 15,88,168,72,95,0,0 // addps 0x5f48(%eax),%xmm5 .byte 15,89,236 // mulps %xmm4,%xmm5 .byte 15,17,174,128,0,0,0 // movups %xmm5,0x80(%esi) .byte 141,66,8 // lea 0x8(%edx),%eax @@ -63334,23 +63311,23 @@ _sk_bicubic_n1x_sse2: .byte 137,229 // mov %esp,%ebp .byte 86 // push %esi .byte 80 // push %eax - .byte 232,0,0,0,0 // call 6fc3 <_sk_bicubic_n1x_sse2+0xa> + .byte 232,0,0,0,0 // call 6fb2 <_sk_bicubic_n1x_sse2+0xa> .byte 88 // pop %eax .byte 139,77,8 // mov 0x8(%ebp),%ecx .byte 139,85,12 // mov 0xc(%ebp),%edx .byte 139,50 // mov (%edx),%esi .byte 15,16,6 // movups (%esi),%xmm0 .byte 15,16,102,64 // movups 0x40(%esi),%xmm4 - .byte 15,88,128,109,99,0,0 // addps 0x636d(%eax),%xmm0 - .byte 15,40,168,29,93,0,0 // movaps 0x5d1d(%eax),%xmm5 + .byte 15,88,128,94,99,0,0 // addps 0x635e(%eax),%xmm0 + .byte 15,40,168,14,93,0,0 // movaps 0x5d0e(%eax),%xmm5 .byte 15,92,236 // subps %xmm4,%xmm5 - .byte 15,40,160,157,99,0,0 // movaps 0x639d(%eax),%xmm4 + .byte 15,40,160,142,99,0,0 // movaps 0x638e(%eax),%xmm4 .byte 15,89,229 // mulps %xmm5,%xmm4 - .byte 15,88,160,173,99,0,0 // addps 0x63ad(%eax),%xmm4 + .byte 15,88,160,158,99,0,0 // addps 0x639e(%eax),%xmm4 .byte 15,89,229 // mulps %xmm5,%xmm4 - .byte 15,88,160,13,93,0,0 // addps 0x5d0d(%eax),%xmm4 + .byte 15,88,160,254,92,0,0 // addps 0x5cfe(%eax),%xmm4 .byte 15,89,229 // mulps %xmm5,%xmm4 - .byte 15,88,160,189,99,0,0 // addps 0x63bd(%eax),%xmm4 + .byte 15,88,160,174,99,0,0 // addps 0x63ae(%eax),%xmm4 .byte 15,17,166,128,0,0,0 // movups %xmm4,0x80(%esi) .byte 141,66,8 // lea 0x8(%edx),%eax .byte 131,236,8 // sub $0x8,%esp @@ -63370,22 +63347,22 @@ _sk_bicubic_p1x_sse2: .byte 137,229 // mov %esp,%ebp .byte 86 // push %esi .byte 80 // push %eax - .byte 232,0,0,0,0 // call 702b <_sk_bicubic_p1x_sse2+0xa> + .byte 232,0,0,0,0 // call 701a <_sk_bicubic_p1x_sse2+0xa> .byte 88 // pop %eax .byte 139,77,8 // mov 0x8(%ebp),%ecx .byte 139,85,12 // mov 0xc(%ebp),%edx .byte 139,50 // mov (%edx),%esi - .byte 15,40,160,165,92,0,0 // movaps 0x5ca5(%eax),%xmm4 + .byte 15,40,160,150,92,0,0 // movaps 0x5c96(%eax),%xmm4 .byte 15,16,6 // movups (%esi),%xmm0 .byte 15,16,110,64 // movups 0x40(%esi),%xmm5 .byte 15,88,196 // addps %xmm4,%xmm0 - .byte 15,40,176,53,99,0,0 // movaps 0x6335(%eax),%xmm6 + .byte 15,40,176,38,99,0,0 // movaps 0x6326(%eax),%xmm6 .byte 15,89,245 // mulps %xmm5,%xmm6 - .byte 15,88,176,69,99,0,0 // addps 0x6345(%eax),%xmm6 + .byte 15,88,176,54,99,0,0 // addps 0x6336(%eax),%xmm6 .byte 15,89,245 // mulps %xmm5,%xmm6 .byte 15,88,244 // addps %xmm4,%xmm6 .byte 15,89,245 // mulps %xmm5,%xmm6 - .byte 15,88,176,85,99,0,0 // addps 0x6355(%eax),%xmm6 + .byte 15,88,176,70,99,0,0 // addps 0x6346(%eax),%xmm6 .byte 15,17,182,128,0,0,0 // movups %xmm6,0x80(%esi) .byte 141,66,8 // lea 0x8(%edx),%eax .byte 131,236,8 // sub $0x8,%esp @@ -63405,18 +63382,18 @@ _sk_bicubic_p3x_sse2: .byte 137,229 // mov %esp,%ebp .byte 86 // push %esi .byte 80 // push %eax - .byte 232,0,0,0,0 // call 7088 <_sk_bicubic_p3x_sse2+0xa> + .byte 232,0,0,0,0 // call 7077 <_sk_bicubic_p3x_sse2+0xa> .byte 88 // pop %eax .byte 139,77,8 // mov 0x8(%ebp),%ecx .byte 139,85,12 // mov 0xc(%ebp),%edx .byte 139,50 // mov (%edx),%esi .byte 15,16,6 // movups (%esi),%xmm0 .byte 15,16,102,64 // movups 0x40(%esi),%xmm4 - .byte 15,88,128,232,98,0,0 // addps 0x62e8(%eax),%xmm0 + .byte 15,88,128,217,98,0,0 // addps 0x62d9(%eax),%xmm0 .byte 15,40,236 // movaps %xmm4,%xmm5 .byte 15,89,237 // mulps %xmm5,%xmm5 - .byte 15,89,160,200,98,0,0 // mulps 0x62c8(%eax),%xmm4 - .byte 15,88,160,56,94,0,0 // addps 0x5e38(%eax),%xmm4 + .byte 15,89,160,185,98,0,0 // mulps 0x62b9(%eax),%xmm4 + .byte 15,88,160,41,94,0,0 // addps 0x5e29(%eax),%xmm4 .byte 15,89,229 // mulps %xmm5,%xmm4 .byte 15,17,166,128,0,0,0 // movups %xmm4,0x80(%esi) .byte 141,66,8 // lea 0x8(%edx),%eax @@ -63437,20 +63414,20 @@ _sk_bicubic_n3y_sse2: .byte 137,229 // mov %esp,%ebp .byte 86 // push %esi .byte 80 // push %eax - .byte 232,0,0,0,0 // call 70d8 <_sk_bicubic_n3y_sse2+0xa> + .byte 232,0,0,0,0 // call 70c7 <_sk_bicubic_n3y_sse2+0xa> .byte 88 // pop %eax .byte 139,77,8 // mov 0x8(%ebp),%ecx .byte 139,85,12 // mov 0xc(%ebp),%edx .byte 139,50 // mov (%edx),%esi .byte 15,16,78,32 // movups 0x20(%esi),%xmm1 .byte 15,16,102,96 // movups 0x60(%esi),%xmm4 - .byte 15,88,136,104,98,0,0 // addps 0x6268(%eax),%xmm1 - .byte 15,40,168,8,92,0,0 // movaps 0x5c08(%eax),%xmm5 + .byte 15,88,136,89,98,0,0 // addps 0x6259(%eax),%xmm1 + .byte 15,40,168,249,91,0,0 // movaps 0x5bf9(%eax),%xmm5 .byte 15,92,236 // subps %xmm4,%xmm5 .byte 15,40,229 // movaps %xmm5,%xmm4 .byte 15,89,228 // mulps %xmm4,%xmm4 - .byte 15,89,168,120,98,0,0 // mulps 0x6278(%eax),%xmm5 - .byte 15,88,168,232,93,0,0 // addps 0x5de8(%eax),%xmm5 + .byte 15,89,168,105,98,0,0 // mulps 0x6269(%eax),%xmm5 + .byte 15,88,168,217,93,0,0 // addps 0x5dd9(%eax),%xmm5 .byte 15,89,236 // mulps %xmm4,%xmm5 .byte 15,17,174,160,0,0,0 // movups %xmm5,0xa0(%esi) .byte 141,66,8 // lea 0x8(%edx),%eax @@ -63471,23 +63448,23 @@ _sk_bicubic_n1y_sse2: .byte 137,229 // mov %esp,%ebp .byte 86 // push %esi .byte 80 // push %eax - .byte 232,0,0,0,0 // call 7133 <_sk_bicubic_n1y_sse2+0xa> + .byte 232,0,0,0,0 // call 7122 <_sk_bicubic_n1y_sse2+0xa> .byte 88 // pop %eax .byte 139,77,8 // mov 0x8(%ebp),%ecx .byte 139,85,12 // mov 0xc(%ebp),%edx .byte 139,50 // mov (%edx),%esi .byte 15,16,78,32 // movups 0x20(%esi),%xmm1 .byte 15,16,102,96 // movups 0x60(%esi),%xmm4 - .byte 15,88,136,253,97,0,0 // addps 0x61fd(%eax),%xmm1 - .byte 15,40,168,173,91,0,0 // movaps 0x5bad(%eax),%xmm5 + .byte 15,88,136,238,97,0,0 // addps 0x61ee(%eax),%xmm1 + .byte 15,40,168,158,91,0,0 // movaps 0x5b9e(%eax),%xmm5 .byte 15,92,236 // subps %xmm4,%xmm5 - .byte 15,40,160,45,98,0,0 // movaps 0x622d(%eax),%xmm4 + .byte 15,40,160,30,98,0,0 // movaps 0x621e(%eax),%xmm4 .byte 15,89,229 // mulps %xmm5,%xmm4 - .byte 15,88,160,61,98,0,0 // addps 0x623d(%eax),%xmm4 + .byte 15,88,160,46,98,0,0 // addps 0x622e(%eax),%xmm4 .byte 15,89,229 // mulps %xmm5,%xmm4 - .byte 15,88,160,157,91,0,0 // addps 0x5b9d(%eax),%xmm4 + .byte 15,88,160,142,91,0,0 // addps 0x5b8e(%eax),%xmm4 .byte 15,89,229 // mulps %xmm5,%xmm4 - .byte 15,88,160,77,98,0,0 // addps 0x624d(%eax),%xmm4 + .byte 15,88,160,62,98,0,0 // addps 0x623e(%eax),%xmm4 .byte 15,17,166,160,0,0,0 // movups %xmm4,0xa0(%esi) .byte 141,66,8 // lea 0x8(%edx),%eax .byte 131,236,8 // sub $0x8,%esp @@ -63507,22 +63484,22 @@ _sk_bicubic_p1y_sse2: .byte 137,229 // mov %esp,%ebp .byte 86 // push %esi .byte 80 // push %eax - .byte 232,0,0,0,0 // call 719c <_sk_bicubic_p1y_sse2+0xa> + .byte 232,0,0,0,0 // call 718b <_sk_bicubic_p1y_sse2+0xa> .byte 88 // pop %eax .byte 139,77,8 // mov 0x8(%ebp),%ecx .byte 139,85,12 // mov 0xc(%ebp),%edx .byte 139,50 // mov (%edx),%esi - .byte 15,40,160,52,91,0,0 // movaps 0x5b34(%eax),%xmm4 + .byte 15,40,160,37,91,0,0 // movaps 0x5b25(%eax),%xmm4 .byte 15,16,78,32 // movups 0x20(%esi),%xmm1 .byte 15,16,110,96 // movups 0x60(%esi),%xmm5 .byte 15,88,204 // addps %xmm4,%xmm1 - .byte 15,40,176,196,97,0,0 // movaps 0x61c4(%eax),%xmm6 + .byte 15,40,176,181,97,0,0 // movaps 0x61b5(%eax),%xmm6 .byte 15,89,245 // mulps %xmm5,%xmm6 - .byte 15,88,176,212,97,0,0 // addps 0x61d4(%eax),%xmm6 + .byte 15,88,176,197,97,0,0 // addps 0x61c5(%eax),%xmm6 .byte 15,89,245 // mulps %xmm5,%xmm6 .byte 15,88,244 // addps %xmm4,%xmm6 .byte 15,89,245 // mulps %xmm5,%xmm6 - .byte 15,88,176,228,97,0,0 // addps 0x61e4(%eax),%xmm6 + .byte 15,88,176,213,97,0,0 // addps 0x61d5(%eax),%xmm6 .byte 15,17,182,160,0,0,0 // movups %xmm6,0xa0(%esi) .byte 141,66,8 // lea 0x8(%edx),%eax .byte 131,236,8 // sub $0x8,%esp @@ -63542,18 +63519,18 @@ _sk_bicubic_p3y_sse2: .byte 137,229 // mov %esp,%ebp .byte 86 // push %esi .byte 80 // push %eax - .byte 232,0,0,0,0 // call 71fa <_sk_bicubic_p3y_sse2+0xa> + .byte 232,0,0,0,0 // call 71e9 <_sk_bicubic_p3y_sse2+0xa> .byte 88 // pop %eax .byte 139,77,8 // mov 0x8(%ebp),%ecx .byte 139,85,12 // mov 0xc(%ebp),%edx .byte 139,50 // mov (%edx),%esi .byte 15,16,78,32 // movups 0x20(%esi),%xmm1 .byte 15,16,102,96 // movups 0x60(%esi),%xmm4 - .byte 15,88,136,118,97,0,0 // addps 0x6176(%eax),%xmm1 + .byte 15,88,136,103,97,0,0 // addps 0x6167(%eax),%xmm1 .byte 15,40,236 // movaps %xmm4,%xmm5 .byte 15,89,237 // mulps %xmm5,%xmm5 - .byte 15,89,160,86,97,0,0 // mulps 0x6156(%eax),%xmm4 - .byte 15,88,160,198,92,0,0 // addps 0x5cc6(%eax),%xmm4 + .byte 15,89,160,71,97,0,0 // mulps 0x6147(%eax),%xmm4 + .byte 15,88,160,183,92,0,0 // addps 0x5cb7(%eax),%xmm4 .byte 15,89,229 // mulps %xmm5,%xmm4 .byte 15,17,166,160,0,0,0 // movups %xmm4,0xa0(%esi) .byte 141,66,8 // lea 0x8(%edx),%eax @@ -63576,10 +63553,10 @@ _sk_callback_sse2: .byte 87 // push %edi .byte 86 // push %esi .byte 131,236,12 // sub $0xc,%esp - .byte 139,117,12 // mov 0xc(%ebp),%esi - .byte 139,125,8 // mov 0x8(%ebp),%edi - .byte 139,71,8 // mov 0x8(%edi),%eax - .byte 139,30 // mov (%esi),%ebx + .byte 139,117,8 // mov 0x8(%ebp),%esi + .byte 139,125,12 // mov 0xc(%ebp),%edi + .byte 139,31 // mov (%edi),%ebx + .byte 139,70,8 // mov 0x8(%esi),%eax .byte 15,40,224 // movaps %xmm0,%xmm4 .byte 15,20,225 // unpcklps %xmm1,%xmm4 .byte 15,40,234 // movaps %xmm2,%xmm5 @@ -63621,11 +63598,11 @@ _sk_callback_sse2: .byte 15,40,212 // movaps %xmm4,%xmm2 .byte 102,15,20,211 // unpcklpd %xmm3,%xmm2 .byte 15,18,220 // movhlps %xmm4,%xmm3 - .byte 141,70,8 // lea 0x8(%esi),%eax + .byte 141,71,8 // lea 0x8(%edi),%eax .byte 131,236,8 // sub $0x8,%esp .byte 80 // push %eax - .byte 87 // push %edi - .byte 255,86,4 // call *0x4(%esi) + .byte 86 // push %esi + .byte 255,87,4 // call *0x4(%edi) .byte 131,196,28 // add $0x1c,%esp .byte 94 // pop %esi .byte 95 // pop %edi @@ -63642,12 +63619,10 @@ _sk_clut_3D_sse2: .byte 83 // push %ebx .byte 87 // push %edi .byte 86 // push %esi - .byte 129,236,44,1,0,0 // sub $0x12c,%esp - .byte 15,41,157,200,254,255,255 // movaps %xmm3,-0x138(%ebp) + .byte 129,236,28,1,0,0 // sub $0x11c,%esp + .byte 15,41,157,216,254,255,255 // movaps %xmm3,-0x128(%ebp) .byte 15,40,216 // movaps %xmm0,%xmm3 .byte 139,69,12 // mov 0xc(%ebp),%eax - .byte 141,72,4 // lea 0x4(%eax),%ecx - .byte 137,141,20,255,255,255 // mov %ecx,-0xec(%ebp) .byte 139,8 // mov (%eax),%ecx .byte 139,81,12 // mov 0xc(%ecx),%edx .byte 141,114,255 // lea -0x1(%edx),%esi @@ -63656,7 +63631,7 @@ _sk_clut_3D_sse2: .byte 15,91,192 // cvtdq2ps %xmm0,%xmm0 .byte 15,89,194 // mulps %xmm2,%xmm0 .byte 15,40,224 // movaps %xmm0,%xmm4 - .byte 15,41,165,232,254,255,255 // movaps %xmm4,-0x118(%ebp) + .byte 15,41,165,248,254,255,255 // movaps %xmm4,-0x108(%ebp) .byte 102,15,110,194 // movd %edx,%xmm0 .byte 102,15,112,240,0 // pshufd $0x0,%xmm0,%xmm6 .byte 102,15,127,117,152 // movdqa %xmm6,-0x68(%ebp) @@ -63698,15 +63673,15 @@ _sk_clut_3D_sse2: .byte 102,15,112,192,232 // pshufd $0xe8,%xmm0,%xmm0 .byte 102,15,98,200 // punpckldq %xmm0,%xmm1 .byte 102,15,127,77,136 // movdqa %xmm1,-0x78(%ebp) - .byte 232,0,0,0,0 // call 73e6 <_sk_clut_3D_sse2+0xf7> + .byte 232,0,0,0,0 // call 73cc <_sk_clut_3D_sse2+0xee> .byte 90 // pop %edx .byte 243,15,91,196 // cvttps2dq %xmm4,%xmm0 - .byte 102,15,127,133,248,254,255,255 // movdqa %xmm0,-0x108(%ebp) + .byte 102,15,127,133,8,255,255,255 // movdqa %xmm0,-0xf8(%ebp) .byte 102,15,111,221 // movdqa %xmm5,%xmm3 .byte 102,15,254,216 // paddd %xmm0,%xmm3 .byte 102,15,111,193 // movdqa %xmm1,%xmm0 .byte 102,15,254,195 // paddd %xmm3,%xmm0 - .byte 102,15,111,162,186,95,0,0 // movdqa 0x5fba(%edx),%xmm4 + .byte 102,15,111,162,180,95,0,0 // movdqa 0x5fb4(%edx),%xmm4 .byte 102,15,127,165,120,255,255,255 // movdqa %xmm4,-0x88(%ebp) .byte 102,15,112,200,245 // pshufd $0xf5,%xmm0,%xmm1 .byte 102,15,244,196 // pmuludq %xmm4,%xmm0 @@ -63746,7 +63721,7 @@ _sk_clut_3D_sse2: .byte 243,15,16,4,129 // movss (%ecx,%eax,4),%xmm0 .byte 15,20,248 // unpcklps %xmm0,%xmm7 .byte 102,15,20,252 // unpcklpd %xmm4,%xmm7 - .byte 102,15,111,130,58,89,0,0 // movdqa 0x593a(%edx),%xmm0 + .byte 102,15,111,130,52,89,0,0 // movdqa 0x5934(%edx),%xmm0 .byte 102,15,127,133,104,255,255,255 // movdqa %xmm0,-0x98(%ebp) .byte 102,15,254,200 // paddd %xmm0,%xmm1 .byte 102,15,112,193,229 // pshufd $0xe5,%xmm1,%xmm0 @@ -63763,8 +63738,8 @@ _sk_clut_3D_sse2: .byte 243,15,16,4,129 // movss (%ecx,%eax,4),%xmm0 .byte 15,20,240 // unpcklps %xmm0,%xmm6 .byte 102,15,20,241 // unpcklpd %xmm1,%xmm6 - .byte 15,40,130,170,95,0,0 // movaps 0x5faa(%edx),%xmm0 - .byte 15,40,141,232,254,255,255 // movaps -0x118(%ebp),%xmm1 + .byte 15,40,130,164,95,0,0 // movaps 0x5fa4(%edx),%xmm0 + .byte 15,40,141,248,254,255,255 // movaps -0x108(%ebp),%xmm1 .byte 15,88,200 // addps %xmm0,%xmm1 .byte 15,41,77,200 // movaps %xmm1,-0x38(%ebp) .byte 15,40,141,88,255,255,255 // movaps -0xa8(%ebp),%xmm1 @@ -63848,7 +63823,7 @@ _sk_clut_3D_sse2: .byte 15,92,206 // subps %xmm6,%xmm1 .byte 15,89,204 // mulps %xmm4,%xmm1 .byte 15,88,206 // addps %xmm6,%xmm1 - .byte 15,41,141,216,254,255,255 // movaps %xmm1,-0x128(%ebp) + .byte 15,41,141,232,254,255,255 // movaps %xmm1,-0x118(%ebp) .byte 243,15,91,133,72,255,255,255 // cvttps2dq -0xb8(%ebp),%xmm0 .byte 102,15,112,224,245 // pshufd $0xf5,%xmm0,%xmm4 .byte 102,15,111,77,152 // movdqa -0x68(%ebp),%xmm1 @@ -63859,7 +63834,7 @@ _sk_clut_3D_sse2: .byte 102,15,112,196,232 // pshufd $0xe8,%xmm4,%xmm0 .byte 102,15,98,248 // punpckldq %xmm0,%xmm7 .byte 102,15,127,125,152 // movdqa %xmm7,-0x68(%ebp) - .byte 102,15,254,189,248,254,255,255 // paddd -0x108(%ebp),%xmm7 + .byte 102,15,254,189,8,255,255,255 // paddd -0xf8(%ebp),%xmm7 .byte 102,15,111,199 // movdqa %xmm7,%xmm0 .byte 102,15,254,69,136 // paddd -0x78(%ebp),%xmm0 .byte 102,15,112,224,245 // pshufd $0xf5,%xmm0,%xmm4 @@ -63996,7 +63971,7 @@ _sk_clut_3D_sse2: .byte 15,89,212 // mulps %xmm4,%xmm2 .byte 15,88,208 // addps %xmm0,%xmm2 .byte 15,41,149,56,255,255,255 // movaps %xmm2,-0xc8(%ebp) - .byte 15,40,133,216,254,255,255 // movaps -0x128(%ebp),%xmm0 + .byte 15,40,133,232,254,255,255 // movaps -0x118(%ebp),%xmm0 .byte 15,92,216 // subps %xmm0,%xmm3 .byte 15,89,220 // mulps %xmm4,%xmm3 .byte 15,88,216 // addps %xmm0,%xmm3 @@ -64267,8 +64242,8 @@ _sk_clut_3D_sse2: .byte 15,92,214 // subps %xmm6,%xmm2 .byte 15,89,211 // mulps %xmm3,%xmm2 .byte 15,88,214 // addps %xmm6,%xmm2 - .byte 15,91,157,248,254,255,255 // cvtdq2ps -0x108(%ebp),%xmm3 - .byte 15,40,165,232,254,255,255 // movaps -0x118(%ebp),%xmm4 + .byte 15,91,157,8,255,255,255 // cvtdq2ps -0xf8(%ebp),%xmm3 + .byte 15,40,165,248,254,255,255 // movaps -0x108(%ebp),%xmm4 .byte 15,92,227 // subps %xmm3,%xmm4 .byte 15,40,93,184 // movaps -0x48(%ebp),%xmm3 .byte 15,92,195 // subps %xmm3,%xmm0 @@ -64282,15 +64257,14 @@ _sk_clut_3D_sse2: .byte 15,92,211 // subps %xmm3,%xmm2 .byte 15,89,212 // mulps %xmm4,%xmm2 .byte 15,88,211 // addps %xmm3,%xmm2 - .byte 139,69,8 // mov 0x8(%ebp),%eax - .byte 139,85,12 // mov 0xc(%ebp),%edx - .byte 141,74,8 // lea 0x8(%edx),%ecx + .byte 139,77,12 // mov 0xc(%ebp),%ecx + .byte 141,65,8 // lea 0x8(%ecx),%eax .byte 131,236,8 // sub $0x8,%esp - .byte 15,40,157,200,254,255,255 // movaps -0x138(%ebp),%xmm3 - .byte 81 // push %ecx + .byte 15,40,157,216,254,255,255 // movaps -0x128(%ebp),%xmm3 .byte 80 // push %eax - .byte 255,82,4 // call *0x4(%edx) - .byte 129,196,60,1,0,0 // add $0x13c,%esp + .byte 255,117,8 // pushl 0x8(%ebp) + .byte 255,81,4 // call *0x4(%ecx) + .byte 129,196,44,1,0,0 // add $0x12c,%esp .byte 94 // pop %esi .byte 95 // pop %edi .byte 91 // pop %ebx @@ -64306,10 +64280,8 @@ _sk_clut_4D_sse2: .byte 83 // push %ebx .byte 87 // push %edi .byte 86 // push %esi - .byte 129,236,92,1,0,0 // sub $0x15c,%esp + .byte 129,236,76,1,0,0 // sub $0x14c,%esp .byte 139,69,12 // mov 0xc(%ebp),%eax - .byte 141,72,4 // lea 0x4(%eax),%ecx - .byte 137,141,212,254,255,255 // mov %ecx,-0x12c(%ebp) .byte 139,16 // mov (%eax),%edx .byte 139,74,16 // mov 0x10(%edx),%ecx .byte 141,113,255 // lea -0x1(%ecx),%esi @@ -64386,18 +64358,18 @@ _sk_clut_4D_sse2: .byte 102,15,112,201,232 // pshufd $0xe8,%xmm1,%xmm1 .byte 102,15,98,217 // punpckldq %xmm1,%xmm3 .byte 102,15,127,93,152 // movdqa %xmm3,-0x68(%ebp) - .byte 232,0,0,0,0 // call 7f7c <_sk_clut_4D_sse2+0x16e> + .byte 232,0,0,0,0 // call 7f58 <_sk_clut_4D_sse2+0x165> .byte 89 // pop %ecx .byte 15,40,197 // movaps %xmm5,%xmm0 - .byte 15,41,133,152,254,255,255 // movaps %xmm0,-0x168(%ebp) + .byte 15,41,133,168,254,255,255 // movaps %xmm0,-0x158(%ebp) .byte 243,15,91,200 // cvttps2dq %xmm0,%xmm1 - .byte 102,15,127,141,184,254,255,255 // movdqa %xmm1,-0x148(%ebp) + .byte 102,15,127,141,200,254,255,255 // movdqa %xmm1,-0x138(%ebp) .byte 102,15,254,241 // paddd %xmm1,%xmm6 .byte 102,15,127,117,200 // movdqa %xmm6,-0x38(%ebp) .byte 102,15,111,212 // movdqa %xmm4,%xmm2 .byte 102,15,254,214 // paddd %xmm6,%xmm2 .byte 102,15,254,218 // paddd %xmm2,%xmm3 - .byte 102,15,111,161,36,84,0,0 // movdqa 0x5424(%ecx),%xmm4 + .byte 102,15,111,161,40,84,0,0 // movdqa 0x5428(%ecx),%xmm4 .byte 102,15,112,203,245 // pshufd $0xf5,%xmm3,%xmm1 .byte 102,15,244,220 // pmuludq %xmm4,%xmm3 .byte 102,15,244,204 // pmuludq %xmm4,%xmm1 @@ -64439,7 +64411,7 @@ _sk_clut_4D_sse2: .byte 15,20,223 // unpcklps %xmm7,%xmm3 .byte 102,15,20,222 // unpcklpd %xmm6,%xmm3 .byte 102,15,41,157,232,254,255,255 // movapd %xmm3,-0x118(%ebp) - .byte 102,15,254,137,164,77,0,0 // paddd 0x4da4(%ecx),%xmm1 + .byte 102,15,254,137,168,77,0,0 // paddd 0x4da8(%ecx),%xmm1 .byte 102,15,112,241,229 // pshufd $0xe5,%xmm1,%xmm6 .byte 102,15,126,240 // movd %xmm6,%eax .byte 102,15,112,241,78 // pshufd $0x4e,%xmm1,%xmm6 @@ -64454,7 +64426,7 @@ _sk_clut_4D_sse2: .byte 243,15,16,60,130 // movss (%edx,%eax,4),%xmm7 .byte 15,20,223 // unpcklps %xmm7,%xmm3 .byte 102,15,20,222 // unpcklpd %xmm6,%xmm3 - .byte 15,40,185,20,84,0,0 // movaps 0x5414(%ecx),%xmm7 + .byte 15,40,185,24,84,0,0 // movaps 0x5418(%ecx),%xmm7 .byte 15,88,199 // addps %xmm7,%xmm0 .byte 15,41,133,120,255,255,255 // movaps %xmm0,-0x88(%ebp) .byte 15,40,133,248,254,255,255 // movaps -0x108(%ebp),%xmm0 @@ -64462,7 +64434,7 @@ _sk_clut_4D_sse2: .byte 15,41,69,136 // movaps %xmm0,-0x78(%ebp) .byte 15,40,133,56,255,255,255 // movaps -0xc8(%ebp),%xmm0 .byte 15,88,199 // addps %xmm7,%xmm0 - .byte 15,41,133,168,254,255,255 // movaps %xmm0,-0x158(%ebp) + .byte 15,41,133,184,254,255,255 // movaps %xmm0,-0x148(%ebp) .byte 15,88,125,216 // addps -0x28(%ebp),%xmm7 .byte 243,15,91,255 // cvttps2dq %xmm7,%xmm7 .byte 102,15,112,199,245 // pshufd $0xf5,%xmm7,%xmm0 @@ -64475,7 +64447,7 @@ _sk_clut_4D_sse2: .byte 102,15,127,101,168 // movdqa %xmm4,-0x58(%ebp) .byte 102,15,254,212 // paddd %xmm4,%xmm2 .byte 102,15,112,194,245 // pshufd $0xf5,%xmm2,%xmm0 - .byte 102,15,111,161,36,84,0,0 // movdqa 0x5424(%ecx),%xmm4 + .byte 102,15,111,161,40,84,0,0 // movdqa 0x5428(%ecx),%xmm4 .byte 102,15,244,212 // pmuludq %xmm4,%xmm2 .byte 102,15,244,196 // pmuludq %xmm4,%xmm0 .byte 102,15,112,240,232 // pshufd $0xe8,%xmm0,%xmm6 @@ -64511,7 +64483,7 @@ _sk_clut_4D_sse2: .byte 243,15,16,44,130 // movss (%edx,%eax,4),%xmm5 .byte 15,20,213 // unpcklps %xmm5,%xmm2 .byte 102,15,20,214 // unpcklpd %xmm6,%xmm2 - .byte 102,15,254,129,164,77,0,0 // paddd 0x4da4(%ecx),%xmm0 + .byte 102,15,254,129,168,77,0,0 // paddd 0x4da8(%ecx),%xmm0 .byte 102,15,112,232,229 // pshufd $0xe5,%xmm0,%xmm5 .byte 102,15,126,232 // movd %xmm5,%eax .byte 102,15,112,232,78 // pshufd $0x4e,%xmm0,%xmm5 @@ -64543,7 +64515,7 @@ _sk_clut_4D_sse2: .byte 15,92,251 // subps %xmm3,%xmm7 .byte 15,89,248 // mulps %xmm0,%xmm7 .byte 15,88,251 // addps %xmm3,%xmm7 - .byte 243,15,91,141,168,254,255,255 // cvttps2dq -0x158(%ebp),%xmm1 + .byte 243,15,91,141,184,254,255,255 // cvttps2dq -0x148(%ebp),%xmm1 .byte 102,15,112,217,245 // pshufd $0xf5,%xmm1,%xmm3 .byte 102,15,111,133,88,255,255,255 // movdqa -0xa8(%ebp),%xmm0 .byte 102,15,244,216 // pmuludq %xmm0,%xmm3 @@ -64595,7 +64567,7 @@ _sk_clut_4D_sse2: .byte 243,15,16,44,130 // movss (%edx,%eax,4),%xmm5 .byte 15,20,245 // unpcklps %xmm5,%xmm6 .byte 102,15,20,240 // unpcklpd %xmm0,%xmm6 - .byte 102,15,254,137,164,77,0,0 // paddd 0x4da4(%ecx),%xmm1 + .byte 102,15,254,137,168,77,0,0 // paddd 0x4da8(%ecx),%xmm1 .byte 102,15,112,193,229 // pshufd $0xe5,%xmm1,%xmm0 .byte 102,15,126,192 // movd %xmm0,%eax .byte 102,15,112,193,78 // pshufd $0x4e,%xmm1,%xmm0 @@ -64613,7 +64585,7 @@ _sk_clut_4D_sse2: .byte 102,15,111,202 // movdqa %xmm2,%xmm1 .byte 102,15,254,77,168 // paddd -0x58(%ebp),%xmm1 .byte 102,15,112,193,245 // pshufd $0xf5,%xmm1,%xmm0 - .byte 102,15,111,145,36,84,0,0 // movdqa 0x5424(%ecx),%xmm2 + .byte 102,15,111,145,40,84,0,0 // movdqa 0x5428(%ecx),%xmm2 .byte 102,15,244,202 // pmuludq %xmm2,%xmm1 .byte 102,15,244,194 // pmuludq %xmm2,%xmm0 .byte 102,15,112,192,232 // pshufd $0xe8,%xmm0,%xmm0 @@ -64649,7 +64621,7 @@ _sk_clut_4D_sse2: .byte 243,15,16,4,130 // movss (%edx,%eax,4),%xmm0 .byte 15,20,216 // unpcklps %xmm0,%xmm3 .byte 102,15,20,217 // unpcklpd %xmm1,%xmm3 - .byte 102,15,254,169,164,77,0,0 // paddd 0x4da4(%ecx),%xmm5 + .byte 102,15,254,169,168,77,0,0 // paddd 0x4da8(%ecx),%xmm5 .byte 102,15,112,197,229 // pshufd $0xe5,%xmm5,%xmm0 .byte 102,15,126,192 // movd %xmm0,%eax .byte 102,15,112,197,78 // pshufd $0x4e,%xmm5,%xmm0 @@ -64702,14 +64674,14 @@ _sk_clut_4D_sse2: .byte 102,15,112,193,232 // pshufd $0xe8,%xmm1,%xmm0 .byte 102,15,98,224 // punpckldq %xmm0,%xmm4 .byte 102,15,127,165,24,255,255,255 // movdqa %xmm4,-0xe8(%ebp) - .byte 102,15,254,165,184,254,255,255 // paddd -0x148(%ebp),%xmm4 + .byte 102,15,254,165,200,254,255,255 // paddd -0x138(%ebp),%xmm4 .byte 102,15,127,101,200 // movdqa %xmm4,-0x38(%ebp) .byte 102,15,111,204 // movdqa %xmm4,%xmm1 .byte 102,15,254,141,72,255,255,255 // paddd -0xb8(%ebp),%xmm1 .byte 102,15,111,209 // movdqa %xmm1,%xmm2 .byte 102,15,254,85,152 // paddd -0x68(%ebp),%xmm2 .byte 102,15,112,194,245 // pshufd $0xf5,%xmm2,%xmm0 - .byte 102,15,111,153,36,84,0,0 // movdqa 0x5424(%ecx),%xmm3 + .byte 102,15,111,153,40,84,0,0 // movdqa 0x5428(%ecx),%xmm3 .byte 102,15,244,211 // pmuludq %xmm3,%xmm2 .byte 102,15,244,195 // pmuludq %xmm3,%xmm0 .byte 102,15,111,251 // movdqa %xmm3,%xmm7 @@ -64748,7 +64720,7 @@ _sk_clut_4D_sse2: .byte 243,15,16,44,130 // movss (%edx,%eax,4),%xmm5 .byte 15,20,229 // unpcklps %xmm5,%xmm4 .byte 102,15,20,227 // unpcklpd %xmm3,%xmm4 - .byte 102,15,254,129,164,77,0,0 // paddd 0x4da4(%ecx),%xmm0 + .byte 102,15,254,129,168,77,0,0 // paddd 0x4da8(%ecx),%xmm0 .byte 102,15,112,216,229 // pshufd $0xe5,%xmm0,%xmm3 .byte 102,15,126,216 // movd %xmm3,%eax .byte 102,15,112,216,78 // pshufd $0x4e,%xmm0,%xmm3 @@ -64800,7 +64772,7 @@ _sk_clut_4D_sse2: .byte 243,15,16,52,130 // movss (%edx,%eax,4),%xmm6 .byte 15,20,238 // unpcklps %xmm6,%xmm5 .byte 102,15,20,235 // unpcklpd %xmm3,%xmm5 - .byte 102,15,111,137,164,77,0,0 // movdqa 0x4da4(%ecx),%xmm1 + .byte 102,15,111,137,168,77,0,0 // movdqa 0x4da8(%ecx),%xmm1 .byte 102,15,254,249 // paddd %xmm1,%xmm7 .byte 102,15,112,223,229 // pshufd $0xe5,%xmm7,%xmm3 .byte 102,15,126,216 // movd %xmm3,%eax @@ -64834,7 +64806,7 @@ _sk_clut_4D_sse2: .byte 102,15,111,226 // movdqa %xmm2,%xmm4 .byte 102,15,254,69,152 // paddd -0x68(%ebp),%xmm0 .byte 102,15,112,208,245 // pshufd $0xf5,%xmm0,%xmm2 - .byte 102,15,111,153,36,84,0,0 // movdqa 0x5424(%ecx),%xmm3 + .byte 102,15,111,153,40,84,0,0 // movdqa 0x5428(%ecx),%xmm3 .byte 102,15,244,195 // pmuludq %xmm3,%xmm0 .byte 102,15,244,211 // pmuludq %xmm3,%xmm2 .byte 102,15,112,218,232 // pshufd $0xe8,%xmm2,%xmm3 @@ -64891,7 +64863,7 @@ _sk_clut_4D_sse2: .byte 102,15,111,212 // movdqa %xmm4,%xmm2 .byte 102,15,254,85,168 // paddd -0x58(%ebp),%xmm2 .byte 102,15,112,194,245 // pshufd $0xf5,%xmm2,%xmm0 - .byte 102,15,111,137,36,84,0,0 // movdqa 0x5424(%ecx),%xmm1 + .byte 102,15,111,137,40,84,0,0 // movdqa 0x5428(%ecx),%xmm1 .byte 102,15,244,209 // pmuludq %xmm1,%xmm2 .byte 102,15,244,193 // pmuludq %xmm1,%xmm0 .byte 102,15,112,240,232 // pshufd $0xe8,%xmm0,%xmm6 @@ -64928,7 +64900,7 @@ _sk_clut_4D_sse2: .byte 243,15,16,36,130 // movss (%edx,%eax,4),%xmm4 .byte 15,20,212 // unpcklps %xmm4,%xmm2 .byte 102,15,20,214 // unpcklpd %xmm6,%xmm2 - .byte 102,15,254,129,164,77,0,0 // paddd 0x4da4(%ecx),%xmm0 + .byte 102,15,254,129,168,77,0,0 // paddd 0x4da8(%ecx),%xmm0 .byte 102,15,112,224,229 // pshufd $0xe5,%xmm0,%xmm4 .byte 102,15,126,224 // movd %xmm4,%eax .byte 102,15,112,224,78 // pshufd $0x4e,%xmm0,%xmm4 @@ -64996,7 +64968,7 @@ _sk_clut_4D_sse2: .byte 102,15,111,93,152 // movdqa -0x68(%ebp),%xmm3 .byte 102,15,254,217 // paddd %xmm1,%xmm3 .byte 102,15,112,211,245 // pshufd $0xf5,%xmm3,%xmm2 - .byte 102,15,111,129,36,84,0,0 // movdqa 0x5424(%ecx),%xmm0 + .byte 102,15,111,129,40,84,0,0 // movdqa 0x5428(%ecx),%xmm0 .byte 102,15,244,216 // pmuludq %xmm0,%xmm3 .byte 102,15,244,208 // pmuludq %xmm0,%xmm2 .byte 102,15,111,248 // movdqa %xmm0,%xmm7 @@ -65035,7 +65007,7 @@ _sk_clut_4D_sse2: .byte 243,15,16,28,130 // movss (%edx,%eax,4),%xmm3 .byte 15,20,235 // unpcklps %xmm3,%xmm5 .byte 102,15,20,238 // unpcklpd %xmm6,%xmm5 - .byte 102,15,254,145,164,77,0,0 // paddd 0x4da4(%ecx),%xmm2 + .byte 102,15,254,145,168,77,0,0 // paddd 0x4da8(%ecx),%xmm2 .byte 102,15,112,218,229 // pshufd $0xe5,%xmm2,%xmm3 .byte 102,15,126,216 // movd %xmm3,%eax .byte 102,15,112,218,78 // pshufd $0x4e,%xmm2,%xmm3 @@ -65087,7 +65059,7 @@ _sk_clut_4D_sse2: .byte 243,15,16,4,130 // movss (%edx,%eax,4),%xmm0 .byte 15,20,208 // unpcklps %xmm0,%xmm2 .byte 102,15,20,215 // unpcklpd %xmm7,%xmm2 - .byte 102,15,111,137,164,77,0,0 // movdqa 0x4da4(%ecx),%xmm1 + .byte 102,15,111,137,168,77,0,0 // movdqa 0x4da8(%ecx),%xmm1 .byte 102,15,254,217 // paddd %xmm1,%xmm3 .byte 102,15,112,195,229 // pshufd $0xe5,%xmm3,%xmm0 .byte 102,15,126,192 // movd %xmm0,%eax @@ -65122,7 +65094,7 @@ _sk_clut_4D_sse2: .byte 102,15,111,194 // movdqa %xmm2,%xmm0 .byte 102,15,254,69,152 // paddd -0x68(%ebp),%xmm0 .byte 102,15,112,224,245 // pshufd $0xf5,%xmm0,%xmm4 - .byte 102,15,111,169,36,84,0,0 // movdqa 0x5424(%ecx),%xmm5 + .byte 102,15,111,169,40,84,0,0 // movdqa 0x5428(%ecx),%xmm5 .byte 102,15,111,221 // movdqa %xmm5,%xmm3 .byte 102,15,244,195 // pmuludq %xmm3,%xmm0 .byte 102,15,244,227 // pmuludq %xmm3,%xmm4 @@ -65178,7 +65150,7 @@ _sk_clut_4D_sse2: .byte 102,15,111,202 // movdqa %xmm2,%xmm1 .byte 102,15,254,77,168 // paddd -0x58(%ebp),%xmm1 .byte 102,15,112,193,245 // pshufd $0xf5,%xmm1,%xmm0 - .byte 102,15,111,145,36,84,0,0 // movdqa 0x5424(%ecx),%xmm2 + .byte 102,15,111,145,40,84,0,0 // movdqa 0x5428(%ecx),%xmm2 .byte 102,15,244,202 // pmuludq %xmm2,%xmm1 .byte 102,15,244,194 // pmuludq %xmm2,%xmm0 .byte 102,15,112,192,232 // pshufd $0xe8,%xmm0,%xmm0 @@ -65214,7 +65186,7 @@ _sk_clut_4D_sse2: .byte 243,15,16,4,130 // movss (%edx,%eax,4),%xmm0 .byte 15,20,216 // unpcklps %xmm0,%xmm3 .byte 102,15,20,217 // unpcklpd %xmm1,%xmm3 - .byte 102,15,254,185,164,77,0,0 // paddd 0x4da4(%ecx),%xmm7 + .byte 102,15,254,185,168,77,0,0 // paddd 0x4da8(%ecx),%xmm7 .byte 102,15,112,199,229 // pshufd $0xe5,%xmm7,%xmm0 .byte 102,15,126,192 // movd %xmm0,%eax .byte 102,15,112,199,78 // pshufd $0x4e,%xmm7,%xmm0 @@ -65264,7 +65236,7 @@ _sk_clut_4D_sse2: .byte 102,15,111,233 // movdqa %xmm1,%xmm5 .byte 102,15,254,69,152 // paddd -0x68(%ebp),%xmm0 .byte 102,15,112,200,245 // pshufd $0xf5,%xmm0,%xmm1 - .byte 102,15,111,145,36,84,0,0 // movdqa 0x5424(%ecx),%xmm2 + .byte 102,15,111,145,40,84,0,0 // movdqa 0x5428(%ecx),%xmm2 .byte 102,15,244,194 // pmuludq %xmm2,%xmm0 .byte 102,15,244,202 // pmuludq %xmm2,%xmm1 .byte 102,15,111,250 // movdqa %xmm2,%xmm7 @@ -65303,7 +65275,7 @@ _sk_clut_4D_sse2: .byte 243,15,16,36,130 // movss (%edx,%eax,4),%xmm4 .byte 15,20,204 // unpcklps %xmm4,%xmm1 .byte 102,15,20,203 // unpcklpd %xmm3,%xmm1 - .byte 102,15,254,145,164,77,0,0 // paddd 0x4da4(%ecx),%xmm2 + .byte 102,15,254,145,168,77,0,0 // paddd 0x4da8(%ecx),%xmm2 .byte 102,15,112,218,229 // pshufd $0xe5,%xmm2,%xmm3 .byte 102,15,126,216 // movd %xmm3,%eax .byte 102,15,112,218,78 // pshufd $0x4e,%xmm2,%xmm3 @@ -65357,7 +65329,7 @@ _sk_clut_4D_sse2: .byte 243,15,16,36,130 // movss (%edx,%eax,4),%xmm4 .byte 15,20,252 // unpcklps %xmm4,%xmm7 .byte 102,15,20,254 // unpcklpd %xmm6,%xmm7 - .byte 102,15,254,153,164,77,0,0 // paddd 0x4da4(%ecx),%xmm3 + .byte 102,15,254,153,168,77,0,0 // paddd 0x4da8(%ecx),%xmm3 .byte 102,15,112,227,229 // pshufd $0xe5,%xmm3,%xmm4 .byte 102,15,126,224 // movd %xmm4,%eax .byte 102,15,112,227,78 // pshufd $0x4e,%xmm3,%xmm4 @@ -65390,7 +65362,7 @@ _sk_clut_4D_sse2: .byte 102,15,254,208 // paddd %xmm0,%xmm2 .byte 102,15,111,216 // movdqa %xmm0,%xmm3 .byte 102,15,112,194,245 // pshufd $0xf5,%xmm2,%xmm0 - .byte 102,15,111,137,36,84,0,0 // movdqa 0x5424(%ecx),%xmm1 + .byte 102,15,111,137,40,84,0,0 // movdqa 0x5428(%ecx),%xmm1 .byte 102,15,244,209 // pmuludq %xmm1,%xmm2 .byte 102,15,244,193 // pmuludq %xmm1,%xmm0 .byte 102,15,111,241 // movdqa %xmm1,%xmm6 @@ -65430,7 +65402,7 @@ _sk_clut_4D_sse2: .byte 15,20,225 // unpcklps %xmm1,%xmm4 .byte 102,15,20,226 // unpcklpd %xmm2,%xmm4 .byte 102,15,41,165,88,255,255,255 // movapd %xmm4,-0xa8(%ebp) - .byte 102,15,254,129,164,77,0,0 // paddd 0x4da4(%ecx),%xmm0 + .byte 102,15,254,129,168,77,0,0 // paddd 0x4da8(%ecx),%xmm0 .byte 102,15,112,200,229 // pshufd $0xe5,%xmm0,%xmm1 .byte 102,15,126,200 // movd %xmm1,%eax .byte 102,15,112,200,78 // pshufd $0x4e,%xmm0,%xmm1 @@ -65484,7 +65456,7 @@ _sk_clut_4D_sse2: .byte 243,15,16,52,130 // movss (%edx,%eax,4),%xmm6 .byte 15,20,206 // unpcklps %xmm6,%xmm1 .byte 102,15,20,203 // unpcklpd %xmm3,%xmm1 - .byte 102,15,254,145,164,77,0,0 // paddd 0x4da4(%ecx),%xmm2 + .byte 102,15,254,145,168,77,0,0 // paddd 0x4da8(%ecx),%xmm2 .byte 102,15,112,218,229 // pshufd $0xe5,%xmm2,%xmm3 .byte 102,15,126,216 // movd %xmm3,%eax .byte 102,15,112,218,78 // pshufd $0x4e,%xmm2,%xmm3 @@ -65535,8 +65507,8 @@ _sk_clut_4D_sse2: .byte 15,92,212 // subps %xmm4,%xmm2 .byte 15,89,211 // mulps %xmm3,%xmm2 .byte 15,88,212 // addps %xmm4,%xmm2 - .byte 15,91,157,184,254,255,255 // cvtdq2ps -0x148(%ebp),%xmm3 - .byte 15,40,165,152,254,255,255 // movaps -0x168(%ebp),%xmm4 + .byte 15,91,157,200,254,255,255 // cvtdq2ps -0x138(%ebp),%xmm3 + .byte 15,40,165,168,254,255,255 // movaps -0x158(%ebp),%xmm4 .byte 15,92,227 // subps %xmm3,%xmm4 .byte 15,40,157,40,255,255,255 // movaps -0xd8(%ebp),%xmm3 .byte 15,92,195 // subps %xmm3,%xmm0 @@ -65550,21 +65522,21 @@ _sk_clut_4D_sse2: .byte 15,92,211 // subps %xmm3,%xmm2 .byte 15,89,212 // mulps %xmm4,%xmm2 .byte 15,88,211 // addps %xmm3,%xmm2 - .byte 139,69,8 // mov 0x8(%ebp),%eax - .byte 139,117,12 // mov 0xc(%ebp),%esi - .byte 141,86,8 // lea 0x8(%esi),%edx + .byte 139,85,12 // mov 0xc(%ebp),%edx + .byte 141,66,8 // lea 0x8(%edx),%eax .byte 131,236,8 // sub $0x8,%esp - .byte 15,40,153,100,77,0,0 // movaps 0x4d64(%ecx),%xmm3 - .byte 82 // push %edx + .byte 15,40,153,104,77,0,0 // movaps 0x4d68(%ecx),%xmm3 .byte 80 // push %eax - .byte 255,86,4 // call *0x4(%esi) - .byte 129,196,108,1,0,0 // add $0x16c,%esp + .byte 255,117,8 // pushl 0x8(%ebp) + .byte 255,82,4 // call *0x4(%edx) + .byte 129,196,92,1,0,0 // add $0x15c,%esp .byte 94 // pop %esi .byte 95 // pop %edi .byte 91 // pop %ebx .byte 93 // pop %ebp .byte 195 // ret .byte 144 // nop + .byte 144 // nop HIDDEN _sk_start_pipeline_sse2_lowp .globl _sk_start_pipeline_sse2_lowp @@ -65578,7 +65550,7 @@ _sk_start_pipeline_sse2_lowp: .byte 131,236,92 // sub $0x5c,%esp .byte 139,125,12 // mov 0xc(%ebp),%edi .byte 59,125,20 // cmp 0x14(%ebp),%edi - .byte 15,131,193,0,0,0 // jae 949e <_sk_start_pipeline_sse2_lowp+0xd6> + .byte 15,131,193,0,0,0 // jae 947a <_sk_start_pipeline_sse2_lowp+0xd6> .byte 139,85,16 // mov 0x10(%ebp),%edx .byte 139,69,8 // mov 0x8(%ebp),%eax .byte 139,117,24 // mov 0x18(%ebp),%esi @@ -65592,7 +65564,7 @@ _sk_start_pipeline_sse2_lowp: .byte 139,69,8 // mov 0x8(%ebp),%eax .byte 137,223 // mov %ebx,%edi .byte 137,243 // mov %esi,%ebx - .byte 119,77 // ja 9450 <_sk_start_pipeline_sse2_lowp+0x88> + .byte 119,77 // ja 942c <_sk_start_pipeline_sse2_lowp+0x88> .byte 139,117,8 // mov 0x8(%ebp),%esi .byte 15,41,68,36,64 // movaps %xmm0,0x40(%esp) .byte 15,41,68,36,48 // movaps %xmm0,0x30(%esp) @@ -65614,13 +65586,13 @@ _sk_start_pipeline_sse2_lowp: .byte 131,198,16 // add $0x10,%esi .byte 57,214 // cmp %edx,%esi .byte 137,198 // mov %eax,%esi - .byte 118,182 // jbe 9406 <_sk_start_pipeline_sse2_lowp+0x3e> + .byte 118,182 // jbe 93e2 <_sk_start_pipeline_sse2_lowp+0x3e> .byte 137,209 // mov %edx,%ecx .byte 41,193 // sub %eax,%ecx .byte 137,222 // mov %ebx,%esi .byte 137,251 // mov %edi,%ebx .byte 139,125,240 // mov -0x10(%ebp),%edi - .byte 116,55 // je 9494 <_sk_start_pipeline_sse2_lowp+0xcc> + .byte 116,55 // je 9470 <_sk_start_pipeline_sse2_lowp+0xcc> .byte 15,41,68,36,64 // movaps %xmm0,0x40(%esp) .byte 15,41,68,36,48 // movaps %xmm0,0x30(%esp) .byte 15,41,68,36,32 // movaps %xmm0,0x20(%esp) @@ -65638,7 +65610,7 @@ _sk_start_pipeline_sse2_lowp: .byte 139,85,16 // mov 0x10(%ebp),%edx .byte 71 // inc %edi .byte 59,125,20 // cmp 0x14(%ebp),%edi - .byte 15,133,86,255,255,255 // jne 93f4 <_sk_start_pipeline_sse2_lowp+0x2c> + .byte 15,133,86,255,255,255 // jne 93d0 <_sk_start_pipeline_sse2_lowp+0x2c> .byte 131,196,92 // add $0x5c,%esp .byte 94 // pop %esi .byte 95 // pop %edi @@ -65710,7 +65682,7 @@ _sk_black_color_sse2_lowp: .byte 87 // push %edi .byte 86 // push %esi .byte 131,236,92 // sub $0x5c,%esp - .byte 232,0,0,0,0 // call 954d <_sk_black_color_sse2_lowp+0xe> + .byte 232,0,0,0,0 // call 9529 <_sk_black_color_sse2_lowp+0xe> .byte 88 // pop %eax .byte 139,77,8 // mov 0x8(%ebp),%ecx .byte 139,85,16 // mov 0x10(%ebp),%edx @@ -65729,7 +65701,7 @@ _sk_black_color_sse2_lowp: .byte 137,84,36,8 // mov %edx,0x8(%esp) .byte 137,92,36,4 // mov %ebx,0x4(%esp) .byte 137,12,36 // mov %ecx,(%esp) - .byte 15,40,152,99,62,0,0 // movaps 0x3e63(%eax),%xmm3 + .byte 15,40,152,103,62,0,0 // movaps 0x3e67(%eax),%xmm3 .byte 15,87,192 // xorps %xmm0,%xmm0 .byte 15,87,201 // xorps %xmm1,%xmm1 .byte 15,87,210 // xorps %xmm2,%xmm2 @@ -65751,7 +65723,7 @@ _sk_white_color_sse2_lowp: .byte 87 // push %edi .byte 86 // push %esi .byte 131,236,92 // sub $0x5c,%esp - .byte 232,0,0,0,0 // call 95b8 <_sk_white_color_sse2_lowp+0xe> + .byte 232,0,0,0,0 // call 9594 <_sk_white_color_sse2_lowp+0xe> .byte 88 // pop %eax .byte 139,77,8 // mov 0x8(%ebp),%ecx .byte 139,85,16 // mov 0x10(%ebp),%edx @@ -65770,7 +65742,7 @@ _sk_white_color_sse2_lowp: .byte 137,84,36,8 // mov %edx,0x8(%esp) .byte 137,92,36,4 // mov %ebx,0x4(%esp) .byte 137,12,36 // mov %ecx,(%esp) - .byte 15,40,128,248,61,0,0 // movaps 0x3df8(%eax),%xmm0 + .byte 15,40,128,252,61,0,0 // movaps 0x3dfc(%eax),%xmm0 .byte 15,40,200 // movaps %xmm0,%xmm1 .byte 15,40,208 // movaps %xmm0,%xmm2 .byte 15,40,216 // movaps %xmm0,%xmm3 @@ -65791,16 +65763,16 @@ _sk_set_rgb_sse2_lowp: .byte 87 // push %edi .byte 86 // push %esi .byte 131,236,80 // sub $0x50,%esp - .byte 232,0,0,0,0 // call 9622 <_sk_set_rgb_sse2_lowp+0xd> + .byte 232,0,0,0,0 // call 95fe <_sk_set_rgb_sse2_lowp+0xd> .byte 94 // pop %esi .byte 139,69,8 // mov 0x8(%ebp),%eax .byte 139,85,16 // mov 0x10(%ebp),%edx .byte 139,77,12 // mov 0xc(%ebp),%ecx .byte 139,57 // mov (%ecx),%edi - .byte 243,15,16,150,82,62,0,0 // movss 0x3e52(%esi),%xmm2 + .byte 243,15,16,150,86,62,0,0 // movss 0x3e56(%esi),%xmm2 .byte 243,15,16,7 // movss (%edi),%xmm0 .byte 243,15,89,194 // mulss %xmm2,%xmm0 - .byte 243,15,16,142,78,62,0,0 // movss 0x3e4e(%esi),%xmm1 + .byte 243,15,16,142,82,62,0,0 // movss 0x3e52(%esi),%xmm1 .byte 243,15,88,193 // addss %xmm1,%xmm0 .byte 243,15,44,240 // cvttss2si %xmm0,%esi .byte 102,15,110,198 // movd %esi,%xmm0 @@ -65849,7 +65821,7 @@ _sk_premul_sse2_lowp: .byte 87 // push %edi .byte 86 // push %esi .byte 131,236,80 // sub $0x50,%esp - .byte 232,0,0,0,0 // call 96e6 <_sk_premul_sse2_lowp+0xd> + .byte 232,0,0,0,0 // call 96c2 <_sk_premul_sse2_lowp+0xd> .byte 90 // pop %edx .byte 139,69,8 // mov 0x8(%ebp),%eax .byte 139,77,16 // mov 0x10(%ebp),%ecx @@ -65858,7 +65830,7 @@ _sk_premul_sse2_lowp: .byte 15,40,109,40 // movaps 0x28(%ebp),%xmm5 .byte 15,40,117,56 // movaps 0x38(%ebp),%xmm6 .byte 102,15,213,195 // pmullw %xmm3,%xmm0 - .byte 102,15,111,186,202,60,0,0 // movdqa 0x3cca(%edx),%xmm7 + .byte 102,15,111,186,206,60,0,0 // movdqa 0x3cce(%edx),%xmm7 .byte 102,15,253,199 // paddw %xmm7,%xmm0 .byte 102,15,213,203 // pmullw %xmm3,%xmm1 .byte 102,15,253,207 // paddw %xmm7,%xmm1 @@ -65992,12 +65964,12 @@ _sk_invert_sse2_lowp: .byte 87 // push %edi .byte 86 // push %esi .byte 131,236,80 // sub $0x50,%esp - .byte 232,0,0,0,0 // call 9860 <_sk_invert_sse2_lowp+0xd> + .byte 232,0,0,0,0 // call 983c <_sk_invert_sse2_lowp+0xd> .byte 88 // pop %eax .byte 139,77,8 // mov 0x8(%ebp),%ecx .byte 139,85,16 // mov 0x10(%ebp),%edx .byte 139,117,20 // mov 0x14(%ebp),%esi - .byte 102,15,111,160,80,59,0,0 // movdqa 0x3b50(%eax),%xmm4 + .byte 102,15,111,160,84,59,0,0 // movdqa 0x3b54(%eax),%xmm4 .byte 102,15,111,236 // movdqa %xmm4,%xmm5 .byte 102,15,249,232 // psubw %xmm0,%xmm5 .byte 102,15,111,244 // movdqa %xmm4,%xmm6 @@ -66079,11 +66051,11 @@ _sk_srcatop_sse2_lowp: .byte 102,15,111,234 // movdqa %xmm2,%xmm5 .byte 102,15,111,209 // movdqa %xmm1,%xmm2 .byte 102,15,111,200 // movdqa %xmm0,%xmm1 - .byte 232,0,0,0,0 // call 9958 <_sk_srcatop_sse2_lowp+0x19> + .byte 232,0,0,0,0 // call 9934 <_sk_srcatop_sse2_lowp+0x19> .byte 88 // pop %eax .byte 102,15,111,117,72 // movdqa 0x48(%ebp),%xmm6 .byte 102,15,213,206 // pmullw %xmm6,%xmm1 - .byte 102,15,111,128,88,58,0,0 // movdqa 0x3a58(%eax),%xmm0 + .byte 102,15,111,128,92,58,0,0 // movdqa 0x3a5c(%eax),%xmm0 .byte 102,15,253,200 // paddw %xmm0,%xmm1 .byte 102,15,213,214 // pmullw %xmm6,%xmm2 .byte 102,15,253,208 // paddw %xmm0,%xmm2 @@ -66141,12 +66113,12 @@ _sk_dstatop_sse2_lowp: .byte 87 // push %edi .byte 86 // push %esi .byte 131,236,80 // sub $0x50,%esp - .byte 232,0,0,0,0 // call 9a2c <_sk_dstatop_sse2_lowp+0xd> + .byte 232,0,0,0,0 // call 9a08 <_sk_dstatop_sse2_lowp+0xd> .byte 88 // pop %eax .byte 102,15,111,101,40 // movdqa 0x28(%ebp),%xmm4 .byte 102,15,111,117,24 // movdqa 0x18(%ebp),%xmm6 .byte 102,15,213,243 // pmullw %xmm3,%xmm6 - .byte 102,15,111,184,132,57,0,0 // movdqa 0x3984(%eax),%xmm7 + .byte 102,15,111,184,136,57,0,0 // movdqa 0x3988(%eax),%xmm7 .byte 102,15,253,247 // paddw %xmm7,%xmm6 .byte 102,15,213,227 // pmullw %xmm3,%xmm4 .byte 102,15,253,231 // paddw %xmm7,%xmm4 @@ -66199,7 +66171,7 @@ _sk_srcin_sse2_lowp: .byte 87 // push %edi .byte 86 // push %esi .byte 131,236,80 // sub $0x50,%esp - .byte 232,0,0,0,0 // call 9aed <_sk_srcin_sse2_lowp+0xd> + .byte 232,0,0,0,0 // call 9ac9 <_sk_srcin_sse2_lowp+0xd> .byte 94 // pop %esi .byte 139,69,8 // mov 0x8(%ebp),%eax .byte 139,77,16 // mov 0x10(%ebp),%ecx @@ -66208,7 +66180,7 @@ _sk_srcin_sse2_lowp: .byte 15,40,109,40 // movaps 0x28(%ebp),%xmm5 .byte 102,15,111,117,72 // movdqa 0x48(%ebp),%xmm6 .byte 102,15,213,198 // pmullw %xmm6,%xmm0 - .byte 102,15,111,190,195,56,0,0 // movdqa 0x38c3(%esi),%xmm7 + .byte 102,15,111,190,199,56,0,0 // movdqa 0x38c7(%esi),%xmm7 .byte 102,15,253,199 // paddw %xmm7,%xmm0 .byte 102,15,213,206 // pmullw %xmm6,%xmm1 .byte 102,15,253,207 // paddw %xmm7,%xmm1 @@ -66247,14 +66219,14 @@ _sk_dstin_sse2_lowp: .byte 87 // push %edi .byte 86 // push %esi .byte 131,236,80 // sub $0x50,%esp - .byte 232,0,0,0,0 // call 9b84 <_sk_dstin_sse2_lowp+0xd> + .byte 232,0,0,0,0 // call 9b60 <_sk_dstin_sse2_lowp+0xd> .byte 88 // pop %eax .byte 102,15,111,85,56 // movdqa 0x38(%ebp),%xmm2 .byte 102,15,111,109,40 // movdqa 0x28(%ebp),%xmm5 .byte 102,15,111,117,24 // movdqa 0x18(%ebp),%xmm6 .byte 102,15,111,198 // movdqa %xmm6,%xmm0 .byte 102,15,213,195 // pmullw %xmm3,%xmm0 - .byte 102,15,111,184,44,56,0,0 // movdqa 0x382c(%eax),%xmm7 + .byte 102,15,111,184,48,56,0,0 // movdqa 0x3830(%eax),%xmm7 .byte 102,15,253,199 // paddw %xmm7,%xmm0 .byte 102,15,111,205 // movdqa %xmm5,%xmm1 .byte 102,15,213,203 // pmullw %xmm3,%xmm1 @@ -66298,14 +66270,14 @@ _sk_srcout_sse2_lowp: .byte 87 // push %edi .byte 86 // push %esi .byte 131,236,80 // sub $0x50,%esp - .byte 232,0,0,0,0 // call 9c2c <_sk_srcout_sse2_lowp+0xd> + .byte 232,0,0,0,0 // call 9c08 <_sk_srcout_sse2_lowp+0xd> .byte 94 // pop %esi .byte 139,69,8 // mov 0x8(%ebp),%eax .byte 139,77,16 // mov 0x10(%ebp),%ecx .byte 139,85,20 // mov 0x14(%ebp),%edx .byte 15,40,101,24 // movaps 0x18(%ebp),%xmm4 .byte 102,15,111,109,72 // movdqa 0x48(%ebp),%xmm5 - .byte 102,15,111,182,132,55,0,0 // movdqa 0x3784(%esi),%xmm6 + .byte 102,15,111,182,136,55,0,0 // movdqa 0x3788(%esi),%xmm6 .byte 102,15,111,254 // movdqa %xmm6,%xmm7 .byte 102,15,249,253 // psubw %xmm5,%xmm7 .byte 102,15,213,199 // pmullw %xmm7,%xmm0 @@ -66349,11 +66321,11 @@ _sk_dstout_sse2_lowp: .byte 86 // push %esi .byte 131,236,80 // sub $0x50,%esp .byte 102,15,111,195 // movdqa %xmm3,%xmm0 - .byte 232,0,0,0,0 // call 9ccf <_sk_dstout_sse2_lowp+0x11> + .byte 232,0,0,0,0 // call 9cab <_sk_dstout_sse2_lowp+0x11> .byte 88 // pop %eax .byte 102,15,111,109,56 // movdqa 0x38(%ebp),%xmm5 .byte 102,15,111,117,24 // movdqa 0x18(%ebp),%xmm6 - .byte 102,15,111,184,225,54,0,0 // movdqa 0x36e1(%eax),%xmm7 + .byte 102,15,111,184,229,54,0,0 // movdqa 0x36e5(%eax),%xmm7 .byte 102,15,111,223 // movdqa %xmm7,%xmm3 .byte 102,15,249,216 // psubw %xmm0,%xmm3 .byte 102,15,111,195 // movdqa %xmm3,%xmm0 @@ -66405,9 +66377,9 @@ _sk_srcover_sse2_lowp: .byte 15,41,85,232 // movaps %xmm2,-0x18(%ebp) .byte 102,15,111,209 // movdqa %xmm1,%xmm2 .byte 102,15,111,224 // movdqa %xmm0,%xmm4 - .byte 232,0,0,0,0 // call 9d8b <_sk_srcover_sse2_lowp+0x19> + .byte 232,0,0,0,0 // call 9d67 <_sk_srcover_sse2_lowp+0x19> .byte 88 // pop %eax - .byte 102,15,111,136,37,54,0,0 // movdqa 0x3625(%eax),%xmm1 + .byte 102,15,111,136,41,54,0,0 // movdqa 0x3629(%eax),%xmm1 .byte 102,15,111,193 // movdqa %xmm1,%xmm0 .byte 102,15,249,195 // psubw %xmm3,%xmm0 .byte 102,15,111,248 // movdqa %xmm0,%xmm7 @@ -66466,7 +66438,7 @@ _sk_dstover_sse2_lowp: .byte 87 // push %edi .byte 86 // push %esi .byte 131,236,80 // sub $0x50,%esp - .byte 232,0,0,0,0 // call 9e5b <_sk_dstover_sse2_lowp+0xd> + .byte 232,0,0,0,0 // call 9e37 <_sk_dstover_sse2_lowp+0xd> .byte 95 // pop %edi .byte 139,77,8 // mov 0x8(%ebp),%ecx .byte 139,85,16 // mov 0x10(%ebp),%edx @@ -66474,7 +66446,7 @@ _sk_dstover_sse2_lowp: .byte 139,69,12 // mov 0xc(%ebp),%eax .byte 102,15,111,101,56 // movdqa 0x38(%ebp),%xmm4 .byte 102,15,111,109,72 // movdqa 0x48(%ebp),%xmm5 - .byte 102,15,111,183,85,53,0,0 // movdqa 0x3555(%edi),%xmm6 + .byte 102,15,111,183,89,53,0,0 // movdqa 0x3559(%edi),%xmm6 .byte 102,15,111,254 // movdqa %xmm6,%xmm7 .byte 102,15,249,253 // psubw %xmm5,%xmm7 .byte 102,15,213,199 // pmullw %xmm7,%xmm0 @@ -66520,12 +66492,12 @@ _sk_modulate_sse2_lowp: .byte 87 // push %edi .byte 86 // push %esi .byte 131,236,80 // sub $0x50,%esp - .byte 232,0,0,0,0 // call 9f10 <_sk_modulate_sse2_lowp+0xd> + .byte 232,0,0,0,0 // call 9eec <_sk_modulate_sse2_lowp+0xd> .byte 88 // pop %eax .byte 102,15,111,109,40 // movdqa 0x28(%ebp),%xmm5 .byte 102,15,111,117,24 // movdqa 0x18(%ebp),%xmm6 .byte 102,15,213,198 // pmullw %xmm6,%xmm0 - .byte 102,15,111,184,160,52,0,0 // movdqa 0x34a0(%eax),%xmm7 + .byte 102,15,111,184,164,52,0,0 // movdqa 0x34a4(%eax),%xmm7 .byte 102,15,253,199 // paddw %xmm7,%xmm0 .byte 102,15,213,205 // pmullw %xmm5,%xmm1 .byte 102,15,253,207 // paddw %xmm7,%xmm1 @@ -66568,10 +66540,10 @@ _sk_multiply_sse2_lowp: .byte 87 // push %edi .byte 86 // push %esi .byte 131,236,80 // sub $0x50,%esp - .byte 232,0,0,0,0 // call 9fac <_sk_multiply_sse2_lowp+0xd> + .byte 232,0,0,0,0 // call 9f88 <_sk_multiply_sse2_lowp+0xd> .byte 88 // pop %eax .byte 102,15,111,109,24 // movdqa 0x18(%ebp),%xmm5 - .byte 102,15,111,160,4,52,0,0 // movdqa 0x3404(%eax),%xmm4 + .byte 102,15,111,160,8,52,0,0 // movdqa 0x3408(%eax),%xmm4 .byte 102,15,111,245 // movdqa %xmm5,%xmm6 .byte 102,15,253,244 // paddw %xmm4,%xmm6 .byte 102,15,249,117,72 // psubw 0x48(%ebp),%xmm6 @@ -66641,17 +66613,17 @@ _sk_plus__sse2_lowp: .byte 131,236,96 // sub $0x60,%esp .byte 102,15,111,225 // movdqa %xmm1,%xmm4 .byte 102,15,111,200 // movdqa %xmm0,%xmm1 - .byte 232,0,0,0,0 // call a0ad <_sk_plus__sse2_lowp+0x15> + .byte 232,0,0,0,0 // call a089 <_sk_plus__sse2_lowp+0x15> .byte 88 // pop %eax .byte 102,15,253,77,24 // paddw 0x18(%ebp),%xmm1 - .byte 102,15,111,168,19,51,0,0 // movdqa 0x3313(%eax),%xmm5 + .byte 102,15,111,168,23,51,0,0 // movdqa 0x3317(%eax),%xmm5 .byte 102,15,111,193 // movdqa %xmm1,%xmm0 .byte 102,15,217,197 // psubusw %xmm5,%xmm0 .byte 102,15,127,109,232 // movdqa %xmm5,-0x18(%ebp) .byte 102,15,239,255 // pxor %xmm7,%xmm7 .byte 102,15,117,199 // pcmpeqw %xmm7,%xmm0 .byte 102,15,219,200 // pand %xmm0,%xmm1 - .byte 102,15,111,176,3,51,0,0 // movdqa 0x3303(%eax),%xmm6 + .byte 102,15,111,176,7,51,0,0 // movdqa 0x3307(%eax),%xmm6 .byte 102,15,223,198 // pandn %xmm6,%xmm0 .byte 102,15,235,193 // por %xmm1,%xmm0 .byte 102,15,253,101,40 // paddw 0x28(%ebp),%xmm4 @@ -66712,14 +66684,14 @@ _sk_screen_sse2_lowp: .byte 131,236,80 // sub $0x50,%esp .byte 102,15,111,225 // movdqa %xmm1,%xmm4 .byte 102,15,111,200 // movdqa %xmm0,%xmm1 - .byte 232,0,0,0,0 // call a1a5 <_sk_screen_sse2_lowp+0x15> + .byte 232,0,0,0,0 // call a181 <_sk_screen_sse2_lowp+0x15> .byte 88 // pop %eax .byte 102,15,111,109,40 // movdqa 0x28(%ebp),%xmm5 .byte 102,15,111,117,24 // movdqa 0x18(%ebp),%xmm6 .byte 102,15,111,198 // movdqa %xmm6,%xmm0 .byte 102,15,253,193 // paddw %xmm1,%xmm0 .byte 102,15,213,206 // pmullw %xmm6,%xmm1 - .byte 102,15,111,176,11,50,0,0 // movdqa 0x320b(%eax),%xmm6 + .byte 102,15,111,176,15,50,0,0 // movdqa 0x320f(%eax),%xmm6 .byte 102,15,253,206 // paddw %xmm6,%xmm1 .byte 102,15,113,209,8 // psrlw $0x8,%xmm1 .byte 102,15,249,193 // psubw %xmm1,%xmm0 @@ -66777,9 +66749,9 @@ _sk_xor__sse2_lowp: .byte 86 // push %esi .byte 131,236,96 // sub $0x60,%esp .byte 102,15,127,93,232 // movdqa %xmm3,-0x18(%ebp) - .byte 232,0,0,0,0 // call a285 <_sk_xor__sse2_lowp+0x12> + .byte 232,0,0,0,0 // call a261 <_sk_xor__sse2_lowp+0x12> .byte 88 // pop %eax - .byte 102,15,111,176,43,49,0,0 // movdqa 0x312b(%eax),%xmm6 + .byte 102,15,111,176,47,49,0,0 // movdqa 0x312f(%eax),%xmm6 .byte 102,15,111,254 // movdqa %xmm6,%xmm7 .byte 102,15,249,125,72 // psubw 0x48(%ebp),%xmm7 .byte 102,15,213,199 // pmullw %xmm7,%xmm0 @@ -66846,7 +66818,7 @@ _sk_darken_sse2_lowp: .byte 15,41,85,200 // movaps %xmm2,-0x38(%ebp) .byte 102,15,111,225 // movdqa %xmm1,%xmm4 .byte 102,15,111,200 // movdqa %xmm0,%xmm1 - .byte 232,0,0,0,0 // call a37a <_sk_darken_sse2_lowp+0x25> + .byte 232,0,0,0,0 // call a356 <_sk_darken_sse2_lowp+0x25> .byte 88 // pop %eax .byte 102,15,111,117,72 // movdqa 0x48(%ebp),%xmm6 .byte 102,15,111,109,24 // movdqa 0x18(%ebp),%xmm5 @@ -66857,7 +66829,7 @@ _sk_darken_sse2_lowp: .byte 102,15,111,222 // movdqa %xmm6,%xmm3 .byte 102,15,111,197 // movdqa %xmm5,%xmm0 .byte 102,15,213,199 // pmullw %xmm7,%xmm0 - .byte 102,15,111,184,86,48,0,0 // movdqa 0x3056(%eax),%xmm7 + .byte 102,15,111,184,90,48,0,0 // movdqa 0x305a(%eax),%xmm7 .byte 102,15,111,241 // movdqa %xmm1,%xmm6 .byte 102,15,239,247 // pxor %xmm7,%xmm6 .byte 102,15,111,232 // movdqa %xmm0,%xmm5 @@ -66866,7 +66838,7 @@ _sk_darken_sse2_lowp: .byte 102,15,219,197 // pand %xmm5,%xmm0 .byte 102,15,223,233 // pandn %xmm1,%xmm5 .byte 102,15,235,232 // por %xmm0,%xmm5 - .byte 102,15,111,128,54,48,0,0 // movdqa 0x3036(%eax),%xmm0 + .byte 102,15,111,128,58,48,0,0 // movdqa 0x303a(%eax),%xmm0 .byte 102,15,127,69,232 // movdqa %xmm0,-0x18(%ebp) .byte 102,15,253,232 // paddw %xmm0,%xmm5 .byte 102,15,113,213,8 // psrlw $0x8,%xmm5 @@ -66957,7 +66929,7 @@ _sk_lighten_sse2_lowp: .byte 15,41,85,200 // movaps %xmm2,-0x38(%ebp) .byte 102,15,111,225 // movdqa %xmm1,%xmm4 .byte 102,15,111,200 // movdqa %xmm0,%xmm1 - .byte 232,0,0,0,0 // call a523 <_sk_lighten_sse2_lowp+0x25> + .byte 232,0,0,0,0 // call a4ff <_sk_lighten_sse2_lowp+0x25> .byte 88 // pop %eax .byte 102,15,111,109,24 // movdqa 0x18(%ebp),%xmm5 .byte 102,15,111,197 // movdqa %xmm5,%xmm0 @@ -66966,7 +66938,7 @@ _sk_lighten_sse2_lowp: .byte 102,15,213,77,72 // pmullw 0x48(%ebp),%xmm1 .byte 102,15,111,197 // movdqa %xmm5,%xmm0 .byte 102,15,213,198 // pmullw %xmm6,%xmm0 - .byte 102,15,111,184,173,46,0,0 // movdqa 0x2ead(%eax),%xmm7 + .byte 102,15,111,184,177,46,0,0 // movdqa 0x2eb1(%eax),%xmm7 .byte 102,15,111,241 // movdqa %xmm1,%xmm6 .byte 102,15,239,247 // pxor %xmm7,%xmm6 .byte 102,15,111,232 // movdqa %xmm0,%xmm5 @@ -66975,7 +66947,7 @@ _sk_lighten_sse2_lowp: .byte 102,15,219,205 // pand %xmm5,%xmm1 .byte 102,15,223,232 // pandn %xmm0,%xmm5 .byte 102,15,235,233 // por %xmm1,%xmm5 - .byte 102,15,111,128,141,46,0,0 // movdqa 0x2e8d(%eax),%xmm0 + .byte 102,15,111,128,145,46,0,0 // movdqa 0x2e91(%eax),%xmm0 .byte 102,15,253,232 // paddw %xmm0,%xmm5 .byte 102,15,111,208 // movdqa %xmm0,%xmm2 .byte 102,15,127,85,232 // movdqa %xmm2,-0x18(%ebp) @@ -67065,7 +67037,7 @@ _sk_difference_sse2_lowp: .byte 15,41,85,184 // movaps %xmm2,-0x48(%ebp) .byte 102,15,111,225 // movdqa %xmm1,%xmm4 .byte 102,15,111,200 // movdqa %xmm0,%xmm1 - .byte 232,0,0,0,0 // call a6c1 <_sk_difference_sse2_lowp+0x25> + .byte 232,0,0,0,0 // call a69d <_sk_difference_sse2_lowp+0x25> .byte 88 // pop %eax .byte 102,15,111,117,72 // movdqa 0x48(%ebp),%xmm6 .byte 102,15,111,109,24 // movdqa 0x18(%ebp),%xmm5 @@ -67076,7 +67048,7 @@ _sk_difference_sse2_lowp: .byte 102,15,111,222 // movdqa %xmm6,%xmm3 .byte 102,15,111,197 // movdqa %xmm5,%xmm0 .byte 102,15,213,199 // pmullw %xmm7,%xmm0 - .byte 102,15,111,184,15,45,0,0 // movdqa 0x2d0f(%eax),%xmm7 + .byte 102,15,111,184,19,45,0,0 // movdqa 0x2d13(%eax),%xmm7 .byte 102,15,111,241 // movdqa %xmm1,%xmm6 .byte 102,15,239,247 // pxor %xmm7,%xmm6 .byte 102,15,111,232 // movdqa %xmm0,%xmm5 @@ -67085,11 +67057,11 @@ _sk_difference_sse2_lowp: .byte 102,15,219,205 // pand %xmm5,%xmm1 .byte 102,15,223,232 // pandn %xmm0,%xmm5 .byte 102,15,235,233 // por %xmm1,%xmm5 - .byte 102,15,111,128,239,44,0,0 // movdqa 0x2cef(%eax),%xmm0 + .byte 102,15,111,128,243,44,0,0 // movdqa 0x2cf3(%eax),%xmm0 .byte 102,15,127,69,216 // movdqa %xmm0,-0x28(%ebp) .byte 102,15,253,232 // paddw %xmm0,%xmm5 .byte 102,15,113,213,7 // psrlw $0x7,%xmm5 - .byte 102,15,111,128,31,45,0,0 // movdqa 0x2d1f(%eax),%xmm0 + .byte 102,15,111,128,35,45,0,0 // movdqa 0x2d23(%eax),%xmm0 .byte 102,15,127,69,232 // movdqa %xmm0,-0x18(%ebp) .byte 102,15,219,232 // pand %xmm0,%xmm5 .byte 102,15,249,213 // psubw %xmm5,%xmm2 @@ -67178,16 +67150,16 @@ _sk_exclusion_sse2_lowp: .byte 131,236,80 // sub $0x50,%esp .byte 102,15,111,225 // movdqa %xmm1,%xmm4 .byte 102,15,111,200 // movdqa %xmm0,%xmm1 - .byte 232,0,0,0,0 // call a875 <_sk_exclusion_sse2_lowp+0x15> + .byte 232,0,0,0,0 // call a851 <_sk_exclusion_sse2_lowp+0x15> .byte 88 // pop %eax .byte 102,15,111,109,24 // movdqa 0x18(%ebp),%xmm5 .byte 102,15,111,197 // movdqa %xmm5,%xmm0 .byte 102,15,253,193 // paddw %xmm1,%xmm0 .byte 102,15,213,205 // pmullw %xmm5,%xmm1 - .byte 102,15,111,184,59,43,0,0 // movdqa 0x2b3b(%eax),%xmm7 + .byte 102,15,111,184,63,43,0,0 // movdqa 0x2b3f(%eax),%xmm7 .byte 102,15,253,207 // paddw %xmm7,%xmm1 .byte 102,15,113,209,7 // psrlw $0x7,%xmm1 - .byte 102,15,111,176,107,43,0,0 // movdqa 0x2b6b(%eax),%xmm6 + .byte 102,15,111,176,111,43,0,0 // movdqa 0x2b6f(%eax),%xmm6 .byte 102,15,219,206 // pand %xmm6,%xmm1 .byte 102,15,249,193 // psubw %xmm1,%xmm0 .byte 102,15,111,109,40 // movdqa 0x28(%ebp),%xmm5 @@ -67248,9 +67220,9 @@ _sk_hardlight_sse2_lowp: .byte 15,41,85,152 // movaps %xmm2,-0x68(%ebp) .byte 102,15,111,233 // movdqa %xmm1,%xmm5 .byte 102,15,111,224 // movdqa %xmm0,%xmm4 - .byte 232,0,0,0,0 // call a96f <_sk_hardlight_sse2_lowp+0x1c> + .byte 232,0,0,0,0 // call a94b <_sk_hardlight_sse2_lowp+0x1c> .byte 88 // pop %eax - .byte 102,15,111,184,65,42,0,0 // movdqa 0x2a41(%eax),%xmm7 + .byte 102,15,111,184,69,42,0,0 // movdqa 0x2a45(%eax),%xmm7 .byte 102,15,127,125,200 // movdqa %xmm7,-0x38(%ebp) .byte 102,15,111,215 // movdqa %xmm7,%xmm2 .byte 102,15,249,85,72 // psubw 0x48(%ebp),%xmm2 @@ -67277,7 +67249,7 @@ _sk_hardlight_sse2_lowp: .byte 102,15,111,214 // movdqa %xmm6,%xmm2 .byte 102,15,249,209 // psubw %xmm1,%xmm2 .byte 102,15,253,228 // paddw %xmm4,%xmm4 - .byte 102,15,111,128,97,42,0,0 // movdqa 0x2a61(%eax),%xmm0 + .byte 102,15,111,128,101,42,0,0 // movdqa 0x2a65(%eax),%xmm0 .byte 102,15,239,216 // pxor %xmm0,%xmm3 .byte 102,15,127,93,184 // movdqa %xmm3,-0x48(%ebp) .byte 102,15,111,204 // movdqa %xmm4,%xmm1 @@ -67384,10 +67356,10 @@ _sk_overlay_sse2_lowp: .byte 15,41,85,152 // movaps %xmm2,-0x68(%ebp) .byte 15,41,141,120,255,255,255 // movaps %xmm1,-0x88(%ebp) .byte 102,15,111,200 // movdqa %xmm0,%xmm1 - .byte 232,0,0,0,0 // call ab91 <_sk_overlay_sse2_lowp+0x1f> + .byte 232,0,0,0,0 // call ab6d <_sk_overlay_sse2_lowp+0x1f> .byte 88 // pop %eax .byte 102,15,111,69,72 // movdqa 0x48(%ebp),%xmm0 - .byte 102,15,111,184,31,40,0,0 // movdqa 0x281f(%eax),%xmm7 + .byte 102,15,111,184,35,40,0,0 // movdqa 0x2823(%eax),%xmm7 .byte 102,15,127,125,232 // movdqa %xmm7,-0x18(%ebp) .byte 102,15,111,215 // movdqa %xmm7,%xmm2 .byte 102,15,249,208 // psubw %xmm0,%xmm2 @@ -67414,7 +67386,7 @@ _sk_overlay_sse2_lowp: .byte 102,15,249,234 // psubw %xmm2,%xmm5 .byte 102,15,111,195 // movdqa %xmm3,%xmm0 .byte 102,15,253,192 // paddw %xmm0,%xmm0 - .byte 102,15,111,144,63,40,0,0 // movdqa 0x283f(%eax),%xmm2 + .byte 102,15,111,144,67,40,0,0 // movdqa 0x2843(%eax),%xmm2 .byte 102,15,127,85,184 // movdqa %xmm2,-0x48(%ebp) .byte 102,15,239,226 // pxor %xmm2,%xmm4 .byte 102,15,239,194 // pxor %xmm2,%xmm0 @@ -67544,10 +67516,10 @@ _sk_load_8888_sse2_lowp: .byte 128,225,7 // and $0x7,%cl .byte 254,201 // dec %cl .byte 128,249,6 // cmp $0x6,%cl - .byte 232,0,0,0,0 // call ae00 <_sk_load_8888_sse2_lowp+0x30> + .byte 232,0,0,0,0 // call addc <_sk_load_8888_sse2_lowp+0x30> .byte 95 // pop %edi .byte 139,117,16 // mov 0x10(%ebp),%esi - .byte 119,32 // ja ae26 <_sk_load_8888_sse2_lowp+0x56> + .byte 119,32 // ja ae02 <_sk_load_8888_sse2_lowp+0x56> .byte 102,15,239,246 // pxor %xmm6,%xmm6 .byte 15,182,201 // movzbl %cl,%ecx .byte 139,140,143,52,1,0,0 // mov 0x134(%edi,%ecx,4),%ecx @@ -67556,14 +67528,14 @@ _sk_load_8888_sse2_lowp: .byte 255,225 // jmp *%ecx .byte 243,15,16,28,179 // movss (%ebx,%esi,4),%xmm3 .byte 15,87,246 // xorps %xmm6,%xmm6 - .byte 235,73 // jmp ae6f <_sk_load_8888_sse2_lowp+0x9f> + .byte 235,73 // jmp ae4b <_sk_load_8888_sse2_lowp+0x9f> .byte 102,15,16,28,179 // movupd (%ebx,%esi,4),%xmm3 .byte 15,16,116,179,16 // movups 0x10(%ebx,%esi,4),%xmm6 - .byte 235,61 // jmp ae6f <_sk_load_8888_sse2_lowp+0x9f> + .byte 235,61 // jmp ae4b <_sk_load_8888_sse2_lowp+0x9f> .byte 102,15,110,68,179,8 // movd 0x8(%ebx,%esi,4),%xmm0 .byte 102,15,112,216,69 // pshufd $0x45,%xmm0,%xmm3 .byte 102,15,18,28,179 // movlpd (%ebx,%esi,4),%xmm3 - .byte 235,43 // jmp ae6f <_sk_load_8888_sse2_lowp+0x9f> + .byte 235,43 // jmp ae4b <_sk_load_8888_sse2_lowp+0x9f> .byte 102,15,110,68,179,24 // movd 0x18(%ebx,%esi,4),%xmm0 .byte 102,15,112,240,69 // pshufd $0x45,%xmm0,%xmm6 .byte 243,15,16,68,179,20 // movss 0x14(%ebx,%esi,4),%xmm0 @@ -67580,7 +67552,7 @@ _sk_load_8888_sse2_lowp: .byte 102,15,114,240,16 // pslld $0x10,%xmm0 .byte 102,15,114,224,16 // psrad $0x10,%xmm0 .byte 102,15,107,200 // packssdw %xmm0,%xmm1 - .byte 102,15,111,175,176,37,0,0 // movdqa 0x25b0(%edi),%xmm5 + .byte 102,15,111,175,180,37,0,0 // movdqa 0x25b4(%edi),%xmm5 .byte 102,15,111,193 // movdqa %xmm1,%xmm0 .byte 102,15,219,197 // pand %xmm5,%xmm0 .byte 102,15,113,209,8 // psrlw $0x8,%xmm1 @@ -67660,10 +67632,10 @@ _sk_load_8888_dst_sse2_lowp: .byte 128,225,7 // and $0x7,%cl .byte 254,201 // dec %cl .byte 128,249,6 // cmp $0x6,%cl - .byte 232,0,0,0,0 // call af8d <_sk_load_8888_dst_sse2_lowp+0x3d> + .byte 232,0,0,0,0 // call af69 <_sk_load_8888_dst_sse2_lowp+0x3d> .byte 95 // pop %edi .byte 139,117,16 // mov 0x10(%ebp),%esi - .byte 119,32 // ja afb3 <_sk_load_8888_dst_sse2_lowp+0x63> + .byte 119,32 // ja af8f <_sk_load_8888_dst_sse2_lowp+0x63> .byte 102,15,239,219 // pxor %xmm3,%xmm3 .byte 15,182,201 // movzbl %cl,%ecx .byte 139,140,143,59,1,0,0 // mov 0x13b(%edi,%ecx,4),%ecx @@ -67672,14 +67644,14 @@ _sk_load_8888_dst_sse2_lowp: .byte 255,225 // jmp *%ecx .byte 243,15,16,60,179 // movss (%ebx,%esi,4),%xmm7 .byte 15,87,219 // xorps %xmm3,%xmm3 - .byte 235,73 // jmp affc <_sk_load_8888_dst_sse2_lowp+0xac> + .byte 235,73 // jmp afd8 <_sk_load_8888_dst_sse2_lowp+0xac> .byte 102,15,16,60,179 // movupd (%ebx,%esi,4),%xmm7 .byte 15,16,92,179,16 // movups 0x10(%ebx,%esi,4),%xmm3 - .byte 235,61 // jmp affc <_sk_load_8888_dst_sse2_lowp+0xac> + .byte 235,61 // jmp afd8 <_sk_load_8888_dst_sse2_lowp+0xac> .byte 102,15,110,84,179,8 // movd 0x8(%ebx,%esi,4),%xmm2 .byte 102,15,112,250,69 // pshufd $0x45,%xmm2,%xmm7 .byte 102,15,18,60,179 // movlpd (%ebx,%esi,4),%xmm7 - .byte 235,43 // jmp affc <_sk_load_8888_dst_sse2_lowp+0xac> + .byte 235,43 // jmp afd8 <_sk_load_8888_dst_sse2_lowp+0xac> .byte 102,15,110,84,179,24 // movd 0x18(%ebx,%esi,4),%xmm2 .byte 102,15,112,218,69 // pshufd $0x45,%xmm2,%xmm3 .byte 243,15,16,84,179,20 // movss 0x14(%ebx,%esi,4),%xmm2 @@ -67696,7 +67668,7 @@ _sk_load_8888_dst_sse2_lowp: .byte 102,15,114,242,16 // pslld $0x10,%xmm2 .byte 102,15,114,226,16 // psrad $0x10,%xmm2 .byte 102,15,107,242 // packssdw %xmm2,%xmm6 - .byte 102,15,111,151,35,36,0,0 // movdqa 0x2423(%edi),%xmm2 + .byte 102,15,111,151,39,36,0,0 // movdqa 0x2427(%edi),%xmm2 .byte 102,15,111,206 // movdqa %xmm6,%xmm1 .byte 102,15,219,202 // pand %xmm2,%xmm1 .byte 102,15,113,214,8 // psrlw $0x8,%xmm6 @@ -67790,19 +67762,19 @@ _sk_store_8888_sse2_lowp: .byte 128,227,7 // and $0x7,%bl .byte 254,203 // dec %bl .byte 128,251,6 // cmp $0x6,%bl - .byte 232,0,0,0,0 // call b158 <_sk_store_8888_sse2_lowp+0x74> + .byte 232,0,0,0,0 // call b134 <_sk_store_8888_sse2_lowp+0x74> .byte 89 // pop %ecx .byte 139,117,16 // mov 0x10(%ebp),%esi .byte 15,40,109,40 // movaps 0x28(%ebp),%xmm5 - .byte 119,19 // ja b175 <_sk_store_8888_sse2_lowp+0x91> + .byte 119,19 // ja b151 <_sk_store_8888_sse2_lowp+0x91> .byte 15,182,219 // movzbl %bl,%ebx .byte 3,140,153,184,0,0,0 // add 0xb8(%ecx,%ebx,4),%ecx .byte 255,225 // jmp *%ecx .byte 102,15,126,60,183 // movd %xmm7,(%edi,%esi,4) - .byte 235,93 // jmp b1d2 <_sk_store_8888_sse2_lowp+0xee> + .byte 235,93 // jmp b1ae <_sk_store_8888_sse2_lowp+0xee> .byte 243,15,127,60,183 // movdqu %xmm7,(%edi,%esi,4) .byte 243,15,127,116,183,16 // movdqu %xmm6,0x10(%edi,%esi,4) - .byte 235,80 // jmp b1d2 <_sk_store_8888_sse2_lowp+0xee> + .byte 235,80 // jmp b1ae <_sk_store_8888_sse2_lowp+0xee> .byte 102,15,111,244 // movdqa %xmm4,%xmm6 .byte 15,40,227 // movaps %xmm3,%xmm4 .byte 102,15,112,223,78 // pshufd $0x4e,%xmm7,%xmm3 @@ -67810,7 +67782,7 @@ _sk_store_8888_sse2_lowp: .byte 15,40,220 // movaps %xmm4,%xmm3 .byte 102,15,111,230 // movdqa %xmm6,%xmm4 .byte 102,15,214,60,183 // movq %xmm7,(%edi,%esi,4) - .byte 235,48 // jmp b1d2 <_sk_store_8888_sse2_lowp+0xee> + .byte 235,48 // jmp b1ae <_sk_store_8888_sse2_lowp+0xee> .byte 102,15,112,222,78 // pshufd $0x4e,%xmm6,%xmm3 .byte 102,15,126,92,183,24 // movd %xmm3,0x18(%edi,%esi,4) .byte 15,40,93,72 // movaps 0x48(%ebp),%xmm3 @@ -67847,7 +67819,7 @@ _sk_store_8888_sse2_lowp: .byte 0,0 // add %al,(%eax) .byte 42,0 // sub (%eax),%al .byte 0,0 // add %al,(%eax) - .byte 117,0 // jne b21e <_sk_store_8888_sse2_lowp+0x13a> + .byte 117,0 // jne b1fa <_sk_store_8888_sse2_lowp+0x13a> .byte 0,0 // add %al,(%eax) .byte 111 // outsl %ds:(%esi),(%dx) .byte 0,0 // add %al,(%eax) @@ -67879,10 +67851,10 @@ _sk_load_bgra_sse2_lowp: .byte 128,225,7 // and $0x7,%cl .byte 254,201 // dec %cl .byte 128,249,6 // cmp $0x6,%cl - .byte 232,0,0,0,0 // call b25c <_sk_load_bgra_sse2_lowp+0x30> + .byte 232,0,0,0,0 // call b238 <_sk_load_bgra_sse2_lowp+0x30> .byte 95 // pop %edi .byte 139,117,16 // mov 0x10(%ebp),%esi - .byte 119,32 // ja b282 <_sk_load_bgra_sse2_lowp+0x56> + .byte 119,32 // ja b25e <_sk_load_bgra_sse2_lowp+0x56> .byte 102,15,239,246 // pxor %xmm6,%xmm6 .byte 15,182,201 // movzbl %cl,%ecx .byte 139,140,143,52,1,0,0 // mov 0x134(%edi,%ecx,4),%ecx @@ -67891,14 +67863,14 @@ _sk_load_bgra_sse2_lowp: .byte 255,225 // jmp *%ecx .byte 243,15,16,28,179 // movss (%ebx,%esi,4),%xmm3 .byte 15,87,246 // xorps %xmm6,%xmm6 - .byte 235,73 // jmp b2cb <_sk_load_bgra_sse2_lowp+0x9f> + .byte 235,73 // jmp b2a7 <_sk_load_bgra_sse2_lowp+0x9f> .byte 102,15,16,28,179 // movupd (%ebx,%esi,4),%xmm3 .byte 15,16,116,179,16 // movups 0x10(%ebx,%esi,4),%xmm6 - .byte 235,61 // jmp b2cb <_sk_load_bgra_sse2_lowp+0x9f> + .byte 235,61 // jmp b2a7 <_sk_load_bgra_sse2_lowp+0x9f> .byte 102,15,110,68,179,8 // movd 0x8(%ebx,%esi,4),%xmm0 .byte 102,15,112,216,69 // pshufd $0x45,%xmm0,%xmm3 .byte 102,15,18,28,179 // movlpd (%ebx,%esi,4),%xmm3 - .byte 235,43 // jmp b2cb <_sk_load_bgra_sse2_lowp+0x9f> + .byte 235,43 // jmp b2a7 <_sk_load_bgra_sse2_lowp+0x9f> .byte 102,15,110,68,179,24 // movd 0x18(%ebx,%esi,4),%xmm0 .byte 102,15,112,240,69 // pshufd $0x45,%xmm0,%xmm6 .byte 243,15,16,68,179,20 // movss 0x14(%ebx,%esi,4),%xmm0 @@ -67915,7 +67887,7 @@ _sk_load_bgra_sse2_lowp: .byte 102,15,114,240,16 // pslld $0x10,%xmm0 .byte 102,15,114,224,16 // psrad $0x10,%xmm0 .byte 102,15,107,200 // packssdw %xmm0,%xmm1 - .byte 102,15,111,175,84,33,0,0 // movdqa 0x2154(%edi),%xmm5 + .byte 102,15,111,175,88,33,0,0 // movdqa 0x2158(%edi),%xmm5 .byte 102,15,111,209 // movdqa %xmm1,%xmm2 .byte 102,15,219,213 // pand %xmm5,%xmm2 .byte 102,15,113,209,8 // psrlw $0x8,%xmm1 @@ -67995,10 +67967,10 @@ _sk_load_bgra_dst_sse2_lowp: .byte 128,225,7 // and $0x7,%cl .byte 254,201 // dec %cl .byte 128,249,6 // cmp $0x6,%cl - .byte 232,0,0,0,0 // call b3e9 <_sk_load_bgra_dst_sse2_lowp+0x3d> + .byte 232,0,0,0,0 // call b3c5 <_sk_load_bgra_dst_sse2_lowp+0x3d> .byte 95 // pop %edi .byte 139,117,16 // mov 0x10(%ebp),%esi - .byte 119,32 // ja b40f <_sk_load_bgra_dst_sse2_lowp+0x63> + .byte 119,32 // ja b3eb <_sk_load_bgra_dst_sse2_lowp+0x63> .byte 102,15,239,219 // pxor %xmm3,%xmm3 .byte 15,182,201 // movzbl %cl,%ecx .byte 139,140,143,59,1,0,0 // mov 0x13b(%edi,%ecx,4),%ecx @@ -68007,14 +67979,14 @@ _sk_load_bgra_dst_sse2_lowp: .byte 255,225 // jmp *%ecx .byte 243,15,16,60,179 // movss (%ebx,%esi,4),%xmm7 .byte 15,87,219 // xorps %xmm3,%xmm3 - .byte 235,73 // jmp b458 <_sk_load_bgra_dst_sse2_lowp+0xac> + .byte 235,73 // jmp b434 <_sk_load_bgra_dst_sse2_lowp+0xac> .byte 102,15,16,60,179 // movupd (%ebx,%esi,4),%xmm7 .byte 15,16,92,179,16 // movups 0x10(%ebx,%esi,4),%xmm3 - .byte 235,61 // jmp b458 <_sk_load_bgra_dst_sse2_lowp+0xac> + .byte 235,61 // jmp b434 <_sk_load_bgra_dst_sse2_lowp+0xac> .byte 102,15,110,84,179,8 // movd 0x8(%ebx,%esi,4),%xmm2 .byte 102,15,112,250,69 // pshufd $0x45,%xmm2,%xmm7 .byte 102,15,18,60,179 // movlpd (%ebx,%esi,4),%xmm7 - .byte 235,43 // jmp b458 <_sk_load_bgra_dst_sse2_lowp+0xac> + .byte 235,43 // jmp b434 <_sk_load_bgra_dst_sse2_lowp+0xac> .byte 102,15,110,84,179,24 // movd 0x18(%ebx,%esi,4),%xmm2 .byte 102,15,112,218,69 // pshufd $0x45,%xmm2,%xmm3 .byte 243,15,16,84,179,20 // movss 0x14(%ebx,%esi,4),%xmm2 @@ -68031,7 +68003,7 @@ _sk_load_bgra_dst_sse2_lowp: .byte 102,15,114,242,16 // pslld $0x10,%xmm2 .byte 102,15,114,226,16 // psrad $0x10,%xmm2 .byte 102,15,107,242 // packssdw %xmm2,%xmm6 - .byte 102,15,111,151,199,31,0,0 // movdqa 0x1fc7(%edi),%xmm2 + .byte 102,15,111,151,203,31,0,0 // movdqa 0x1fcb(%edi),%xmm2 .byte 102,15,111,206 // movdqa %xmm6,%xmm1 .byte 102,15,219,202 // pand %xmm2,%xmm1 .byte 102,15,113,214,8 // psrlw $0x8,%xmm6 @@ -68125,19 +68097,19 @@ _sk_store_bgra_sse2_lowp: .byte 128,227,7 // and $0x7,%bl .byte 254,203 // dec %bl .byte 128,251,6 // cmp $0x6,%bl - .byte 232,0,0,0,0 // call b5b4 <_sk_store_bgra_sse2_lowp+0x74> + .byte 232,0,0,0,0 // call b590 <_sk_store_bgra_sse2_lowp+0x74> .byte 89 // pop %ecx .byte 139,117,16 // mov 0x10(%ebp),%esi .byte 15,40,109,40 // movaps 0x28(%ebp),%xmm5 - .byte 119,19 // ja b5d1 <_sk_store_bgra_sse2_lowp+0x91> + .byte 119,19 // ja b5ad <_sk_store_bgra_sse2_lowp+0x91> .byte 15,182,219 // movzbl %bl,%ebx .byte 3,140,153,184,0,0,0 // add 0xb8(%ecx,%ebx,4),%ecx .byte 255,225 // jmp *%ecx .byte 102,15,126,60,183 // movd %xmm7,(%edi,%esi,4) - .byte 235,93 // jmp b62e <_sk_store_bgra_sse2_lowp+0xee> + .byte 235,93 // jmp b60a <_sk_store_bgra_sse2_lowp+0xee> .byte 243,15,127,60,183 // movdqu %xmm7,(%edi,%esi,4) .byte 243,15,127,116,183,16 // movdqu %xmm6,0x10(%edi,%esi,4) - .byte 235,80 // jmp b62e <_sk_store_bgra_sse2_lowp+0xee> + .byte 235,80 // jmp b60a <_sk_store_bgra_sse2_lowp+0xee> .byte 102,15,111,244 // movdqa %xmm4,%xmm6 .byte 15,40,227 // movaps %xmm3,%xmm4 .byte 102,15,112,223,78 // pshufd $0x4e,%xmm7,%xmm3 @@ -68145,7 +68117,7 @@ _sk_store_bgra_sse2_lowp: .byte 15,40,220 // movaps %xmm4,%xmm3 .byte 102,15,111,230 // movdqa %xmm6,%xmm4 .byte 102,15,214,60,183 // movq %xmm7,(%edi,%esi,4) - .byte 235,48 // jmp b62e <_sk_store_bgra_sse2_lowp+0xee> + .byte 235,48 // jmp b60a <_sk_store_bgra_sse2_lowp+0xee> .byte 102,15,112,222,78 // pshufd $0x4e,%xmm6,%xmm3 .byte 102,15,126,92,183,24 // movd %xmm3,0x18(%edi,%esi,4) .byte 15,40,93,72 // movaps 0x48(%ebp),%xmm3 @@ -68182,7 +68154,7 @@ _sk_store_bgra_sse2_lowp: .byte 0,0 // add %al,(%eax) .byte 42,0 // sub (%eax),%al .byte 0,0 // add %al,(%eax) - .byte 117,0 // jne b67a <_sk_store_bgra_sse2_lowp+0x13a> + .byte 117,0 // jne b656 <_sk_store_bgra_sse2_lowp+0x13a> .byte 0,0 // add %al,(%eax) .byte 111 // outsl %ds:(%esi),(%dx) .byte 0,0 // add %al,(%eax) @@ -68217,10 +68189,10 @@ _sk_load_565_sse2_lowp: .byte 128,225,7 // and $0x7,%cl .byte 254,201 // dec %cl .byte 128,249,6 // cmp $0x6,%cl - .byte 232,0,0,0,0 // call b6c3 <_sk_load_565_sse2_lowp+0x3b> + .byte 232,0,0,0,0 // call b69f <_sk_load_565_sse2_lowp+0x3b> .byte 94 // pop %esi .byte 139,125,16 // mov 0x10(%ebp),%edi - .byte 119,28 // ja b6e5 <_sk_load_565_sse2_lowp+0x5d> + .byte 119,28 // ja b6c1 <_sk_load_565_sse2_lowp+0x5d> .byte 102,15,239,192 // pxor %xmm0,%xmm0 .byte 15,182,201 // movzbl %cl,%ecx .byte 139,140,142,245,0,0,0 // mov 0xf5(%esi,%ecx,4),%ecx @@ -68228,14 +68200,14 @@ _sk_load_565_sse2_lowp: .byte 255,225 // jmp *%ecx .byte 15,183,12,123 // movzwl (%ebx,%edi,2),%ecx .byte 102,15,110,193 // movd %ecx,%xmm0 - .byte 235,59 // jmp b720 <_sk_load_565_sse2_lowp+0x98> + .byte 235,59 // jmp b6fc <_sk_load_565_sse2_lowp+0x98> .byte 243,15,111,4,123 // movdqu (%ebx,%edi,2),%xmm0 - .byte 235,52 // jmp b720 <_sk_load_565_sse2_lowp+0x98> + .byte 235,52 // jmp b6fc <_sk_load_565_sse2_lowp+0x98> .byte 102,15,239,192 // pxor %xmm0,%xmm0 .byte 102,15,196,68,123,4,2 // pinsrw $0x2,0x4(%ebx,%edi,2),%xmm0 .byte 243,15,16,12,123 // movss (%ebx,%edi,2),%xmm1 .byte 243,15,16,193 // movss %xmm1,%xmm0 - .byte 235,30 // jmp b720 <_sk_load_565_sse2_lowp+0x98> + .byte 235,30 // jmp b6fc <_sk_load_565_sse2_lowp+0x98> .byte 102,15,239,192 // pxor %xmm0,%xmm0 .byte 102,15,196,68,123,12,6 // pinsrw $0x6,0xc(%ebx,%edi,2),%xmm0 .byte 102,15,196,68,123,10,5 // pinsrw $0x5,0xa(%ebx,%edi,2),%xmm0 @@ -68243,11 +68215,11 @@ _sk_load_565_sse2_lowp: .byte 102,15,18,4,123 // movlpd (%ebx,%edi,2),%xmm0 .byte 102,15,111,248 // movdqa %xmm0,%xmm7 .byte 102,15,113,215,8 // psrlw $0x8,%xmm7 - .byte 102,15,219,190,45,29,0,0 // pand 0x1d2d(%esi),%xmm7 + .byte 102,15,219,190,49,29,0,0 // pand 0x1d31(%esi),%xmm7 .byte 102,15,111,200 // movdqa %xmm0,%xmm1 .byte 102,15,113,209,5 // psrlw $0x5,%xmm1 - .byte 102,15,219,142,61,29,0,0 // pand 0x1d3d(%esi),%xmm1 - .byte 102,15,111,150,77,29,0,0 // movdqa 0x1d4d(%esi),%xmm2 + .byte 102,15,219,142,65,29,0,0 // pand 0x1d41(%esi),%xmm1 + .byte 102,15,111,150,81,29,0,0 // movdqa 0x1d51(%esi),%xmm2 .byte 102,15,219,208 // pand %xmm0,%xmm2 .byte 102,15,113,208,13 // psrlw $0xd,%xmm0 .byte 102,15,235,199 // por %xmm7,%xmm0 @@ -68269,7 +68241,7 @@ _sk_load_565_sse2_lowp: .byte 137,124,36,8 // mov %edi,0x8(%esp) .byte 137,76,36,4 // mov %ecx,0x4(%esp) .byte 137,20,36 // mov %edx,(%esp) - .byte 15,40,158,237,28,0,0 // movaps 0x1ced(%esi),%xmm3 + .byte 15,40,158,241,28,0,0 // movaps 0x1cf1(%esi),%xmm3 .byte 255,80,4 // call *0x4(%eax) .byte 131,196,92 // add $0x5c,%esp .byte 94 // pop %esi @@ -68315,10 +68287,10 @@ _sk_load_565_dst_sse2_lowp: .byte 128,225,7 // and $0x7,%cl .byte 254,201 // dec %cl .byte 128,249,6 // cmp $0x6,%cl - .byte 232,0,0,0,0 // call b7ff <_sk_load_565_dst_sse2_lowp+0x2b> + .byte 232,0,0,0,0 // call b7db <_sk_load_565_dst_sse2_lowp+0x2b> .byte 95 // pop %edi .byte 139,117,16 // mov 0x10(%ebp),%esi - .byte 119,28 // ja b821 <_sk_load_565_dst_sse2_lowp+0x4d> + .byte 119,28 // ja b7fd <_sk_load_565_dst_sse2_lowp+0x4d> .byte 102,15,239,228 // pxor %xmm4,%xmm4 .byte 15,182,201 // movzbl %cl,%ecx .byte 139,140,143,249,0,0,0 // mov 0xf9(%edi,%ecx,4),%ecx @@ -68326,14 +68298,14 @@ _sk_load_565_dst_sse2_lowp: .byte 255,225 // jmp *%ecx .byte 15,183,12,115 // movzwl (%ebx,%esi,2),%ecx .byte 102,15,110,225 // movd %ecx,%xmm4 - .byte 235,59 // jmp b85c <_sk_load_565_dst_sse2_lowp+0x88> + .byte 235,59 // jmp b838 <_sk_load_565_dst_sse2_lowp+0x88> .byte 243,15,111,36,115 // movdqu (%ebx,%esi,2),%xmm4 - .byte 235,52 // jmp b85c <_sk_load_565_dst_sse2_lowp+0x88> + .byte 235,52 // jmp b838 <_sk_load_565_dst_sse2_lowp+0x88> .byte 102,15,239,228 // pxor %xmm4,%xmm4 .byte 102,15,196,100,115,4,2 // pinsrw $0x2,0x4(%ebx,%esi,2),%xmm4 .byte 243,15,16,44,115 // movss (%ebx,%esi,2),%xmm5 .byte 243,15,16,229 // movss %xmm5,%xmm4 - .byte 235,30 // jmp b85c <_sk_load_565_dst_sse2_lowp+0x88> + .byte 235,30 // jmp b838 <_sk_load_565_dst_sse2_lowp+0x88> .byte 102,15,239,228 // pxor %xmm4,%xmm4 .byte 102,15,196,100,115,12,6 // pinsrw $0x6,0xc(%ebx,%esi,2),%xmm4 .byte 102,15,196,100,115,10,5 // pinsrw $0x5,0xa(%ebx,%esi,2),%xmm4 @@ -68341,11 +68313,11 @@ _sk_load_565_dst_sse2_lowp: .byte 102,15,18,36,115 // movlpd (%ebx,%esi,2),%xmm4 .byte 102,15,111,244 // movdqa %xmm4,%xmm6 .byte 102,15,113,214,8 // psrlw $0x8,%xmm6 - .byte 102,15,219,183,241,27,0,0 // pand 0x1bf1(%edi),%xmm6 + .byte 102,15,219,183,245,27,0,0 // pand 0x1bf5(%edi),%xmm6 .byte 102,15,111,236 // movdqa %xmm4,%xmm5 .byte 102,15,113,213,5 // psrlw $0x5,%xmm5 - .byte 102,15,219,175,1,28,0,0 // pand 0x1c01(%edi),%xmm5 - .byte 102,15,111,191,17,28,0,0 // movdqa 0x1c11(%edi),%xmm7 + .byte 102,15,219,175,5,28,0,0 // pand 0x1c05(%edi),%xmm5 + .byte 102,15,111,191,21,28,0,0 // movdqa 0x1c15(%edi),%xmm7 .byte 102,15,219,252 // pand %xmm4,%xmm7 .byte 102,15,113,212,13 // psrlw $0xd,%xmm4 .byte 102,15,235,230 // por %xmm6,%xmm4 @@ -68358,7 +68330,7 @@ _sk_load_565_dst_sse2_lowp: .byte 102,15,113,215,2 // psrlw $0x2,%xmm7 .byte 102,15,235,254 // por %xmm6,%xmm7 .byte 141,72,8 // lea 0x8(%eax),%ecx - .byte 15,40,183,177,27,0,0 // movaps 0x1bb1(%edi),%xmm6 + .byte 15,40,183,181,27,0,0 // movaps 0x1bb5(%edi),%xmm6 .byte 15,41,116,36,64 // movaps %xmm6,0x40(%esp) .byte 139,125,20 // mov 0x14(%ebp),%edi .byte 137,124,36,12 // mov %edi,0xc(%esp) @@ -68403,15 +68375,15 @@ _sk_store_565_sse2_lowp: .byte 86 // push %esi .byte 131,236,92 // sub $0x5c,%esp .byte 102,15,111,226 // movdqa %xmm2,%xmm4 - .byte 232,0,0,0,0 // call b926 <_sk_store_565_sse2_lowp+0x12> + .byte 232,0,0,0,0 // call b902 <_sk_store_565_sse2_lowp+0x12> .byte 95 // pop %edi .byte 15,40,109,72 // movaps 0x48(%ebp),%xmm5 .byte 102,15,111,208 // movdqa %xmm0,%xmm2 .byte 102,15,113,242,8 // psllw $0x8,%xmm2 - .byte 102,15,219,151,250,26,0,0 // pand 0x1afa(%edi),%xmm2 + .byte 102,15,219,151,254,26,0,0 // pand 0x1afe(%edi),%xmm2 .byte 102,15,111,241 // movdqa %xmm1,%xmm6 .byte 102,15,113,246,3 // psllw $0x3,%xmm6 - .byte 102,15,219,183,10,27,0,0 // pand 0x1b0a(%edi),%xmm6 + .byte 102,15,219,183,14,27,0,0 // pand 0x1b0e(%edi),%xmm6 .byte 102,15,235,242 // por %xmm2,%xmm6 .byte 102,15,111,212 // movdqa %xmm4,%xmm2 .byte 102,15,113,210,3 // psrlw $0x3,%xmm2 @@ -68430,19 +68402,19 @@ _sk_store_565_sse2_lowp: .byte 128,249,6 // cmp $0x6,%cl .byte 139,117,16 // mov 0x10(%ebp),%esi .byte 15,40,125,24 // movaps 0x18(%ebp),%xmm7 - .byte 119,22 // ja b99e <_sk_store_565_sse2_lowp+0x8a> + .byte 119,22 // ja b97a <_sk_store_565_sse2_lowp+0x8a> .byte 15,182,201 // movzbl %cl,%ecx .byte 3,188,143,242,0,0,0 // add 0xf2(%edi,%ecx,4),%edi .byte 255,231 // jmp *%edi .byte 102,15,126,209 // movd %xmm2,%ecx .byte 102,137,12,115 // mov %cx,(%ebx,%esi,2) - .byte 235,59 // jmp b9d9 <_sk_store_565_sse2_lowp+0xc5> + .byte 235,59 // jmp b9b5 <_sk_store_565_sse2_lowp+0xc5> .byte 243,15,127,20,115 // movdqu %xmm2,(%ebx,%esi,2) - .byte 235,52 // jmp b9d9 <_sk_store_565_sse2_lowp+0xc5> + .byte 235,52 // jmp b9b5 <_sk_store_565_sse2_lowp+0xc5> .byte 102,15,197,202,2 // pextrw $0x2,%xmm2,%ecx .byte 102,137,76,115,4 // mov %cx,0x4(%ebx,%esi,2) .byte 102,15,126,20,115 // movd %xmm2,(%ebx,%esi,2) - .byte 235,35 // jmp b9d9 <_sk_store_565_sse2_lowp+0xc5> + .byte 235,35 // jmp b9b5 <_sk_store_565_sse2_lowp+0xc5> .byte 102,15,197,202,6 // pextrw $0x6,%xmm2,%ecx .byte 102,137,76,115,12 // mov %cx,0xc(%ebx,%esi,2) .byte 102,15,197,202,5 // pextrw $0x5,%xmm2,%ecx @@ -68504,10 +68476,10 @@ _sk_load_a8_sse2_lowp: .byte 128,225,7 // and $0x7,%cl .byte 254,201 // dec %cl .byte 128,249,6 // cmp $0x6,%cl - .byte 232,0,0,0,0 // call ba6e <_sk_load_a8_sse2_lowp+0x3a> + .byte 232,0,0,0,0 // call ba4a <_sk_load_a8_sse2_lowp+0x3a> .byte 95 // pop %edi .byte 139,117,16 // mov 0x10(%ebp),%esi - .byte 119,28 // ja ba90 <_sk_load_a8_sse2_lowp+0x5c> + .byte 119,28 // ja ba6c <_sk_load_a8_sse2_lowp+0x5c> .byte 102,15,239,219 // pxor %xmm3,%xmm3 .byte 15,182,201 // movzbl %cl,%ecx .byte 139,140,143,198,0,0,0 // mov 0xc6(%edi,%ecx,4),%ecx @@ -68515,10 +68487,10 @@ _sk_load_a8_sse2_lowp: .byte 255,225 // jmp *%ecx .byte 15,182,12,51 // movzbl (%ebx,%esi,1),%ecx .byte 102,15,110,217 // movd %ecx,%xmm3 - .byte 235,90 // jmp baea <_sk_load_a8_sse2_lowp+0xb6> + .byte 235,90 // jmp bac6 <_sk_load_a8_sse2_lowp+0xb6> .byte 243,15,126,28,51 // movq (%ebx,%esi,1),%xmm3 .byte 102,15,96,216 // punpcklbw %xmm0,%xmm3 - .byte 235,79 // jmp baea <_sk_load_a8_sse2_lowp+0xb6> + .byte 235,79 // jmp bac6 <_sk_load_a8_sse2_lowp+0xb6> .byte 15,182,76,51,2 // movzbl 0x2(%ebx,%esi,1),%ecx .byte 102,15,239,219 // pxor %xmm3,%xmm3 .byte 102,15,196,217,2 // pinsrw $0x2,%ecx,%xmm3 @@ -68526,7 +68498,7 @@ _sk_load_a8_sse2_lowp: .byte 102,15,110,233 // movd %ecx,%xmm5 .byte 102,15,96,232 // punpcklbw %xmm0,%xmm5 .byte 243,15,16,221 // movss %xmm5,%xmm3 - .byte 235,47 // jmp baea <_sk_load_a8_sse2_lowp+0xb6> + .byte 235,47 // jmp bac6 <_sk_load_a8_sse2_lowp+0xb6> .byte 15,182,76,51,6 // movzbl 0x6(%ebx,%esi,1),%ecx .byte 102,15,239,219 // pxor %xmm3,%xmm3 .byte 102,15,196,217,6 // pinsrw $0x6,%ecx,%xmm3 @@ -68537,7 +68509,7 @@ _sk_load_a8_sse2_lowp: .byte 102,15,110,44,51 // movd (%ebx,%esi,1),%xmm5 .byte 102,15,96,232 // punpcklbw %xmm0,%xmm5 .byte 242,15,16,221 // movsd %xmm5,%xmm3 - .byte 102,15,219,159,66,25,0,0 // pand 0x1942(%edi),%xmm3 + .byte 102,15,219,159,70,25,0,0 // pand 0x1946(%edi),%xmm3 .byte 141,72,8 // lea 0x8(%eax),%ecx .byte 15,41,100,36,64 // movaps %xmm4,0x40(%esp) .byte 15,41,84,36,48 // movaps %xmm2,0x30(%esp) @@ -68592,10 +68564,10 @@ _sk_load_a8_dst_sse2_lowp: .byte 128,225,7 // and $0x7,%cl .byte 254,201 // dec %cl .byte 128,249,6 // cmp $0x6,%cl - .byte 232,0,0,0,0 // call bb79 <_sk_load_a8_dst_sse2_lowp+0x29> + .byte 232,0,0,0,0 // call bb55 <_sk_load_a8_dst_sse2_lowp+0x29> .byte 95 // pop %edi .byte 139,117,16 // mov 0x10(%ebp),%esi - .byte 119,28 // ja bb9b <_sk_load_a8_dst_sse2_lowp+0x4b> + .byte 119,28 // ja bb77 <_sk_load_a8_dst_sse2_lowp+0x4b> .byte 102,15,239,228 // pxor %xmm4,%xmm4 .byte 15,182,201 // movzbl %cl,%ecx .byte 139,140,143,195,0,0,0 // mov 0xc3(%edi,%ecx,4),%ecx @@ -68603,10 +68575,10 @@ _sk_load_a8_dst_sse2_lowp: .byte 255,225 // jmp *%ecx .byte 15,182,12,51 // movzbl (%ebx,%esi,1),%ecx .byte 102,15,110,225 // movd %ecx,%xmm4 - .byte 235,90 // jmp bbf5 <_sk_load_a8_dst_sse2_lowp+0xa5> + .byte 235,90 // jmp bbd1 <_sk_load_a8_dst_sse2_lowp+0xa5> .byte 243,15,126,36,51 // movq (%ebx,%esi,1),%xmm4 .byte 102,15,96,224 // punpcklbw %xmm0,%xmm4 - .byte 235,79 // jmp bbf5 <_sk_load_a8_dst_sse2_lowp+0xa5> + .byte 235,79 // jmp bbd1 <_sk_load_a8_dst_sse2_lowp+0xa5> .byte 15,182,76,51,2 // movzbl 0x2(%ebx,%esi,1),%ecx .byte 102,15,239,228 // pxor %xmm4,%xmm4 .byte 102,15,196,225,2 // pinsrw $0x2,%ecx,%xmm4 @@ -68614,7 +68586,7 @@ _sk_load_a8_dst_sse2_lowp: .byte 102,15,110,233 // movd %ecx,%xmm5 .byte 102,15,96,232 // punpcklbw %xmm0,%xmm5 .byte 243,15,16,229 // movss %xmm5,%xmm4 - .byte 235,47 // jmp bbf5 <_sk_load_a8_dst_sse2_lowp+0xa5> + .byte 235,47 // jmp bbd1 <_sk_load_a8_dst_sse2_lowp+0xa5> .byte 15,182,76,51,6 // movzbl 0x6(%ebx,%esi,1),%ecx .byte 102,15,239,228 // pxor %xmm4,%xmm4 .byte 102,15,196,225,6 // pinsrw $0x6,%ecx,%xmm4 @@ -68625,7 +68597,7 @@ _sk_load_a8_dst_sse2_lowp: .byte 102,15,110,44,51 // movd (%ebx,%esi,1),%xmm5 .byte 102,15,96,232 // punpcklbw %xmm0,%xmm5 .byte 242,15,16,229 // movsd %xmm5,%xmm4 - .byte 102,15,219,167,55,24,0,0 // pand 0x1837(%edi),%xmm4 + .byte 102,15,219,167,59,24,0,0 // pand 0x183b(%edi),%xmm4 .byte 141,72,8 // lea 0x8(%eax),%ecx .byte 102,15,127,100,36,64 // movdqa %xmm4,0x40(%esp) .byte 102,15,239,228 // pxor %xmm4,%xmm4 @@ -68682,32 +68654,32 @@ _sk_store_a8_sse2_lowp: .byte 128,225,7 // and $0x7,%cl .byte 254,201 // dec %cl .byte 128,249,6 // cmp $0x6,%cl - .byte 232,0,0,0,0 // call bc91 <_sk_store_a8_sse2_lowp+0x39> + .byte 232,0,0,0,0 // call bc6d <_sk_store_a8_sse2_lowp+0x39> .byte 91 // pop %ebx .byte 139,117,16 // mov 0x10(%ebp),%esi - .byte 119,26 // ja bcb1 <_sk_store_a8_sse2_lowp+0x59> + .byte 119,26 // ja bc8d <_sk_store_a8_sse2_lowp+0x59> .byte 15,182,201 // movzbl %cl,%ecx .byte 139,140,139,223,0,0,0 // mov 0xdf(%ebx,%ecx,4),%ecx .byte 1,217 // add %ebx,%ecx .byte 255,225 // jmp *%ecx .byte 102,15,126,217 // movd %xmm3,%ecx .byte 136,12,55 // mov %cl,(%edi,%esi,1) - .byte 233,136,0,0,0 // jmp bd39 <_sk_store_a8_sse2_lowp+0xe1> - .byte 102,15,111,163,31,23,0,0 // movdqa 0x171f(%ebx),%xmm4 + .byte 233,136,0,0,0 // jmp bd15 <_sk_store_a8_sse2_lowp+0xe1> + .byte 102,15,111,163,35,23,0,0 // movdqa 0x1723(%ebx),%xmm4 .byte 102,15,219,227 // pand %xmm3,%xmm4 .byte 102,15,103,228 // packuswb %xmm4,%xmm4 .byte 102,15,214,36,55 // movq %xmm4,(%edi,%esi,1) .byte 15,40,101,24 // movaps 0x18(%ebp),%xmm4 - .byte 235,109 // jmp bd39 <_sk_store_a8_sse2_lowp+0xe1> + .byte 235,109 // jmp bd15 <_sk_store_a8_sse2_lowp+0xe1> .byte 102,15,197,203,2 // pextrw $0x2,%xmm3,%ecx .byte 136,76,55,2 // mov %cl,0x2(%edi,%esi,1) - .byte 102,15,111,163,31,23,0,0 // movdqa 0x171f(%ebx),%xmm4 + .byte 102,15,111,163,35,23,0,0 // movdqa 0x1723(%ebx),%xmm4 .byte 102,15,219,227 // pand %xmm3,%xmm4 .byte 102,15,103,228 // packuswb %xmm4,%xmm4 .byte 102,15,126,225 // movd %xmm4,%ecx .byte 15,40,101,24 // movaps 0x18(%ebp),%xmm4 .byte 102,137,12,55 // mov %cx,(%edi,%esi,1) - .byte 235,70 // jmp bd39 <_sk_store_a8_sse2_lowp+0xe1> + .byte 235,70 // jmp bd15 <_sk_store_a8_sse2_lowp+0xe1> .byte 102,15,197,203,6 // pextrw $0x6,%xmm3,%ecx .byte 136,76,55,6 // mov %cl,0x6(%edi,%esi,1) .byte 102,15,197,203,5 // pextrw $0x5,%xmm3,%ecx @@ -68717,7 +68689,7 @@ _sk_store_a8_sse2_lowp: .byte 15,40,254 // movaps %xmm6,%xmm7 .byte 15,40,245 // movaps %xmm5,%xmm6 .byte 15,40,236 // movaps %xmm4,%xmm5 - .byte 102,15,111,163,31,23,0,0 // movdqa 0x171f(%ebx),%xmm4 + .byte 102,15,111,163,35,23,0,0 // movdqa 0x1723(%ebx),%xmm4 .byte 102,15,219,227 // pand %xmm3,%xmm4 .byte 102,15,103,228 // packuswb %xmm4,%xmm4 .byte 102,15,126,36,55 // movd %xmm4,(%edi,%esi,1) @@ -68751,7 +68723,7 @@ _sk_store_a8_sse2_lowp: .byte 0,0 // add %al,(%eax) .byte 0,125,0 // add %bh,0x0(%ebp) .byte 0,0 // add %al,(%eax) - .byte 116,0 // je bd82 <_sk_store_a8_sse2_lowp+0x12a> + .byte 116,0 // je bd5e <_sk_store_a8_sse2_lowp+0x12a> .byte 0,0 // add %al,(%eax) .byte 107,0,0 // imul $0x0,(%eax),%eax .byte 0,98,0 // add %ah,0x0(%edx) @@ -68781,10 +68753,10 @@ _sk_load_g8_sse2_lowp: .byte 128,225,7 // and $0x7,%cl .byte 254,201 // dec %cl .byte 128,249,6 // cmp $0x6,%cl - .byte 232,0,0,0,0 // call bdc5 <_sk_load_g8_sse2_lowp+0x39> + .byte 232,0,0,0,0 // call bda1 <_sk_load_g8_sse2_lowp+0x39> .byte 94 // pop %esi .byte 139,125,16 // mov 0x10(%ebp),%edi - .byte 119,28 // ja bde7 <_sk_load_g8_sse2_lowp+0x5b> + .byte 119,28 // ja bdc3 <_sk_load_g8_sse2_lowp+0x5b> .byte 102,15,239,192 // pxor %xmm0,%xmm0 .byte 15,182,201 // movzbl %cl,%ecx .byte 139,140,142,199,0,0,0 // mov 0xc7(%esi,%ecx,4),%ecx @@ -68792,10 +68764,10 @@ _sk_load_g8_sse2_lowp: .byte 255,225 // jmp *%ecx .byte 15,182,12,59 // movzbl (%ebx,%edi,1),%ecx .byte 102,15,110,193 // movd %ecx,%xmm0 - .byte 235,90 // jmp be41 <_sk_load_g8_sse2_lowp+0xb5> + .byte 235,90 // jmp be1d <_sk_load_g8_sse2_lowp+0xb5> .byte 243,15,126,4,59 // movq (%ebx,%edi,1),%xmm0 .byte 102,15,96,192 // punpcklbw %xmm0,%xmm0 - .byte 235,79 // jmp be41 <_sk_load_g8_sse2_lowp+0xb5> + .byte 235,79 // jmp be1d <_sk_load_g8_sse2_lowp+0xb5> .byte 15,182,76,59,2 // movzbl 0x2(%ebx,%edi,1),%ecx .byte 102,15,239,192 // pxor %xmm0,%xmm0 .byte 102,15,196,193,2 // pinsrw $0x2,%ecx,%xmm0 @@ -68803,7 +68775,7 @@ _sk_load_g8_sse2_lowp: .byte 102,15,110,233 // movd %ecx,%xmm5 .byte 102,15,96,232 // punpcklbw %xmm0,%xmm5 .byte 243,15,16,197 // movss %xmm5,%xmm0 - .byte 235,47 // jmp be41 <_sk_load_g8_sse2_lowp+0xb5> + .byte 235,47 // jmp be1d <_sk_load_g8_sse2_lowp+0xb5> .byte 15,182,76,59,6 // movzbl 0x6(%ebx,%edi,1),%ecx .byte 102,15,239,192 // pxor %xmm0,%xmm0 .byte 102,15,196,193,6 // pinsrw $0x6,%ecx,%xmm0 @@ -68814,7 +68786,7 @@ _sk_load_g8_sse2_lowp: .byte 102,15,110,44,59 // movd (%ebx,%edi,1),%xmm5 .byte 102,15,96,232 // punpcklbw %xmm0,%xmm5 .byte 242,15,16,197 // movsd %xmm5,%xmm0 - .byte 102,15,219,134,235,21,0,0 // pand 0x15eb(%esi),%xmm0 + .byte 102,15,219,134,239,21,0,0 // pand 0x15ef(%esi),%xmm0 .byte 141,72,8 // lea 0x8(%eax),%ecx .byte 15,41,100,36,64 // movaps %xmm4,0x40(%esp) .byte 15,41,92,36,48 // movaps %xmm3,0x30(%esp) @@ -68825,7 +68797,7 @@ _sk_load_g8_sse2_lowp: .byte 137,124,36,8 // mov %edi,0x8(%esp) .byte 137,76,36,4 // mov %ecx,0x4(%esp) .byte 137,20,36 // mov %edx,(%esp) - .byte 15,40,158,235,21,0,0 // movaps 0x15eb(%esi),%xmm3 + .byte 15,40,158,239,21,0,0 // movaps 0x15ef(%esi),%xmm3 .byte 102,15,111,200 // movdqa %xmm0,%xmm1 .byte 102,15,111,208 // movdqa %xmm0,%xmm2 .byte 255,80,4 // call *0x4(%eax) @@ -68868,10 +68840,10 @@ _sk_load_g8_dst_sse2_lowp: .byte 128,225,7 // and $0x7,%cl .byte 254,201 // dec %cl .byte 128,249,6 // cmp $0x6,%cl - .byte 232,0,0,0,0 // call bed1 <_sk_load_g8_dst_sse2_lowp+0x29> + .byte 232,0,0,0,0 // call bead <_sk_load_g8_dst_sse2_lowp+0x29> .byte 95 // pop %edi .byte 139,117,16 // mov 0x10(%ebp),%esi - .byte 119,28 // ja bef3 <_sk_load_g8_dst_sse2_lowp+0x4b> + .byte 119,28 // ja becf <_sk_load_g8_dst_sse2_lowp+0x4b> .byte 102,15,239,228 // pxor %xmm4,%xmm4 .byte 15,182,201 // movzbl %cl,%ecx .byte 139,140,143,195,0,0,0 // mov 0xc3(%edi,%ecx,4),%ecx @@ -68879,10 +68851,10 @@ _sk_load_g8_dst_sse2_lowp: .byte 255,225 // jmp *%ecx .byte 15,182,12,51 // movzbl (%ebx,%esi,1),%ecx .byte 102,15,110,225 // movd %ecx,%xmm4 - .byte 235,90 // jmp bf4d <_sk_load_g8_dst_sse2_lowp+0xa5> + .byte 235,90 // jmp bf29 <_sk_load_g8_dst_sse2_lowp+0xa5> .byte 243,15,126,36,51 // movq (%ebx,%esi,1),%xmm4 .byte 102,15,96,224 // punpcklbw %xmm0,%xmm4 - .byte 235,79 // jmp bf4d <_sk_load_g8_dst_sse2_lowp+0xa5> + .byte 235,79 // jmp bf29 <_sk_load_g8_dst_sse2_lowp+0xa5> .byte 15,182,76,51,2 // movzbl 0x2(%ebx,%esi,1),%ecx .byte 102,15,239,228 // pxor %xmm4,%xmm4 .byte 102,15,196,225,2 // pinsrw $0x2,%ecx,%xmm4 @@ -68890,7 +68862,7 @@ _sk_load_g8_dst_sse2_lowp: .byte 102,15,110,233 // movd %ecx,%xmm5 .byte 102,15,96,232 // punpcklbw %xmm0,%xmm5 .byte 243,15,16,229 // movss %xmm5,%xmm4 - .byte 235,47 // jmp bf4d <_sk_load_g8_dst_sse2_lowp+0xa5> + .byte 235,47 // jmp bf29 <_sk_load_g8_dst_sse2_lowp+0xa5> .byte 15,182,76,51,6 // movzbl 0x6(%ebx,%esi,1),%ecx .byte 102,15,239,228 // pxor %xmm4,%xmm4 .byte 102,15,196,225,6 // pinsrw $0x6,%ecx,%xmm4 @@ -68901,9 +68873,9 @@ _sk_load_g8_dst_sse2_lowp: .byte 102,15,110,44,51 // movd (%ebx,%esi,1),%xmm5 .byte 102,15,96,232 // punpcklbw %xmm0,%xmm5 .byte 242,15,16,229 // movsd %xmm5,%xmm4 - .byte 102,15,219,167,223,20,0,0 // pand 0x14df(%edi),%xmm4 + .byte 102,15,219,167,227,20,0,0 // pand 0x14e3(%edi),%xmm4 .byte 141,72,8 // lea 0x8(%eax),%ecx - .byte 15,40,175,223,20,0,0 // movaps 0x14df(%edi),%xmm5 + .byte 15,40,175,227,20,0,0 // movaps 0x14e3(%edi),%xmm5 .byte 15,41,108,36,64 // movaps %xmm5,0x40(%esp) .byte 102,15,127,100,36,48 // movdqa %xmm4,0x30(%esp) .byte 102,15,127,100,36,32 // movdqa %xmm4,0x20(%esp) @@ -68944,7 +68916,7 @@ _sk_luminance_to_alpha_sse2_lowp: .byte 86 // push %esi .byte 131,236,80 // sub $0x50,%esp .byte 102,15,111,218 // movdqa %xmm2,%xmm3 - .byte 232,0,0,0,0 // call bfc1 <_sk_luminance_to_alpha_sse2_lowp+0x11> + .byte 232,0,0,0,0 // call bf9d <_sk_luminance_to_alpha_sse2_lowp+0x11> .byte 88 // pop %eax .byte 139,77,8 // mov 0x8(%ebp),%ecx .byte 139,85,16 // mov 0x10(%ebp),%edx @@ -68954,10 +68926,10 @@ _sk_luminance_to_alpha_sse2_lowp: .byte 15,40,109,56 // movaps 0x38(%ebp),%xmm5 .byte 15,40,117,72 // movaps 0x48(%ebp),%xmm6 .byte 139,125,12 // mov 0xc(%ebp),%edi - .byte 102,15,213,128,127,20,0,0 // pmullw 0x147f(%eax),%xmm0 - .byte 102,15,213,136,143,20,0,0 // pmullw 0x148f(%eax),%xmm1 + .byte 102,15,213,128,131,20,0,0 // pmullw 0x1483(%eax),%xmm0 + .byte 102,15,213,136,147,20,0,0 // pmullw 0x1493(%eax),%xmm1 .byte 102,15,253,200 // paddw %xmm0,%xmm1 - .byte 102,15,213,152,159,20,0,0 // pmullw 0x149f(%eax),%xmm3 + .byte 102,15,213,152,163,20,0,0 // pmullw 0x14a3(%eax),%xmm3 .byte 102,15,253,217 // paddw %xmm1,%xmm3 .byte 102,15,113,211,8 // psrlw $0x8,%xmm3 .byte 141,71,4 // lea 0x4(%edi),%eax @@ -68988,15 +68960,15 @@ _sk_scale_1_float_sse2_lowp: .byte 87 // push %edi .byte 86 // push %esi .byte 131,236,80 // sub $0x50,%esp - .byte 232,0,0,0,0 // call c04a <_sk_scale_1_float_sse2_lowp+0xd> + .byte 232,0,0,0,0 // call c026 <_sk_scale_1_float_sse2_lowp+0xd> .byte 94 // pop %esi .byte 139,69,8 // mov 0x8(%ebp),%eax .byte 139,85,16 // mov 0x10(%ebp),%edx .byte 139,77,12 // mov 0xc(%ebp),%ecx .byte 139,57 // mov (%ecx),%edi .byte 243,15,16,39 // movss (%edi),%xmm4 - .byte 243,15,89,166,42,20,0,0 // mulss 0x142a(%esi),%xmm4 - .byte 243,15,88,166,38,20,0,0 // addss 0x1426(%esi),%xmm4 + .byte 243,15,89,166,46,20,0,0 // mulss 0x142e(%esi),%xmm4 + .byte 243,15,88,166,42,20,0,0 // addss 0x142a(%esi),%xmm4 .byte 243,15,44,252 // cvttss2si %xmm4,%edi .byte 102,15,110,239 // movd %edi,%xmm5 .byte 139,125,20 // mov 0x14(%ebp),%edi @@ -69009,7 +68981,7 @@ _sk_scale_1_float_sse2_lowp: .byte 102,15,213,205 // pmullw %xmm5,%xmm1 .byte 102,15,213,213 // pmullw %xmm5,%xmm2 .byte 102,15,213,221 // pmullw %xmm5,%xmm3 - .byte 102,15,111,174,102,19,0,0 // movdqa 0x1366(%esi),%xmm5 + .byte 102,15,111,174,106,19,0,0 // movdqa 0x136a(%esi),%xmm5 .byte 102,15,253,197 // paddw %xmm5,%xmm0 .byte 102,15,253,205 // paddw %xmm5,%xmm1 .byte 102,15,253,213 // paddw %xmm5,%xmm2 @@ -69048,19 +69020,19 @@ _sk_lerp_1_float_sse2_lowp: .byte 102,15,111,218 // movdqa %xmm2,%xmm3 .byte 102,15,111,209 // movdqa %xmm1,%xmm2 .byte 102,15,111,200 // movdqa %xmm0,%xmm1 - .byte 232,0,0,0,0 // call c118 <_sk_lerp_1_float_sse2_lowp+0x1d> + .byte 232,0,0,0,0 // call c0f4 <_sk_lerp_1_float_sse2_lowp+0x1d> .byte 89 // pop %ecx .byte 102,15,111,109,24 // movdqa 0x18(%ebp),%xmm5 .byte 139,69,12 // mov 0xc(%ebp),%eax .byte 139,16 // mov (%eax),%edx .byte 243,15,16,50 // movss (%edx),%xmm6 - .byte 243,15,89,177,92,19,0,0 // mulss 0x135c(%ecx),%xmm6 - .byte 243,15,88,177,88,19,0,0 // addss 0x1358(%ecx),%xmm6 + .byte 243,15,89,177,96,19,0,0 // mulss 0x1360(%ecx),%xmm6 + .byte 243,15,88,177,92,19,0,0 // addss 0x135c(%ecx),%xmm6 .byte 243,15,44,214 // cvttss2si %xmm6,%edx .byte 102,15,110,242 // movd %edx,%xmm6 .byte 242,15,112,246,0 // pshuflw $0x0,%xmm6,%xmm6 .byte 102,15,112,246,80 // pshufd $0x50,%xmm6,%xmm6 - .byte 102,15,111,129,152,18,0,0 // movdqa 0x1298(%ecx),%xmm0 + .byte 102,15,111,129,156,18,0,0 // movdqa 0x129c(%ecx),%xmm0 .byte 102,15,213,206 // pmullw %xmm6,%xmm1 .byte 102,15,253,200 // paddw %xmm0,%xmm1 .byte 102,15,213,214 // pmullw %xmm6,%xmm2 @@ -69133,10 +69105,10 @@ _sk_scale_u8_sse2_lowp: .byte 128,225,7 // and $0x7,%cl .byte 254,201 // dec %cl .byte 128,249,6 // cmp $0x6,%cl - .byte 232,0,0,0,0 // call c241 <_sk_scale_u8_sse2_lowp+0x31> + .byte 232,0,0,0,0 // call c21d <_sk_scale_u8_sse2_lowp+0x31> .byte 95 // pop %edi .byte 139,117,16 // mov 0x10(%ebp),%esi - .byte 119,28 // ja c263 <_sk_scale_u8_sse2_lowp+0x53> + .byte 119,28 // ja c23f <_sk_scale_u8_sse2_lowp+0x53> .byte 102,15,239,228 // pxor %xmm4,%xmm4 .byte 15,182,201 // movzbl %cl,%ecx .byte 139,140,143,3,1,0,0 // mov 0x103(%edi,%ecx,4),%ecx @@ -69144,10 +69116,10 @@ _sk_scale_u8_sse2_lowp: .byte 255,225 // jmp *%ecx .byte 15,182,12,51 // movzbl (%ebx,%esi,1),%ecx .byte 102,15,110,225 // movd %ecx,%xmm4 - .byte 235,90 // jmp c2bd <_sk_scale_u8_sse2_lowp+0xad> + .byte 235,90 // jmp c299 <_sk_scale_u8_sse2_lowp+0xad> .byte 243,15,126,36,51 // movq (%ebx,%esi,1),%xmm4 .byte 102,15,96,224 // punpcklbw %xmm0,%xmm4 - .byte 235,79 // jmp c2bd <_sk_scale_u8_sse2_lowp+0xad> + .byte 235,79 // jmp c299 <_sk_scale_u8_sse2_lowp+0xad> .byte 15,182,76,51,2 // movzbl 0x2(%ebx,%esi,1),%ecx .byte 102,15,239,228 // pxor %xmm4,%xmm4 .byte 102,15,196,225,2 // pinsrw $0x2,%ecx,%xmm4 @@ -69155,7 +69127,7 @@ _sk_scale_u8_sse2_lowp: .byte 102,15,110,233 // movd %ecx,%xmm5 .byte 102,15,96,232 // punpcklbw %xmm0,%xmm5 .byte 243,15,16,229 // movss %xmm5,%xmm4 - .byte 235,47 // jmp c2bd <_sk_scale_u8_sse2_lowp+0xad> + .byte 235,47 // jmp c299 <_sk_scale_u8_sse2_lowp+0xad> .byte 15,182,76,51,6 // movzbl 0x6(%ebx,%esi,1),%ecx .byte 102,15,239,228 // pxor %xmm4,%xmm4 .byte 102,15,196,225,6 // pinsrw $0x6,%ecx,%xmm4 @@ -69166,9 +69138,9 @@ _sk_scale_u8_sse2_lowp: .byte 102,15,110,44,51 // movd (%ebx,%esi,1),%xmm5 .byte 102,15,96,232 // punpcklbw %xmm0,%xmm5 .byte 242,15,16,229 // movsd %xmm5,%xmm4 - .byte 102,15,219,167,111,17,0,0 // pand 0x116f(%edi),%xmm4 + .byte 102,15,219,167,115,17,0,0 // pand 0x1173(%edi),%xmm4 .byte 102,15,213,196 // pmullw %xmm4,%xmm0 - .byte 102,15,111,175,111,17,0,0 // movdqa 0x116f(%edi),%xmm5 + .byte 102,15,111,175,115,17,0,0 // movdqa 0x1173(%edi),%xmm5 .byte 102,15,253,197 // paddw %xmm5,%xmm0 .byte 102,15,113,208,8 // psrlw $0x8,%xmm0 .byte 102,15,213,204 // pmullw %xmm4,%xmm1 @@ -69235,10 +69207,10 @@ _sk_lerp_u8_sse2_lowp: .byte 128,225,7 // and $0x7,%cl .byte 254,201 // dec %cl .byte 128,249,6 // cmp $0x6,%cl - .byte 232,0,0,0,0 // call c38e <_sk_lerp_u8_sse2_lowp+0x2e> + .byte 232,0,0,0,0 // call c36a <_sk_lerp_u8_sse2_lowp+0x2e> .byte 95 // pop %edi .byte 139,117,16 // mov 0x10(%ebp),%esi - .byte 119,28 // ja c3b0 <_sk_lerp_u8_sse2_lowp+0x50> + .byte 119,28 // ja c38c <_sk_lerp_u8_sse2_lowp+0x50> .byte 102,15,239,219 // pxor %xmm3,%xmm3 .byte 15,182,201 // movzbl %cl,%ecx .byte 139,140,143,74,1,0,0 // mov 0x14a(%edi,%ecx,4),%ecx @@ -69246,10 +69218,10 @@ _sk_lerp_u8_sse2_lowp: .byte 255,225 // jmp *%ecx .byte 15,182,12,51 // movzbl (%ebx,%esi,1),%ecx .byte 102,15,110,217 // movd %ecx,%xmm3 - .byte 235,90 // jmp c40a <_sk_lerp_u8_sse2_lowp+0xaa> + .byte 235,90 // jmp c3e6 <_sk_lerp_u8_sse2_lowp+0xaa> .byte 243,15,126,28,51 // movq (%ebx,%esi,1),%xmm3 .byte 102,15,96,216 // punpcklbw %xmm0,%xmm3 - .byte 235,79 // jmp c40a <_sk_lerp_u8_sse2_lowp+0xaa> + .byte 235,79 // jmp c3e6 <_sk_lerp_u8_sse2_lowp+0xaa> .byte 15,182,76,51,2 // movzbl 0x2(%ebx,%esi,1),%ecx .byte 102,15,239,219 // pxor %xmm3,%xmm3 .byte 102,15,196,217,2 // pinsrw $0x2,%ecx,%xmm3 @@ -69257,7 +69229,7 @@ _sk_lerp_u8_sse2_lowp: .byte 102,15,110,225 // movd %ecx,%xmm4 .byte 102,15,96,224 // punpcklbw %xmm0,%xmm4 .byte 243,15,16,220 // movss %xmm4,%xmm3 - .byte 235,47 // jmp c40a <_sk_lerp_u8_sse2_lowp+0xaa> + .byte 235,47 // jmp c3e6 <_sk_lerp_u8_sse2_lowp+0xaa> .byte 15,182,76,51,6 // movzbl 0x6(%ebx,%esi,1),%ecx .byte 102,15,239,219 // pxor %xmm3,%xmm3 .byte 102,15,196,217,6 // pinsrw $0x6,%ecx,%xmm3 @@ -69268,8 +69240,8 @@ _sk_lerp_u8_sse2_lowp: .byte 102,15,110,36,51 // movd (%ebx,%esi,1),%xmm4 .byte 102,15,96,224 // punpcklbw %xmm0,%xmm4 .byte 242,15,16,220 // movsd %xmm4,%xmm3 - .byte 102,15,219,159,34,16,0,0 // pand 0x1022(%edi),%xmm3 - .byte 102,15,111,183,34,16,0,0 // movdqa 0x1022(%edi),%xmm6 + .byte 102,15,219,159,38,16,0,0 // pand 0x1026(%edi),%xmm3 + .byte 102,15,111,183,38,16,0,0 // movdqa 0x1026(%edi),%xmm6 .byte 102,15,111,227 // movdqa %xmm3,%xmm4 .byte 102,15,239,230 // pxor %xmm6,%xmm4 .byte 102,15,111,252 // movdqa %xmm4,%xmm7 @@ -69358,10 +69330,10 @@ _sk_scale_565_sse2_lowp: .byte 128,225,7 // and $0x7,%cl .byte 254,201 // dec %cl .byte 128,249,6 // cmp $0x6,%cl - .byte 232,0,0,0,0 // call c537 <_sk_scale_565_sse2_lowp+0x43> + .byte 232,0,0,0,0 // call c513 <_sk_scale_565_sse2_lowp+0x43> .byte 95 // pop %edi .byte 139,117,16 // mov 0x10(%ebp),%esi - .byte 119,28 // ja c559 <_sk_scale_565_sse2_lowp+0x65> + .byte 119,28 // ja c535 <_sk_scale_565_sse2_lowp+0x65> .byte 102,15,239,219 // pxor %xmm3,%xmm3 .byte 15,182,201 // movzbl %cl,%ecx .byte 139,140,143,249,1,0,0 // mov 0x1f9(%edi,%ecx,4),%ecx @@ -69369,14 +69341,14 @@ _sk_scale_565_sse2_lowp: .byte 255,225 // jmp *%ecx .byte 15,183,12,115 // movzwl (%ebx,%esi,2),%ecx .byte 102,15,110,217 // movd %ecx,%xmm3 - .byte 235,59 // jmp c594 <_sk_scale_565_sse2_lowp+0xa0> + .byte 235,59 // jmp c570 <_sk_scale_565_sse2_lowp+0xa0> .byte 243,15,111,28,115 // movdqu (%ebx,%esi,2),%xmm3 - .byte 235,52 // jmp c594 <_sk_scale_565_sse2_lowp+0xa0> + .byte 235,52 // jmp c570 <_sk_scale_565_sse2_lowp+0xa0> .byte 102,15,239,219 // pxor %xmm3,%xmm3 .byte 102,15,196,92,115,4,2 // pinsrw $0x2,0x4(%ebx,%esi,2),%xmm3 .byte 243,15,16,12,115 // movss (%ebx,%esi,2),%xmm1 .byte 243,15,16,217 // movss %xmm1,%xmm3 - .byte 235,30 // jmp c594 <_sk_scale_565_sse2_lowp+0xa0> + .byte 235,30 // jmp c570 <_sk_scale_565_sse2_lowp+0xa0> .byte 102,15,239,219 // pxor %xmm3,%xmm3 .byte 102,15,196,92,115,12,6 // pinsrw $0x6,0xc(%ebx,%esi,2),%xmm3 .byte 102,15,196,92,115,10,5 // pinsrw $0x5,0xa(%ebx,%esi,2),%xmm3 @@ -69384,11 +69356,11 @@ _sk_scale_565_sse2_lowp: .byte 102,15,18,28,115 // movlpd (%ebx,%esi,2),%xmm3 .byte 102,15,111,203 // movdqa %xmm3,%xmm1 .byte 102,15,113,209,8 // psrlw $0x8,%xmm1 - .byte 102,15,219,143,185,14,0,0 // pand 0xeb9(%edi),%xmm1 + .byte 102,15,219,143,189,14,0,0 // pand 0xebd(%edi),%xmm1 .byte 102,15,111,211 // movdqa %xmm3,%xmm2 .byte 102,15,113,210,5 // psrlw $0x5,%xmm2 - .byte 102,15,219,151,201,14,0,0 // pand 0xec9(%edi),%xmm2 - .byte 102,15,111,135,217,14,0,0 // movdqa 0xed9(%edi),%xmm0 + .byte 102,15,219,151,205,14,0,0 // pand 0xecd(%edi),%xmm2 + .byte 102,15,111,135,221,14,0,0 // movdqa 0xedd(%edi),%xmm0 .byte 102,15,219,195 // pand %xmm3,%xmm0 .byte 102,15,113,211,13 // psrlw $0xd,%xmm3 .byte 102,15,235,217 // por %xmm1,%xmm3 @@ -69401,7 +69373,7 @@ _sk_scale_565_sse2_lowp: .byte 102,15,113,208,2 // psrlw $0x2,%xmm0 .byte 102,15,235,193 // por %xmm1,%xmm0 .byte 102,15,127,69,200 // movdqa %xmm0,-0x38(%ebp) - .byte 102,15,111,167,153,14,0,0 // movdqa 0xe99(%edi),%xmm4 + .byte 102,15,111,167,157,14,0,0 // movdqa 0xe9d(%edi),%xmm4 .byte 15,41,117,184 // movaps %xmm6,-0x48(%ebp) .byte 102,15,239,244 // pxor %xmm4,%xmm6 .byte 102,15,239,252 // pxor %xmm4,%xmm7 @@ -69444,7 +69416,7 @@ _sk_scale_565_sse2_lowp: .byte 102,15,111,229 // movdqa %xmm5,%xmm4 .byte 102,15,213,101,136 // pmullw -0x78(%ebp),%xmm4 .byte 102,15,213,125,184 // pmullw -0x48(%ebp),%xmm7 - .byte 102,15,111,135,121,14,0,0 // movdqa 0xe79(%edi),%xmm0 + .byte 102,15,111,135,125,14,0,0 // movdqa 0xe7d(%edi),%xmm0 .byte 102,15,253,216 // paddw %xmm0,%xmm3 .byte 102,15,253,208 // paddw %xmm0,%xmm2 .byte 102,15,253,224 // paddw %xmm0,%xmm4 @@ -69521,10 +69493,10 @@ _sk_lerp_565_sse2_lowp: .byte 128,225,7 // and $0x7,%cl .byte 254,201 // dec %cl .byte 128,249,6 // cmp $0x6,%cl - .byte 232,0,0,0,0 // call c78f <_sk_lerp_565_sse2_lowp+0x43> + .byte 232,0,0,0,0 // call c76b <_sk_lerp_565_sse2_lowp+0x43> .byte 95 // pop %edi .byte 139,117,16 // mov 0x10(%ebp),%esi - .byte 119,28 // ja c7b1 <_sk_lerp_565_sse2_lowp+0x65> + .byte 119,28 // ja c78d <_sk_lerp_565_sse2_lowp+0x65> .byte 102,15,239,219 // pxor %xmm3,%xmm3 .byte 15,182,201 // movzbl %cl,%ecx .byte 139,140,143,73,2,0,0 // mov 0x249(%edi,%ecx,4),%ecx @@ -69532,14 +69504,14 @@ _sk_lerp_565_sse2_lowp: .byte 255,225 // jmp *%ecx .byte 15,183,12,115 // movzwl (%ebx,%esi,2),%ecx .byte 102,15,110,217 // movd %ecx,%xmm3 - .byte 235,59 // jmp c7ec <_sk_lerp_565_sse2_lowp+0xa0> + .byte 235,59 // jmp c7c8 <_sk_lerp_565_sse2_lowp+0xa0> .byte 243,15,111,28,115 // movdqu (%ebx,%esi,2),%xmm3 - .byte 235,52 // jmp c7ec <_sk_lerp_565_sse2_lowp+0xa0> + .byte 235,52 // jmp c7c8 <_sk_lerp_565_sse2_lowp+0xa0> .byte 102,15,239,219 // pxor %xmm3,%xmm3 .byte 102,15,196,92,115,4,2 // pinsrw $0x2,0x4(%ebx,%esi,2),%xmm3 .byte 243,15,16,12,115 // movss (%ebx,%esi,2),%xmm1 .byte 243,15,16,217 // movss %xmm1,%xmm3 - .byte 235,30 // jmp c7ec <_sk_lerp_565_sse2_lowp+0xa0> + .byte 235,30 // jmp c7c8 <_sk_lerp_565_sse2_lowp+0xa0> .byte 102,15,239,219 // pxor %xmm3,%xmm3 .byte 102,15,196,92,115,12,6 // pinsrw $0x6,0xc(%ebx,%esi,2),%xmm3 .byte 102,15,196,92,115,10,5 // pinsrw $0x5,0xa(%ebx,%esi,2),%xmm3 @@ -69547,11 +69519,11 @@ _sk_lerp_565_sse2_lowp: .byte 102,15,18,28,115 // movlpd (%ebx,%esi,2),%xmm3 .byte 102,15,111,203 // movdqa %xmm3,%xmm1 .byte 102,15,113,209,8 // psrlw $0x8,%xmm1 - .byte 102,15,219,143,97,12,0,0 // pand 0xc61(%edi),%xmm1 + .byte 102,15,219,143,101,12,0,0 // pand 0xc65(%edi),%xmm1 .byte 102,15,111,211 // movdqa %xmm3,%xmm2 .byte 102,15,113,210,5 // psrlw $0x5,%xmm2 - .byte 102,15,219,151,113,12,0,0 // pand 0xc71(%edi),%xmm2 - .byte 102,15,111,175,129,12,0,0 // movdqa 0xc81(%edi),%xmm5 + .byte 102,15,219,151,117,12,0,0 // pand 0xc75(%edi),%xmm2 + .byte 102,15,111,175,133,12,0,0 // movdqa 0xc85(%edi),%xmm5 .byte 102,15,219,235 // pand %xmm3,%xmm5 .byte 102,15,113,211,13 // psrlw $0xd,%xmm3 .byte 102,15,235,217 // por %xmm1,%xmm3 @@ -69564,7 +69536,7 @@ _sk_lerp_565_sse2_lowp: .byte 102,15,113,213,2 // psrlw $0x2,%xmm5 .byte 102,15,235,233 // por %xmm1,%xmm5 .byte 102,15,127,109,216 // movdqa %xmm5,-0x28(%ebp) - .byte 102,15,111,167,65,12,0,0 // movdqa 0xc41(%edi),%xmm4 + .byte 102,15,111,167,69,12,0,0 // movdqa 0xc45(%edi),%xmm4 .byte 102,15,111,198 // movdqa %xmm6,%xmm0 .byte 102,15,111,200 // movdqa %xmm0,%xmm1 .byte 102,15,239,204 // pxor %xmm4,%xmm1 @@ -69605,7 +69577,7 @@ _sk_lerp_565_sse2_lowp: .byte 102,15,235,249 // por %xmm1,%xmm7 .byte 102,15,111,195 // movdqa %xmm3,%xmm0 .byte 102,15,213,93,168 // pmullw -0x58(%ebp),%xmm3 - .byte 102,15,111,143,33,12,0,0 // movdqa 0xc21(%edi),%xmm1 + .byte 102,15,111,143,37,12,0,0 // movdqa 0xc25(%edi),%xmm1 .byte 102,15,239,193 // pxor %xmm1,%xmm0 .byte 102,15,111,101,24 // movdqa 0x18(%ebp),%xmm4 .byte 102,15,213,196 // pmullw %xmm4,%xmm0 @@ -69701,11 +69673,11 @@ _sk_srcover_rgba_8888_sse2_lowp: .byte 128,227,7 // and $0x7,%bl .byte 254,203 // dec %bl .byte 128,251,6 // cmp $0x6,%bl - .byte 232,0,0,0,0 // call ca33 <_sk_srcover_rgba_8888_sse2_lowp+0x3f> + .byte 232,0,0,0,0 // call ca0f <_sk_srcover_rgba_8888_sse2_lowp+0x3f> .byte 89 // pop %ecx .byte 139,117,16 // mov 0x10(%ebp),%esi .byte 15,182,211 // movzbl %bl,%edx - .byte 119,29 // ja ca59 <_sk_srcover_rgba_8888_sse2_lowp+0x65> + .byte 119,29 // ja ca35 <_sk_srcover_rgba_8888_sse2_lowp+0x65> .byte 102,15,239,219 // pxor %xmm3,%xmm3 .byte 139,132,145,77,2,0,0 // mov 0x24d(%ecx,%edx,4),%eax .byte 1,200 // add %ecx,%eax @@ -69713,14 +69685,14 @@ _sk_srcover_rgba_8888_sse2_lowp: .byte 255,224 // jmp *%eax .byte 243,15,16,52,183 // movss (%edi,%esi,4),%xmm6 .byte 15,87,219 // xorps %xmm3,%xmm3 - .byte 235,73 // jmp caa2 <_sk_srcover_rgba_8888_sse2_lowp+0xae> + .byte 235,73 // jmp ca7e <_sk_srcover_rgba_8888_sse2_lowp+0xae> .byte 102,15,16,52,183 // movupd (%edi,%esi,4),%xmm6 .byte 15,16,92,183,16 // movups 0x10(%edi,%esi,4),%xmm3 - .byte 235,61 // jmp caa2 <_sk_srcover_rgba_8888_sse2_lowp+0xae> + .byte 235,61 // jmp ca7e <_sk_srcover_rgba_8888_sse2_lowp+0xae> .byte 102,15,110,68,183,8 // movd 0x8(%edi,%esi,4),%xmm0 .byte 102,15,112,240,69 // pshufd $0x45,%xmm0,%xmm6 .byte 102,15,18,52,183 // movlpd (%edi,%esi,4),%xmm6 - .byte 235,43 // jmp caa2 <_sk_srcover_rgba_8888_sse2_lowp+0xae> + .byte 235,43 // jmp ca7e <_sk_srcover_rgba_8888_sse2_lowp+0xae> .byte 102,15,110,68,183,24 // movd 0x18(%edi,%esi,4),%xmm0 .byte 102,15,112,216,69 // pshufd $0x45,%xmm0,%xmm3 .byte 243,15,16,68,183,20 // movss 0x14(%edi,%esi,4),%xmm0 @@ -69746,7 +69718,7 @@ _sk_srcover_rgba_8888_sse2_lowp: .byte 102,15,114,243,16 // pslld $0x10,%xmm3 .byte 102,15,114,227,16 // psrad $0x10,%xmm3 .byte 102,15,107,243 // packssdw %xmm3,%xmm6 - .byte 102,15,111,153,125,9,0,0 // movdqa 0x97d(%ecx),%xmm3 + .byte 102,15,111,153,129,9,0,0 // movdqa 0x981(%ecx),%xmm3 .byte 102,15,114,208,16 // psrld $0x10,%xmm0 .byte 102,15,114,210,16 // psrld $0x10,%xmm2 .byte 102,15,114,242,16 // pslld $0x10,%xmm2 @@ -69798,18 +69770,18 @@ _sk_srcover_rgba_8888_sse2_lowp: .byte 102,15,105,220 // punpckhwd %xmm4,%xmm3 .byte 102,15,235,222 // por %xmm6,%xmm3 .byte 128,251,6 // cmp $0x6,%bl - .byte 119,16 // ja cbe3 <_sk_srcover_rgba_8888_sse2_lowp+0x1ef> + .byte 119,16 // ja cbbf <_sk_srcover_rgba_8888_sse2_lowp+0x1ef> .byte 3,140,145,105,2,0,0 // add 0x269(%ecx,%edx,4),%ecx .byte 255,225 // jmp *%ecx .byte 102,15,126,4,183 // movd %xmm0,(%edi,%esi,4) - .byte 235,64 // jmp cc23 <_sk_srcover_rgba_8888_sse2_lowp+0x22f> + .byte 235,64 // jmp cbff <_sk_srcover_rgba_8888_sse2_lowp+0x22f> .byte 243,15,127,4,183 // movdqu %xmm0,(%edi,%esi,4) .byte 243,15,127,92,183,16 // movdqu %xmm3,0x10(%edi,%esi,4) - .byte 235,51 // jmp cc23 <_sk_srcover_rgba_8888_sse2_lowp+0x22f> + .byte 235,51 // jmp cbff <_sk_srcover_rgba_8888_sse2_lowp+0x22f> .byte 102,15,112,208,78 // pshufd $0x4e,%xmm0,%xmm2 .byte 102,15,126,84,183,8 // movd %xmm2,0x8(%edi,%esi,4) .byte 102,15,214,4,183 // movq %xmm0,(%edi,%esi,4) - .byte 235,33 // jmp cc23 <_sk_srcover_rgba_8888_sse2_lowp+0x22f> + .byte 235,33 // jmp cbff <_sk_srcover_rgba_8888_sse2_lowp+0x22f> .byte 102,15,112,211,78 // pshufd $0x4e,%xmm3,%xmm2 .byte 102,15,126,84,183,24 // movd %xmm2,0x18(%edi,%esi,4) .byte 102,15,112,211,229 // pshufd $0xe5,%xmm3,%xmm2 @@ -69938,11 +69910,11 @@ BALIGN16 .byte 0,128,191,0,0,128 // add %al,-0x7fffff41(%eax) .byte 191,0,0,224,64 // mov $0x40e00000,%edi .byte 0,0 // add %al,(%eax) - .byte 224,64 // loopne cda8 <.literal16+0xe8> + .byte 224,64 // loopne cd88 <.literal16+0xe8> .byte 0,0 // add %al,(%eax) - .byte 224,64 // loopne cdac <.literal16+0xec> + .byte 224,64 // loopne cd8c <.literal16+0xec> .byte 0,0 // add %al,(%eax) - .byte 224,64 // loopne cdb0 <.literal16+0xf0> + .byte 224,64 // loopne cd90 <.literal16+0xf0> .byte 154,153,153,62,154,153,153 // lcall $0x9999,$0x9a3e9999 .byte 62,154,153,153,62,154,153,153 // ds lcall $0x9999,$0x9a3e9999 .byte 62,61,10,23,63,61 // ds cmp $0x3d3f170a,%eax @@ -69953,16 +69925,16 @@ BALIGN16 .byte 63 // aas .byte 174 // scas %es:(%edi),%al .byte 71 // inc %edi - .byte 225,61 // loope cdd1 <.literal16+0x111> + .byte 225,61 // loope cdb1 <.literal16+0x111> .byte 174 // scas %es:(%edi),%al .byte 71 // inc %edi - .byte 225,61 // loope cdd5 <.literal16+0x115> + .byte 225,61 // loope cdb5 <.literal16+0x115> .byte 174 // scas %es:(%edi),%al .byte 71 // inc %edi - .byte 225,61 // loope cdd9 <.literal16+0x119> + .byte 225,61 // loope cdb9 <.literal16+0x119> .byte 174 // scas %es:(%edi),%al .byte 71 // inc %edi - .byte 225,61 // loope cddd <.literal16+0x11d> + .byte 225,61 // loope cdbd <.literal16+0x11d> .byte 255,0 // incl (%eax) .byte 0,0 // add %al,(%eax) .byte 255,0 // incl (%eax) @@ -69972,13 +69944,13 @@ BALIGN16 .byte 255,0 // incl (%eax) .byte 0,0 // add %al,(%eax) .byte 0,0 // add %al,(%eax) - .byte 127,67 // jg cdf7 <.literal16+0x137> + .byte 127,67 // jg cdd7 <.literal16+0x137> .byte 0,0 // add %al,(%eax) - .byte 127,67 // jg cdfb <.literal16+0x13b> + .byte 127,67 // jg cddb <.literal16+0x13b> .byte 0,0 // add %al,(%eax) - .byte 127,67 // jg cdff <.literal16+0x13f> + .byte 127,67 // jg cddf <.literal16+0x13f> .byte 0,0 // add %al,(%eax) - .byte 127,67 // jg ce03 <.literal16+0x143> + .byte 127,67 // jg cde3 <.literal16+0x143> .byte 145 // xchg %eax,%ecx .byte 131,158,61,145,131,158,61 // sbbl $0x3d,-0x617c6ec3(%esi) .byte 145 // xchg %eax,%ecx @@ -70129,13 +70101,13 @@ BALIGN16 .byte 132,55 // test %dh,(%edi) .byte 8,33 // or %ah,(%ecx) .byte 132,55 // test %dh,(%edi) - .byte 224,7 // loopne cf09 <.literal16+0x249> + .byte 224,7 // loopne cee9 <.literal16+0x249> .byte 0,0 // add %al,(%eax) - .byte 224,7 // loopne cf0d <.literal16+0x24d> + .byte 224,7 // loopne ceed <.literal16+0x24d> .byte 0,0 // add %al,(%eax) - .byte 224,7 // loopne cf11 <.literal16+0x251> + .byte 224,7 // loopne cef1 <.literal16+0x251> .byte 0,0 // add %al,(%eax) - .byte 224,7 // loopne cf15 <.literal16+0x255> + .byte 224,7 // loopne cef5 <.literal16+0x255> .byte 0,0 // add %al,(%eax) .byte 33,8 // and %ecx,(%eax) .byte 2,58 // add (%edx),%bh @@ -70184,17 +70156,17 @@ BALIGN16 .byte 0,0 // add %al,(%eax) .byte 52,255 // xor $0xff,%al .byte 255 // (bad) - .byte 127,0 // jg cf74 <.literal16+0x2b4> + .byte 127,0 // jg cf54 <.literal16+0x2b4> .byte 255 // (bad) .byte 255 // (bad) - .byte 127,0 // jg cf78 <.literal16+0x2b8> + .byte 127,0 // jg cf58 <.literal16+0x2b8> .byte 255 // (bad) .byte 255 // (bad) - .byte 127,0 // jg cf7c <.literal16+0x2bc> + .byte 127,0 // jg cf5c <.literal16+0x2bc> .byte 255 // (bad) .byte 255 // (bad) - .byte 127,0 // jg cf80 <.literal16+0x2c0> - .byte 119,115 // ja cff5 <.literal16+0x335> + .byte 127,0 // jg cf60 <.literal16+0x2c0> + .byte 119,115 // ja cfd5 <.literal16+0x335> .byte 248 // clc .byte 194,119,115 // ret $0x7377 .byte 248 // clc @@ -70205,7 +70177,7 @@ BALIGN16 .byte 194,117,191 // ret $0xbf75 .byte 191,63,117,191,191 // mov $0xbfbf753f,%edi .byte 63 // aas - .byte 117,191 // jne cf59 <.literal16+0x299> + .byte 117,191 // jne cf39 <.literal16+0x299> .byte 191,63,117,191,191 // mov $0xbfbf753f,%edi .byte 63 // aas .byte 249 // stc @@ -70221,7 +70193,7 @@ BALIGN16 .byte 68 // inc %esp .byte 180,62 // mov $0x3e,%ah .byte 163,233,220,63,163 // mov %eax,0xa33fdce9 - .byte 233,220,63,163,233 // jmp e9a40f96 <_sk_srcover_rgba_8888_sse2_lowp+0xe9a345a2> + .byte 233,220,63,163,233 // jmp e9a40f76 <_sk_srcover_rgba_8888_sse2_lowp+0xe9a345a6> .byte 220,63 // fdivrl (%edi) .byte 163,233,220,63,81 // mov %eax,0x513fdce9 .byte 140,242 // mov %?,%edx @@ -70317,16 +70289,16 @@ BALIGN16 .byte 128,3,62 // addb $0x3e,(%ebx) .byte 31 // pop %ds .byte 215 // xlat %ds:(%ebx) - .byte 118,63 // jbe d0e3 <.literal16+0x423> + .byte 118,63 // jbe d0c3 <.literal16+0x423> .byte 31 // pop %ds .byte 215 // xlat %ds:(%ebx) - .byte 118,63 // jbe d0e7 <.literal16+0x427> + .byte 118,63 // jbe d0c7 <.literal16+0x427> .byte 31 // pop %ds .byte 215 // xlat %ds:(%ebx) - .byte 118,63 // jbe d0eb <.literal16+0x42b> + .byte 118,63 // jbe d0cb <.literal16+0x42b> .byte 31 // pop %ds .byte 215 // xlat %ds:(%ebx) - .byte 118,63 // jbe d0ef <.literal16+0x42f> + .byte 118,63 // jbe d0cf <.literal16+0x42f> .byte 246,64,83,63 // testb $0x3f,0x53(%eax) .byte 246,64,83,63 // testb $0x3f,0x53(%eax) .byte 246,64,83,63 // testb $0x3f,0x53(%eax) @@ -70352,13 +70324,13 @@ BALIGN16 .byte 248 // clc .byte 65 // inc %ecx .byte 0,0 // add %al,(%eax) - .byte 124,66 // jl d126 <.literal16+0x466> + .byte 124,66 // jl d106 <.literal16+0x466> .byte 0,0 // add %al,(%eax) - .byte 124,66 // jl d12a <.literal16+0x46a> + .byte 124,66 // jl d10a <.literal16+0x46a> .byte 0,0 // add %al,(%eax) - .byte 124,66 // jl d12e <.literal16+0x46e> + .byte 124,66 // jl d10e <.literal16+0x46e> .byte 0,0 // add %al,(%eax) - .byte 124,66 // jl d132 <.literal16+0x472> + .byte 124,66 // jl d112 <.literal16+0x472> .byte 0,240 // add %dh,%al .byte 0,0 // add %al,(%eax) .byte 0,240 // add %dh,%al @@ -70404,25 +70376,25 @@ BALIGN16 .byte 136,136,61,137,136,136 // mov %cl,-0x777776c3(%eax) .byte 61,137,136,136,61 // cmp $0x3d888889,%eax .byte 0,0 // add %al,(%eax) - .byte 112,65 // jo d1b5 <.literal16+0x4f5> + .byte 112,65 // jo d195 <.literal16+0x4f5> .byte 0,0 // add %al,(%eax) - .byte 112,65 // jo d1b9 <.literal16+0x4f9> + .byte 112,65 // jo d199 <.literal16+0x4f9> .byte 0,0 // add %al,(%eax) - .byte 112,65 // jo d1bd <.literal16+0x4fd> + .byte 112,65 // jo d19d <.literal16+0x4fd> .byte 0,0 // add %al,(%eax) - .byte 112,65 // jo d1c1 <.literal16+0x501> + .byte 112,65 // jo d1a1 <.literal16+0x501> .byte 0,128,0,0,0,128 // add %al,-0x80000000(%eax) .byte 0,0 // add %al,(%eax) .byte 0,128,0,0,0,128 // add %al,-0x80000000(%eax) .byte 0,0 // add %al,(%eax) .byte 255 // (bad) - .byte 127,0 // jg d193 <.literal16+0x4d3> + .byte 127,0 // jg d173 <.literal16+0x4d3> .byte 0,255 // add %bh,%bh - .byte 127,0 // jg d197 <.literal16+0x4d7> + .byte 127,0 // jg d177 <.literal16+0x4d7> .byte 0,255 // add %bh,%bh - .byte 127,0 // jg d19b <.literal16+0x4db> + .byte 127,0 // jg d17b <.literal16+0x4db> .byte 0,255 // add %bh,%bh - .byte 127,0 // jg d19f <.literal16+0x4df> + .byte 127,0 // jg d17f <.literal16+0x4df> .byte 0,0 // add %al,(%eax) .byte 4,0 // add $0x0,%al .byte 0,0 // add %al,(%eax) @@ -70448,13 +70420,13 @@ BALIGN16 .byte 255 // (bad) .byte 255 // (bad) .byte 255 // (bad) - .byte 127,255 // jg d1d8 <.literal16+0x518> + .byte 127,255 // jg d1b8 <.literal16+0x518> .byte 255 // (bad) .byte 255 // (bad) - .byte 127,255 // jg d1dc <.literal16+0x51c> + .byte 127,255 // jg d1bc <.literal16+0x51c> .byte 255 // (bad) .byte 255 // (bad) - .byte 127,0 // jg d1e1 <.literal16+0x521> + .byte 127,0 // jg d1c1 <.literal16+0x521> .byte 0,128,56,0,0,128 // add %al,-0x7fffffc8(%eax) .byte 56,0 // cmp %al,(%eax) .byte 0,128,56,0,0,128 // add %al,-0x7fffffc8(%eax) @@ -70468,13 +70440,13 @@ BALIGN16 .byte 0,255 // add %bh,%bh .byte 255,0 // incl (%eax) .byte 255 // (bad) - .byte 127,71 // jg d24b <.literal16+0x58b> + .byte 127,71 // jg d22b <.literal16+0x58b> .byte 0,255 // add %bh,%bh - .byte 127,71 // jg d24f <.literal16+0x58f> + .byte 127,71 // jg d22f <.literal16+0x58f> .byte 0,255 // add %bh,%bh - .byte 127,71 // jg d253 <.literal16+0x593> + .byte 127,71 // jg d233 <.literal16+0x593> .byte 0,255 // add %bh,%bh - .byte 127,71 // jg d257 <.literal16+0x597> + .byte 127,71 // jg d237 <.literal16+0x597> .byte 208 // (bad) .byte 179,89 // mov $0x59,%bl .byte 62,208 // ds (bad) @@ -70527,7 +70499,7 @@ BALIGN16 .byte 192,45,16,17,192,45,16 // shrb $0x10,0x2dc01110 .byte 17,192 // adc %eax,%eax .byte 45,16,17,192,18 // sub $0x12c01110,%eax - .byte 120,57 // js d2bc <.literal16+0x5fc> + .byte 120,57 // js d29c <.literal16+0x5fc> .byte 64 // inc %eax .byte 18,120,57 // adc 0x39(%eax),%bh .byte 64 // inc %eax @@ -70598,13 +70570,13 @@ BALIGN16 .byte 192,191,0,0,192,191,0 // sarb $0x0,-0x40400000(%edi) .byte 0,192 // add %al,%al .byte 191,0,0,192,191 // mov $0xbfc00000,%edi - .byte 114,28 // jb d36e <.literal16+0x6ae> + .byte 114,28 // jb d34e <.literal16+0x6ae> .byte 199 // (bad) - .byte 62,114,28 // jb,pt d372 <.literal16+0x6b2> + .byte 62,114,28 // jb,pt d352 <.literal16+0x6b2> .byte 199 // (bad) - .byte 62,114,28 // jb,pt d376 <.literal16+0x6b6> + .byte 62,114,28 // jb,pt d356 <.literal16+0x6b6> .byte 199 // (bad) - .byte 62,114,28 // jb,pt d37a <.literal16+0x6ba> + .byte 62,114,28 // jb,pt d35a <.literal16+0x6ba> .byte 199 // (bad) .byte 62,85 // ds push %ebp .byte 85 // push %ebp @@ -70625,13 +70597,13 @@ BALIGN16 .byte 57,142,99,61,57,142 // cmp %ecx,-0x71c6c29d(%esi) .byte 99,61,57,142,99,61 // arpl %di,0x3d638e39 .byte 57,142,99,61,114,249 // cmp %ecx,-0x68dc29d(%esi) - .byte 127,63 // jg d3d3 <.literal16+0x713> - .byte 114,249 // jb d38f <.literal16+0x6cf> - .byte 127,63 // jg d3d7 <.literal16+0x717> - .byte 114,249 // jb d393 <.literal16+0x6d3> - .byte 127,63 // jg d3db <.literal16+0x71b> - .byte 114,249 // jb d397 <.literal16+0x6d7> - .byte 127,63 // jg d3df <.literal16+0x71f> + .byte 127,63 // jg d3b3 <.literal16+0x713> + .byte 114,249 // jb d36f <.literal16+0x6cf> + .byte 127,63 // jg d3b7 <.literal16+0x717> + .byte 114,249 // jb d373 <.literal16+0x6d3> + .byte 127,63 // jg d3bb <.literal16+0x71b> + .byte 114,249 // jb d377 <.literal16+0x6d7> + .byte 127,63 // jg d3bf <.literal16+0x71f> .byte 3,0 // add (%eax),%eax .byte 0,0 // add %al,(%eax) .byte 3,0 // add (%eax),%eax @@ -70699,14 +70671,14 @@ BALIGN16 .byte 0,248 // add %bh,%al .byte 0,248 // add %bh,%al .byte 0,248 // add %bh,%al - .byte 224,255 // loopne d431 <.literal16+0x771> - .byte 224,255 // loopne d433 <.literal16+0x773> - .byte 224,255 // loopne d435 <.literal16+0x775> - .byte 224,255 // loopne d437 <.literal16+0x777> - .byte 224,255 // loopne d439 <.literal16+0x779> - .byte 224,255 // loopne d43b <.literal16+0x77b> - .byte 224,255 // loopne d43d <.literal16+0x77d> - .byte 224,255 // loopne d43f <.literal16+0x77f> + .byte 224,255 // loopne d411 <.literal16+0x771> + .byte 224,255 // loopne d413 <.literal16+0x773> + .byte 224,255 // loopne d415 <.literal16+0x775> + .byte 224,255 // loopne d417 <.literal16+0x777> + .byte 224,255 // loopne d419 <.literal16+0x779> + .byte 224,255 // loopne d41b <.literal16+0x77b> + .byte 224,255 // loopne d41d <.literal16+0x77d> + .byte 224,255 // loopne d41f <.literal16+0x77f> .byte 54,0,54 // add %dh,%ss:(%esi) .byte 0,54 // add %dh,(%esi) .byte 0,54 // add %dh,(%esi) @@ -70730,5 +70702,5 @@ BALIGN4 .byte 0,0 // add %al,(%eax) .byte 0,63 // add %bh,(%edi) .byte 0,0 // add %al,(%eax) - .byte 127,67 // jg d4bb <_sk_srcover_rgba_8888_sse2_lowp+0xac7> + .byte 127,67 // jg d49b <_sk_srcover_rgba_8888_sse2_lowp+0xacb> #endif diff --git a/src/jumper/SkJumper_generated_win.S b/src/jumper/SkJumper_generated_win.S index fe43ec82ae..5dc6f3a640 100644 --- a/src/jumper/SkJumper_generated_win.S +++ b/src/jumper/SkJumper_generated_win.S @@ -43575,11 +43575,11 @@ _sk_seed_shader_sse2 LABEL PROC DB 102,15,110,2 ; movd (%edx),%xmm0 DB 102,15,112,192,0 ; pshufd $0x0,%xmm0,%xmm0 DB 15,91,192 ; cvtdq2ps %xmm0,%xmm0 - DB 15,88,128,247,203,0,0 ; addps 0xcbf7(%eax),%xmm0 + DB 15,88,128,215,203,0,0 ; addps 0xcbd7(%eax),%xmm0 DB 102,15,110,74,4 ; movd 0x4(%edx),%xmm1 DB 102,15,112,201,0 ; pshufd $0x0,%xmm1,%xmm1 DB 15,91,201 ; cvtdq2ps %xmm1,%xmm1 - DB 15,88,136,7,204,0,0 ; addps 0xcc07(%eax),%xmm1 + DB 15,88,136,231,203,0,0 ; addps 0xcbe7(%eax),%xmm1 DB 141,113,4 ; lea 0x4(%ecx),%esi DB 15,87,210 ; xorps %xmm2,%xmm2 DB 15,41,82,64 ; movaps %xmm2,0x40(%edx) @@ -43587,7 +43587,7 @@ _sk_seed_shader_sse2 LABEL PROC DB 15,41,82,32 ; movaps %xmm2,0x20(%edx) DB 15,41,82,16 ; movaps %xmm2,0x10(%edx) DB 131,236,8 ; sub $0x8,%esp - DB 15,40,144,23,204,0,0 ; movaps 0xcc17(%eax),%xmm2 + DB 15,40,144,247,203,0,0 ; movaps 0xcbf7(%eax),%xmm2 DB 15,87,219 ; xorps %xmm3,%xmm3 DB 86 ; push %esi DB 82 ; push %edx @@ -43612,15 +43612,15 @@ _sk_dither_sse2 LABEL PROC DB 139,69,8 ; mov 0x8(%ebp),%eax DB 102,15,110,32 ; movd (%eax),%xmm4 DB 102,15,112,228,0 ; pshufd $0x0,%xmm4,%xmm4 - DB 102,15,254,161,178,203,0,0 ; paddd 0xcbb2(%ecx),%xmm4 + DB 102,15,254,161,146,203,0,0 ; paddd 0xcb92(%ecx),%xmm4 DB 102,15,110,104,4 ; movd 0x4(%eax),%xmm5 DB 102,15,112,253,0 ; pshufd $0x0,%xmm5,%xmm7 DB 102,15,239,252 ; pxor %xmm4,%xmm7 - DB 102,15,111,177,194,203,0,0 ; movdqa 0xcbc2(%ecx),%xmm6 + DB 102,15,111,177,162,203,0,0 ; movdqa 0xcba2(%ecx),%xmm6 DB 102,15,111,207 ; movdqa %xmm7,%xmm1 DB 102,15,219,206 ; pand %xmm6,%xmm1 DB 102,15,114,241,5 ; pslld $0x5,%xmm1 - DB 102,15,111,129,226,203,0,0 ; movdqa 0xcbe2(%ecx),%xmm0 + DB 102,15,111,129,194,203,0,0 ; movdqa 0xcbc2(%ecx),%xmm0 DB 102,15,111,239 ; movdqa %xmm7,%xmm5 DB 102,15,219,232 ; pand %xmm0,%xmm5 DB 102,15,114,245,2 ; pslld $0x2,%xmm5 @@ -43630,7 +43630,7 @@ _sk_dither_sse2 LABEL PROC DB 102,15,219,196 ; pand %xmm4,%xmm0 DB 102,15,254,192 ; paddd %xmm0,%xmm0 DB 102,15,235,198 ; por %xmm6,%xmm0 - DB 102,15,111,137,210,203,0,0 ; movdqa 0xcbd2(%ecx),%xmm1 + DB 102,15,111,137,178,203,0,0 ; movdqa 0xcbb2(%ecx),%xmm1 DB 102,15,219,249 ; pand %xmm1,%xmm7 DB 102,15,219,225 ; pand %xmm1,%xmm4 DB 102,15,114,212,2 ; psrld $0x2,%xmm4 @@ -43641,8 +43641,8 @@ _sk_dither_sse2 LABEL PROC DB 102,15,114,215,1 ; psrld $0x1,%xmm7 DB 102,15,235,231 ; por %xmm7,%xmm4 DB 15,91,196 ; cvtdq2ps %xmm4,%xmm0 - DB 15,89,129,242,203,0,0 ; mulps 0xcbf2(%ecx),%xmm0 - DB 15,88,129,2,204,0,0 ; addps 0xcc02(%ecx),%xmm0 + DB 15,89,129,210,203,0,0 ; mulps 0xcbd2(%ecx),%xmm0 + DB 15,88,129,226,203,0,0 ; addps 0xcbe2(%ecx),%xmm0 DB 243,15,16,14 ; movss (%esi),%xmm1 DB 15,198,201,0 ; shufps $0x0,%xmm1,%xmm1 DB 15,89,200 ; mulps %xmm0,%xmm1 @@ -43706,7 +43706,7 @@ _sk_black_color_sse2 LABEL PROC DB 139,77,12 ; mov 0xc(%ebp),%ecx DB 141,81,4 ; lea 0x4(%ecx),%edx DB 131,236,8 ; sub $0x8,%esp - DB 15,40,152,102,202,0,0 ; movaps 0xca66(%eax),%xmm3 + DB 15,40,152,70,202,0,0 ; movaps 0xca46(%eax),%xmm3 DB 15,87,192 ; xorps %xmm0,%xmm0 DB 15,87,201 ; xorps %xmm1,%xmm1 DB 15,87,210 ; xorps %xmm2,%xmm2 @@ -43727,7 +43727,7 @@ _sk_white_color_sse2 LABEL PROC DB 139,77,12 ; mov 0xc(%ebp),%ecx DB 141,81,4 ; lea 0x4(%ecx),%edx DB 131,236,8 ; sub $0x8,%esp - DB 15,40,128,54,202,0,0 ; movaps 0xca36(%eax),%xmm0 + DB 15,40,128,22,202,0,0 ; movaps 0xca16(%eax),%xmm0 DB 15,40,200 ; movaps %xmm0,%xmm1 DB 15,40,208 ; movaps %xmm0,%xmm2 DB 15,40,216 ; movaps %xmm0,%xmm3 @@ -43809,7 +43809,7 @@ _sk_srcatop_sse2 LABEL PROC DB 139,77,8 ; mov 0x8(%ebp),%ecx DB 15,40,97,64 ; movaps 0x40(%ecx),%xmm4 DB 15,89,196 ; mulps %xmm4,%xmm0 - DB 15,40,170,135,201,0,0 ; movaps 0xc987(%edx),%xmm5 + DB 15,40,170,103,201,0,0 ; movaps 0xc967(%edx),%xmm5 DB 15,92,235 ; subps %xmm3,%xmm5 DB 15,40,113,16 ; movaps 0x10(%ecx),%xmm6 DB 15,89,245 ; mulps %xmm5,%xmm6 @@ -43846,7 +43846,7 @@ _sk_dstatop_sse2 LABEL PROC DB 15,40,105,64 ; movaps 0x40(%ecx),%xmm5 DB 15,40,113,16 ; movaps 0x10(%ecx),%xmm6 DB 15,89,243 ; mulps %xmm3,%xmm6 - DB 15,40,162,40,201,0,0 ; movaps 0xc928(%edx),%xmm4 + DB 15,40,162,8,201,0,0 ; movaps 0xc908(%edx),%xmm4 DB 15,92,229 ; subps %xmm5,%xmm4 DB 15,89,196 ; mulps %xmm4,%xmm0 DB 15,88,198 ; addps %xmm6,%xmm0 @@ -43924,7 +43924,7 @@ _sk_srcout_sse2 LABEL PROC DB 88 ; pop %eax DB 139,77,12 ; mov 0xc(%ebp),%ecx DB 139,85,8 ; mov 0x8(%ebp),%edx - DB 15,40,160,103,200,0,0 ; movaps 0xc867(%eax),%xmm4 + DB 15,40,160,71,200,0,0 ; movaps 0xc847(%eax),%xmm4 DB 15,92,98,64 ; subps 0x40(%edx),%xmm4 DB 15,89,196 ; mulps %xmm4,%xmm0 DB 15,89,204 ; mulps %xmm4,%xmm1 @@ -43948,7 +43948,7 @@ _sk_dstout_sse2 LABEL PROC DB 88 ; pop %eax DB 139,77,12 ; mov 0xc(%ebp),%ecx DB 139,85,8 ; mov 0x8(%ebp),%edx - DB 15,40,160,47,200,0,0 ; movaps 0xc82f(%eax),%xmm4 + DB 15,40,160,15,200,0,0 ; movaps 0xc80f(%eax),%xmm4 DB 15,92,227 ; subps %xmm3,%xmm4 DB 15,40,66,16 ; movaps 0x10(%edx),%xmm0 DB 15,89,196 ; mulps %xmm4,%xmm0 @@ -43976,7 +43976,7 @@ _sk_srcover_sse2 LABEL PROC DB 88 ; pop %eax DB 139,77,12 ; mov 0xc(%ebp),%ecx DB 139,85,8 ; mov 0x8(%ebp),%edx - DB 15,40,160,232,199,0,0 ; movaps 0xc7e8(%eax),%xmm4 + DB 15,40,160,200,199,0,0 ; movaps 0xc7c8(%eax),%xmm4 DB 15,92,227 ; subps %xmm3,%xmm4 DB 15,40,106,16 ; movaps 0x10(%edx),%xmm5 DB 15,89,236 ; mulps %xmm4,%xmm5 @@ -44008,7 +44008,7 @@ _sk_dstover_sse2 LABEL PROC DB 139,77,12 ; mov 0xc(%ebp),%ecx DB 139,85,8 ; mov 0x8(%ebp),%edx DB 15,40,106,64 ; movaps 0x40(%edx),%xmm5 - DB 15,40,160,152,199,0,0 ; movaps 0xc798(%eax),%xmm4 + DB 15,40,160,120,199,0,0 ; movaps 0xc778(%eax),%xmm4 DB 15,92,229 ; subps %xmm5,%xmm4 DB 15,89,196 ; mulps %xmm4,%xmm0 DB 15,88,66,16 ; addps 0x10(%edx),%xmm0 @@ -44060,7 +44060,7 @@ _sk_multiply_sse2 LABEL PROC DB 139,69,8 ; mov 0x8(%ebp),%eax DB 15,40,80,64 ; movaps 0x40(%eax),%xmm2 DB 15,41,85,200 ; movaps %xmm2,-0x38(%ebp) - DB 15,40,129,25,199,0,0 ; movaps 0xc719(%ecx),%xmm0 + DB 15,40,129,249,198,0,0 ; movaps 0xc6f9(%ecx),%xmm0 DB 15,40,240 ; movaps %xmm0,%xmm6 DB 15,92,242 ; subps %xmm2,%xmm6 DB 15,40,254 ; movaps %xmm6,%xmm7 @@ -44118,7 +44118,7 @@ _sk_plus__sse2 LABEL PROC DB 139,77,12 ; mov 0xc(%ebp),%ecx DB 139,85,8 ; mov 0x8(%ebp),%edx DB 15,88,66,16 ; addps 0x10(%edx),%xmm0 - DB 15,40,160,115,198,0,0 ; movaps 0xc673(%eax),%xmm4 + DB 15,40,160,83,198,0,0 ; movaps 0xc653(%eax),%xmm4 DB 15,93,196 ; minps %xmm4,%xmm0 DB 15,88,74,32 ; addps 0x20(%edx),%xmm1 DB 15,93,204 ; minps %xmm4,%xmm1 @@ -44186,7 +44186,7 @@ _sk_xor__sse2 LABEL PROC DB 139,69,12 ; mov 0xc(%ebp),%eax DB 139,77,8 ; mov 0x8(%ebp),%ecx DB 15,40,105,64 ; movaps 0x40(%ecx),%xmm5 - DB 15,40,154,197,197,0,0 ; movaps 0xc5c5(%edx),%xmm3 + DB 15,40,154,165,197,0,0 ; movaps 0xc5a5(%edx),%xmm3 DB 15,40,243 ; movaps %xmm3,%xmm6 DB 15,92,245 ; subps %xmm5,%xmm6 DB 15,89,198 ; mulps %xmm6,%xmm0 @@ -44246,7 +44246,7 @@ _sk_darken_sse2 LABEL PROC DB 15,89,203 ; mulps %xmm3,%xmm1 DB 15,95,209 ; maxps %xmm1,%xmm2 DB 15,92,234 ; subps %xmm2,%xmm5 - DB 15,40,138,93,197,0,0 ; movaps 0xc55d(%edx),%xmm1 + DB 15,40,138,61,197,0,0 ; movaps 0xc53d(%edx),%xmm1 DB 15,92,203 ; subps %xmm3,%xmm1 DB 15,89,206 ; mulps %xmm6,%xmm1 DB 15,88,217 ; addps %xmm1,%xmm3 @@ -44293,7 +44293,7 @@ _sk_lighten_sse2 LABEL PROC DB 15,89,203 ; mulps %xmm3,%xmm1 DB 15,93,209 ; minps %xmm1,%xmm2 DB 15,92,234 ; subps %xmm2,%xmm5 - DB 15,40,138,221,196,0,0 ; movaps 0xc4dd(%edx),%xmm1 + DB 15,40,138,189,196,0,0 ; movaps 0xc4bd(%edx),%xmm1 DB 15,92,203 ; subps %xmm3,%xmm1 DB 15,89,206 ; mulps %xmm6,%xmm1 DB 15,88,217 ; addps %xmm1,%xmm3 @@ -44344,7 +44344,7 @@ _sk_difference_sse2 LABEL PROC DB 15,93,214 ; minps %xmm6,%xmm2 DB 15,88,210 ; addps %xmm2,%xmm2 DB 15,92,226 ; subps %xmm2,%xmm4 - DB 15,40,146,90,196,0,0 ; movaps 0xc45a(%edx),%xmm2 + DB 15,40,146,58,196,0,0 ; movaps 0xc43a(%edx),%xmm2 DB 15,92,211 ; subps %xmm3,%xmm2 DB 15,89,213 ; mulps %xmm5,%xmm2 DB 15,88,218 ; addps %xmm2,%xmm3 @@ -44386,7 +44386,7 @@ _sk_exclusion_sse2 LABEL PROC DB 15,89,202 ; mulps %xmm2,%xmm1 DB 15,88,201 ; addps %xmm1,%xmm1 DB 15,92,233 ; subps %xmm1,%xmm5 - DB 15,40,138,212,195,0,0 ; movaps 0xc3d4(%edx),%xmm1 + DB 15,40,138,180,195,0,0 ; movaps 0xc3b4(%edx),%xmm1 DB 15,92,203 ; subps %xmm3,%xmm1 DB 15,89,73,64 ; mulps 0x40(%ecx),%xmm1 DB 15,88,217 ; addps %xmm1,%xmm3 @@ -44425,7 +44425,7 @@ _sk_colorburn_sse2 LABEL PROC DB 15,93,198 ; minps %xmm6,%xmm0 DB 15,40,233 ; movaps %xmm1,%xmm5 DB 15,92,232 ; subps %xmm0,%xmm5 - DB 15,40,177,85,195,0,0 ; movaps 0xc355(%ecx),%xmm6 + DB 15,40,177,53,195,0,0 ; movaps 0xc335(%ecx),%xmm6 DB 15,40,198 ; movaps %xmm6,%xmm0 DB 15,92,193 ; subps %xmm1,%xmm0 DB 15,41,69,200 ; movaps %xmm0,-0x38(%ebp) @@ -44540,7 +44540,7 @@ _sk_colordodge_sse2 LABEL PROC DB 89 ; pop %ecx DB 139,69,8 ; mov 0x8(%ebp),%eax DB 15,40,72,16 ; movaps 0x10(%eax),%xmm1 - DB 15,40,145,204,193,0,0 ; movaps 0xc1cc(%ecx),%xmm2 + DB 15,40,145,172,193,0,0 ; movaps 0xc1ac(%ecx),%xmm2 DB 15,40,226 ; movaps %xmm2,%xmm4 DB 15,92,214 ; subps %xmm6,%xmm2 DB 15,40,250 ; movaps %xmm2,%xmm7 @@ -44655,7 +44655,7 @@ _sk_hardlight_sse2 LABEL PROC DB 89 ; pop %ecx DB 139,69,8 ; mov 0x8(%ebp),%eax DB 15,40,72,64 ; movaps 0x40(%eax),%xmm1 - DB 15,40,145,107,192,0,0 ; movaps 0xc06b(%ecx),%xmm2 + DB 15,40,145,75,192,0,0 ; movaps 0xc04b(%ecx),%xmm2 DB 15,40,234 ; movaps %xmm2,%xmm5 DB 15,92,233 ; subps %xmm1,%xmm5 DB 15,40,225 ; movaps %xmm1,%xmm4 @@ -44763,7 +44763,7 @@ _sk_overlay_sse2 LABEL PROC DB 89 ; pop %ecx DB 139,69,8 ; mov 0x8(%ebp),%eax DB 15,40,80,64 ; movaps 0x40(%eax),%xmm2 - DB 15,40,161,32,191,0,0 ; movaps 0xbf20(%ecx),%xmm4 + DB 15,40,161,0,191,0,0 ; movaps 0xbf00(%ecx),%xmm4 DB 15,40,244 ; movaps %xmm4,%xmm6 DB 15,92,242 ; subps %xmm2,%xmm6 DB 15,40,206 ; movaps %xmm6,%xmm1 @@ -44889,17 +44889,17 @@ _sk_softlight_sse2 LABEL PROC DB 232,0,0,0,0 ; call f60 <_sk_softlight_sse2+0x52> DB 89 ; pop %ecx DB 15,40,194 ; movaps %xmm2,%xmm0 - DB 15,40,137,0,190,0,0 ; movaps 0xbe00(%ecx),%xmm1 + DB 15,40,137,224,189,0,0 ; movaps 0xbde0(%ecx),%xmm1 DB 15,41,141,104,255,255,255 ; movaps %xmm1,-0x98(%ebp) DB 15,88,193 ; addps %xmm1,%xmm0 DB 15,89,198 ; mulps %xmm6,%xmm0 - DB 15,40,185,144,189,0,0 ; movaps 0xbd90(%ecx),%xmm7 + DB 15,40,185,112,189,0,0 ; movaps 0xbd70(%ecx),%xmm7 DB 15,41,125,232 ; movaps %xmm7,-0x18(%ebp) DB 15,92,250 ; subps %xmm2,%xmm7 DB 15,82,242 ; rsqrtps %xmm2,%xmm6 DB 15,83,206 ; rcpps %xmm6,%xmm1 DB 15,92,202 ; subps %xmm2,%xmm1 - DB 15,40,161,16,190,0,0 ; movaps 0xbe10(%ecx),%xmm4 + DB 15,40,161,240,189,0,0 ; movaps 0xbdf0(%ecx),%xmm4 DB 15,41,101,152 ; movaps %xmm4,-0x68(%ebp) DB 15,89,212 ; mulps %xmm4,%xmm2 DB 15,88,208 ; addps %xmm0,%xmm2 @@ -45103,7 +45103,7 @@ _sk_hue_sse2 LABEL PROC DB 15,40,226 ; movaps %xmm2,%xmm4 DB 15,40,72,64 ; movaps 0x40(%eax),%xmm1 DB 15,41,77,216 ; movaps %xmm1,-0x28(%ebp) - DB 15,40,169,207,186,0,0 ; movaps 0xbacf(%ecx),%xmm5 + DB 15,40,169,175,186,0,0 ; movaps 0xbaaf(%ecx),%xmm5 DB 15,92,233 ; subps %xmm1,%xmm5 DB 15,89,197 ; mulps %xmm5,%xmm0 DB 15,41,133,72,255,255,255 ; movaps %xmm0,-0xb8(%ebp) @@ -45136,17 +45136,17 @@ _sk_hue_sse2 LABEL PROC DB 15,89,233 ; mulps %xmm1,%xmm5 DB 15,41,173,120,255,255,255 ; movaps %xmm5,-0x88(%ebp) DB 15,89,193 ; mulps %xmm1,%xmm0 - DB 15,40,153,95,187,0,0 ; movaps 0xbb5f(%ecx),%xmm3 + DB 15,40,153,63,187,0,0 ; movaps 0xbb3f(%ecx),%xmm3 DB 15,41,93,232 ; movaps %xmm3,-0x18(%ebp) DB 15,40,117,152 ; movaps -0x68(%ebp),%xmm6 DB 15,40,206 ; movaps %xmm6,%xmm1 DB 15,89,203 ; mulps %xmm3,%xmm1 - DB 15,40,153,111,187,0,0 ; movaps 0xbb6f(%ecx),%xmm3 + DB 15,40,153,79,187,0,0 ; movaps 0xbb4f(%ecx),%xmm3 DB 15,40,109,136 ; movaps -0x78(%ebp),%xmm5 DB 15,40,253 ; movaps %xmm5,%xmm7 DB 15,89,251 ; mulps %xmm3,%xmm7 DB 15,88,249 ; addps %xmm1,%xmm7 - DB 15,40,137,207,186,0,0 ; movaps 0xbacf(%ecx),%xmm1 + DB 15,40,137,175,186,0,0 ; movaps 0xbaaf(%ecx),%xmm1 DB 15,92,77,184 ; subps -0x48(%ebp),%xmm1 DB 15,89,241 ; mulps %xmm1,%xmm6 DB 15,41,117,152 ; movaps %xmm6,-0x68(%ebp) @@ -45156,7 +45156,7 @@ _sk_hue_sse2 LABEL PROC DB 15,40,77,200 ; movaps -0x38(%ebp),%xmm1 DB 15,89,241 ; mulps %xmm1,%xmm6 DB 15,41,117,168 ; movaps %xmm6,-0x58(%ebp) - DB 15,40,169,127,187,0,0 ; movaps 0xbb7f(%ecx),%xmm5 + DB 15,40,169,95,187,0,0 ; movaps 0xbb5f(%ecx),%xmm5 DB 15,89,205 ; mulps %xmm5,%xmm1 DB 15,88,207 ; addps %xmm7,%xmm1 DB 15,94,212 ; divps %xmm4,%xmm2 @@ -45347,17 +45347,17 @@ _sk_saturation_sse2 LABEL PROC DB 15,89,253 ; mulps %xmm5,%xmm7 DB 232,0,0,0,0 ; call 1575 <_sk_saturation_sse2+0xb0> DB 89 ; pop %ecx - DB 15,40,153,11,184,0,0 ; movaps 0xb80b(%ecx),%xmm3 + DB 15,40,153,235,183,0,0 ; movaps 0xb7eb(%ecx),%xmm3 DB 15,41,157,88,255,255,255 ; movaps %xmm3,-0xa8(%ebp) DB 15,40,77,184 ; movaps -0x48(%ebp),%xmm1 DB 15,40,193 ; movaps %xmm1,%xmm0 DB 15,89,195 ; mulps %xmm3,%xmm0 - DB 15,40,153,27,184,0,0 ; movaps 0xb81b(%ecx),%xmm3 + DB 15,40,153,251,183,0,0 ; movaps 0xb7fb(%ecx),%xmm3 DB 15,41,93,232 ; movaps %xmm3,-0x18(%ebp) DB 15,40,238 ; movaps %xmm6,%xmm5 DB 15,89,235 ; mulps %xmm3,%xmm5 DB 15,88,232 ; addps %xmm0,%xmm5 - DB 15,40,129,123,183,0,0 ; movaps 0xb77b(%ecx),%xmm0 + DB 15,40,129,91,183,0,0 ; movaps 0xb75b(%ecx),%xmm0 DB 15,41,133,104,255,255,255 ; movaps %xmm0,-0x98(%ebp) DB 15,92,69,216 ; subps -0x28(%ebp),%xmm0 DB 15,89,200 ; mulps %xmm0,%xmm1 @@ -45369,7 +45369,7 @@ _sk_saturation_sse2 LABEL PROC DB 15,89,200 ; mulps %xmm0,%xmm1 DB 15,41,141,120,255,255,255 ; movaps %xmm1,-0x88(%ebp) DB 15,40,200 ; movaps %xmm0,%xmm1 - DB 15,40,129,43,184,0,0 ; movaps 0xb82b(%ecx),%xmm0 + DB 15,40,129,11,184,0,0 ; movaps 0xb80b(%ecx),%xmm0 DB 15,89,200 ; mulps %xmm0,%xmm1 DB 15,88,205 ; addps %xmm5,%xmm1 DB 15,40,109,168 ; movaps -0x58(%ebp),%xmm5 @@ -45526,16 +45526,16 @@ _sk_color_sse2 LABEL PROC DB 139,69,8 ; mov 0x8(%ebp),%eax DB 15,40,80,16 ; movaps 0x10(%eax),%xmm2 DB 15,40,72,32 ; movaps 0x20(%eax),%xmm1 - DB 15,40,177,176,181,0,0 ; movaps 0xb5b0(%ecx),%xmm6 + DB 15,40,177,144,181,0,0 ; movaps 0xb590(%ecx),%xmm6 DB 15,41,117,216 ; movaps %xmm6,-0x28(%ebp) DB 15,40,194 ; movaps %xmm2,%xmm0 DB 15,89,198 ; mulps %xmm6,%xmm0 - DB 15,40,153,192,181,0,0 ; movaps 0xb5c0(%ecx),%xmm3 + DB 15,40,153,160,181,0,0 ; movaps 0xb5a0(%ecx),%xmm3 DB 15,41,93,184 ; movaps %xmm3,-0x48(%ebp) DB 15,40,241 ; movaps %xmm1,%xmm6 DB 15,89,243 ; mulps %xmm3,%xmm6 DB 15,88,240 ; addps %xmm0,%xmm6 - DB 15,40,129,32,181,0,0 ; movaps 0xb520(%ecx),%xmm0 + DB 15,40,129,0,181,0,0 ; movaps 0xb500(%ecx),%xmm0 DB 15,41,69,168 ; movaps %xmm0,-0x58(%ebp) DB 15,92,69,200 ; subps -0x38(%ebp),%xmm0 DB 15,89,208 ; mulps %xmm0,%xmm2 @@ -45545,7 +45545,7 @@ _sk_color_sse2 LABEL PROC DB 15,40,80,48 ; movaps 0x30(%eax),%xmm2 DB 15,89,194 ; mulps %xmm2,%xmm0 DB 15,41,133,72,255,255,255 ; movaps %xmm0,-0xb8(%ebp) - DB 15,40,137,208,181,0,0 ; movaps 0xb5d0(%ecx),%xmm1 + DB 15,40,137,176,181,0,0 ; movaps 0xb5b0(%ecx),%xmm1 DB 15,89,209 ; mulps %xmm1,%xmm2 DB 15,88,214 ; addps %xmm6,%xmm2 DB 15,40,88,64 ; movaps 0x40(%eax),%xmm3 @@ -45702,18 +45702,18 @@ _sk_luminosity_sse2 LABEL PROC DB 232,0,0,0,0 ; call 1a33 <_sk_luminosity_sse2+0x11> DB 89 ; pop %ecx DB 139,69,8 ; mov 0x8(%ebp),%eax - DB 15,40,161,77,179,0,0 ; movaps 0xb34d(%ecx),%xmm4 + DB 15,40,161,45,179,0,0 ; movaps 0xb32d(%ecx),%xmm4 DB 15,41,101,232 ; movaps %xmm4,-0x18(%ebp) DB 15,40,208 ; movaps %xmm0,%xmm2 DB 15,89,212 ; mulps %xmm4,%xmm2 - DB 15,40,161,93,179,0,0 ; movaps 0xb35d(%ecx),%xmm4 + DB 15,40,161,61,179,0,0 ; movaps 0xb33d(%ecx),%xmm4 DB 15,41,101,216 ; movaps %xmm4,-0x28(%ebp) DB 15,40,233 ; movaps %xmm1,%xmm5 DB 15,89,236 ; mulps %xmm4,%xmm5 DB 15,88,234 ; addps %xmm2,%xmm5 DB 15,40,80,64 ; movaps 0x40(%eax),%xmm2 DB 15,41,85,184 ; movaps %xmm2,-0x48(%ebp) - DB 15,40,161,189,178,0,0 ; movaps 0xb2bd(%ecx),%xmm4 + DB 15,40,161,157,178,0,0 ; movaps 0xb29d(%ecx),%xmm4 DB 15,40,252 ; movaps %xmm4,%xmm7 DB 15,92,250 ; subps %xmm2,%xmm7 DB 15,89,199 ; mulps %xmm7,%xmm0 @@ -45723,7 +45723,7 @@ _sk_luminosity_sse2 LABEL PROC DB 15,89,254 ; mulps %xmm6,%xmm7 DB 15,41,189,104,255,255,255 ; movaps %xmm7,-0x98(%ebp) DB 15,40,214 ; movaps %xmm6,%xmm2 - DB 15,40,137,109,179,0,0 ; movaps 0xb36d(%ecx),%xmm1 + DB 15,40,137,77,179,0,0 ; movaps 0xb34d(%ecx),%xmm1 DB 15,89,209 ; mulps %xmm1,%xmm2 DB 15,88,213 ; addps %xmm5,%xmm2 DB 15,40,104,16 ; movaps 0x10(%eax),%xmm5 @@ -45897,7 +45897,7 @@ _sk_srcover_rgba_8888_sse2 LABEL PROC DB 139,49 ; mov (%ecx),%esi DB 15,133,224,0,0,0 ; jne 1da0 <_sk_srcover_rgba_8888_sse2+0x119> DB 243,15,111,20,178 ; movdqu (%edx,%esi,4),%xmm2 - DB 102,15,111,167,18,177,0,0 ; movdqa 0xb112(%edi),%xmm4 + DB 102,15,111,167,242,176,0,0 ; movdqa 0xb0f2(%edi),%xmm4 DB 102,15,111,234 ; movdqa %xmm2,%xmm5 DB 102,15,219,236 ; pand %xmm4,%xmm5 DB 102,15,111,242 ; movdqa %xmm2,%xmm6 @@ -45908,9 +45908,9 @@ _sk_srcover_rgba_8888_sse2 LABEL PROC DB 102,15,219,252 ; pand %xmm4,%xmm7 DB 15,91,229 ; cvtdq2ps %xmm5,%xmm4 DB 15,41,97,16 ; movaps %xmm4,0x10(%ecx) - DB 15,40,175,82,176,0,0 ; movaps 0xb052(%edi),%xmm5 + DB 15,40,175,50,176,0,0 ; movaps 0xb032(%edi),%xmm5 DB 15,92,235 ; subps %xmm3,%xmm5 - DB 15,40,143,34,177,0,0 ; movaps 0xb122(%edi),%xmm1 + DB 15,40,143,2,177,0,0 ; movaps 0xb102(%edi),%xmm1 DB 15,89,193 ; mulps %xmm1,%xmm0 DB 15,89,229 ; mulps %xmm5,%xmm4 DB 15,88,224 ; addps %xmm0,%xmm4 @@ -46020,7 +46020,7 @@ _sk_clamp_1_sse2 LABEL PROC DB 232,0,0,0,0 ; call 1e4a <_sk_clamp_1_sse2+0xb> DB 88 ; pop %eax DB 139,77,12 ; mov 0xc(%ebp),%ecx - DB 15,40,160,166,174,0,0 ; movaps 0xaea6(%eax),%xmm4 + DB 15,40,160,134,174,0,0 ; movaps 0xae86(%eax),%xmm4 DB 15,93,196 ; minps %xmm4,%xmm0 DB 15,93,204 ; minps %xmm4,%xmm1 DB 15,93,212 ; minps %xmm4,%xmm2 @@ -46042,7 +46042,7 @@ _sk_clamp_a_sse2 LABEL PROC DB 232,0,0,0,0 ; call 1e7d <_sk_clamp_a_sse2+0xb> DB 88 ; pop %eax DB 139,77,12 ; mov 0xc(%ebp),%ecx - DB 15,93,152,115,174,0,0 ; minps 0xae73(%eax),%xmm3 + DB 15,93,152,83,174,0,0 ; minps 0xae53(%eax),%xmm3 DB 15,93,195 ; minps %xmm3,%xmm0 DB 15,93,203 ; minps %xmm3,%xmm1 DB 15,93,211 ; minps %xmm3,%xmm2 @@ -46065,7 +46065,7 @@ _sk_clamp_a_dst_sse2 LABEL PROC DB 139,77,12 ; mov 0xc(%ebp),%ecx DB 139,85,8 ; mov 0x8(%ebp),%edx DB 15,40,98,64 ; movaps 0x40(%edx),%xmm4 - DB 15,93,160,67,174,0,0 ; minps 0xae43(%eax),%xmm4 + DB 15,93,160,35,174,0,0 ; minps 0xae23(%eax),%xmm4 DB 15,41,98,64 ; movaps %xmm4,0x40(%edx) DB 15,40,106,16 ; movaps 0x10(%edx),%xmm5 DB 15,40,114,32 ; movaps 0x20(%edx),%xmm6 @@ -46133,7 +46133,7 @@ _sk_invert_sse2 LABEL PROC DB 232,0,0,0,0 ; call 1f58 <_sk_invert_sse2+0xb> DB 88 ; pop %eax DB 139,77,12 ; mov 0xc(%ebp),%ecx - DB 15,40,160,152,173,0,0 ; movaps 0xad98(%eax),%xmm4 + DB 15,40,160,120,173,0,0 ; movaps 0xad78(%eax),%xmm4 DB 15,40,236 ; movaps %xmm4,%xmm5 DB 15,92,232 ; subps %xmm0,%xmm5 DB 15,40,244 ; movaps %xmm4,%xmm6 @@ -46246,7 +46246,7 @@ _sk_unpremul_sse2 LABEL PROC DB 88 ; pop %eax DB 139,77,12 ; mov 0xc(%ebp),%ecx DB 15,87,228 ; xorps %xmm4,%xmm4 - DB 15,40,168,154,172,0,0 ; movaps 0xac9a(%eax),%xmm5 + DB 15,40,168,122,172,0,0 ; movaps 0xac7a(%eax),%xmm5 DB 15,94,235 ; divps %xmm3,%xmm5 DB 15,194,227,4 ; cmpneqps %xmm3,%xmm4 DB 15,84,229 ; andps %xmm5,%xmm4 @@ -46275,19 +46275,19 @@ _sk_from_srgb_sse2 LABEL PROC DB 88 ; pop %eax DB 15,40,202 ; movaps %xmm2,%xmm1 DB 15,89,201 ; mulps %xmm1,%xmm1 - DB 15,40,160,224,172,0,0 ; movaps 0xace0(%eax),%xmm4 + DB 15,40,160,192,172,0,0 ; movaps 0xacc0(%eax),%xmm4 DB 15,89,196 ; mulps %xmm4,%xmm0 - DB 15,40,176,64,173,0,0 ; movaps 0xad40(%eax),%xmm6 + DB 15,40,176,32,173,0,0 ; movaps 0xad20(%eax),%xmm6 DB 15,41,117,216 ; movaps %xmm6,-0x28(%ebp) DB 15,88,198 ; addps %xmm6,%xmm0 DB 15,89,193 ; mulps %xmm1,%xmm0 - DB 15,40,176,48,173,0,0 ; movaps 0xad30(%eax),%xmm6 + DB 15,40,176,16,173,0,0 ; movaps 0xad10(%eax),%xmm6 DB 15,40,202 ; movaps %xmm2,%xmm1 DB 15,89,206 ; mulps %xmm6,%xmm1 - DB 15,40,184,80,173,0,0 ; movaps 0xad50(%eax),%xmm7 + DB 15,40,184,48,173,0,0 ; movaps 0xad30(%eax),%xmm7 DB 15,41,125,232 ; movaps %xmm7,-0x18(%ebp) DB 15,88,199 ; addps %xmm7,%xmm0 - DB 15,40,184,96,173,0,0 ; movaps 0xad60(%eax),%xmm7 + DB 15,40,184,64,173,0,0 ; movaps 0xad40(%eax),%xmm7 DB 15,194,215,1 ; cmpltps %xmm7,%xmm2 DB 15,84,202 ; andps %xmm2,%xmm1 DB 15,85,208 ; andnps %xmm0,%xmm2 @@ -46345,18 +46345,18 @@ _sk_from_srgb_dst_sse2 LABEL PROC DB 15,40,72,16 ; movaps 0x10(%eax),%xmm1 DB 15,40,233 ; movaps %xmm1,%xmm5 DB 15,89,237 ; mulps %xmm5,%xmm5 - DB 15,40,161,5,172,0,0 ; movaps 0xac05(%ecx),%xmm4 + DB 15,40,161,229,171,0,0 ; movaps 0xabe5(%ecx),%xmm4 DB 15,40,193 ; movaps %xmm1,%xmm0 DB 15,89,196 ; mulps %xmm4,%xmm0 - DB 15,40,177,101,172,0,0 ; movaps 0xac65(%ecx),%xmm6 + DB 15,40,177,69,172,0,0 ; movaps 0xac45(%ecx),%xmm6 DB 15,88,198 ; addps %xmm6,%xmm0 DB 15,89,197 ; mulps %xmm5,%xmm0 - DB 15,40,169,85,172,0,0 ; movaps 0xac55(%ecx),%xmm5 + DB 15,40,169,53,172,0,0 ; movaps 0xac35(%ecx),%xmm5 DB 15,40,209 ; movaps %xmm1,%xmm2 DB 15,89,213 ; mulps %xmm5,%xmm2 - DB 15,40,185,117,172,0,0 ; movaps 0xac75(%ecx),%xmm7 + DB 15,40,185,85,172,0,0 ; movaps 0xac55(%ecx),%xmm7 DB 15,88,199 ; addps %xmm7,%xmm0 - DB 15,40,153,133,172,0,0 ; movaps 0xac85(%ecx),%xmm3 + DB 15,40,153,101,172,0,0 ; movaps 0xac65(%ecx),%xmm3 DB 15,194,203,1 ; cmpltps %xmm3,%xmm1 DB 15,84,209 ; andps %xmm1,%xmm2 DB 15,85,200 ; andnps %xmm0,%xmm1 @@ -46416,25 +46416,25 @@ _sk_to_srgb_sse2 LABEL PROC DB 232,0,0,0,0 ; call 2266 <_sk_to_srgb_sse2+0x18> DB 88 ; pop %eax DB 15,82,218 ; rsqrtps %xmm2,%xmm3 - DB 15,40,160,186,171,0,0 ; movaps 0xabba(%eax),%xmm4 + DB 15,40,160,154,171,0,0 ; movaps 0xab9a(%eax),%xmm4 DB 15,40,235 ; movaps %xmm3,%xmm5 DB 15,89,236 ; mulps %xmm4,%xmm5 - DB 15,40,128,202,171,0,0 ; movaps 0xabca(%eax),%xmm0 + DB 15,40,128,170,171,0,0 ; movaps 0xabaa(%eax),%xmm0 DB 15,41,69,232 ; movaps %xmm0,-0x18(%ebp) DB 15,88,232 ; addps %xmm0,%xmm5 DB 15,89,235 ; mulps %xmm3,%xmm5 - DB 15,40,128,218,171,0,0 ; movaps 0xabda(%eax),%xmm0 + DB 15,40,128,186,171,0,0 ; movaps 0xabba(%eax),%xmm0 DB 15,41,69,200 ; movaps %xmm0,-0x38(%ebp) DB 15,88,232 ; addps %xmm0,%xmm5 - DB 15,40,128,234,171,0,0 ; movaps 0xabea(%eax),%xmm0 + DB 15,40,128,202,171,0,0 ; movaps 0xabca(%eax),%xmm0 DB 15,41,69,216 ; movaps %xmm0,-0x28(%ebp) DB 15,88,216 ; addps %xmm0,%xmm3 DB 15,83,195 ; rcpps %xmm3,%xmm0 DB 15,89,197 ; mulps %xmm5,%xmm0 - DB 15,40,168,170,171,0,0 ; movaps 0xabaa(%eax),%xmm5 + DB 15,40,168,138,171,0,0 ; movaps 0xab8a(%eax),%xmm5 DB 15,40,202 ; movaps %xmm2,%xmm1 DB 15,89,205 ; mulps %xmm5,%xmm1 - DB 15,40,152,250,171,0,0 ; movaps 0xabfa(%eax),%xmm3 + DB 15,40,152,218,171,0,0 ; movaps 0xabda(%eax),%xmm3 DB 15,194,211,1 ; cmpltps %xmm3,%xmm2 DB 15,84,202 ; andps %xmm2,%xmm1 DB 15,85,208 ; andnps %xmm0,%xmm2 @@ -46503,14 +46503,14 @@ _sk_rgb_to_hsl_sse2 LABEL PROC DB 15,40,195 ; movaps %xmm3,%xmm0 DB 15,92,193 ; subps %xmm1,%xmm0 DB 15,41,69,216 ; movaps %xmm0,-0x28(%ebp) - DB 15,40,136,147,169,0,0 ; movaps 0xa993(%eax),%xmm1 + DB 15,40,136,115,169,0,0 ; movaps 0xa973(%eax),%xmm1 DB 15,94,200 ; divps %xmm0,%xmm1 DB 15,40,199 ; movaps %xmm7,%xmm0 DB 15,92,194 ; subps %xmm2,%xmm0 DB 15,89,193 ; mulps %xmm1,%xmm0 DB 15,40,239 ; movaps %xmm7,%xmm5 DB 15,194,234,1 ; cmpltps %xmm2,%xmm5 - DB 15,84,168,19,171,0,0 ; andps 0xab13(%eax),%xmm5 + DB 15,84,168,243,170,0,0 ; andps 0xaaf3(%eax),%xmm5 DB 15,88,232 ; addps %xmm0,%xmm5 DB 15,40,195 ; movaps %xmm3,%xmm0 DB 15,194,196,0 ; cmpeqps %xmm4,%xmm0 @@ -46520,9 +46520,9 @@ _sk_rgb_to_hsl_sse2 LABEL PROC DB 15,92,231 ; subps %xmm7,%xmm4 DB 15,89,209 ; mulps %xmm1,%xmm2 DB 15,89,225 ; mulps %xmm1,%xmm4 - DB 15,40,136,35,171,0,0 ; movaps 0xab23(%eax),%xmm1 + DB 15,40,136,3,171,0,0 ; movaps 0xab03(%eax),%xmm1 DB 15,88,209 ; addps %xmm1,%xmm2 - DB 15,88,160,51,171,0,0 ; addps 0xab33(%eax),%xmm4 + DB 15,88,160,19,171,0,0 ; addps 0xab13(%eax),%xmm4 DB 15,84,214 ; andps %xmm6,%xmm2 DB 15,85,244 ; andnps %xmm4,%xmm6 DB 15,86,242 ; orps %xmm2,%xmm6 @@ -46534,7 +46534,7 @@ _sk_rgb_to_hsl_sse2 LABEL PROC DB 15,194,226,4 ; cmpneqps %xmm2,%xmm4 DB 15,92,203 ; subps %xmm3,%xmm1 DB 15,88,218 ; addps %xmm2,%xmm3 - DB 15,40,168,131,169,0,0 ; movaps 0xa983(%eax),%xmm5 + DB 15,40,168,99,169,0,0 ; movaps 0xa963(%eax),%xmm5 DB 15,92,202 ; subps %xmm2,%xmm1 DB 15,40,211 ; movaps %xmm3,%xmm2 DB 15,89,213 ; mulps %xmm5,%xmm2 @@ -46544,7 +46544,7 @@ _sk_rgb_to_hsl_sse2 LABEL PROC DB 15,86,233 ; orps %xmm1,%xmm5 DB 15,40,77,216 ; movaps -0x28(%ebp),%xmm1 DB 15,94,205 ; divps %xmm5,%xmm1 - DB 15,89,128,67,171,0,0 ; mulps 0xab43(%eax),%xmm0 + DB 15,89,128,35,171,0,0 ; mulps 0xab23(%eax),%xmm0 DB 15,84,196 ; andps %xmm4,%xmm0 DB 15,84,204 ; andps %xmm4,%xmm1 DB 139,69,12 ; mov 0xc(%ebp),%eax @@ -46567,7 +46567,7 @@ _sk_hsl_to_rgb_sse2 LABEL PROC DB 15,41,69,184 ; movaps %xmm0,-0x48(%ebp) DB 232,0,0,0,0 ; call 2458 <_sk_hsl_to_rgb_sse2+0x19> DB 88 ; pop %eax - DB 15,40,160,136,168,0,0 ; movaps 0xa888(%eax),%xmm4 + DB 15,40,160,104,168,0,0 ; movaps 0xa868(%eax),%xmm4 DB 15,40,220 ; movaps %xmm4,%xmm3 DB 15,41,165,104,255,255,255 ; movaps %xmm4,-0x98(%ebp) DB 15,194,218,2 ; cmpleps %xmm2,%xmm3 @@ -46580,13 +46580,13 @@ _sk_hsl_to_rgb_sse2 LABEL PROC DB 15,84,243 ; andps %xmm3,%xmm6 DB 15,85,217 ; andnps %xmm1,%xmm3 DB 15,86,222 ; orps %xmm6,%xmm3 - DB 15,40,168,88,170,0,0 ; movaps 0xaa58(%eax),%xmm5 + DB 15,40,168,56,170,0,0 ; movaps 0xaa38(%eax),%xmm5 DB 15,88,232 ; addps %xmm0,%xmm5 DB 243,15,91,205 ; cvttps2dq %xmm5,%xmm1 DB 15,91,201 ; cvtdq2ps %xmm1,%xmm1 DB 15,40,197 ; movaps %xmm5,%xmm0 DB 15,194,193,1 ; cmpltps %xmm1,%xmm0 - DB 15,40,176,152,168,0,0 ; movaps 0xa898(%eax),%xmm6 + DB 15,40,176,120,168,0,0 ; movaps 0xa878(%eax),%xmm6 DB 15,41,117,136 ; movaps %xmm6,-0x78(%ebp) DB 15,84,198 ; andps %xmm6,%xmm0 DB 15,92,200 ; subps %xmm0,%xmm1 @@ -46596,19 +46596,19 @@ _sk_hsl_to_rgb_sse2 LABEL PROC DB 15,41,93,216 ; movaps %xmm3,-0x28(%ebp) DB 15,88,210 ; addps %xmm2,%xmm2 DB 15,92,211 ; subps %xmm3,%xmm2 - DB 15,40,184,104,170,0,0 ; movaps 0xaa68(%eax),%xmm7 + DB 15,40,184,72,170,0,0 ; movaps 0xaa48(%eax),%xmm7 DB 15,41,189,88,255,255,255 ; movaps %xmm7,-0xa8(%ebp) DB 15,194,253,2 ; cmpleps %xmm5,%xmm7 DB 15,92,218 ; subps %xmm2,%xmm3 DB 15,41,93,200 ; movaps %xmm3,-0x38(%ebp) DB 15,40,204 ; movaps %xmm4,%xmm1 DB 15,194,205,2 ; cmpleps %xmm5,%xmm1 - DB 15,40,160,72,170,0,0 ; movaps 0xaa48(%eax),%xmm4 + DB 15,40,160,40,170,0,0 ; movaps 0xaa28(%eax),%xmm4 DB 15,41,165,120,255,255,255 ; movaps %xmm4,-0x88(%ebp) DB 15,194,229,2 ; cmpleps %xmm5,%xmm4 - DB 15,40,176,24,170,0,0 ; movaps 0xaa18(%eax),%xmm6 + DB 15,40,176,248,169,0,0 ; movaps 0xa9f8(%eax),%xmm6 DB 15,89,238 ; mulps %xmm6,%xmm5 - DB 15,40,128,56,170,0,0 ; movaps 0xaa38(%eax),%xmm0 + DB 15,40,128,24,170,0,0 ; movaps 0xaa18(%eax),%xmm0 DB 15,41,69,168 ; movaps %xmm0,-0x58(%ebp) DB 15,92,197 ; subps %xmm5,%xmm0 DB 15,89,195 ; mulps %xmm3,%xmm0 @@ -46634,18 +46634,18 @@ _sk_hsl_to_rgb_sse2 LABEL PROC DB 15,91,192 ; cvtdq2ps %xmm0,%xmm0 DB 15,40,203 ; movaps %xmm3,%xmm1 DB 15,194,200,1 ; cmpltps %xmm0,%xmm1 - DB 15,84,136,152,168,0,0 ; andps 0xa898(%eax),%xmm1 + DB 15,84,136,120,168,0,0 ; andps 0xa878(%eax),%xmm1 DB 15,92,193 ; subps %xmm1,%xmm0 DB 15,40,203 ; movaps %xmm3,%xmm1 DB 15,92,200 ; subps %xmm0,%xmm1 - DB 15,40,128,104,170,0,0 ; movaps 0xaa68(%eax),%xmm0 + DB 15,40,128,72,170,0,0 ; movaps 0xaa48(%eax),%xmm0 DB 15,194,193,2 ; cmpleps %xmm1,%xmm0 - DB 15,40,152,136,168,0,0 ; movaps 0xa888(%eax),%xmm3 + DB 15,40,152,104,168,0,0 ; movaps 0xa868(%eax),%xmm3 DB 15,194,217,2 ; cmpleps %xmm1,%xmm3 - DB 15,40,160,72,170,0,0 ; movaps 0xaa48(%eax),%xmm4 + DB 15,40,160,40,170,0,0 ; movaps 0xaa28(%eax),%xmm4 DB 15,194,225,2 ; cmpleps %xmm1,%xmm4 DB 15,89,206 ; mulps %xmm6,%xmm1 - DB 15,40,168,56,170,0,0 ; movaps 0xaa38(%eax),%xmm5 + DB 15,40,168,24,170,0,0 ; movaps 0xaa18(%eax),%xmm5 DB 15,92,233 ; subps %xmm1,%xmm5 DB 15,89,239 ; mulps %xmm7,%xmm5 DB 15,88,234 ; addps %xmm2,%xmm5 @@ -46665,7 +46665,7 @@ _sk_hsl_to_rgb_sse2 LABEL PROC DB 15,40,125,232 ; movaps -0x18(%ebp),%xmm7 DB 15,85,252 ; andnps %xmm4,%xmm7 DB 15,40,93,184 ; movaps -0x48(%ebp),%xmm3 - DB 15,88,152,120,170,0,0 ; addps 0xaa78(%eax),%xmm3 + DB 15,88,152,88,170,0,0 ; addps 0xaa58(%eax),%xmm3 DB 243,15,91,195 ; cvttps2dq %xmm3,%xmm0 DB 15,91,192 ; cvtdq2ps %xmm0,%xmm0 DB 15,40,203 ; movaps %xmm3,%xmm1 @@ -46763,9 +46763,9 @@ _sk_scale_u8_sse2 LABEL PROC DB 102,15,110,36,62 ; movd (%esi,%edi,1),%xmm4 DB 102,15,96,224 ; punpcklbw %xmm0,%xmm4 DB 102,15,97,224 ; punpcklwd %xmm0,%xmm4 - DB 102,15,219,162,222,166,0,0 ; pand 0xa6de(%edx),%xmm4 + DB 102,15,219,162,190,166,0,0 ; pand 0xa6be(%edx),%xmm4 DB 15,91,228 ; cvtdq2ps %xmm4,%xmm4 - DB 15,89,162,14,168,0,0 ; mulps 0xa80e(%edx),%xmm4 + DB 15,89,162,238,167,0,0 ; mulps 0xa7ee(%edx),%xmm4 DB 15,89,196 ; mulps %xmm4,%xmm0 DB 15,89,204 ; mulps %xmm4,%xmm1 DB 15,89,212 ; mulps %xmm4,%xmm2 @@ -46829,17 +46829,17 @@ _sk_scale_565_sse2 LABEL PROC DB 15,133,157,0,0,0 ; jne 284a <_sk_scale_565_sse2+0xd8> DB 243,15,126,52,126 ; movq (%esi,%edi,2),%xmm6 DB 102,15,97,240 ; punpcklwd %xmm0,%xmm6 - DB 102,15,111,162,100,167,0,0 ; movdqa 0xa764(%edx),%xmm4 + DB 102,15,111,162,68,167,0,0 ; movdqa 0xa744(%edx),%xmm4 DB 102,15,219,230 ; pand %xmm6,%xmm4 DB 15,91,212 ; cvtdq2ps %xmm4,%xmm2 - DB 15,89,146,116,167,0,0 ; mulps 0xa774(%edx),%xmm2 - DB 102,15,111,170,132,167,0,0 ; movdqa 0xa784(%edx),%xmm5 + DB 15,89,146,84,167,0,0 ; mulps 0xa754(%edx),%xmm2 + DB 102,15,111,170,100,167,0,0 ; movdqa 0xa764(%edx),%xmm5 DB 102,15,219,238 ; pand %xmm6,%xmm5 DB 15,91,237 ; cvtdq2ps %xmm5,%xmm5 - DB 15,89,170,148,167,0,0 ; mulps 0xa794(%edx),%xmm5 - DB 102,15,219,178,164,167,0,0 ; pand 0xa7a4(%edx),%xmm6 + DB 15,89,170,116,167,0,0 ; mulps 0xa774(%edx),%xmm5 + DB 102,15,219,178,132,167,0,0 ; pand 0xa784(%edx),%xmm6 DB 15,91,246 ; cvtdq2ps %xmm6,%xmm6 - DB 15,89,178,180,167,0,0 ; mulps 0xa7b4(%edx),%xmm6 + DB 15,89,178,148,167,0,0 ; mulps 0xa794(%edx),%xmm6 DB 15,40,253 ; movaps %xmm5,%xmm7 DB 15,93,254 ; minps %xmm6,%xmm7 DB 15,40,226 ; movaps %xmm2,%xmm4 @@ -46949,9 +46949,9 @@ _sk_lerp_u8_sse2 LABEL PROC DB 102,15,110,36,62 ; movd (%esi,%edi,1),%xmm4 DB 102,15,96,224 ; punpcklbw %xmm0,%xmm4 DB 102,15,97,224 ; punpcklwd %xmm0,%xmm4 - DB 102,15,219,162,182,164,0,0 ; pand 0xa4b6(%edx),%xmm4 + DB 102,15,219,162,150,164,0,0 ; pand 0xa496(%edx),%xmm4 DB 15,91,228 ; cvtdq2ps %xmm4,%xmm4 - DB 15,89,162,230,165,0,0 ; mulps 0xa5e6(%edx),%xmm4 + DB 15,89,162,198,165,0,0 ; mulps 0xa5c6(%edx),%xmm4 DB 15,40,105,16 ; movaps 0x10(%ecx),%xmm5 DB 15,40,113,32 ; movaps 0x20(%ecx),%xmm6 DB 15,92,197 ; subps %xmm5,%xmm0 @@ -47027,17 +47027,17 @@ _sk_lerp_565_sse2 LABEL PROC DB 15,133,211,0,0,0 ; jne 2ad8 <_sk_lerp_565_sse2+0x113> DB 243,15,126,44,126 ; movq (%esi,%edi,2),%xmm5 DB 102,15,97,232 ; punpcklwd %xmm0,%xmm5 - DB 102,15,111,162,12,165,0,0 ; movdqa 0xa50c(%edx),%xmm4 + DB 102,15,111,162,236,164,0,0 ; movdqa 0xa4ec(%edx),%xmm4 DB 102,15,219,229 ; pand %xmm5,%xmm4 DB 15,91,204 ; cvtdq2ps %xmm4,%xmm1 - DB 15,89,138,28,165,0,0 ; mulps 0xa51c(%edx),%xmm1 - DB 102,15,111,178,44,165,0,0 ; movdqa 0xa52c(%edx),%xmm6 + DB 15,89,138,252,164,0,0 ; mulps 0xa4fc(%edx),%xmm1 + DB 102,15,111,178,12,165,0,0 ; movdqa 0xa50c(%edx),%xmm6 DB 102,15,219,245 ; pand %xmm5,%xmm6 DB 15,91,246 ; cvtdq2ps %xmm6,%xmm6 - DB 15,89,178,60,165,0,0 ; mulps 0xa53c(%edx),%xmm6 - DB 102,15,219,170,76,165,0,0 ; pand 0xa54c(%edx),%xmm5 + DB 15,89,178,28,165,0,0 ; mulps 0xa51c(%edx),%xmm6 + DB 102,15,219,170,44,165,0,0 ; pand 0xa52c(%edx),%xmm5 DB 15,91,213 ; cvtdq2ps %xmm5,%xmm2 - DB 15,89,146,92,165,0,0 ; mulps 0xa55c(%edx),%xmm2 + DB 15,89,146,60,165,0,0 ; mulps 0xa53c(%edx),%xmm2 DB 15,40,218 ; movaps %xmm2,%xmm3 DB 15,41,93,200 ; movaps %xmm3,-0x38(%ebp) DB 15,40,254 ; movaps %xmm6,%xmm7 @@ -47114,16 +47114,16 @@ _sk_load_tables_sse2 LABEL PROC DB 131,236,12 ; sub $0xc,%esp DB 232,0,0,0,0 ; call 2b2e <_sk_load_tables_sse2+0xe> DB 90 ; pop %edx - DB 139,117,12 ; mov 0xc(%ebp),%esi + DB 139,69,12 ; mov 0xc(%ebp),%eax DB 139,77,8 ; mov 0x8(%ebp),%ecx - DB 139,57 ; mov (%ecx),%edi + DB 139,48 ; mov (%eax),%esi DB 139,65,8 ; mov 0x8(%ecx),%eax DB 133,192 ; test %eax,%eax - DB 139,54 ; mov (%esi),%esi + DB 139,57 ; mov (%ecx),%edi DB 139,30 ; mov (%esi),%ebx DB 15,133,22,1,0,0 ; jne 2c5c <_sk_load_tables_sse2+0x13c> DB 243,15,111,28,187 ; movdqu (%ebx,%edi,4),%xmm3 - DB 102,15,111,146,130,162,0,0 ; movdqa 0xa282(%edx),%xmm2 + DB 102,15,111,146,98,162,0,0 ; movdqa 0xa262(%edx),%xmm2 DB 102,15,111,195 ; movdqa %xmm3,%xmm0 DB 102,15,219,194 ; pand %xmm2,%xmm0 DB 102,15,112,200,78 ; pshufd $0x4e,%xmm0,%xmm1 @@ -47179,7 +47179,7 @@ _sk_load_tables_sse2 LABEL PROC DB 102,15,20,215 ; unpcklpd %xmm7,%xmm2 DB 102,15,114,211,24 ; psrld $0x18,%xmm3 DB 15,91,219 ; cvtdq2ps %xmm3,%xmm3 - DB 15,89,154,178,163,0,0 ; mulps 0xa3b2(%edx),%xmm3 + DB 15,89,154,146,163,0,0 ; mulps 0xa392(%edx),%xmm3 DB 139,69,12 ; mov 0xc(%ebp),%eax DB 137,194 ; mov %eax,%edx DB 141,66,8 ; lea 0x8(%edx),%eax @@ -47218,17 +47218,17 @@ _sk_load_tables_u16_be_sse2 LABEL PROC DB 131,236,44 ; sub $0x2c,%esp DB 232,0,0,0,0 ; call 2c9f <_sk_load_tables_u16_be_sse2+0xe> DB 90 ; pop %edx - DB 139,69,12 ; mov 0xc(%ebp),%eax + DB 139,117,12 ; mov 0xc(%ebp),%esi DB 139,77,8 ; mov 0x8(%ebp),%ecx DB 139,57 ; mov (%ecx),%edi - DB 139,89,8 ; mov 0x8(%ecx),%ebx + DB 139,65,8 ; mov 0x8(%ecx),%eax DB 193,231,2 ; shl $0x2,%edi - DB 133,219 ; test %ebx,%ebx - DB 139,48 ; mov (%eax),%esi - DB 139,6 ; mov (%esi),%eax + DB 133,192 ; test %eax,%eax + DB 139,54 ; mov (%esi),%esi + DB 139,30 ; mov (%esi),%ebx DB 15,133,210,1,0,0 ; jne 2e8c <_sk_load_tables_u16_be_sse2+0x1fb> - DB 102,15,16,4,120 ; movupd (%eax,%edi,2),%xmm0 - DB 243,15,111,76,120,16 ; movdqu 0x10(%eax,%edi,2),%xmm1 + DB 102,15,16,4,123 ; movupd (%ebx,%edi,2),%xmm0 + DB 243,15,111,76,123,16 ; movdqu 0x10(%ebx,%edi,2),%xmm1 DB 102,15,40,216 ; movapd %xmm0,%xmm3 DB 102,15,97,217 ; punpcklwd %xmm1,%xmm3 DB 102,15,105,193 ; punpckhwd %xmm1,%xmm0 @@ -47252,7 +47252,7 @@ _sk_load_tables_u16_be_sse2 LABEL PROC DB 242,15,112,192,232 ; pshuflw $0xe8,%xmm0,%xmm0 DB 243,15,112,192,232 ; pshufhw $0xe8,%xmm0,%xmm0 DB 102,15,112,192,232 ; pshufd $0xe8,%xmm0,%xmm0 - DB 102,15,111,146,177,162,0,0 ; movdqa 0xa2b1(%edx),%xmm2 + DB 102,15,111,146,145,162,0,0 ; movdqa 0xa291(%edx),%xmm2 DB 102,15,219,194 ; pand %xmm2,%xmm0 DB 102,15,239,228 ; pxor %xmm4,%xmm4 DB 102,15,97,196 ; punpcklwd %xmm4,%xmm0 @@ -47324,7 +47324,7 @@ _sk_load_tables_u16_be_sse2 LABEL PROC DB 243,15,126,93,232 ; movq -0x18(%ebp),%xmm3 DB 102,15,97,220 ; punpcklwd %xmm4,%xmm3 DB 15,91,219 ; cvtdq2ps %xmm3,%xmm3 - DB 15,89,154,193,162,0,0 ; mulps 0xa2c1(%edx),%xmm3 + DB 15,89,154,161,162,0,0 ; mulps 0xa2a1(%edx),%xmm3 DB 139,69,12 ; mov 0xc(%ebp),%eax DB 137,194 ; mov %eax,%edx DB 141,66,8 ; lea 0x8(%edx),%eax @@ -47338,14 +47338,14 @@ _sk_load_tables_u16_be_sse2 LABEL PROC DB 91 ; pop %ebx DB 93 ; pop %ebp DB 195 ; ret - DB 242,15,16,4,120 ; movsd (%eax,%edi,2),%xmm0 + DB 242,15,16,4,123 ; movsd (%ebx,%edi,2),%xmm0 DB 102,15,239,201 ; pxor %xmm1,%xmm1 - DB 131,251,1 ; cmp $0x1,%ebx + DB 131,248,1 ; cmp $0x1,%eax DB 15,132,39,254,255,255 ; je 2cc5 <_sk_load_tables_u16_be_sse2+0x34> - DB 102,15,22,68,120,8 ; movhpd 0x8(%eax,%edi,2),%xmm0 - DB 131,251,3 ; cmp $0x3,%ebx + DB 102,15,22,68,123,8 ; movhpd 0x8(%ebx,%edi,2),%xmm0 + DB 131,248,3 ; cmp $0x3,%eax DB 15,130,24,254,255,255 ; jb 2cc5 <_sk_load_tables_u16_be_sse2+0x34> - DB 243,15,126,76,120,16 ; movq 0x10(%eax,%edi,2),%xmm1 + DB 243,15,126,76,123,16 ; movq 0x10(%ebx,%edi,2),%xmm1 DB 233,13,254,255,255 ; jmp 2cc5 <_sk_load_tables_u16_be_sse2+0x34> PUBLIC _sk_load_tables_rgb_u16_be_sse2 @@ -47395,7 +47395,7 @@ _sk_load_tables_rgb_u16_be_sse2 LABEL PROC DB 242,15,112,194,232 ; pshuflw $0xe8,%xmm2,%xmm0 DB 243,15,112,192,232 ; pshufhw $0xe8,%xmm0,%xmm0 DB 102,15,112,192,232 ; pshufd $0xe8,%xmm0,%xmm0 - DB 102,15,111,146,138,160,0,0 ; movdqa 0xa08a(%edx),%xmm2 + DB 102,15,111,146,106,160,0,0 ; movdqa 0xa06a(%edx),%xmm2 DB 102,15,219,194 ; pand %xmm2,%xmm0 DB 102,15,239,219 ; pxor %xmm3,%xmm3 DB 102,15,97,195 ; punpcklwd %xmm3,%xmm0 @@ -47460,7 +47460,7 @@ _sk_load_tables_rgb_u16_be_sse2 LABEL PROC DB 137,198 ; mov %eax,%esi DB 141,70,8 ; lea 0x8(%esi),%eax DB 131,236,8 ; sub $0x8,%esp - DB 15,40,154,42,158,0,0 ; movaps 0x9e2a(%edx),%xmm3 + DB 15,40,154,10,158,0,0 ; movaps 0x9e0a(%edx),%xmm3 DB 80 ; push %eax DB 81 ; push %ecx DB 255,86,4 ; call *0x4(%esi) @@ -47501,7 +47501,7 @@ _sk_byte_tables_sse2 LABEL PROC DB 90 ; pop %edx DB 139,69,12 ; mov 0xc(%ebp),%eax DB 139,8 ; mov (%eax),%ecx - DB 15,40,162,205,156,0,0 ; movaps 0x9ccd(%edx),%xmm4 + DB 15,40,162,173,156,0,0 ; movaps 0x9cad(%edx),%xmm4 DB 15,89,196 ; mulps %xmm4,%xmm0 DB 102,15,91,192 ; cvtps2dq %xmm0,%xmm0 DB 102,15,112,232,78 ; pshufd $0x4e,%xmm0,%xmm5 @@ -47523,7 +47523,7 @@ _sk_byte_tables_sse2 LABEL PROC DB 102,15,110,192 ; movd %eax,%xmm0 DB 139,65,4 ; mov 0x4(%ecx),%eax DB 102,15,196,195,1 ; pinsrw $0x1,%ebx,%xmm0 - DB 15,40,170,237,157,0,0 ; movaps 0x9ded(%edx),%xmm5 + DB 15,40,170,205,157,0,0 ; movaps 0x9dcd(%edx),%xmm5 DB 15,89,204 ; mulps %xmm4,%xmm1 DB 102,15,91,201 ; cvtps2dq %xmm1,%xmm1 DB 102,15,112,241,78 ; pshufd $0x4e,%xmm1,%xmm6 @@ -47651,7 +47651,7 @@ _sk_byte_tables_rgb_sse2 LABEL PROC DB 102,15,110,199 ; movd %edi,%xmm0 DB 139,121,4 ; mov 0x4(%ecx),%edi DB 102,15,196,198,1 ; pinsrw $0x1,%esi,%xmm0 - DB 15,40,170,241,155,0,0 ; movaps 0x9bf1(%edx),%xmm5 + DB 15,40,170,209,155,0,0 ; movaps 0x9bd1(%edx),%xmm5 DB 15,89,204 ; mulps %xmm4,%xmm1 DB 102,15,91,201 ; cvtps2dq %xmm1,%xmm1 DB 102,15,112,241,78 ; pshufd $0x4e,%xmm1,%xmm6 @@ -47897,15 +47897,15 @@ _sk_parametric_r_sse2 LABEL PROC DB 15,198,237,0 ; shufps $0x0,%xmm5,%xmm5 DB 15,88,245 ; addps %xmm5,%xmm6 DB 15,91,238 ; cvtdq2ps %xmm6,%xmm5 - DB 15,89,170,177,153,0,0 ; mulps 0x99b1(%edx),%xmm5 - DB 15,84,178,193,153,0,0 ; andps 0x99c1(%edx),%xmm6 - DB 15,86,178,33,151,0,0 ; orps 0x9721(%edx),%xmm6 - DB 15,88,170,209,153,0,0 ; addps 0x99d1(%edx),%xmm5 - DB 15,40,186,225,153,0,0 ; movaps 0x99e1(%edx),%xmm7 + DB 15,89,170,145,153,0,0 ; mulps 0x9991(%edx),%xmm5 + DB 15,84,178,161,153,0,0 ; andps 0x99a1(%edx),%xmm6 + DB 15,86,178,1,151,0,0 ; orps 0x9701(%edx),%xmm6 + DB 15,88,170,177,153,0,0 ; addps 0x99b1(%edx),%xmm5 + DB 15,40,186,193,153,0,0 ; movaps 0x99c1(%edx),%xmm7 DB 15,89,254 ; mulps %xmm6,%xmm7 DB 15,92,239 ; subps %xmm7,%xmm5 - DB 15,88,178,241,153,0,0 ; addps 0x99f1(%edx),%xmm6 - DB 15,40,186,1,154,0,0 ; movaps 0x9a01(%edx),%xmm7 + DB 15,88,178,209,153,0,0 ; addps 0x99d1(%edx),%xmm6 + DB 15,40,186,225,153,0,0 ; movaps 0x99e1(%edx),%xmm7 DB 15,94,254 ; divps %xmm6,%xmm7 DB 243,15,16,49 ; movss (%ecx),%xmm6 DB 15,198,246,0 ; shufps $0x0,%xmm6,%xmm6 @@ -47915,21 +47915,21 @@ _sk_parametric_r_sse2 LABEL PROC DB 15,91,254 ; cvtdq2ps %xmm6,%xmm7 DB 15,40,197 ; movaps %xmm5,%xmm0 DB 15,194,199,1 ; cmpltps %xmm7,%xmm0 - DB 15,40,178,49,151,0,0 ; movaps 0x9731(%edx),%xmm6 + DB 15,40,178,17,151,0,0 ; movaps 0x9711(%edx),%xmm6 DB 15,84,198 ; andps %xmm6,%xmm0 DB 15,92,248 ; subps %xmm0,%xmm7 DB 15,40,197 ; movaps %xmm5,%xmm0 DB 15,92,199 ; subps %xmm7,%xmm0 - DB 15,88,170,17,154,0,0 ; addps 0x9a11(%edx),%xmm5 - DB 15,40,186,33,154,0,0 ; movaps 0x9a21(%edx),%xmm7 + DB 15,88,170,241,153,0,0 ; addps 0x99f1(%edx),%xmm5 + DB 15,40,186,1,154,0,0 ; movaps 0x9a01(%edx),%xmm7 DB 15,89,248 ; mulps %xmm0,%xmm7 DB 15,92,239 ; subps %xmm7,%xmm5 - DB 15,40,186,49,154,0,0 ; movaps 0x9a31(%edx),%xmm7 + DB 15,40,186,17,154,0,0 ; movaps 0x9a11(%edx),%xmm7 DB 15,92,248 ; subps %xmm0,%xmm7 - DB 15,40,130,65,154,0,0 ; movaps 0x9a41(%edx),%xmm0 + DB 15,40,130,33,154,0,0 ; movaps 0x9a21(%edx),%xmm0 DB 15,94,199 ; divps %xmm7,%xmm0 DB 15,88,197 ; addps %xmm5,%xmm0 - DB 15,89,130,81,154,0,0 ; mulps 0x9a51(%edx),%xmm0 + DB 15,89,130,49,154,0,0 ; mulps 0x9a31(%edx),%xmm0 DB 102,15,91,192 ; cvtps2dq %xmm0,%xmm0 DB 243,15,16,105,20 ; movss 0x14(%ecx),%xmm5 DB 15,198,237,0 ; shufps $0x0,%xmm5,%xmm5 @@ -47981,15 +47981,15 @@ _sk_parametric_g_sse2 LABEL PROC DB 15,198,237,0 ; shufps $0x0,%xmm5,%xmm5 DB 15,88,245 ; addps %xmm5,%xmm6 DB 15,91,238 ; cvtdq2ps %xmm6,%xmm5 - DB 15,89,170,122,152,0,0 ; mulps 0x987a(%edx),%xmm5 - DB 15,84,178,138,152,0,0 ; andps 0x988a(%edx),%xmm6 - DB 15,86,178,234,149,0,0 ; orps 0x95ea(%edx),%xmm6 - DB 15,88,170,154,152,0,0 ; addps 0x989a(%edx),%xmm5 - DB 15,40,186,170,152,0,0 ; movaps 0x98aa(%edx),%xmm7 + DB 15,89,170,90,152,0,0 ; mulps 0x985a(%edx),%xmm5 + DB 15,84,178,106,152,0,0 ; andps 0x986a(%edx),%xmm6 + DB 15,86,178,202,149,0,0 ; orps 0x95ca(%edx),%xmm6 + DB 15,88,170,122,152,0,0 ; addps 0x987a(%edx),%xmm5 + DB 15,40,186,138,152,0,0 ; movaps 0x988a(%edx),%xmm7 DB 15,89,254 ; mulps %xmm6,%xmm7 DB 15,92,239 ; subps %xmm7,%xmm5 - DB 15,88,178,186,152,0,0 ; addps 0x98ba(%edx),%xmm6 - DB 15,40,186,202,152,0,0 ; movaps 0x98ca(%edx),%xmm7 + DB 15,88,178,154,152,0,0 ; addps 0x989a(%edx),%xmm6 + DB 15,40,186,170,152,0,0 ; movaps 0x98aa(%edx),%xmm7 DB 15,94,254 ; divps %xmm6,%xmm7 DB 243,15,16,49 ; movss (%ecx),%xmm6 DB 15,198,246,0 ; shufps $0x0,%xmm6,%xmm6 @@ -47999,21 +47999,21 @@ _sk_parametric_g_sse2 LABEL PROC DB 15,91,254 ; cvtdq2ps %xmm6,%xmm7 DB 15,40,197 ; movaps %xmm5,%xmm0 DB 15,194,199,1 ; cmpltps %xmm7,%xmm0 - DB 15,40,178,250,149,0,0 ; movaps 0x95fa(%edx),%xmm6 + DB 15,40,178,218,149,0,0 ; movaps 0x95da(%edx),%xmm6 DB 15,84,198 ; andps %xmm6,%xmm0 DB 15,92,248 ; subps %xmm0,%xmm7 DB 15,40,197 ; movaps %xmm5,%xmm0 DB 15,92,199 ; subps %xmm7,%xmm0 - DB 15,88,170,218,152,0,0 ; addps 0x98da(%edx),%xmm5 - DB 15,40,186,234,152,0,0 ; movaps 0x98ea(%edx),%xmm7 + DB 15,88,170,186,152,0,0 ; addps 0x98ba(%edx),%xmm5 + DB 15,40,186,202,152,0,0 ; movaps 0x98ca(%edx),%xmm7 DB 15,89,248 ; mulps %xmm0,%xmm7 DB 15,92,239 ; subps %xmm7,%xmm5 - DB 15,40,186,250,152,0,0 ; movaps 0x98fa(%edx),%xmm7 + DB 15,40,186,218,152,0,0 ; movaps 0x98da(%edx),%xmm7 DB 15,92,248 ; subps %xmm0,%xmm7 - DB 15,40,130,10,153,0,0 ; movaps 0x990a(%edx),%xmm0 + DB 15,40,130,234,152,0,0 ; movaps 0x98ea(%edx),%xmm0 DB 15,94,199 ; divps %xmm7,%xmm0 DB 15,88,197 ; addps %xmm5,%xmm0 - DB 15,89,130,26,153,0,0 ; mulps 0x991a(%edx),%xmm0 + DB 15,89,130,250,152,0,0 ; mulps 0x98fa(%edx),%xmm0 DB 102,15,91,192 ; cvtps2dq %xmm0,%xmm0 DB 243,15,16,105,20 ; movss 0x14(%ecx),%xmm5 DB 15,198,237,0 ; shufps $0x0,%xmm5,%xmm5 @@ -48064,15 +48064,15 @@ _sk_parametric_b_sse2 LABEL PROC DB 15,198,237,0 ; shufps $0x0,%xmm5,%xmm5 DB 15,88,245 ; addps %xmm5,%xmm6 DB 15,91,238 ; cvtdq2ps %xmm6,%xmm5 - DB 15,89,170,70,151,0,0 ; mulps 0x9746(%edx),%xmm5 - DB 15,84,178,86,151,0,0 ; andps 0x9756(%edx),%xmm6 - DB 15,86,178,182,148,0,0 ; orps 0x94b6(%edx),%xmm6 - DB 15,88,170,102,151,0,0 ; addps 0x9766(%edx),%xmm5 - DB 15,40,186,118,151,0,0 ; movaps 0x9776(%edx),%xmm7 + DB 15,89,170,38,151,0,0 ; mulps 0x9726(%edx),%xmm5 + DB 15,84,178,54,151,0,0 ; andps 0x9736(%edx),%xmm6 + DB 15,86,178,150,148,0,0 ; orps 0x9496(%edx),%xmm6 + DB 15,88,170,70,151,0,0 ; addps 0x9746(%edx),%xmm5 + DB 15,40,186,86,151,0,0 ; movaps 0x9756(%edx),%xmm7 DB 15,89,254 ; mulps %xmm6,%xmm7 DB 15,92,239 ; subps %xmm7,%xmm5 - DB 15,88,178,134,151,0,0 ; addps 0x9786(%edx),%xmm6 - DB 15,40,186,150,151,0,0 ; movaps 0x9796(%edx),%xmm7 + DB 15,88,178,102,151,0,0 ; addps 0x9766(%edx),%xmm6 + DB 15,40,186,118,151,0,0 ; movaps 0x9776(%edx),%xmm7 DB 15,94,254 ; divps %xmm6,%xmm7 DB 243,15,16,49 ; movss (%ecx),%xmm6 DB 15,198,246,0 ; shufps $0x0,%xmm6,%xmm6 @@ -48082,21 +48082,21 @@ _sk_parametric_b_sse2 LABEL PROC DB 15,91,254 ; cvtdq2ps %xmm6,%xmm7 DB 15,40,197 ; movaps %xmm5,%xmm0 DB 15,194,199,1 ; cmpltps %xmm7,%xmm0 - DB 15,40,178,198,148,0,0 ; movaps 0x94c6(%edx),%xmm6 + DB 15,40,178,166,148,0,0 ; movaps 0x94a6(%edx),%xmm6 DB 15,84,198 ; andps %xmm6,%xmm0 DB 15,92,248 ; subps %xmm0,%xmm7 DB 15,40,197 ; movaps %xmm5,%xmm0 DB 15,92,199 ; subps %xmm7,%xmm0 - DB 15,88,170,166,151,0,0 ; addps 0x97a6(%edx),%xmm5 - DB 15,40,186,182,151,0,0 ; movaps 0x97b6(%edx),%xmm7 + DB 15,88,170,134,151,0,0 ; addps 0x9786(%edx),%xmm5 + DB 15,40,186,150,151,0,0 ; movaps 0x9796(%edx),%xmm7 DB 15,89,248 ; mulps %xmm0,%xmm7 DB 15,92,239 ; subps %xmm7,%xmm5 - DB 15,40,186,198,151,0,0 ; movaps 0x97c6(%edx),%xmm7 + DB 15,40,186,166,151,0,0 ; movaps 0x97a6(%edx),%xmm7 DB 15,92,248 ; subps %xmm0,%xmm7 - DB 15,40,130,214,151,0,0 ; movaps 0x97d6(%edx),%xmm0 + DB 15,40,130,182,151,0,0 ; movaps 0x97b6(%edx),%xmm0 DB 15,94,199 ; divps %xmm7,%xmm0 DB 15,88,197 ; addps %xmm5,%xmm0 - DB 15,89,130,230,151,0,0 ; mulps 0x97e6(%edx),%xmm0 + DB 15,89,130,198,151,0,0 ; mulps 0x97c6(%edx),%xmm0 DB 102,15,91,192 ; cvtps2dq %xmm0,%xmm0 DB 243,15,16,105,20 ; movss 0x14(%ecx),%xmm5 DB 15,198,237,0 ; shufps $0x0,%xmm5,%xmm5 @@ -48147,15 +48147,15 @@ _sk_parametric_a_sse2 LABEL PROC DB 15,198,237,0 ; shufps $0x0,%xmm5,%xmm5 DB 15,88,245 ; addps %xmm5,%xmm6 DB 15,91,238 ; cvtdq2ps %xmm6,%xmm5 - DB 15,89,170,18,150,0,0 ; mulps 0x9612(%edx),%xmm5 - DB 15,84,178,34,150,0,0 ; andps 0x9622(%edx),%xmm6 - DB 15,86,178,130,147,0,0 ; orps 0x9382(%edx),%xmm6 - DB 15,88,170,50,150,0,0 ; addps 0x9632(%edx),%xmm5 - DB 15,40,186,66,150,0,0 ; movaps 0x9642(%edx),%xmm7 + DB 15,89,170,242,149,0,0 ; mulps 0x95f2(%edx),%xmm5 + DB 15,84,178,2,150,0,0 ; andps 0x9602(%edx),%xmm6 + DB 15,86,178,98,147,0,0 ; orps 0x9362(%edx),%xmm6 + DB 15,88,170,18,150,0,0 ; addps 0x9612(%edx),%xmm5 + DB 15,40,186,34,150,0,0 ; movaps 0x9622(%edx),%xmm7 DB 15,89,254 ; mulps %xmm6,%xmm7 DB 15,92,239 ; subps %xmm7,%xmm5 - DB 15,88,178,82,150,0,0 ; addps 0x9652(%edx),%xmm6 - DB 15,40,186,98,150,0,0 ; movaps 0x9662(%edx),%xmm7 + DB 15,88,178,50,150,0,0 ; addps 0x9632(%edx),%xmm6 + DB 15,40,186,66,150,0,0 ; movaps 0x9642(%edx),%xmm7 DB 15,94,254 ; divps %xmm6,%xmm7 DB 243,15,16,49 ; movss (%ecx),%xmm6 DB 15,198,246,0 ; shufps $0x0,%xmm6,%xmm6 @@ -48165,21 +48165,21 @@ _sk_parametric_a_sse2 LABEL PROC DB 15,91,254 ; cvtdq2ps %xmm6,%xmm7 DB 15,40,197 ; movaps %xmm5,%xmm0 DB 15,194,199,1 ; cmpltps %xmm7,%xmm0 - DB 15,40,178,146,147,0,0 ; movaps 0x9392(%edx),%xmm6 + DB 15,40,178,114,147,0,0 ; movaps 0x9372(%edx),%xmm6 DB 15,84,198 ; andps %xmm6,%xmm0 DB 15,92,248 ; subps %xmm0,%xmm7 DB 15,40,197 ; movaps %xmm5,%xmm0 DB 15,92,199 ; subps %xmm7,%xmm0 - DB 15,88,170,114,150,0,0 ; addps 0x9672(%edx),%xmm5 - DB 15,40,186,130,150,0,0 ; movaps 0x9682(%edx),%xmm7 + DB 15,88,170,82,150,0,0 ; addps 0x9652(%edx),%xmm5 + DB 15,40,186,98,150,0,0 ; movaps 0x9662(%edx),%xmm7 DB 15,89,248 ; mulps %xmm0,%xmm7 DB 15,92,239 ; subps %xmm7,%xmm5 - DB 15,40,186,146,150,0,0 ; movaps 0x9692(%edx),%xmm7 + DB 15,40,186,114,150,0,0 ; movaps 0x9672(%edx),%xmm7 DB 15,92,248 ; subps %xmm0,%xmm7 - DB 15,40,130,162,150,0,0 ; movaps 0x96a2(%edx),%xmm0 + DB 15,40,130,130,150,0,0 ; movaps 0x9682(%edx),%xmm0 DB 15,94,199 ; divps %xmm7,%xmm0 DB 15,88,197 ; addps %xmm5,%xmm0 - DB 15,89,130,178,150,0,0 ; mulps 0x96b2(%edx),%xmm0 + DB 15,89,130,146,150,0,0 ; mulps 0x9692(%edx),%xmm0 DB 102,15,91,192 ; cvtps2dq %xmm0,%xmm0 DB 243,15,16,105,20 ; movss 0x14(%ecx),%xmm5 DB 15,198,237,0 ; shufps $0x0,%xmm5,%xmm5 @@ -48212,15 +48212,15 @@ _sk_gamma_sse2 LABEL PROC DB 232,0,0,0,0 ; call 3a8f <_sk_gamma_sse2+0x12> DB 88 ; pop %eax DB 15,91,195 ; cvtdq2ps %xmm3,%xmm0 - DB 15,89,128,225,148,0,0 ; mulps 0x94e1(%eax),%xmm0 - DB 15,84,152,241,148,0,0 ; andps 0x94f1(%eax),%xmm3 - DB 15,86,152,81,146,0,0 ; orps 0x9251(%eax),%xmm3 - DB 15,88,128,1,149,0,0 ; addps 0x9501(%eax),%xmm0 + DB 15,89,128,193,148,0,0 ; mulps 0x94c1(%eax),%xmm0 + DB 15,84,152,209,148,0,0 ; andps 0x94d1(%eax),%xmm3 + DB 15,86,152,49,146,0,0 ; orps 0x9231(%eax),%xmm3 + DB 15,88,128,225,148,0,0 ; addps 0x94e1(%eax),%xmm0 DB 15,40,227 ; movaps %xmm3,%xmm4 - DB 15,89,160,17,149,0,0 ; mulps 0x9511(%eax),%xmm4 + DB 15,89,160,241,148,0,0 ; mulps 0x94f1(%eax),%xmm4 DB 15,92,196 ; subps %xmm4,%xmm0 - DB 15,88,152,33,149,0,0 ; addps 0x9521(%eax),%xmm3 - DB 15,40,160,49,149,0,0 ; movaps 0x9531(%eax),%xmm4 + DB 15,88,152,1,149,0,0 ; addps 0x9501(%eax),%xmm3 + DB 15,40,160,17,149,0,0 ; movaps 0x9511(%eax),%xmm4 DB 15,94,227 ; divps %xmm3,%xmm4 DB 15,92,196 ; subps %xmm4,%xmm0 DB 139,77,12 ; mov 0xc(%ebp),%ecx @@ -48233,30 +48233,30 @@ _sk_gamma_sse2 LABEL PROC DB 15,91,219 ; cvtdq2ps %xmm3,%xmm3 DB 15,40,224 ; movaps %xmm0,%xmm4 DB 15,194,227,1 ; cmpltps %xmm3,%xmm4 - DB 15,84,160,97,146,0,0 ; andps 0x9261(%eax),%xmm4 + DB 15,84,160,65,146,0,0 ; andps 0x9241(%eax),%xmm4 DB 15,92,220 ; subps %xmm4,%xmm3 DB 15,40,224 ; movaps %xmm0,%xmm4 DB 15,92,227 ; subps %xmm3,%xmm4 - DB 15,88,128,65,149,0,0 ; addps 0x9541(%eax),%xmm0 - DB 15,40,176,97,149,0,0 ; movaps 0x9561(%eax),%xmm6 + DB 15,88,128,33,149,0,0 ; addps 0x9521(%eax),%xmm0 + DB 15,40,176,65,149,0,0 ; movaps 0x9541(%eax),%xmm6 DB 15,92,244 ; subps %xmm4,%xmm6 - DB 15,40,168,81,149,0,0 ; movaps 0x9551(%eax),%xmm5 + DB 15,40,168,49,149,0,0 ; movaps 0x9531(%eax),%xmm5 DB 15,89,229 ; mulps %xmm5,%xmm4 DB 15,92,196 ; subps %xmm4,%xmm0 - DB 15,40,152,113,149,0,0 ; movaps 0x9571(%eax),%xmm3 + DB 15,40,152,81,149,0,0 ; movaps 0x9551(%eax),%xmm3 DB 15,40,227 ; movaps %xmm3,%xmm4 DB 15,94,230 ; divps %xmm6,%xmm4 DB 15,88,224 ; addps %xmm0,%xmm4 DB 15,91,193 ; cvtdq2ps %xmm1,%xmm0 - DB 15,89,128,225,148,0,0 ; mulps 0x94e1(%eax),%xmm0 - DB 15,84,136,241,148,0,0 ; andps 0x94f1(%eax),%xmm1 - DB 15,86,136,81,146,0,0 ; orps 0x9251(%eax),%xmm1 - DB 15,88,128,1,149,0,0 ; addps 0x9501(%eax),%xmm0 + DB 15,89,128,193,148,0,0 ; mulps 0x94c1(%eax),%xmm0 + DB 15,84,136,209,148,0,0 ; andps 0x94d1(%eax),%xmm1 + DB 15,86,136,49,146,0,0 ; orps 0x9231(%eax),%xmm1 + DB 15,88,128,225,148,0,0 ; addps 0x94e1(%eax),%xmm0 DB 15,40,241 ; movaps %xmm1,%xmm6 - DB 15,89,176,17,149,0,0 ; mulps 0x9511(%eax),%xmm6 + DB 15,89,176,241,148,0,0 ; mulps 0x94f1(%eax),%xmm6 DB 15,92,198 ; subps %xmm6,%xmm0 - DB 15,88,136,33,149,0,0 ; addps 0x9521(%eax),%xmm1 - DB 15,40,176,49,149,0,0 ; movaps 0x9531(%eax),%xmm6 + DB 15,88,136,1,149,0,0 ; addps 0x9501(%eax),%xmm1 + DB 15,40,176,17,149,0,0 ; movaps 0x9511(%eax),%xmm6 DB 15,94,241 ; divps %xmm1,%xmm6 DB 15,92,198 ; subps %xmm6,%xmm0 DB 15,89,199 ; mulps %xmm7,%xmm0 @@ -48264,12 +48264,12 @@ _sk_gamma_sse2 LABEL PROC DB 15,91,201 ; cvtdq2ps %xmm1,%xmm1 DB 15,40,240 ; movaps %xmm0,%xmm6 DB 15,194,241,1 ; cmpltps %xmm1,%xmm6 - DB 15,84,176,97,146,0,0 ; andps 0x9261(%eax),%xmm6 + DB 15,84,176,65,146,0,0 ; andps 0x9241(%eax),%xmm6 DB 15,92,206 ; subps %xmm6,%xmm1 DB 15,40,240 ; movaps %xmm0,%xmm6 DB 15,92,241 ; subps %xmm1,%xmm6 - DB 15,88,128,65,149,0,0 ; addps 0x9541(%eax),%xmm0 - DB 15,40,184,97,149,0,0 ; movaps 0x9561(%eax),%xmm7 + DB 15,88,128,33,149,0,0 ; addps 0x9521(%eax),%xmm0 + DB 15,40,184,65,149,0,0 ; movaps 0x9541(%eax),%xmm7 DB 15,92,254 ; subps %xmm6,%xmm7 DB 15,89,245 ; mulps %xmm5,%xmm6 DB 15,92,198 ; subps %xmm6,%xmm0 @@ -48277,15 +48277,15 @@ _sk_gamma_sse2 LABEL PROC DB 15,94,207 ; divps %xmm7,%xmm1 DB 15,88,200 ; addps %xmm0,%xmm1 DB 15,91,194 ; cvtdq2ps %xmm2,%xmm0 - DB 15,89,128,225,148,0,0 ; mulps 0x94e1(%eax),%xmm0 - DB 15,84,144,241,148,0,0 ; andps 0x94f1(%eax),%xmm2 - DB 15,86,144,81,146,0,0 ; orps 0x9251(%eax),%xmm2 - DB 15,88,128,1,149,0,0 ; addps 0x9501(%eax),%xmm0 - DB 15,40,176,17,149,0,0 ; movaps 0x9511(%eax),%xmm6 + DB 15,89,128,193,148,0,0 ; mulps 0x94c1(%eax),%xmm0 + DB 15,84,144,209,148,0,0 ; andps 0x94d1(%eax),%xmm2 + DB 15,86,144,49,146,0,0 ; orps 0x9231(%eax),%xmm2 + DB 15,88,128,225,148,0,0 ; addps 0x94e1(%eax),%xmm0 + DB 15,40,176,241,148,0,0 ; movaps 0x94f1(%eax),%xmm6 DB 15,89,242 ; mulps %xmm2,%xmm6 DB 15,92,198 ; subps %xmm6,%xmm0 - DB 15,88,144,33,149,0,0 ; addps 0x9521(%eax),%xmm2 - DB 15,40,176,49,149,0,0 ; movaps 0x9531(%eax),%xmm6 + DB 15,88,144,1,149,0,0 ; addps 0x9501(%eax),%xmm2 + DB 15,40,176,17,149,0,0 ; movaps 0x9511(%eax),%xmm6 DB 15,94,242 ; divps %xmm2,%xmm6 DB 15,92,198 ; subps %xmm6,%xmm0 DB 15,89,69,232 ; mulps -0x18(%ebp),%xmm0 @@ -48293,18 +48293,18 @@ _sk_gamma_sse2 LABEL PROC DB 15,91,210 ; cvtdq2ps %xmm2,%xmm2 DB 15,40,240 ; movaps %xmm0,%xmm6 DB 15,194,242,1 ; cmpltps %xmm2,%xmm6 - DB 15,84,176,97,146,0,0 ; andps 0x9261(%eax),%xmm6 + DB 15,84,176,65,146,0,0 ; andps 0x9241(%eax),%xmm6 DB 15,92,214 ; subps %xmm6,%xmm2 DB 15,40,240 ; movaps %xmm0,%xmm6 DB 15,92,242 ; subps %xmm2,%xmm6 - DB 15,88,128,65,149,0,0 ; addps 0x9541(%eax),%xmm0 + DB 15,88,128,33,149,0,0 ; addps 0x9521(%eax),%xmm0 DB 15,89,238 ; mulps %xmm6,%xmm5 DB 15,92,197 ; subps %xmm5,%xmm0 - DB 15,40,144,97,149,0,0 ; movaps 0x9561(%eax),%xmm2 + DB 15,40,144,65,149,0,0 ; movaps 0x9541(%eax),%xmm2 DB 15,92,214 ; subps %xmm6,%xmm2 DB 15,94,218 ; divps %xmm2,%xmm3 DB 15,88,216 ; addps %xmm0,%xmm3 - DB 15,40,128,129,149,0,0 ; movaps 0x9581(%eax),%xmm0 + DB 15,40,128,97,149,0,0 ; movaps 0x9561(%eax),%xmm0 DB 15,89,224 ; mulps %xmm0,%xmm4 DB 15,89,200 ; mulps %xmm0,%xmm1 DB 15,89,216 ; mulps %xmm0,%xmm3 @@ -48331,29 +48331,29 @@ _sk_lab_to_xyz_sse2 LABEL PROC DB 15,40,208 ; movaps %xmm0,%xmm2 DB 232,0,0,0,0 ; call 3c77 <_sk_lab_to_xyz_sse2+0x15> DB 88 ; pop %eax - DB 15,89,144,169,147,0,0 ; mulps 0x93a9(%eax),%xmm2 - DB 15,40,160,73,145,0,0 ; movaps 0x9149(%eax),%xmm4 + DB 15,89,144,137,147,0,0 ; mulps 0x9389(%eax),%xmm2 + DB 15,40,160,41,145,0,0 ; movaps 0x9129(%eax),%xmm4 DB 15,89,204 ; mulps %xmm4,%xmm1 - DB 15,40,168,185,147,0,0 ; movaps 0x93b9(%eax),%xmm5 + DB 15,40,168,153,147,0,0 ; movaps 0x9399(%eax),%xmm5 DB 15,88,205 ; addps %xmm5,%xmm1 DB 15,89,220 ; mulps %xmm4,%xmm3 DB 15,88,221 ; addps %xmm5,%xmm3 - DB 15,88,144,201,147,0,0 ; addps 0x93c9(%eax),%xmm2 - DB 15,89,144,217,147,0,0 ; mulps 0x93d9(%eax),%xmm2 - DB 15,89,136,233,147,0,0 ; mulps 0x93e9(%eax),%xmm1 + DB 15,88,144,169,147,0,0 ; addps 0x93a9(%eax),%xmm2 + DB 15,89,144,185,147,0,0 ; mulps 0x93b9(%eax),%xmm2 + DB 15,89,136,201,147,0,0 ; mulps 0x93c9(%eax),%xmm1 DB 15,88,202 ; addps %xmm2,%xmm1 - DB 15,89,152,249,147,0,0 ; mulps 0x93f9(%eax),%xmm3 + DB 15,89,152,217,147,0,0 ; mulps 0x93d9(%eax),%xmm3 DB 15,40,234 ; movaps %xmm2,%xmm5 DB 15,92,235 ; subps %xmm3,%xmm5 DB 15,40,193 ; movaps %xmm1,%xmm0 DB 15,89,192 ; mulps %xmm0,%xmm0 DB 15,89,193 ; mulps %xmm1,%xmm0 - DB 15,40,152,9,148,0,0 ; movaps 0x9409(%eax),%xmm3 + DB 15,40,152,233,147,0,0 ; movaps 0x93e9(%eax),%xmm3 DB 15,40,227 ; movaps %xmm3,%xmm4 DB 15,194,224,1 ; cmpltps %xmm0,%xmm4 - DB 15,40,176,25,148,0,0 ; movaps 0x9419(%eax),%xmm6 + DB 15,40,176,249,147,0,0 ; movaps 0x93f9(%eax),%xmm6 DB 15,88,206 ; addps %xmm6,%xmm1 - DB 15,40,184,41,148,0,0 ; movaps 0x9429(%eax),%xmm7 + DB 15,40,184,9,148,0,0 ; movaps 0x9409(%eax),%xmm7 DB 15,89,207 ; mulps %xmm7,%xmm1 DB 15,84,196 ; andps %xmm4,%xmm0 DB 15,85,225 ; andnps %xmm1,%xmm4 @@ -48378,8 +48378,8 @@ _sk_lab_to_xyz_sse2 LABEL PROC DB 15,85,221 ; andnps %xmm5,%xmm3 DB 15,86,216 ; orps %xmm0,%xmm3 DB 139,77,12 ; mov 0xc(%ebp),%ecx - DB 15,89,160,57,148,0,0 ; mulps 0x9439(%eax),%xmm4 - DB 15,89,152,73,148,0,0 ; mulps 0x9449(%eax),%xmm3 + DB 15,89,160,25,148,0,0 ; mulps 0x9419(%eax),%xmm4 + DB 15,89,152,41,148,0,0 ; mulps 0x9429(%eax),%xmm3 DB 141,65,4 ; lea 0x4(%ecx),%eax DB 131,236,8 ; sub $0x8,%esp DB 15,40,196 ; movaps %xmm4,%xmm0 @@ -48415,9 +48415,9 @@ _sk_load_a8_sse2 LABEL PROC DB 102,15,110,4,62 ; movd (%esi,%edi,1),%xmm0 DB 102,15,96,192 ; punpcklbw %xmm0,%xmm0 DB 102,15,97,192 ; punpcklwd %xmm0,%xmm0 - DB 102,15,219,130,73,144,0,0 ; pand 0x9049(%edx),%xmm0 + DB 102,15,219,130,41,144,0,0 ; pand 0x9029(%edx),%xmm0 DB 15,91,216 ; cvtdq2ps %xmm0,%xmm3 - DB 15,89,154,121,145,0,0 ; mulps 0x9179(%edx),%xmm3 + DB 15,89,154,89,145,0,0 ; mulps 0x9159(%edx),%xmm3 DB 141,80,8 ; lea 0x8(%eax),%edx DB 131,236,8 ; sub $0x8,%esp DB 15,87,192 ; xorps %xmm0,%xmm0 @@ -48463,8 +48463,8 @@ _sk_load_a8_dst_sse2 LABEL PROC DB 131,236,12 ; sub $0xc,%esp DB 139,69,12 ; mov 0xc(%ebp),%eax DB 139,77,8 ; mov 0x8(%ebp),%ecx - DB 139,49 ; mov (%ecx),%esi DB 139,16 ; mov (%eax),%edx + DB 139,49 ; mov (%ecx),%esi DB 139,122,4 ; mov 0x4(%edx),%edi DB 15,175,121,4 ; imul 0x4(%ecx),%edi DB 3,58 ; add (%edx),%edi @@ -48480,9 +48480,9 @@ _sk_load_a8_dst_sse2 LABEL PROC DB 102,15,110,36,55 ; movd (%edi,%esi,1),%xmm4 DB 102,15,96,224 ; punpcklbw %xmm0,%xmm4 DB 102,15,97,224 ; punpcklwd %xmm0,%xmm4 - DB 102,15,219,162,117,143,0,0 ; pand 0x8f75(%edx),%xmm4 + DB 102,15,219,162,85,143,0,0 ; pand 0x8f55(%edx),%xmm4 DB 15,91,228 ; cvtdq2ps %xmm4,%xmm4 - DB 15,89,162,165,144,0,0 ; mulps 0x90a5(%edx),%xmm4 + DB 15,89,162,133,144,0,0 ; mulps 0x9085(%edx),%xmm4 DB 15,41,97,64 ; movaps %xmm4,0x40(%ecx) DB 141,80,8 ; lea 0x8(%eax),%edx DB 131,236,8 ; sub $0x8,%esp @@ -48571,7 +48571,7 @@ _sk_gather_a8_sse2 LABEL PROC DB 102,15,96,193 ; punpcklbw %xmm1,%xmm0 DB 102,15,97,193 ; punpcklwd %xmm1,%xmm0 DB 15,91,216 ; cvtdq2ps %xmm0,%xmm3 - DB 15,89,153,120,143,0,0 ; mulps 0x8f78(%ecx),%xmm3 + DB 15,89,153,88,143,0,0 ; mulps 0x8f58(%ecx),%xmm3 DB 141,72,8 ; lea 0x8(%eax),%ecx DB 131,236,8 ; sub $0x8,%esp DB 15,87,192 ; xorps %xmm0,%xmm0 @@ -48603,7 +48603,7 @@ _sk_store_a8_sse2 LABEL PROC DB 15,175,81,4 ; imul 0x4(%ecx),%edx DB 3,23 ; add (%edi),%edx DB 139,89,8 ; mov 0x8(%ecx),%ebx - DB 15,40,166,20,142,0,0 ; movaps 0x8e14(%esi),%xmm4 + DB 15,40,166,244,141,0,0 ; movaps 0x8df4(%esi),%xmm4 DB 15,89,227 ; mulps %xmm3,%xmm4 DB 102,15,91,228 ; cvtps2dq %xmm4,%xmm4 DB 102,15,114,244,16 ; pslld $0x10,%xmm4 @@ -48638,7 +48638,7 @@ _sk_store_a8_sse2 LABEL PROC DB 102,15,197,220,4 ; pextrw $0x4,%xmm4,%ebx DB 136,92,58,2 ; mov %bl,0x2(%edx,%edi,1) DB 102,15,112,228,212 ; pshufd $0xd4,%xmm4,%xmm4 - DB 102,15,219,166,36,145,0,0 ; pand 0x9124(%esi),%xmm4 + DB 102,15,219,166,4,145,0,0 ; pand 0x9104(%esi),%xmm4 DB 102,15,103,228 ; packuswb %xmm4,%xmm4 DB 102,15,103,228 ; packuswb %xmm4,%xmm4 DB 102,15,103,228 ; packuswb %xmm4,%xmm4 @@ -48672,12 +48672,12 @@ _sk_load_g8_sse2 LABEL PROC DB 102,15,110,4,62 ; movd (%esi,%edi,1),%xmm0 DB 102,15,96,192 ; punpcklbw %xmm0,%xmm0 DB 102,15,97,192 ; punpcklwd %xmm0,%xmm0 - DB 102,15,219,130,82,141,0,0 ; pand 0x8d52(%edx),%xmm0 + DB 102,15,219,130,50,141,0,0 ; pand 0x8d32(%edx),%xmm0 DB 15,91,192 ; cvtdq2ps %xmm0,%xmm0 - DB 15,89,130,130,142,0,0 ; mulps 0x8e82(%edx),%xmm0 + DB 15,89,130,98,142,0,0 ; mulps 0x8e62(%edx),%xmm0 DB 141,112,8 ; lea 0x8(%eax),%esi DB 131,236,8 ; sub $0x8,%esp - DB 15,40,154,146,140,0,0 ; movaps 0x8c92(%edx),%xmm3 + DB 15,40,154,114,140,0,0 ; movaps 0x8c72(%edx),%xmm3 DB 15,40,200 ; movaps %xmm0,%xmm1 DB 15,40,208 ; movaps %xmm0,%xmm2 DB 86 ; push %esi @@ -48733,13 +48733,13 @@ _sk_load_g8_dst_sse2 LABEL PROC DB 102,15,110,36,62 ; movd (%esi,%edi,1),%xmm4 DB 102,15,96,224 ; punpcklbw %xmm0,%xmm4 DB 102,15,97,224 ; punpcklwd %xmm0,%xmm4 - DB 102,15,219,162,166,140,0,0 ; pand 0x8ca6(%edx),%xmm4 + DB 102,15,219,162,134,140,0,0 ; pand 0x8c86(%edx),%xmm4 DB 15,91,228 ; cvtdq2ps %xmm4,%xmm4 - DB 15,89,162,214,141,0,0 ; mulps 0x8dd6(%edx),%xmm4 + DB 15,89,162,182,141,0,0 ; mulps 0x8db6(%edx),%xmm4 DB 15,41,97,48 ; movaps %xmm4,0x30(%ecx) DB 15,41,97,32 ; movaps %xmm4,0x20(%ecx) DB 15,41,97,16 ; movaps %xmm4,0x10(%ecx) - DB 15,40,162,230,139,0,0 ; movaps 0x8be6(%edx),%xmm4 + DB 15,40,162,198,139,0,0 ; movaps 0x8bc6(%edx),%xmm4 DB 15,41,97,64 ; movaps %xmm4,0x40(%ecx) DB 141,80,8 ; lea 0x8(%eax),%edx DB 131,236,8 ; sub $0x8,%esp @@ -48829,10 +48829,10 @@ _sk_gather_g8_sse2 LABEL PROC DB 102,15,96,193 ; punpcklbw %xmm1,%xmm0 DB 102,15,97,193 ; punpcklwd %xmm1,%xmm0 DB 15,91,192 ; cvtdq2ps %xmm0,%xmm0 - DB 15,89,129,127,140,0,0 ; mulps 0x8c7f(%ecx),%xmm0 + DB 15,89,129,95,140,0,0 ; mulps 0x8c5f(%ecx),%xmm0 DB 141,80,8 ; lea 0x8(%eax),%edx DB 131,236,8 ; sub $0x8,%esp - DB 15,40,153,143,138,0,0 ; movaps 0x8a8f(%ecx),%xmm3 + DB 15,40,153,111,138,0,0 ; movaps 0x8a6f(%ecx),%xmm3 DB 15,40,200 ; movaps %xmm0,%xmm1 DB 15,40,208 ; movaps %xmm0,%xmm2 DB 82 ; push %edx @@ -48867,20 +48867,20 @@ _sk_load_565_sse2 LABEL PROC DB 117,97 ; jne 432a <_sk_load_565_sse2+0x8c> DB 243,15,126,20,126 ; movq (%esi,%edi,2),%xmm2 DB 102,15,97,208 ; punpcklwd %xmm0,%xmm2 - DB 102,15,111,130,68,140,0,0 ; movdqa 0x8c44(%edx),%xmm0 + DB 102,15,111,130,36,140,0,0 ; movdqa 0x8c24(%edx),%xmm0 DB 102,15,219,194 ; pand %xmm2,%xmm0 DB 15,91,192 ; cvtdq2ps %xmm0,%xmm0 - DB 15,89,130,84,140,0,0 ; mulps 0x8c54(%edx),%xmm0 - DB 102,15,111,138,100,140,0,0 ; movdqa 0x8c64(%edx),%xmm1 + DB 15,89,130,52,140,0,0 ; mulps 0x8c34(%edx),%xmm0 + DB 102,15,111,138,68,140,0,0 ; movdqa 0x8c44(%edx),%xmm1 DB 102,15,219,202 ; pand %xmm2,%xmm1 DB 15,91,201 ; cvtdq2ps %xmm1,%xmm1 - DB 15,89,138,116,140,0,0 ; mulps 0x8c74(%edx),%xmm1 - DB 102,15,219,146,132,140,0,0 ; pand 0x8c84(%edx),%xmm2 + DB 15,89,138,84,140,0,0 ; mulps 0x8c54(%edx),%xmm1 + DB 102,15,219,146,100,140,0,0 ; pand 0x8c64(%edx),%xmm2 DB 15,91,210 ; cvtdq2ps %xmm2,%xmm2 - DB 15,89,146,148,140,0,0 ; mulps 0x8c94(%edx),%xmm2 + DB 15,89,146,116,140,0,0 ; mulps 0x8c74(%edx),%xmm2 DB 141,112,8 ; lea 0x8(%eax),%esi DB 131,236,8 ; sub $0x8,%esp - DB 15,40,154,68,138,0,0 ; movaps 0x8a44(%edx),%xmm3 + DB 15,40,154,36,138,0,0 ; movaps 0x8a24(%edx),%xmm3 DB 86 ; push %esi DB 81 ; push %ecx DB 255,80,4 ; call *0x4(%eax) @@ -48932,21 +48932,21 @@ _sk_load_565_dst_sse2 LABEL PROC DB 117,113 ; jne 440a <_sk_load_565_dst_sse2+0x9c> DB 243,15,126,36,126 ; movq (%esi,%edi,2),%xmm4 DB 102,15,97,224 ; punpcklwd %xmm0,%xmm4 - DB 102,15,111,170,116,139,0,0 ; movdqa 0x8b74(%edx),%xmm5 + DB 102,15,111,170,84,139,0,0 ; movdqa 0x8b54(%edx),%xmm5 DB 102,15,219,236 ; pand %xmm4,%xmm5 DB 15,91,237 ; cvtdq2ps %xmm5,%xmm5 - DB 15,89,170,132,139,0,0 ; mulps 0x8b84(%edx),%xmm5 + DB 15,89,170,100,139,0,0 ; mulps 0x8b64(%edx),%xmm5 DB 15,41,105,16 ; movaps %xmm5,0x10(%ecx) - DB 102,15,111,170,148,139,0,0 ; movdqa 0x8b94(%edx),%xmm5 + DB 102,15,111,170,116,139,0,0 ; movdqa 0x8b74(%edx),%xmm5 DB 102,15,219,236 ; pand %xmm4,%xmm5 DB 15,91,237 ; cvtdq2ps %xmm5,%xmm5 - DB 15,89,170,164,139,0,0 ; mulps 0x8ba4(%edx),%xmm5 + DB 15,89,170,132,139,0,0 ; mulps 0x8b84(%edx),%xmm5 DB 15,41,105,32 ; movaps %xmm5,0x20(%ecx) - DB 102,15,219,162,180,139,0,0 ; pand 0x8bb4(%edx),%xmm4 + DB 102,15,219,162,148,139,0,0 ; pand 0x8b94(%edx),%xmm4 DB 15,91,228 ; cvtdq2ps %xmm4,%xmm4 - DB 15,89,162,196,139,0,0 ; mulps 0x8bc4(%edx),%xmm4 + DB 15,89,162,164,139,0,0 ; mulps 0x8ba4(%edx),%xmm4 DB 15,41,97,48 ; movaps %xmm4,0x30(%ecx) - DB 15,40,162,116,137,0,0 ; movaps 0x8974(%edx),%xmm4 + DB 15,40,162,84,137,0,0 ; movaps 0x8954(%edx),%xmm4 DB 15,41,97,64 ; movaps %xmm4,0x40(%ecx) DB 141,80,8 ; lea 0x8(%eax),%edx DB 131,236,8 ; sub $0x8,%esp @@ -49029,20 +49029,20 @@ _sk_gather_565_sse2 LABEL PROC DB 102,15,239,192 ; pxor %xmm0,%xmm0 DB 102,15,196,209,3 ; pinsrw $0x3,%ecx,%xmm2 DB 102,15,97,208 ; punpcklwd %xmm0,%xmm2 - DB 102,15,111,130,242,137,0,0 ; movdqa 0x89f2(%edx),%xmm0 + DB 102,15,111,130,210,137,0,0 ; movdqa 0x89d2(%edx),%xmm0 DB 102,15,219,194 ; pand %xmm2,%xmm0 DB 15,91,192 ; cvtdq2ps %xmm0,%xmm0 - DB 15,89,130,2,138,0,0 ; mulps 0x8a02(%edx),%xmm0 - DB 102,15,111,138,18,138,0,0 ; movdqa 0x8a12(%edx),%xmm1 + DB 15,89,130,226,137,0,0 ; mulps 0x89e2(%edx),%xmm0 + DB 102,15,111,138,242,137,0,0 ; movdqa 0x89f2(%edx),%xmm1 DB 102,15,219,202 ; pand %xmm2,%xmm1 DB 15,91,201 ; cvtdq2ps %xmm1,%xmm1 - DB 15,89,138,34,138,0,0 ; mulps 0x8a22(%edx),%xmm1 - DB 102,15,219,146,50,138,0,0 ; pand 0x8a32(%edx),%xmm2 + DB 15,89,138,2,138,0,0 ; mulps 0x8a02(%edx),%xmm1 + DB 102,15,219,146,18,138,0,0 ; pand 0x8a12(%edx),%xmm2 DB 15,91,210 ; cvtdq2ps %xmm2,%xmm2 - DB 15,89,146,66,138,0,0 ; mulps 0x8a42(%edx),%xmm2 + DB 15,89,146,34,138,0,0 ; mulps 0x8a22(%edx),%xmm2 DB 141,72,8 ; lea 0x8(%eax),%ecx DB 131,236,8 ; sub $0x8,%esp - DB 15,40,154,242,135,0,0 ; movaps 0x87f2(%edx),%xmm3 + DB 15,40,154,210,135,0,0 ; movaps 0x87d2(%edx),%xmm3 DB 81 ; push %ecx DB 255,117,8 ; pushl 0x8(%ebp) DB 255,80,4 ; call *0x4(%eax) @@ -49068,8 +49068,8 @@ _sk_store_565_sse2 LABEL PROC DB 1,210 ; add %edx,%edx DB 3,22 ; add (%esi),%edx DB 139,49 ; mov (%ecx),%esi - DB 15,40,167,111,139,0,0 ; movaps 0x8b6f(%edi),%xmm4 - DB 15,40,175,127,139,0,0 ; movaps 0x8b7f(%edi),%xmm5 + DB 15,40,167,79,139,0,0 ; movaps 0x8b4f(%edi),%xmm4 + DB 15,40,175,95,139,0,0 ; movaps 0x8b5f(%edi),%xmm5 DB 139,89,8 ; mov 0x8(%ecx),%ebx DB 15,40,240 ; movaps %xmm0,%xmm6 DB 15,89,244 ; mulps %xmm4,%xmm6 @@ -49147,21 +49147,21 @@ _sk_load_4444_sse2 LABEL PROC DB 117,112 ; jne 46e0 <_sk_load_4444_sse2+0x9b> DB 243,15,126,28,126 ; movq (%esi,%edi,2),%xmm3 DB 102,15,97,216 ; punpcklwd %xmm0,%xmm3 - DB 102,15,111,130,173,138,0,0 ; movdqa 0x8aad(%edx),%xmm0 + DB 102,15,111,130,141,138,0,0 ; movdqa 0x8a8d(%edx),%xmm0 DB 102,15,219,195 ; pand %xmm3,%xmm0 DB 15,91,192 ; cvtdq2ps %xmm0,%xmm0 - DB 15,89,130,189,138,0,0 ; mulps 0x8abd(%edx),%xmm0 - DB 102,15,111,138,205,138,0,0 ; movdqa 0x8acd(%edx),%xmm1 + DB 15,89,130,157,138,0,0 ; mulps 0x8a9d(%edx),%xmm0 + DB 102,15,111,138,173,138,0,0 ; movdqa 0x8aad(%edx),%xmm1 DB 102,15,219,203 ; pand %xmm3,%xmm1 DB 15,91,201 ; cvtdq2ps %xmm1,%xmm1 - DB 15,89,138,221,138,0,0 ; mulps 0x8add(%edx),%xmm1 - DB 102,15,111,146,237,138,0,0 ; movdqa 0x8aed(%edx),%xmm2 + DB 15,89,138,189,138,0,0 ; mulps 0x8abd(%edx),%xmm1 + DB 102,15,111,146,205,138,0,0 ; movdqa 0x8acd(%edx),%xmm2 DB 102,15,219,211 ; pand %xmm3,%xmm2 DB 15,91,210 ; cvtdq2ps %xmm2,%xmm2 - DB 15,89,146,253,138,0,0 ; mulps 0x8afd(%edx),%xmm2 - DB 102,15,219,154,13,139,0,0 ; pand 0x8b0d(%edx),%xmm3 + DB 15,89,146,221,138,0,0 ; mulps 0x8add(%edx),%xmm2 + DB 102,15,219,154,237,138,0,0 ; pand 0x8aed(%edx),%xmm3 DB 15,91,219 ; cvtdq2ps %xmm3,%xmm3 - DB 15,89,154,29,139,0,0 ; mulps 0x8b1d(%edx),%xmm3 + DB 15,89,154,253,138,0,0 ; mulps 0x8afd(%edx),%xmm3 DB 141,80,8 ; lea 0x8(%eax),%edx DB 131,236,8 ; sub $0x8,%esp DB 82 ; push %edx @@ -49215,24 +49215,24 @@ _sk_load_4444_dst_sse2 LABEL PROC DB 15,133,128,0,0,0 ; jne 47d3 <_sk_load_4444_dst_sse2+0xaf> DB 243,15,126,36,126 ; movq (%esi,%edi,2),%xmm4 DB 102,15,97,224 ; punpcklwd %xmm0,%xmm4 - DB 102,15,111,170,206,137,0,0 ; movdqa 0x89ce(%edx),%xmm5 + DB 102,15,111,170,174,137,0,0 ; movdqa 0x89ae(%edx),%xmm5 DB 102,15,219,236 ; pand %xmm4,%xmm5 DB 15,91,237 ; cvtdq2ps %xmm5,%xmm5 - DB 15,89,170,222,137,0,0 ; mulps 0x89de(%edx),%xmm5 + DB 15,89,170,190,137,0,0 ; mulps 0x89be(%edx),%xmm5 DB 15,41,105,16 ; movaps %xmm5,0x10(%ecx) - DB 102,15,111,170,238,137,0,0 ; movdqa 0x89ee(%edx),%xmm5 + DB 102,15,111,170,206,137,0,0 ; movdqa 0x89ce(%edx),%xmm5 DB 102,15,219,236 ; pand %xmm4,%xmm5 DB 15,91,237 ; cvtdq2ps %xmm5,%xmm5 - DB 15,89,170,254,137,0,0 ; mulps 0x89fe(%edx),%xmm5 + DB 15,89,170,222,137,0,0 ; mulps 0x89de(%edx),%xmm5 DB 15,41,105,32 ; movaps %xmm5,0x20(%ecx) - DB 102,15,111,170,14,138,0,0 ; movdqa 0x8a0e(%edx),%xmm5 + DB 102,15,111,170,238,137,0,0 ; movdqa 0x89ee(%edx),%xmm5 DB 102,15,219,236 ; pand %xmm4,%xmm5 DB 15,91,237 ; cvtdq2ps %xmm5,%xmm5 - DB 15,89,170,30,138,0,0 ; mulps 0x8a1e(%edx),%xmm5 + DB 15,89,170,254,137,0,0 ; mulps 0x89fe(%edx),%xmm5 DB 15,41,105,48 ; movaps %xmm5,0x30(%ecx) - DB 102,15,219,162,46,138,0,0 ; pand 0x8a2e(%edx),%xmm4 + DB 102,15,219,162,14,138,0,0 ; pand 0x8a0e(%edx),%xmm4 DB 15,91,228 ; cvtdq2ps %xmm4,%xmm4 - DB 15,89,162,62,138,0,0 ; mulps 0x8a3e(%edx),%xmm4 + DB 15,89,162,30,138,0,0 ; mulps 0x8a1e(%edx),%xmm4 DB 15,41,97,64 ; movaps %xmm4,0x40(%ecx) DB 141,80,8 ; lea 0x8(%eax),%edx DB 131,236,8 ; sub $0x8,%esp @@ -49315,21 +49315,21 @@ _sk_gather_4444_sse2 LABEL PROC DB 89 ; pop %ecx DB 102,15,239,192 ; pxor %xmm0,%xmm0 DB 102,15,97,216 ; punpcklwd %xmm0,%xmm3 - DB 102,15,111,129,48,136,0,0 ; movdqa 0x8830(%ecx),%xmm0 + DB 102,15,111,129,16,136,0,0 ; movdqa 0x8810(%ecx),%xmm0 DB 102,15,219,195 ; pand %xmm3,%xmm0 DB 15,91,192 ; cvtdq2ps %xmm0,%xmm0 - DB 15,89,129,64,136,0,0 ; mulps 0x8840(%ecx),%xmm0 - DB 102,15,111,137,80,136,0,0 ; movdqa 0x8850(%ecx),%xmm1 + DB 15,89,129,32,136,0,0 ; mulps 0x8820(%ecx),%xmm0 + DB 102,15,111,137,48,136,0,0 ; movdqa 0x8830(%ecx),%xmm1 DB 102,15,219,203 ; pand %xmm3,%xmm1 DB 15,91,201 ; cvtdq2ps %xmm1,%xmm1 - DB 15,89,137,96,136,0,0 ; mulps 0x8860(%ecx),%xmm1 - DB 102,15,111,145,112,136,0,0 ; movdqa 0x8870(%ecx),%xmm2 + DB 15,89,137,64,136,0,0 ; mulps 0x8840(%ecx),%xmm1 + DB 102,15,111,145,80,136,0,0 ; movdqa 0x8850(%ecx),%xmm2 DB 102,15,219,211 ; pand %xmm3,%xmm2 DB 15,91,210 ; cvtdq2ps %xmm2,%xmm2 - DB 15,89,145,128,136,0,0 ; mulps 0x8880(%ecx),%xmm2 - DB 102,15,219,153,144,136,0,0 ; pand 0x8890(%ecx),%xmm3 + DB 15,89,145,96,136,0,0 ; mulps 0x8860(%ecx),%xmm2 + DB 102,15,219,153,112,136,0,0 ; pand 0x8870(%ecx),%xmm3 DB 15,91,219 ; cvtdq2ps %xmm3,%xmm3 - DB 15,89,153,160,136,0,0 ; mulps 0x88a0(%ecx),%xmm3 + DB 15,89,153,128,136,0,0 ; mulps 0x8880(%ecx),%xmm3 DB 141,72,8 ; lea 0x8(%eax),%ecx DB 131,236,8 ; sub $0x8,%esp DB 81 ; push %ecx @@ -49357,7 +49357,7 @@ _sk_store_4444_sse2 LABEL PROC DB 1,210 ; add %edx,%edx DB 3,22 ; add (%esi),%edx DB 139,49 ; mov (%ecx),%esi - DB 15,40,167,51,136,0,0 ; movaps 0x8833(%edi),%xmm4 + DB 15,40,167,19,136,0,0 ; movaps 0x8813(%edi),%xmm4 DB 139,89,8 ; mov 0x8(%ecx),%ebx DB 15,40,232 ; movaps %xmm0,%xmm5 DB 15,89,236 ; mulps %xmm4,%xmm5 @@ -49440,11 +49440,11 @@ _sk_load_8888_sse2 LABEL PROC DB 139,57 ; mov (%ecx),%edi DB 117,102 ; jne 4ac2 <_sk_load_8888_sse2+0x92> DB 243,15,111,28,190 ; movdqu (%esi,%edi,4),%xmm3 - DB 102,15,111,146,114,131,0,0 ; movdqa 0x8372(%edx),%xmm2 + DB 102,15,111,146,82,131,0,0 ; movdqa 0x8352(%edx),%xmm2 DB 102,15,111,195 ; movdqa %xmm3,%xmm0 DB 102,15,219,194 ; pand %xmm2,%xmm0 DB 15,91,192 ; cvtdq2ps %xmm0,%xmm0 - DB 15,40,162,162,132,0,0 ; movaps 0x84a2(%edx),%xmm4 + DB 15,40,162,130,132,0,0 ; movaps 0x8482(%edx),%xmm4 DB 15,89,196 ; mulps %xmm4,%xmm0 DB 102,15,111,203 ; movdqa %xmm3,%xmm1 DB 102,15,114,209,8 ; psrld $0x8,%xmm1 @@ -49507,11 +49507,11 @@ _sk_load_8888_dst_sse2 LABEL PROC DB 139,57 ; mov (%ecx),%edi DB 117,118 ; jne 4b99 <_sk_load_8888_dst_sse2+0xa2> DB 243,15,111,36,190 ; movdqu (%esi,%edi,4),%xmm4 - DB 102,15,111,170,171,130,0,0 ; movdqa 0x82ab(%edx),%xmm5 + DB 102,15,111,170,139,130,0,0 ; movdqa 0x828b(%edx),%xmm5 DB 102,15,111,244 ; movdqa %xmm4,%xmm6 DB 102,15,219,245 ; pand %xmm5,%xmm6 DB 15,91,246 ; cvtdq2ps %xmm6,%xmm6 - DB 15,40,186,219,131,0,0 ; movaps 0x83db(%edx),%xmm7 + DB 15,40,186,187,131,0,0 ; movaps 0x83bb(%edx),%xmm7 DB 15,89,247 ; mulps %xmm7,%xmm6 DB 15,41,113,16 ; movaps %xmm6,0x10(%ecx) DB 102,15,111,244 ; movdqa %xmm4,%xmm6 @@ -49604,11 +49604,11 @@ _sk_gather_8888_sse2 LABEL PROC DB 102,15,98,194 ; punpckldq %xmm2,%xmm0 DB 102,15,98,217 ; punpckldq %xmm1,%xmm3 DB 102,15,108,216 ; punpcklqdq %xmm0,%xmm3 - DB 102,15,111,145,56,129,0,0 ; movdqa 0x8138(%ecx),%xmm2 + DB 102,15,111,145,24,129,0,0 ; movdqa 0x8118(%ecx),%xmm2 DB 102,15,111,195 ; movdqa %xmm3,%xmm0 DB 102,15,219,194 ; pand %xmm2,%xmm0 DB 15,91,192 ; cvtdq2ps %xmm0,%xmm0 - DB 15,40,161,104,130,0,0 ; movaps 0x8268(%ecx),%xmm4 + DB 15,40,161,72,130,0,0 ; movaps 0x8248(%ecx),%xmm4 DB 15,89,196 ; mulps %xmm4,%xmm0 DB 102,15,111,203 ; movdqa %xmm3,%xmm1 DB 102,15,114,209,8 ; psrld $0x8,%xmm1 @@ -49650,7 +49650,7 @@ _sk_store_8888_sse2 LABEL PROC DB 193,226,2 ; shl $0x2,%edx DB 3,22 ; add (%esi),%edx DB 139,49 ; mov (%ecx),%esi - DB 15,40,167,205,128,0,0 ; movaps 0x80cd(%edi),%xmm4 + DB 15,40,167,173,128,0,0 ; movaps 0x80ad(%edi),%xmm4 DB 139,89,8 ; mov 0x8(%ecx),%ebx DB 15,40,232 ; movaps %xmm0,%xmm5 DB 15,89,236 ; mulps %xmm4,%xmm5 @@ -49719,11 +49719,11 @@ _sk_load_bgra_sse2 LABEL PROC DB 139,57 ; mov (%ecx),%edi DB 117,102 ; jne 4e2d <_sk_load_bgra_sse2+0x92> DB 243,15,111,28,190 ; movdqu (%esi,%edi,4),%xmm3 - DB 102,15,111,130,7,128,0,0 ; movdqa 0x8007(%edx),%xmm0 + DB 102,15,111,130,231,127,0,0 ; movdqa 0x7fe7(%edx),%xmm0 DB 102,15,111,203 ; movdqa %xmm3,%xmm1 DB 102,15,219,200 ; pand %xmm0,%xmm1 DB 15,91,209 ; cvtdq2ps %xmm1,%xmm2 - DB 15,40,162,55,129,0,0 ; movaps 0x8137(%edx),%xmm4 + DB 15,40,162,23,129,0,0 ; movaps 0x8117(%edx),%xmm4 DB 15,89,212 ; mulps %xmm4,%xmm2 DB 102,15,111,203 ; movdqa %xmm3,%xmm1 DB 102,15,114,209,8 ; psrld $0x8,%xmm1 @@ -49786,11 +49786,11 @@ _sk_load_bgra_dst_sse2 LABEL PROC DB 139,57 ; mov (%ecx),%edi DB 117,118 ; jne 4f04 <_sk_load_bgra_dst_sse2+0xa2> DB 243,15,111,36,190 ; movdqu (%esi,%edi,4),%xmm4 - DB 102,15,111,170,64,127,0,0 ; movdqa 0x7f40(%edx),%xmm5 + DB 102,15,111,170,32,127,0,0 ; movdqa 0x7f20(%edx),%xmm5 DB 102,15,111,244 ; movdqa %xmm4,%xmm6 DB 102,15,219,245 ; pand %xmm5,%xmm6 DB 15,91,246 ; cvtdq2ps %xmm6,%xmm6 - DB 15,40,186,112,128,0,0 ; movaps 0x8070(%edx),%xmm7 + DB 15,40,186,80,128,0,0 ; movaps 0x8050(%edx),%xmm7 DB 15,89,247 ; mulps %xmm7,%xmm6 DB 15,41,113,48 ; movaps %xmm6,0x30(%ecx) DB 102,15,111,244 ; movdqa %xmm4,%xmm6 @@ -49883,11 +49883,11 @@ _sk_gather_bgra_sse2 LABEL PROC DB 102,15,98,194 ; punpckldq %xmm2,%xmm0 DB 102,15,98,217 ; punpckldq %xmm1,%xmm3 DB 102,15,108,216 ; punpcklqdq %xmm0,%xmm3 - DB 102,15,111,129,205,125,0,0 ; movdqa 0x7dcd(%ecx),%xmm0 + DB 102,15,111,129,173,125,0,0 ; movdqa 0x7dad(%ecx),%xmm0 DB 102,15,111,203 ; movdqa %xmm3,%xmm1 DB 102,15,219,200 ; pand %xmm0,%xmm1 DB 15,91,209 ; cvtdq2ps %xmm1,%xmm2 - DB 15,40,161,253,126,0,0 ; movaps 0x7efd(%ecx),%xmm4 + DB 15,40,161,221,126,0,0 ; movaps 0x7edd(%ecx),%xmm4 DB 15,89,212 ; mulps %xmm4,%xmm2 DB 102,15,111,203 ; movdqa %xmm3,%xmm1 DB 102,15,114,209,8 ; psrld $0x8,%xmm1 @@ -49929,7 +49929,7 @@ _sk_store_bgra_sse2 LABEL PROC DB 193,226,2 ; shl $0x2,%edx DB 3,22 ; add (%esi),%edx DB 139,49 ; mov (%ecx),%esi - DB 15,40,167,98,125,0,0 ; movaps 0x7d62(%edi),%xmm4 + DB 15,40,167,66,125,0,0 ; movaps 0x7d42(%edi),%xmm4 DB 139,89,8 ; mov 0x8(%ecx),%ebx DB 15,40,234 ; movaps %xmm2,%xmm5 DB 15,89,236 ; mulps %xmm4,%xmm5 @@ -50026,11 +50026,11 @@ _sk_load_f16_sse2 LABEL PROC DB 102,15,239,192 ; pxor %xmm0,%xmm0 DB 102,15,97,200 ; punpcklwd %xmm0,%xmm1 DB 102,15,239,210 ; pxor %xmm2,%xmm2 - DB 102,15,111,170,124,128,0,0 ; movdqa 0x807c(%edx),%xmm5 + DB 102,15,111,170,92,128,0,0 ; movdqa 0x805c(%edx),%xmm5 DB 102,15,111,241 ; movdqa %xmm1,%xmm6 DB 102,15,219,245 ; pand %xmm5,%xmm6 - DB 102,15,219,138,140,128,0,0 ; pand 0x808c(%edx),%xmm1 - DB 102,15,111,130,156,128,0,0 ; movdqa 0x809c(%edx),%xmm0 + DB 102,15,219,138,108,128,0,0 ; pand 0x806c(%edx),%xmm1 + DB 102,15,111,130,124,128,0,0 ; movdqa 0x807c(%edx),%xmm0 DB 102,15,127,69,184 ; movdqa %xmm0,-0x48(%ebp) DB 102,15,114,246,16 ; pslld $0x10,%xmm6 DB 102,15,111,216 ; movdqa %xmm0,%xmm3 @@ -50042,7 +50042,7 @@ _sk_load_f16_sse2 LABEL PROC DB 102,15,239,255 ; pxor %xmm7,%xmm7 DB 102,15,111,212 ; movdqa %xmm4,%xmm2 DB 102,15,219,213 ; pand %xmm5,%xmm2 - DB 102,15,111,154,140,128,0,0 ; movdqa 0x808c(%edx),%xmm3 + DB 102,15,111,154,108,128,0,0 ; movdqa 0x806c(%edx),%xmm3 DB 102,15,219,227 ; pand %xmm3,%xmm4 DB 102,15,114,242,16 ; pslld $0x10,%xmm2 DB 102,15,102,196 ; pcmpgtd %xmm4,%xmm0 @@ -50055,7 +50055,7 @@ _sk_load_f16_sse2 LABEL PROC DB 102,15,219,253 ; pand %xmm5,%xmm7 DB 102,15,219,195 ; pand %xmm3,%xmm0 DB 102,15,114,247,16 ; pslld $0x10,%xmm7 - DB 102,15,111,146,156,128,0,0 ; movdqa 0x809c(%edx),%xmm2 + DB 102,15,111,146,124,128,0,0 ; movdqa 0x807c(%edx),%xmm2 DB 102,15,102,208 ; pcmpgtd %xmm0,%xmm2 DB 102,15,114,240,13 ; pslld $0xd,%xmm0 DB 102,15,235,199 ; por %xmm7,%xmm0 @@ -50070,7 +50070,7 @@ _sk_load_f16_sse2 LABEL PROC DB 102,15,127,93,184 ; movdqa %xmm3,-0x48(%ebp) DB 102,15,114,247,13 ; pslld $0xd,%xmm7 DB 102,15,235,253 ; por %xmm5,%xmm7 - DB 102,15,111,154,172,128,0,0 ; movdqa 0x80ac(%edx),%xmm3 + DB 102,15,111,154,140,128,0,0 ; movdqa 0x808c(%edx),%xmm3 DB 102,15,254,203 ; paddd %xmm3,%xmm1 DB 102,15,254,227 ; paddd %xmm3,%xmm4 DB 102,15,254,195 ; paddd %xmm3,%xmm0 @@ -50157,18 +50157,18 @@ _sk_load_f16_dst_sse2 LABEL PROC DB 102,15,126,85,232 ; movd %xmm2,-0x18(%ebp) DB 102,15,239,210 ; pxor %xmm2,%xmm2 DB 102,15,97,202 ; punpcklwd %xmm2,%xmm1 - DB 102,15,111,186,95,126,0,0 ; movdqa 0x7e5f(%edx),%xmm7 + DB 102,15,111,186,63,126,0,0 ; movdqa 0x7e3f(%edx),%xmm7 DB 102,15,111,209 ; movdqa %xmm1,%xmm2 DB 102,15,219,215 ; pand %xmm7,%xmm2 - DB 102,15,111,154,111,126,0,0 ; movdqa 0x7e6f(%edx),%xmm3 + DB 102,15,111,154,79,126,0,0 ; movdqa 0x7e4f(%edx),%xmm3 DB 102,15,219,203 ; pand %xmm3,%xmm1 - DB 102,15,111,162,127,126,0,0 ; movdqa 0x7e7f(%edx),%xmm4 + DB 102,15,111,162,95,126,0,0 ; movdqa 0x7e5f(%edx),%xmm4 DB 102,15,114,242,16 ; pslld $0x10,%xmm2 DB 102,15,111,236 ; movdqa %xmm4,%xmm5 DB 102,15,102,233 ; pcmpgtd %xmm1,%xmm5 DB 102,15,114,241,13 ; pslld $0xd,%xmm1 DB 102,15,235,202 ; por %xmm2,%xmm1 - DB 102,15,111,146,143,126,0,0 ; movdqa 0x7e8f(%edx),%xmm2 + DB 102,15,111,146,111,126,0,0 ; movdqa 0x7e6f(%edx),%xmm2 DB 102,15,127,85,184 ; movdqa %xmm2,-0x48(%ebp) DB 102,15,254,202 ; paddd %xmm2,%xmm1 DB 102,15,223,233 ; pandn %xmm1,%xmm5 @@ -50312,11 +50312,11 @@ _sk_gather_f16_sse2 LABEL PROC DB 102,15,126,69,248 ; movd %xmm0,-0x8(%ebp) DB 102,15,97,206 ; punpcklwd %xmm6,%xmm1 DB 102,15,239,210 ; pxor %xmm2,%xmm2 - DB 102,15,111,177,195,123,0,0 ; movdqa 0x7bc3(%ecx),%xmm6 + DB 102,15,111,177,163,123,0,0 ; movdqa 0x7ba3(%ecx),%xmm6 DB 102,15,111,225 ; movdqa %xmm1,%xmm4 DB 102,15,219,230 ; pand %xmm6,%xmm4 - DB 102,15,219,137,211,123,0,0 ; pand 0x7bd3(%ecx),%xmm1 - DB 102,15,111,129,227,123,0,0 ; movdqa 0x7be3(%ecx),%xmm0 + DB 102,15,219,137,179,123,0,0 ; pand 0x7bb3(%ecx),%xmm1 + DB 102,15,111,129,195,123,0,0 ; movdqa 0x7bc3(%ecx),%xmm0 DB 102,15,114,244,16 ; pslld $0x10,%xmm4 DB 102,15,111,216 ; movdqa %xmm0,%xmm3 DB 102,15,102,217 ; pcmpgtd %xmm1,%xmm3 @@ -50327,7 +50327,7 @@ _sk_gather_f16_sse2 LABEL PROC DB 102,15,239,255 ; pxor %xmm7,%xmm7 DB 102,15,111,213 ; movdqa %xmm5,%xmm2 DB 102,15,219,214 ; pand %xmm6,%xmm2 - DB 102,15,111,153,211,123,0,0 ; movdqa 0x7bd3(%ecx),%xmm3 + DB 102,15,111,153,179,123,0,0 ; movdqa 0x7bb3(%ecx),%xmm3 DB 102,15,219,235 ; pand %xmm3,%xmm5 DB 102,15,114,242,16 ; pslld $0x10,%xmm2 DB 102,15,111,224 ; movdqa %xmm0,%xmm4 @@ -50341,7 +50341,7 @@ _sk_gather_f16_sse2 LABEL PROC DB 102,15,219,254 ; pand %xmm6,%xmm7 DB 102,15,219,195 ; pand %xmm3,%xmm0 DB 102,15,114,247,16 ; pslld $0x10,%xmm7 - DB 102,15,111,145,227,123,0,0 ; movdqa 0x7be3(%ecx),%xmm2 + DB 102,15,111,145,195,123,0,0 ; movdqa 0x7bc3(%ecx),%xmm2 DB 102,15,111,218 ; movdqa %xmm2,%xmm3 DB 102,15,102,216 ; pcmpgtd %xmm0,%xmm3 DB 102,15,114,240,13 ; pslld $0xd,%xmm0 @@ -50350,12 +50350,12 @@ _sk_gather_f16_sse2 LABEL PROC DB 102,15,239,228 ; pxor %xmm4,%xmm4 DB 102,15,97,252 ; punpcklwd %xmm4,%xmm7 DB 102,15,219,247 ; pand %xmm7,%xmm6 - DB 102,15,219,185,211,123,0,0 ; pand 0x7bd3(%ecx),%xmm7 + DB 102,15,219,185,179,123,0,0 ; pand 0x7bb3(%ecx),%xmm7 DB 102,15,114,246,16 ; pslld $0x10,%xmm6 DB 102,15,102,215 ; pcmpgtd %xmm7,%xmm2 DB 102,15,114,247,13 ; pslld $0xd,%xmm7 DB 102,15,235,254 ; por %xmm6,%xmm7 - DB 102,15,111,161,243,123,0,0 ; movdqa 0x7bf3(%ecx),%xmm4 + DB 102,15,111,161,211,123,0,0 ; movdqa 0x7bd3(%ecx),%xmm4 DB 102,15,254,204 ; paddd %xmm4,%xmm1 DB 102,15,254,236 ; paddd %xmm4,%xmm5 DB 102,15,254,196 ; paddd %xmm4,%xmm0 @@ -50392,22 +50392,22 @@ _sk_store_f16_sse2 LABEL PROC DB 102,15,111,209 ; movdqa %xmm1,%xmm2 DB 232,0,0,0,0 ; call 5791 <_sk_store_f16_sse2+0x19> DB 88 ; pop %eax - DB 102,15,111,152,63,122,0,0 ; movdqa 0x7a3f(%eax),%xmm3 + DB 102,15,111,152,31,122,0,0 ; movdqa 0x7a1f(%eax),%xmm3 DB 102,15,111,224 ; movdqa %xmm0,%xmm4 DB 102,15,219,227 ; pand %xmm3,%xmm4 - DB 102,15,111,136,111,122,0,0 ; movdqa 0x7a6f(%eax),%xmm1 + DB 102,15,111,136,79,122,0,0 ; movdqa 0x7a4f(%eax),%xmm1 DB 102,15,127,77,232 ; movdqa %xmm1,-0x18(%ebp) DB 102,15,111,240 ; movdqa %xmm0,%xmm6 DB 102,15,114,246,3 ; pslld $0x3,%xmm6 DB 102,15,219,241 ; pand %xmm1,%xmm6 DB 102,15,254,244 ; paddd %xmm4,%xmm6 - DB 102,15,111,184,79,122,0,0 ; movdqa 0x7a4f(%eax),%xmm7 + DB 102,15,111,184,47,122,0,0 ; movdqa 0x7a2f(%eax),%xmm7 DB 102,15,127,69,168 ; movdqa %xmm0,-0x58(%ebp) DB 102,15,219,199 ; pand %xmm7,%xmm0 - DB 102,15,111,168,95,122,0,0 ; movdqa 0x7a5f(%eax),%xmm5 + DB 102,15,111,168,63,122,0,0 ; movdqa 0x7a3f(%eax),%xmm5 DB 102,15,111,205 ; movdqa %xmm5,%xmm1 DB 102,15,102,200 ; pcmpgtd %xmm0,%xmm1 - DB 102,15,111,128,239,118,0,0 ; movdqa 0x76ef(%eax),%xmm0 + DB 102,15,111,128,207,118,0,0 ; movdqa 0x76cf(%eax),%xmm0 DB 102,15,127,69,216 ; movdqa %xmm0,-0x28(%ebp) DB 102,15,254,240 ; paddd %xmm0,%xmm6 DB 102,15,114,230,16 ; psrad $0x10,%xmm6 @@ -50459,8 +50459,8 @@ _sk_store_f16_sse2 LABEL PROC DB 102,15,97,245 ; punpcklwd %xmm5,%xmm6 DB 139,69,12 ; mov 0xc(%ebp),%eax DB 139,77,8 ; mov 0x8(%ebp),%ecx - DB 139,17 ; mov (%ecx),%edx DB 139,56 ; mov (%eax),%edi + DB 139,17 ; mov (%ecx),%edx DB 139,119,4 ; mov 0x4(%edi),%esi DB 15,175,113,4 ; imul 0x4(%ecx),%esi DB 193,230,3 ; shl $0x3,%esi @@ -50507,8 +50507,8 @@ _sk_load_u16_be_sse2 LABEL PROC DB 131,236,44 ; sub $0x2c,%esp DB 139,69,12 ; mov 0xc(%ebp),%eax DB 139,77,8 ; mov 0x8(%ebp),%ecx - DB 139,49 ; mov (%ecx),%esi DB 139,16 ; mov (%eax),%edx + DB 139,49 ; mov (%ecx),%esi DB 139,122,4 ; mov 0x4(%edx),%edi DB 15,175,121,4 ; imul 0x4(%ecx),%edi DB 1,255 ; add %edi,%edi @@ -50539,7 +50539,7 @@ _sk_load_u16_be_sse2 LABEL PROC DB 102,15,239,219 ; pxor %xmm3,%xmm3 DB 102,15,97,195 ; punpcklwd %xmm3,%xmm0 DB 15,91,192 ; cvtdq2ps %xmm0,%xmm0 - DB 15,40,162,2,118,0,0 ; movaps 0x7602(%edx),%xmm4 + DB 15,40,162,226,117,0,0 ; movaps 0x75e2(%edx),%xmm4 DB 15,89,196 ; mulps %xmm4,%xmm0 DB 102,15,111,205 ; movdqa %xmm5,%xmm1 DB 102,15,113,241,8 ; psllw $0x8,%xmm1 @@ -50606,8 +50606,8 @@ _sk_load_rgb_u16_be_sse2 LABEL PROC DB 131,236,28 ; sub $0x1c,%esp DB 139,69,12 ; mov 0xc(%ebp),%eax DB 139,77,8 ; mov 0x8(%ebp),%ecx - DB 139,121,8 ; mov 0x8(%ecx),%edi DB 139,16 ; mov (%eax),%edx + DB 139,121,8 ; mov 0x8(%ecx),%edi DB 139,114,4 ; mov 0x4(%edx),%esi DB 15,175,113,4 ; imul 0x4(%ecx),%esi DB 1,246 ; add %esi,%esi @@ -50641,7 +50641,7 @@ _sk_load_rgb_u16_be_sse2 LABEL PROC DB 102,15,239,219 ; pxor %xmm3,%xmm3 DB 102,15,97,195 ; punpcklwd %xmm3,%xmm0 DB 15,91,192 ; cvtdq2ps %xmm0,%xmm0 - DB 15,40,170,155,116,0,0 ; movaps 0x749b(%edx),%xmm5 + DB 15,40,170,123,116,0,0 ; movaps 0x747b(%edx),%xmm5 DB 15,89,197 ; mulps %xmm5,%xmm0 DB 102,15,111,204 ; movdqa %xmm4,%xmm1 DB 102,15,113,241,8 ; psllw $0x8,%xmm1 @@ -50667,7 +50667,7 @@ _sk_load_rgb_u16_be_sse2 LABEL PROC DB 15,89,213 ; mulps %xmm5,%xmm2 DB 141,112,8 ; lea 0x8(%eax),%esi DB 131,236,8 ; sub $0x8,%esp - DB 15,40,154,43,114,0,0 ; movaps 0x722b(%edx),%xmm3 + DB 15,40,154,11,114,0,0 ; movaps 0x720b(%edx),%xmm3 DB 86 ; push %esi DB 81 ; push %ecx DB 255,80,4 ; call *0x4(%eax) @@ -50712,7 +50712,7 @@ _sk_store_u16_be_sse2 LABEL PROC DB 1,210 ; add %edx,%edx DB 3,22 ; add (%esi),%edx DB 139,49 ; mov (%ecx),%esi - DB 15,40,183,247,117,0,0 ; movaps 0x75f7(%edi),%xmm6 + DB 15,40,183,215,117,0,0 ; movaps 0x75d7(%edi),%xmm6 DB 139,121,8 ; mov 0x8(%ecx),%edi DB 193,230,2 ; shl $0x2,%esi DB 15,40,224 ; movaps %xmm0,%xmm4 @@ -50791,8 +50791,8 @@ _sk_load_f32_sse2 LABEL PROC DB 86 ; push %esi DB 139,69,12 ; mov 0xc(%ebp),%eax DB 139,77,8 ; mov 0x8(%ebp),%ecx - DB 139,57 ; mov (%ecx),%edi DB 139,48 ; mov (%eax),%esi + DB 139,57 ; mov (%ecx),%edi DB 139,86,4 ; mov 0x4(%esi),%edx DB 15,175,81,4 ; imul 0x4(%ecx),%edx DB 193,226,2 ; shl $0x2,%edx @@ -50853,8 +50853,8 @@ _sk_load_f32_dst_sse2 LABEL PROC DB 15,41,85,232 ; movaps %xmm2,-0x18(%ebp) DB 139,69,12 ; mov 0xc(%ebp),%eax DB 139,77,8 ; mov 0x8(%ebp),%ecx - DB 139,57 ; mov (%ecx),%edi DB 139,48 ; mov (%eax),%esi + DB 139,57 ; mov (%ecx),%edi DB 139,86,4 ; mov 0x4(%esi),%edx DB 15,175,81,4 ; imul 0x4(%ecx),%edx DB 193,226,2 ; shl $0x2,%edx @@ -50920,8 +50920,8 @@ _sk_store_f32_sse2 LABEL PROC DB 131,236,12 ; sub $0xc,%esp DB 139,69,12 ; mov 0xc(%ebp),%eax DB 139,77,8 ; mov 0x8(%ebp),%ecx - DB 139,25 ; mov (%ecx),%ebx DB 139,48 ; mov (%eax),%esi + DB 139,25 ; mov (%ecx),%ebx DB 139,86,4 ; mov 0x4(%esi),%edx DB 15,175,81,4 ; imul 0x4(%ecx),%edx DB 193,226,2 ; shl $0x2,%edx @@ -50984,7 +50984,7 @@ _sk_repeat_x_sse2 LABEL PROC DB 243,15,91,245 ; cvttps2dq %xmm5,%xmm6 DB 15,91,246 ; cvtdq2ps %xmm6,%xmm6 DB 15,194,238,1 ; cmpltps %xmm6,%xmm5 - DB 15,84,168,179,109,0,0 ; andps 0x6db3(%eax),%xmm5 + DB 15,84,168,147,109,0,0 ; andps 0x6d93(%eax),%xmm5 DB 15,92,245 ; subps %xmm5,%xmm6 DB 15,198,228,0 ; shufps $0x0,%xmm4,%xmm4 DB 15,89,230 ; mulps %xmm6,%xmm4 @@ -51014,7 +51014,7 @@ _sk_repeat_y_sse2 LABEL PROC DB 243,15,91,245 ; cvttps2dq %xmm5,%xmm6 DB 15,91,246 ; cvtdq2ps %xmm6,%xmm6 DB 15,194,238,1 ; cmpltps %xmm6,%xmm5 - DB 15,84,168,97,109,0,0 ; andps 0x6d61(%eax),%xmm5 + DB 15,84,168,65,109,0,0 ; andps 0x6d41(%eax),%xmm5 DB 15,92,245 ; subps %xmm5,%xmm6 DB 15,198,228,0 ; shufps $0x0,%xmm4,%xmm4 DB 15,89,230 ; mulps %xmm6,%xmm4 @@ -51042,13 +51042,13 @@ _sk_mirror_x_sse2 LABEL PROC DB 15,40,244 ; movaps %xmm4,%xmm6 DB 15,198,246,0 ; shufps $0x0,%xmm6,%xmm6 DB 15,92,198 ; subps %xmm6,%xmm0 - DB 243,15,89,169,159,116,0,0 ; mulss 0x749f(%ecx),%xmm5 + DB 243,15,89,169,127,116,0,0 ; mulss 0x747f(%ecx),%xmm5 DB 15,198,237,0 ; shufps $0x0,%xmm5,%xmm5 DB 15,89,232 ; mulps %xmm0,%xmm5 DB 243,15,91,253 ; cvttps2dq %xmm5,%xmm7 DB 15,91,255 ; cvtdq2ps %xmm7,%xmm7 DB 15,194,239,1 ; cmpltps %xmm7,%xmm5 - DB 15,84,169,15,109,0,0 ; andps 0x6d0f(%ecx),%xmm5 + DB 15,84,169,239,108,0,0 ; andps 0x6cef(%ecx),%xmm5 DB 15,92,253 ; subps %xmm5,%xmm7 DB 243,15,88,228 ; addss %xmm4,%xmm4 DB 15,198,228,0 ; shufps $0x0,%xmm4,%xmm4 @@ -51081,13 +51081,13 @@ _sk_mirror_y_sse2 LABEL PROC DB 15,40,244 ; movaps %xmm4,%xmm6 DB 15,198,246,0 ; shufps $0x0,%xmm6,%xmm6 DB 15,92,206 ; subps %xmm6,%xmm1 - DB 243,15,89,169,43,116,0,0 ; mulss 0x742b(%ecx),%xmm5 + DB 243,15,89,169,11,116,0,0 ; mulss 0x740b(%ecx),%xmm5 DB 15,198,237,0 ; shufps $0x0,%xmm5,%xmm5 DB 15,89,233 ; mulps %xmm1,%xmm5 DB 243,15,91,253 ; cvttps2dq %xmm5,%xmm7 DB 15,91,255 ; cvtdq2ps %xmm7,%xmm7 DB 15,194,239,1 ; cmpltps %xmm7,%xmm5 - DB 15,84,169,155,108,0,0 ; andps 0x6c9b(%ecx),%xmm5 + DB 15,84,169,123,108,0,0 ; andps 0x6c7b(%ecx),%xmm5 DB 15,92,253 ; subps %xmm5,%xmm7 DB 243,15,88,228 ; addss %xmm4,%xmm4 DB 15,198,228,0 ; shufps $0x0,%xmm4,%xmm4 @@ -51116,7 +51116,7 @@ _sk_clamp_x_1_sse2 LABEL PROC DB 139,77,12 ; mov 0xc(%ebp),%ecx DB 15,87,228 ; xorps %xmm4,%xmm4 DB 15,95,224 ; maxps %xmm0,%xmm4 - DB 15,93,160,39,108,0,0 ; minps 0x6c27(%eax),%xmm4 + DB 15,93,160,7,108,0,0 ; minps 0x6c07(%eax),%xmm4 DB 141,65,4 ; lea 0x4(%ecx),%eax DB 131,236,8 ; sub $0x8,%esp DB 15,40,196 ; movaps %xmm4,%xmm0 @@ -51139,7 +51139,7 @@ _sk_repeat_x_1_sse2 LABEL PROC DB 15,91,228 ; cvtdq2ps %xmm4,%xmm4 DB 15,40,232 ; movaps %xmm0,%xmm5 DB 15,194,236,1 ; cmpltps %xmm4,%xmm5 - DB 15,84,168,247,107,0,0 ; andps 0x6bf7(%eax),%xmm5 + DB 15,84,168,215,107,0,0 ; andps 0x6bd7(%eax),%xmm5 DB 15,92,229 ; subps %xmm5,%xmm4 DB 15,92,196 ; subps %xmm4,%xmm0 DB 141,65,4 ; lea 0x4(%ecx),%eax @@ -51159,14 +51159,14 @@ _sk_mirror_x_1_sse2 LABEL PROC DB 232,0,0,0,0 ; call 6134 <_sk_mirror_x_1_sse2+0xb> DB 89 ; pop %ecx DB 139,69,12 ; mov 0xc(%ebp),%eax - DB 15,40,161,44,108,0,0 ; movaps 0x6c2c(%ecx),%xmm4 + DB 15,40,161,12,108,0,0 ; movaps 0x6c0c(%ecx),%xmm4 DB 15,88,196 ; addps %xmm4,%xmm0 - DB 15,40,169,172,107,0,0 ; movaps 0x6bac(%ecx),%xmm5 + DB 15,40,169,140,107,0,0 ; movaps 0x6b8c(%ecx),%xmm5 DB 15,89,232 ; mulps %xmm0,%xmm5 DB 243,15,91,245 ; cvttps2dq %xmm5,%xmm6 DB 15,91,246 ; cvtdq2ps %xmm6,%xmm6 DB 15,194,238,1 ; cmpltps %xmm6,%xmm5 - DB 15,84,169,188,107,0,0 ; andps 0x6bbc(%ecx),%xmm5 + DB 15,84,169,156,107,0,0 ; andps 0x6b9c(%ecx),%xmm5 DB 15,87,255 ; xorps %xmm7,%xmm7 DB 15,92,245 ; subps %xmm5,%xmm6 DB 15,88,246 ; addps %xmm6,%xmm6 @@ -51192,10 +51192,10 @@ _sk_luminance_to_alpha_sse2 LABEL PROC DB 232,0,0,0,0 ; call 6192 <_sk_luminance_to_alpha_sse2+0xe> DB 88 ; pop %eax DB 139,77,12 ; mov 0xc(%ebp),%ecx - DB 15,89,128,142,112,0,0 ; mulps 0x708e(%eax),%xmm0 - DB 15,89,136,158,112,0,0 ; mulps 0x709e(%eax),%xmm1 + DB 15,89,128,110,112,0,0 ; mulps 0x706e(%eax),%xmm0 + DB 15,89,136,126,112,0,0 ; mulps 0x707e(%eax),%xmm1 DB 15,88,200 ; addps %xmm0,%xmm1 - DB 15,89,152,174,112,0,0 ; mulps 0x70ae(%eax),%xmm3 + DB 15,89,152,142,112,0,0 ; mulps 0x708e(%eax),%xmm3 DB 15,88,217 ; addps %xmm1,%xmm3 DB 141,65,4 ; lea 0x4(%ecx),%eax DB 131,236,8 ; sub $0x8,%esp @@ -51363,13 +51363,12 @@ _sk_matrix_4x5_sse2 LABEL PROC DB 137,229 ; mov %esp,%ebp DB 131,236,8 ; sub $0x8,%esp DB 15,40,233 ; movaps %xmm1,%xmm5 + DB 15,40,224 ; movaps %xmm0,%xmm4 DB 139,69,12 ; mov 0xc(%ebp),%eax - DB 141,72,4 ; lea 0x4(%eax),%ecx - DB 137,77,252 ; mov %ecx,-0x4(%ebp) DB 139,8 ; mov (%eax),%ecx - DB 243,15,16,33 ; movss (%ecx),%xmm4 + DB 243,15,16,1 ; movss (%ecx),%xmm0 DB 243,15,16,73,4 ; movss 0x4(%ecx),%xmm1 - DB 15,198,228,0 ; shufps $0x0,%xmm4,%xmm4 + DB 15,198,192,0 ; shufps $0x0,%xmm0,%xmm0 DB 243,15,16,113,48 ; movss 0x30(%ecx),%xmm6 DB 15,198,246,0 ; shufps $0x0,%xmm6,%xmm6 DB 243,15,16,121,64 ; movss 0x40(%ecx),%xmm7 @@ -51384,8 +51383,8 @@ _sk_matrix_4x5_sse2 LABEL PROC DB 15,198,246,0 ; shufps $0x0,%xmm6,%xmm6 DB 15,89,245 ; mulps %xmm5,%xmm6 DB 15,88,247 ; addps %xmm7,%xmm6 - DB 15,89,224 ; mulps %xmm0,%xmm4 - DB 15,88,230 ; addps %xmm6,%xmm4 + DB 15,89,196 ; mulps %xmm4,%xmm0 + DB 15,88,198 ; addps %xmm6,%xmm0 DB 15,198,201,0 ; shufps $0x0,%xmm1,%xmm1 DB 243,15,16,113,52 ; movss 0x34(%ecx),%xmm6 DB 15,198,246,0 ; shufps $0x0,%xmm6,%xmm6 @@ -51401,7 +51400,7 @@ _sk_matrix_4x5_sse2 LABEL PROC DB 15,198,246,0 ; shufps $0x0,%xmm6,%xmm6 DB 15,89,245 ; mulps %xmm5,%xmm6 DB 15,88,247 ; addps %xmm7,%xmm6 - DB 15,89,200 ; mulps %xmm0,%xmm1 + DB 15,89,204 ; mulps %xmm4,%xmm1 DB 15,88,206 ; addps %xmm6,%xmm1 DB 243,15,16,113,56 ; movss 0x38(%ecx),%xmm6 DB 15,198,246,0 ; shufps $0x0,%xmm6,%xmm6 @@ -51419,7 +51418,7 @@ _sk_matrix_4x5_sse2 LABEL PROC DB 15,88,247 ; addps %xmm7,%xmm6 DB 243,15,16,121,8 ; movss 0x8(%ecx),%xmm7 DB 15,198,255,0 ; shufps $0x0,%xmm7,%xmm7 - DB 15,89,248 ; mulps %xmm0,%xmm7 + DB 15,89,252 ; mulps %xmm4,%xmm7 DB 15,88,254 ; addps %xmm6,%xmm7 DB 243,15,16,113,60 ; movss 0x3c(%ecx),%xmm6 DB 15,198,246,0 ; shufps $0x0,%xmm6,%xmm6 @@ -51437,15 +51436,13 @@ _sk_matrix_4x5_sse2 LABEL PROC DB 15,88,211 ; addps %xmm3,%xmm2 DB 243,15,16,89,12 ; movss 0xc(%ecx),%xmm3 DB 15,198,219,0 ; shufps $0x0,%xmm3,%xmm3 - DB 15,89,216 ; mulps %xmm0,%xmm3 + DB 15,89,220 ; mulps %xmm4,%xmm3 DB 15,88,218 ; addps %xmm2,%xmm3 - DB 139,77,8 ; mov 0x8(%ebp),%ecx - DB 141,80,8 ; lea 0x8(%eax),%edx + DB 141,72,8 ; lea 0x8(%eax),%ecx DB 131,236,8 ; sub $0x8,%esp - DB 15,40,196 ; movaps %xmm4,%xmm0 DB 15,40,215 ; movaps %xmm7,%xmm2 - DB 82 ; push %edx DB 81 ; push %ecx + DB 255,117,8 ; pushl 0x8(%ebp) DB 255,80,4 ; call *0x4(%eax) DB 131,196,24 ; add $0x18,%esp DB 93 ; pop %ebp @@ -51569,23 +51566,21 @@ _sk_evenly_spaced_gradient_sse2 LABEL PROC DB 86 ; push %esi DB 131,236,60 ; sub $0x3c,%esp DB 15,41,69,184 ; movaps %xmm0,-0x48(%ebp) - DB 232,0,0,0,0 ; call 662f <_sk_evenly_spaced_gradient_sse2+0x12> + DB 232,0,0,0,0 ; call 6628 <_sk_evenly_spaced_gradient_sse2+0x12> DB 90 ; pop %edx - DB 139,77,12 ; mov 0xc(%ebp),%ecx - DB 141,65,4 ; lea 0x4(%ecx),%eax - DB 137,69,240 ; mov %eax,-0x10(%ebp) - DB 139,9 ; mov (%ecx),%ecx + DB 139,69,12 ; mov 0xc(%ebp),%eax + DB 139,8 ; mov (%eax),%ecx DB 139,49 ; mov (%ecx),%esi DB 139,65,4 ; mov 0x4(%ecx),%eax DB 78 ; dec %esi DB 102,15,110,206 ; movd %esi,%xmm1 DB 102,15,112,201,0 ; pshufd $0x0,%xmm1,%xmm1 - DB 102,15,111,146,33,108,0,0 ; movdqa 0x6c21(%edx),%xmm2 + DB 102,15,111,146,8,108,0,0 ; movdqa 0x6c08(%edx),%xmm2 DB 102,15,219,209 ; pand %xmm1,%xmm2 - DB 102,15,235,146,225,105,0,0 ; por 0x69e1(%edx),%xmm2 + DB 102,15,235,146,200,105,0,0 ; por 0x69c8(%edx),%xmm2 DB 102,15,114,209,16 ; psrld $0x10,%xmm1 - DB 102,15,235,138,49,108,0,0 ; por 0x6c31(%edx),%xmm1 - DB 15,88,138,65,108,0,0 ; addps 0x6c41(%edx),%xmm1 + DB 102,15,235,138,24,108,0,0 ; por 0x6c18(%edx),%xmm1 + DB 15,88,138,40,108,0,0 ; addps 0x6c28(%edx),%xmm1 DB 15,88,202 ; addps %xmm2,%xmm1 DB 15,89,200 ; mulps %xmm0,%xmm1 DB 243,15,91,201 ; cvttps2dq %xmm1,%xmm1 @@ -51670,14 +51665,13 @@ _sk_evenly_spaced_gradient_sse2 LABEL PROC DB 15,88,215 ; addps %xmm7,%xmm2 DB 15,89,221 ; mulps %xmm5,%xmm3 DB 15,88,216 ; addps %xmm0,%xmm3 - DB 139,69,8 ; mov 0x8(%ebp),%eax - DB 139,85,12 ; mov 0xc(%ebp),%edx - DB 141,74,8 ; lea 0x8(%edx),%ecx + DB 139,77,12 ; mov 0xc(%ebp),%ecx + DB 141,65,8 ; lea 0x8(%ecx),%eax DB 131,236,8 ; sub $0x8,%esp DB 15,40,196 ; movaps %xmm4,%xmm0 - DB 81 ; push %ecx DB 80 ; push %eax - DB 255,82,4 ; call *0x4(%edx) + DB 255,117,8 ; pushl 0x8(%ebp) + DB 255,81,4 ; call *0x4(%ecx) DB 131,196,76 ; add $0x4c,%esp DB 94 ; pop %esi DB 95 ; pop %edi @@ -51690,18 +51684,18 @@ _sk_gauss_a_to_rgba_sse2 LABEL PROC DB 85 ; push %ebp DB 137,229 ; mov %esp,%ebp DB 131,236,8 ; sub $0x8,%esp - DB 232,0,0,0,0 ; call 67ef <_sk_gauss_a_to_rgba_sse2+0xb> + DB 232,0,0,0,0 ; call 67e1 <_sk_gauss_a_to_rgba_sse2+0xb> DB 88 ; pop %eax DB 139,77,12 ; mov 0xc(%ebp),%ecx - DB 15,40,128,145,106,0,0 ; movaps 0x6a91(%eax),%xmm0 + DB 15,40,128,127,106,0,0 ; movaps 0x6a7f(%eax),%xmm0 DB 15,89,195 ; mulps %xmm3,%xmm0 - DB 15,88,128,161,106,0,0 ; addps 0x6aa1(%eax),%xmm0 + DB 15,88,128,143,106,0,0 ; addps 0x6a8f(%eax),%xmm0 DB 15,89,195 ; mulps %xmm3,%xmm0 - DB 15,88,128,177,106,0,0 ; addps 0x6ab1(%eax),%xmm0 + DB 15,88,128,159,106,0,0 ; addps 0x6a9f(%eax),%xmm0 DB 15,89,195 ; mulps %xmm3,%xmm0 - DB 15,88,128,193,106,0,0 ; addps 0x6ac1(%eax),%xmm0 + DB 15,88,128,175,106,0,0 ; addps 0x6aaf(%eax),%xmm0 DB 15,89,195 ; mulps %xmm3,%xmm0 - DB 15,88,128,209,106,0,0 ; addps 0x6ad1(%eax),%xmm0 + DB 15,88,128,191,106,0,0 ; addps 0x6abf(%eax),%xmm0 DB 141,65,4 ; lea 0x4(%ecx),%eax DB 131,236,8 ; sub $0x8,%esp DB 15,40,200 ; movaps %xmm0,%xmm1 @@ -51722,16 +51716,14 @@ _sk_gradient_sse2 LABEL PROC DB 87 ; push %edi DB 86 ; push %esi DB 131,236,60 ; sub $0x3c,%esp - DB 139,77,12 ; mov 0xc(%ebp),%ecx - DB 141,81,4 ; lea 0x4(%ecx),%edx - DB 137,85,240 ; mov %edx,-0x10(%ebp) - DB 139,9 ; mov (%ecx),%ecx - DB 139,17 ; mov (%ecx),%edx + DB 139,69,12 ; mov 0xc(%ebp),%eax + DB 139,16 ; mov (%eax),%edx + DB 139,10 ; mov (%edx),%ecx DB 102,15,239,201 ; pxor %xmm1,%xmm1 - DB 131,250,2 ; cmp $0x2,%edx - DB 114,33 ; jb 687c <_sk_gradient_sse2+0x40> - DB 139,113,36 ; mov 0x24(%ecx),%esi - DB 74 ; dec %edx + DB 131,249,2 ; cmp $0x2,%ecx + DB 114,33 ; jb 6868 <_sk_gradient_sse2+0x3a> + DB 139,114,36 ; mov 0x24(%edx),%esi + DB 73 ; dec %ecx DB 131,198,4 ; add $0x4,%esi DB 102,15,239,201 ; pxor %xmm1,%xmm1 DB 243,15,16,22 ; movss (%esi),%xmm2 @@ -51739,80 +51731,80 @@ _sk_gradient_sse2 LABEL PROC DB 15,194,208,2 ; cmpleps %xmm0,%xmm2 DB 102,15,250,202 ; psubd %xmm2,%xmm1 DB 131,198,4 ; add $0x4,%esi - DB 74 ; dec %edx - DB 117,234 ; jne 6866 <_sk_gradient_sse2+0x2a> - DB 102,15,126,202 ; movd %xmm1,%edx + DB 73 ; dec %ecx + DB 117,234 ; jne 6852 <_sk_gradient_sse2+0x24> + DB 102,15,126,206 ; movd %xmm1,%esi DB 102,15,112,209,229 ; pshufd $0xe5,%xmm1,%xmm2 DB 102,15,112,217,78 ; pshufd $0x4e,%xmm1,%xmm3 - DB 102,15,126,222 ; movd %xmm3,%esi + DB 102,15,126,223 ; movd %xmm3,%edi DB 102,15,112,201,231 ; pshufd $0xe7,%xmm1,%xmm1 - DB 102,15,126,207 ; movd %xmm1,%edi - DB 139,65,4 ; mov 0x4(%ecx),%eax - DB 243,15,16,12,184 ; movss (%eax,%edi,4),%xmm1 - DB 243,15,16,28,176 ; movss (%eax,%esi,4),%xmm3 - DB 243,15,16,36,144 ; movss (%eax,%edx,4),%xmm4 - DB 102,15,126,211 ; movd %xmm2,%ebx - DB 243,15,16,20,152 ; movss (%eax,%ebx,4),%xmm2 + DB 102,15,126,203 ; movd %xmm1,%ebx + DB 139,66,4 ; mov 0x4(%edx),%eax + DB 243,15,16,12,152 ; movss (%eax,%ebx,4),%xmm1 + DB 243,15,16,28,184 ; movss (%eax,%edi,4),%xmm3 + DB 243,15,16,36,176 ; movss (%eax,%esi,4),%xmm4 + DB 102,15,126,209 ; movd %xmm2,%ecx + DB 243,15,16,20,136 ; movss (%eax,%ecx,4),%xmm2 DB 15,20,217 ; unpcklps %xmm1,%xmm3 - DB 139,65,20 ; mov 0x14(%ecx),%eax - DB 243,15,16,12,184 ; movss (%eax,%edi,4),%xmm1 - DB 243,15,16,52,176 ; movss (%eax,%esi,4),%xmm6 - DB 243,15,16,44,144 ; movss (%eax,%edx,4),%xmm5 - DB 243,15,16,60,152 ; movss (%eax,%ebx,4),%xmm7 + DB 139,66,20 ; mov 0x14(%edx),%eax + DB 243,15,16,12,152 ; movss (%eax,%ebx,4),%xmm1 + DB 243,15,16,52,184 ; movss (%eax,%edi,4),%xmm6 + DB 243,15,16,44,176 ; movss (%eax,%esi,4),%xmm5 + DB 243,15,16,60,136 ; movss (%eax,%ecx,4),%xmm7 DB 15,20,226 ; unpcklps %xmm2,%xmm4 DB 102,15,20,227 ; unpcklpd %xmm3,%xmm4 DB 102,15,41,101,184 ; movapd %xmm4,-0x48(%ebp) DB 15,20,241 ; unpcklps %xmm1,%xmm6 DB 15,20,239 ; unpcklps %xmm7,%xmm5 - DB 139,65,8 ; mov 0x8(%ecx),%eax - DB 243,15,16,20,184 ; movss (%eax,%edi,4),%xmm2 - DB 243,15,16,28,176 ; movss (%eax,%esi,4),%xmm3 - DB 243,15,16,12,144 ; movss (%eax,%edx,4),%xmm1 - DB 243,15,16,60,152 ; movss (%eax,%ebx,4),%xmm7 + DB 139,66,8 ; mov 0x8(%edx),%eax + DB 243,15,16,20,152 ; movss (%eax,%ebx,4),%xmm2 + DB 243,15,16,28,184 ; movss (%eax,%edi,4),%xmm3 + DB 243,15,16,12,176 ; movss (%eax,%esi,4),%xmm1 + DB 243,15,16,60,136 ; movss (%eax,%ecx,4),%xmm7 DB 102,15,20,238 ; unpcklpd %xmm6,%xmm5 DB 102,15,41,109,200 ; movapd %xmm5,-0x38(%ebp) DB 15,20,218 ; unpcklps %xmm2,%xmm3 DB 15,20,207 ; unpcklps %xmm7,%xmm1 DB 102,15,20,203 ; unpcklpd %xmm3,%xmm1 - DB 139,65,24 ; mov 0x18(%ecx),%eax - DB 243,15,16,20,184 ; movss (%eax,%edi,4),%xmm2 - DB 243,15,16,28,176 ; movss (%eax,%esi,4),%xmm3 - DB 243,15,16,36,144 ; movss (%eax,%edx,4),%xmm4 - DB 243,15,16,60,152 ; movss (%eax,%ebx,4),%xmm7 + DB 139,66,24 ; mov 0x18(%edx),%eax + DB 243,15,16,20,152 ; movss (%eax,%ebx,4),%xmm2 + DB 243,15,16,28,184 ; movss (%eax,%edi,4),%xmm3 + DB 243,15,16,36,176 ; movss (%eax,%esi,4),%xmm4 + DB 243,15,16,60,136 ; movss (%eax,%ecx,4),%xmm7 DB 15,20,218 ; unpcklps %xmm2,%xmm3 DB 15,20,231 ; unpcklps %xmm7,%xmm4 DB 102,15,20,227 ; unpcklpd %xmm3,%xmm4 DB 102,15,41,101,216 ; movapd %xmm4,-0x28(%ebp) - DB 139,65,12 ; mov 0xc(%ecx),%eax - DB 243,15,16,20,184 ; movss (%eax,%edi,4),%xmm2 - DB 243,15,16,28,176 ; movss (%eax,%esi,4),%xmm3 + DB 139,66,12 ; mov 0xc(%edx),%eax + DB 243,15,16,20,152 ; movss (%eax,%ebx,4),%xmm2 + DB 243,15,16,28,184 ; movss (%eax,%edi,4),%xmm3 DB 15,20,218 ; unpcklps %xmm2,%xmm3 - DB 243,15,16,20,144 ; movss (%eax,%edx,4),%xmm2 - DB 243,15,16,60,152 ; movss (%eax,%ebx,4),%xmm7 + DB 243,15,16,20,176 ; movss (%eax,%esi,4),%xmm2 + DB 243,15,16,60,136 ; movss (%eax,%ecx,4),%xmm7 DB 15,20,215 ; unpcklps %xmm7,%xmm2 DB 102,15,20,211 ; unpcklpd %xmm3,%xmm2 - DB 139,65,28 ; mov 0x1c(%ecx),%eax - DB 243,15,16,60,184 ; movss (%eax,%edi,4),%xmm7 - DB 243,15,16,28,176 ; movss (%eax,%esi,4),%xmm3 + DB 139,66,28 ; mov 0x1c(%edx),%eax + DB 243,15,16,60,152 ; movss (%eax,%ebx,4),%xmm7 + DB 243,15,16,28,184 ; movss (%eax,%edi,4),%xmm3 DB 15,20,223 ; unpcklps %xmm7,%xmm3 - DB 243,15,16,60,144 ; movss (%eax,%edx,4),%xmm7 - DB 243,15,16,44,152 ; movss (%eax,%ebx,4),%xmm5 + DB 243,15,16,60,176 ; movss (%eax,%esi,4),%xmm7 + DB 243,15,16,44,136 ; movss (%eax,%ecx,4),%xmm5 DB 15,20,253 ; unpcklps %xmm5,%xmm7 DB 102,15,20,251 ; unpcklpd %xmm3,%xmm7 - DB 139,65,16 ; mov 0x10(%ecx),%eax - DB 243,15,16,28,184 ; movss (%eax,%edi,4),%xmm3 - DB 243,15,16,44,176 ; movss (%eax,%esi,4),%xmm5 + DB 139,66,16 ; mov 0x10(%edx),%eax + DB 243,15,16,28,152 ; movss (%eax,%ebx,4),%xmm3 + DB 243,15,16,44,184 ; movss (%eax,%edi,4),%xmm5 DB 15,20,235 ; unpcklps %xmm3,%xmm5 - DB 243,15,16,28,144 ; movss (%eax,%edx,4),%xmm3 - DB 243,15,16,52,152 ; movss (%eax,%ebx,4),%xmm6 + DB 243,15,16,28,176 ; movss (%eax,%esi,4),%xmm3 + DB 243,15,16,52,136 ; movss (%eax,%ecx,4),%xmm6 DB 15,20,222 ; unpcklps %xmm6,%xmm3 DB 102,15,20,221 ; unpcklpd %xmm5,%xmm3 - DB 139,65,32 ; mov 0x20(%ecx),%eax - DB 243,15,16,44,184 ; movss (%eax,%edi,4),%xmm5 - DB 243,15,16,52,176 ; movss (%eax,%esi,4),%xmm6 + DB 139,66,32 ; mov 0x20(%edx),%eax + DB 243,15,16,44,152 ; movss (%eax,%ebx,4),%xmm5 + DB 243,15,16,52,184 ; movss (%eax,%edi,4),%xmm6 DB 15,20,245 ; unpcklps %xmm5,%xmm6 - DB 243,15,16,44,144 ; movss (%eax,%edx,4),%xmm5 - DB 243,15,16,36,152 ; movss (%eax,%ebx,4),%xmm4 + DB 243,15,16,44,176 ; movss (%eax,%esi,4),%xmm5 + DB 243,15,16,36,136 ; movss (%eax,%ecx,4),%xmm4 DB 15,20,236 ; unpcklps %xmm4,%xmm5 DB 102,15,20,238 ; unpcklpd %xmm6,%xmm5 DB 15,40,101,184 ; movaps -0x48(%ebp),%xmm4 @@ -51824,13 +51816,14 @@ _sk_gradient_sse2 LABEL PROC DB 15,88,215 ; addps %xmm7,%xmm2 DB 15,89,216 ; mulps %xmm0,%xmm3 DB 15,88,221 ; addps %xmm5,%xmm3 - DB 139,69,240 ; mov -0x10(%ebp),%eax - DB 141,72,4 ; lea 0x4(%eax),%ecx + DB 139,69,12 ; mov 0xc(%ebp),%eax + DB 137,193 ; mov %eax,%ecx + DB 141,65,8 ; lea 0x8(%ecx),%eax DB 131,236,8 ; sub $0x8,%esp DB 15,40,196 ; movaps %xmm4,%xmm0 - DB 81 ; push %ecx + DB 80 ; push %eax DB 255,117,8 ; pushl 0x8(%ebp) - DB 255,16 ; call *(%eax) + DB 255,81,4 ; call *0x4(%ecx) DB 131,196,76 ; add $0x4c,%esp DB 94 ; pop %esi DB 95 ; pop %edi @@ -51888,7 +51881,7 @@ _sk_xy_to_unit_angle_sse2 LABEL PROC DB 15,40,218 ; movaps %xmm2,%xmm3 DB 15,40,209 ; movaps %xmm1,%xmm2 DB 15,40,200 ; movaps %xmm0,%xmm1 - DB 232,0,0,0,0 ; call 6a81 <_sk_xy_to_unit_angle_sse2+0x18> + DB 232,0,0,0,0 ; call 6a70 <_sk_xy_to_unit_angle_sse2+0x18> DB 88 ; pop %eax DB 15,87,237 ; xorps %xmm5,%xmm5 DB 15,92,233 ; subps %xmm1,%xmm5 @@ -51903,30 +51896,30 @@ _sk_xy_to_unit_angle_sse2 LABEL PROC DB 15,94,247 ; divps %xmm7,%xmm6 DB 15,40,254 ; movaps %xmm6,%xmm7 DB 15,89,255 ; mulps %xmm7,%xmm7 - DB 15,40,128,79,104,0,0 ; movaps 0x684f(%eax),%xmm0 + DB 15,40,128,64,104,0,0 ; movaps 0x6840(%eax),%xmm0 DB 15,89,199 ; mulps %xmm7,%xmm0 - DB 15,88,128,95,104,0,0 ; addps 0x685f(%eax),%xmm0 + DB 15,88,128,80,104,0,0 ; addps 0x6850(%eax),%xmm0 DB 15,89,199 ; mulps %xmm7,%xmm0 - DB 15,88,128,111,104,0,0 ; addps 0x686f(%eax),%xmm0 + DB 15,88,128,96,104,0,0 ; addps 0x6860(%eax),%xmm0 DB 15,89,199 ; mulps %xmm7,%xmm0 - DB 15,88,128,127,104,0,0 ; addps 0x687f(%eax),%xmm0 + DB 15,88,128,112,104,0,0 ; addps 0x6870(%eax),%xmm0 DB 15,89,198 ; mulps %xmm6,%xmm0 DB 15,194,236,1 ; cmpltps %xmm4,%xmm5 - DB 15,40,176,143,104,0,0 ; movaps 0x688f(%eax),%xmm6 + DB 15,40,176,128,104,0,0 ; movaps 0x6880(%eax),%xmm6 DB 15,92,240 ; subps %xmm0,%xmm6 DB 15,84,245 ; andps %xmm5,%xmm6 DB 15,85,232 ; andnps %xmm0,%xmm5 DB 15,87,228 ; xorps %xmm4,%xmm4 DB 15,86,238 ; orps %xmm6,%xmm5 DB 15,194,204,1 ; cmpltps %xmm4,%xmm1 - DB 15,40,128,95,98,0,0 ; movaps 0x625f(%eax),%xmm0 + DB 15,40,128,80,98,0,0 ; movaps 0x6250(%eax),%xmm0 DB 15,92,197 ; subps %xmm5,%xmm0 DB 15,84,193 ; andps %xmm1,%xmm0 DB 15,85,205 ; andnps %xmm5,%xmm1 DB 15,86,200 ; orps %xmm0,%xmm1 DB 15,40,194 ; movaps %xmm2,%xmm0 DB 15,194,196,1 ; cmpltps %xmm4,%xmm0 - DB 15,40,168,111,98,0,0 ; movaps 0x626f(%eax),%xmm5 + DB 15,40,168,96,98,0,0 ; movaps 0x6260(%eax),%xmm5 DB 15,92,233 ; subps %xmm1,%xmm5 DB 15,84,232 ; andps %xmm0,%xmm5 DB 15,85,193 ; andnps %xmm1,%xmm0 @@ -51983,15 +51976,15 @@ _sk_xy_to_2pt_conical_quadratic_max_sse2 LABEL PROC DB 15,40,241 ; movaps %xmm1,%xmm6 DB 15,89,246 ; mulps %xmm6,%xmm6 DB 15,88,240 ; addps %xmm0,%xmm6 - DB 232,0,0,0,0 ; call 6b9e <_sk_xy_to_2pt_conical_quadratic_max_sse2+0x31> + DB 232,0,0,0,0 ; call 6b8d <_sk_xy_to_2pt_conical_quadratic_max_sse2+0x31> DB 90 ; pop %edx DB 243,15,89,237 ; mulss %xmm5,%xmm5 DB 15,198,237,0 ; shufps $0x0,%xmm5,%xmm5 DB 15,92,245 ; subps %xmm5,%xmm6 DB 243,15,16,65,32 ; movss 0x20(%ecx),%xmm0 DB 15,198,192,0 ; shufps $0x0,%xmm0,%xmm0 - DB 15,89,162,130,103,0,0 ; mulps 0x6782(%edx),%xmm4 - DB 15,89,130,146,103,0,0 ; mulps 0x6792(%edx),%xmm0 + DB 15,89,162,115,103,0,0 ; mulps 0x6773(%edx),%xmm4 + DB 15,89,130,131,103,0,0 ; mulps 0x6783(%edx),%xmm0 DB 15,89,198 ; mulps %xmm6,%xmm0 DB 15,40,236 ; movaps %xmm4,%xmm5 DB 15,89,237 ; mulps %xmm5,%xmm5 @@ -51999,11 +51992,11 @@ _sk_xy_to_2pt_conical_quadratic_max_sse2 LABEL PROC DB 15,81,237 ; sqrtps %xmm5,%xmm5 DB 15,40,197 ; movaps %xmm5,%xmm0 DB 15,92,196 ; subps %xmm4,%xmm0 - DB 15,87,162,50,102,0,0 ; xorps 0x6632(%edx),%xmm4 + DB 15,87,162,35,102,0,0 ; xorps 0x6623(%edx),%xmm4 DB 15,92,229 ; subps %xmm5,%xmm4 DB 243,15,16,105,36 ; movss 0x24(%ecx),%xmm5 DB 15,198,237,0 ; shufps $0x0,%xmm5,%xmm5 - DB 15,89,170,66,97,0,0 ; mulps 0x6142(%edx),%xmm5 + DB 15,89,170,51,97,0,0 ; mulps 0x6133(%edx),%xmm5 DB 15,89,197 ; mulps %xmm5,%xmm0 DB 15,89,229 ; mulps %xmm5,%xmm4 DB 15,95,196 ; maxps %xmm4,%xmm0 @@ -52032,15 +52025,15 @@ _sk_xy_to_2pt_conical_quadratic_min_sse2 LABEL PROC DB 15,40,241 ; movaps %xmm1,%xmm6 DB 15,89,246 ; mulps %xmm6,%xmm6 DB 15,88,240 ; addps %xmm0,%xmm6 - DB 232,0,0,0,0 ; call 6c3c <_sk_xy_to_2pt_conical_quadratic_min_sse2+0x31> + DB 232,0,0,0,0 ; call 6c2b <_sk_xy_to_2pt_conical_quadratic_min_sse2+0x31> DB 90 ; pop %edx DB 243,15,89,237 ; mulss %xmm5,%xmm5 DB 15,198,237,0 ; shufps $0x0,%xmm5,%xmm5 DB 15,92,245 ; subps %xmm5,%xmm6 DB 243,15,16,65,32 ; movss 0x20(%ecx),%xmm0 DB 15,198,192,0 ; shufps $0x0,%xmm0,%xmm0 - DB 15,89,162,228,102,0,0 ; mulps 0x66e4(%edx),%xmm4 - DB 15,89,130,244,102,0,0 ; mulps 0x66f4(%edx),%xmm0 + DB 15,89,162,213,102,0,0 ; mulps 0x66d5(%edx),%xmm4 + DB 15,89,130,229,102,0,0 ; mulps 0x66e5(%edx),%xmm0 DB 15,89,198 ; mulps %xmm6,%xmm0 DB 15,40,236 ; movaps %xmm4,%xmm5 DB 15,89,237 ; mulps %xmm5,%xmm5 @@ -52048,11 +52041,11 @@ _sk_xy_to_2pt_conical_quadratic_min_sse2 LABEL PROC DB 15,81,237 ; sqrtps %xmm5,%xmm5 DB 15,40,197 ; movaps %xmm5,%xmm0 DB 15,92,196 ; subps %xmm4,%xmm0 - DB 15,87,162,148,101,0,0 ; xorps 0x6594(%edx),%xmm4 + DB 15,87,162,133,101,0,0 ; xorps 0x6585(%edx),%xmm4 DB 15,92,229 ; subps %xmm5,%xmm4 DB 243,15,16,105,36 ; movss 0x24(%ecx),%xmm5 DB 15,198,237,0 ; shufps $0x0,%xmm5,%xmm5 - DB 15,89,170,164,96,0,0 ; mulps 0x60a4(%edx),%xmm5 + DB 15,89,170,149,96,0,0 ; mulps 0x6095(%edx),%xmm5 DB 15,89,197 ; mulps %xmm5,%xmm0 DB 15,89,229 ; mulps %xmm5,%xmm4 DB 15,93,196 ; minps %xmm4,%xmm0 @@ -52070,7 +52063,7 @@ _sk_xy_to_2pt_conical_linear_sse2 LABEL PROC DB 85 ; push %ebp DB 137,229 ; mov %esp,%ebp DB 131,236,8 ; sub $0x8,%esp - DB 232,0,0,0,0 ; call 6cb4 <_sk_xy_to_2pt_conical_linear_sse2+0xb> + DB 232,0,0,0,0 ; call 6ca3 <_sk_xy_to_2pt_conical_linear_sse2+0xb> DB 89 ; pop %ecx DB 139,69,12 ; mov 0xc(%ebp),%eax DB 139,16 ; mov (%eax),%edx @@ -52079,7 +52072,7 @@ _sk_xy_to_2pt_conical_linear_sse2 LABEL PROC DB 243,15,89,236 ; mulss %xmm4,%xmm5 DB 15,198,237,0 ; shufps $0x0,%xmm5,%xmm5 DB 15,88,232 ; addps %xmm0,%xmm5 - DB 15,89,169,108,102,0,0 ; mulps 0x666c(%ecx),%xmm5 + DB 15,89,169,93,102,0,0 ; mulps 0x665d(%ecx),%xmm5 DB 15,89,192 ; mulps %xmm0,%xmm0 DB 15,40,241 ; movaps %xmm1,%xmm6 DB 15,89,246 ; mulps %xmm6,%xmm6 @@ -52087,7 +52080,7 @@ _sk_xy_to_2pt_conical_linear_sse2 LABEL PROC DB 243,15,89,228 ; mulss %xmm4,%xmm4 DB 15,198,228,0 ; shufps $0x0,%xmm4,%xmm4 DB 15,92,196 ; subps %xmm4,%xmm0 - DB 15,87,129,28,101,0,0 ; xorps 0x651c(%ecx),%xmm0 + DB 15,87,129,13,101,0,0 ; xorps 0x650d(%ecx),%xmm0 DB 15,94,197 ; divps %xmm5,%xmm0 DB 141,72,8 ; lea 0x8(%eax),%ecx DB 131,236,8 ; sub $0x8,%esp @@ -52158,16 +52151,16 @@ _sk_save_xy_sse2 LABEL PROC DB 131,236,24 ; sub $0x18,%esp DB 15,41,93,232 ; movaps %xmm3,-0x18(%ebp) DB 15,40,218 ; movaps %xmm2,%xmm3 - DB 232,0,0,0,0 ; call 6d9d <_sk_save_xy_sse2+0x12> + DB 232,0,0,0,0 ; call 6d8c <_sk_save_xy_sse2+0x12> DB 88 ; pop %eax - DB 15,40,160,67,95,0,0 ; movaps 0x5f43(%eax),%xmm4 + DB 15,40,160,52,95,0,0 ; movaps 0x5f34(%eax),%xmm4 DB 15,40,232 ; movaps %xmm0,%xmm5 DB 15,88,236 ; addps %xmm4,%xmm5 DB 243,15,91,245 ; cvttps2dq %xmm5,%xmm6 DB 15,91,246 ; cvtdq2ps %xmm6,%xmm6 DB 15,40,253 ; movaps %xmm5,%xmm7 DB 15,194,254,1 ; cmpltps %xmm6,%xmm7 - DB 15,40,144,83,95,0,0 ; movaps 0x5f53(%eax),%xmm2 + DB 15,40,144,68,95,0,0 ; movaps 0x5f44(%eax),%xmm2 DB 15,84,250 ; andps %xmm2,%xmm7 DB 15,92,247 ; subps %xmm7,%xmm6 DB 15,92,238 ; subps %xmm6,%xmm5 @@ -52238,15 +52231,15 @@ _sk_bilinear_nx_sse2 LABEL PROC DB 137,229 ; mov %esp,%ebp DB 86 ; push %esi DB 80 ; push %eax - DB 232,0,0,0,0 ; call 6e7f <_sk_bilinear_nx_sse2+0xa> + DB 232,0,0,0,0 ; call 6e6e <_sk_bilinear_nx_sse2+0xa> DB 88 ; pop %eax DB 139,77,8 ; mov 0x8(%ebp),%ecx DB 139,85,12 ; mov 0xc(%ebp),%edx DB 139,50 ; mov (%edx),%esi DB 15,16,6 ; movups (%esi),%xmm0 DB 15,16,102,64 ; movups 0x40(%esi),%xmm4 - DB 15,88,128,193,100,0,0 ; addps 0x64c1(%eax),%xmm0 - DB 15,40,168,113,94,0,0 ; movaps 0x5e71(%eax),%xmm5 + DB 15,88,128,178,100,0,0 ; addps 0x64b2(%eax),%xmm0 + DB 15,40,168,98,94,0,0 ; movaps 0x5e62(%eax),%xmm5 DB 15,92,236 ; subps %xmm4,%xmm5 DB 15,17,174,128,0,0,0 ; movups %xmm5,0x80(%esi) DB 141,66,8 ; lea 0x8(%edx),%eax @@ -52265,14 +52258,14 @@ _sk_bilinear_px_sse2 LABEL PROC DB 137,229 ; mov %esp,%ebp DB 86 ; push %esi DB 80 ; push %eax - DB 232,0,0,0,0 ; call 6ec2 <_sk_bilinear_px_sse2+0xa> + DB 232,0,0,0,0 ; call 6eb1 <_sk_bilinear_px_sse2+0xa> DB 88 ; pop %eax DB 139,77,8 ; mov 0x8(%ebp),%ecx DB 139,85,12 ; mov 0xc(%ebp),%edx DB 139,50 ; mov (%edx),%esi DB 15,16,6 ; movups (%esi),%xmm0 DB 15,16,102,64 ; movups 0x40(%esi),%xmm4 - DB 15,88,128,30,94,0,0 ; addps 0x5e1e(%eax),%xmm0 + DB 15,88,128,15,94,0,0 ; addps 0x5e0f(%eax),%xmm0 DB 15,17,166,128,0,0,0 ; movups %xmm4,0x80(%esi) DB 141,66,8 ; lea 0x8(%edx),%eax DB 131,236,8 ; sub $0x8,%esp @@ -52290,15 +52283,15 @@ _sk_bilinear_ny_sse2 LABEL PROC DB 137,229 ; mov %esp,%ebp DB 86 ; push %esi DB 80 ; push %eax - DB 232,0,0,0,0 ; call 6efb <_sk_bilinear_ny_sse2+0xa> + DB 232,0,0,0,0 ; call 6eea <_sk_bilinear_ny_sse2+0xa> DB 88 ; pop %eax DB 139,77,8 ; mov 0x8(%ebp),%ecx DB 139,85,12 ; mov 0xc(%ebp),%edx DB 139,50 ; mov (%edx),%esi DB 15,16,78,32 ; movups 0x20(%esi),%xmm1 DB 15,16,102,96 ; movups 0x60(%esi),%xmm4 - DB 15,88,136,69,100,0,0 ; addps 0x6445(%eax),%xmm1 - DB 15,40,168,245,93,0,0 ; movaps 0x5df5(%eax),%xmm5 + DB 15,88,136,54,100,0,0 ; addps 0x6436(%eax),%xmm1 + DB 15,40,168,230,93,0,0 ; movaps 0x5de6(%eax),%xmm5 DB 15,92,236 ; subps %xmm4,%xmm5 DB 15,17,174,160,0,0,0 ; movups %xmm5,0xa0(%esi) DB 141,66,8 ; lea 0x8(%edx),%eax @@ -52317,14 +52310,14 @@ _sk_bilinear_py_sse2 LABEL PROC DB 137,229 ; mov %esp,%ebp DB 86 ; push %esi DB 80 ; push %eax - DB 232,0,0,0,0 ; call 6f3f <_sk_bilinear_py_sse2+0xa> + DB 232,0,0,0,0 ; call 6f2e <_sk_bilinear_py_sse2+0xa> DB 88 ; pop %eax DB 139,77,8 ; mov 0x8(%ebp),%ecx DB 139,85,12 ; mov 0xc(%ebp),%edx DB 139,50 ; mov (%edx),%esi DB 15,16,78,32 ; movups 0x20(%esi),%xmm1 DB 15,16,102,96 ; movups 0x60(%esi),%xmm4 - DB 15,88,136,161,93,0,0 ; addps 0x5da1(%eax),%xmm1 + DB 15,88,136,146,93,0,0 ; addps 0x5d92(%eax),%xmm1 DB 15,17,166,160,0,0,0 ; movups %xmm4,0xa0(%esi) DB 141,66,8 ; lea 0x8(%edx),%eax DB 131,236,8 ; sub $0x8,%esp @@ -52342,20 +52335,20 @@ _sk_bicubic_n3x_sse2 LABEL PROC DB 137,229 ; mov %esp,%ebp DB 86 ; push %esi DB 80 ; push %eax - DB 232,0,0,0,0 ; call 6f79 <_sk_bicubic_n3x_sse2+0xa> + DB 232,0,0,0,0 ; call 6f68 <_sk_bicubic_n3x_sse2+0xa> DB 88 ; pop %eax DB 139,77,8 ; mov 0x8(%ebp),%ecx DB 139,85,12 ; mov 0xc(%ebp),%edx DB 139,50 ; mov (%edx),%esi DB 15,16,6 ; movups (%esi),%xmm0 DB 15,16,102,64 ; movups 0x40(%esi),%xmm4 - DB 15,88,128,215,99,0,0 ; addps 0x63d7(%eax),%xmm0 - DB 15,40,168,119,93,0,0 ; movaps 0x5d77(%eax),%xmm5 + DB 15,88,128,200,99,0,0 ; addps 0x63c8(%eax),%xmm0 + DB 15,40,168,104,93,0,0 ; movaps 0x5d68(%eax),%xmm5 DB 15,92,236 ; subps %xmm4,%xmm5 DB 15,40,229 ; movaps %xmm5,%xmm4 DB 15,89,228 ; mulps %xmm4,%xmm4 - DB 15,89,168,231,99,0,0 ; mulps 0x63e7(%eax),%xmm5 - DB 15,88,168,87,95,0,0 ; addps 0x5f57(%eax),%xmm5 + DB 15,89,168,216,99,0,0 ; mulps 0x63d8(%eax),%xmm5 + DB 15,88,168,72,95,0,0 ; addps 0x5f48(%eax),%xmm5 DB 15,89,236 ; mulps %xmm4,%xmm5 DB 15,17,174,128,0,0,0 ; movups %xmm5,0x80(%esi) DB 141,66,8 ; lea 0x8(%edx),%eax @@ -52374,23 +52367,23 @@ _sk_bicubic_n1x_sse2 LABEL PROC DB 137,229 ; mov %esp,%ebp DB 86 ; push %esi DB 80 ; push %eax - DB 232,0,0,0,0 ; call 6fd3 <_sk_bicubic_n1x_sse2+0xa> + DB 232,0,0,0,0 ; call 6fc2 <_sk_bicubic_n1x_sse2+0xa> DB 88 ; pop %eax DB 139,77,8 ; mov 0x8(%ebp),%ecx DB 139,85,12 ; mov 0xc(%ebp),%edx DB 139,50 ; mov (%edx),%esi DB 15,16,6 ; movups (%esi),%xmm0 DB 15,16,102,64 ; movups 0x40(%esi),%xmm4 - DB 15,88,128,109,99,0,0 ; addps 0x636d(%eax),%xmm0 - DB 15,40,168,29,93,0,0 ; movaps 0x5d1d(%eax),%xmm5 + DB 15,88,128,94,99,0,0 ; addps 0x635e(%eax),%xmm0 + DB 15,40,168,14,93,0,0 ; movaps 0x5d0e(%eax),%xmm5 DB 15,92,236 ; subps %xmm4,%xmm5 - DB 15,40,160,157,99,0,0 ; movaps 0x639d(%eax),%xmm4 + DB 15,40,160,142,99,0,0 ; movaps 0x638e(%eax),%xmm4 DB 15,89,229 ; mulps %xmm5,%xmm4 - DB 15,88,160,173,99,0,0 ; addps 0x63ad(%eax),%xmm4 + DB 15,88,160,158,99,0,0 ; addps 0x639e(%eax),%xmm4 DB 15,89,229 ; mulps %xmm5,%xmm4 - DB 15,88,160,13,93,0,0 ; addps 0x5d0d(%eax),%xmm4 + DB 15,88,160,254,92,0,0 ; addps 0x5cfe(%eax),%xmm4 DB 15,89,229 ; mulps %xmm5,%xmm4 - DB 15,88,160,189,99,0,0 ; addps 0x63bd(%eax),%xmm4 + DB 15,88,160,174,99,0,0 ; addps 0x63ae(%eax),%xmm4 DB 15,17,166,128,0,0,0 ; movups %xmm4,0x80(%esi) DB 141,66,8 ; lea 0x8(%edx),%eax DB 131,236,8 ; sub $0x8,%esp @@ -52408,22 +52401,22 @@ _sk_bicubic_p1x_sse2 LABEL PROC DB 137,229 ; mov %esp,%ebp DB 86 ; push %esi DB 80 ; push %eax - DB 232,0,0,0,0 ; call 703b <_sk_bicubic_p1x_sse2+0xa> + DB 232,0,0,0,0 ; call 702a <_sk_bicubic_p1x_sse2+0xa> DB 88 ; pop %eax DB 139,77,8 ; mov 0x8(%ebp),%ecx DB 139,85,12 ; mov 0xc(%ebp),%edx DB 139,50 ; mov (%edx),%esi - DB 15,40,160,165,92,0,0 ; movaps 0x5ca5(%eax),%xmm4 + DB 15,40,160,150,92,0,0 ; movaps 0x5c96(%eax),%xmm4 DB 15,16,6 ; movups (%esi),%xmm0 DB 15,16,110,64 ; movups 0x40(%esi),%xmm5 DB 15,88,196 ; addps %xmm4,%xmm0 - DB 15,40,176,53,99,0,0 ; movaps 0x6335(%eax),%xmm6 + DB 15,40,176,38,99,0,0 ; movaps 0x6326(%eax),%xmm6 DB 15,89,245 ; mulps %xmm5,%xmm6 - DB 15,88,176,69,99,0,0 ; addps 0x6345(%eax),%xmm6 + DB 15,88,176,54,99,0,0 ; addps 0x6336(%eax),%xmm6 DB 15,89,245 ; mulps %xmm5,%xmm6 DB 15,88,244 ; addps %xmm4,%xmm6 DB 15,89,245 ; mulps %xmm5,%xmm6 - DB 15,88,176,85,99,0,0 ; addps 0x6355(%eax),%xmm6 + DB 15,88,176,70,99,0,0 ; addps 0x6346(%eax),%xmm6 DB 15,17,182,128,0,0,0 ; movups %xmm6,0x80(%esi) DB 141,66,8 ; lea 0x8(%edx),%eax DB 131,236,8 ; sub $0x8,%esp @@ -52441,18 +52434,18 @@ _sk_bicubic_p3x_sse2 LABEL PROC DB 137,229 ; mov %esp,%ebp DB 86 ; push %esi DB 80 ; push %eax - DB 232,0,0,0,0 ; call 7098 <_sk_bicubic_p3x_sse2+0xa> + DB 232,0,0,0,0 ; call 7087 <_sk_bicubic_p3x_sse2+0xa> DB 88 ; pop %eax DB 139,77,8 ; mov 0x8(%ebp),%ecx DB 139,85,12 ; mov 0xc(%ebp),%edx DB 139,50 ; mov (%edx),%esi DB 15,16,6 ; movups (%esi),%xmm0 DB 15,16,102,64 ; movups 0x40(%esi),%xmm4 - DB 15,88,128,232,98,0,0 ; addps 0x62e8(%eax),%xmm0 + DB 15,88,128,217,98,0,0 ; addps 0x62d9(%eax),%xmm0 DB 15,40,236 ; movaps %xmm4,%xmm5 DB 15,89,237 ; mulps %xmm5,%xmm5 - DB 15,89,160,200,98,0,0 ; mulps 0x62c8(%eax),%xmm4 - DB 15,88,160,56,94,0,0 ; addps 0x5e38(%eax),%xmm4 + DB 15,89,160,185,98,0,0 ; mulps 0x62b9(%eax),%xmm4 + DB 15,88,160,41,94,0,0 ; addps 0x5e29(%eax),%xmm4 DB 15,89,229 ; mulps %xmm5,%xmm4 DB 15,17,166,128,0,0,0 ; movups %xmm4,0x80(%esi) DB 141,66,8 ; lea 0x8(%edx),%eax @@ -52471,20 +52464,20 @@ _sk_bicubic_n3y_sse2 LABEL PROC DB 137,229 ; mov %esp,%ebp DB 86 ; push %esi DB 80 ; push %eax - DB 232,0,0,0,0 ; call 70e8 <_sk_bicubic_n3y_sse2+0xa> + DB 232,0,0,0,0 ; call 70d7 <_sk_bicubic_n3y_sse2+0xa> DB 88 ; pop %eax DB 139,77,8 ; mov 0x8(%ebp),%ecx DB 139,85,12 ; mov 0xc(%ebp),%edx DB 139,50 ; mov (%edx),%esi DB 15,16,78,32 ; movups 0x20(%esi),%xmm1 DB 15,16,102,96 ; movups 0x60(%esi),%xmm4 - DB 15,88,136,104,98,0,0 ; addps 0x6268(%eax),%xmm1 - DB 15,40,168,8,92,0,0 ; movaps 0x5c08(%eax),%xmm5 + DB 15,88,136,89,98,0,0 ; addps 0x6259(%eax),%xmm1 + DB 15,40,168,249,91,0,0 ; movaps 0x5bf9(%eax),%xmm5 DB 15,92,236 ; subps %xmm4,%xmm5 DB 15,40,229 ; movaps %xmm5,%xmm4 DB 15,89,228 ; mulps %xmm4,%xmm4 - DB 15,89,168,120,98,0,0 ; mulps 0x6278(%eax),%xmm5 - DB 15,88,168,232,93,0,0 ; addps 0x5de8(%eax),%xmm5 + DB 15,89,168,105,98,0,0 ; mulps 0x6269(%eax),%xmm5 + DB 15,88,168,217,93,0,0 ; addps 0x5dd9(%eax),%xmm5 DB 15,89,236 ; mulps %xmm4,%xmm5 DB 15,17,174,160,0,0,0 ; movups %xmm5,0xa0(%esi) DB 141,66,8 ; lea 0x8(%edx),%eax @@ -52503,23 +52496,23 @@ _sk_bicubic_n1y_sse2 LABEL PROC DB 137,229 ; mov %esp,%ebp DB 86 ; push %esi DB 80 ; push %eax - DB 232,0,0,0,0 ; call 7143 <_sk_bicubic_n1y_sse2+0xa> + DB 232,0,0,0,0 ; call 7132 <_sk_bicubic_n1y_sse2+0xa> DB 88 ; pop %eax DB 139,77,8 ; mov 0x8(%ebp),%ecx DB 139,85,12 ; mov 0xc(%ebp),%edx DB 139,50 ; mov (%edx),%esi DB 15,16,78,32 ; movups 0x20(%esi),%xmm1 DB 15,16,102,96 ; movups 0x60(%esi),%xmm4 - DB 15,88,136,253,97,0,0 ; addps 0x61fd(%eax),%xmm1 - DB 15,40,168,173,91,0,0 ; movaps 0x5bad(%eax),%xmm5 + DB 15,88,136,238,97,0,0 ; addps 0x61ee(%eax),%xmm1 + DB 15,40,168,158,91,0,0 ; movaps 0x5b9e(%eax),%xmm5 DB 15,92,236 ; subps %xmm4,%xmm5 - DB 15,40,160,45,98,0,0 ; movaps 0x622d(%eax),%xmm4 + DB 15,40,160,30,98,0,0 ; movaps 0x621e(%eax),%xmm4 DB 15,89,229 ; mulps %xmm5,%xmm4 - DB 15,88,160,61,98,0,0 ; addps 0x623d(%eax),%xmm4 + DB 15,88,160,46,98,0,0 ; addps 0x622e(%eax),%xmm4 DB 15,89,229 ; mulps %xmm5,%xmm4 - DB 15,88,160,157,91,0,0 ; addps 0x5b9d(%eax),%xmm4 + DB 15,88,160,142,91,0,0 ; addps 0x5b8e(%eax),%xmm4 DB 15,89,229 ; mulps %xmm5,%xmm4 - DB 15,88,160,77,98,0,0 ; addps 0x624d(%eax),%xmm4 + DB 15,88,160,62,98,0,0 ; addps 0x623e(%eax),%xmm4 DB 15,17,166,160,0,0,0 ; movups %xmm4,0xa0(%esi) DB 141,66,8 ; lea 0x8(%edx),%eax DB 131,236,8 ; sub $0x8,%esp @@ -52537,22 +52530,22 @@ _sk_bicubic_p1y_sse2 LABEL PROC DB 137,229 ; mov %esp,%ebp DB 86 ; push %esi DB 80 ; push %eax - DB 232,0,0,0,0 ; call 71ac <_sk_bicubic_p1y_sse2+0xa> + DB 232,0,0,0,0 ; call 719b <_sk_bicubic_p1y_sse2+0xa> DB 88 ; pop %eax DB 139,77,8 ; mov 0x8(%ebp),%ecx DB 139,85,12 ; mov 0xc(%ebp),%edx DB 139,50 ; mov (%edx),%esi - DB 15,40,160,52,91,0,0 ; movaps 0x5b34(%eax),%xmm4 + DB 15,40,160,37,91,0,0 ; movaps 0x5b25(%eax),%xmm4 DB 15,16,78,32 ; movups 0x20(%esi),%xmm1 DB 15,16,110,96 ; movups 0x60(%esi),%xmm5 DB 15,88,204 ; addps %xmm4,%xmm1 - DB 15,40,176,196,97,0,0 ; movaps 0x61c4(%eax),%xmm6 + DB 15,40,176,181,97,0,0 ; movaps 0x61b5(%eax),%xmm6 DB 15,89,245 ; mulps %xmm5,%xmm6 - DB 15,88,176,212,97,0,0 ; addps 0x61d4(%eax),%xmm6 + DB 15,88,176,197,97,0,0 ; addps 0x61c5(%eax),%xmm6 DB 15,89,245 ; mulps %xmm5,%xmm6 DB 15,88,244 ; addps %xmm4,%xmm6 DB 15,89,245 ; mulps %xmm5,%xmm6 - DB 15,88,176,228,97,0,0 ; addps 0x61e4(%eax),%xmm6 + DB 15,88,176,213,97,0,0 ; addps 0x61d5(%eax),%xmm6 DB 15,17,182,160,0,0,0 ; movups %xmm6,0xa0(%esi) DB 141,66,8 ; lea 0x8(%edx),%eax DB 131,236,8 ; sub $0x8,%esp @@ -52570,18 +52563,18 @@ _sk_bicubic_p3y_sse2 LABEL PROC DB 137,229 ; mov %esp,%ebp DB 86 ; push %esi DB 80 ; push %eax - DB 232,0,0,0,0 ; call 720a <_sk_bicubic_p3y_sse2+0xa> + DB 232,0,0,0,0 ; call 71f9 <_sk_bicubic_p3y_sse2+0xa> DB 88 ; pop %eax DB 139,77,8 ; mov 0x8(%ebp),%ecx DB 139,85,12 ; mov 0xc(%ebp),%edx DB 139,50 ; mov (%edx),%esi DB 15,16,78,32 ; movups 0x20(%esi),%xmm1 DB 15,16,102,96 ; movups 0x60(%esi),%xmm4 - DB 15,88,136,118,97,0,0 ; addps 0x6176(%eax),%xmm1 + DB 15,88,136,103,97,0,0 ; addps 0x6167(%eax),%xmm1 DB 15,40,236 ; movaps %xmm4,%xmm5 DB 15,89,237 ; mulps %xmm5,%xmm5 - DB 15,89,160,86,97,0,0 ; mulps 0x6156(%eax),%xmm4 - DB 15,88,160,198,92,0,0 ; addps 0x5cc6(%eax),%xmm4 + DB 15,89,160,71,97,0,0 ; mulps 0x6147(%eax),%xmm4 + DB 15,88,160,183,92,0,0 ; addps 0x5cb7(%eax),%xmm4 DB 15,89,229 ; mulps %xmm5,%xmm4 DB 15,17,166,160,0,0,0 ; movups %xmm4,0xa0(%esi) DB 141,66,8 ; lea 0x8(%edx),%eax @@ -52602,10 +52595,10 @@ _sk_callback_sse2 LABEL PROC DB 87 ; push %edi DB 86 ; push %esi DB 131,236,12 ; sub $0xc,%esp - DB 139,117,12 ; mov 0xc(%ebp),%esi - DB 139,125,8 ; mov 0x8(%ebp),%edi - DB 139,71,8 ; mov 0x8(%edi),%eax - DB 139,30 ; mov (%esi),%ebx + DB 139,117,8 ; mov 0x8(%ebp),%esi + DB 139,125,12 ; mov 0xc(%ebp),%edi + DB 139,31 ; mov (%edi),%ebx + DB 139,70,8 ; mov 0x8(%esi),%eax DB 15,40,224 ; movaps %xmm0,%xmm4 DB 15,20,225 ; unpcklps %xmm1,%xmm4 DB 15,40,234 ; movaps %xmm2,%xmm5 @@ -52647,11 +52640,11 @@ _sk_callback_sse2 LABEL PROC DB 15,40,212 ; movaps %xmm4,%xmm2 DB 102,15,20,211 ; unpcklpd %xmm3,%xmm2 DB 15,18,220 ; movhlps %xmm4,%xmm3 - DB 141,70,8 ; lea 0x8(%esi),%eax + DB 141,71,8 ; lea 0x8(%edi),%eax DB 131,236,8 ; sub $0x8,%esp DB 80 ; push %eax - DB 87 ; push %edi - DB 255,86,4 ; call *0x4(%esi) + DB 86 ; push %esi + DB 255,87,4 ; call *0x4(%edi) DB 131,196,28 ; add $0x1c,%esp DB 94 ; pop %esi DB 95 ; pop %edi @@ -52666,12 +52659,10 @@ _sk_clut_3D_sse2 LABEL PROC DB 83 ; push %ebx DB 87 ; push %edi DB 86 ; push %esi - DB 129,236,44,1,0,0 ; sub $0x12c,%esp - DB 15,41,157,200,254,255,255 ; movaps %xmm3,-0x138(%ebp) + DB 129,236,28,1,0,0 ; sub $0x11c,%esp + DB 15,41,157,216,254,255,255 ; movaps %xmm3,-0x128(%ebp) DB 15,40,216 ; movaps %xmm0,%xmm3 DB 139,69,12 ; mov 0xc(%ebp),%eax - DB 141,72,4 ; lea 0x4(%eax),%ecx - DB 137,141,20,255,255,255 ; mov %ecx,-0xec(%ebp) DB 139,8 ; mov (%eax),%ecx DB 139,81,12 ; mov 0xc(%ecx),%edx DB 141,114,255 ; lea -0x1(%edx),%esi @@ -52680,7 +52671,7 @@ _sk_clut_3D_sse2 LABEL PROC DB 15,91,192 ; cvtdq2ps %xmm0,%xmm0 DB 15,89,194 ; mulps %xmm2,%xmm0 DB 15,40,224 ; movaps %xmm0,%xmm4 - DB 15,41,165,232,254,255,255 ; movaps %xmm4,-0x118(%ebp) + DB 15,41,165,248,254,255,255 ; movaps %xmm4,-0x108(%ebp) DB 102,15,110,194 ; movd %edx,%xmm0 DB 102,15,112,240,0 ; pshufd $0x0,%xmm0,%xmm6 DB 102,15,127,117,152 ; movdqa %xmm6,-0x68(%ebp) @@ -52722,15 +52713,15 @@ _sk_clut_3D_sse2 LABEL PROC DB 102,15,112,192,232 ; pshufd $0xe8,%xmm0,%xmm0 DB 102,15,98,200 ; punpckldq %xmm0,%xmm1 DB 102,15,127,77,136 ; movdqa %xmm1,-0x78(%ebp) - DB 232,0,0,0,0 ; call 73f6 <_sk_clut_3D_sse2+0xf7> + DB 232,0,0,0,0 ; call 73dc <_sk_clut_3D_sse2+0xee> DB 90 ; pop %edx DB 243,15,91,196 ; cvttps2dq %xmm4,%xmm0 - DB 102,15,127,133,248,254,255,255 ; movdqa %xmm0,-0x108(%ebp) + DB 102,15,127,133,8,255,255,255 ; movdqa %xmm0,-0xf8(%ebp) DB 102,15,111,221 ; movdqa %xmm5,%xmm3 DB 102,15,254,216 ; paddd %xmm0,%xmm3 DB 102,15,111,193 ; movdqa %xmm1,%xmm0 DB 102,15,254,195 ; paddd %xmm3,%xmm0 - DB 102,15,111,162,186,95,0,0 ; movdqa 0x5fba(%edx),%xmm4 + DB 102,15,111,162,180,95,0,0 ; movdqa 0x5fb4(%edx),%xmm4 DB 102,15,127,165,120,255,255,255 ; movdqa %xmm4,-0x88(%ebp) DB 102,15,112,200,245 ; pshufd $0xf5,%xmm0,%xmm1 DB 102,15,244,196 ; pmuludq %xmm4,%xmm0 @@ -52770,7 +52761,7 @@ _sk_clut_3D_sse2 LABEL PROC DB 243,15,16,4,129 ; movss (%ecx,%eax,4),%xmm0 DB 15,20,248 ; unpcklps %xmm0,%xmm7 DB 102,15,20,252 ; unpcklpd %xmm4,%xmm7 - DB 102,15,111,130,58,89,0,0 ; movdqa 0x593a(%edx),%xmm0 + DB 102,15,111,130,52,89,0,0 ; movdqa 0x5934(%edx),%xmm0 DB 102,15,127,133,104,255,255,255 ; movdqa %xmm0,-0x98(%ebp) DB 102,15,254,200 ; paddd %xmm0,%xmm1 DB 102,15,112,193,229 ; pshufd $0xe5,%xmm1,%xmm0 @@ -52787,8 +52778,8 @@ _sk_clut_3D_sse2 LABEL PROC DB 243,15,16,4,129 ; movss (%ecx,%eax,4),%xmm0 DB 15,20,240 ; unpcklps %xmm0,%xmm6 DB 102,15,20,241 ; unpcklpd %xmm1,%xmm6 - DB 15,40,130,170,95,0,0 ; movaps 0x5faa(%edx),%xmm0 - DB 15,40,141,232,254,255,255 ; movaps -0x118(%ebp),%xmm1 + DB 15,40,130,164,95,0,0 ; movaps 0x5fa4(%edx),%xmm0 + DB 15,40,141,248,254,255,255 ; movaps -0x108(%ebp),%xmm1 DB 15,88,200 ; addps %xmm0,%xmm1 DB 15,41,77,200 ; movaps %xmm1,-0x38(%ebp) DB 15,40,141,88,255,255,255 ; movaps -0xa8(%ebp),%xmm1 @@ -52872,7 +52863,7 @@ _sk_clut_3D_sse2 LABEL PROC DB 15,92,206 ; subps %xmm6,%xmm1 DB 15,89,204 ; mulps %xmm4,%xmm1 DB 15,88,206 ; addps %xmm6,%xmm1 - DB 15,41,141,216,254,255,255 ; movaps %xmm1,-0x128(%ebp) + DB 15,41,141,232,254,255,255 ; movaps %xmm1,-0x118(%ebp) DB 243,15,91,133,72,255,255,255 ; cvttps2dq -0xb8(%ebp),%xmm0 DB 102,15,112,224,245 ; pshufd $0xf5,%xmm0,%xmm4 DB 102,15,111,77,152 ; movdqa -0x68(%ebp),%xmm1 @@ -52883,7 +52874,7 @@ _sk_clut_3D_sse2 LABEL PROC DB 102,15,112,196,232 ; pshufd $0xe8,%xmm4,%xmm0 DB 102,15,98,248 ; punpckldq %xmm0,%xmm7 DB 102,15,127,125,152 ; movdqa %xmm7,-0x68(%ebp) - DB 102,15,254,189,248,254,255,255 ; paddd -0x108(%ebp),%xmm7 + DB 102,15,254,189,8,255,255,255 ; paddd -0xf8(%ebp),%xmm7 DB 102,15,111,199 ; movdqa %xmm7,%xmm0 DB 102,15,254,69,136 ; paddd -0x78(%ebp),%xmm0 DB 102,15,112,224,245 ; pshufd $0xf5,%xmm0,%xmm4 @@ -53020,7 +53011,7 @@ _sk_clut_3D_sse2 LABEL PROC DB 15,89,212 ; mulps %xmm4,%xmm2 DB 15,88,208 ; addps %xmm0,%xmm2 DB 15,41,149,56,255,255,255 ; movaps %xmm2,-0xc8(%ebp) - DB 15,40,133,216,254,255,255 ; movaps -0x128(%ebp),%xmm0 + DB 15,40,133,232,254,255,255 ; movaps -0x118(%ebp),%xmm0 DB 15,92,216 ; subps %xmm0,%xmm3 DB 15,89,220 ; mulps %xmm4,%xmm3 DB 15,88,216 ; addps %xmm0,%xmm3 @@ -53291,8 +53282,8 @@ _sk_clut_3D_sse2 LABEL PROC DB 15,92,214 ; subps %xmm6,%xmm2 DB 15,89,211 ; mulps %xmm3,%xmm2 DB 15,88,214 ; addps %xmm6,%xmm2 - DB 15,91,157,248,254,255,255 ; cvtdq2ps -0x108(%ebp),%xmm3 - DB 15,40,165,232,254,255,255 ; movaps -0x118(%ebp),%xmm4 + DB 15,91,157,8,255,255,255 ; cvtdq2ps -0xf8(%ebp),%xmm3 + DB 15,40,165,248,254,255,255 ; movaps -0x108(%ebp),%xmm4 DB 15,92,227 ; subps %xmm3,%xmm4 DB 15,40,93,184 ; movaps -0x48(%ebp),%xmm3 DB 15,92,195 ; subps %xmm3,%xmm0 @@ -53306,15 +53297,14 @@ _sk_clut_3D_sse2 LABEL PROC DB 15,92,211 ; subps %xmm3,%xmm2 DB 15,89,212 ; mulps %xmm4,%xmm2 DB 15,88,211 ; addps %xmm3,%xmm2 - DB 139,69,8 ; mov 0x8(%ebp),%eax - DB 139,85,12 ; mov 0xc(%ebp),%edx - DB 141,74,8 ; lea 0x8(%edx),%ecx + DB 139,77,12 ; mov 0xc(%ebp),%ecx + DB 141,65,8 ; lea 0x8(%ecx),%eax DB 131,236,8 ; sub $0x8,%esp - DB 15,40,157,200,254,255,255 ; movaps -0x138(%ebp),%xmm3 - DB 81 ; push %ecx + DB 15,40,157,216,254,255,255 ; movaps -0x128(%ebp),%xmm3 DB 80 ; push %eax - DB 255,82,4 ; call *0x4(%edx) - DB 129,196,60,1,0,0 ; add $0x13c,%esp + DB 255,117,8 ; pushl 0x8(%ebp) + DB 255,81,4 ; call *0x4(%ecx) + DB 129,196,44,1,0,0 ; add $0x12c,%esp DB 94 ; pop %esi DB 95 ; pop %edi DB 91 ; pop %ebx @@ -53328,10 +53318,8 @@ _sk_clut_4D_sse2 LABEL PROC DB 83 ; push %ebx DB 87 ; push %edi DB 86 ; push %esi - DB 129,236,92,1,0,0 ; sub $0x15c,%esp + DB 129,236,76,1,0,0 ; sub $0x14c,%esp DB 139,69,12 ; mov 0xc(%ebp),%eax - DB 141,72,4 ; lea 0x4(%eax),%ecx - DB 137,141,212,254,255,255 ; mov %ecx,-0x12c(%ebp) DB 139,16 ; mov (%eax),%edx DB 139,74,16 ; mov 0x10(%edx),%ecx DB 141,113,255 ; lea -0x1(%ecx),%esi @@ -53408,18 +53396,18 @@ _sk_clut_4D_sse2 LABEL PROC DB 102,15,112,201,232 ; pshufd $0xe8,%xmm1,%xmm1 DB 102,15,98,217 ; punpckldq %xmm1,%xmm3 DB 102,15,127,93,152 ; movdqa %xmm3,-0x68(%ebp) - DB 232,0,0,0,0 ; call 7f8c <_sk_clut_4D_sse2+0x16e> + DB 232,0,0,0,0 ; call 7f68 <_sk_clut_4D_sse2+0x165> DB 89 ; pop %ecx DB 15,40,197 ; movaps %xmm5,%xmm0 - DB 15,41,133,152,254,255,255 ; movaps %xmm0,-0x168(%ebp) + DB 15,41,133,168,254,255,255 ; movaps %xmm0,-0x158(%ebp) DB 243,15,91,200 ; cvttps2dq %xmm0,%xmm1 - DB 102,15,127,141,184,254,255,255 ; movdqa %xmm1,-0x148(%ebp) + DB 102,15,127,141,200,254,255,255 ; movdqa %xmm1,-0x138(%ebp) DB 102,15,254,241 ; paddd %xmm1,%xmm6 DB 102,15,127,117,200 ; movdqa %xmm6,-0x38(%ebp) DB 102,15,111,212 ; movdqa %xmm4,%xmm2 DB 102,15,254,214 ; paddd %xmm6,%xmm2 DB 102,15,254,218 ; paddd %xmm2,%xmm3 - DB 102,15,111,161,36,84,0,0 ; movdqa 0x5424(%ecx),%xmm4 + DB 102,15,111,161,40,84,0,0 ; movdqa 0x5428(%ecx),%xmm4 DB 102,15,112,203,245 ; pshufd $0xf5,%xmm3,%xmm1 DB 102,15,244,220 ; pmuludq %xmm4,%xmm3 DB 102,15,244,204 ; pmuludq %xmm4,%xmm1 @@ -53461,7 +53449,7 @@ _sk_clut_4D_sse2 LABEL PROC DB 15,20,223 ; unpcklps %xmm7,%xmm3 DB 102,15,20,222 ; unpcklpd %xmm6,%xmm3 DB 102,15,41,157,232,254,255,255 ; movapd %xmm3,-0x118(%ebp) - DB 102,15,254,137,164,77,0,0 ; paddd 0x4da4(%ecx),%xmm1 + DB 102,15,254,137,168,77,0,0 ; paddd 0x4da8(%ecx),%xmm1 DB 102,15,112,241,229 ; pshufd $0xe5,%xmm1,%xmm6 DB 102,15,126,240 ; movd %xmm6,%eax DB 102,15,112,241,78 ; pshufd $0x4e,%xmm1,%xmm6 @@ -53476,7 +53464,7 @@ _sk_clut_4D_sse2 LABEL PROC DB 243,15,16,60,130 ; movss (%edx,%eax,4),%xmm7 DB 15,20,223 ; unpcklps %xmm7,%xmm3 DB 102,15,20,222 ; unpcklpd %xmm6,%xmm3 - DB 15,40,185,20,84,0,0 ; movaps 0x5414(%ecx),%xmm7 + DB 15,40,185,24,84,0,0 ; movaps 0x5418(%ecx),%xmm7 DB 15,88,199 ; addps %xmm7,%xmm0 DB 15,41,133,120,255,255,255 ; movaps %xmm0,-0x88(%ebp) DB 15,40,133,248,254,255,255 ; movaps -0x108(%ebp),%xmm0 @@ -53484,7 +53472,7 @@ _sk_clut_4D_sse2 LABEL PROC DB 15,41,69,136 ; movaps %xmm0,-0x78(%ebp) DB 15,40,133,56,255,255,255 ; movaps -0xc8(%ebp),%xmm0 DB 15,88,199 ; addps %xmm7,%xmm0 - DB 15,41,133,168,254,255,255 ; movaps %xmm0,-0x158(%ebp) + DB 15,41,133,184,254,255,255 ; movaps %xmm0,-0x148(%ebp) DB 15,88,125,216 ; addps -0x28(%ebp),%xmm7 DB 243,15,91,255 ; cvttps2dq %xmm7,%xmm7 DB 102,15,112,199,245 ; pshufd $0xf5,%xmm7,%xmm0 @@ -53497,7 +53485,7 @@ _sk_clut_4D_sse2 LABEL PROC DB 102,15,127,101,168 ; movdqa %xmm4,-0x58(%ebp) DB 102,15,254,212 ; paddd %xmm4,%xmm2 DB 102,15,112,194,245 ; pshufd $0xf5,%xmm2,%xmm0 - DB 102,15,111,161,36,84,0,0 ; movdqa 0x5424(%ecx),%xmm4 + DB 102,15,111,161,40,84,0,0 ; movdqa 0x5428(%ecx),%xmm4 DB 102,15,244,212 ; pmuludq %xmm4,%xmm2 DB 102,15,244,196 ; pmuludq %xmm4,%xmm0 DB 102,15,112,240,232 ; pshufd $0xe8,%xmm0,%xmm6 @@ -53533,7 +53521,7 @@ _sk_clut_4D_sse2 LABEL PROC DB 243,15,16,44,130 ; movss (%edx,%eax,4),%xmm5 DB 15,20,213 ; unpcklps %xmm5,%xmm2 DB 102,15,20,214 ; unpcklpd %xmm6,%xmm2 - DB 102,15,254,129,164,77,0,0 ; paddd 0x4da4(%ecx),%xmm0 + DB 102,15,254,129,168,77,0,0 ; paddd 0x4da8(%ecx),%xmm0 DB 102,15,112,232,229 ; pshufd $0xe5,%xmm0,%xmm5 DB 102,15,126,232 ; movd %xmm5,%eax DB 102,15,112,232,78 ; pshufd $0x4e,%xmm0,%xmm5 @@ -53565,7 +53553,7 @@ _sk_clut_4D_sse2 LABEL PROC DB 15,92,251 ; subps %xmm3,%xmm7 DB 15,89,248 ; mulps %xmm0,%xmm7 DB 15,88,251 ; addps %xmm3,%xmm7 - DB 243,15,91,141,168,254,255,255 ; cvttps2dq -0x158(%ebp),%xmm1 + DB 243,15,91,141,184,254,255,255 ; cvttps2dq -0x148(%ebp),%xmm1 DB 102,15,112,217,245 ; pshufd $0xf5,%xmm1,%xmm3 DB 102,15,111,133,88,255,255,255 ; movdqa -0xa8(%ebp),%xmm0 DB 102,15,244,216 ; pmuludq %xmm0,%xmm3 @@ -53617,7 +53605,7 @@ _sk_clut_4D_sse2 LABEL PROC DB 243,15,16,44,130 ; movss (%edx,%eax,4),%xmm5 DB 15,20,245 ; unpcklps %xmm5,%xmm6 DB 102,15,20,240 ; unpcklpd %xmm0,%xmm6 - DB 102,15,254,137,164,77,0,0 ; paddd 0x4da4(%ecx),%xmm1 + DB 102,15,254,137,168,77,0,0 ; paddd 0x4da8(%ecx),%xmm1 DB 102,15,112,193,229 ; pshufd $0xe5,%xmm1,%xmm0 DB 102,15,126,192 ; movd %xmm0,%eax DB 102,15,112,193,78 ; pshufd $0x4e,%xmm1,%xmm0 @@ -53635,7 +53623,7 @@ _sk_clut_4D_sse2 LABEL PROC DB 102,15,111,202 ; movdqa %xmm2,%xmm1 DB 102,15,254,77,168 ; paddd -0x58(%ebp),%xmm1 DB 102,15,112,193,245 ; pshufd $0xf5,%xmm1,%xmm0 - DB 102,15,111,145,36,84,0,0 ; movdqa 0x5424(%ecx),%xmm2 + DB 102,15,111,145,40,84,0,0 ; movdqa 0x5428(%ecx),%xmm2 DB 102,15,244,202 ; pmuludq %xmm2,%xmm1 DB 102,15,244,194 ; pmuludq %xmm2,%xmm0 DB 102,15,112,192,232 ; pshufd $0xe8,%xmm0,%xmm0 @@ -53671,7 +53659,7 @@ _sk_clut_4D_sse2 LABEL PROC DB 243,15,16,4,130 ; movss (%edx,%eax,4),%xmm0 DB 15,20,216 ; unpcklps %xmm0,%xmm3 DB 102,15,20,217 ; unpcklpd %xmm1,%xmm3 - DB 102,15,254,169,164,77,0,0 ; paddd 0x4da4(%ecx),%xmm5 + DB 102,15,254,169,168,77,0,0 ; paddd 0x4da8(%ecx),%xmm5 DB 102,15,112,197,229 ; pshufd $0xe5,%xmm5,%xmm0 DB 102,15,126,192 ; movd %xmm0,%eax DB 102,15,112,197,78 ; pshufd $0x4e,%xmm5,%xmm0 @@ -53724,14 +53712,14 @@ _sk_clut_4D_sse2 LABEL PROC DB 102,15,112,193,232 ; pshufd $0xe8,%xmm1,%xmm0 DB 102,15,98,224 ; punpckldq %xmm0,%xmm4 DB 102,15,127,165,24,255,255,255 ; movdqa %xmm4,-0xe8(%ebp) - DB 102,15,254,165,184,254,255,255 ; paddd -0x148(%ebp),%xmm4 + DB 102,15,254,165,200,254,255,255 ; paddd -0x138(%ebp),%xmm4 DB 102,15,127,101,200 ; movdqa %xmm4,-0x38(%ebp) DB 102,15,111,204 ; movdqa %xmm4,%xmm1 DB 102,15,254,141,72,255,255,255 ; paddd -0xb8(%ebp),%xmm1 DB 102,15,111,209 ; movdqa %xmm1,%xmm2 DB 102,15,254,85,152 ; paddd -0x68(%ebp),%xmm2 DB 102,15,112,194,245 ; pshufd $0xf5,%xmm2,%xmm0 - DB 102,15,111,153,36,84,0,0 ; movdqa 0x5424(%ecx),%xmm3 + DB 102,15,111,153,40,84,0,0 ; movdqa 0x5428(%ecx),%xmm3 DB 102,15,244,211 ; pmuludq %xmm3,%xmm2 DB 102,15,244,195 ; pmuludq %xmm3,%xmm0 DB 102,15,111,251 ; movdqa %xmm3,%xmm7 @@ -53770,7 +53758,7 @@ _sk_clut_4D_sse2 LABEL PROC DB 243,15,16,44,130 ; movss (%edx,%eax,4),%xmm5 DB 15,20,229 ; unpcklps %xmm5,%xmm4 DB 102,15,20,227 ; unpcklpd %xmm3,%xmm4 - DB 102,15,254,129,164,77,0,0 ; paddd 0x4da4(%ecx),%xmm0 + DB 102,15,254,129,168,77,0,0 ; paddd 0x4da8(%ecx),%xmm0 DB 102,15,112,216,229 ; pshufd $0xe5,%xmm0,%xmm3 DB 102,15,126,216 ; movd %xmm3,%eax DB 102,15,112,216,78 ; pshufd $0x4e,%xmm0,%xmm3 @@ -53822,7 +53810,7 @@ _sk_clut_4D_sse2 LABEL PROC DB 243,15,16,52,130 ; movss (%edx,%eax,4),%xmm6 DB 15,20,238 ; unpcklps %xmm6,%xmm5 DB 102,15,20,235 ; unpcklpd %xmm3,%xmm5 - DB 102,15,111,137,164,77,0,0 ; movdqa 0x4da4(%ecx),%xmm1 + DB 102,15,111,137,168,77,0,0 ; movdqa 0x4da8(%ecx),%xmm1 DB 102,15,254,249 ; paddd %xmm1,%xmm7 DB 102,15,112,223,229 ; pshufd $0xe5,%xmm7,%xmm3 DB 102,15,126,216 ; movd %xmm3,%eax @@ -53856,7 +53844,7 @@ _sk_clut_4D_sse2 LABEL PROC DB 102,15,111,226 ; movdqa %xmm2,%xmm4 DB 102,15,254,69,152 ; paddd -0x68(%ebp),%xmm0 DB 102,15,112,208,245 ; pshufd $0xf5,%xmm0,%xmm2 - DB 102,15,111,153,36,84,0,0 ; movdqa 0x5424(%ecx),%xmm3 + DB 102,15,111,153,40,84,0,0 ; movdqa 0x5428(%ecx),%xmm3 DB 102,15,244,195 ; pmuludq %xmm3,%xmm0 DB 102,15,244,211 ; pmuludq %xmm3,%xmm2 DB 102,15,112,218,232 ; pshufd $0xe8,%xmm2,%xmm3 @@ -53913,7 +53901,7 @@ _sk_clut_4D_sse2 LABEL PROC DB 102,15,111,212 ; movdqa %xmm4,%xmm2 DB 102,15,254,85,168 ; paddd -0x58(%ebp),%xmm2 DB 102,15,112,194,245 ; pshufd $0xf5,%xmm2,%xmm0 - DB 102,15,111,137,36,84,0,0 ; movdqa 0x5424(%ecx),%xmm1 + DB 102,15,111,137,40,84,0,0 ; movdqa 0x5428(%ecx),%xmm1 DB 102,15,244,209 ; pmuludq %xmm1,%xmm2 DB 102,15,244,193 ; pmuludq %xmm1,%xmm0 DB 102,15,112,240,232 ; pshufd $0xe8,%xmm0,%xmm6 @@ -53950,7 +53938,7 @@ _sk_clut_4D_sse2 LABEL PROC DB 243,15,16,36,130 ; movss (%edx,%eax,4),%xmm4 DB 15,20,212 ; unpcklps %xmm4,%xmm2 DB 102,15,20,214 ; unpcklpd %xmm6,%xmm2 - DB 102,15,254,129,164,77,0,0 ; paddd 0x4da4(%ecx),%xmm0 + DB 102,15,254,129,168,77,0,0 ; paddd 0x4da8(%ecx),%xmm0 DB 102,15,112,224,229 ; pshufd $0xe5,%xmm0,%xmm4 DB 102,15,126,224 ; movd %xmm4,%eax DB 102,15,112,224,78 ; pshufd $0x4e,%xmm0,%xmm4 @@ -54018,7 +54006,7 @@ _sk_clut_4D_sse2 LABEL PROC DB 102,15,111,93,152 ; movdqa -0x68(%ebp),%xmm3 DB 102,15,254,217 ; paddd %xmm1,%xmm3 DB 102,15,112,211,245 ; pshufd $0xf5,%xmm3,%xmm2 - DB 102,15,111,129,36,84,0,0 ; movdqa 0x5424(%ecx),%xmm0 + DB 102,15,111,129,40,84,0,0 ; movdqa 0x5428(%ecx),%xmm0 DB 102,15,244,216 ; pmuludq %xmm0,%xmm3 DB 102,15,244,208 ; pmuludq %xmm0,%xmm2 DB 102,15,111,248 ; movdqa %xmm0,%xmm7 @@ -54057,7 +54045,7 @@ _sk_clut_4D_sse2 LABEL PROC DB 243,15,16,28,130 ; movss (%edx,%eax,4),%xmm3 DB 15,20,235 ; unpcklps %xmm3,%xmm5 DB 102,15,20,238 ; unpcklpd %xmm6,%xmm5 - DB 102,15,254,145,164,77,0,0 ; paddd 0x4da4(%ecx),%xmm2 + DB 102,15,254,145,168,77,0,0 ; paddd 0x4da8(%ecx),%xmm2 DB 102,15,112,218,229 ; pshufd $0xe5,%xmm2,%xmm3 DB 102,15,126,216 ; movd %xmm3,%eax DB 102,15,112,218,78 ; pshufd $0x4e,%xmm2,%xmm3 @@ -54109,7 +54097,7 @@ _sk_clut_4D_sse2 LABEL PROC DB 243,15,16,4,130 ; movss (%edx,%eax,4),%xmm0 DB 15,20,208 ; unpcklps %xmm0,%xmm2 DB 102,15,20,215 ; unpcklpd %xmm7,%xmm2 - DB 102,15,111,137,164,77,0,0 ; movdqa 0x4da4(%ecx),%xmm1 + DB 102,15,111,137,168,77,0,0 ; movdqa 0x4da8(%ecx),%xmm1 DB 102,15,254,217 ; paddd %xmm1,%xmm3 DB 102,15,112,195,229 ; pshufd $0xe5,%xmm3,%xmm0 DB 102,15,126,192 ; movd %xmm0,%eax @@ -54144,7 +54132,7 @@ _sk_clut_4D_sse2 LABEL PROC DB 102,15,111,194 ; movdqa %xmm2,%xmm0 DB 102,15,254,69,152 ; paddd -0x68(%ebp),%xmm0 DB 102,15,112,224,245 ; pshufd $0xf5,%xmm0,%xmm4 - DB 102,15,111,169,36,84,0,0 ; movdqa 0x5424(%ecx),%xmm5 + DB 102,15,111,169,40,84,0,0 ; movdqa 0x5428(%ecx),%xmm5 DB 102,15,111,221 ; movdqa %xmm5,%xmm3 DB 102,15,244,195 ; pmuludq %xmm3,%xmm0 DB 102,15,244,227 ; pmuludq %xmm3,%xmm4 @@ -54200,7 +54188,7 @@ _sk_clut_4D_sse2 LABEL PROC DB 102,15,111,202 ; movdqa %xmm2,%xmm1 DB 102,15,254,77,168 ; paddd -0x58(%ebp),%xmm1 DB 102,15,112,193,245 ; pshufd $0xf5,%xmm1,%xmm0 - DB 102,15,111,145,36,84,0,0 ; movdqa 0x5424(%ecx),%xmm2 + DB 102,15,111,145,40,84,0,0 ; movdqa 0x5428(%ecx),%xmm2 DB 102,15,244,202 ; pmuludq %xmm2,%xmm1 DB 102,15,244,194 ; pmuludq %xmm2,%xmm0 DB 102,15,112,192,232 ; pshufd $0xe8,%xmm0,%xmm0 @@ -54236,7 +54224,7 @@ _sk_clut_4D_sse2 LABEL PROC DB 243,15,16,4,130 ; movss (%edx,%eax,4),%xmm0 DB 15,20,216 ; unpcklps %xmm0,%xmm3 DB 102,15,20,217 ; unpcklpd %xmm1,%xmm3 - DB 102,15,254,185,164,77,0,0 ; paddd 0x4da4(%ecx),%xmm7 + DB 102,15,254,185,168,77,0,0 ; paddd 0x4da8(%ecx),%xmm7 DB 102,15,112,199,229 ; pshufd $0xe5,%xmm7,%xmm0 DB 102,15,126,192 ; movd %xmm0,%eax DB 102,15,112,199,78 ; pshufd $0x4e,%xmm7,%xmm0 @@ -54286,7 +54274,7 @@ _sk_clut_4D_sse2 LABEL PROC DB 102,15,111,233 ; movdqa %xmm1,%xmm5 DB 102,15,254,69,152 ; paddd -0x68(%ebp),%xmm0 DB 102,15,112,200,245 ; pshufd $0xf5,%xmm0,%xmm1 - DB 102,15,111,145,36,84,0,0 ; movdqa 0x5424(%ecx),%xmm2 + DB 102,15,111,145,40,84,0,0 ; movdqa 0x5428(%ecx),%xmm2 DB 102,15,244,194 ; pmuludq %xmm2,%xmm0 DB 102,15,244,202 ; pmuludq %xmm2,%xmm1 DB 102,15,111,250 ; movdqa %xmm2,%xmm7 @@ -54325,7 +54313,7 @@ _sk_clut_4D_sse2 LABEL PROC DB 243,15,16,36,130 ; movss (%edx,%eax,4),%xmm4 DB 15,20,204 ; unpcklps %xmm4,%xmm1 DB 102,15,20,203 ; unpcklpd %xmm3,%xmm1 - DB 102,15,254,145,164,77,0,0 ; paddd 0x4da4(%ecx),%xmm2 + DB 102,15,254,145,168,77,0,0 ; paddd 0x4da8(%ecx),%xmm2 DB 102,15,112,218,229 ; pshufd $0xe5,%xmm2,%xmm3 DB 102,15,126,216 ; movd %xmm3,%eax DB 102,15,112,218,78 ; pshufd $0x4e,%xmm2,%xmm3 @@ -54379,7 +54367,7 @@ _sk_clut_4D_sse2 LABEL PROC DB 243,15,16,36,130 ; movss (%edx,%eax,4),%xmm4 DB 15,20,252 ; unpcklps %xmm4,%xmm7 DB 102,15,20,254 ; unpcklpd %xmm6,%xmm7 - DB 102,15,254,153,164,77,0,0 ; paddd 0x4da4(%ecx),%xmm3 + DB 102,15,254,153,168,77,0,0 ; paddd 0x4da8(%ecx),%xmm3 DB 102,15,112,227,229 ; pshufd $0xe5,%xmm3,%xmm4 DB 102,15,126,224 ; movd %xmm4,%eax DB 102,15,112,227,78 ; pshufd $0x4e,%xmm3,%xmm4 @@ -54412,7 +54400,7 @@ _sk_clut_4D_sse2 LABEL PROC DB 102,15,254,208 ; paddd %xmm0,%xmm2 DB 102,15,111,216 ; movdqa %xmm0,%xmm3 DB 102,15,112,194,245 ; pshufd $0xf5,%xmm2,%xmm0 - DB 102,15,111,137,36,84,0,0 ; movdqa 0x5424(%ecx),%xmm1 + DB 102,15,111,137,40,84,0,0 ; movdqa 0x5428(%ecx),%xmm1 DB 102,15,244,209 ; pmuludq %xmm1,%xmm2 DB 102,15,244,193 ; pmuludq %xmm1,%xmm0 DB 102,15,111,241 ; movdqa %xmm1,%xmm6 @@ -54452,7 +54440,7 @@ _sk_clut_4D_sse2 LABEL PROC DB 15,20,225 ; unpcklps %xmm1,%xmm4 DB 102,15,20,226 ; unpcklpd %xmm2,%xmm4 DB 102,15,41,165,88,255,255,255 ; movapd %xmm4,-0xa8(%ebp) - DB 102,15,254,129,164,77,0,0 ; paddd 0x4da4(%ecx),%xmm0 + DB 102,15,254,129,168,77,0,0 ; paddd 0x4da8(%ecx),%xmm0 DB 102,15,112,200,229 ; pshufd $0xe5,%xmm0,%xmm1 DB 102,15,126,200 ; movd %xmm1,%eax DB 102,15,112,200,78 ; pshufd $0x4e,%xmm0,%xmm1 @@ -54506,7 +54494,7 @@ _sk_clut_4D_sse2 LABEL PROC DB 243,15,16,52,130 ; movss (%edx,%eax,4),%xmm6 DB 15,20,206 ; unpcklps %xmm6,%xmm1 DB 102,15,20,203 ; unpcklpd %xmm3,%xmm1 - DB 102,15,254,145,164,77,0,0 ; paddd 0x4da4(%ecx),%xmm2 + DB 102,15,254,145,168,77,0,0 ; paddd 0x4da8(%ecx),%xmm2 DB 102,15,112,218,229 ; pshufd $0xe5,%xmm2,%xmm3 DB 102,15,126,216 ; movd %xmm3,%eax DB 102,15,112,218,78 ; pshufd $0x4e,%xmm2,%xmm3 @@ -54557,8 +54545,8 @@ _sk_clut_4D_sse2 LABEL PROC DB 15,92,212 ; subps %xmm4,%xmm2 DB 15,89,211 ; mulps %xmm3,%xmm2 DB 15,88,212 ; addps %xmm4,%xmm2 - DB 15,91,157,184,254,255,255 ; cvtdq2ps -0x148(%ebp),%xmm3 - DB 15,40,165,152,254,255,255 ; movaps -0x168(%ebp),%xmm4 + DB 15,91,157,200,254,255,255 ; cvtdq2ps -0x138(%ebp),%xmm3 + DB 15,40,165,168,254,255,255 ; movaps -0x158(%ebp),%xmm4 DB 15,92,227 ; subps %xmm3,%xmm4 DB 15,40,157,40,255,255,255 ; movaps -0xd8(%ebp),%xmm3 DB 15,92,195 ; subps %xmm3,%xmm0 @@ -54572,21 +54560,21 @@ _sk_clut_4D_sse2 LABEL PROC DB 15,92,211 ; subps %xmm3,%xmm2 DB 15,89,212 ; mulps %xmm4,%xmm2 DB 15,88,211 ; addps %xmm3,%xmm2 - DB 139,69,8 ; mov 0x8(%ebp),%eax - DB 139,117,12 ; mov 0xc(%ebp),%esi - DB 141,86,8 ; lea 0x8(%esi),%edx + DB 139,85,12 ; mov 0xc(%ebp),%edx + DB 141,66,8 ; lea 0x8(%edx),%eax DB 131,236,8 ; sub $0x8,%esp - DB 15,40,153,100,77,0,0 ; movaps 0x4d64(%ecx),%xmm3 - DB 82 ; push %edx + DB 15,40,153,104,77,0,0 ; movaps 0x4d68(%ecx),%xmm3 DB 80 ; push %eax - DB 255,86,4 ; call *0x4(%esi) - DB 129,196,108,1,0,0 ; add $0x16c,%esp + DB 255,117,8 ; pushl 0x8(%ebp) + DB 255,82,4 ; call *0x4(%edx) + DB 129,196,92,1,0,0 ; add $0x15c,%esp DB 94 ; pop %esi DB 95 ; pop %edi DB 91 ; pop %ebx DB 93 ; pop %ebp DB 195 ; ret DB 144 ; nop + DB 144 ; nop PUBLIC _sk_start_pipeline_sse2_lowp _sk_start_pipeline_sse2_lowp LABEL PROC @@ -54599,7 +54587,7 @@ _sk_start_pipeline_sse2_lowp LABEL PROC DB 131,236,96 ; sub $0x60,%esp DB 139,125,12 ; mov 0xc(%ebp),%edi DB 59,125,20 ; cmp 0x14(%ebp),%edi - DB 15,131,198,0,0,0 ; jae 94b6 <_sk_start_pipeline_sse2_lowp+0xde> + DB 15,131,198,0,0,0 ; jae 9492 <_sk_start_pipeline_sse2_lowp+0xde> DB 139,85,16 ; mov 0x10(%ebp),%edx DB 139,69,8 ; mov 0x8(%ebp),%eax DB 139,117,24 ; mov 0x18(%ebp),%esi @@ -54613,7 +54601,7 @@ _sk_start_pipeline_sse2_lowp LABEL PROC DB 139,69,8 ; mov 0x8(%ebp),%eax DB 137,223 ; mov %ebx,%edi DB 137,243 ; mov %esi,%ebx - DB 119,78 ; ja 9467 <_sk_start_pipeline_sse2_lowp+0x8f> + DB 119,78 ; ja 9443 <_sk_start_pipeline_sse2_lowp+0x8f> DB 139,117,8 ; mov 0x8(%ebp),%esi DB 15,41,68,36,64 ; movaps %xmm0,0x40(%esp) DB 15,41,68,36,48 ; movaps %xmm0,0x30(%esp) @@ -54635,13 +54623,13 @@ _sk_start_pipeline_sse2_lowp LABEL PROC DB 131,198,16 ; add $0x10,%esi DB 57,214 ; cmp %edx,%esi DB 137,198 ; mov %eax,%esi - DB 118,181 ; jbe 941c <_sk_start_pipeline_sse2_lowp+0x44> + DB 118,181 ; jbe 93f8 <_sk_start_pipeline_sse2_lowp+0x44> DB 137,209 ; mov %edx,%ecx DB 41,193 ; sub %eax,%ecx DB 137,222 ; mov %ebx,%esi DB 137,251 ; mov %edi,%ebx DB 139,124,36,84 ; mov 0x54(%esp),%edi - DB 116,55 ; je 94ac <_sk_start_pipeline_sse2_lowp+0xd4> + DB 116,55 ; je 9488 <_sk_start_pipeline_sse2_lowp+0xd4> DB 15,41,68,36,64 ; movaps %xmm0,0x40(%esp) DB 15,41,68,36,48 ; movaps %xmm0,0x30(%esp) DB 15,41,68,36,32 ; movaps %xmm0,0x20(%esp) @@ -54659,7 +54647,7 @@ _sk_start_pipeline_sse2_lowp LABEL PROC DB 139,85,16 ; mov 0x10(%ebp),%edx DB 71 ; inc %edi DB 59,125,20 ; cmp 0x14(%ebp),%edi - DB 15,133,82,255,255,255 ; jne 9408 <_sk_start_pipeline_sse2_lowp+0x30> + DB 15,133,82,255,255,255 ; jne 93e4 <_sk_start_pipeline_sse2_lowp+0x30> DB 141,101,244 ; lea -0xc(%ebp),%esp DB 94 ; pop %esi DB 95 ; pop %edi @@ -54725,7 +54713,7 @@ _sk_black_color_sse2_lowp LABEL PROC DB 87 ; push %edi DB 86 ; push %esi DB 131,236,92 ; sub $0x5c,%esp - DB 232,0,0,0,0 ; call 9565 <_sk_black_color_sse2_lowp+0xe> + DB 232,0,0,0,0 ; call 9541 <_sk_black_color_sse2_lowp+0xe> DB 88 ; pop %eax DB 139,77,8 ; mov 0x8(%ebp),%ecx DB 139,85,16 ; mov 0x10(%ebp),%edx @@ -54744,7 +54732,7 @@ _sk_black_color_sse2_lowp LABEL PROC DB 137,84,36,8 ; mov %edx,0x8(%esp) DB 137,92,36,4 ; mov %ebx,0x4(%esp) DB 137,12,36 ; mov %ecx,(%esp) - DB 15,40,152,91,62,0,0 ; movaps 0x3e5b(%eax),%xmm3 + DB 15,40,152,95,62,0,0 ; movaps 0x3e5f(%eax),%xmm3 DB 15,87,192 ; xorps %xmm0,%xmm0 DB 15,87,201 ; xorps %xmm1,%xmm1 DB 15,87,210 ; xorps %xmm2,%xmm2 @@ -54764,7 +54752,7 @@ _sk_white_color_sse2_lowp LABEL PROC DB 87 ; push %edi DB 86 ; push %esi DB 131,236,92 ; sub $0x5c,%esp - DB 232,0,0,0,0 ; call 95d0 <_sk_white_color_sse2_lowp+0xe> + DB 232,0,0,0,0 ; call 95ac <_sk_white_color_sse2_lowp+0xe> DB 88 ; pop %eax DB 139,77,8 ; mov 0x8(%ebp),%ecx DB 139,85,16 ; mov 0x10(%ebp),%edx @@ -54783,7 +54771,7 @@ _sk_white_color_sse2_lowp LABEL PROC DB 137,84,36,8 ; mov %edx,0x8(%esp) DB 137,92,36,4 ; mov %ebx,0x4(%esp) DB 137,12,36 ; mov %ecx,(%esp) - DB 15,40,128,240,61,0,0 ; movaps 0x3df0(%eax),%xmm0 + DB 15,40,128,244,61,0,0 ; movaps 0x3df4(%eax),%xmm0 DB 15,40,200 ; movaps %xmm0,%xmm1 DB 15,40,208 ; movaps %xmm0,%xmm2 DB 15,40,216 ; movaps %xmm0,%xmm3 @@ -54802,16 +54790,16 @@ _sk_set_rgb_sse2_lowp LABEL PROC DB 87 ; push %edi DB 86 ; push %esi DB 131,236,80 ; sub $0x50,%esp - DB 232,0,0,0,0 ; call 963a <_sk_set_rgb_sse2_lowp+0xd> + DB 232,0,0,0,0 ; call 9616 <_sk_set_rgb_sse2_lowp+0xd> DB 94 ; pop %esi DB 139,69,8 ; mov 0x8(%ebp),%eax DB 139,85,16 ; mov 0x10(%ebp),%edx DB 139,77,12 ; mov 0xc(%ebp),%ecx DB 139,57 ; mov (%ecx),%edi - DB 243,15,16,150,74,62,0,0 ; movss 0x3e4a(%esi),%xmm2 + DB 243,15,16,150,78,62,0,0 ; movss 0x3e4e(%esi),%xmm2 DB 243,15,16,7 ; movss (%edi),%xmm0 DB 243,15,89,194 ; mulss %xmm2,%xmm0 - DB 243,15,16,142,70,62,0,0 ; movss 0x3e46(%esi),%xmm1 + DB 243,15,16,142,74,62,0,0 ; movss 0x3e4a(%esi),%xmm1 DB 243,15,88,193 ; addss %xmm1,%xmm0 DB 243,15,44,240 ; cvttss2si %xmm0,%esi DB 102,15,110,198 ; movd %esi,%xmm0 @@ -54858,7 +54846,7 @@ _sk_premul_sse2_lowp LABEL PROC DB 87 ; push %edi DB 86 ; push %esi DB 131,236,80 ; sub $0x50,%esp - DB 232,0,0,0,0 ; call 96fe <_sk_premul_sse2_lowp+0xd> + DB 232,0,0,0,0 ; call 96da <_sk_premul_sse2_lowp+0xd> DB 90 ; pop %edx DB 139,69,8 ; mov 0x8(%ebp),%eax DB 139,77,16 ; mov 0x10(%ebp),%ecx @@ -54867,7 +54855,7 @@ _sk_premul_sse2_lowp LABEL PROC DB 15,40,109,40 ; movaps 0x28(%ebp),%xmm5 DB 15,40,117,56 ; movaps 0x38(%ebp),%xmm6 DB 102,15,213,195 ; pmullw %xmm3,%xmm0 - DB 102,15,111,186,194,60,0,0 ; movdqa 0x3cc2(%edx),%xmm7 + DB 102,15,111,186,198,60,0,0 ; movdqa 0x3cc6(%edx),%xmm7 DB 102,15,253,199 ; paddw %xmm7,%xmm0 DB 102,15,213,203 ; pmullw %xmm3,%xmm1 DB 102,15,253,207 ; paddw %xmm7,%xmm1 @@ -54993,12 +54981,12 @@ _sk_invert_sse2_lowp LABEL PROC DB 87 ; push %edi DB 86 ; push %esi DB 131,236,80 ; sub $0x50,%esp - DB 232,0,0,0,0 ; call 9878 <_sk_invert_sse2_lowp+0xd> + DB 232,0,0,0,0 ; call 9854 <_sk_invert_sse2_lowp+0xd> DB 88 ; pop %eax DB 139,77,8 ; mov 0x8(%ebp),%ecx DB 139,85,16 ; mov 0x10(%ebp),%edx DB 139,117,20 ; mov 0x14(%ebp),%esi - DB 102,15,111,160,72,59,0,0 ; movdqa 0x3b48(%eax),%xmm4 + DB 102,15,111,160,76,59,0,0 ; movdqa 0x3b4c(%eax),%xmm4 DB 102,15,111,236 ; movdqa %xmm4,%xmm5 DB 102,15,249,232 ; psubw %xmm0,%xmm5 DB 102,15,111,244 ; movdqa %xmm4,%xmm6 @@ -55076,11 +55064,11 @@ _sk_srcatop_sse2_lowp LABEL PROC DB 102,15,111,234 ; movdqa %xmm2,%xmm5 DB 102,15,111,209 ; movdqa %xmm1,%xmm2 DB 102,15,111,200 ; movdqa %xmm0,%xmm1 - DB 232,0,0,0,0 ; call 9970 <_sk_srcatop_sse2_lowp+0x19> + DB 232,0,0,0,0 ; call 994c <_sk_srcatop_sse2_lowp+0x19> DB 88 ; pop %eax DB 102,15,111,117,72 ; movdqa 0x48(%ebp),%xmm6 DB 102,15,213,206 ; pmullw %xmm6,%xmm1 - DB 102,15,111,128,80,58,0,0 ; movdqa 0x3a50(%eax),%xmm0 + DB 102,15,111,128,84,58,0,0 ; movdqa 0x3a54(%eax),%xmm0 DB 102,15,253,200 ; paddw %xmm0,%xmm1 DB 102,15,213,214 ; pmullw %xmm6,%xmm2 DB 102,15,253,208 ; paddw %xmm0,%xmm2 @@ -55136,12 +55124,12 @@ _sk_dstatop_sse2_lowp LABEL PROC DB 87 ; push %edi DB 86 ; push %esi DB 131,236,80 ; sub $0x50,%esp - DB 232,0,0,0,0 ; call 9a44 <_sk_dstatop_sse2_lowp+0xd> + DB 232,0,0,0,0 ; call 9a20 <_sk_dstatop_sse2_lowp+0xd> DB 88 ; pop %eax DB 102,15,111,101,40 ; movdqa 0x28(%ebp),%xmm4 DB 102,15,111,117,24 ; movdqa 0x18(%ebp),%xmm6 DB 102,15,213,243 ; pmullw %xmm3,%xmm6 - DB 102,15,111,184,124,57,0,0 ; movdqa 0x397c(%eax),%xmm7 + DB 102,15,111,184,128,57,0,0 ; movdqa 0x3980(%eax),%xmm7 DB 102,15,253,247 ; paddw %xmm7,%xmm6 DB 102,15,213,227 ; pmullw %xmm3,%xmm4 DB 102,15,253,231 ; paddw %xmm7,%xmm4 @@ -55192,7 +55180,7 @@ _sk_srcin_sse2_lowp LABEL PROC DB 87 ; push %edi DB 86 ; push %esi DB 131,236,80 ; sub $0x50,%esp - DB 232,0,0,0,0 ; call 9b05 <_sk_srcin_sse2_lowp+0xd> + DB 232,0,0,0,0 ; call 9ae1 <_sk_srcin_sse2_lowp+0xd> DB 94 ; pop %esi DB 139,69,8 ; mov 0x8(%ebp),%eax DB 139,77,16 ; mov 0x10(%ebp),%ecx @@ -55201,7 +55189,7 @@ _sk_srcin_sse2_lowp LABEL PROC DB 15,40,109,40 ; movaps 0x28(%ebp),%xmm5 DB 102,15,111,117,72 ; movdqa 0x48(%ebp),%xmm6 DB 102,15,213,198 ; pmullw %xmm6,%xmm0 - DB 102,15,111,190,187,56,0,0 ; movdqa 0x38bb(%esi),%xmm7 + DB 102,15,111,190,191,56,0,0 ; movdqa 0x38bf(%esi),%xmm7 DB 102,15,253,199 ; paddw %xmm7,%xmm0 DB 102,15,213,206 ; pmullw %xmm6,%xmm1 DB 102,15,253,207 ; paddw %xmm7,%xmm1 @@ -55238,14 +55226,14 @@ _sk_dstin_sse2_lowp LABEL PROC DB 87 ; push %edi DB 86 ; push %esi DB 131,236,80 ; sub $0x50,%esp - DB 232,0,0,0,0 ; call 9b9c <_sk_dstin_sse2_lowp+0xd> + DB 232,0,0,0,0 ; call 9b78 <_sk_dstin_sse2_lowp+0xd> DB 88 ; pop %eax DB 102,15,111,85,56 ; movdqa 0x38(%ebp),%xmm2 DB 102,15,111,109,40 ; movdqa 0x28(%ebp),%xmm5 DB 102,15,111,117,24 ; movdqa 0x18(%ebp),%xmm6 DB 102,15,111,198 ; movdqa %xmm6,%xmm0 DB 102,15,213,195 ; pmullw %xmm3,%xmm0 - DB 102,15,111,184,36,56,0,0 ; movdqa 0x3824(%eax),%xmm7 + DB 102,15,111,184,40,56,0,0 ; movdqa 0x3828(%eax),%xmm7 DB 102,15,253,199 ; paddw %xmm7,%xmm0 DB 102,15,111,205 ; movdqa %xmm5,%xmm1 DB 102,15,213,203 ; pmullw %xmm3,%xmm1 @@ -55287,14 +55275,14 @@ _sk_srcout_sse2_lowp LABEL PROC DB 87 ; push %edi DB 86 ; push %esi DB 131,236,80 ; sub $0x50,%esp - DB 232,0,0,0,0 ; call 9c44 <_sk_srcout_sse2_lowp+0xd> + DB 232,0,0,0,0 ; call 9c20 <_sk_srcout_sse2_lowp+0xd> DB 94 ; pop %esi DB 139,69,8 ; mov 0x8(%ebp),%eax DB 139,77,16 ; mov 0x10(%ebp),%ecx DB 139,85,20 ; mov 0x14(%ebp),%edx DB 15,40,101,24 ; movaps 0x18(%ebp),%xmm4 DB 102,15,111,109,72 ; movdqa 0x48(%ebp),%xmm5 - DB 102,15,111,182,124,55,0,0 ; movdqa 0x377c(%esi),%xmm6 + DB 102,15,111,182,128,55,0,0 ; movdqa 0x3780(%esi),%xmm6 DB 102,15,111,254 ; movdqa %xmm6,%xmm7 DB 102,15,249,253 ; psubw %xmm5,%xmm7 DB 102,15,213,199 ; pmullw %xmm7,%xmm0 @@ -55336,11 +55324,11 @@ _sk_dstout_sse2_lowp LABEL PROC DB 86 ; push %esi DB 131,236,80 ; sub $0x50,%esp DB 102,15,111,195 ; movdqa %xmm3,%xmm0 - DB 232,0,0,0,0 ; call 9ce7 <_sk_dstout_sse2_lowp+0x11> + DB 232,0,0,0,0 ; call 9cc3 <_sk_dstout_sse2_lowp+0x11> DB 88 ; pop %eax DB 102,15,111,109,56 ; movdqa 0x38(%ebp),%xmm5 DB 102,15,111,117,24 ; movdqa 0x18(%ebp),%xmm6 - DB 102,15,111,184,217,54,0,0 ; movdqa 0x36d9(%eax),%xmm7 + DB 102,15,111,184,221,54,0,0 ; movdqa 0x36dd(%eax),%xmm7 DB 102,15,111,223 ; movdqa %xmm7,%xmm3 DB 102,15,249,216 ; psubw %xmm0,%xmm3 DB 102,15,111,195 ; movdqa %xmm3,%xmm0 @@ -55390,9 +55378,9 @@ _sk_srcover_sse2_lowp LABEL PROC DB 15,41,85,232 ; movaps %xmm2,-0x18(%ebp) DB 102,15,111,209 ; movdqa %xmm1,%xmm2 DB 102,15,111,224 ; movdqa %xmm0,%xmm4 - DB 232,0,0,0,0 ; call 9da3 <_sk_srcover_sse2_lowp+0x19> + DB 232,0,0,0,0 ; call 9d7f <_sk_srcover_sse2_lowp+0x19> DB 88 ; pop %eax - DB 102,15,111,136,29,54,0,0 ; movdqa 0x361d(%eax),%xmm1 + DB 102,15,111,136,33,54,0,0 ; movdqa 0x3621(%eax),%xmm1 DB 102,15,111,193 ; movdqa %xmm1,%xmm0 DB 102,15,249,195 ; psubw %xmm3,%xmm0 DB 102,15,111,248 ; movdqa %xmm0,%xmm7 @@ -55449,7 +55437,7 @@ _sk_dstover_sse2_lowp LABEL PROC DB 87 ; push %edi DB 86 ; push %esi DB 131,236,80 ; sub $0x50,%esp - DB 232,0,0,0,0 ; call 9e73 <_sk_dstover_sse2_lowp+0xd> + DB 232,0,0,0,0 ; call 9e4f <_sk_dstover_sse2_lowp+0xd> DB 95 ; pop %edi DB 139,77,8 ; mov 0x8(%ebp),%ecx DB 139,85,16 ; mov 0x10(%ebp),%edx @@ -55457,7 +55445,7 @@ _sk_dstover_sse2_lowp LABEL PROC DB 139,69,12 ; mov 0xc(%ebp),%eax DB 102,15,111,101,56 ; movdqa 0x38(%ebp),%xmm4 DB 102,15,111,109,72 ; movdqa 0x48(%ebp),%xmm5 - DB 102,15,111,183,77,53,0,0 ; movdqa 0x354d(%edi),%xmm6 + DB 102,15,111,183,81,53,0,0 ; movdqa 0x3551(%edi),%xmm6 DB 102,15,111,254 ; movdqa %xmm6,%xmm7 DB 102,15,249,253 ; psubw %xmm5,%xmm7 DB 102,15,213,199 ; pmullw %xmm7,%xmm0 @@ -55501,12 +55489,12 @@ _sk_modulate_sse2_lowp LABEL PROC DB 87 ; push %edi DB 86 ; push %esi DB 131,236,80 ; sub $0x50,%esp - DB 232,0,0,0,0 ; call 9f28 <_sk_modulate_sse2_lowp+0xd> + DB 232,0,0,0,0 ; call 9f04 <_sk_modulate_sse2_lowp+0xd> DB 88 ; pop %eax DB 102,15,111,109,40 ; movdqa 0x28(%ebp),%xmm5 DB 102,15,111,117,24 ; movdqa 0x18(%ebp),%xmm6 DB 102,15,213,198 ; pmullw %xmm6,%xmm0 - DB 102,15,111,184,152,52,0,0 ; movdqa 0x3498(%eax),%xmm7 + DB 102,15,111,184,156,52,0,0 ; movdqa 0x349c(%eax),%xmm7 DB 102,15,253,199 ; paddw %xmm7,%xmm0 DB 102,15,213,205 ; pmullw %xmm5,%xmm1 DB 102,15,253,207 ; paddw %xmm7,%xmm1 @@ -55547,10 +55535,10 @@ _sk_multiply_sse2_lowp LABEL PROC DB 87 ; push %edi DB 86 ; push %esi DB 131,236,80 ; sub $0x50,%esp - DB 232,0,0,0,0 ; call 9fc4 <_sk_multiply_sse2_lowp+0xd> + DB 232,0,0,0,0 ; call 9fa0 <_sk_multiply_sse2_lowp+0xd> DB 88 ; pop %eax DB 102,15,111,109,24 ; movdqa 0x18(%ebp),%xmm5 - DB 102,15,111,160,252,51,0,0 ; movdqa 0x33fc(%eax),%xmm4 + DB 102,15,111,160,0,52,0,0 ; movdqa 0x3400(%eax),%xmm4 DB 102,15,111,245 ; movdqa %xmm5,%xmm6 DB 102,15,253,244 ; paddw %xmm4,%xmm6 DB 102,15,249,117,72 ; psubw 0x48(%ebp),%xmm6 @@ -55618,17 +55606,17 @@ _sk_plus__sse2_lowp LABEL PROC DB 131,236,96 ; sub $0x60,%esp DB 102,15,111,225 ; movdqa %xmm1,%xmm4 DB 102,15,111,200 ; movdqa %xmm0,%xmm1 - DB 232,0,0,0,0 ; call a0c5 <_sk_plus__sse2_lowp+0x15> + DB 232,0,0,0,0 ; call a0a1 <_sk_plus__sse2_lowp+0x15> DB 88 ; pop %eax DB 102,15,253,77,24 ; paddw 0x18(%ebp),%xmm1 - DB 102,15,111,168,11,51,0,0 ; movdqa 0x330b(%eax),%xmm5 + DB 102,15,111,168,15,51,0,0 ; movdqa 0x330f(%eax),%xmm5 DB 102,15,111,193 ; movdqa %xmm1,%xmm0 DB 102,15,217,197 ; psubusw %xmm5,%xmm0 DB 102,15,127,109,232 ; movdqa %xmm5,-0x18(%ebp) DB 102,15,239,255 ; pxor %xmm7,%xmm7 DB 102,15,117,199 ; pcmpeqw %xmm7,%xmm0 DB 102,15,219,200 ; pand %xmm0,%xmm1 - DB 102,15,111,176,251,50,0,0 ; movdqa 0x32fb(%eax),%xmm6 + DB 102,15,111,176,255,50,0,0 ; movdqa 0x32ff(%eax),%xmm6 DB 102,15,223,198 ; pandn %xmm6,%xmm0 DB 102,15,235,193 ; por %xmm1,%xmm0 DB 102,15,253,101,40 ; paddw 0x28(%ebp),%xmm4 @@ -55687,14 +55675,14 @@ _sk_screen_sse2_lowp LABEL PROC DB 131,236,80 ; sub $0x50,%esp DB 102,15,111,225 ; movdqa %xmm1,%xmm4 DB 102,15,111,200 ; movdqa %xmm0,%xmm1 - DB 232,0,0,0,0 ; call a1bd <_sk_screen_sse2_lowp+0x15> + DB 232,0,0,0,0 ; call a199 <_sk_screen_sse2_lowp+0x15> DB 88 ; pop %eax DB 102,15,111,109,40 ; movdqa 0x28(%ebp),%xmm5 DB 102,15,111,117,24 ; movdqa 0x18(%ebp),%xmm6 DB 102,15,111,198 ; movdqa %xmm6,%xmm0 DB 102,15,253,193 ; paddw %xmm1,%xmm0 DB 102,15,213,206 ; pmullw %xmm6,%xmm1 - DB 102,15,111,176,3,50,0,0 ; movdqa 0x3203(%eax),%xmm6 + DB 102,15,111,176,7,50,0,0 ; movdqa 0x3207(%eax),%xmm6 DB 102,15,253,206 ; paddw %xmm6,%xmm1 DB 102,15,113,209,8 ; psrlw $0x8,%xmm1 DB 102,15,249,193 ; psubw %xmm1,%xmm0 @@ -55750,9 +55738,9 @@ _sk_xor__sse2_lowp LABEL PROC DB 86 ; push %esi DB 131,236,96 ; sub $0x60,%esp DB 102,15,127,93,232 ; movdqa %xmm3,-0x18(%ebp) - DB 232,0,0,0,0 ; call a29d <_sk_xor__sse2_lowp+0x12> + DB 232,0,0,0,0 ; call a279 <_sk_xor__sse2_lowp+0x12> DB 88 ; pop %eax - DB 102,15,111,176,35,49,0,0 ; movdqa 0x3123(%eax),%xmm6 + DB 102,15,111,176,39,49,0,0 ; movdqa 0x3127(%eax),%xmm6 DB 102,15,111,254 ; movdqa %xmm6,%xmm7 DB 102,15,249,125,72 ; psubw 0x48(%ebp),%xmm7 DB 102,15,213,199 ; pmullw %xmm7,%xmm0 @@ -55817,7 +55805,7 @@ _sk_darken_sse2_lowp LABEL PROC DB 15,41,85,200 ; movaps %xmm2,-0x38(%ebp) DB 102,15,111,225 ; movdqa %xmm1,%xmm4 DB 102,15,111,200 ; movdqa %xmm0,%xmm1 - DB 232,0,0,0,0 ; call a392 <_sk_darken_sse2_lowp+0x25> + DB 232,0,0,0,0 ; call a36e <_sk_darken_sse2_lowp+0x25> DB 88 ; pop %eax DB 102,15,111,117,72 ; movdqa 0x48(%ebp),%xmm6 DB 102,15,111,109,24 ; movdqa 0x18(%ebp),%xmm5 @@ -55828,7 +55816,7 @@ _sk_darken_sse2_lowp LABEL PROC DB 102,15,111,222 ; movdqa %xmm6,%xmm3 DB 102,15,111,197 ; movdqa %xmm5,%xmm0 DB 102,15,213,199 ; pmullw %xmm7,%xmm0 - DB 102,15,111,184,78,48,0,0 ; movdqa 0x304e(%eax),%xmm7 + DB 102,15,111,184,82,48,0,0 ; movdqa 0x3052(%eax),%xmm7 DB 102,15,111,241 ; movdqa %xmm1,%xmm6 DB 102,15,239,247 ; pxor %xmm7,%xmm6 DB 102,15,111,232 ; movdqa %xmm0,%xmm5 @@ -55837,7 +55825,7 @@ _sk_darken_sse2_lowp LABEL PROC DB 102,15,219,197 ; pand %xmm5,%xmm0 DB 102,15,223,233 ; pandn %xmm1,%xmm5 DB 102,15,235,232 ; por %xmm0,%xmm5 - DB 102,15,111,128,46,48,0,0 ; movdqa 0x302e(%eax),%xmm0 + DB 102,15,111,128,50,48,0,0 ; movdqa 0x3032(%eax),%xmm0 DB 102,15,127,69,232 ; movdqa %xmm0,-0x18(%ebp) DB 102,15,253,232 ; paddw %xmm0,%xmm5 DB 102,15,113,213,8 ; psrlw $0x8,%xmm5 @@ -55926,7 +55914,7 @@ _sk_lighten_sse2_lowp LABEL PROC DB 15,41,85,200 ; movaps %xmm2,-0x38(%ebp) DB 102,15,111,225 ; movdqa %xmm1,%xmm4 DB 102,15,111,200 ; movdqa %xmm0,%xmm1 - DB 232,0,0,0,0 ; call a53b <_sk_lighten_sse2_lowp+0x25> + DB 232,0,0,0,0 ; call a517 <_sk_lighten_sse2_lowp+0x25> DB 88 ; pop %eax DB 102,15,111,109,24 ; movdqa 0x18(%ebp),%xmm5 DB 102,15,111,197 ; movdqa %xmm5,%xmm0 @@ -55935,7 +55923,7 @@ _sk_lighten_sse2_lowp LABEL PROC DB 102,15,213,77,72 ; pmullw 0x48(%ebp),%xmm1 DB 102,15,111,197 ; movdqa %xmm5,%xmm0 DB 102,15,213,198 ; pmullw %xmm6,%xmm0 - DB 102,15,111,184,165,46,0,0 ; movdqa 0x2ea5(%eax),%xmm7 + DB 102,15,111,184,169,46,0,0 ; movdqa 0x2ea9(%eax),%xmm7 DB 102,15,111,241 ; movdqa %xmm1,%xmm6 DB 102,15,239,247 ; pxor %xmm7,%xmm6 DB 102,15,111,232 ; movdqa %xmm0,%xmm5 @@ -55944,7 +55932,7 @@ _sk_lighten_sse2_lowp LABEL PROC DB 102,15,219,205 ; pand %xmm5,%xmm1 DB 102,15,223,232 ; pandn %xmm0,%xmm5 DB 102,15,235,233 ; por %xmm1,%xmm5 - DB 102,15,111,128,133,46,0,0 ; movdqa 0x2e85(%eax),%xmm0 + DB 102,15,111,128,137,46,0,0 ; movdqa 0x2e89(%eax),%xmm0 DB 102,15,253,232 ; paddw %xmm0,%xmm5 DB 102,15,111,208 ; movdqa %xmm0,%xmm2 DB 102,15,127,85,232 ; movdqa %xmm2,-0x18(%ebp) @@ -56032,7 +56020,7 @@ _sk_difference_sse2_lowp LABEL PROC DB 15,41,85,184 ; movaps %xmm2,-0x48(%ebp) DB 102,15,111,225 ; movdqa %xmm1,%xmm4 DB 102,15,111,200 ; movdqa %xmm0,%xmm1 - DB 232,0,0,0,0 ; call a6d9 <_sk_difference_sse2_lowp+0x25> + DB 232,0,0,0,0 ; call a6b5 <_sk_difference_sse2_lowp+0x25> DB 88 ; pop %eax DB 102,15,111,117,72 ; movdqa 0x48(%ebp),%xmm6 DB 102,15,111,109,24 ; movdqa 0x18(%ebp),%xmm5 @@ -56043,7 +56031,7 @@ _sk_difference_sse2_lowp LABEL PROC DB 102,15,111,222 ; movdqa %xmm6,%xmm3 DB 102,15,111,197 ; movdqa %xmm5,%xmm0 DB 102,15,213,199 ; pmullw %xmm7,%xmm0 - DB 102,15,111,184,7,45,0,0 ; movdqa 0x2d07(%eax),%xmm7 + DB 102,15,111,184,11,45,0,0 ; movdqa 0x2d0b(%eax),%xmm7 DB 102,15,111,241 ; movdqa %xmm1,%xmm6 DB 102,15,239,247 ; pxor %xmm7,%xmm6 DB 102,15,111,232 ; movdqa %xmm0,%xmm5 @@ -56052,11 +56040,11 @@ _sk_difference_sse2_lowp LABEL PROC DB 102,15,219,205 ; pand %xmm5,%xmm1 DB 102,15,223,232 ; pandn %xmm0,%xmm5 DB 102,15,235,233 ; por %xmm1,%xmm5 - DB 102,15,111,128,231,44,0,0 ; movdqa 0x2ce7(%eax),%xmm0 + DB 102,15,111,128,235,44,0,0 ; movdqa 0x2ceb(%eax),%xmm0 DB 102,15,127,69,216 ; movdqa %xmm0,-0x28(%ebp) DB 102,15,253,232 ; paddw %xmm0,%xmm5 DB 102,15,113,213,7 ; psrlw $0x7,%xmm5 - DB 102,15,111,128,23,45,0,0 ; movdqa 0x2d17(%eax),%xmm0 + DB 102,15,111,128,27,45,0,0 ; movdqa 0x2d1b(%eax),%xmm0 DB 102,15,127,69,232 ; movdqa %xmm0,-0x18(%ebp) DB 102,15,219,232 ; pand %xmm0,%xmm5 DB 102,15,249,213 ; psubw %xmm5,%xmm2 @@ -56143,16 +56131,16 @@ _sk_exclusion_sse2_lowp LABEL PROC DB 131,236,80 ; sub $0x50,%esp DB 102,15,111,225 ; movdqa %xmm1,%xmm4 DB 102,15,111,200 ; movdqa %xmm0,%xmm1 - DB 232,0,0,0,0 ; call a88d <_sk_exclusion_sse2_lowp+0x15> + DB 232,0,0,0,0 ; call a869 <_sk_exclusion_sse2_lowp+0x15> DB 88 ; pop %eax DB 102,15,111,109,24 ; movdqa 0x18(%ebp),%xmm5 DB 102,15,111,197 ; movdqa %xmm5,%xmm0 DB 102,15,253,193 ; paddw %xmm1,%xmm0 DB 102,15,213,205 ; pmullw %xmm5,%xmm1 - DB 102,15,111,184,51,43,0,0 ; movdqa 0x2b33(%eax),%xmm7 + DB 102,15,111,184,55,43,0,0 ; movdqa 0x2b37(%eax),%xmm7 DB 102,15,253,207 ; paddw %xmm7,%xmm1 DB 102,15,113,209,7 ; psrlw $0x7,%xmm1 - DB 102,15,111,176,99,43,0,0 ; movdqa 0x2b63(%eax),%xmm6 + DB 102,15,111,176,103,43,0,0 ; movdqa 0x2b67(%eax),%xmm6 DB 102,15,219,206 ; pand %xmm6,%xmm1 DB 102,15,249,193 ; psubw %xmm1,%xmm0 DB 102,15,111,109,40 ; movdqa 0x28(%ebp),%xmm5 @@ -56211,9 +56199,9 @@ _sk_hardlight_sse2_lowp LABEL PROC DB 15,41,85,152 ; movaps %xmm2,-0x68(%ebp) DB 102,15,111,233 ; movdqa %xmm1,%xmm5 DB 102,15,111,224 ; movdqa %xmm0,%xmm4 - DB 232,0,0,0,0 ; call a987 <_sk_hardlight_sse2_lowp+0x1c> + DB 232,0,0,0,0 ; call a963 <_sk_hardlight_sse2_lowp+0x1c> DB 88 ; pop %eax - DB 102,15,111,184,57,42,0,0 ; movdqa 0x2a39(%eax),%xmm7 + DB 102,15,111,184,61,42,0,0 ; movdqa 0x2a3d(%eax),%xmm7 DB 102,15,127,125,200 ; movdqa %xmm7,-0x38(%ebp) DB 102,15,111,215 ; movdqa %xmm7,%xmm2 DB 102,15,249,85,72 ; psubw 0x48(%ebp),%xmm2 @@ -56240,7 +56228,7 @@ _sk_hardlight_sse2_lowp LABEL PROC DB 102,15,111,214 ; movdqa %xmm6,%xmm2 DB 102,15,249,209 ; psubw %xmm1,%xmm2 DB 102,15,253,228 ; paddw %xmm4,%xmm4 - DB 102,15,111,128,89,42,0,0 ; movdqa 0x2a59(%eax),%xmm0 + DB 102,15,111,128,93,42,0,0 ; movdqa 0x2a5d(%eax),%xmm0 DB 102,15,239,216 ; pxor %xmm0,%xmm3 DB 102,15,127,93,184 ; movdqa %xmm3,-0x48(%ebp) DB 102,15,111,204 ; movdqa %xmm4,%xmm1 @@ -56345,10 +56333,10 @@ _sk_overlay_sse2_lowp LABEL PROC DB 15,41,85,152 ; movaps %xmm2,-0x68(%ebp) DB 15,41,141,120,255,255,255 ; movaps %xmm1,-0x88(%ebp) DB 102,15,111,200 ; movdqa %xmm0,%xmm1 - DB 232,0,0,0,0 ; call aba9 <_sk_overlay_sse2_lowp+0x1f> + DB 232,0,0,0,0 ; call ab85 <_sk_overlay_sse2_lowp+0x1f> DB 88 ; pop %eax DB 102,15,111,69,72 ; movdqa 0x48(%ebp),%xmm0 - DB 102,15,111,184,23,40,0,0 ; movdqa 0x2817(%eax),%xmm7 + DB 102,15,111,184,27,40,0,0 ; movdqa 0x281b(%eax),%xmm7 DB 102,15,127,125,232 ; movdqa %xmm7,-0x18(%ebp) DB 102,15,111,215 ; movdqa %xmm7,%xmm2 DB 102,15,249,208 ; psubw %xmm0,%xmm2 @@ -56375,7 +56363,7 @@ _sk_overlay_sse2_lowp LABEL PROC DB 102,15,249,234 ; psubw %xmm2,%xmm5 DB 102,15,111,195 ; movdqa %xmm3,%xmm0 DB 102,15,253,192 ; paddw %xmm0,%xmm0 - DB 102,15,111,144,55,40,0,0 ; movdqa 0x2837(%eax),%xmm2 + DB 102,15,111,144,59,40,0,0 ; movdqa 0x283b(%eax),%xmm2 DB 102,15,127,85,184 ; movdqa %xmm2,-0x48(%ebp) DB 102,15,239,226 ; pxor %xmm2,%xmm4 DB 102,15,239,194 ; pxor %xmm2,%xmm0 @@ -56503,10 +56491,10 @@ _sk_load_8888_sse2_lowp LABEL PROC DB 128,225,7 ; and $0x7,%cl DB 254,201 ; dec %cl DB 128,249,6 ; cmp $0x6,%cl - DB 232,0,0,0,0 ; call ae18 <_sk_load_8888_sse2_lowp+0x30> + DB 232,0,0,0,0 ; call adf4 <_sk_load_8888_sse2_lowp+0x30> DB 95 ; pop %edi DB 139,117,16 ; mov 0x10(%ebp),%esi - DB 119,32 ; ja ae3e <_sk_load_8888_sse2_lowp+0x56> + DB 119,32 ; ja ae1a <_sk_load_8888_sse2_lowp+0x56> DB 102,15,239,246 ; pxor %xmm6,%xmm6 DB 15,182,201 ; movzbl %cl,%ecx DB 139,140,143,52,1,0,0 ; mov 0x134(%edi,%ecx,4),%ecx @@ -56515,14 +56503,14 @@ _sk_load_8888_sse2_lowp LABEL PROC DB 255,225 ; jmp *%ecx DB 243,15,16,28,179 ; movss (%ebx,%esi,4),%xmm3 DB 15,87,246 ; xorps %xmm6,%xmm6 - DB 235,73 ; jmp ae87 <_sk_load_8888_sse2_lowp+0x9f> + DB 235,73 ; jmp ae63 <_sk_load_8888_sse2_lowp+0x9f> DB 102,15,16,28,179 ; movupd (%ebx,%esi,4),%xmm3 DB 15,16,116,179,16 ; movups 0x10(%ebx,%esi,4),%xmm6 - DB 235,61 ; jmp ae87 <_sk_load_8888_sse2_lowp+0x9f> + DB 235,61 ; jmp ae63 <_sk_load_8888_sse2_lowp+0x9f> DB 102,15,110,68,179,8 ; movd 0x8(%ebx,%esi,4),%xmm0 DB 102,15,112,216,69 ; pshufd $0x45,%xmm0,%xmm3 DB 102,15,18,28,179 ; movlpd (%ebx,%esi,4),%xmm3 - DB 235,43 ; jmp ae87 <_sk_load_8888_sse2_lowp+0x9f> + DB 235,43 ; jmp ae63 <_sk_load_8888_sse2_lowp+0x9f> DB 102,15,110,68,179,24 ; movd 0x18(%ebx,%esi,4),%xmm0 DB 102,15,112,240,69 ; pshufd $0x45,%xmm0,%xmm6 DB 243,15,16,68,179,20 ; movss 0x14(%ebx,%esi,4),%xmm0 @@ -56539,7 +56527,7 @@ _sk_load_8888_sse2_lowp LABEL PROC DB 102,15,114,240,16 ; pslld $0x10,%xmm0 DB 102,15,114,224,16 ; psrad $0x10,%xmm0 DB 102,15,107,200 ; packssdw %xmm0,%xmm1 - DB 102,15,111,175,168,37,0,0 ; movdqa 0x25a8(%edi),%xmm5 + DB 102,15,111,175,172,37,0,0 ; movdqa 0x25ac(%edi),%xmm5 DB 102,15,111,193 ; movdqa %xmm1,%xmm0 DB 102,15,219,197 ; pand %xmm5,%xmm0 DB 102,15,113,209,8 ; psrlw $0x8,%xmm1 @@ -56617,10 +56605,10 @@ _sk_load_8888_dst_sse2_lowp LABEL PROC DB 128,225,7 ; and $0x7,%cl DB 254,201 ; dec %cl DB 128,249,6 ; cmp $0x6,%cl - DB 232,0,0,0,0 ; call afa5 <_sk_load_8888_dst_sse2_lowp+0x3d> + DB 232,0,0,0,0 ; call af81 <_sk_load_8888_dst_sse2_lowp+0x3d> DB 95 ; pop %edi DB 139,117,16 ; mov 0x10(%ebp),%esi - DB 119,32 ; ja afcb <_sk_load_8888_dst_sse2_lowp+0x63> + DB 119,32 ; ja afa7 <_sk_load_8888_dst_sse2_lowp+0x63> DB 102,15,239,219 ; pxor %xmm3,%xmm3 DB 15,182,201 ; movzbl %cl,%ecx DB 139,140,143,59,1,0,0 ; mov 0x13b(%edi,%ecx,4),%ecx @@ -56629,14 +56617,14 @@ _sk_load_8888_dst_sse2_lowp LABEL PROC DB 255,225 ; jmp *%ecx DB 243,15,16,60,179 ; movss (%ebx,%esi,4),%xmm7 DB 15,87,219 ; xorps %xmm3,%xmm3 - DB 235,73 ; jmp b014 <_sk_load_8888_dst_sse2_lowp+0xac> + DB 235,73 ; jmp aff0 <_sk_load_8888_dst_sse2_lowp+0xac> DB 102,15,16,60,179 ; movupd (%ebx,%esi,4),%xmm7 DB 15,16,92,179,16 ; movups 0x10(%ebx,%esi,4),%xmm3 - DB 235,61 ; jmp b014 <_sk_load_8888_dst_sse2_lowp+0xac> + DB 235,61 ; jmp aff0 <_sk_load_8888_dst_sse2_lowp+0xac> DB 102,15,110,84,179,8 ; movd 0x8(%ebx,%esi,4),%xmm2 DB 102,15,112,250,69 ; pshufd $0x45,%xmm2,%xmm7 DB 102,15,18,60,179 ; movlpd (%ebx,%esi,4),%xmm7 - DB 235,43 ; jmp b014 <_sk_load_8888_dst_sse2_lowp+0xac> + DB 235,43 ; jmp aff0 <_sk_load_8888_dst_sse2_lowp+0xac> DB 102,15,110,84,179,24 ; movd 0x18(%ebx,%esi,4),%xmm2 DB 102,15,112,218,69 ; pshufd $0x45,%xmm2,%xmm3 DB 243,15,16,84,179,20 ; movss 0x14(%ebx,%esi,4),%xmm2 @@ -56653,7 +56641,7 @@ _sk_load_8888_dst_sse2_lowp LABEL PROC DB 102,15,114,242,16 ; pslld $0x10,%xmm2 DB 102,15,114,226,16 ; psrad $0x10,%xmm2 DB 102,15,107,242 ; packssdw %xmm2,%xmm6 - DB 102,15,111,151,27,36,0,0 ; movdqa 0x241b(%edi),%xmm2 + DB 102,15,111,151,31,36,0,0 ; movdqa 0x241f(%edi),%xmm2 DB 102,15,111,206 ; movdqa %xmm6,%xmm1 DB 102,15,219,202 ; pand %xmm2,%xmm1 DB 102,15,113,214,8 ; psrlw $0x8,%xmm6 @@ -56745,19 +56733,19 @@ _sk_store_8888_sse2_lowp LABEL PROC DB 128,227,7 ; and $0x7,%bl DB 254,203 ; dec %bl DB 128,251,6 ; cmp $0x6,%bl - DB 232,0,0,0,0 ; call b170 <_sk_store_8888_sse2_lowp+0x74> + DB 232,0,0,0,0 ; call b14c <_sk_store_8888_sse2_lowp+0x74> DB 89 ; pop %ecx DB 139,117,16 ; mov 0x10(%ebp),%esi DB 15,40,109,40 ; movaps 0x28(%ebp),%xmm5 - DB 119,19 ; ja b18d <_sk_store_8888_sse2_lowp+0x91> + DB 119,19 ; ja b169 <_sk_store_8888_sse2_lowp+0x91> DB 15,182,219 ; movzbl %bl,%ebx DB 3,140,153,184,0,0,0 ; add 0xb8(%ecx,%ebx,4),%ecx DB 255,225 ; jmp *%ecx DB 102,15,126,60,183 ; movd %xmm7,(%edi,%esi,4) - DB 235,93 ; jmp b1ea <_sk_store_8888_sse2_lowp+0xee> + DB 235,93 ; jmp b1c6 <_sk_store_8888_sse2_lowp+0xee> DB 243,15,127,60,183 ; movdqu %xmm7,(%edi,%esi,4) DB 243,15,127,116,183,16 ; movdqu %xmm6,0x10(%edi,%esi,4) - DB 235,80 ; jmp b1ea <_sk_store_8888_sse2_lowp+0xee> + DB 235,80 ; jmp b1c6 <_sk_store_8888_sse2_lowp+0xee> DB 102,15,111,244 ; movdqa %xmm4,%xmm6 DB 15,40,227 ; movaps %xmm3,%xmm4 DB 102,15,112,223,78 ; pshufd $0x4e,%xmm7,%xmm3 @@ -56765,7 +56753,7 @@ _sk_store_8888_sse2_lowp LABEL PROC DB 15,40,220 ; movaps %xmm4,%xmm3 DB 102,15,111,230 ; movdqa %xmm6,%xmm4 DB 102,15,214,60,183 ; movq %xmm7,(%edi,%esi,4) - DB 235,48 ; jmp b1ea <_sk_store_8888_sse2_lowp+0xee> + DB 235,48 ; jmp b1c6 <_sk_store_8888_sse2_lowp+0xee> DB 102,15,112,222,78 ; pshufd $0x4e,%xmm6,%xmm3 DB 102,15,126,92,183,24 ; movd %xmm3,0x18(%edi,%esi,4) DB 15,40,93,72 ; movaps 0x48(%ebp),%xmm3 @@ -56802,7 +56790,7 @@ _sk_store_8888_sse2_lowp LABEL PROC DB 0,0 ; add %al,(%eax) DB 42,0 ; sub (%eax),%al DB 0,0 ; add %al,(%eax) - DB 117,0 ; jne b236 <_sk_store_8888_sse2_lowp+0x13a> + DB 117,0 ; jne b212 <_sk_store_8888_sse2_lowp+0x13a> DB 0,0 ; add %al,(%eax) DB 111 ; outsl %ds:(%esi),(%dx) DB 0,0 ; add %al,(%eax) @@ -56832,10 +56820,10 @@ _sk_load_bgra_sse2_lowp LABEL PROC DB 128,225,7 ; and $0x7,%cl DB 254,201 ; dec %cl DB 128,249,6 ; cmp $0x6,%cl - DB 232,0,0,0,0 ; call b274 <_sk_load_bgra_sse2_lowp+0x30> + DB 232,0,0,0,0 ; call b250 <_sk_load_bgra_sse2_lowp+0x30> DB 95 ; pop %edi DB 139,117,16 ; mov 0x10(%ebp),%esi - DB 119,32 ; ja b29a <_sk_load_bgra_sse2_lowp+0x56> + DB 119,32 ; ja b276 <_sk_load_bgra_sse2_lowp+0x56> DB 102,15,239,246 ; pxor %xmm6,%xmm6 DB 15,182,201 ; movzbl %cl,%ecx DB 139,140,143,52,1,0,0 ; mov 0x134(%edi,%ecx,4),%ecx @@ -56844,14 +56832,14 @@ _sk_load_bgra_sse2_lowp LABEL PROC DB 255,225 ; jmp *%ecx DB 243,15,16,28,179 ; movss (%ebx,%esi,4),%xmm3 DB 15,87,246 ; xorps %xmm6,%xmm6 - DB 235,73 ; jmp b2e3 <_sk_load_bgra_sse2_lowp+0x9f> + DB 235,73 ; jmp b2bf <_sk_load_bgra_sse2_lowp+0x9f> DB 102,15,16,28,179 ; movupd (%ebx,%esi,4),%xmm3 DB 15,16,116,179,16 ; movups 0x10(%ebx,%esi,4),%xmm6 - DB 235,61 ; jmp b2e3 <_sk_load_bgra_sse2_lowp+0x9f> + DB 235,61 ; jmp b2bf <_sk_load_bgra_sse2_lowp+0x9f> DB 102,15,110,68,179,8 ; movd 0x8(%ebx,%esi,4),%xmm0 DB 102,15,112,216,69 ; pshufd $0x45,%xmm0,%xmm3 DB 102,15,18,28,179 ; movlpd (%ebx,%esi,4),%xmm3 - DB 235,43 ; jmp b2e3 <_sk_load_bgra_sse2_lowp+0x9f> + DB 235,43 ; jmp b2bf <_sk_load_bgra_sse2_lowp+0x9f> DB 102,15,110,68,179,24 ; movd 0x18(%ebx,%esi,4),%xmm0 DB 102,15,112,240,69 ; pshufd $0x45,%xmm0,%xmm6 DB 243,15,16,68,179,20 ; movss 0x14(%ebx,%esi,4),%xmm0 @@ -56868,7 +56856,7 @@ _sk_load_bgra_sse2_lowp LABEL PROC DB 102,15,114,240,16 ; pslld $0x10,%xmm0 DB 102,15,114,224,16 ; psrad $0x10,%xmm0 DB 102,15,107,200 ; packssdw %xmm0,%xmm1 - DB 102,15,111,175,76,33,0,0 ; movdqa 0x214c(%edi),%xmm5 + DB 102,15,111,175,80,33,0,0 ; movdqa 0x2150(%edi),%xmm5 DB 102,15,111,209 ; movdqa %xmm1,%xmm2 DB 102,15,219,213 ; pand %xmm5,%xmm2 DB 102,15,113,209,8 ; psrlw $0x8,%xmm1 @@ -56946,10 +56934,10 @@ _sk_load_bgra_dst_sse2_lowp LABEL PROC DB 128,225,7 ; and $0x7,%cl DB 254,201 ; dec %cl DB 128,249,6 ; cmp $0x6,%cl - DB 232,0,0,0,0 ; call b401 <_sk_load_bgra_dst_sse2_lowp+0x3d> + DB 232,0,0,0,0 ; call b3dd <_sk_load_bgra_dst_sse2_lowp+0x3d> DB 95 ; pop %edi DB 139,117,16 ; mov 0x10(%ebp),%esi - DB 119,32 ; ja b427 <_sk_load_bgra_dst_sse2_lowp+0x63> + DB 119,32 ; ja b403 <_sk_load_bgra_dst_sse2_lowp+0x63> DB 102,15,239,219 ; pxor %xmm3,%xmm3 DB 15,182,201 ; movzbl %cl,%ecx DB 139,140,143,59,1,0,0 ; mov 0x13b(%edi,%ecx,4),%ecx @@ -56958,14 +56946,14 @@ _sk_load_bgra_dst_sse2_lowp LABEL PROC DB 255,225 ; jmp *%ecx DB 243,15,16,60,179 ; movss (%ebx,%esi,4),%xmm7 DB 15,87,219 ; xorps %xmm3,%xmm3 - DB 235,73 ; jmp b470 <_sk_load_bgra_dst_sse2_lowp+0xac> + DB 235,73 ; jmp b44c <_sk_load_bgra_dst_sse2_lowp+0xac> DB 102,15,16,60,179 ; movupd (%ebx,%esi,4),%xmm7 DB 15,16,92,179,16 ; movups 0x10(%ebx,%esi,4),%xmm3 - DB 235,61 ; jmp b470 <_sk_load_bgra_dst_sse2_lowp+0xac> + DB 235,61 ; jmp b44c <_sk_load_bgra_dst_sse2_lowp+0xac> DB 102,15,110,84,179,8 ; movd 0x8(%ebx,%esi,4),%xmm2 DB 102,15,112,250,69 ; pshufd $0x45,%xmm2,%xmm7 DB 102,15,18,60,179 ; movlpd (%ebx,%esi,4),%xmm7 - DB 235,43 ; jmp b470 <_sk_load_bgra_dst_sse2_lowp+0xac> + DB 235,43 ; jmp b44c <_sk_load_bgra_dst_sse2_lowp+0xac> DB 102,15,110,84,179,24 ; movd 0x18(%ebx,%esi,4),%xmm2 DB 102,15,112,218,69 ; pshufd $0x45,%xmm2,%xmm3 DB 243,15,16,84,179,20 ; movss 0x14(%ebx,%esi,4),%xmm2 @@ -56982,7 +56970,7 @@ _sk_load_bgra_dst_sse2_lowp LABEL PROC DB 102,15,114,242,16 ; pslld $0x10,%xmm2 DB 102,15,114,226,16 ; psrad $0x10,%xmm2 DB 102,15,107,242 ; packssdw %xmm2,%xmm6 - DB 102,15,111,151,191,31,0,0 ; movdqa 0x1fbf(%edi),%xmm2 + DB 102,15,111,151,195,31,0,0 ; movdqa 0x1fc3(%edi),%xmm2 DB 102,15,111,206 ; movdqa %xmm6,%xmm1 DB 102,15,219,202 ; pand %xmm2,%xmm1 DB 102,15,113,214,8 ; psrlw $0x8,%xmm6 @@ -57074,19 +57062,19 @@ _sk_store_bgra_sse2_lowp LABEL PROC DB 128,227,7 ; and $0x7,%bl DB 254,203 ; dec %bl DB 128,251,6 ; cmp $0x6,%bl - DB 232,0,0,0,0 ; call b5cc <_sk_store_bgra_sse2_lowp+0x74> + DB 232,0,0,0,0 ; call b5a8 <_sk_store_bgra_sse2_lowp+0x74> DB 89 ; pop %ecx DB 139,117,16 ; mov 0x10(%ebp),%esi DB 15,40,109,40 ; movaps 0x28(%ebp),%xmm5 - DB 119,19 ; ja b5e9 <_sk_store_bgra_sse2_lowp+0x91> + DB 119,19 ; ja b5c5 <_sk_store_bgra_sse2_lowp+0x91> DB 15,182,219 ; movzbl %bl,%ebx DB 3,140,153,184,0,0,0 ; add 0xb8(%ecx,%ebx,4),%ecx DB 255,225 ; jmp *%ecx DB 102,15,126,60,183 ; movd %xmm7,(%edi,%esi,4) - DB 235,93 ; jmp b646 <_sk_store_bgra_sse2_lowp+0xee> + DB 235,93 ; jmp b622 <_sk_store_bgra_sse2_lowp+0xee> DB 243,15,127,60,183 ; movdqu %xmm7,(%edi,%esi,4) DB 243,15,127,116,183,16 ; movdqu %xmm6,0x10(%edi,%esi,4) - DB 235,80 ; jmp b646 <_sk_store_bgra_sse2_lowp+0xee> + DB 235,80 ; jmp b622 <_sk_store_bgra_sse2_lowp+0xee> DB 102,15,111,244 ; movdqa %xmm4,%xmm6 DB 15,40,227 ; movaps %xmm3,%xmm4 DB 102,15,112,223,78 ; pshufd $0x4e,%xmm7,%xmm3 @@ -57094,7 +57082,7 @@ _sk_store_bgra_sse2_lowp LABEL PROC DB 15,40,220 ; movaps %xmm4,%xmm3 DB 102,15,111,230 ; movdqa %xmm6,%xmm4 DB 102,15,214,60,183 ; movq %xmm7,(%edi,%esi,4) - DB 235,48 ; jmp b646 <_sk_store_bgra_sse2_lowp+0xee> + DB 235,48 ; jmp b622 <_sk_store_bgra_sse2_lowp+0xee> DB 102,15,112,222,78 ; pshufd $0x4e,%xmm6,%xmm3 DB 102,15,126,92,183,24 ; movd %xmm3,0x18(%edi,%esi,4) DB 15,40,93,72 ; movaps 0x48(%ebp),%xmm3 @@ -57131,7 +57119,7 @@ _sk_store_bgra_sse2_lowp LABEL PROC DB 0,0 ; add %al,(%eax) DB 42,0 ; sub (%eax),%al DB 0,0 ; add %al,(%eax) - DB 117,0 ; jne b692 <_sk_store_bgra_sse2_lowp+0x13a> + DB 117,0 ; jne b66e <_sk_store_bgra_sse2_lowp+0x13a> DB 0,0 ; add %al,(%eax) DB 111 ; outsl %ds:(%esi),(%dx) DB 0,0 ; add %al,(%eax) @@ -57164,10 +57152,10 @@ _sk_load_565_sse2_lowp LABEL PROC DB 128,225,7 ; and $0x7,%cl DB 254,201 ; dec %cl DB 128,249,6 ; cmp $0x6,%cl - DB 232,0,0,0,0 ; call b6db <_sk_load_565_sse2_lowp+0x3b> + DB 232,0,0,0,0 ; call b6b7 <_sk_load_565_sse2_lowp+0x3b> DB 94 ; pop %esi DB 139,125,16 ; mov 0x10(%ebp),%edi - DB 119,28 ; ja b6fd <_sk_load_565_sse2_lowp+0x5d> + DB 119,28 ; ja b6d9 <_sk_load_565_sse2_lowp+0x5d> DB 102,15,239,192 ; pxor %xmm0,%xmm0 DB 15,182,201 ; movzbl %cl,%ecx DB 139,140,142,245,0,0,0 ; mov 0xf5(%esi,%ecx,4),%ecx @@ -57175,14 +57163,14 @@ _sk_load_565_sse2_lowp LABEL PROC DB 255,225 ; jmp *%ecx DB 15,183,12,123 ; movzwl (%ebx,%edi,2),%ecx DB 102,15,110,193 ; movd %ecx,%xmm0 - DB 235,59 ; jmp b738 <_sk_load_565_sse2_lowp+0x98> + DB 235,59 ; jmp b714 <_sk_load_565_sse2_lowp+0x98> DB 243,15,111,4,123 ; movdqu (%ebx,%edi,2),%xmm0 - DB 235,52 ; jmp b738 <_sk_load_565_sse2_lowp+0x98> + DB 235,52 ; jmp b714 <_sk_load_565_sse2_lowp+0x98> DB 102,15,239,192 ; pxor %xmm0,%xmm0 DB 102,15,196,68,123,4,2 ; pinsrw $0x2,0x4(%ebx,%edi,2),%xmm0 DB 243,15,16,12,123 ; movss (%ebx,%edi,2),%xmm1 DB 243,15,16,193 ; movss %xmm1,%xmm0 - DB 235,30 ; jmp b738 <_sk_load_565_sse2_lowp+0x98> + DB 235,30 ; jmp b714 <_sk_load_565_sse2_lowp+0x98> DB 102,15,239,192 ; pxor %xmm0,%xmm0 DB 102,15,196,68,123,12,6 ; pinsrw $0x6,0xc(%ebx,%edi,2),%xmm0 DB 102,15,196,68,123,10,5 ; pinsrw $0x5,0xa(%ebx,%edi,2),%xmm0 @@ -57190,11 +57178,11 @@ _sk_load_565_sse2_lowp LABEL PROC DB 102,15,18,4,123 ; movlpd (%ebx,%edi,2),%xmm0 DB 102,15,111,248 ; movdqa %xmm0,%xmm7 DB 102,15,113,215,8 ; psrlw $0x8,%xmm7 - DB 102,15,219,190,37,29,0,0 ; pand 0x1d25(%esi),%xmm7 + DB 102,15,219,190,41,29,0,0 ; pand 0x1d29(%esi),%xmm7 DB 102,15,111,200 ; movdqa %xmm0,%xmm1 DB 102,15,113,209,5 ; psrlw $0x5,%xmm1 - DB 102,15,219,142,53,29,0,0 ; pand 0x1d35(%esi),%xmm1 - DB 102,15,111,150,69,29,0,0 ; movdqa 0x1d45(%esi),%xmm2 + DB 102,15,219,142,57,29,0,0 ; pand 0x1d39(%esi),%xmm1 + DB 102,15,111,150,73,29,0,0 ; movdqa 0x1d49(%esi),%xmm2 DB 102,15,219,208 ; pand %xmm0,%xmm2 DB 102,15,113,208,13 ; psrlw $0xd,%xmm0 DB 102,15,235,199 ; por %xmm7,%xmm0 @@ -57216,7 +57204,7 @@ _sk_load_565_sse2_lowp LABEL PROC DB 137,124,36,8 ; mov %edi,0x8(%esp) DB 137,76,36,4 ; mov %ecx,0x4(%esp) DB 137,20,36 ; mov %edx,(%esp) - DB 15,40,158,229,28,0,0 ; movaps 0x1ce5(%esi),%xmm3 + DB 15,40,158,233,28,0,0 ; movaps 0x1ce9(%esi),%xmm3 DB 255,80,4 ; call *0x4(%eax) DB 131,196,92 ; add $0x5c,%esp DB 94 ; pop %esi @@ -57260,10 +57248,10 @@ _sk_load_565_dst_sse2_lowp LABEL PROC DB 128,225,7 ; and $0x7,%cl DB 254,201 ; dec %cl DB 128,249,6 ; cmp $0x6,%cl - DB 232,0,0,0,0 ; call b817 <_sk_load_565_dst_sse2_lowp+0x2b> + DB 232,0,0,0,0 ; call b7f3 <_sk_load_565_dst_sse2_lowp+0x2b> DB 95 ; pop %edi DB 139,117,16 ; mov 0x10(%ebp),%esi - DB 119,28 ; ja b839 <_sk_load_565_dst_sse2_lowp+0x4d> + DB 119,28 ; ja b815 <_sk_load_565_dst_sse2_lowp+0x4d> DB 102,15,239,228 ; pxor %xmm4,%xmm4 DB 15,182,201 ; movzbl %cl,%ecx DB 139,140,143,249,0,0,0 ; mov 0xf9(%edi,%ecx,4),%ecx @@ -57271,14 +57259,14 @@ _sk_load_565_dst_sse2_lowp LABEL PROC DB 255,225 ; jmp *%ecx DB 15,183,12,115 ; movzwl (%ebx,%esi,2),%ecx DB 102,15,110,225 ; movd %ecx,%xmm4 - DB 235,59 ; jmp b874 <_sk_load_565_dst_sse2_lowp+0x88> + DB 235,59 ; jmp b850 <_sk_load_565_dst_sse2_lowp+0x88> DB 243,15,111,36,115 ; movdqu (%ebx,%esi,2),%xmm4 - DB 235,52 ; jmp b874 <_sk_load_565_dst_sse2_lowp+0x88> + DB 235,52 ; jmp b850 <_sk_load_565_dst_sse2_lowp+0x88> DB 102,15,239,228 ; pxor %xmm4,%xmm4 DB 102,15,196,100,115,4,2 ; pinsrw $0x2,0x4(%ebx,%esi,2),%xmm4 DB 243,15,16,44,115 ; movss (%ebx,%esi,2),%xmm5 DB 243,15,16,229 ; movss %xmm5,%xmm4 - DB 235,30 ; jmp b874 <_sk_load_565_dst_sse2_lowp+0x88> + DB 235,30 ; jmp b850 <_sk_load_565_dst_sse2_lowp+0x88> DB 102,15,239,228 ; pxor %xmm4,%xmm4 DB 102,15,196,100,115,12,6 ; pinsrw $0x6,0xc(%ebx,%esi,2),%xmm4 DB 102,15,196,100,115,10,5 ; pinsrw $0x5,0xa(%ebx,%esi,2),%xmm4 @@ -57286,11 +57274,11 @@ _sk_load_565_dst_sse2_lowp LABEL PROC DB 102,15,18,36,115 ; movlpd (%ebx,%esi,2),%xmm4 DB 102,15,111,244 ; movdqa %xmm4,%xmm6 DB 102,15,113,214,8 ; psrlw $0x8,%xmm6 - DB 102,15,219,183,233,27,0,0 ; pand 0x1be9(%edi),%xmm6 + DB 102,15,219,183,237,27,0,0 ; pand 0x1bed(%edi),%xmm6 DB 102,15,111,236 ; movdqa %xmm4,%xmm5 DB 102,15,113,213,5 ; psrlw $0x5,%xmm5 - DB 102,15,219,175,249,27,0,0 ; pand 0x1bf9(%edi),%xmm5 - DB 102,15,111,191,9,28,0,0 ; movdqa 0x1c09(%edi),%xmm7 + DB 102,15,219,175,253,27,0,0 ; pand 0x1bfd(%edi),%xmm5 + DB 102,15,111,191,13,28,0,0 ; movdqa 0x1c0d(%edi),%xmm7 DB 102,15,219,252 ; pand %xmm4,%xmm7 DB 102,15,113,212,13 ; psrlw $0xd,%xmm4 DB 102,15,235,230 ; por %xmm6,%xmm4 @@ -57303,7 +57291,7 @@ _sk_load_565_dst_sse2_lowp LABEL PROC DB 102,15,113,215,2 ; psrlw $0x2,%xmm7 DB 102,15,235,254 ; por %xmm6,%xmm7 DB 141,72,8 ; lea 0x8(%eax),%ecx - DB 15,40,183,169,27,0,0 ; movaps 0x1ba9(%edi),%xmm6 + DB 15,40,183,173,27,0,0 ; movaps 0x1bad(%edi),%xmm6 DB 15,41,116,36,64 ; movaps %xmm6,0x40(%esp) DB 139,125,20 ; mov 0x14(%ebp),%edi DB 137,124,36,12 ; mov %edi,0xc(%esp) @@ -57346,15 +57334,15 @@ _sk_store_565_sse2_lowp LABEL PROC DB 86 ; push %esi DB 131,236,92 ; sub $0x5c,%esp DB 102,15,111,226 ; movdqa %xmm2,%xmm4 - DB 232,0,0,0,0 ; call b93e <_sk_store_565_sse2_lowp+0x12> + DB 232,0,0,0,0 ; call b91a <_sk_store_565_sse2_lowp+0x12> DB 95 ; pop %edi DB 15,40,109,72 ; movaps 0x48(%ebp),%xmm5 DB 102,15,111,208 ; movdqa %xmm0,%xmm2 DB 102,15,113,242,8 ; psllw $0x8,%xmm2 - DB 102,15,219,151,242,26,0,0 ; pand 0x1af2(%edi),%xmm2 + DB 102,15,219,151,246,26,0,0 ; pand 0x1af6(%edi),%xmm2 DB 102,15,111,241 ; movdqa %xmm1,%xmm6 DB 102,15,113,246,3 ; psllw $0x3,%xmm6 - DB 102,15,219,183,2,27,0,0 ; pand 0x1b02(%edi),%xmm6 + DB 102,15,219,183,6,27,0,0 ; pand 0x1b06(%edi),%xmm6 DB 102,15,235,242 ; por %xmm2,%xmm6 DB 102,15,111,212 ; movdqa %xmm4,%xmm2 DB 102,15,113,210,3 ; psrlw $0x3,%xmm2 @@ -57373,19 +57361,19 @@ _sk_store_565_sse2_lowp LABEL PROC DB 128,249,6 ; cmp $0x6,%cl DB 139,117,16 ; mov 0x10(%ebp),%esi DB 15,40,125,24 ; movaps 0x18(%ebp),%xmm7 - DB 119,22 ; ja b9b6 <_sk_store_565_sse2_lowp+0x8a> + DB 119,22 ; ja b992 <_sk_store_565_sse2_lowp+0x8a> DB 15,182,201 ; movzbl %cl,%ecx DB 3,188,143,242,0,0,0 ; add 0xf2(%edi,%ecx,4),%edi DB 255,231 ; jmp *%edi DB 102,15,126,209 ; movd %xmm2,%ecx DB 102,137,12,115 ; mov %cx,(%ebx,%esi,2) - DB 235,59 ; jmp b9f1 <_sk_store_565_sse2_lowp+0xc5> + DB 235,59 ; jmp b9cd <_sk_store_565_sse2_lowp+0xc5> DB 243,15,127,20,115 ; movdqu %xmm2,(%ebx,%esi,2) - DB 235,52 ; jmp b9f1 <_sk_store_565_sse2_lowp+0xc5> + DB 235,52 ; jmp b9cd <_sk_store_565_sse2_lowp+0xc5> DB 102,15,197,202,2 ; pextrw $0x2,%xmm2,%ecx DB 102,137,76,115,4 ; mov %cx,0x4(%ebx,%esi,2) DB 102,15,126,20,115 ; movd %xmm2,(%ebx,%esi,2) - DB 235,35 ; jmp b9f1 <_sk_store_565_sse2_lowp+0xc5> + DB 235,35 ; jmp b9cd <_sk_store_565_sse2_lowp+0xc5> DB 102,15,197,202,6 ; pextrw $0x6,%xmm2,%ecx DB 102,137,76,115,12 ; mov %cx,0xc(%ebx,%esi,2) DB 102,15,197,202,5 ; pextrw $0x5,%xmm2,%ecx @@ -57445,10 +57433,10 @@ _sk_load_a8_sse2_lowp LABEL PROC DB 128,225,7 ; and $0x7,%cl DB 254,201 ; dec %cl DB 128,249,6 ; cmp $0x6,%cl - DB 232,0,0,0,0 ; call ba86 <_sk_load_a8_sse2_lowp+0x3a> + DB 232,0,0,0,0 ; call ba62 <_sk_load_a8_sse2_lowp+0x3a> DB 95 ; pop %edi DB 139,117,16 ; mov 0x10(%ebp),%esi - DB 119,28 ; ja baa8 <_sk_load_a8_sse2_lowp+0x5c> + DB 119,28 ; ja ba84 <_sk_load_a8_sse2_lowp+0x5c> DB 102,15,239,219 ; pxor %xmm3,%xmm3 DB 15,182,201 ; movzbl %cl,%ecx DB 139,140,143,198,0,0,0 ; mov 0xc6(%edi,%ecx,4),%ecx @@ -57456,10 +57444,10 @@ _sk_load_a8_sse2_lowp LABEL PROC DB 255,225 ; jmp *%ecx DB 15,182,12,51 ; movzbl (%ebx,%esi,1),%ecx DB 102,15,110,217 ; movd %ecx,%xmm3 - DB 235,90 ; jmp bb02 <_sk_load_a8_sse2_lowp+0xb6> + DB 235,90 ; jmp bade <_sk_load_a8_sse2_lowp+0xb6> DB 243,15,126,28,51 ; movq (%ebx,%esi,1),%xmm3 DB 102,15,96,216 ; punpcklbw %xmm0,%xmm3 - DB 235,79 ; jmp bb02 <_sk_load_a8_sse2_lowp+0xb6> + DB 235,79 ; jmp bade <_sk_load_a8_sse2_lowp+0xb6> DB 15,182,76,51,2 ; movzbl 0x2(%ebx,%esi,1),%ecx DB 102,15,239,219 ; pxor %xmm3,%xmm3 DB 102,15,196,217,2 ; pinsrw $0x2,%ecx,%xmm3 @@ -57467,7 +57455,7 @@ _sk_load_a8_sse2_lowp LABEL PROC DB 102,15,110,233 ; movd %ecx,%xmm5 DB 102,15,96,232 ; punpcklbw %xmm0,%xmm5 DB 243,15,16,221 ; movss %xmm5,%xmm3 - DB 235,47 ; jmp bb02 <_sk_load_a8_sse2_lowp+0xb6> + DB 235,47 ; jmp bade <_sk_load_a8_sse2_lowp+0xb6> DB 15,182,76,51,6 ; movzbl 0x6(%ebx,%esi,1),%ecx DB 102,15,239,219 ; pxor %xmm3,%xmm3 DB 102,15,196,217,6 ; pinsrw $0x6,%ecx,%xmm3 @@ -57478,7 +57466,7 @@ _sk_load_a8_sse2_lowp LABEL PROC DB 102,15,110,44,51 ; movd (%ebx,%esi,1),%xmm5 DB 102,15,96,232 ; punpcklbw %xmm0,%xmm5 DB 242,15,16,221 ; movsd %xmm5,%xmm3 - DB 102,15,219,159,58,25,0,0 ; pand 0x193a(%edi),%xmm3 + DB 102,15,219,159,62,25,0,0 ; pand 0x193e(%edi),%xmm3 DB 141,72,8 ; lea 0x8(%eax),%ecx DB 15,41,100,36,64 ; movaps %xmm4,0x40(%esp) DB 15,41,84,36,48 ; movaps %xmm2,0x30(%esp) @@ -57531,10 +57519,10 @@ _sk_load_a8_dst_sse2_lowp LABEL PROC DB 128,225,7 ; and $0x7,%cl DB 254,201 ; dec %cl DB 128,249,6 ; cmp $0x6,%cl - DB 232,0,0,0,0 ; call bb91 <_sk_load_a8_dst_sse2_lowp+0x29> + DB 232,0,0,0,0 ; call bb6d <_sk_load_a8_dst_sse2_lowp+0x29> DB 95 ; pop %edi DB 139,117,16 ; mov 0x10(%ebp),%esi - DB 119,28 ; ja bbb3 <_sk_load_a8_dst_sse2_lowp+0x4b> + DB 119,28 ; ja bb8f <_sk_load_a8_dst_sse2_lowp+0x4b> DB 102,15,239,228 ; pxor %xmm4,%xmm4 DB 15,182,201 ; movzbl %cl,%ecx DB 139,140,143,195,0,0,0 ; mov 0xc3(%edi,%ecx,4),%ecx @@ -57542,10 +57530,10 @@ _sk_load_a8_dst_sse2_lowp LABEL PROC DB 255,225 ; jmp *%ecx DB 15,182,12,51 ; movzbl (%ebx,%esi,1),%ecx DB 102,15,110,225 ; movd %ecx,%xmm4 - DB 235,90 ; jmp bc0d <_sk_load_a8_dst_sse2_lowp+0xa5> + DB 235,90 ; jmp bbe9 <_sk_load_a8_dst_sse2_lowp+0xa5> DB 243,15,126,36,51 ; movq (%ebx,%esi,1),%xmm4 DB 102,15,96,224 ; punpcklbw %xmm0,%xmm4 - DB 235,79 ; jmp bc0d <_sk_load_a8_dst_sse2_lowp+0xa5> + DB 235,79 ; jmp bbe9 <_sk_load_a8_dst_sse2_lowp+0xa5> DB 15,182,76,51,2 ; movzbl 0x2(%ebx,%esi,1),%ecx DB 102,15,239,228 ; pxor %xmm4,%xmm4 DB 102,15,196,225,2 ; pinsrw $0x2,%ecx,%xmm4 @@ -57553,7 +57541,7 @@ _sk_load_a8_dst_sse2_lowp LABEL PROC DB 102,15,110,233 ; movd %ecx,%xmm5 DB 102,15,96,232 ; punpcklbw %xmm0,%xmm5 DB 243,15,16,229 ; movss %xmm5,%xmm4 - DB 235,47 ; jmp bc0d <_sk_load_a8_dst_sse2_lowp+0xa5> + DB 235,47 ; jmp bbe9 <_sk_load_a8_dst_sse2_lowp+0xa5> DB 15,182,76,51,6 ; movzbl 0x6(%ebx,%esi,1),%ecx DB 102,15,239,228 ; pxor %xmm4,%xmm4 DB 102,15,196,225,6 ; pinsrw $0x6,%ecx,%xmm4 @@ -57564,7 +57552,7 @@ _sk_load_a8_dst_sse2_lowp LABEL PROC DB 102,15,110,44,51 ; movd (%ebx,%esi,1),%xmm5 DB 102,15,96,232 ; punpcklbw %xmm0,%xmm5 DB 242,15,16,229 ; movsd %xmm5,%xmm4 - DB 102,15,219,167,47,24,0,0 ; pand 0x182f(%edi),%xmm4 + DB 102,15,219,167,51,24,0,0 ; pand 0x1833(%edi),%xmm4 DB 141,72,8 ; lea 0x8(%eax),%ecx DB 102,15,127,100,36,64 ; movdqa %xmm4,0x40(%esp) DB 102,15,239,228 ; pxor %xmm4,%xmm4 @@ -57619,32 +57607,32 @@ _sk_store_a8_sse2_lowp LABEL PROC DB 128,225,7 ; and $0x7,%cl DB 254,201 ; dec %cl DB 128,249,6 ; cmp $0x6,%cl - DB 232,0,0,0,0 ; call bca9 <_sk_store_a8_sse2_lowp+0x39> + DB 232,0,0,0,0 ; call bc85 <_sk_store_a8_sse2_lowp+0x39> DB 91 ; pop %ebx DB 139,117,16 ; mov 0x10(%ebp),%esi - DB 119,26 ; ja bcc9 <_sk_store_a8_sse2_lowp+0x59> + DB 119,26 ; ja bca5 <_sk_store_a8_sse2_lowp+0x59> DB 15,182,201 ; movzbl %cl,%ecx DB 139,140,139,223,0,0,0 ; mov 0xdf(%ebx,%ecx,4),%ecx DB 1,217 ; add %ebx,%ecx DB 255,225 ; jmp *%ecx DB 102,15,126,217 ; movd %xmm3,%ecx DB 136,12,55 ; mov %cl,(%edi,%esi,1) - DB 233,136,0,0,0 ; jmp bd51 <_sk_store_a8_sse2_lowp+0xe1> - DB 102,15,111,163,23,23,0,0 ; movdqa 0x1717(%ebx),%xmm4 + DB 233,136,0,0,0 ; jmp bd2d <_sk_store_a8_sse2_lowp+0xe1> + DB 102,15,111,163,27,23,0,0 ; movdqa 0x171b(%ebx),%xmm4 DB 102,15,219,227 ; pand %xmm3,%xmm4 DB 102,15,103,228 ; packuswb %xmm4,%xmm4 DB 102,15,214,36,55 ; movq %xmm4,(%edi,%esi,1) DB 15,40,101,24 ; movaps 0x18(%ebp),%xmm4 - DB 235,109 ; jmp bd51 <_sk_store_a8_sse2_lowp+0xe1> + DB 235,109 ; jmp bd2d <_sk_store_a8_sse2_lowp+0xe1> DB 102,15,197,203,2 ; pextrw $0x2,%xmm3,%ecx DB 136,76,55,2 ; mov %cl,0x2(%edi,%esi,1) - DB 102,15,111,163,23,23,0,0 ; movdqa 0x1717(%ebx),%xmm4 + DB 102,15,111,163,27,23,0,0 ; movdqa 0x171b(%ebx),%xmm4 DB 102,15,219,227 ; pand %xmm3,%xmm4 DB 102,15,103,228 ; packuswb %xmm4,%xmm4 DB 102,15,126,225 ; movd %xmm4,%ecx DB 15,40,101,24 ; movaps 0x18(%ebp),%xmm4 DB 102,137,12,55 ; mov %cx,(%edi,%esi,1) - DB 235,70 ; jmp bd51 <_sk_store_a8_sse2_lowp+0xe1> + DB 235,70 ; jmp bd2d <_sk_store_a8_sse2_lowp+0xe1> DB 102,15,197,203,6 ; pextrw $0x6,%xmm3,%ecx DB 136,76,55,6 ; mov %cl,0x6(%edi,%esi,1) DB 102,15,197,203,5 ; pextrw $0x5,%xmm3,%ecx @@ -57654,7 +57642,7 @@ _sk_store_a8_sse2_lowp LABEL PROC DB 15,40,254 ; movaps %xmm6,%xmm7 DB 15,40,245 ; movaps %xmm5,%xmm6 DB 15,40,236 ; movaps %xmm4,%xmm5 - DB 102,15,111,163,23,23,0,0 ; movdqa 0x1717(%ebx),%xmm4 + DB 102,15,111,163,27,23,0,0 ; movdqa 0x171b(%ebx),%xmm4 DB 102,15,219,227 ; pand %xmm3,%xmm4 DB 102,15,103,228 ; packuswb %xmm4,%xmm4 DB 102,15,126,36,55 ; movd %xmm4,(%edi,%esi,1) @@ -57688,7 +57676,7 @@ _sk_store_a8_sse2_lowp LABEL PROC DB 0,0 ; add %al,(%eax) DB 0,125,0 ; add %bh,0x0(%ebp) DB 0,0 ; add %al,(%eax) - DB 116,0 ; je bd9a <_sk_store_a8_sse2_lowp+0x12a> + DB 116,0 ; je bd76 <_sk_store_a8_sse2_lowp+0x12a> DB 0,0 ; add %al,(%eax) DB 107,0,0 ; imul $0x0,(%eax),%eax DB 0,98,0 ; add %ah,0x0(%edx) @@ -57716,10 +57704,10 @@ _sk_load_g8_sse2_lowp LABEL PROC DB 128,225,7 ; and $0x7,%cl DB 254,201 ; dec %cl DB 128,249,6 ; cmp $0x6,%cl - DB 232,0,0,0,0 ; call bddd <_sk_load_g8_sse2_lowp+0x39> + DB 232,0,0,0,0 ; call bdb9 <_sk_load_g8_sse2_lowp+0x39> DB 94 ; pop %esi DB 139,125,16 ; mov 0x10(%ebp),%edi - DB 119,28 ; ja bdff <_sk_load_g8_sse2_lowp+0x5b> + DB 119,28 ; ja bddb <_sk_load_g8_sse2_lowp+0x5b> DB 102,15,239,192 ; pxor %xmm0,%xmm0 DB 15,182,201 ; movzbl %cl,%ecx DB 139,140,142,199,0,0,0 ; mov 0xc7(%esi,%ecx,4),%ecx @@ -57727,10 +57715,10 @@ _sk_load_g8_sse2_lowp LABEL PROC DB 255,225 ; jmp *%ecx DB 15,182,12,59 ; movzbl (%ebx,%edi,1),%ecx DB 102,15,110,193 ; movd %ecx,%xmm0 - DB 235,90 ; jmp be59 <_sk_load_g8_sse2_lowp+0xb5> + DB 235,90 ; jmp be35 <_sk_load_g8_sse2_lowp+0xb5> DB 243,15,126,4,59 ; movq (%ebx,%edi,1),%xmm0 DB 102,15,96,192 ; punpcklbw %xmm0,%xmm0 - DB 235,79 ; jmp be59 <_sk_load_g8_sse2_lowp+0xb5> + DB 235,79 ; jmp be35 <_sk_load_g8_sse2_lowp+0xb5> DB 15,182,76,59,2 ; movzbl 0x2(%ebx,%edi,1),%ecx DB 102,15,239,192 ; pxor %xmm0,%xmm0 DB 102,15,196,193,2 ; pinsrw $0x2,%ecx,%xmm0 @@ -57738,7 +57726,7 @@ _sk_load_g8_sse2_lowp LABEL PROC DB 102,15,110,233 ; movd %ecx,%xmm5 DB 102,15,96,232 ; punpcklbw %xmm0,%xmm5 DB 243,15,16,197 ; movss %xmm5,%xmm0 - DB 235,47 ; jmp be59 <_sk_load_g8_sse2_lowp+0xb5> + DB 235,47 ; jmp be35 <_sk_load_g8_sse2_lowp+0xb5> DB 15,182,76,59,6 ; movzbl 0x6(%ebx,%edi,1),%ecx DB 102,15,239,192 ; pxor %xmm0,%xmm0 DB 102,15,196,193,6 ; pinsrw $0x6,%ecx,%xmm0 @@ -57749,7 +57737,7 @@ _sk_load_g8_sse2_lowp LABEL PROC DB 102,15,110,44,59 ; movd (%ebx,%edi,1),%xmm5 DB 102,15,96,232 ; punpcklbw %xmm0,%xmm5 DB 242,15,16,197 ; movsd %xmm5,%xmm0 - DB 102,15,219,134,227,21,0,0 ; pand 0x15e3(%esi),%xmm0 + DB 102,15,219,134,231,21,0,0 ; pand 0x15e7(%esi),%xmm0 DB 141,72,8 ; lea 0x8(%eax),%ecx DB 15,41,100,36,64 ; movaps %xmm4,0x40(%esp) DB 15,41,92,36,48 ; movaps %xmm3,0x30(%esp) @@ -57760,7 +57748,7 @@ _sk_load_g8_sse2_lowp LABEL PROC DB 137,124,36,8 ; mov %edi,0x8(%esp) DB 137,76,36,4 ; mov %ecx,0x4(%esp) DB 137,20,36 ; mov %edx,(%esp) - DB 15,40,158,227,21,0,0 ; movaps 0x15e3(%esi),%xmm3 + DB 15,40,158,231,21,0,0 ; movaps 0x15e7(%esi),%xmm3 DB 102,15,111,200 ; movdqa %xmm0,%xmm1 DB 102,15,111,208 ; movdqa %xmm0,%xmm2 DB 255,80,4 ; call *0x4(%eax) @@ -57801,10 +57789,10 @@ _sk_load_g8_dst_sse2_lowp LABEL PROC DB 128,225,7 ; and $0x7,%cl DB 254,201 ; dec %cl DB 128,249,6 ; cmp $0x6,%cl - DB 232,0,0,0,0 ; call bee9 <_sk_load_g8_dst_sse2_lowp+0x29> + DB 232,0,0,0,0 ; call bec5 <_sk_load_g8_dst_sse2_lowp+0x29> DB 95 ; pop %edi DB 139,117,16 ; mov 0x10(%ebp),%esi - DB 119,28 ; ja bf0b <_sk_load_g8_dst_sse2_lowp+0x4b> + DB 119,28 ; ja bee7 <_sk_load_g8_dst_sse2_lowp+0x4b> DB 102,15,239,228 ; pxor %xmm4,%xmm4 DB 15,182,201 ; movzbl %cl,%ecx DB 139,140,143,195,0,0,0 ; mov 0xc3(%edi,%ecx,4),%ecx @@ -57812,10 +57800,10 @@ _sk_load_g8_dst_sse2_lowp LABEL PROC DB 255,225 ; jmp *%ecx DB 15,182,12,51 ; movzbl (%ebx,%esi,1),%ecx DB 102,15,110,225 ; movd %ecx,%xmm4 - DB 235,90 ; jmp bf65 <_sk_load_g8_dst_sse2_lowp+0xa5> + DB 235,90 ; jmp bf41 <_sk_load_g8_dst_sse2_lowp+0xa5> DB 243,15,126,36,51 ; movq (%ebx,%esi,1),%xmm4 DB 102,15,96,224 ; punpcklbw %xmm0,%xmm4 - DB 235,79 ; jmp bf65 <_sk_load_g8_dst_sse2_lowp+0xa5> + DB 235,79 ; jmp bf41 <_sk_load_g8_dst_sse2_lowp+0xa5> DB 15,182,76,51,2 ; movzbl 0x2(%ebx,%esi,1),%ecx DB 102,15,239,228 ; pxor %xmm4,%xmm4 DB 102,15,196,225,2 ; pinsrw $0x2,%ecx,%xmm4 @@ -57823,7 +57811,7 @@ _sk_load_g8_dst_sse2_lowp LABEL PROC DB 102,15,110,233 ; movd %ecx,%xmm5 DB 102,15,96,232 ; punpcklbw %xmm0,%xmm5 DB 243,15,16,229 ; movss %xmm5,%xmm4 - DB 235,47 ; jmp bf65 <_sk_load_g8_dst_sse2_lowp+0xa5> + DB 235,47 ; jmp bf41 <_sk_load_g8_dst_sse2_lowp+0xa5> DB 15,182,76,51,6 ; movzbl 0x6(%ebx,%esi,1),%ecx DB 102,15,239,228 ; pxor %xmm4,%xmm4 DB 102,15,196,225,6 ; pinsrw $0x6,%ecx,%xmm4 @@ -57834,9 +57822,9 @@ _sk_load_g8_dst_sse2_lowp LABEL PROC DB 102,15,110,44,51 ; movd (%ebx,%esi,1),%xmm5 DB 102,15,96,232 ; punpcklbw %xmm0,%xmm5 DB 242,15,16,229 ; movsd %xmm5,%xmm4 - DB 102,15,219,167,215,20,0,0 ; pand 0x14d7(%edi),%xmm4 + DB 102,15,219,167,219,20,0,0 ; pand 0x14db(%edi),%xmm4 DB 141,72,8 ; lea 0x8(%eax),%ecx - DB 15,40,175,215,20,0,0 ; movaps 0x14d7(%edi),%xmm5 + DB 15,40,175,219,20,0,0 ; movaps 0x14db(%edi),%xmm5 DB 15,41,108,36,64 ; movaps %xmm5,0x40(%esp) DB 102,15,127,100,36,48 ; movdqa %xmm4,0x30(%esp) DB 102,15,127,100,36,32 ; movdqa %xmm4,0x20(%esp) @@ -57875,7 +57863,7 @@ _sk_luminance_to_alpha_sse2_lowp LABEL PROC DB 86 ; push %esi DB 131,236,80 ; sub $0x50,%esp DB 102,15,111,218 ; movdqa %xmm2,%xmm3 - DB 232,0,0,0,0 ; call bfd9 <_sk_luminance_to_alpha_sse2_lowp+0x11> + DB 232,0,0,0,0 ; call bfb5 <_sk_luminance_to_alpha_sse2_lowp+0x11> DB 88 ; pop %eax DB 139,77,8 ; mov 0x8(%ebp),%ecx DB 139,85,16 ; mov 0x10(%ebp),%edx @@ -57885,10 +57873,10 @@ _sk_luminance_to_alpha_sse2_lowp LABEL PROC DB 15,40,109,56 ; movaps 0x38(%ebp),%xmm5 DB 15,40,117,72 ; movaps 0x48(%ebp),%xmm6 DB 139,125,12 ; mov 0xc(%ebp),%edi - DB 102,15,213,128,119,20,0,0 ; pmullw 0x1477(%eax),%xmm0 - DB 102,15,213,136,135,20,0,0 ; pmullw 0x1487(%eax),%xmm1 + DB 102,15,213,128,123,20,0,0 ; pmullw 0x147b(%eax),%xmm0 + DB 102,15,213,136,139,20,0,0 ; pmullw 0x148b(%eax),%xmm1 DB 102,15,253,200 ; paddw %xmm0,%xmm1 - DB 102,15,213,152,151,20,0,0 ; pmullw 0x1497(%eax),%xmm3 + DB 102,15,213,152,155,20,0,0 ; pmullw 0x149b(%eax),%xmm3 DB 102,15,253,217 ; paddw %xmm1,%xmm3 DB 102,15,113,211,8 ; psrlw $0x8,%xmm3 DB 141,71,4 ; lea 0x4(%edi),%eax @@ -57917,15 +57905,15 @@ _sk_scale_1_float_sse2_lowp LABEL PROC DB 87 ; push %edi DB 86 ; push %esi DB 131,236,80 ; sub $0x50,%esp - DB 232,0,0,0,0 ; call c062 <_sk_scale_1_float_sse2_lowp+0xd> + DB 232,0,0,0,0 ; call c03e <_sk_scale_1_float_sse2_lowp+0xd> DB 94 ; pop %esi DB 139,69,8 ; mov 0x8(%ebp),%eax DB 139,85,16 ; mov 0x10(%ebp),%edx DB 139,77,12 ; mov 0xc(%ebp),%ecx DB 139,57 ; mov (%ecx),%edi DB 243,15,16,39 ; movss (%edi),%xmm4 - DB 243,15,89,166,34,20,0,0 ; mulss 0x1422(%esi),%xmm4 - DB 243,15,88,166,30,20,0,0 ; addss 0x141e(%esi),%xmm4 + DB 243,15,89,166,38,20,0,0 ; mulss 0x1426(%esi),%xmm4 + DB 243,15,88,166,34,20,0,0 ; addss 0x1422(%esi),%xmm4 DB 243,15,44,252 ; cvttss2si %xmm4,%edi DB 102,15,110,239 ; movd %edi,%xmm5 DB 139,125,20 ; mov 0x14(%ebp),%edi @@ -57938,7 +57926,7 @@ _sk_scale_1_float_sse2_lowp LABEL PROC DB 102,15,213,205 ; pmullw %xmm5,%xmm1 DB 102,15,213,213 ; pmullw %xmm5,%xmm2 DB 102,15,213,221 ; pmullw %xmm5,%xmm3 - DB 102,15,111,174,94,19,0,0 ; movdqa 0x135e(%esi),%xmm5 + DB 102,15,111,174,98,19,0,0 ; movdqa 0x1362(%esi),%xmm5 DB 102,15,253,197 ; paddw %xmm5,%xmm0 DB 102,15,253,205 ; paddw %xmm5,%xmm1 DB 102,15,253,213 ; paddw %xmm5,%xmm2 @@ -57975,19 +57963,19 @@ _sk_lerp_1_float_sse2_lowp LABEL PROC DB 102,15,111,218 ; movdqa %xmm2,%xmm3 DB 102,15,111,209 ; movdqa %xmm1,%xmm2 DB 102,15,111,200 ; movdqa %xmm0,%xmm1 - DB 232,0,0,0,0 ; call c130 <_sk_lerp_1_float_sse2_lowp+0x1d> + DB 232,0,0,0,0 ; call c10c <_sk_lerp_1_float_sse2_lowp+0x1d> DB 89 ; pop %ecx DB 102,15,111,109,24 ; movdqa 0x18(%ebp),%xmm5 DB 139,69,12 ; mov 0xc(%ebp),%eax DB 139,16 ; mov (%eax),%edx DB 243,15,16,50 ; movss (%edx),%xmm6 - DB 243,15,89,177,84,19,0,0 ; mulss 0x1354(%ecx),%xmm6 - DB 243,15,88,177,80,19,0,0 ; addss 0x1350(%ecx),%xmm6 + DB 243,15,89,177,88,19,0,0 ; mulss 0x1358(%ecx),%xmm6 + DB 243,15,88,177,84,19,0,0 ; addss 0x1354(%ecx),%xmm6 DB 243,15,44,214 ; cvttss2si %xmm6,%edx DB 102,15,110,242 ; movd %edx,%xmm6 DB 242,15,112,246,0 ; pshuflw $0x0,%xmm6,%xmm6 DB 102,15,112,246,80 ; pshufd $0x50,%xmm6,%xmm6 - DB 102,15,111,129,144,18,0,0 ; movdqa 0x1290(%ecx),%xmm0 + DB 102,15,111,129,148,18,0,0 ; movdqa 0x1294(%ecx),%xmm0 DB 102,15,213,206 ; pmullw %xmm6,%xmm1 DB 102,15,253,200 ; paddw %xmm0,%xmm1 DB 102,15,213,214 ; pmullw %xmm6,%xmm2 @@ -58058,10 +58046,10 @@ _sk_scale_u8_sse2_lowp LABEL PROC DB 128,225,7 ; and $0x7,%cl DB 254,201 ; dec %cl DB 128,249,6 ; cmp $0x6,%cl - DB 232,0,0,0,0 ; call c259 <_sk_scale_u8_sse2_lowp+0x31> + DB 232,0,0,0,0 ; call c235 <_sk_scale_u8_sse2_lowp+0x31> DB 95 ; pop %edi DB 139,117,16 ; mov 0x10(%ebp),%esi - DB 119,28 ; ja c27b <_sk_scale_u8_sse2_lowp+0x53> + DB 119,28 ; ja c257 <_sk_scale_u8_sse2_lowp+0x53> DB 102,15,239,228 ; pxor %xmm4,%xmm4 DB 15,182,201 ; movzbl %cl,%ecx DB 139,140,143,3,1,0,0 ; mov 0x103(%edi,%ecx,4),%ecx @@ -58069,10 +58057,10 @@ _sk_scale_u8_sse2_lowp LABEL PROC DB 255,225 ; jmp *%ecx DB 15,182,12,51 ; movzbl (%ebx,%esi,1),%ecx DB 102,15,110,225 ; movd %ecx,%xmm4 - DB 235,90 ; jmp c2d5 <_sk_scale_u8_sse2_lowp+0xad> + DB 235,90 ; jmp c2b1 <_sk_scale_u8_sse2_lowp+0xad> DB 243,15,126,36,51 ; movq (%ebx,%esi,1),%xmm4 DB 102,15,96,224 ; punpcklbw %xmm0,%xmm4 - DB 235,79 ; jmp c2d5 <_sk_scale_u8_sse2_lowp+0xad> + DB 235,79 ; jmp c2b1 <_sk_scale_u8_sse2_lowp+0xad> DB 15,182,76,51,2 ; movzbl 0x2(%ebx,%esi,1),%ecx DB 102,15,239,228 ; pxor %xmm4,%xmm4 DB 102,15,196,225,2 ; pinsrw $0x2,%ecx,%xmm4 @@ -58080,7 +58068,7 @@ _sk_scale_u8_sse2_lowp LABEL PROC DB 102,15,110,233 ; movd %ecx,%xmm5 DB 102,15,96,232 ; punpcklbw %xmm0,%xmm5 DB 243,15,16,229 ; movss %xmm5,%xmm4 - DB 235,47 ; jmp c2d5 <_sk_scale_u8_sse2_lowp+0xad> + DB 235,47 ; jmp c2b1 <_sk_scale_u8_sse2_lowp+0xad> DB 15,182,76,51,6 ; movzbl 0x6(%ebx,%esi,1),%ecx DB 102,15,239,228 ; pxor %xmm4,%xmm4 DB 102,15,196,225,6 ; pinsrw $0x6,%ecx,%xmm4 @@ -58091,9 +58079,9 @@ _sk_scale_u8_sse2_lowp LABEL PROC DB 102,15,110,44,51 ; movd (%ebx,%esi,1),%xmm5 DB 102,15,96,232 ; punpcklbw %xmm0,%xmm5 DB 242,15,16,229 ; movsd %xmm5,%xmm4 - DB 102,15,219,167,103,17,0,0 ; pand 0x1167(%edi),%xmm4 + DB 102,15,219,167,107,17,0,0 ; pand 0x116b(%edi),%xmm4 DB 102,15,213,196 ; pmullw %xmm4,%xmm0 - DB 102,15,111,175,103,17,0,0 ; movdqa 0x1167(%edi),%xmm5 + DB 102,15,111,175,107,17,0,0 ; movdqa 0x116b(%edi),%xmm5 DB 102,15,253,197 ; paddw %xmm5,%xmm0 DB 102,15,113,208,8 ; psrlw $0x8,%xmm0 DB 102,15,213,204 ; pmullw %xmm4,%xmm1 @@ -58158,10 +58146,10 @@ _sk_lerp_u8_sse2_lowp LABEL PROC DB 128,225,7 ; and $0x7,%cl DB 254,201 ; dec %cl DB 128,249,6 ; cmp $0x6,%cl - DB 232,0,0,0,0 ; call c3a6 <_sk_lerp_u8_sse2_lowp+0x2e> + DB 232,0,0,0,0 ; call c382 <_sk_lerp_u8_sse2_lowp+0x2e> DB 95 ; pop %edi DB 139,117,16 ; mov 0x10(%ebp),%esi - DB 119,28 ; ja c3c8 <_sk_lerp_u8_sse2_lowp+0x50> + DB 119,28 ; ja c3a4 <_sk_lerp_u8_sse2_lowp+0x50> DB 102,15,239,219 ; pxor %xmm3,%xmm3 DB 15,182,201 ; movzbl %cl,%ecx DB 139,140,143,74,1,0,0 ; mov 0x14a(%edi,%ecx,4),%ecx @@ -58169,10 +58157,10 @@ _sk_lerp_u8_sse2_lowp LABEL PROC DB 255,225 ; jmp *%ecx DB 15,182,12,51 ; movzbl (%ebx,%esi,1),%ecx DB 102,15,110,217 ; movd %ecx,%xmm3 - DB 235,90 ; jmp c422 <_sk_lerp_u8_sse2_lowp+0xaa> + DB 235,90 ; jmp c3fe <_sk_lerp_u8_sse2_lowp+0xaa> DB 243,15,126,28,51 ; movq (%ebx,%esi,1),%xmm3 DB 102,15,96,216 ; punpcklbw %xmm0,%xmm3 - DB 235,79 ; jmp c422 <_sk_lerp_u8_sse2_lowp+0xaa> + DB 235,79 ; jmp c3fe <_sk_lerp_u8_sse2_lowp+0xaa> DB 15,182,76,51,2 ; movzbl 0x2(%ebx,%esi,1),%ecx DB 102,15,239,219 ; pxor %xmm3,%xmm3 DB 102,15,196,217,2 ; pinsrw $0x2,%ecx,%xmm3 @@ -58180,7 +58168,7 @@ _sk_lerp_u8_sse2_lowp LABEL PROC DB 102,15,110,225 ; movd %ecx,%xmm4 DB 102,15,96,224 ; punpcklbw %xmm0,%xmm4 DB 243,15,16,220 ; movss %xmm4,%xmm3 - DB 235,47 ; jmp c422 <_sk_lerp_u8_sse2_lowp+0xaa> + DB 235,47 ; jmp c3fe <_sk_lerp_u8_sse2_lowp+0xaa> DB 15,182,76,51,6 ; movzbl 0x6(%ebx,%esi,1),%ecx DB 102,15,239,219 ; pxor %xmm3,%xmm3 DB 102,15,196,217,6 ; pinsrw $0x6,%ecx,%xmm3 @@ -58191,8 +58179,8 @@ _sk_lerp_u8_sse2_lowp LABEL PROC DB 102,15,110,36,51 ; movd (%ebx,%esi,1),%xmm4 DB 102,15,96,224 ; punpcklbw %xmm0,%xmm4 DB 242,15,16,220 ; movsd %xmm4,%xmm3 - DB 102,15,219,159,26,16,0,0 ; pand 0x101a(%edi),%xmm3 - DB 102,15,111,183,26,16,0,0 ; movdqa 0x101a(%edi),%xmm6 + DB 102,15,219,159,30,16,0,0 ; pand 0x101e(%edi),%xmm3 + DB 102,15,111,183,30,16,0,0 ; movdqa 0x101e(%edi),%xmm6 DB 102,15,111,227 ; movdqa %xmm3,%xmm4 DB 102,15,239,230 ; pxor %xmm6,%xmm4 DB 102,15,111,252 ; movdqa %xmm4,%xmm7 @@ -58279,10 +58267,10 @@ _sk_scale_565_sse2_lowp LABEL PROC DB 128,225,7 ; and $0x7,%cl DB 254,201 ; dec %cl DB 128,249,6 ; cmp $0x6,%cl - DB 232,0,0,0,0 ; call c54f <_sk_scale_565_sse2_lowp+0x43> + DB 232,0,0,0,0 ; call c52b <_sk_scale_565_sse2_lowp+0x43> DB 95 ; pop %edi DB 139,117,16 ; mov 0x10(%ebp),%esi - DB 119,28 ; ja c571 <_sk_scale_565_sse2_lowp+0x65> + DB 119,28 ; ja c54d <_sk_scale_565_sse2_lowp+0x65> DB 102,15,239,219 ; pxor %xmm3,%xmm3 DB 15,182,201 ; movzbl %cl,%ecx DB 139,140,143,249,1,0,0 ; mov 0x1f9(%edi,%ecx,4),%ecx @@ -58290,14 +58278,14 @@ _sk_scale_565_sse2_lowp LABEL PROC DB 255,225 ; jmp *%ecx DB 15,183,12,115 ; movzwl (%ebx,%esi,2),%ecx DB 102,15,110,217 ; movd %ecx,%xmm3 - DB 235,59 ; jmp c5ac <_sk_scale_565_sse2_lowp+0xa0> + DB 235,59 ; jmp c588 <_sk_scale_565_sse2_lowp+0xa0> DB 243,15,111,28,115 ; movdqu (%ebx,%esi,2),%xmm3 - DB 235,52 ; jmp c5ac <_sk_scale_565_sse2_lowp+0xa0> + DB 235,52 ; jmp c588 <_sk_scale_565_sse2_lowp+0xa0> DB 102,15,239,219 ; pxor %xmm3,%xmm3 DB 102,15,196,92,115,4,2 ; pinsrw $0x2,0x4(%ebx,%esi,2),%xmm3 DB 243,15,16,12,115 ; movss (%ebx,%esi,2),%xmm1 DB 243,15,16,217 ; movss %xmm1,%xmm3 - DB 235,30 ; jmp c5ac <_sk_scale_565_sse2_lowp+0xa0> + DB 235,30 ; jmp c588 <_sk_scale_565_sse2_lowp+0xa0> DB 102,15,239,219 ; pxor %xmm3,%xmm3 DB 102,15,196,92,115,12,6 ; pinsrw $0x6,0xc(%ebx,%esi,2),%xmm3 DB 102,15,196,92,115,10,5 ; pinsrw $0x5,0xa(%ebx,%esi,2),%xmm3 @@ -58305,11 +58293,11 @@ _sk_scale_565_sse2_lowp LABEL PROC DB 102,15,18,28,115 ; movlpd (%ebx,%esi,2),%xmm3 DB 102,15,111,203 ; movdqa %xmm3,%xmm1 DB 102,15,113,209,8 ; psrlw $0x8,%xmm1 - DB 102,15,219,143,177,14,0,0 ; pand 0xeb1(%edi),%xmm1 + DB 102,15,219,143,181,14,0,0 ; pand 0xeb5(%edi),%xmm1 DB 102,15,111,211 ; movdqa %xmm3,%xmm2 DB 102,15,113,210,5 ; psrlw $0x5,%xmm2 - DB 102,15,219,151,193,14,0,0 ; pand 0xec1(%edi),%xmm2 - DB 102,15,111,135,209,14,0,0 ; movdqa 0xed1(%edi),%xmm0 + DB 102,15,219,151,197,14,0,0 ; pand 0xec5(%edi),%xmm2 + DB 102,15,111,135,213,14,0,0 ; movdqa 0xed5(%edi),%xmm0 DB 102,15,219,195 ; pand %xmm3,%xmm0 DB 102,15,113,211,13 ; psrlw $0xd,%xmm3 DB 102,15,235,217 ; por %xmm1,%xmm3 @@ -58322,7 +58310,7 @@ _sk_scale_565_sse2_lowp LABEL PROC DB 102,15,113,208,2 ; psrlw $0x2,%xmm0 DB 102,15,235,193 ; por %xmm1,%xmm0 DB 102,15,127,69,200 ; movdqa %xmm0,-0x38(%ebp) - DB 102,15,111,167,145,14,0,0 ; movdqa 0xe91(%edi),%xmm4 + DB 102,15,111,167,149,14,0,0 ; movdqa 0xe95(%edi),%xmm4 DB 15,41,117,184 ; movaps %xmm6,-0x48(%ebp) DB 102,15,239,244 ; pxor %xmm4,%xmm6 DB 102,15,239,252 ; pxor %xmm4,%xmm7 @@ -58365,7 +58353,7 @@ _sk_scale_565_sse2_lowp LABEL PROC DB 102,15,111,229 ; movdqa %xmm5,%xmm4 DB 102,15,213,101,136 ; pmullw -0x78(%ebp),%xmm4 DB 102,15,213,125,184 ; pmullw -0x48(%ebp),%xmm7 - DB 102,15,111,135,113,14,0,0 ; movdqa 0xe71(%edi),%xmm0 + DB 102,15,111,135,117,14,0,0 ; movdqa 0xe75(%edi),%xmm0 DB 102,15,253,216 ; paddw %xmm0,%xmm3 DB 102,15,253,208 ; paddw %xmm0,%xmm2 DB 102,15,253,224 ; paddw %xmm0,%xmm4 @@ -58440,10 +58428,10 @@ _sk_lerp_565_sse2_lowp LABEL PROC DB 128,225,7 ; and $0x7,%cl DB 254,201 ; dec %cl DB 128,249,6 ; cmp $0x6,%cl - DB 232,0,0,0,0 ; call c7a7 <_sk_lerp_565_sse2_lowp+0x43> + DB 232,0,0,0,0 ; call c783 <_sk_lerp_565_sse2_lowp+0x43> DB 95 ; pop %edi DB 139,117,16 ; mov 0x10(%ebp),%esi - DB 119,28 ; ja c7c9 <_sk_lerp_565_sse2_lowp+0x65> + DB 119,28 ; ja c7a5 <_sk_lerp_565_sse2_lowp+0x65> DB 102,15,239,219 ; pxor %xmm3,%xmm3 DB 15,182,201 ; movzbl %cl,%ecx DB 139,140,143,73,2,0,0 ; mov 0x249(%edi,%ecx,4),%ecx @@ -58451,14 +58439,14 @@ _sk_lerp_565_sse2_lowp LABEL PROC DB 255,225 ; jmp *%ecx DB 15,183,12,115 ; movzwl (%ebx,%esi,2),%ecx DB 102,15,110,217 ; movd %ecx,%xmm3 - DB 235,59 ; jmp c804 <_sk_lerp_565_sse2_lowp+0xa0> + DB 235,59 ; jmp c7e0 <_sk_lerp_565_sse2_lowp+0xa0> DB 243,15,111,28,115 ; movdqu (%ebx,%esi,2),%xmm3 - DB 235,52 ; jmp c804 <_sk_lerp_565_sse2_lowp+0xa0> + DB 235,52 ; jmp c7e0 <_sk_lerp_565_sse2_lowp+0xa0> DB 102,15,239,219 ; pxor %xmm3,%xmm3 DB 102,15,196,92,115,4,2 ; pinsrw $0x2,0x4(%ebx,%esi,2),%xmm3 DB 243,15,16,12,115 ; movss (%ebx,%esi,2),%xmm1 DB 243,15,16,217 ; movss %xmm1,%xmm3 - DB 235,30 ; jmp c804 <_sk_lerp_565_sse2_lowp+0xa0> + DB 235,30 ; jmp c7e0 <_sk_lerp_565_sse2_lowp+0xa0> DB 102,15,239,219 ; pxor %xmm3,%xmm3 DB 102,15,196,92,115,12,6 ; pinsrw $0x6,0xc(%ebx,%esi,2),%xmm3 DB 102,15,196,92,115,10,5 ; pinsrw $0x5,0xa(%ebx,%esi,2),%xmm3 @@ -58466,11 +58454,11 @@ _sk_lerp_565_sse2_lowp LABEL PROC DB 102,15,18,28,115 ; movlpd (%ebx,%esi,2),%xmm3 DB 102,15,111,203 ; movdqa %xmm3,%xmm1 DB 102,15,113,209,8 ; psrlw $0x8,%xmm1 - DB 102,15,219,143,89,12,0,0 ; pand 0xc59(%edi),%xmm1 + DB 102,15,219,143,93,12,0,0 ; pand 0xc5d(%edi),%xmm1 DB 102,15,111,211 ; movdqa %xmm3,%xmm2 DB 102,15,113,210,5 ; psrlw $0x5,%xmm2 - DB 102,15,219,151,105,12,0,0 ; pand 0xc69(%edi),%xmm2 - DB 102,15,111,175,121,12,0,0 ; movdqa 0xc79(%edi),%xmm5 + DB 102,15,219,151,109,12,0,0 ; pand 0xc6d(%edi),%xmm2 + DB 102,15,111,175,125,12,0,0 ; movdqa 0xc7d(%edi),%xmm5 DB 102,15,219,235 ; pand %xmm3,%xmm5 DB 102,15,113,211,13 ; psrlw $0xd,%xmm3 DB 102,15,235,217 ; por %xmm1,%xmm3 @@ -58483,7 +58471,7 @@ _sk_lerp_565_sse2_lowp LABEL PROC DB 102,15,113,213,2 ; psrlw $0x2,%xmm5 DB 102,15,235,233 ; por %xmm1,%xmm5 DB 102,15,127,109,216 ; movdqa %xmm5,-0x28(%ebp) - DB 102,15,111,167,57,12,0,0 ; movdqa 0xc39(%edi),%xmm4 + DB 102,15,111,167,61,12,0,0 ; movdqa 0xc3d(%edi),%xmm4 DB 102,15,111,198 ; movdqa %xmm6,%xmm0 DB 102,15,111,200 ; movdqa %xmm0,%xmm1 DB 102,15,239,204 ; pxor %xmm4,%xmm1 @@ -58524,7 +58512,7 @@ _sk_lerp_565_sse2_lowp LABEL PROC DB 102,15,235,249 ; por %xmm1,%xmm7 DB 102,15,111,195 ; movdqa %xmm3,%xmm0 DB 102,15,213,93,168 ; pmullw -0x58(%ebp),%xmm3 - DB 102,15,111,143,25,12,0,0 ; movdqa 0xc19(%edi),%xmm1 + DB 102,15,111,143,29,12,0,0 ; movdqa 0xc1d(%edi),%xmm1 DB 102,15,239,193 ; pxor %xmm1,%xmm0 DB 102,15,111,101,24 ; movdqa 0x18(%ebp),%xmm4 DB 102,15,213,196 ; pmullw %xmm4,%xmm0 @@ -58618,11 +58606,11 @@ _sk_srcover_rgba_8888_sse2_lowp LABEL PROC DB 128,227,7 ; and $0x7,%bl DB 254,203 ; dec %bl DB 128,251,6 ; cmp $0x6,%bl - DB 232,0,0,0,0 ; call ca4b <_sk_srcover_rgba_8888_sse2_lowp+0x3f> + DB 232,0,0,0,0 ; call ca27 <_sk_srcover_rgba_8888_sse2_lowp+0x3f> DB 89 ; pop %ecx DB 139,117,16 ; mov 0x10(%ebp),%esi DB 15,182,211 ; movzbl %bl,%edx - DB 119,29 ; ja ca71 <_sk_srcover_rgba_8888_sse2_lowp+0x65> + DB 119,29 ; ja ca4d <_sk_srcover_rgba_8888_sse2_lowp+0x65> DB 102,15,239,219 ; pxor %xmm3,%xmm3 DB 139,132,145,77,2,0,0 ; mov 0x24d(%ecx,%edx,4),%eax DB 1,200 ; add %ecx,%eax @@ -58630,14 +58618,14 @@ _sk_srcover_rgba_8888_sse2_lowp LABEL PROC DB 255,224 ; jmp *%eax DB 243,15,16,52,183 ; movss (%edi,%esi,4),%xmm6 DB 15,87,219 ; xorps %xmm3,%xmm3 - DB 235,73 ; jmp caba <_sk_srcover_rgba_8888_sse2_lowp+0xae> + DB 235,73 ; jmp ca96 <_sk_srcover_rgba_8888_sse2_lowp+0xae> DB 102,15,16,52,183 ; movupd (%edi,%esi,4),%xmm6 DB 15,16,92,183,16 ; movups 0x10(%edi,%esi,4),%xmm3 - DB 235,61 ; jmp caba <_sk_srcover_rgba_8888_sse2_lowp+0xae> + DB 235,61 ; jmp ca96 <_sk_srcover_rgba_8888_sse2_lowp+0xae> DB 102,15,110,68,183,8 ; movd 0x8(%edi,%esi,4),%xmm0 DB 102,15,112,240,69 ; pshufd $0x45,%xmm0,%xmm6 DB 102,15,18,52,183 ; movlpd (%edi,%esi,4),%xmm6 - DB 235,43 ; jmp caba <_sk_srcover_rgba_8888_sse2_lowp+0xae> + DB 235,43 ; jmp ca96 <_sk_srcover_rgba_8888_sse2_lowp+0xae> DB 102,15,110,68,183,24 ; movd 0x18(%edi,%esi,4),%xmm0 DB 102,15,112,216,69 ; pshufd $0x45,%xmm0,%xmm3 DB 243,15,16,68,183,20 ; movss 0x14(%edi,%esi,4),%xmm0 @@ -58663,7 +58651,7 @@ _sk_srcover_rgba_8888_sse2_lowp LABEL PROC DB 102,15,114,243,16 ; pslld $0x10,%xmm3 DB 102,15,114,227,16 ; psrad $0x10,%xmm3 DB 102,15,107,243 ; packssdw %xmm3,%xmm6 - DB 102,15,111,153,117,9,0,0 ; movdqa 0x975(%ecx),%xmm3 + DB 102,15,111,153,121,9,0,0 ; movdqa 0x979(%ecx),%xmm3 DB 102,15,114,208,16 ; psrld $0x10,%xmm0 DB 102,15,114,210,16 ; psrld $0x10,%xmm2 DB 102,15,114,242,16 ; pslld $0x10,%xmm2 @@ -58715,18 +58703,18 @@ _sk_srcover_rgba_8888_sse2_lowp LABEL PROC DB 102,15,105,220 ; punpckhwd %xmm4,%xmm3 DB 102,15,235,222 ; por %xmm6,%xmm3 DB 128,251,6 ; cmp $0x6,%bl - DB 119,16 ; ja cbfb <_sk_srcover_rgba_8888_sse2_lowp+0x1ef> + DB 119,16 ; ja cbd7 <_sk_srcover_rgba_8888_sse2_lowp+0x1ef> DB 3,140,145,105,2,0,0 ; add 0x269(%ecx,%edx,4),%ecx DB 255,225 ; jmp *%ecx DB 102,15,126,4,183 ; movd %xmm0,(%edi,%esi,4) - DB 235,64 ; jmp cc3b <_sk_srcover_rgba_8888_sse2_lowp+0x22f> + DB 235,64 ; jmp cc17 <_sk_srcover_rgba_8888_sse2_lowp+0x22f> DB 243,15,127,4,183 ; movdqu %xmm0,(%edi,%esi,4) DB 243,15,127,92,183,16 ; movdqu %xmm3,0x10(%edi,%esi,4) - DB 235,51 ; jmp cc3b <_sk_srcover_rgba_8888_sse2_lowp+0x22f> + DB 235,51 ; jmp cc17 <_sk_srcover_rgba_8888_sse2_lowp+0x22f> DB 102,15,112,208,78 ; pshufd $0x4e,%xmm0,%xmm2 DB 102,15,126,84,183,8 ; movd %xmm2,0x8(%edi,%esi,4) DB 102,15,214,4,183 ; movq %xmm0,(%edi,%esi,4) - DB 235,33 ; jmp cc3b <_sk_srcover_rgba_8888_sse2_lowp+0x22f> + DB 235,33 ; jmp cc17 <_sk_srcover_rgba_8888_sse2_lowp+0x22f> DB 102,15,112,211,78 ; pshufd $0x4e,%xmm3,%xmm2 DB 102,15,126,84,183,24 ; movd %xmm2,0x18(%edi,%esi,4) DB 102,15,112,211,229 ; pshufd $0xe5,%xmm3,%xmm2 @@ -58855,11 +58843,11 @@ ALIGN 16 DB 0,128,191,0,0,128 ; add %al,-0x7fffff41(%eax) DB 191,0,0,224,64 ; mov $0x40e00000,%edi DB 0,0 ; add %al,(%eax) - DB 224,64 ; loopne cdb8 <.literal16+0xe8> + DB 224,64 ; loopne cd98 <.literal16+0xe8> DB 0,0 ; add %al,(%eax) - DB 224,64 ; loopne cdbc <.literal16+0xec> + DB 224,64 ; loopne cd9c <.literal16+0xec> DB 0,0 ; add %al,(%eax) - DB 224,64 ; loopne cdc0 <.literal16+0xf0> + DB 224,64 ; loopne cda0 <.literal16+0xf0> DB 154,153,153,62,154,153,153 ; lcall $0x9999,$0x9a3e9999 DB 62,154,153,153,62,154,153,153 ; ds lcall $0x9999,$0x9a3e9999 DB 62,61,10,23,63,61 ; ds cmp $0x3d3f170a,%eax @@ -58870,16 +58858,16 @@ ALIGN 16 DB 63 ; aas DB 174 ; scas %es:(%edi),%al DB 71 ; inc %edi - DB 225,61 ; loope cde1 <.literal16+0x111> + DB 225,61 ; loope cdc1 <.literal16+0x111> DB 174 ; scas %es:(%edi),%al DB 71 ; inc %edi - DB 225,61 ; loope cde5 <.literal16+0x115> + DB 225,61 ; loope cdc5 <.literal16+0x115> DB 174 ; scas %es:(%edi),%al DB 71 ; inc %edi - DB 225,61 ; loope cde9 <.literal16+0x119> + DB 225,61 ; loope cdc9 <.literal16+0x119> DB 174 ; scas %es:(%edi),%al DB 71 ; inc %edi - DB 225,61 ; loope cded <.literal16+0x11d> + DB 225,61 ; loope cdcd <.literal16+0x11d> DB 255,0 ; incl (%eax) DB 0,0 ; add %al,(%eax) DB 255,0 ; incl (%eax) @@ -58889,13 +58877,13 @@ ALIGN 16 DB 255,0 ; incl (%eax) DB 0,0 ; add %al,(%eax) DB 0,0 ; add %al,(%eax) - DB 127,67 ; jg ce07 <.literal16+0x137> + DB 127,67 ; jg cde7 <.literal16+0x137> DB 0,0 ; add %al,(%eax) - DB 127,67 ; jg ce0b <.literal16+0x13b> + DB 127,67 ; jg cdeb <.literal16+0x13b> DB 0,0 ; add %al,(%eax) - DB 127,67 ; jg ce0f <.literal16+0x13f> + DB 127,67 ; jg cdef <.literal16+0x13f> DB 0,0 ; add %al,(%eax) - DB 127,67 ; jg ce13 <.literal16+0x143> + DB 127,67 ; jg cdf3 <.literal16+0x143> DB 145 ; xchg %eax,%ecx DB 131,158,61,145,131,158,61 ; sbbl $0x3d,-0x617c6ec3(%esi) DB 145 ; xchg %eax,%ecx @@ -59046,13 +59034,13 @@ ALIGN 16 DB 132,55 ; test %dh,(%edi) DB 8,33 ; or %ah,(%ecx) DB 132,55 ; test %dh,(%edi) - DB 224,7 ; loopne cf19 <.literal16+0x249> + DB 224,7 ; loopne cef9 <.literal16+0x249> DB 0,0 ; add %al,(%eax) - DB 224,7 ; loopne cf1d <.literal16+0x24d> + DB 224,7 ; loopne cefd <.literal16+0x24d> DB 0,0 ; add %al,(%eax) - DB 224,7 ; loopne cf21 <.literal16+0x251> + DB 224,7 ; loopne cf01 <.literal16+0x251> DB 0,0 ; add %al,(%eax) - DB 224,7 ; loopne cf25 <.literal16+0x255> + DB 224,7 ; loopne cf05 <.literal16+0x255> DB 0,0 ; add %al,(%eax) DB 33,8 ; and %ecx,(%eax) DB 2,58 ; add (%edx),%bh @@ -59101,17 +59089,17 @@ ALIGN 16 DB 0,0 ; add %al,(%eax) DB 52,255 ; xor $0xff,%al DB 255 ; (bad) - DB 127,0 ; jg cf84 <.literal16+0x2b4> + DB 127,0 ; jg cf64 <.literal16+0x2b4> DB 255 ; (bad) DB 255 ; (bad) - DB 127,0 ; jg cf88 <.literal16+0x2b8> + DB 127,0 ; jg cf68 <.literal16+0x2b8> DB 255 ; (bad) DB 255 ; (bad) - DB 127,0 ; jg cf8c <.literal16+0x2bc> + DB 127,0 ; jg cf6c <.literal16+0x2bc> DB 255 ; (bad) DB 255 ; (bad) - DB 127,0 ; jg cf90 <.literal16+0x2c0> - DB 119,115 ; ja d005 <.literal16+0x335> + DB 127,0 ; jg cf70 <.literal16+0x2c0> + DB 119,115 ; ja cfe5 <.literal16+0x335> DB 248 ; clc DB 194,119,115 ; ret $0x7377 DB 248 ; clc @@ -59122,7 +59110,7 @@ ALIGN 16 DB 194,117,191 ; ret $0xbf75 DB 191,63,117,191,191 ; mov $0xbfbf753f,%edi DB 63 ; aas - DB 117,191 ; jne cf69 <.literal16+0x299> + DB 117,191 ; jne cf49 <.literal16+0x299> DB 191,63,117,191,191 ; mov $0xbfbf753f,%edi DB 63 ; aas DB 249 ; stc @@ -59138,7 +59126,7 @@ ALIGN 16 DB 68 ; inc %esp DB 180,62 ; mov $0x3e,%ah DB 163,233,220,63,163 ; mov %eax,0xa33fdce9 - DB 233,220,63,163,233 ; jmp e9a40fa6 <_sk_srcover_rgba_8888_sse2_lowp+0xe9a3459a> + DB 233,220,63,163,233 ; jmp e9a40f86 <_sk_srcover_rgba_8888_sse2_lowp+0xe9a3459e> DB 220,63 ; fdivrl (%edi) DB 163,233,220,63,81 ; mov %eax,0x513fdce9 DB 140,242 ; mov %?,%edx @@ -59234,16 +59222,16 @@ ALIGN 16 DB 128,3,62 ; addb $0x3e,(%ebx) DB 31 ; pop %ds DB 215 ; xlat %ds:(%ebx) - DB 118,63 ; jbe d0f3 <.literal16+0x423> + DB 118,63 ; jbe d0d3 <.literal16+0x423> DB 31 ; pop %ds DB 215 ; xlat %ds:(%ebx) - DB 118,63 ; jbe d0f7 <.literal16+0x427> + DB 118,63 ; jbe d0d7 <.literal16+0x427> DB 31 ; pop %ds DB 215 ; xlat %ds:(%ebx) - DB 118,63 ; jbe d0fb <.literal16+0x42b> + DB 118,63 ; jbe d0db <.literal16+0x42b> DB 31 ; pop %ds DB 215 ; xlat %ds:(%ebx) - DB 118,63 ; jbe d0ff <.literal16+0x42f> + DB 118,63 ; jbe d0df <.literal16+0x42f> DB 246,64,83,63 ; testb $0x3f,0x53(%eax) DB 246,64,83,63 ; testb $0x3f,0x53(%eax) DB 246,64,83,63 ; testb $0x3f,0x53(%eax) @@ -59269,13 +59257,13 @@ ALIGN 16 DB 248 ; clc DB 65 ; inc %ecx DB 0,0 ; add %al,(%eax) - DB 124,66 ; jl d136 <.literal16+0x466> + DB 124,66 ; jl d116 <.literal16+0x466> DB 0,0 ; add %al,(%eax) - DB 124,66 ; jl d13a <.literal16+0x46a> + DB 124,66 ; jl d11a <.literal16+0x46a> DB 0,0 ; add %al,(%eax) - DB 124,66 ; jl d13e <.literal16+0x46e> + DB 124,66 ; jl d11e <.literal16+0x46e> DB 0,0 ; add %al,(%eax) - DB 124,66 ; jl d142 <.literal16+0x472> + DB 124,66 ; jl d122 <.literal16+0x472> DB 0,240 ; add %dh,%al DB 0,0 ; add %al,(%eax) DB 0,240 ; add %dh,%al @@ -59321,25 +59309,25 @@ ALIGN 16 DB 136,136,61,137,136,136 ; mov %cl,-0x777776c3(%eax) DB 61,137,136,136,61 ; cmp $0x3d888889,%eax DB 0,0 ; add %al,(%eax) - DB 112,65 ; jo d1c5 <.literal16+0x4f5> + DB 112,65 ; jo d1a5 <.literal16+0x4f5> DB 0,0 ; add %al,(%eax) - DB 112,65 ; jo d1c9 <.literal16+0x4f9> + DB 112,65 ; jo d1a9 <.literal16+0x4f9> DB 0,0 ; add %al,(%eax) - DB 112,65 ; jo d1cd <.literal16+0x4fd> + DB 112,65 ; jo d1ad <.literal16+0x4fd> DB 0,0 ; add %al,(%eax) - DB 112,65 ; jo d1d1 <.literal16+0x501> + DB 112,65 ; jo d1b1 <.literal16+0x501> DB 0,128,0,0,0,128 ; add %al,-0x80000000(%eax) DB 0,0 ; add %al,(%eax) DB 0,128,0,0,0,128 ; add %al,-0x80000000(%eax) DB 0,0 ; add %al,(%eax) DB 255 ; (bad) - DB 127,0 ; jg d1a3 <.literal16+0x4d3> + DB 127,0 ; jg d183 <.literal16+0x4d3> DB 0,255 ; add %bh,%bh - DB 127,0 ; jg d1a7 <.literal16+0x4d7> + DB 127,0 ; jg d187 <.literal16+0x4d7> DB 0,255 ; add %bh,%bh - DB 127,0 ; jg d1ab <.literal16+0x4db> + DB 127,0 ; jg d18b <.literal16+0x4db> DB 0,255 ; add %bh,%bh - DB 127,0 ; jg d1af <.literal16+0x4df> + DB 127,0 ; jg d18f <.literal16+0x4df> DB 0,0 ; add %al,(%eax) DB 4,0 ; add $0x0,%al DB 0,0 ; add %al,(%eax) @@ -59365,13 +59353,13 @@ ALIGN 16 DB 255 ; (bad) DB 255 ; (bad) DB 255 ; (bad) - DB 127,255 ; jg d1e8 <.literal16+0x518> + DB 127,255 ; jg d1c8 <.literal16+0x518> DB 255 ; (bad) DB 255 ; (bad) - DB 127,255 ; jg d1ec <.literal16+0x51c> + DB 127,255 ; jg d1cc <.literal16+0x51c> DB 255 ; (bad) DB 255 ; (bad) - DB 127,0 ; jg d1f1 <.literal16+0x521> + DB 127,0 ; jg d1d1 <.literal16+0x521> DB 0,128,56,0,0,128 ; add %al,-0x7fffffc8(%eax) DB 56,0 ; cmp %al,(%eax) DB 0,128,56,0,0,128 ; add %al,-0x7fffffc8(%eax) @@ -59385,13 +59373,13 @@ ALIGN 16 DB 0,255 ; add %bh,%bh DB 255,0 ; incl (%eax) DB 255 ; (bad) - DB 127,71 ; jg d25b <.literal16+0x58b> + DB 127,71 ; jg d23b <.literal16+0x58b> DB 0,255 ; add %bh,%bh - DB 127,71 ; jg d25f <.literal16+0x58f> + DB 127,71 ; jg d23f <.literal16+0x58f> DB 0,255 ; add %bh,%bh - DB 127,71 ; jg d263 <.literal16+0x593> + DB 127,71 ; jg d243 <.literal16+0x593> DB 0,255 ; add %bh,%bh - DB 127,71 ; jg d267 <.literal16+0x597> + DB 127,71 ; jg d247 <.literal16+0x597> DB 208 ; (bad) DB 179,89 ; mov $0x59,%bl DB 62,208 ; ds (bad) @@ -59444,7 +59432,7 @@ ALIGN 16 DB 192,45,16,17,192,45,16 ; shrb $0x10,0x2dc01110 DB 17,192 ; adc %eax,%eax DB 45,16,17,192,18 ; sub $0x12c01110,%eax - DB 120,57 ; js d2cc <.literal16+0x5fc> + DB 120,57 ; js d2ac <.literal16+0x5fc> DB 64 ; inc %eax DB 18,120,57 ; adc 0x39(%eax),%bh DB 64 ; inc %eax @@ -59515,13 +59503,13 @@ ALIGN 16 DB 192,191,0,0,192,191,0 ; sarb $0x0,-0x40400000(%edi) DB 0,192 ; add %al,%al DB 191,0,0,192,191 ; mov $0xbfc00000,%edi - DB 114,28 ; jb d37e <.literal16+0x6ae> + DB 114,28 ; jb d35e <.literal16+0x6ae> DB 199 ; (bad) - DB 62,114,28 ; jb,pt d382 <.literal16+0x6b2> + DB 62,114,28 ; jb,pt d362 <.literal16+0x6b2> DB 199 ; (bad) - DB 62,114,28 ; jb,pt d386 <.literal16+0x6b6> + DB 62,114,28 ; jb,pt d366 <.literal16+0x6b6> DB 199 ; (bad) - DB 62,114,28 ; jb,pt d38a <.literal16+0x6ba> + DB 62,114,28 ; jb,pt d36a <.literal16+0x6ba> DB 199 ; (bad) DB 62,85 ; ds push %ebp DB 85 ; push %ebp @@ -59542,13 +59530,13 @@ ALIGN 16 DB 57,142,99,61,57,142 ; cmp %ecx,-0x71c6c29d(%esi) DB 99,61,57,142,99,61 ; arpl %di,0x3d638e39 DB 57,142,99,61,114,249 ; cmp %ecx,-0x68dc29d(%esi) - DB 127,63 ; jg d3e3 <.literal16+0x713> - DB 114,249 ; jb d39f <.literal16+0x6cf> - DB 127,63 ; jg d3e7 <.literal16+0x717> - DB 114,249 ; jb d3a3 <.literal16+0x6d3> - DB 127,63 ; jg d3eb <.literal16+0x71b> - DB 114,249 ; jb d3a7 <.literal16+0x6d7> - DB 127,63 ; jg d3ef <.literal16+0x71f> + DB 127,63 ; jg d3c3 <.literal16+0x713> + DB 114,249 ; jb d37f <.literal16+0x6cf> + DB 127,63 ; jg d3c7 <.literal16+0x717> + DB 114,249 ; jb d383 <.literal16+0x6d3> + DB 127,63 ; jg d3cb <.literal16+0x71b> + DB 114,249 ; jb d387 <.literal16+0x6d7> + DB 127,63 ; jg d3cf <.literal16+0x71f> DB 3,0 ; add (%eax),%eax DB 0,0 ; add %al,(%eax) DB 3,0 ; add (%eax),%eax @@ -59616,14 +59604,14 @@ ALIGN 16 DB 0,248 ; add %bh,%al DB 0,248 ; add %bh,%al DB 0,248 ; add %bh,%al - DB 224,255 ; loopne d441 <.literal16+0x771> - DB 224,255 ; loopne d443 <.literal16+0x773> - DB 224,255 ; loopne d445 <.literal16+0x775> - DB 224,255 ; loopne d447 <.literal16+0x777> - DB 224,255 ; loopne d449 <.literal16+0x779> - DB 224,255 ; loopne d44b <.literal16+0x77b> - DB 224,255 ; loopne d44d <.literal16+0x77d> - DB 224,255 ; loopne d44f <.literal16+0x77f> + DB 224,255 ; loopne d421 <.literal16+0x771> + DB 224,255 ; loopne d423 <.literal16+0x773> + DB 224,255 ; loopne d425 <.literal16+0x775> + DB 224,255 ; loopne d427 <.literal16+0x777> + DB 224,255 ; loopne d429 <.literal16+0x779> + DB 224,255 ; loopne d42b <.literal16+0x77b> + DB 224,255 ; loopne d42d <.literal16+0x77d> + DB 224,255 ; loopne d42f <.literal16+0x77f> DB 54,0,54 ; add %dh,%ss:(%esi) DB 0,54 ; add %dh,(%esi) DB 0,54 ; add %dh,(%esi) @@ -59647,6 +59635,6 @@ ALIGN 4 DB 0,0 ; add %al,(%eax) DB 0,63 ; add %bh,(%edi) DB 0,0 ; add %al,(%eax) - DB 127,67 ; jg d4cb <_sk_srcover_rgba_8888_sse2_lowp+0xabf> + DB 127,67 ; jg d4ab <_sk_srcover_rgba_8888_sse2_lowp+0xac3> ENDIF END diff --git a/src/jumper/SkJumper_misc.h b/src/jumper/SkJumper_misc.h index 8f7ebb56ac..5db2709f05 100644 --- a/src/jumper/SkJumper_misc.h +++ b/src/jumper/SkJumper_misc.h @@ -65,7 +65,7 @@ SI void* load_and_inc(void**& program) { // Lazily resolved on first cast. Does nothing if cast to Ctx::None. struct Ctx { - using None = decltype(nullptr); + struct None {}; void* ptr; void**& program; @@ -77,7 +77,7 @@ struct Ctx { if (!ptr) { ptr = load_and_inc(program); } return (T*)ptr; } - operator None() { return nullptr; } + operator None() { return None{}; } }; #endif//SkJumper_misc_DEFINED diff --git a/src/jumper/SkJumper_stages.cpp b/src/jumper/SkJumper_stages.cpp index 4ba4a76a6b..262b9262de 100644 --- a/src/jumper/SkJumper_stages.cpp +++ b/src/jumper/SkJumper_stages.cpp @@ -85,31 +85,29 @@ extern "C" void WRAP(start_pipeline)(size_t x, size_t y, size_t xlimit, size_t y } #if defined(__i386__) || defined(_M_IX86) || defined(__arm__) - #define STAGE(name) \ - SI void name##_k(Ctx ctx, size_t x, size_t y, size_t tail, \ + #define STAGE(name, ...) \ + SI void name##_k(__VA_ARGS__, size_t x, size_t y, size_t tail, \ F& r, F& g, F& b, F& a, F& dr, F& dg, F& db, F& da); \ extern "C" void WRAP(name)(Params* params, void** program, \ F r, F g, F b, F a) { \ - Ctx ctx(program); \ - name##_k(ctx,params->x,params->y,params->tail, r,g,b,a, \ + name##_k(Ctx{program},params->x,params->y,params->tail, r,g,b,a, \ params->dr, params->dg, params->db, params->da); \ auto next = (Stage*)load_and_inc(program); \ next(params,program, r,g,b,a); \ } \ - SI void name##_k(Ctx ctx, size_t x, size_t y, size_t tail, \ + SI void name##_k(__VA_ARGS__, size_t x, size_t y, size_t tail, \ F& r, F& g, F& b, F& a, F& dr, F& dg, F& db, F& da) #else - #define STAGE(name) \ - SI void name##_k(Ctx ctx, size_t x, size_t y, size_t tail, \ + #define STAGE(name, ...) \ + SI void name##_k(__VA_ARGS__, size_t x, size_t y, size_t tail, \ F& r, F& g, F& b, F& a, F& dr, F& dg, F& db, F& da); \ extern "C" void WRAP(name)(size_t tail, void** program, size_t x, size_t y, \ F r, F g, F b, F a, F dr, F dg, F db, F da) { \ - Ctx ctx(program); \ - name##_k(ctx,x,y,tail, r,g,b,a, dr,dg,db,da); \ + name##_k(Ctx{program},x,y,tail, r,g,b,a, dr,dg,db,da); \ auto next = (Stage*)load_and_inc(program); \ next(tail,program,x,y, r,g,b,a, dr,dg,db,da); \ } \ - SI void name##_k(Ctx ctx, size_t x, size_t y, size_t tail, \ + SI void name##_k(__VA_ARGS__, size_t x, size_t y, size_t tail, \ F& r, F& g, F& b, F& a, F& dr, F& dg, F& db, F& da) #endif @@ -214,7 +212,7 @@ SI U32 ix_and_ptr(T** ptr, const SkJumper_GatherCtx* ctx, F x, F y) { // Now finally, normal Stages! -STAGE(seed_shader) { +STAGE(seed_shader, Ctx::None) { // It's important for speed to explicitly cast(x) and cast(y), // which has the effect of splatting them to vectors before converting to floats. // On Intel this breaks a data dependency on previous loop iterations' registers. @@ -226,9 +224,7 @@ STAGE(seed_shader) { dr = dg = db = da = 0; } -STAGE(dither) { - auto rate = *(const float*)ctx; - +STAGE(dither, const float* rate) { // Get [(x,y), (x+1,y), (x+2,y), ...] loaded up in integer vectors. uint32_t iota[] = {0,1,2,3,4,5,6,7}; U32 X = x + unaligned_load<U32>(iota), @@ -251,9 +247,9 @@ STAGE(dither) { // like 0 and 1 unchanged after rounding. F dither = cast(M) * (2/128.0f) - (63/128.0f); - r += rate*dither; - g += rate*dither; - b += rate*dither; + r += *rate*dither; + g += *rate*dither; + b += *rate*dither; r = max(0, min(r, a)); g = max(0, min(g, a)); @@ -261,8 +257,7 @@ STAGE(dither) { } // load 4 floats from memory, and splat them into r,g,b,a -STAGE(uniform_color) { - auto c = (const SkJumper_UniformColorCtx*)ctx; +STAGE(uniform_color, const SkJumper_UniformColorCtx* c) { r = c->r; g = c->g; b = c->b; @@ -270,18 +265,17 @@ STAGE(uniform_color) { } // splats opaque-black into r,g,b,a -STAGE(black_color) { +STAGE(black_color, Ctx::None) { r = g = b = 0.0f; a = 1.0f; } -STAGE(white_color) { +STAGE(white_color, Ctx::None) { r = g = b = a = 1.0f; } // load registers r,g,b,a from context (mirrors store_rgba) -STAGE(load_rgba) { - auto ptr = (const float*)ctx; +STAGE(load_rgba, const float* ptr) { r = unaligned_load<F>(ptr + 0*N); g = unaligned_load<F>(ptr + 1*N); b = unaligned_load<F>(ptr + 2*N); @@ -289,8 +283,7 @@ STAGE(load_rgba) { } // store registers r,g,b,a into context (mirrors load_rgba) -STAGE(store_rgba) { - auto ptr = (float*)ctx; +STAGE(store_rgba, float* ptr) { unaligned_store(ptr + 0*N, r); unaligned_store(ptr + 1*N, g); unaligned_store(ptr + 2*N, b); @@ -300,7 +293,7 @@ STAGE(store_rgba) { // Most blend modes apply the same logic to each channel. #define BLEND_MODE(name) \ SI F name##_channel(F s, F d, F sa, F da); \ - STAGE(name) { \ + STAGE(name, Ctx::None) { \ r = name##_channel(r,dr,a,da); \ g = name##_channel(g,dg,a,da); \ b = name##_channel(b,db,a,da); \ @@ -331,7 +324,7 @@ BLEND_MODE(xor_) { return s*inv(da) + d*inv(sa); } // Most other blend modes apply the same logic to colors, and srcover to alpha. #define BLEND_MODE(name) \ SI F name##_channel(F s, F d, F sa, F da); \ - STAGE(name) { \ + STAGE(name, Ctx::None) { \ r = name##_channel(r,dr,a,da); \ g = name##_channel(g,dg,a,da); \ b = name##_channel(b,db,a,da); \ @@ -429,7 +422,7 @@ SI void clip_color(F* r, F* g, F* b, F a) { *b = clip(*b); } -STAGE(hue) { +STAGE(hue, Ctx::None) { F R = r*a, G = g*a, B = b*a; @@ -443,7 +436,7 @@ STAGE(hue) { b = b*inv(da) + db*inv(a) + B; a = a + da - a*da; } -STAGE(saturation) { +STAGE(saturation, Ctx::None) { F R = dr*a, G = dg*a, B = db*a; @@ -457,7 +450,7 @@ STAGE(saturation) { b = b*inv(da) + db*inv(a) + B; a = a + da - a*da; } -STAGE(color) { +STAGE(color, Ctx::None) { F R = r*da, G = g*da, B = b*da; @@ -470,7 +463,7 @@ STAGE(color) { b = b*inv(da) + db*inv(a) + B; a = a + da - a*da; } -STAGE(luminosity) { +STAGE(luminosity, Ctx::None) { F R = dr*a, G = dg*a, B = db*a; @@ -484,7 +477,7 @@ STAGE(luminosity) { a = a + da - a*da; } -STAGE(srcover_rgba_8888) { +STAGE(srcover_rgba_8888, const SkJumper_MemoryCtx* ctx) { auto ptr = ptr_at_xy<uint32_t>(ctx, x,y); U32 dst = load<U32>(ptr, tail); @@ -508,76 +501,75 @@ STAGE(srcover_rgba_8888) { store(ptr, dst, tail); } -STAGE(clamp_0) { +STAGE(clamp_0, Ctx::None) { r = max(r, 0); g = max(g, 0); b = max(b, 0); a = max(a, 0); } -STAGE(clamp_1) { +STAGE(clamp_1, Ctx::None) { r = min(r, 1.0f); g = min(g, 1.0f); b = min(b, 1.0f); a = min(a, 1.0f); } -STAGE(clamp_a) { +STAGE(clamp_a, Ctx::None) { a = min(a, 1.0f); r = min(r, a); g = min(g, a); b = min(b, a); } -STAGE(clamp_a_dst) { +STAGE(clamp_a_dst, Ctx::None) { da = min(da, 1.0f); dr = min(dr, da); dg = min(dg, da); db = min(db, da); } -STAGE(set_rgb) { - auto rgb = (const float*)ctx; +STAGE(set_rgb, const float* rgb) { r = rgb[0]; g = rgb[1]; b = rgb[2]; } -STAGE(swap_rb) { +STAGE(swap_rb, Ctx::None) { auto tmp = r; r = b; b = tmp; } -STAGE(invert) { +STAGE(invert, Ctx::None) { r = inv(r); g = inv(g); b = inv(b); a = inv(a); } -STAGE(move_src_dst) { +STAGE(move_src_dst, Ctx::None) { dr = r; dg = g; db = b; da = a; } -STAGE(move_dst_src) { +STAGE(move_dst_src, Ctx::None) { r = dr; g = dg; b = db; a = da; } -STAGE(premul) { +STAGE(premul, Ctx::None) { r = r * a; g = g * a; b = b * a; } -STAGE(premul_dst) { +STAGE(premul_dst, Ctx::None) { dr = dr * da; dg = dg * da; db = db * da; } -STAGE(unpremul) { +STAGE(unpremul, Ctx::None) { auto scale = if_then_else(a == 0, 0, 1.0f / a); r *= scale; g *= scale; @@ -590,17 +582,17 @@ SI F from_srgb(F s) { return if_then_else(s < 0.055f, lo, hi); } -STAGE(from_srgb) { +STAGE(from_srgb, Ctx::None) { r = from_srgb(r); g = from_srgb(g); b = from_srgb(b); } -STAGE(from_srgb_dst) { +STAGE(from_srgb_dst, Ctx::None) { dr = from_srgb(dr); dg = from_srgb(dg); db = from_srgb(db); } -STAGE(to_srgb) { +STAGE(to_srgb, Ctx::None) { auto fn = [&](F l) { // We tweak c and d for each instruction set to make sure fn(1) is exactly 1. #if defined(JUMPER_IS_SSE2) || defined(JUMPER_IS_SSE41) || \ @@ -625,7 +617,7 @@ STAGE(to_srgb) { b = fn(b); } -STAGE(rgb_to_hsl) { +STAGE(rgb_to_hsl, Ctx::None) { F mx = max(r,g,b), mn = min(r,g,b), d = mx - mn, @@ -645,7 +637,7 @@ STAGE(rgb_to_hsl) { g = s; b = l; } -STAGE(hsl_to_rgb) { +STAGE(hsl_to_rgb, Ctx::None) { F h = r, s = g, l = b; @@ -674,15 +666,13 @@ SI F alpha_coverage_from_rgb_coverage(F a, F da, F cr, F cg, F cb) { , max(cr,cg,cb)); } -STAGE(scale_1_float) { - auto c = *(const float*)ctx; - - r = r * c; - g = g * c; - b = b * c; - a = a * c; +STAGE(scale_1_float, const float* c) { + r = r * *c; + g = g * *c; + b = b * *c; + a = a * *c; } -STAGE(scale_u8) { +STAGE(scale_u8, const SkJumper_MemoryCtx* ctx) { auto ptr = ptr_at_xy<const uint8_t>(ctx, x,y); auto scales = load<U8>(ptr, tail); @@ -693,7 +683,7 @@ STAGE(scale_u8) { b = b * c; a = a * c; } -STAGE(scale_565) { +STAGE(scale_565, const SkJumper_MemoryCtx* ctx) { auto ptr = ptr_at_xy<const uint16_t>(ctx, x,y); F cr,cg,cb; @@ -711,15 +701,13 @@ SI F lerp(F from, F to, F t) { return mad(to-from, t, from); } -STAGE(lerp_1_float) { - auto c = *(const float*)ctx; - - r = lerp(dr, r, c); - g = lerp(dg, g, c); - b = lerp(db, b, c); - a = lerp(da, a, c); +STAGE(lerp_1_float, const float* c) { + r = lerp(dr, r, *c); + g = lerp(dg, g, *c); + b = lerp(db, b, *c); + a = lerp(da, a, *c); } -STAGE(lerp_u8) { +STAGE(lerp_u8, const SkJumper_MemoryCtx* ctx) { auto ptr = ptr_at_xy<const uint8_t>(ctx, x,y); auto scales = load<U8>(ptr, tail); @@ -730,7 +718,7 @@ STAGE(lerp_u8) { b = lerp(db, b, c); a = lerp(da, a, c); } -STAGE(lerp_565) { +STAGE(lerp_565, const SkJumper_MemoryCtx* ctx) { auto ptr = ptr_at_xy<const uint16_t>(ctx, x,y); F cr,cg,cb; @@ -744,17 +732,14 @@ STAGE(lerp_565) { a = lerp(da, a, ca); } -STAGE(load_tables) { - auto c = (const SkJumper_LoadTablesCtx*)ctx; - +STAGE(load_tables, const SkJumper_LoadTablesCtx* c) { auto px = load<U32>((const uint32_t*)c->src + x, tail); r = gather(c->r, (px ) & 0xff); g = gather(c->g, (px >> 8) & 0xff); b = gather(c->b, (px >> 16) & 0xff); a = cast( (px >> 24)) * (1/255.0f); } -STAGE(load_tables_u16_be) { - auto c = (const SkJumper_LoadTablesCtx*)ctx; +STAGE(load_tables_u16_be, const SkJumper_LoadTablesCtx* c) { auto ptr = (const uint16_t*)c->src + 4*x; U16 R,G,B,A; @@ -766,8 +751,7 @@ STAGE(load_tables_u16_be) { b = gather(c->b, expand(B) & 0xff); a = (1/65535.0f) * cast(expand(bswap(A))); } -STAGE(load_tables_rgb_u16_be) { - auto c = (const SkJumper_LoadTablesCtx*)ctx; +STAGE(load_tables_rgb_u16_be, const SkJumper_LoadTablesCtx* c) { auto ptr = (const uint16_t*)c->src + 3*x; U16 R,G,B; @@ -780,7 +764,7 @@ STAGE(load_tables_rgb_u16_be) { a = 1.0f; } -STAGE(byte_tables) { +STAGE(byte_tables, const void* ctx) { // TODO: rename Tables SkJumper_ByteTablesCtx struct Tables { const uint8_t *r, *g, *b, *a; }; auto tables = (const Tables*)ctx; @@ -790,7 +774,7 @@ STAGE(byte_tables) { a = from_byte(gather(tables->a, round(a, 255.0f))); } -STAGE(byte_tables_rgb) { +STAGE(byte_tables_rgb, const void* ctx) { // TODO: rename Tables SkJumper_ByteTablesRGBCtx struct Tables { const uint8_t *r, *g, *b; int n; }; auto tables = (const Tables*)ctx; @@ -803,29 +787,28 @@ STAGE(byte_tables_rgb) { SI F table(F v, const SkJumper_TableCtx* ctx) { return gather(ctx->table, round(v, ctx->size - 1)); } -STAGE(table_r) { r = table(r, ctx); } -STAGE(table_g) { g = table(g, ctx); } -STAGE(table_b) { b = table(b, ctx); } -STAGE(table_a) { a = table(a, ctx); } +STAGE(table_r, const SkJumper_TableCtx* ctx) { r = table(r, ctx); } +STAGE(table_g, const SkJumper_TableCtx* ctx) { g = table(g, ctx); } +STAGE(table_b, const SkJumper_TableCtx* ctx) { b = table(b, ctx); } +STAGE(table_a, const SkJumper_TableCtx* ctx) { a = table(a, ctx); } SI F parametric(F v, const SkJumper_ParametricTransferFunction* ctx) { F r = if_then_else(v <= ctx->D, mad(ctx->C, v, ctx->F) , approx_powf(mad(ctx->A, v, ctx->B), ctx->G) + ctx->E); return min(max(r, 0), 1.0f); // Clamp to [0,1], with argument order mattering to handle NaN. } -STAGE(parametric_r) { r = parametric(r, ctx); } -STAGE(parametric_g) { g = parametric(g, ctx); } -STAGE(parametric_b) { b = parametric(b, ctx); } -STAGE(parametric_a) { a = parametric(a, ctx); } +STAGE(parametric_r, const SkJumper_ParametricTransferFunction* ctx) { r = parametric(r, ctx); } +STAGE(parametric_g, const SkJumper_ParametricTransferFunction* ctx) { g = parametric(g, ctx); } +STAGE(parametric_b, const SkJumper_ParametricTransferFunction* ctx) { b = parametric(b, ctx); } +STAGE(parametric_a, const SkJumper_ParametricTransferFunction* ctx) { a = parametric(a, ctx); } -STAGE(gamma) { - float G = *(const float*)ctx; - r = approx_powf(r,G); - g = approx_powf(g,G); - b = approx_powf(b,G); +STAGE(gamma, const float* G) { + r = approx_powf(r, *G); + g = approx_powf(g, *G); + b = approx_powf(b, *G); } -STAGE(lab_to_xyz) { +STAGE(lab_to_xyz, Ctx::None) { F L = r * 100.0f, A = g * 255.0f - 128.0f, B = b * 255.0f - 128.0f; @@ -844,69 +827,69 @@ STAGE(lab_to_xyz) { b = Z * 0.82521f; } -STAGE(load_a8) { +STAGE(load_a8, const SkJumper_MemoryCtx* ctx) { auto ptr = ptr_at_xy<const uint8_t>(ctx, x,y); r = g = b = 0.0f; a = from_byte(load<U8>(ptr, tail)); } -STAGE(load_a8_dst) { +STAGE(load_a8_dst, const SkJumper_MemoryCtx* ctx) { auto ptr = ptr_at_xy<const uint8_t>(ctx, x,y); dr = dg = db = 0.0f; da = from_byte(load<U8>(ptr, tail)); } -STAGE(gather_a8) { +STAGE(gather_a8, const SkJumper_GatherCtx* ctx) { const uint8_t* ptr; U32 ix = ix_and_ptr(&ptr, ctx, r,g); r = g = b = 0.0f; a = from_byte(gather(ptr, ix)); } -STAGE(store_a8) { +STAGE(store_a8, const SkJumper_MemoryCtx* ctx) { auto ptr = ptr_at_xy<uint8_t>(ctx, x,y); U8 packed = pack(pack(round(a, 255.0f))); store(ptr, packed, tail); } -STAGE(load_g8) { +STAGE(load_g8, const SkJumper_MemoryCtx* ctx) { auto ptr = ptr_at_xy<const uint8_t>(ctx, x,y); r = g = b = from_byte(load<U8>(ptr, tail)); a = 1.0f; } -STAGE(load_g8_dst) { +STAGE(load_g8_dst, const SkJumper_MemoryCtx* ctx) { auto ptr = ptr_at_xy<const uint8_t>(ctx, x,y); dr = dg = db = from_byte(load<U8>(ptr, tail)); da = 1.0f; } -STAGE(gather_g8) { +STAGE(gather_g8, const SkJumper_GatherCtx* ctx) { const uint8_t* ptr; U32 ix = ix_and_ptr(&ptr, ctx, r,g); r = g = b = from_byte(gather(ptr, ix)); a = 1.0f; } -STAGE(load_565) { +STAGE(load_565, const SkJumper_MemoryCtx* ctx) { auto ptr = ptr_at_xy<const uint16_t>(ctx, x,y); from_565(load<U16>(ptr, tail), &r,&g,&b); a = 1.0f; } -STAGE(load_565_dst) { +STAGE(load_565_dst, const SkJumper_MemoryCtx* ctx) { auto ptr = ptr_at_xy<const uint16_t>(ctx, x,y); from_565(load<U16>(ptr, tail), &dr,&dg,&db); da = 1.0f; } -STAGE(gather_565) { +STAGE(gather_565, const SkJumper_GatherCtx* ctx) { const uint16_t* ptr; U32 ix = ix_and_ptr(&ptr, ctx, r,g); from_565(gather(ptr, ix), &r,&g,&b); a = 1.0f; } -STAGE(store_565) { +STAGE(store_565, const SkJumper_MemoryCtx* ctx) { auto ptr = ptr_at_xy<uint16_t>(ctx, x,y); U16 px = pack( round(r, 31.0f) << 11 @@ -915,20 +898,20 @@ STAGE(store_565) { store(ptr, px, tail); } -STAGE(load_4444) { +STAGE(load_4444, const SkJumper_MemoryCtx* ctx) { auto ptr = ptr_at_xy<const uint16_t>(ctx, x,y); from_4444(load<U16>(ptr, tail), &r,&g,&b,&a); } -STAGE(load_4444_dst) { +STAGE(load_4444_dst, const SkJumper_MemoryCtx* ctx) { auto ptr = ptr_at_xy<const uint16_t>(ctx, x,y); from_4444(load<U16>(ptr, tail), &dr,&dg,&db,&da); } -STAGE(gather_4444) { +STAGE(gather_4444, const SkJumper_GatherCtx* ctx) { const uint16_t* ptr; U32 ix = ix_and_ptr(&ptr, ctx, r,g); from_4444(gather(ptr, ix), &r,&g,&b,&a); } -STAGE(store_4444) { +STAGE(store_4444, const SkJumper_MemoryCtx* ctx) { auto ptr = ptr_at_xy<uint16_t>(ctx, x,y); U16 px = pack( round(r, 15.0f) << 12 | round(g, 15.0f) << 8 @@ -937,20 +920,20 @@ STAGE(store_4444) { store(ptr, px, tail); } -STAGE(load_8888) { +STAGE(load_8888, const SkJumper_MemoryCtx* ctx) { auto ptr = ptr_at_xy<const uint32_t>(ctx, x,y); from_8888(load<U32>(ptr, tail), &r,&g,&b,&a); } -STAGE(load_8888_dst) { +STAGE(load_8888_dst, const SkJumper_MemoryCtx* ctx) { auto ptr = ptr_at_xy<const uint32_t>(ctx, x,y); from_8888(load<U32>(ptr, tail), &dr,&dg,&db,&da); } -STAGE(gather_8888) { +STAGE(gather_8888, const SkJumper_GatherCtx* ctx) { const uint32_t* ptr; U32 ix = ix_and_ptr(&ptr, ctx, r,g); from_8888(gather(ptr, ix), &r,&g,&b,&a); } -STAGE(store_8888) { +STAGE(store_8888, const SkJumper_MemoryCtx* ctx) { auto ptr = ptr_at_xy<uint32_t>(ctx, x,y); U32 px = round(r, 255.0f) @@ -960,20 +943,20 @@ STAGE(store_8888) { store(ptr, px, tail); } -STAGE(load_bgra) { +STAGE(load_bgra, const SkJumper_MemoryCtx* ctx) { auto ptr = ptr_at_xy<const uint32_t>(ctx, x,y); from_8888(load<U32>(ptr, tail), &b,&g,&r,&a); } -STAGE(load_bgra_dst) { +STAGE(load_bgra_dst, const SkJumper_MemoryCtx* ctx) { auto ptr = ptr_at_xy<const uint32_t>(ctx, x,y); from_8888(load<U32>(ptr, tail), &db,&dg,&dr,&da); } -STAGE(gather_bgra) { +STAGE(gather_bgra, const SkJumper_GatherCtx* ctx) { const uint32_t* ptr; U32 ix = ix_and_ptr(&ptr, ctx, r,g); from_8888(gather(ptr, ix), &b,&g,&r,&a); } -STAGE(store_bgra) { +STAGE(store_bgra, const SkJumper_MemoryCtx* ctx) { auto ptr = ptr_at_xy<uint32_t>(ctx, x,y); U32 px = round(b, 255.0f) @@ -983,7 +966,7 @@ STAGE(store_bgra) { store(ptr, px, tail); } -STAGE(load_f16) { +STAGE(load_f16, const SkJumper_MemoryCtx* ctx) { auto ptr = ptr_at_xy<const uint64_t>(ctx, x,y); U16 R,G,B,A; @@ -993,7 +976,7 @@ STAGE(load_f16) { b = from_half(B); a = from_half(A); } -STAGE(load_f16_dst) { +STAGE(load_f16_dst, const SkJumper_MemoryCtx* ctx) { auto ptr = ptr_at_xy<const uint64_t>(ctx, x,y); U16 R,G,B,A; @@ -1003,7 +986,7 @@ STAGE(load_f16_dst) { db = from_half(B); da = from_half(A); } -STAGE(gather_f16) { +STAGE(gather_f16, const SkJumper_GatherCtx* ctx) { const uint64_t* ptr; U32 ix = ix_and_ptr(&ptr, ctx, r,g); auto px = gather(ptr, ix); @@ -1015,7 +998,7 @@ STAGE(gather_f16) { b = from_half(B); a = from_half(A); } -STAGE(store_f16) { +STAGE(store_f16, const SkJumper_MemoryCtx* ctx) { auto ptr = ptr_at_xy<uint64_t>(ctx, x,y); store4((uint16_t*)ptr,tail, to_half(r) , to_half(g) @@ -1023,7 +1006,7 @@ STAGE(store_f16) { , to_half(a)); } -STAGE(load_u16_be) { +STAGE(load_u16_be, const SkJumper_MemoryCtx* ctx) { auto ptr = ptr_at_xy<const uint16_t>(ctx, 4*x,y); U16 R,G,B,A; @@ -1034,7 +1017,7 @@ STAGE(load_u16_be) { b = (1/65535.0f) * cast(expand(bswap(B))); a = (1/65535.0f) * cast(expand(bswap(A))); } -STAGE(load_rgb_u16_be) { +STAGE(load_rgb_u16_be, const SkJumper_MemoryCtx* ctx) { auto ptr = ptr_at_xy<const uint16_t>(ctx, 3*x,y); U16 R,G,B; @@ -1045,7 +1028,7 @@ STAGE(load_rgb_u16_be) { b = (1/65535.0f) * cast(expand(bswap(B))); a = 1.0f; } -STAGE(store_u16_be) { +STAGE(store_u16_be, const SkJumper_MemoryCtx* ctx) { auto ptr = ptr_at_xy<uint16_t>(ctx, 4*x,y); U16 R = bswap(pack(round(r, 65535.0f))), @@ -1056,15 +1039,15 @@ STAGE(store_u16_be) { store4(ptr,tail, R,G,B,A); } -STAGE(load_f32) { +STAGE(load_f32, const SkJumper_MemoryCtx* ctx) { auto ptr = ptr_at_xy<const float>(ctx, 4*x,y); load4(ptr,tail, &r,&g,&b,&a); } -STAGE(load_f32_dst) { +STAGE(load_f32_dst, const SkJumper_MemoryCtx* ctx) { auto ptr = ptr_at_xy<const float>(ctx, 4*x,y); load4(ptr,tail, &dr,&dg,&db,&da); } -STAGE(store_f32) { +STAGE(store_f32, const SkJumper_MemoryCtx* ctx) { auto ptr = ptr_at_xy<float>(ctx, 4*x,y); store4(ptr,tail, r,g,b,a); } @@ -1080,44 +1063,36 @@ SI F exclusive_mirror(F v, const SkJumper_TileCtx* ctx) { // Tile x or y to [0,limit) == [0,limit - 1 ulp] (think, sampling from images). // The gather stages will hard clamp the output of these stages to [0,limit)... // we just need to do the basic repeat or mirroring. -STAGE(repeat_x) { r = exclusive_repeat(r, (const SkJumper_TileCtx*)ctx); } -STAGE(repeat_y) { g = exclusive_repeat(g, (const SkJumper_TileCtx*)ctx); } -STAGE(mirror_x) { r = exclusive_mirror(r, (const SkJumper_TileCtx*)ctx); } -STAGE(mirror_y) { g = exclusive_mirror(g, (const SkJumper_TileCtx*)ctx); } +STAGE(repeat_x, const SkJumper_TileCtx* ctx) { r = exclusive_repeat(r, ctx); } +STAGE(repeat_y, const SkJumper_TileCtx* ctx) { g = exclusive_repeat(g, ctx); } +STAGE(mirror_x, const SkJumper_TileCtx* ctx) { r = exclusive_mirror(r, ctx); } +STAGE(mirror_y, const SkJumper_TileCtx* ctx) { g = exclusive_mirror(g, ctx); } // Clamp x to [0,1], both sides exclusive (think, gradients). -STAGE( clamp_x_1) { r = min(max(0, r), 1.0f); } -STAGE(repeat_x_1) { r = r - floor_(r); } -STAGE(mirror_x_1) { r = abs_( (r-1.0f) - two(floor_((r-1.0f)*0.5f)) - 1.0f ); } +STAGE( clamp_x_1, Ctx::None) { r = min(max(0, r), 1.0f); } +STAGE(repeat_x_1, Ctx::None) { r = r - floor_(r); } +STAGE(mirror_x_1, Ctx::None) { r = abs_( (r-1.0f) - two(floor_((r-1.0f)*0.5f)) - 1.0f ); } -STAGE(luminance_to_alpha) { +STAGE(luminance_to_alpha, Ctx::None) { a = r*0.2126f + g*0.7152f + b*0.0722f; r = g = b = 0; } -STAGE(matrix_translate) { - auto m = (const float*)ctx; - +STAGE(matrix_translate, const float* m) { r += m[0]; g += m[1]; } -STAGE(matrix_scale_translate) { - auto m = (const float*)ctx; - +STAGE(matrix_scale_translate, const float* m) { r = mad(r,m[2], m[0]); g = mad(g,m[3], m[1]); } -STAGE(matrix_2x3) { - auto m = (const float*)ctx; - +STAGE(matrix_2x3, const float* m) { auto R = mad(r,m[0], mad(g,m[2], m[4])), G = mad(r,m[1], mad(g,m[3], m[5])); r = R; g = G; } -STAGE(matrix_3x4) { - auto m = (const float*)ctx; - +STAGE(matrix_3x4, const float* m) { auto R = mad(r,m[0], mad(g,m[3], mad(b,m[6], m[ 9]))), G = mad(r,m[1], mad(g,m[4], mad(b,m[7], m[10]))), B = mad(r,m[2], mad(g,m[5], mad(b,m[8], m[11]))); @@ -1125,9 +1100,7 @@ STAGE(matrix_3x4) { g = G; b = B; } -STAGE(matrix_4x5) { - auto m = (const float*)ctx; - +STAGE(matrix_4x5, const float* m) { auto R = mad(r,m[0], mad(g,m[4], mad(b,m[ 8], mad(a,m[12], m[16])))), G = mad(r,m[1], mad(g,m[5], mad(b,m[ 9], mad(a,m[13], m[17])))), B = mad(r,m[2], mad(g,m[6], mad(b,m[10], mad(a,m[14], m[18])))), @@ -1137,8 +1110,7 @@ STAGE(matrix_4x5) { b = B; a = A; } -STAGE(matrix_4x3) { - auto m = (const float*)ctx; +STAGE(matrix_4x3, const float* m) { auto X = r, Y = g; @@ -1147,10 +1119,8 @@ STAGE(matrix_4x3) { b = mad(X, m[2], mad(Y, m[6], m[10])); a = mad(X, m[3], mad(Y, m[7], m[11])); } -STAGE(matrix_perspective) { +STAGE(matrix_perspective, const float* m) { // N.B. Unlike the other matrix_ stages, this matrix is row-major. - auto m = (const float*)ctx; - auto R = mad(r,m[0], mad(g,m[1], m[2])), G = mad(r,m[3], mad(g,m[4], m[5])), Z = mad(r,m[6], mad(g,m[7], m[8])); @@ -1190,14 +1160,14 @@ SI void gradient_lookup(const SkJumper_GradientCtx* c, U32 idx, F t, *a = mad(t, fa, ba); } -STAGE(evenly_spaced_gradient) { - auto c = (const SkJumper_GradientCtx*)ctx; +STAGE(evenly_spaced_gradient, const SkJumper_GradientCtx* c) { auto t = r; auto idx = trunc_(t * (c->stopCount-1)); gradient_lookup(c, idx, t, &r, &g, &b, &a); } -STAGE(gauss_a_to_rgba) { +// TODO: move this somewhere not in the middle of the gradients... +STAGE(gauss_a_to_rgba, Ctx::None) { // x = 1 - x; // exp(-x * x * 4) - 0.018f; // ... now approximate with quartic @@ -1213,8 +1183,7 @@ STAGE(gauss_a_to_rgba) { b = a; } -STAGE(gradient) { - auto c = (const SkJumper_GradientCtx*)ctx; +STAGE(gradient, const SkJumper_GradientCtx* c) { auto t = r; U32 idx = 0; @@ -1226,7 +1195,8 @@ STAGE(gradient) { gradient_lookup(c, idx, t, &r, &g, &b, &a); } -STAGE(evenly_spaced_2_stop_gradient) { +STAGE(evenly_spaced_2_stop_gradient, const void* ctx) { + // TODO: Rename Ctx SkJumper_EvenlySpacedGradientCtx. struct Ctx { float f[4], b[4]; }; auto c = (const Ctx*)ctx; @@ -1237,7 +1207,7 @@ STAGE(evenly_spaced_2_stop_gradient) { a = mad(t, c->f[3], c->b[3]); } -STAGE(xy_to_unit_angle) { +STAGE(xy_to_unit_angle, Ctx::None) { F X = r, Y = g; F xabs = abs_(X), @@ -1263,7 +1233,7 @@ STAGE(xy_to_unit_angle) { r = phi; } -STAGE(xy_to_radius) { +STAGE(xy_to_radius, Ctx::None) { F X2 = r * r, Y2 = g * g; r = sqrt_(X2 + Y2); @@ -1302,26 +1272,22 @@ SI F solve_2pt_conical_quadratic(const SkJumper_2PtConicalCtx* c, F x, F y, F (* (-coeffB - sqrt_disc) * (invCoeffA * 0.5f)); } -STAGE(xy_to_2pt_conical_quadratic_max) { +STAGE(xy_to_2pt_conical_quadratic_max, const SkJumper_2PtConicalCtx* ctx) { r = solve_2pt_conical_quadratic(ctx, r, g, max); } -STAGE(xy_to_2pt_conical_quadratic_min) { +STAGE(xy_to_2pt_conical_quadratic_min, const SkJumper_2PtConicalCtx* ctx) { r = solve_2pt_conical_quadratic(ctx, r, g, min); } -STAGE(xy_to_2pt_conical_linear) { - auto* c = (const SkJumper_2PtConicalCtx*)ctx; - +STAGE(xy_to_2pt_conical_linear, const SkJumper_2PtConicalCtx* c) { const F coeffB = -2 * (r + c->fDR*c->fR0), coeffC = r*r + g*g - c->fR0*c->fR0; r = -coeffC / coeffB; } -STAGE(mask_2pt_conical_degenerates) { - auto* c = (SkJumper_2PtConicalCtx*)ctx; - +STAGE(mask_2pt_conical_degenerates, SkJumper_2PtConicalCtx* c) { // The gradient t coordinate is in the r register right now. F& t = r; @@ -1329,22 +1295,19 @@ STAGE(mask_2pt_conical_degenerates) { // and save a mask to ignore those colors in apply_vector_mask. auto is_degenerate = (mad(t, c->fDR, c->fR0) < 0) // Radius(t) < 0 | (t != t); // t == NaN - t = if_then_else(is_degenerate, F(0), t); unaligned_store(&c->fMask, if_then_else(is_degenerate, U32(0), U32(0xffffffff))); } -STAGE(apply_vector_mask) { - const U32 mask = unaligned_load<U32>((const uint32_t*)ctx); +STAGE(apply_vector_mask, const uint32_t* ctx) { + const U32 mask = unaligned_load<U32>(ctx); r = bit_cast<F>(bit_cast<U32>(r) & mask); g = bit_cast<F>(bit_cast<U32>(g) & mask); b = bit_cast<F>(bit_cast<U32>(b) & mask); a = bit_cast<F>(bit_cast<U32>(a) & mask); } -STAGE(save_xy) { - auto c = (SkJumper_SamplerCtx*)ctx; - +STAGE(save_xy, SkJumper_SamplerCtx* c) { // Whether bilinear or bicubic, all sample points are at the same fractional offset (fx,fy). // They're either the 4 corners of a logical 1x1 pixel or the 16 corners of a 3x3 grid // surrounding (x,y) at (0.5,0.5) off-center. @@ -1358,9 +1321,7 @@ STAGE(save_xy) { unaligned_store(c->fy, fy); } -STAGE(accumulate) { - auto c = (const SkJumper_SamplerCtx*)ctx; - +STAGE(accumulate, const SkJumper_SamplerCtx* c) { // Bilinear and bicubic filters are both separable, so we produce independent contributions // from x and y, multiplying them together here to get each pixel's total scale factor. auto scale = unaligned_load<F>(c->scalex) @@ -1397,10 +1358,10 @@ SI void bilinear_y(SkJumper_SamplerCtx* ctx, F* y) { unaligned_store(ctx->scaley, scaley); } -STAGE(bilinear_nx) { bilinear_x<-1>(ctx, &r); } -STAGE(bilinear_px) { bilinear_x<+1>(ctx, &r); } -STAGE(bilinear_ny) { bilinear_y<-1>(ctx, &g); } -STAGE(bilinear_py) { bilinear_y<+1>(ctx, &g); } +STAGE(bilinear_nx, SkJumper_SamplerCtx* ctx) { bilinear_x<-1>(ctx, &r); } +STAGE(bilinear_px, SkJumper_SamplerCtx* ctx) { bilinear_x<+1>(ctx, &r); } +STAGE(bilinear_ny, SkJumper_SamplerCtx* ctx) { bilinear_y<-1>(ctx, &g); } +STAGE(bilinear_py, SkJumper_SamplerCtx* ctx) { bilinear_y<+1>(ctx, &g); } // In bicubic interpolation, the 16 pixels and +/- 0.5 and +/- 1.5 offsets from the sample @@ -1443,18 +1404,17 @@ SI void bicubic_y(SkJumper_SamplerCtx* ctx, F* y) { unaligned_store(ctx->scaley, scaley); } -STAGE(bicubic_n3x) { bicubic_x<-3>(ctx, &r); } -STAGE(bicubic_n1x) { bicubic_x<-1>(ctx, &r); } -STAGE(bicubic_p1x) { bicubic_x<+1>(ctx, &r); } -STAGE(bicubic_p3x) { bicubic_x<+3>(ctx, &r); } +STAGE(bicubic_n3x, SkJumper_SamplerCtx* ctx) { bicubic_x<-3>(ctx, &r); } +STAGE(bicubic_n1x, SkJumper_SamplerCtx* ctx) { bicubic_x<-1>(ctx, &r); } +STAGE(bicubic_p1x, SkJumper_SamplerCtx* ctx) { bicubic_x<+1>(ctx, &r); } +STAGE(bicubic_p3x, SkJumper_SamplerCtx* ctx) { bicubic_x<+3>(ctx, &r); } -STAGE(bicubic_n3y) { bicubic_y<-3>(ctx, &g); } -STAGE(bicubic_n1y) { bicubic_y<-1>(ctx, &g); } -STAGE(bicubic_p1y) { bicubic_y<+1>(ctx, &g); } -STAGE(bicubic_p3y) { bicubic_y<+3>(ctx, &g); } +STAGE(bicubic_n3y, SkJumper_SamplerCtx* ctx) { bicubic_y<-3>(ctx, &g); } +STAGE(bicubic_n1y, SkJumper_SamplerCtx* ctx) { bicubic_y<-1>(ctx, &g); } +STAGE(bicubic_p1y, SkJumper_SamplerCtx* ctx) { bicubic_y<+1>(ctx, &g); } +STAGE(bicubic_p3y, SkJumper_SamplerCtx* ctx) { bicubic_y<+3>(ctx, &g); } -STAGE(callback) { - auto c = (SkJumper_CallbackCtx*)ctx; +STAGE(callback, SkJumper_CallbackCtx* c) { store4(c->rgba,0, r,g,b,a); c->fn(c, tail ? tail : N); load4(c->read_from,0, &r,&g,&b,&a); @@ -1502,11 +1462,11 @@ inline void color_lookup_table<0>(const SkJumper_ColorLookupTableCtx* ctx, b = gather(ctx->table, 3*index+2); } -STAGE(clut_3D) { +STAGE(clut_3D, const SkJumper_ColorLookupTableCtx* ctx) { color_lookup_table<3>(ctx, r,g,b,a, 0,1); // This 3D color lookup table leaves alpha alone. } -STAGE(clut_4D) { +STAGE(clut_4D, const SkJumper_ColorLookupTableCtx* ctx) { color_lookup_table<4>(ctx, r,g,b,a, 0,1); // "a" was really CMYK's K, so we just set alpha opaque. a = 1.0f; |