aboutsummaryrefslogtreecommitdiffhomepage
path: root/src
diff options
context:
space:
mode:
Diffstat (limited to 'src')
-rw-r--r--src/core/SkRasterPipelineBlitter.cpp59
-rw-r--r--src/jumper/SkJumper_generated.S2823
-rw-r--r--src/jumper/SkJumper_generated_win.S2784
-rw-r--r--src/jumper/SkJumper_stages.cpp17
4 files changed, 2834 insertions, 2849 deletions
diff --git a/src/core/SkRasterPipelineBlitter.cpp b/src/core/SkRasterPipelineBlitter.cpp
index 576ba4ba19..d18decd1cd 100644
--- a/src/core/SkRasterPipelineBlitter.cpp
+++ b/src/core/SkRasterPipelineBlitter.cpp
@@ -60,10 +60,11 @@ private:
// These values are pointed to by the blit pipelines above,
// which allows us to adjust them from call to call.
- void* fDstPtr = nullptr;
- const void* fMaskPtr = nullptr;
- float fCurrentCoverage = 0.0f;
- int fCurrentY = 0;
+ void* fDstPtr = nullptr;
+ const void* fMaskPtr = nullptr;
+ float fCurrentCoverage = 0.0f;
+ int fCurrentY = 0;
+ SkJumper_DitherCtx fDitherCtx = { &fCurrentY, 0.0f };
typedef SkBlitter INHERITED;
};
@@ -107,8 +108,21 @@ SkBlitter* SkRasterPipelineBlitter::Create(const SkPixmap& dst,
return nullptr;
}
+ // TODO: Think more about under what conditions we dither:
+ // - if we're drawing anything into 565 and the user has asked us to dither, or
+ // - if we're drawing a gradient into 565 or 8888.
+ if ((paint.isDither() && dst.info().colorType() == kRGB_565_SkColorType) ||
+ (shader && shader->asAGradient(nullptr) >= SkShader::kLinear_GradientType)) {
+ switch (dst.info().colorType()) {
+ default: blitter->fDitherCtx.rate = 0.0f; break;
+ case kRGB_565_SkColorType: blitter->fDitherCtx.rate = 1/63.0f; break;
+ case kRGBA_8888_SkColorType:
+ case kBGRA_8888_SkColorType: blitter->fDitherCtx.rate = 1/255.0f; break;
+ }
+ }
+
bool is_opaque = paintColor->a() == 1.0f,
- is_constant = true;
+ is_constant = blitter->fDitherCtx.rate == 0.0f;
if (shader) {
pipeline->append(SkRasterPipeline::seed_shader, &blitter->fCurrentY);
if (!shader->appendStages(pipeline, dst.colorSpace(), alloc, ctm, paint)) {
@@ -119,8 +133,8 @@ SkBlitter* SkRasterPipelineBlitter::Create(const SkPixmap& dst,
&paintColor->fVec[SkPM4f::A]);
}
- is_opaque = is_opaque && shader->isOpaque();
- is_constant = shader->isConstant();
+ is_opaque = is_opaque && shader->isOpaque();
+ is_constant = is_constant && shader->isConstant();
} else {
pipeline->append(SkRasterPipeline::constant_color, paintColor);
}
@@ -132,30 +146,6 @@ SkBlitter* SkRasterPipelineBlitter::Create(const SkPixmap& dst,
is_opaque = is_opaque && (colorFilter->getFlags() & SkColorFilter::kAlphaUnchanged_Flag);
}
- // TODO: Think more about under what conditions we dither:
- // - if we're drawing anything into 565 and the user has asked us to dither, or
- // - if we're drawing a gradient into 565 or 8888.
- // TODO: move this later in the pipeline, perhaps the first thing we do in append_store()?
- if ((paint.isDither() && dst.info().colorType() == kRGB_565_SkColorType) ||
- (shader && shader->asAGradient(nullptr) >= SkShader::kLinear_GradientType)) {
- float rate;
- switch (dst.info().colorType()) {
- case kRGB_565_SkColorType: rate = 1/63.0f; break;
- case kBGRA_8888_SkColorType:
- case kRGBA_8888_SkColorType: rate = 1/255.0f; break;
- default: rate = 0.0f; break;
- }
- if (rate) {
- auto ctx = alloc->make<SkJumper_DitherCtx>();
- ctx->y = &blitter->fCurrentY;
- ctx->rate = rate;
- pipeline->append(SkRasterPipeline::dither, ctx);
- pipeline->append(SkRasterPipeline::clamp_0);
- pipeline->append(SkRasterPipeline::clamp_a);
- is_constant = false;
- }
- }
-
if (is_constant) {
pipeline->append(SkRasterPipeline::store_f32, &paintColor);
pipeline->run(0,1);
@@ -208,10 +198,15 @@ void SkRasterPipelineBlitter::append_store(SkRasterPipeline* p) const {
if (fDst.info().gammaCloseToSRGB()) {
p->append(SkRasterPipeline::to_srgb);
}
+ if (fDitherCtx.rate > 0.0f) {
+ // We dither after any sRGB transfer function to make sure our 1/255.0f is sensible
+ // over the whole range. If we did it before, 1/255.0f is too big a rate near zero.
+ p->append(SkRasterPipeline::dither, &fDitherCtx);
+ }
+
if (fDst.info().colorType() == kBGRA_8888_SkColorType) {
p->append(SkRasterPipeline::swap_rb);
}
-
SkASSERT(supported(fDst.info()));
switch (fDst.info().colorType()) {
case kAlpha_8_SkColorType: p->append(SkRasterPipeline::store_a8, &fDstPtr); break;
diff --git a/src/jumper/SkJumper_generated.S b/src/jumper/SkJumper_generated.S
index 71afcd85a9..72860b734b 100644
--- a/src/jumper/SkJumper_generated.S
+++ b/src/jumper/SkJumper_generated.S
@@ -121,18 +121,17 @@ _sk_dither_aarch64:
.long 0x4e331e10 // and v16.16b, v16.16b, v19.16b
.long 0x4f225694 // shl v20.4s, v20.4s, #2
.long 0x4eb21e31 // orr v17.16b, v17.16b, v18.16b
- .long 0x52a79049 // mov w9, #0x3c820000
+ .long 0x52a79009 // mov w9, #0x3c800000
.long 0xbd400913 // ldr s19, [x8, #8]
.long 0x6f3f0610 // ushr v16.4s, v16.4s, #1
.long 0x4eb41e31 // orr v17.16b, v17.16b, v20.16b
- .long 0x72810429 // movk w9, #0x821
- .long 0x4eb01e30 // orr v16.16b, v17.16b, v16.16b
.long 0x4e040d36 // dup v22.4s, w9
- .long 0x4f0567f5 // movi v21.4s, #0xbf, lsl #24
+ .long 0x52b7df89 // mov w9, #0xbefc0000
+ .long 0x4eb01e30 // orr v16.16b, v17.16b, v16.16b
+ .long 0x4e040d35 // dup v21.4s, w9
.long 0x4e21da10 // scvtf v16.4s, v16.4s
.long 0x4e30ced5 // fmla v21.4s, v22.4s, v16.4s
.long 0x4f9392b0 // fmul v16.4s, v21.4s, v19.s[0]
- .long 0x6e23de10 // fmul v16.4s, v16.4s, v3.4s
.long 0x4e20d600 // fadd v0.4s, v16.4s, v0.4s
.long 0x4e21d601 // fadd v1.4s, v16.4s, v1.4s
.long 0x4e22d602 // fadd v2.4s, v16.4s, v2.4s
@@ -2251,9 +2250,9 @@ FUNCTION(_sk_gather_i8_aarch64)
_sk_gather_i8_aarch64:
.long 0xaa0103e8 // mov x8, x1
.long 0xf8408429 // ldr x9, [x1], #8
- .long 0xb4000069 // cbz x9, 1da0 <sk_gather_i8_aarch64+0x14>
+ .long 0xb4000069 // cbz x9, 1d9c <sk_gather_i8_aarch64+0x14>
.long 0xaa0903ea // mov x10, x9
- .long 0x14000003 // b 1da8 <sk_gather_i8_aarch64+0x1c>
+ .long 0x14000003 // b 1da4 <sk_gather_i8_aarch64+0x1c>
.long 0xf940050a // ldr x10, [x8, #8]
.long 0x91004101 // add x1, x8, #0x10
.long 0xf8410548 // ldr x8, [x10], #16
@@ -3102,7 +3101,7 @@ _sk_linear_gradient_aarch64:
.long 0x4d40c902 // ld1r {v2.4s}, [x8]
.long 0xf9400128 // ldr x8, [x9]
.long 0x4d40c943 // ld1r {v3.4s}, [x10]
- .long 0xb40006c8 // cbz x8, 2974 <sk_linear_gradient_aarch64+0x100>
+ .long 0xb40006c8 // cbz x8, 2970 <sk_linear_gradient_aarch64+0x100>
.long 0x6dbf23e9 // stp d9, d8, [sp, #-16]!
.long 0xf9400529 // ldr x9, [x9, #8]
.long 0x6f00e413 // movi v19.2d, #0x0
@@ -3153,9 +3152,9 @@ _sk_linear_gradient_aarch64:
.long 0xd1000508 // sub x8, x8, #0x1
.long 0x6e771fd0 // bsl v16.16b, v30.16b, v23.16b
.long 0x91009129 // add x9, x9, #0x24
- .long 0xb5fffaa8 // cbnz x8, 28bc <sk_linear_gradient_aarch64+0x48>
+ .long 0xb5fffaa8 // cbnz x8, 28b8 <sk_linear_gradient_aarch64+0x48>
.long 0x6cc123e9 // ldp d9, d8, [sp], #16
- .long 0x14000005 // b 2984 <sk_linear_gradient_aarch64+0x110>
+ .long 0x14000005 // b 2980 <sk_linear_gradient_aarch64+0x110>
.long 0x6f00e414 // movi v20.2d, #0x0
.long 0x6f00e412 // movi v18.2d, #0x0
.long 0x6f00e411 // movi v17.2d, #0x0
@@ -3631,16 +3630,17 @@ HIDDEN _sk_dither_vfp4
.globl _sk_dither_vfp4
FUNCTION(_sk_dither_vfp4)
_sk_dither_vfp4:
- .long 0xe92d4800 // push {fp, lr}
+ .long 0xe92d4010 // push {r4, lr}
.long 0xee800b90 // vdup.32 d16, r0
.long 0xf2c02012 // vmov.i32 d18, #2
.long 0xf3fb0620 // vcvt.f32.s32 d16, d16
.long 0xedd21b00 // vldr d17, [r2]
- .long 0xe8911008 // ldm r1, {r3, ip}
+ .long 0xe8911010 // ldm r1, {r4, ip}
.long 0xf2c03014 // vmov.i32 d19, #4
+ .long 0xe3a035f2 // mov r3, #1015021568
.long 0xe2811008 // add r1, r1, #8
.long 0xf2400da1 // vadd.f32 d16, d16, d17
- .long 0xe493e004 // ldr lr, [r3], #4
+ .long 0xe494e004 // ldr lr, [r4], #4
.long 0xf2c01011 // vmov.i32 d17, #1
.long 0xf4ee5c9f // vld1.32 {d21[]}, [lr :32]
.long 0xf3fb0720 // vcvt.s32.f32 d16, d16
@@ -3662,21 +3662,20 @@ _sk_dither_vfp4:
.long 0xf3ff1033 // vshr.u32 d17, d19, #1
.long 0xf26001b2 // vorr d16, d16, d18
.long 0xf26001b1 // vorr d16, d16, d17
- .long 0xeddf1b0b // vldr d17, [pc, #44]
+ .long 0xee813b90 // vdup.32 d17, r3
.long 0xf3fb0620 // vcvt.f32.s32 d16, d16
.long 0xf3400db1 // vmul.f32 d16, d16, d17
- .long 0xf3c3161f // vmov.i32 d17, #-1090519040
+ .long 0xeddf1b07 // vldr d17, [pc, #28]
.long 0xf2400da1 // vadd.f32 d16, d16, d17
- .long 0xf4e31c9f // vld1.32 {d17[]}, [r3 :32]
+ .long 0xf4e41c9f // vld1.32 {d17[]}, [r4 :32]
.long 0xf3410db0 // vmul.f32 d16, d17, d16
- .long 0xf3400d93 // vmul.f32 d16, d16, d3
.long 0xf2000d80 // vadd.f32 d0, d16, d0
.long 0xf2001d81 // vadd.f32 d1, d16, d1
.long 0xf2002d82 // vadd.f32 d2, d16, d2
- .long 0xe8bd4800 // pop {fp, lr}
+ .long 0xe8bd4010 // pop {r4, lr}
.long 0xe12fff1c // bx ip
- .long 0x3c820821 // .word 0x3c820821
- .long 0x3c820821 // .word 0x3c820821
+ .long 0xbefc0000 // .word 0xbefc0000
+ .long 0xbefc0000 // .word 0xbefc0000
HIDDEN _sk_constant_color_vfp4
.globl _sk_constant_color_vfp4
@@ -7535,14 +7534,14 @@ _sk_seed_shader_hsw:
.byte 197,249,110,199 // vmovd %edi,%xmm0
.byte 196,226,125,88,192 // vpbroadcastd %xmm0,%ymm0
.byte 197,252,91,192 // vcvtdq2ps %ymm0,%ymm0
- .byte 196,226,125,24,13,173,61,0,0 // vbroadcastss 0x3dad(%rip),%ymm1 # 3e70 <_sk_callback_hsw+0x127>
+ .byte 196,226,125,24,13,169,61,0,0 // vbroadcastss 0x3da9(%rip),%ymm1 # 3e6c <_sk_callback_hsw+0x127>
.byte 197,252,88,193 // vaddps %ymm1,%ymm0,%ymm0
.byte 197,252,88,2 // vaddps (%rdx),%ymm0,%ymm0
.byte 196,226,125,24,16 // vbroadcastss (%rax),%ymm2
.byte 197,252,91,210 // vcvtdq2ps %ymm2,%ymm2
.byte 197,236,88,201 // vaddps %ymm1,%ymm2,%ymm1
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 196,226,125,24,21,145,61,0,0 // vbroadcastss 0x3d91(%rip),%ymm2 # 3e74 <_sk_callback_hsw+0x12b>
+ .byte 196,226,125,24,21,141,61,0,0 // vbroadcastss 0x3d8d(%rip),%ymm2 # 3e70 <_sk_callback_hsw+0x12b>
.byte 197,228,87,219 // vxorps %ymm3,%ymm3,%ymm3
.byte 197,220,87,228 // vxorps %ymm4,%ymm4,%ymm4
.byte 197,212,87,237 // vxorps %ymm5,%ymm5,%ymm5
@@ -7563,13 +7562,13 @@ _sk_dither_hsw:
.byte 76,139,0 // mov (%rax),%r8
.byte 196,66,125,88,8 // vpbroadcastd (%r8),%ymm9
.byte 196,65,61,239,201 // vpxor %ymm9,%ymm8,%ymm9
- .byte 196,98,125,88,21,80,61,0,0 // vpbroadcastd 0x3d50(%rip),%ymm10 # 3e78 <_sk_callback_hsw+0x12f>
+ .byte 196,98,125,88,21,76,61,0,0 // vpbroadcastd 0x3d4c(%rip),%ymm10 # 3e74 <_sk_callback_hsw+0x12f>
.byte 196,65,53,219,218 // vpand %ymm10,%ymm9,%ymm11
.byte 196,193,37,114,243,5 // vpslld $0x5,%ymm11,%ymm11
.byte 196,65,61,219,210 // vpand %ymm10,%ymm8,%ymm10
.byte 196,193,45,114,242,4 // vpslld $0x4,%ymm10,%ymm10
- .byte 196,98,125,88,37,53,61,0,0 // vpbroadcastd 0x3d35(%rip),%ymm12 # 3e7c <_sk_callback_hsw+0x133>
- .byte 196,98,125,88,45,48,61,0,0 // vpbroadcastd 0x3d30(%rip),%ymm13 # 3e80 <_sk_callback_hsw+0x137>
+ .byte 196,98,125,88,37,49,61,0,0 // vpbroadcastd 0x3d31(%rip),%ymm12 # 3e78 <_sk_callback_hsw+0x133>
+ .byte 196,98,125,88,45,44,61,0,0 // vpbroadcastd 0x3d2c(%rip),%ymm13 # 3e7c <_sk_callback_hsw+0x137>
.byte 196,65,53,219,245 // vpand %ymm13,%ymm9,%ymm14
.byte 196,193,13,114,246,2 // vpslld $0x2,%ymm14,%ymm14
.byte 196,65,61,219,237 // vpand %ymm13,%ymm8,%ymm13
@@ -7584,12 +7583,11 @@ _sk_dither_hsw:
.byte 196,65,61,235,194 // vpor %ymm10,%ymm8,%ymm8
.byte 196,65,61,235,193 // vpor %ymm9,%ymm8,%ymm8
.byte 196,65,124,91,192 // vcvtdq2ps %ymm8,%ymm8
- .byte 196,98,125,24,13,226,60,0,0 // vbroadcastss 0x3ce2(%rip),%ymm9 # 3e84 <_sk_callback_hsw+0x13b>
- .byte 196,98,125,24,21,221,60,0,0 // vbroadcastss 0x3cdd(%rip),%ymm10 # 3e88 <_sk_callback_hsw+0x13f>
+ .byte 196,98,125,24,13,222,60,0,0 // vbroadcastss 0x3cde(%rip),%ymm9 # 3e80 <_sk_callback_hsw+0x13b>
+ .byte 196,98,125,24,21,217,60,0,0 // vbroadcastss 0x3cd9(%rip),%ymm10 # 3e84 <_sk_callback_hsw+0x13f>
.byte 196,66,61,184,209 // vfmadd231ps %ymm9,%ymm8,%ymm10
.byte 196,98,125,24,64,8 // vbroadcastss 0x8(%rax),%ymm8
.byte 196,65,60,89,194 // vmulps %ymm10,%ymm8,%ymm8
- .byte 197,60,89,195 // vmulps %ymm3,%ymm8,%ymm8
.byte 197,188,88,192 // vaddps %ymm0,%ymm8,%ymm0
.byte 197,188,88,201 // vaddps %ymm1,%ymm8,%ymm1
.byte 197,188,88,210 // vaddps %ymm2,%ymm8,%ymm2
@@ -7624,7 +7622,7 @@ HIDDEN _sk_srcatop_hsw
FUNCTION(_sk_srcatop_hsw)
_sk_srcatop_hsw:
.byte 197,252,89,199 // vmulps %ymm7,%ymm0,%ymm0
- .byte 196,98,125,24,5,127,60,0,0 // vbroadcastss 0x3c7f(%rip),%ymm8 # 3e8c <_sk_callback_hsw+0x143>
+ .byte 196,98,125,24,5,127,60,0,0 // vbroadcastss 0x3c7f(%rip),%ymm8 # 3e88 <_sk_callback_hsw+0x143>
.byte 197,60,92,195 // vsubps %ymm3,%ymm8,%ymm8
.byte 196,226,61,184,196 // vfmadd231ps %ymm4,%ymm8,%ymm0
.byte 197,244,89,207 // vmulps %ymm7,%ymm1,%ymm1
@@ -7640,7 +7638,7 @@ HIDDEN _sk_dstatop_hsw
.globl _sk_dstatop_hsw
FUNCTION(_sk_dstatop_hsw)
_sk_dstatop_hsw:
- .byte 196,98,125,24,5,82,60,0,0 // vbroadcastss 0x3c52(%rip),%ymm8 # 3e90 <_sk_callback_hsw+0x147>
+ .byte 196,98,125,24,5,82,60,0,0 // vbroadcastss 0x3c52(%rip),%ymm8 # 3e8c <_sk_callback_hsw+0x147>
.byte 197,60,92,199 // vsubps %ymm7,%ymm8,%ymm8
.byte 197,188,89,192 // vmulps %ymm0,%ymm8,%ymm0
.byte 196,226,101,184,196 // vfmadd231ps %ymm4,%ymm3,%ymm0
@@ -7679,7 +7677,7 @@ HIDDEN _sk_srcout_hsw
.globl _sk_srcout_hsw
FUNCTION(_sk_srcout_hsw)
_sk_srcout_hsw:
- .byte 196,98,125,24,5,249,59,0,0 // vbroadcastss 0x3bf9(%rip),%ymm8 # 3e94 <_sk_callback_hsw+0x14b>
+ .byte 196,98,125,24,5,249,59,0,0 // vbroadcastss 0x3bf9(%rip),%ymm8 # 3e90 <_sk_callback_hsw+0x14b>
.byte 197,60,92,199 // vsubps %ymm7,%ymm8,%ymm8
.byte 197,188,89,192 // vmulps %ymm0,%ymm8,%ymm0
.byte 197,188,89,201 // vmulps %ymm1,%ymm8,%ymm1
@@ -7692,7 +7690,7 @@ HIDDEN _sk_dstout_hsw
.globl _sk_dstout_hsw
FUNCTION(_sk_dstout_hsw)
_sk_dstout_hsw:
- .byte 196,226,125,24,5,220,59,0,0 // vbroadcastss 0x3bdc(%rip),%ymm0 # 3e98 <_sk_callback_hsw+0x14f>
+ .byte 196,226,125,24,5,220,59,0,0 // vbroadcastss 0x3bdc(%rip),%ymm0 # 3e94 <_sk_callback_hsw+0x14f>
.byte 197,252,92,219 // vsubps %ymm3,%ymm0,%ymm3
.byte 197,228,89,196 // vmulps %ymm4,%ymm3,%ymm0
.byte 197,228,89,205 // vmulps %ymm5,%ymm3,%ymm1
@@ -7705,7 +7703,7 @@ HIDDEN _sk_srcover_hsw
.globl _sk_srcover_hsw
FUNCTION(_sk_srcover_hsw)
_sk_srcover_hsw:
- .byte 196,98,125,24,5,191,59,0,0 // vbroadcastss 0x3bbf(%rip),%ymm8 # 3e9c <_sk_callback_hsw+0x153>
+ .byte 196,98,125,24,5,191,59,0,0 // vbroadcastss 0x3bbf(%rip),%ymm8 # 3e98 <_sk_callback_hsw+0x153>
.byte 197,60,92,195 // vsubps %ymm3,%ymm8,%ymm8
.byte 196,194,93,184,192 // vfmadd231ps %ymm8,%ymm4,%ymm0
.byte 196,194,85,184,200 // vfmadd231ps %ymm8,%ymm5,%ymm1
@@ -7718,7 +7716,7 @@ HIDDEN _sk_dstover_hsw
.globl _sk_dstover_hsw
FUNCTION(_sk_dstover_hsw)
_sk_dstover_hsw:
- .byte 196,98,125,24,5,158,59,0,0 // vbroadcastss 0x3b9e(%rip),%ymm8 # 3ea0 <_sk_callback_hsw+0x157>
+ .byte 196,98,125,24,5,158,59,0,0 // vbroadcastss 0x3b9e(%rip),%ymm8 # 3e9c <_sk_callback_hsw+0x157>
.byte 197,60,92,199 // vsubps %ymm7,%ymm8,%ymm8
.byte 196,226,61,168,196 // vfmadd213ps %ymm4,%ymm8,%ymm0
.byte 196,226,61,168,205 // vfmadd213ps %ymm5,%ymm8,%ymm1
@@ -7742,7 +7740,7 @@ HIDDEN _sk_multiply_hsw
.globl _sk_multiply_hsw
FUNCTION(_sk_multiply_hsw)
_sk_multiply_hsw:
- .byte 196,98,125,24,5,105,59,0,0 // vbroadcastss 0x3b69(%rip),%ymm8 # 3ea4 <_sk_callback_hsw+0x15b>
+ .byte 196,98,125,24,5,105,59,0,0 // vbroadcastss 0x3b69(%rip),%ymm8 # 3ea0 <_sk_callback_hsw+0x15b>
.byte 197,60,92,207 // vsubps %ymm7,%ymm8,%ymm9
.byte 197,52,89,208 // vmulps %ymm0,%ymm9,%ymm10
.byte 197,60,92,195 // vsubps %ymm3,%ymm8,%ymm8
@@ -7790,7 +7788,7 @@ HIDDEN _sk_xor__hsw
.globl _sk_xor__hsw
FUNCTION(_sk_xor__hsw)
_sk_xor__hsw:
- .byte 196,98,125,24,5,228,58,0,0 // vbroadcastss 0x3ae4(%rip),%ymm8 # 3ea8 <_sk_callback_hsw+0x15f>
+ .byte 196,98,125,24,5,228,58,0,0 // vbroadcastss 0x3ae4(%rip),%ymm8 # 3ea4 <_sk_callback_hsw+0x15f>
.byte 197,60,92,207 // vsubps %ymm7,%ymm8,%ymm9
.byte 197,180,89,192 // vmulps %ymm0,%ymm9,%ymm0
.byte 197,60,92,195 // vsubps %ymm3,%ymm8,%ymm8
@@ -7824,7 +7822,7 @@ _sk_darken_hsw:
.byte 197,100,89,206 // vmulps %ymm6,%ymm3,%ymm9
.byte 196,193,108,95,209 // vmaxps %ymm9,%ymm2,%ymm2
.byte 197,188,92,210 // vsubps %ymm2,%ymm8,%ymm2
- .byte 196,98,125,24,5,108,58,0,0 // vbroadcastss 0x3a6c(%rip),%ymm8 # 3eac <_sk_callback_hsw+0x163>
+ .byte 196,98,125,24,5,108,58,0,0 // vbroadcastss 0x3a6c(%rip),%ymm8 # 3ea8 <_sk_callback_hsw+0x163>
.byte 197,60,92,195 // vsubps %ymm3,%ymm8,%ymm8
.byte 196,194,69,184,216 // vfmadd231ps %ymm8,%ymm7,%ymm3
.byte 72,173 // lods %ds:(%rsi),%rax
@@ -7849,7 +7847,7 @@ _sk_lighten_hsw:
.byte 197,100,89,206 // vmulps %ymm6,%ymm3,%ymm9
.byte 196,193,108,93,209 // vminps %ymm9,%ymm2,%ymm2
.byte 197,188,92,210 // vsubps %ymm2,%ymm8,%ymm2
- .byte 196,98,125,24,5,27,58,0,0 // vbroadcastss 0x3a1b(%rip),%ymm8 # 3eb0 <_sk_callback_hsw+0x167>
+ .byte 196,98,125,24,5,27,58,0,0 // vbroadcastss 0x3a1b(%rip),%ymm8 # 3eac <_sk_callback_hsw+0x167>
.byte 197,60,92,195 // vsubps %ymm3,%ymm8,%ymm8
.byte 196,194,69,184,216 // vfmadd231ps %ymm8,%ymm7,%ymm3
.byte 72,173 // lods %ds:(%rsi),%rax
@@ -7877,7 +7875,7 @@ _sk_difference_hsw:
.byte 196,193,108,93,209 // vminps %ymm9,%ymm2,%ymm2
.byte 197,236,88,210 // vaddps %ymm2,%ymm2,%ymm2
.byte 197,188,92,210 // vsubps %ymm2,%ymm8,%ymm2
- .byte 196,98,125,24,5,190,57,0,0 // vbroadcastss 0x39be(%rip),%ymm8 # 3eb4 <_sk_callback_hsw+0x16b>
+ .byte 196,98,125,24,5,190,57,0,0 // vbroadcastss 0x39be(%rip),%ymm8 # 3eb0 <_sk_callback_hsw+0x16b>
.byte 197,60,92,195 // vsubps %ymm3,%ymm8,%ymm8
.byte 196,194,69,184,216 // vfmadd231ps %ymm8,%ymm7,%ymm3
.byte 72,173 // lods %ds:(%rsi),%rax
@@ -7899,7 +7897,7 @@ _sk_exclusion_hsw:
.byte 197,236,89,214 // vmulps %ymm6,%ymm2,%ymm2
.byte 197,236,88,210 // vaddps %ymm2,%ymm2,%ymm2
.byte 197,188,92,210 // vsubps %ymm2,%ymm8,%ymm2
- .byte 196,98,125,24,5,124,57,0,0 // vbroadcastss 0x397c(%rip),%ymm8 # 3eb8 <_sk_callback_hsw+0x16f>
+ .byte 196,98,125,24,5,124,57,0,0 // vbroadcastss 0x397c(%rip),%ymm8 # 3eb4 <_sk_callback_hsw+0x16f>
.byte 197,60,92,195 // vsubps %ymm3,%ymm8,%ymm8
.byte 196,194,69,184,216 // vfmadd231ps %ymm8,%ymm7,%ymm3
.byte 72,173 // lods %ds:(%rsi),%rax
@@ -7909,7 +7907,7 @@ HIDDEN _sk_colorburn_hsw
.globl _sk_colorburn_hsw
FUNCTION(_sk_colorburn_hsw)
_sk_colorburn_hsw:
- .byte 196,98,125,24,5,106,57,0,0 // vbroadcastss 0x396a(%rip),%ymm8 # 3ebc <_sk_callback_hsw+0x173>
+ .byte 196,98,125,24,5,106,57,0,0 // vbroadcastss 0x396a(%rip),%ymm8 # 3eb8 <_sk_callback_hsw+0x173>
.byte 197,60,92,207 // vsubps %ymm7,%ymm8,%ymm9
.byte 197,52,89,216 // vmulps %ymm0,%ymm9,%ymm11
.byte 196,65,44,87,210 // vxorps %ymm10,%ymm10,%ymm10
@@ -7967,7 +7965,7 @@ HIDDEN _sk_colordodge_hsw
FUNCTION(_sk_colordodge_hsw)
_sk_colordodge_hsw:
.byte 196,65,60,87,192 // vxorps %ymm8,%ymm8,%ymm8
- .byte 196,98,125,24,13,117,56,0,0 // vbroadcastss 0x3875(%rip),%ymm9 # 3ec0 <_sk_callback_hsw+0x177>
+ .byte 196,98,125,24,13,117,56,0,0 // vbroadcastss 0x3875(%rip),%ymm9 # 3ebc <_sk_callback_hsw+0x177>
.byte 197,52,92,215 // vsubps %ymm7,%ymm9,%ymm10
.byte 197,44,89,216 // vmulps %ymm0,%ymm10,%ymm11
.byte 197,52,92,203 // vsubps %ymm3,%ymm9,%ymm9
@@ -8020,7 +8018,7 @@ HIDDEN _sk_hardlight_hsw
.globl _sk_hardlight_hsw
FUNCTION(_sk_hardlight_hsw)
_sk_hardlight_hsw:
- .byte 196,98,125,24,5,150,55,0,0 // vbroadcastss 0x3796(%rip),%ymm8 # 3ec4 <_sk_callback_hsw+0x17b>
+ .byte 196,98,125,24,5,150,55,0,0 // vbroadcastss 0x3796(%rip),%ymm8 # 3ec0 <_sk_callback_hsw+0x17b>
.byte 197,60,92,215 // vsubps %ymm7,%ymm8,%ymm10
.byte 197,44,89,216 // vmulps %ymm0,%ymm10,%ymm11
.byte 197,60,92,195 // vsubps %ymm3,%ymm8,%ymm8
@@ -8071,7 +8069,7 @@ HIDDEN _sk_overlay_hsw
.globl _sk_overlay_hsw
FUNCTION(_sk_overlay_hsw)
_sk_overlay_hsw:
- .byte 196,98,125,24,5,206,54,0,0 // vbroadcastss 0x36ce(%rip),%ymm8 # 3ec8 <_sk_callback_hsw+0x17f>
+ .byte 196,98,125,24,5,206,54,0,0 // vbroadcastss 0x36ce(%rip),%ymm8 # 3ec4 <_sk_callback_hsw+0x17f>
.byte 197,60,92,215 // vsubps %ymm7,%ymm8,%ymm10
.byte 197,44,89,216 // vmulps %ymm0,%ymm10,%ymm11
.byte 197,60,92,195 // vsubps %ymm3,%ymm8,%ymm8
@@ -8132,10 +8130,10 @@ _sk_softlight_hsw:
.byte 196,65,20,88,197 // vaddps %ymm13,%ymm13,%ymm8
.byte 196,65,60,88,192 // vaddps %ymm8,%ymm8,%ymm8
.byte 196,66,61,168,192 // vfmadd213ps %ymm8,%ymm8,%ymm8
- .byte 196,98,125,24,29,217,53,0,0 // vbroadcastss 0x35d9(%rip),%ymm11 # 3ed0 <_sk_callback_hsw+0x187>
+ .byte 196,98,125,24,29,217,53,0,0 // vbroadcastss 0x35d9(%rip),%ymm11 # 3ecc <_sk_callback_hsw+0x187>
.byte 196,65,20,88,227 // vaddps %ymm11,%ymm13,%ymm12
.byte 196,65,28,89,192 // vmulps %ymm8,%ymm12,%ymm8
- .byte 196,98,125,24,37,202,53,0,0 // vbroadcastss 0x35ca(%rip),%ymm12 # 3ed4 <_sk_callback_hsw+0x18b>
+ .byte 196,98,125,24,37,202,53,0,0 // vbroadcastss 0x35ca(%rip),%ymm12 # 3ed0 <_sk_callback_hsw+0x18b>
.byte 196,66,21,184,196 // vfmadd231ps %ymm12,%ymm13,%ymm8
.byte 196,65,124,82,245 // vrsqrtps %ymm13,%ymm14
.byte 196,65,124,83,246 // vrcpps %ymm14,%ymm14
@@ -8145,7 +8143,7 @@ _sk_softlight_hsw:
.byte 197,4,194,255,2 // vcmpleps %ymm7,%ymm15,%ymm15
.byte 196,67,13,74,240,240 // vblendvps %ymm15,%ymm8,%ymm14,%ymm14
.byte 197,116,88,249 // vaddps %ymm1,%ymm1,%ymm15
- .byte 196,98,125,24,5,141,53,0,0 // vbroadcastss 0x358d(%rip),%ymm8 # 3ecc <_sk_callback_hsw+0x183>
+ .byte 196,98,125,24,5,141,53,0,0 // vbroadcastss 0x358d(%rip),%ymm8 # 3ec8 <_sk_callback_hsw+0x183>
.byte 196,65,60,92,237 // vsubps %ymm13,%ymm8,%ymm13
.byte 197,132,92,195 // vsubps %ymm3,%ymm15,%ymm0
.byte 196,98,125,168,235 // vfmadd213ps %ymm3,%ymm0,%ymm13
@@ -8238,7 +8236,7 @@ HIDDEN _sk_clamp_1_hsw
.globl _sk_clamp_1_hsw
FUNCTION(_sk_clamp_1_hsw)
_sk_clamp_1_hsw:
- .byte 196,98,125,24,5,18,52,0,0 // vbroadcastss 0x3412(%rip),%ymm8 # 3ed8 <_sk_callback_hsw+0x18f>
+ .byte 196,98,125,24,5,18,52,0,0 // vbroadcastss 0x3412(%rip),%ymm8 # 3ed4 <_sk_callback_hsw+0x18f>
.byte 196,193,124,93,192 // vminps %ymm8,%ymm0,%ymm0
.byte 196,193,116,93,200 // vminps %ymm8,%ymm1,%ymm1
.byte 196,193,108,93,208 // vminps %ymm8,%ymm2,%ymm2
@@ -8250,7 +8248,7 @@ HIDDEN _sk_clamp_a_hsw
.globl _sk_clamp_a_hsw
FUNCTION(_sk_clamp_a_hsw)
_sk_clamp_a_hsw:
- .byte 196,98,125,24,5,245,51,0,0 // vbroadcastss 0x33f5(%rip),%ymm8 # 3edc <_sk_callback_hsw+0x193>
+ .byte 196,98,125,24,5,245,51,0,0 // vbroadcastss 0x33f5(%rip),%ymm8 # 3ed8 <_sk_callback_hsw+0x193>
.byte 196,193,100,93,216 // vminps %ymm8,%ymm3,%ymm3
.byte 197,252,93,195 // vminps %ymm3,%ymm0,%ymm0
.byte 197,244,93,203 // vminps %ymm3,%ymm1,%ymm1
@@ -8336,7 +8334,7 @@ FUNCTION(_sk_unpremul_hsw)
_sk_unpremul_hsw:
.byte 196,65,60,87,192 // vxorps %ymm8,%ymm8,%ymm8
.byte 196,65,100,194,200,0 // vcmpeqps %ymm8,%ymm3,%ymm9
- .byte 196,98,125,24,21,61,51,0,0 // vbroadcastss 0x333d(%rip),%ymm10 # 3ee0 <_sk_callback_hsw+0x197>
+ .byte 196,98,125,24,21,61,51,0,0 // vbroadcastss 0x333d(%rip),%ymm10 # 3edc <_sk_callback_hsw+0x197>
.byte 197,44,94,211 // vdivps %ymm3,%ymm10,%ymm10
.byte 196,67,45,74,192,144 // vblendvps %ymm9,%ymm8,%ymm10,%ymm8
.byte 197,188,89,192 // vmulps %ymm0,%ymm8,%ymm0
@@ -8349,16 +8347,16 @@ HIDDEN _sk_from_srgb_hsw
.globl _sk_from_srgb_hsw
FUNCTION(_sk_from_srgb_hsw)
_sk_from_srgb_hsw:
- .byte 196,98,125,24,5,30,51,0,0 // vbroadcastss 0x331e(%rip),%ymm8 # 3ee4 <_sk_callback_hsw+0x19b>
+ .byte 196,98,125,24,5,30,51,0,0 // vbroadcastss 0x331e(%rip),%ymm8 # 3ee0 <_sk_callback_hsw+0x19b>
.byte 196,65,124,89,200 // vmulps %ymm8,%ymm0,%ymm9
.byte 197,124,89,208 // vmulps %ymm0,%ymm0,%ymm10
- .byte 196,98,125,24,29,16,51,0,0 // vbroadcastss 0x3310(%rip),%ymm11 # 3ee8 <_sk_callback_hsw+0x19f>
- .byte 196,98,125,24,37,11,51,0,0 // vbroadcastss 0x330b(%rip),%ymm12 # 3eec <_sk_callback_hsw+0x1a3>
+ .byte 196,98,125,24,29,16,51,0,0 // vbroadcastss 0x3310(%rip),%ymm11 # 3ee4 <_sk_callback_hsw+0x19f>
+ .byte 196,98,125,24,37,11,51,0,0 // vbroadcastss 0x330b(%rip),%ymm12 # 3ee8 <_sk_callback_hsw+0x1a3>
.byte 196,65,124,40,236 // vmovaps %ymm12,%ymm13
.byte 196,66,125,168,235 // vfmadd213ps %ymm11,%ymm0,%ymm13
- .byte 196,98,125,24,53,252,50,0,0 // vbroadcastss 0x32fc(%rip),%ymm14 # 3ef0 <_sk_callback_hsw+0x1a7>
+ .byte 196,98,125,24,53,252,50,0,0 // vbroadcastss 0x32fc(%rip),%ymm14 # 3eec <_sk_callback_hsw+0x1a7>
.byte 196,66,45,168,238 // vfmadd213ps %ymm14,%ymm10,%ymm13
- .byte 196,98,125,24,21,242,50,0,0 // vbroadcastss 0x32f2(%rip),%ymm10 # 3ef4 <_sk_callback_hsw+0x1ab>
+ .byte 196,98,125,24,21,242,50,0,0 // vbroadcastss 0x32f2(%rip),%ymm10 # 3ef0 <_sk_callback_hsw+0x1ab>
.byte 196,193,124,194,194,1 // vcmpltps %ymm10,%ymm0,%ymm0
.byte 196,195,21,74,193,0 // vblendvps %ymm0,%ymm9,%ymm13,%ymm0
.byte 196,65,116,89,200 // vmulps %ymm8,%ymm1,%ymm9
@@ -8384,16 +8382,16 @@ _sk_to_srgb_hsw:
.byte 197,124,82,192 // vrsqrtps %ymm0,%ymm8
.byte 196,65,124,83,200 // vrcpps %ymm8,%ymm9
.byte 196,65,124,82,208 // vrsqrtps %ymm8,%ymm10
- .byte 196,98,125,24,5,140,50,0,0 // vbroadcastss 0x328c(%rip),%ymm8 # 3ef8 <_sk_callback_hsw+0x1af>
+ .byte 196,98,125,24,5,140,50,0,0 // vbroadcastss 0x328c(%rip),%ymm8 # 3ef4 <_sk_callback_hsw+0x1af>
.byte 196,65,124,89,216 // vmulps %ymm8,%ymm0,%ymm11
- .byte 196,98,125,24,37,130,50,0,0 // vbroadcastss 0x3282(%rip),%ymm12 # 3efc <_sk_callback_hsw+0x1b3>
- .byte 196,98,125,24,45,125,50,0,0 // vbroadcastss 0x327d(%rip),%ymm13 # 3f00 <_sk_callback_hsw+0x1b7>
+ .byte 196,98,125,24,37,130,50,0,0 // vbroadcastss 0x3282(%rip),%ymm12 # 3ef8 <_sk_callback_hsw+0x1b3>
+ .byte 196,98,125,24,45,125,50,0,0 // vbroadcastss 0x327d(%rip),%ymm13 # 3efc <_sk_callback_hsw+0x1b7>
.byte 196,66,21,168,204 // vfmadd213ps %ymm12,%ymm13,%ymm9
- .byte 196,98,125,24,53,115,50,0,0 // vbroadcastss 0x3273(%rip),%ymm14 # 3f04 <_sk_callback_hsw+0x1bb>
+ .byte 196,98,125,24,53,115,50,0,0 // vbroadcastss 0x3273(%rip),%ymm14 # 3f00 <_sk_callback_hsw+0x1bb>
.byte 196,66,13,184,202 // vfmadd231ps %ymm10,%ymm14,%ymm9
- .byte 196,98,125,24,21,105,50,0,0 // vbroadcastss 0x3269(%rip),%ymm10 # 3f08 <_sk_callback_hsw+0x1bf>
+ .byte 196,98,125,24,21,105,50,0,0 // vbroadcastss 0x3269(%rip),%ymm10 # 3f04 <_sk_callback_hsw+0x1bf>
.byte 196,65,44,93,201 // vminps %ymm9,%ymm10,%ymm9
- .byte 196,98,125,24,61,95,50,0,0 // vbroadcastss 0x325f(%rip),%ymm15 # 3f0c <_sk_callback_hsw+0x1c3>
+ .byte 196,98,125,24,61,95,50,0,0 // vbroadcastss 0x325f(%rip),%ymm15 # 3f08 <_sk_callback_hsw+0x1c3>
.byte 196,193,124,194,199,1 // vcmpltps %ymm15,%ymm0,%ymm0
.byte 196,195,53,74,195,0 // vblendvps %ymm0,%ymm11,%ymm9,%ymm0
.byte 197,124,82,201 // vrsqrtps %ymm1,%ymm9
@@ -8426,26 +8424,26 @@ _sk_rgb_to_hsl_hsw:
.byte 197,124,93,201 // vminps %ymm1,%ymm0,%ymm9
.byte 197,52,93,202 // vminps %ymm2,%ymm9,%ymm9
.byte 196,65,60,92,209 // vsubps %ymm9,%ymm8,%ymm10
- .byte 196,98,125,24,29,217,49,0,0 // vbroadcastss 0x31d9(%rip),%ymm11 # 3f10 <_sk_callback_hsw+0x1c7>
+ .byte 196,98,125,24,29,217,49,0,0 // vbroadcastss 0x31d9(%rip),%ymm11 # 3f0c <_sk_callback_hsw+0x1c7>
.byte 196,65,36,94,218 // vdivps %ymm10,%ymm11,%ymm11
.byte 197,116,92,226 // vsubps %ymm2,%ymm1,%ymm12
.byte 197,116,194,234,1 // vcmpltps %ymm2,%ymm1,%ymm13
- .byte 196,98,125,24,53,198,49,0,0 // vbroadcastss 0x31c6(%rip),%ymm14 # 3f14 <_sk_callback_hsw+0x1cb>
+ .byte 196,98,125,24,53,198,49,0,0 // vbroadcastss 0x31c6(%rip),%ymm14 # 3f10 <_sk_callback_hsw+0x1cb>
.byte 196,65,4,87,255 // vxorps %ymm15,%ymm15,%ymm15
.byte 196,67,5,74,238,208 // vblendvps %ymm13,%ymm14,%ymm15,%ymm13
.byte 196,66,37,168,229 // vfmadd213ps %ymm13,%ymm11,%ymm12
.byte 197,236,92,208 // vsubps %ymm0,%ymm2,%ymm2
.byte 197,124,92,233 // vsubps %ymm1,%ymm0,%ymm13
- .byte 196,98,125,24,53,173,49,0,0 // vbroadcastss 0x31ad(%rip),%ymm14 # 3f1c <_sk_callback_hsw+0x1d3>
+ .byte 196,98,125,24,53,173,49,0,0 // vbroadcastss 0x31ad(%rip),%ymm14 # 3f18 <_sk_callback_hsw+0x1d3>
.byte 196,66,37,168,238 // vfmadd213ps %ymm14,%ymm11,%ymm13
- .byte 196,98,125,24,53,155,49,0,0 // vbroadcastss 0x319b(%rip),%ymm14 # 3f18 <_sk_callback_hsw+0x1cf>
+ .byte 196,98,125,24,53,155,49,0,0 // vbroadcastss 0x319b(%rip),%ymm14 # 3f14 <_sk_callback_hsw+0x1cf>
.byte 196,194,37,168,214 // vfmadd213ps %ymm14,%ymm11,%ymm2
.byte 197,188,194,201,0 // vcmpeqps %ymm1,%ymm8,%ymm1
.byte 196,227,21,74,202,16 // vblendvps %ymm1,%ymm2,%ymm13,%ymm1
.byte 197,188,194,192,0 // vcmpeqps %ymm0,%ymm8,%ymm0
.byte 196,195,117,74,196,0 // vblendvps %ymm0,%ymm12,%ymm1,%ymm0
.byte 196,193,60,88,201 // vaddps %ymm9,%ymm8,%ymm1
- .byte 196,98,125,24,29,126,49,0,0 // vbroadcastss 0x317e(%rip),%ymm11 # 3f24 <_sk_callback_hsw+0x1db>
+ .byte 196,98,125,24,29,126,49,0,0 // vbroadcastss 0x317e(%rip),%ymm11 # 3f20 <_sk_callback_hsw+0x1db>
.byte 196,193,116,89,211 // vmulps %ymm11,%ymm1,%ymm2
.byte 197,36,194,218,1 // vcmpltps %ymm2,%ymm11,%ymm11
.byte 196,65,12,92,224 // vsubps %ymm8,%ymm14,%ymm12
@@ -8455,7 +8453,7 @@ _sk_rgb_to_hsl_hsw:
.byte 197,172,94,201 // vdivps %ymm1,%ymm10,%ymm1
.byte 196,195,125,74,199,128 // vblendvps %ymm8,%ymm15,%ymm0,%ymm0
.byte 196,195,117,74,207,128 // vblendvps %ymm8,%ymm15,%ymm1,%ymm1
- .byte 196,98,125,24,5,65,49,0,0 // vbroadcastss 0x3141(%rip),%ymm8 # 3f20 <_sk_callback_hsw+0x1d7>
+ .byte 196,98,125,24,5,65,49,0,0 // vbroadcastss 0x3141(%rip),%ymm8 # 3f1c <_sk_callback_hsw+0x1d7>
.byte 196,193,124,89,192 // vmulps %ymm8,%ymm0,%ymm0
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 255,224 // jmpq *%rax
@@ -8472,30 +8470,30 @@ _sk_hsl_to_rgb_hsw:
.byte 197,252,17,92,36,128 // vmovups %ymm3,-0x80(%rsp)
.byte 197,252,40,233 // vmovaps %ymm1,%ymm5
.byte 197,252,40,224 // vmovaps %ymm0,%ymm4
- .byte 196,98,125,24,5,14,49,0,0 // vbroadcastss 0x310e(%rip),%ymm8 # 3f28 <_sk_callback_hsw+0x1df>
+ .byte 196,98,125,24,5,14,49,0,0 // vbroadcastss 0x310e(%rip),%ymm8 # 3f24 <_sk_callback_hsw+0x1df>
.byte 197,60,194,202,2 // vcmpleps %ymm2,%ymm8,%ymm9
.byte 197,84,89,210 // vmulps %ymm2,%ymm5,%ymm10
.byte 196,65,84,92,218 // vsubps %ymm10,%ymm5,%ymm11
.byte 196,67,45,74,203,144 // vblendvps %ymm9,%ymm11,%ymm10,%ymm9
.byte 197,52,88,210 // vaddps %ymm2,%ymm9,%ymm10
- .byte 196,98,125,24,13,241,48,0,0 // vbroadcastss 0x30f1(%rip),%ymm9 # 3f2c <_sk_callback_hsw+0x1e3>
+ .byte 196,98,125,24,13,241,48,0,0 // vbroadcastss 0x30f1(%rip),%ymm9 # 3f28 <_sk_callback_hsw+0x1e3>
.byte 196,66,109,170,202 // vfmsub213ps %ymm10,%ymm2,%ymm9
- .byte 196,98,125,24,29,231,48,0,0 // vbroadcastss 0x30e7(%rip),%ymm11 # 3f30 <_sk_callback_hsw+0x1e7>
+ .byte 196,98,125,24,29,231,48,0,0 // vbroadcastss 0x30e7(%rip),%ymm11 # 3f2c <_sk_callback_hsw+0x1e7>
.byte 196,65,92,88,219 // vaddps %ymm11,%ymm4,%ymm11
.byte 196,67,125,8,227,1 // vroundps $0x1,%ymm11,%ymm12
.byte 196,65,36,92,252 // vsubps %ymm12,%ymm11,%ymm15
.byte 196,65,44,92,217 // vsubps %ymm9,%ymm10,%ymm11
- .byte 196,98,125,24,45,209,48,0,0 // vbroadcastss 0x30d1(%rip),%ymm13 # 3f38 <_sk_callback_hsw+0x1ef>
+ .byte 196,98,125,24,45,209,48,0,0 // vbroadcastss 0x30d1(%rip),%ymm13 # 3f34 <_sk_callback_hsw+0x1ef>
.byte 196,193,4,89,197 // vmulps %ymm13,%ymm15,%ymm0
- .byte 196,98,125,24,53,199,48,0,0 // vbroadcastss 0x30c7(%rip),%ymm14 # 3f3c <_sk_callback_hsw+0x1f3>
+ .byte 196,98,125,24,53,199,48,0,0 // vbroadcastss 0x30c7(%rip),%ymm14 # 3f38 <_sk_callback_hsw+0x1f3>
.byte 197,12,92,224 // vsubps %ymm0,%ymm14,%ymm12
.byte 196,66,37,168,225 // vfmadd213ps %ymm9,%ymm11,%ymm12
- .byte 196,226,125,24,29,173,48,0,0 // vbroadcastss 0x30ad(%rip),%ymm3 # 3f34 <_sk_callback_hsw+0x1eb>
+ .byte 196,226,125,24,29,173,48,0,0 // vbroadcastss 0x30ad(%rip),%ymm3 # 3f30 <_sk_callback_hsw+0x1eb>
.byte 196,193,100,194,255,2 // vcmpleps %ymm15,%ymm3,%ymm7
.byte 196,195,29,74,249,112 // vblendvps %ymm7,%ymm9,%ymm12,%ymm7
.byte 196,65,60,194,231,2 // vcmpleps %ymm15,%ymm8,%ymm12
.byte 196,227,45,74,255,192 // vblendvps %ymm12,%ymm7,%ymm10,%ymm7
- .byte 196,98,125,24,37,152,48,0,0 // vbroadcastss 0x3098(%rip),%ymm12 # 3f40 <_sk_callback_hsw+0x1f7>
+ .byte 196,98,125,24,37,152,48,0,0 // vbroadcastss 0x3098(%rip),%ymm12 # 3f3c <_sk_callback_hsw+0x1f7>
.byte 196,65,28,194,255,2 // vcmpleps %ymm15,%ymm12,%ymm15
.byte 196,194,37,168,193 // vfmadd213ps %ymm9,%ymm11,%ymm0
.byte 196,99,125,74,255,240 // vblendvps %ymm15,%ymm7,%ymm0,%ymm15
@@ -8511,7 +8509,7 @@ _sk_hsl_to_rgb_hsw:
.byte 197,156,194,192,2 // vcmpleps %ymm0,%ymm12,%ymm0
.byte 196,194,37,168,249 // vfmadd213ps %ymm9,%ymm11,%ymm7
.byte 196,227,69,74,201,0 // vblendvps %ymm0,%ymm1,%ymm7,%ymm1
- .byte 196,226,125,24,5,68,48,0,0 // vbroadcastss 0x3044(%rip),%ymm0 # 3f44 <_sk_callback_hsw+0x1fb>
+ .byte 196,226,125,24,5,68,48,0,0 // vbroadcastss 0x3044(%rip),%ymm0 # 3f40 <_sk_callback_hsw+0x1fb>
.byte 197,220,88,192 // vaddps %ymm0,%ymm4,%ymm0
.byte 196,227,125,8,224,1 // vroundps $0x1,%ymm0,%ymm4
.byte 197,252,92,196 // vsubps %ymm4,%ymm0,%ymm0
@@ -8561,11 +8559,11 @@ _sk_scale_u8_hsw:
.byte 72,139,0 // mov (%rax),%rax
.byte 72,1,248 // add %rdi,%rax
.byte 77,133,192 // test %r8,%r8
- .byte 117,51 // jne fe0 <_sk_scale_u8_hsw+0x43>
+ .byte 117,51 // jne fdc <_sk_scale_u8_hsw+0x43>
.byte 197,122,126,0 // vmovq (%rax),%xmm8
.byte 196,66,125,49,192 // vpmovzxbd %xmm8,%ymm8
.byte 196,65,124,91,192 // vcvtdq2ps %ymm8,%ymm8
- .byte 196,98,125,24,13,132,47,0,0 // vbroadcastss 0x2f84(%rip),%ymm9 # 3f48 <_sk_callback_hsw+0x1ff>
+ .byte 196,98,125,24,13,132,47,0,0 // vbroadcastss 0x2f84(%rip),%ymm9 # 3f44 <_sk_callback_hsw+0x1ff>
.byte 196,65,60,89,193 // vmulps %ymm9,%ymm8,%ymm8
.byte 197,188,89,192 // vmulps %ymm0,%ymm8,%ymm0
.byte 197,188,89,201 // vmulps %ymm1,%ymm8,%ymm1
@@ -8583,9 +8581,9 @@ _sk_scale_u8_hsw:
.byte 77,9,217 // or %r11,%r9
.byte 72,131,193,8 // add $0x8,%rcx
.byte 73,255,202 // dec %r10
- .byte 117,234 // jne fe8 <_sk_scale_u8_hsw+0x4b>
+ .byte 117,234 // jne fe4 <_sk_scale_u8_hsw+0x4b>
.byte 196,65,249,110,193 // vmovq %r9,%xmm8
- .byte 235,172 // jmp fb1 <_sk_scale_u8_hsw+0x14>
+ .byte 235,172 // jmp fad <_sk_scale_u8_hsw+0x14>
HIDDEN _sk_lerp_1_float_hsw
.globl _sk_lerp_1_float_hsw
@@ -8613,11 +8611,11 @@ _sk_lerp_u8_hsw:
.byte 72,139,0 // mov (%rax),%rax
.byte 72,1,248 // add %rdi,%rax
.byte 77,133,192 // test %r8,%r8
- .byte 117,71 // jne 108b <_sk_lerp_u8_hsw+0x57>
+ .byte 117,71 // jne 1087 <_sk_lerp_u8_hsw+0x57>
.byte 197,122,126,0 // vmovq (%rax),%xmm8
.byte 196,66,125,49,192 // vpmovzxbd %xmm8,%ymm8
.byte 196,65,124,91,192 // vcvtdq2ps %ymm8,%ymm8
- .byte 196,98,125,24,13,241,46,0,0 // vbroadcastss 0x2ef1(%rip),%ymm9 # 3f4c <_sk_callback_hsw+0x203>
+ .byte 196,98,125,24,13,241,46,0,0 // vbroadcastss 0x2ef1(%rip),%ymm9 # 3f48 <_sk_callback_hsw+0x203>
.byte 196,65,60,89,193 // vmulps %ymm9,%ymm8,%ymm8
.byte 197,252,92,196 // vsubps %ymm4,%ymm0,%ymm0
.byte 196,226,61,168,196 // vfmadd213ps %ymm4,%ymm8,%ymm0
@@ -8639,9 +8637,9 @@ _sk_lerp_u8_hsw:
.byte 77,9,217 // or %r11,%r9
.byte 72,131,193,8 // add $0x8,%rcx
.byte 73,255,202 // dec %r10
- .byte 117,234 // jne 1093 <_sk_lerp_u8_hsw+0x5f>
+ .byte 117,234 // jne 108f <_sk_lerp_u8_hsw+0x5f>
.byte 196,65,249,110,193 // vmovq %r9,%xmm8
- .byte 235,152 // jmp 1048 <_sk_lerp_u8_hsw+0x14>
+ .byte 235,152 // jmp 1044 <_sk_lerp_u8_hsw+0x14>
HIDDEN _sk_lerp_565_hsw
.globl _sk_lerp_565_hsw
@@ -8650,23 +8648,23 @@ _sk_lerp_565_hsw:
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 76,139,16 // mov (%rax),%r10
.byte 72,133,201 // test %rcx,%rcx
- .byte 15,133,149,0,0,0 // jne 1153 <_sk_lerp_565_hsw+0xa3>
+ .byte 15,133,149,0,0,0 // jne 114f <_sk_lerp_565_hsw+0xa3>
.byte 196,193,122,111,28,122 // vmovdqu (%r10,%rdi,2),%xmm3
.byte 196,226,125,51,219 // vpmovzxwd %xmm3,%ymm3
- .byte 196,98,125,88,5,126,46,0,0 // vpbroadcastd 0x2e7e(%rip),%ymm8 # 3f50 <_sk_callback_hsw+0x207>
+ .byte 196,98,125,88,5,126,46,0,0 // vpbroadcastd 0x2e7e(%rip),%ymm8 # 3f4c <_sk_callback_hsw+0x207>
.byte 196,65,101,219,192 // vpand %ymm8,%ymm3,%ymm8
.byte 196,65,124,91,192 // vcvtdq2ps %ymm8,%ymm8
- .byte 196,98,125,24,13,111,46,0,0 // vbroadcastss 0x2e6f(%rip),%ymm9 # 3f54 <_sk_callback_hsw+0x20b>
+ .byte 196,98,125,24,13,111,46,0,0 // vbroadcastss 0x2e6f(%rip),%ymm9 # 3f50 <_sk_callback_hsw+0x20b>
.byte 196,65,60,89,193 // vmulps %ymm9,%ymm8,%ymm8
- .byte 196,98,125,88,13,101,46,0,0 // vpbroadcastd 0x2e65(%rip),%ymm9 # 3f58 <_sk_callback_hsw+0x20f>
+ .byte 196,98,125,88,13,101,46,0,0 // vpbroadcastd 0x2e65(%rip),%ymm9 # 3f54 <_sk_callback_hsw+0x20f>
.byte 196,65,101,219,201 // vpand %ymm9,%ymm3,%ymm9
.byte 196,65,124,91,201 // vcvtdq2ps %ymm9,%ymm9
- .byte 196,98,125,24,21,86,46,0,0 // vbroadcastss 0x2e56(%rip),%ymm10 # 3f5c <_sk_callback_hsw+0x213>
+ .byte 196,98,125,24,21,86,46,0,0 // vbroadcastss 0x2e56(%rip),%ymm10 # 3f58 <_sk_callback_hsw+0x213>
.byte 196,65,52,89,202 // vmulps %ymm10,%ymm9,%ymm9
- .byte 196,98,125,88,21,76,46,0,0 // vpbroadcastd 0x2e4c(%rip),%ymm10 # 3f60 <_sk_callback_hsw+0x217>
+ .byte 196,98,125,88,21,76,46,0,0 // vpbroadcastd 0x2e4c(%rip),%ymm10 # 3f5c <_sk_callback_hsw+0x217>
.byte 196,193,101,219,218 // vpand %ymm10,%ymm3,%ymm3
.byte 197,252,91,219 // vcvtdq2ps %ymm3,%ymm3
- .byte 196,98,125,24,21,62,46,0,0 // vbroadcastss 0x2e3e(%rip),%ymm10 # 3f64 <_sk_callback_hsw+0x21b>
+ .byte 196,98,125,24,21,62,46,0,0 // vbroadcastss 0x2e3e(%rip),%ymm10 # 3f60 <_sk_callback_hsw+0x21b>
.byte 196,193,100,89,218 // vmulps %ymm10,%ymm3,%ymm3
.byte 197,252,92,196 // vsubps %ymm4,%ymm0,%ymm0
.byte 196,226,61,168,196 // vfmadd213ps %ymm4,%ymm8,%ymm0
@@ -8675,16 +8673,16 @@ _sk_lerp_565_hsw:
.byte 197,236,92,214 // vsubps %ymm6,%ymm2,%ymm2
.byte 196,226,101,168,214 // vfmadd213ps %ymm6,%ymm3,%ymm2
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 196,226,125,24,29,23,46,0,0 // vbroadcastss 0x2e17(%rip),%ymm3 # 3f68 <_sk_callback_hsw+0x21f>
+ .byte 196,226,125,24,29,23,46,0,0 // vbroadcastss 0x2e17(%rip),%ymm3 # 3f64 <_sk_callback_hsw+0x21f>
.byte 255,224 // jmpq *%rax
.byte 65,137,200 // mov %ecx,%r8d
.byte 65,128,224,7 // and $0x7,%r8b
.byte 197,225,239,219 // vpxor %xmm3,%xmm3,%xmm3
.byte 65,254,200 // dec %r8b
.byte 65,128,248,6 // cmp $0x6,%r8b
- .byte 15,135,89,255,255,255 // ja 10c4 <_sk_lerp_565_hsw+0x14>
+ .byte 15,135,89,255,255,255 // ja 10c0 <_sk_lerp_565_hsw+0x14>
.byte 69,15,182,192 // movzbl %r8b,%r8d
- .byte 76,141,13,74,0,0,0 // lea 0x4a(%rip),%r9 # 11c0 <_sk_lerp_565_hsw+0x110>
+ .byte 76,141,13,74,0,0,0 // lea 0x4a(%rip),%r9 # 11bc <_sk_lerp_565_hsw+0x110>
.byte 75,99,4,129 // movslq (%r9,%r8,4),%rax
.byte 76,1,200 // add %r9,%rax
.byte 255,224 // jmpq *%rax
@@ -8696,12 +8694,12 @@ _sk_lerp_565_hsw:
.byte 196,193,97,196,92,122,4,2 // vpinsrw $0x2,0x4(%r10,%rdi,2),%xmm3,%xmm3
.byte 196,193,97,196,92,122,2,1 // vpinsrw $0x1,0x2(%r10,%rdi,2),%xmm3,%xmm3
.byte 196,193,97,196,28,122,0 // vpinsrw $0x0,(%r10,%rdi,2),%xmm3,%xmm3
- .byte 233,5,255,255,255 // jmpq 10c4 <_sk_lerp_565_hsw+0x14>
+ .byte 233,5,255,255,255 // jmpq 10c0 <_sk_lerp_565_hsw+0x14>
.byte 144 // nop
.byte 243,255 // repz (bad)
.byte 255 // (bad)
.byte 255 // (bad)
- .byte 235,255 // jmp 11c5 <_sk_lerp_565_hsw+0x115>
+ .byte 235,255 // jmp 11c1 <_sk_lerp_565_hsw+0x115>
.byte 255 // (bad)
.byte 255,227 // jmpq *%rbx
.byte 255 // (bad)
@@ -8730,23 +8728,23 @@ _sk_load_tables_hsw:
.byte 76,141,12,189,0,0,0,0 // lea 0x0(,%rdi,4),%r9
.byte 76,3,8 // add (%rax),%r9
.byte 77,133,192 // test %r8,%r8
- .byte 117,105 // jne 125a <_sk_load_tables_hsw+0x7e>
+ .byte 117,105 // jne 1256 <_sk_load_tables_hsw+0x7e>
.byte 196,193,126,111,25 // vmovdqu (%r9),%ymm3
- .byte 197,229,219,13,34,48,0,0 // vpand 0x3022(%rip),%ymm3,%ymm1 # 4220 <_sk_callback_hsw+0x4d7>
+ .byte 197,229,219,13,38,48,0,0 // vpand 0x3026(%rip),%ymm3,%ymm1 # 4220 <_sk_callback_hsw+0x4db>
.byte 196,65,61,118,192 // vpcmpeqd %ymm8,%ymm8,%ymm8
.byte 72,139,72,8 // mov 0x8(%rax),%rcx
.byte 76,139,72,16 // mov 0x10(%rax),%r9
.byte 197,237,118,210 // vpcmpeqd %ymm2,%ymm2,%ymm2
.byte 196,226,109,146,4,137 // vgatherdps %ymm2,(%rcx,%ymm1,4),%ymm0
- .byte 196,226,101,0,21,34,48,0,0 // vpshufb 0x3022(%rip),%ymm3,%ymm2 # 4240 <_sk_callback_hsw+0x4f7>
+ .byte 196,226,101,0,21,38,48,0,0 // vpshufb 0x3026(%rip),%ymm3,%ymm2 # 4240 <_sk_callback_hsw+0x4fb>
.byte 196,65,53,118,201 // vpcmpeqd %ymm9,%ymm9,%ymm9
.byte 196,194,53,146,12,145 // vgatherdps %ymm9,(%r9,%ymm2,4),%ymm1
.byte 72,139,64,24 // mov 0x18(%rax),%rax
- .byte 196,98,101,0,13,42,48,0,0 // vpshufb 0x302a(%rip),%ymm3,%ymm9 # 4260 <_sk_callback_hsw+0x517>
+ .byte 196,98,101,0,13,46,48,0,0 // vpshufb 0x302e(%rip),%ymm3,%ymm9 # 4260 <_sk_callback_hsw+0x51b>
.byte 196,162,61,146,20,136 // vgatherdps %ymm8,(%rax,%ymm9,4),%ymm2
.byte 197,229,114,211,24 // vpsrld $0x18,%ymm3,%ymm3
.byte 197,252,91,219 // vcvtdq2ps %ymm3,%ymm3
- .byte 196,98,125,24,5,30,45,0,0 // vbroadcastss 0x2d1e(%rip),%ymm8 # 3f6c <_sk_callback_hsw+0x223>
+ .byte 196,98,125,24,5,30,45,0,0 // vbroadcastss 0x2d1e(%rip),%ymm8 # 3f68 <_sk_callback_hsw+0x223>
.byte 196,193,100,89,216 // vmulps %ymm8,%ymm3,%ymm3
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 76,137,193 // mov %r8,%rcx
@@ -8759,7 +8757,7 @@ _sk_load_tables_hsw:
.byte 196,193,249,110,194 // vmovq %r10,%xmm0
.byte 196,226,125,33,192 // vpmovsxbd %xmm0,%ymm0
.byte 196,194,125,140,25 // vpmaskmovd (%r9),%ymm0,%ymm3
- .byte 233,115,255,255,255 // jmpq 11f6 <_sk_load_tables_hsw+0x1a>
+ .byte 233,115,255,255,255 // jmpq 11f2 <_sk_load_tables_hsw+0x1a>
HIDDEN _sk_load_tables_u16_be_hsw
.globl _sk_load_tables_u16_be_hsw
@@ -8769,7 +8767,7 @@ _sk_load_tables_u16_be_hsw:
.byte 76,139,0 // mov (%rax),%r8
.byte 76,141,12,189,0,0,0,0 // lea 0x0(,%rdi,4),%r9
.byte 72,133,201 // test %rcx,%rcx
- .byte 15,133,201,0,0,0 // jne 1362 <_sk_load_tables_u16_be_hsw+0xdf>
+ .byte 15,133,201,0,0,0 // jne 135e <_sk_load_tables_u16_be_hsw+0xdf>
.byte 196,1,121,16,4,72 // vmovupd (%r8,%r9,2),%xmm8
.byte 196,129,121,16,84,72,16 // vmovupd 0x10(%r8,%r9,2),%xmm2
.byte 196,129,121,16,92,72,32 // vmovupd 0x20(%r8,%r9,2),%xmm3
@@ -8785,7 +8783,7 @@ _sk_load_tables_u16_be_hsw:
.byte 197,185,108,200 // vpunpcklqdq %xmm0,%xmm8,%xmm1
.byte 197,185,109,208 // vpunpckhqdq %xmm0,%xmm8,%xmm2
.byte 197,49,108,195 // vpunpcklqdq %xmm3,%xmm9,%xmm8
- .byte 197,121,111,21,182,48,0,0 // vmovdqa 0x30b6(%rip),%xmm10 # 43a0 <_sk_callback_hsw+0x657>
+ .byte 197,121,111,21,186,48,0,0 // vmovdqa 0x30ba(%rip),%xmm10 # 43a0 <_sk_callback_hsw+0x65b>
.byte 196,193,113,219,194 // vpand %xmm10,%xmm1,%xmm0
.byte 196,226,125,51,200 // vpmovzxwd %xmm0,%ymm1
.byte 196,65,37,118,219 // vpcmpeqd %ymm11,%ymm11,%ymm11
@@ -8807,36 +8805,36 @@ _sk_load_tables_u16_be_hsw:
.byte 197,185,235,219 // vpor %xmm3,%xmm8,%xmm3
.byte 196,226,125,51,219 // vpmovzxwd %xmm3,%ymm3
.byte 197,252,91,219 // vcvtdq2ps %ymm3,%ymm3
- .byte 196,98,125,24,5,23,44,0,0 // vbroadcastss 0x2c17(%rip),%ymm8 # 3f70 <_sk_callback_hsw+0x227>
+ .byte 196,98,125,24,5,23,44,0,0 // vbroadcastss 0x2c17(%rip),%ymm8 # 3f6c <_sk_callback_hsw+0x227>
.byte 196,193,100,89,216 // vmulps %ymm8,%ymm3,%ymm3
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 255,224 // jmpq *%rax
.byte 196,1,123,16,4,72 // vmovsd (%r8,%r9,2),%xmm8
.byte 196,65,49,239,201 // vpxor %xmm9,%xmm9,%xmm9
.byte 72,131,249,1 // cmp $0x1,%rcx
- .byte 116,85 // je 13c8 <_sk_load_tables_u16_be_hsw+0x145>
+ .byte 116,85 // je 13c4 <_sk_load_tables_u16_be_hsw+0x145>
.byte 196,1,57,22,68,72,8 // vmovhpd 0x8(%r8,%r9,2),%xmm8,%xmm8
.byte 72,131,249,3 // cmp $0x3,%rcx
- .byte 114,72 // jb 13c8 <_sk_load_tables_u16_be_hsw+0x145>
+ .byte 114,72 // jb 13c4 <_sk_load_tables_u16_be_hsw+0x145>
.byte 196,129,123,16,84,72,16 // vmovsd 0x10(%r8,%r9,2),%xmm2
.byte 72,131,249,3 // cmp $0x3,%rcx
- .byte 116,72 // je 13d5 <_sk_load_tables_u16_be_hsw+0x152>
+ .byte 116,72 // je 13d1 <_sk_load_tables_u16_be_hsw+0x152>
.byte 196,129,105,22,84,72,24 // vmovhpd 0x18(%r8,%r9,2),%xmm2,%xmm2
.byte 72,131,249,5 // cmp $0x5,%rcx
- .byte 114,59 // jb 13d5 <_sk_load_tables_u16_be_hsw+0x152>
+ .byte 114,59 // jb 13d1 <_sk_load_tables_u16_be_hsw+0x152>
.byte 196,129,123,16,92,72,32 // vmovsd 0x20(%r8,%r9,2),%xmm3
.byte 72,131,249,5 // cmp $0x5,%rcx
- .byte 15,132,9,255,255,255 // je 12b4 <_sk_load_tables_u16_be_hsw+0x31>
+ .byte 15,132,9,255,255,255 // je 12b0 <_sk_load_tables_u16_be_hsw+0x31>
.byte 196,129,97,22,92,72,40 // vmovhpd 0x28(%r8,%r9,2),%xmm3,%xmm3
.byte 72,131,249,7 // cmp $0x7,%rcx
- .byte 15,130,248,254,255,255 // jb 12b4 <_sk_load_tables_u16_be_hsw+0x31>
+ .byte 15,130,248,254,255,255 // jb 12b0 <_sk_load_tables_u16_be_hsw+0x31>
.byte 196,1,122,126,76,72,48 // vmovq 0x30(%r8,%r9,2),%xmm9
- .byte 233,236,254,255,255 // jmpq 12b4 <_sk_load_tables_u16_be_hsw+0x31>
+ .byte 233,236,254,255,255 // jmpq 12b0 <_sk_load_tables_u16_be_hsw+0x31>
.byte 197,225,87,219 // vxorpd %xmm3,%xmm3,%xmm3
.byte 197,233,87,210 // vxorpd %xmm2,%xmm2,%xmm2
- .byte 233,223,254,255,255 // jmpq 12b4 <_sk_load_tables_u16_be_hsw+0x31>
+ .byte 233,223,254,255,255 // jmpq 12b0 <_sk_load_tables_u16_be_hsw+0x31>
.byte 197,225,87,219 // vxorpd %xmm3,%xmm3,%xmm3
- .byte 233,214,254,255,255 // jmpq 12b4 <_sk_load_tables_u16_be_hsw+0x31>
+ .byte 233,214,254,255,255 // jmpq 12b0 <_sk_load_tables_u16_be_hsw+0x31>
HIDDEN _sk_load_tables_rgb_u16_be_hsw
.globl _sk_load_tables_rgb_u16_be_hsw
@@ -8846,7 +8844,7 @@ _sk_load_tables_rgb_u16_be_hsw:
.byte 76,139,0 // mov (%rax),%r8
.byte 76,141,12,127 // lea (%rdi,%rdi,2),%r9
.byte 72,133,201 // test %rcx,%rcx
- .byte 15,133,193,0,0,0 // jne 14b1 <_sk_load_tables_rgb_u16_be_hsw+0xd3>
+ .byte 15,133,193,0,0,0 // jne 14ad <_sk_load_tables_rgb_u16_be_hsw+0xd3>
.byte 196,129,122,111,4,72 // vmovdqu (%r8,%r9,2),%xmm0
.byte 196,129,122,111,84,72,12 // vmovdqu 0xc(%r8,%r9,2),%xmm2
.byte 196,129,122,111,76,72,24 // vmovdqu 0x18(%r8,%r9,2),%xmm1
@@ -8867,7 +8865,7 @@ _sk_load_tables_rgb_u16_be_hsw:
.byte 197,185,108,218 // vpunpcklqdq %xmm2,%xmm8,%xmm3
.byte 197,185,109,210 // vpunpckhqdq %xmm2,%xmm8,%xmm2
.byte 197,121,108,193 // vpunpcklqdq %xmm1,%xmm0,%xmm8
- .byte 197,121,111,13,86,47,0,0 // vmovdqa 0x2f56(%rip),%xmm9 # 43b0 <_sk_callback_hsw+0x667>
+ .byte 197,121,111,13,90,47,0,0 // vmovdqa 0x2f5a(%rip),%xmm9 # 43b0 <_sk_callback_hsw+0x66b>
.byte 196,193,97,219,193 // vpand %xmm9,%xmm3,%xmm0
.byte 196,226,125,51,200 // vpmovzxwd %xmm0,%ymm1
.byte 197,229,118,219 // vpcmpeqd %ymm3,%ymm3,%ymm3
@@ -8884,41 +8882,41 @@ _sk_load_tables_rgb_u16_be_hsw:
.byte 196,98,125,51,194 // vpmovzxwd %xmm2,%ymm8
.byte 196,162,101,146,20,128 // vgatherdps %ymm3,(%rax,%ymm8,4),%ymm2
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 196,226,125,24,29,197,42,0,0 // vbroadcastss 0x2ac5(%rip),%ymm3 # 3f74 <_sk_callback_hsw+0x22b>
+ .byte 196,226,125,24,29,197,42,0,0 // vbroadcastss 0x2ac5(%rip),%ymm3 # 3f70 <_sk_callback_hsw+0x22b>
.byte 255,224 // jmpq *%rax
.byte 196,129,121,110,4,72 // vmovd (%r8,%r9,2),%xmm0
.byte 196,129,121,196,68,72,4,2 // vpinsrw $0x2,0x4(%r8,%r9,2),%xmm0,%xmm0
.byte 72,131,249,1 // cmp $0x1,%rcx
- .byte 117,5 // jne 14ca <_sk_load_tables_rgb_u16_be_hsw+0xec>
- .byte 233,90,255,255,255 // jmpq 1424 <_sk_load_tables_rgb_u16_be_hsw+0x46>
+ .byte 117,5 // jne 14c6 <_sk_load_tables_rgb_u16_be_hsw+0xec>
+ .byte 233,90,255,255,255 // jmpq 1420 <_sk_load_tables_rgb_u16_be_hsw+0x46>
.byte 196,129,121,110,76,72,6 // vmovd 0x6(%r8,%r9,2),%xmm1
.byte 196,1,113,196,68,72,10,2 // vpinsrw $0x2,0xa(%r8,%r9,2),%xmm1,%xmm8
.byte 72,131,249,3 // cmp $0x3,%rcx
- .byte 114,26 // jb 14f9 <_sk_load_tables_rgb_u16_be_hsw+0x11b>
+ .byte 114,26 // jb 14f5 <_sk_load_tables_rgb_u16_be_hsw+0x11b>
.byte 196,129,121,110,76,72,12 // vmovd 0xc(%r8,%r9,2),%xmm1
.byte 196,129,113,196,84,72,16,2 // vpinsrw $0x2,0x10(%r8,%r9,2),%xmm1,%xmm2
.byte 72,131,249,3 // cmp $0x3,%rcx
- .byte 117,10 // jne 14fe <_sk_load_tables_rgb_u16_be_hsw+0x120>
- .byte 233,43,255,255,255 // jmpq 1424 <_sk_load_tables_rgb_u16_be_hsw+0x46>
- .byte 233,38,255,255,255 // jmpq 1424 <_sk_load_tables_rgb_u16_be_hsw+0x46>
+ .byte 117,10 // jne 14fa <_sk_load_tables_rgb_u16_be_hsw+0x120>
+ .byte 233,43,255,255,255 // jmpq 1420 <_sk_load_tables_rgb_u16_be_hsw+0x46>
+ .byte 233,38,255,255,255 // jmpq 1420 <_sk_load_tables_rgb_u16_be_hsw+0x46>
.byte 196,129,121,110,76,72,18 // vmovd 0x12(%r8,%r9,2),%xmm1
.byte 196,1,113,196,76,72,22,2 // vpinsrw $0x2,0x16(%r8,%r9,2),%xmm1,%xmm9
.byte 72,131,249,5 // cmp $0x5,%rcx
- .byte 114,26 // jb 152d <_sk_load_tables_rgb_u16_be_hsw+0x14f>
+ .byte 114,26 // jb 1529 <_sk_load_tables_rgb_u16_be_hsw+0x14f>
.byte 196,129,121,110,76,72,24 // vmovd 0x18(%r8,%r9,2),%xmm1
.byte 196,129,113,196,76,72,28,2 // vpinsrw $0x2,0x1c(%r8,%r9,2),%xmm1,%xmm1
.byte 72,131,249,5 // cmp $0x5,%rcx
- .byte 117,10 // jne 1532 <_sk_load_tables_rgb_u16_be_hsw+0x154>
- .byte 233,247,254,255,255 // jmpq 1424 <_sk_load_tables_rgb_u16_be_hsw+0x46>
- .byte 233,242,254,255,255 // jmpq 1424 <_sk_load_tables_rgb_u16_be_hsw+0x46>
+ .byte 117,10 // jne 152e <_sk_load_tables_rgb_u16_be_hsw+0x154>
+ .byte 233,247,254,255,255 // jmpq 1420 <_sk_load_tables_rgb_u16_be_hsw+0x46>
+ .byte 233,242,254,255,255 // jmpq 1420 <_sk_load_tables_rgb_u16_be_hsw+0x46>
.byte 196,129,121,110,92,72,30 // vmovd 0x1e(%r8,%r9,2),%xmm3
.byte 196,1,97,196,92,72,34,2 // vpinsrw $0x2,0x22(%r8,%r9,2),%xmm3,%xmm11
.byte 72,131,249,7 // cmp $0x7,%rcx
- .byte 114,20 // jb 155b <_sk_load_tables_rgb_u16_be_hsw+0x17d>
+ .byte 114,20 // jb 1557 <_sk_load_tables_rgb_u16_be_hsw+0x17d>
.byte 196,129,121,110,92,72,36 // vmovd 0x24(%r8,%r9,2),%xmm3
.byte 196,129,97,196,92,72,40,2 // vpinsrw $0x2,0x28(%r8,%r9,2),%xmm3,%xmm3
- .byte 233,201,254,255,255 // jmpq 1424 <_sk_load_tables_rgb_u16_be_hsw+0x46>
- .byte 233,196,254,255,255 // jmpq 1424 <_sk_load_tables_rgb_u16_be_hsw+0x46>
+ .byte 233,201,254,255,255 // jmpq 1420 <_sk_load_tables_rgb_u16_be_hsw+0x46>
+ .byte 233,196,254,255,255 // jmpq 1420 <_sk_load_tables_rgb_u16_be_hsw+0x46>
HIDDEN _sk_byte_tables_hsw
.globl _sk_byte_tables_hsw
@@ -8931,7 +8929,7 @@ _sk_byte_tables_hsw:
.byte 65,84 // push %r12
.byte 83 // push %rbx
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 196,98,125,24,5,3,42,0,0 // vbroadcastss 0x2a03(%rip),%ymm8 # 3f78 <_sk_callback_hsw+0x22f>
+ .byte 196,98,125,24,5,3,42,0,0 // vbroadcastss 0x2a03(%rip),%ymm8 # 3f74 <_sk_callback_hsw+0x22f>
.byte 196,193,124,89,192 // vmulps %ymm8,%ymm0,%ymm0
.byte 197,253,91,192 // vcvtps2dq %ymm0,%ymm0
.byte 196,195,249,22,192,1 // vpextrq $0x1,%xmm0,%r8
@@ -8968,7 +8966,7 @@ _sk_byte_tables_hsw:
.byte 196,227,121,32,197,7 // vpinsrb $0x7,%ebp,%xmm0,%xmm0
.byte 196,226,125,49,192 // vpmovzxbd %xmm0,%ymm0
.byte 197,252,91,192 // vcvtdq2ps %ymm0,%ymm0
- .byte 196,98,125,24,13,84,41,0,0 // vbroadcastss 0x2954(%rip),%ymm9 # 3f7c <_sk_callback_hsw+0x233>
+ .byte 196,98,125,24,13,84,41,0,0 // vbroadcastss 0x2954(%rip),%ymm9 # 3f78 <_sk_callback_hsw+0x233>
.byte 196,193,124,89,193 // vmulps %ymm9,%ymm0,%ymm0
.byte 196,193,116,89,200 // vmulps %ymm8,%ymm1,%ymm1
.byte 197,253,91,201 // vcvtps2dq %ymm1,%ymm1
@@ -9129,7 +9127,7 @@ _sk_byte_tables_rgb_hsw:
.byte 196,227,121,32,197,7 // vpinsrb $0x7,%ebp,%xmm0,%xmm0
.byte 196,226,125,49,192 // vpmovzxbd %xmm0,%ymm0
.byte 197,252,91,192 // vcvtdq2ps %ymm0,%ymm0
- .byte 196,98,125,24,13,141,38,0,0 // vbroadcastss 0x268d(%rip),%ymm9 # 3f80 <_sk_callback_hsw+0x237>
+ .byte 196,98,125,24,13,141,38,0,0 // vbroadcastss 0x268d(%rip),%ymm9 # 3f7c <_sk_callback_hsw+0x237>
.byte 196,193,124,89,193 // vmulps %ymm9,%ymm0,%ymm0
.byte 197,188,89,201 // vmulps %ymm1,%ymm8,%ymm1
.byte 197,253,91,201 // vcvtps2dq %ymm1,%ymm1
@@ -9292,33 +9290,33 @@ _sk_parametric_r_hsw:
.byte 196,66,125,168,211 // vfmadd213ps %ymm11,%ymm0,%ymm10
.byte 196,226,125,24,0 // vbroadcastss (%rax),%ymm0
.byte 196,65,124,91,218 // vcvtdq2ps %ymm10,%ymm11
- .byte 196,98,125,24,37,64,36,0,0 // vbroadcastss 0x2440(%rip),%ymm12 # 3f84 <_sk_callback_hsw+0x23b>
- .byte 196,98,125,24,45,59,36,0,0 // vbroadcastss 0x243b(%rip),%ymm13 # 3f88 <_sk_callback_hsw+0x23f>
+ .byte 196,98,125,24,37,64,36,0,0 // vbroadcastss 0x2440(%rip),%ymm12 # 3f80 <_sk_callback_hsw+0x23b>
+ .byte 196,98,125,24,45,59,36,0,0 // vbroadcastss 0x243b(%rip),%ymm13 # 3f84 <_sk_callback_hsw+0x23f>
.byte 196,65,44,84,213 // vandps %ymm13,%ymm10,%ymm10
- .byte 196,98,125,24,45,49,36,0,0 // vbroadcastss 0x2431(%rip),%ymm13 # 3f8c <_sk_callback_hsw+0x243>
+ .byte 196,98,125,24,45,49,36,0,0 // vbroadcastss 0x2431(%rip),%ymm13 # 3f88 <_sk_callback_hsw+0x243>
.byte 196,65,44,86,213 // vorps %ymm13,%ymm10,%ymm10
- .byte 196,98,125,24,45,39,36,0,0 // vbroadcastss 0x2427(%rip),%ymm13 # 3f90 <_sk_callback_hsw+0x247>
+ .byte 196,98,125,24,45,39,36,0,0 // vbroadcastss 0x2427(%rip),%ymm13 # 3f8c <_sk_callback_hsw+0x247>
.byte 196,66,37,184,236 // vfmadd231ps %ymm12,%ymm11,%ymm13
- .byte 196,98,125,24,29,29,36,0,0 // vbroadcastss 0x241d(%rip),%ymm11 # 3f94 <_sk_callback_hsw+0x24b>
+ .byte 196,98,125,24,29,29,36,0,0 // vbroadcastss 0x241d(%rip),%ymm11 # 3f90 <_sk_callback_hsw+0x24b>
.byte 196,66,45,172,221 // vfnmadd213ps %ymm13,%ymm10,%ymm11
- .byte 196,98,125,24,37,19,36,0,0 // vbroadcastss 0x2413(%rip),%ymm12 # 3f98 <_sk_callback_hsw+0x24f>
+ .byte 196,98,125,24,37,19,36,0,0 // vbroadcastss 0x2413(%rip),%ymm12 # 3f94 <_sk_callback_hsw+0x24f>
.byte 196,65,44,88,212 // vaddps %ymm12,%ymm10,%ymm10
- .byte 196,98,125,24,37,9,36,0,0 // vbroadcastss 0x2409(%rip),%ymm12 # 3f9c <_sk_callback_hsw+0x253>
+ .byte 196,98,125,24,37,9,36,0,0 // vbroadcastss 0x2409(%rip),%ymm12 # 3f98 <_sk_callback_hsw+0x253>
.byte 196,65,28,94,210 // vdivps %ymm10,%ymm12,%ymm10
.byte 196,65,36,92,210 // vsubps %ymm10,%ymm11,%ymm10
.byte 196,193,124,89,194 // vmulps %ymm10,%ymm0,%ymm0
.byte 196,99,125,8,208,1 // vroundps $0x1,%ymm0,%ymm10
.byte 196,65,124,92,210 // vsubps %ymm10,%ymm0,%ymm10
- .byte 196,98,125,24,29,234,35,0,0 // vbroadcastss 0x23ea(%rip),%ymm11 # 3fa0 <_sk_callback_hsw+0x257>
+ .byte 196,98,125,24,29,234,35,0,0 // vbroadcastss 0x23ea(%rip),%ymm11 # 3f9c <_sk_callback_hsw+0x257>
.byte 196,193,124,88,195 // vaddps %ymm11,%ymm0,%ymm0
- .byte 196,98,125,24,29,224,35,0,0 // vbroadcastss 0x23e0(%rip),%ymm11 # 3fa4 <_sk_callback_hsw+0x25b>
+ .byte 196,98,125,24,29,224,35,0,0 // vbroadcastss 0x23e0(%rip),%ymm11 # 3fa0 <_sk_callback_hsw+0x25b>
.byte 196,98,45,172,216 // vfnmadd213ps %ymm0,%ymm10,%ymm11
- .byte 196,226,125,24,5,214,35,0,0 // vbroadcastss 0x23d6(%rip),%ymm0 # 3fa8 <_sk_callback_hsw+0x25f>
+ .byte 196,226,125,24,5,214,35,0,0 // vbroadcastss 0x23d6(%rip),%ymm0 # 3fa4 <_sk_callback_hsw+0x25f>
.byte 196,193,124,92,194 // vsubps %ymm10,%ymm0,%ymm0
- .byte 196,98,125,24,21,204,35,0,0 // vbroadcastss 0x23cc(%rip),%ymm10 # 3fac <_sk_callback_hsw+0x263>
+ .byte 196,98,125,24,21,204,35,0,0 // vbroadcastss 0x23cc(%rip),%ymm10 # 3fa8 <_sk_callback_hsw+0x263>
.byte 197,172,94,192 // vdivps %ymm0,%ymm10,%ymm0
.byte 197,164,88,192 // vaddps %ymm0,%ymm11,%ymm0
- .byte 196,98,125,24,21,191,35,0,0 // vbroadcastss 0x23bf(%rip),%ymm10 # 3fb0 <_sk_callback_hsw+0x267>
+ .byte 196,98,125,24,21,191,35,0,0 // vbroadcastss 0x23bf(%rip),%ymm10 # 3fac <_sk_callback_hsw+0x267>
.byte 196,193,124,89,194 // vmulps %ymm10,%ymm0,%ymm0
.byte 197,253,91,192 // vcvtps2dq %ymm0,%ymm0
.byte 196,98,125,24,80,20 // vbroadcastss 0x14(%rax),%ymm10
@@ -9326,7 +9324,7 @@ _sk_parametric_r_hsw:
.byte 196,195,125,74,193,128 // vblendvps %ymm8,%ymm9,%ymm0,%ymm0
.byte 196,65,60,87,192 // vxorps %ymm8,%ymm8,%ymm8
.byte 196,193,124,95,192 // vmaxps %ymm8,%ymm0,%ymm0
- .byte 196,98,125,24,5,150,35,0,0 // vbroadcastss 0x2396(%rip),%ymm8 # 3fb4 <_sk_callback_hsw+0x26b>
+ .byte 196,98,125,24,5,150,35,0,0 // vbroadcastss 0x2396(%rip),%ymm8 # 3fb0 <_sk_callback_hsw+0x26b>
.byte 196,193,124,93,192 // vminps %ymm8,%ymm0,%ymm0
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 255,224 // jmpq *%rax
@@ -9346,33 +9344,33 @@ _sk_parametric_g_hsw:
.byte 196,66,117,168,211 // vfmadd213ps %ymm11,%ymm1,%ymm10
.byte 196,226,125,24,8 // vbroadcastss (%rax),%ymm1
.byte 196,65,124,91,218 // vcvtdq2ps %ymm10,%ymm11
- .byte 196,98,125,24,37,78,35,0,0 // vbroadcastss 0x234e(%rip),%ymm12 # 3fb8 <_sk_callback_hsw+0x26f>
- .byte 196,98,125,24,45,73,35,0,0 // vbroadcastss 0x2349(%rip),%ymm13 # 3fbc <_sk_callback_hsw+0x273>
+ .byte 196,98,125,24,37,78,35,0,0 // vbroadcastss 0x234e(%rip),%ymm12 # 3fb4 <_sk_callback_hsw+0x26f>
+ .byte 196,98,125,24,45,73,35,0,0 // vbroadcastss 0x2349(%rip),%ymm13 # 3fb8 <_sk_callback_hsw+0x273>
.byte 196,65,44,84,213 // vandps %ymm13,%ymm10,%ymm10
- .byte 196,98,125,24,45,63,35,0,0 // vbroadcastss 0x233f(%rip),%ymm13 # 3fc0 <_sk_callback_hsw+0x277>
+ .byte 196,98,125,24,45,63,35,0,0 // vbroadcastss 0x233f(%rip),%ymm13 # 3fbc <_sk_callback_hsw+0x277>
.byte 196,65,44,86,213 // vorps %ymm13,%ymm10,%ymm10
- .byte 196,98,125,24,45,53,35,0,0 // vbroadcastss 0x2335(%rip),%ymm13 # 3fc4 <_sk_callback_hsw+0x27b>
+ .byte 196,98,125,24,45,53,35,0,0 // vbroadcastss 0x2335(%rip),%ymm13 # 3fc0 <_sk_callback_hsw+0x27b>
.byte 196,66,37,184,236 // vfmadd231ps %ymm12,%ymm11,%ymm13
- .byte 196,98,125,24,29,43,35,0,0 // vbroadcastss 0x232b(%rip),%ymm11 # 3fc8 <_sk_callback_hsw+0x27f>
+ .byte 196,98,125,24,29,43,35,0,0 // vbroadcastss 0x232b(%rip),%ymm11 # 3fc4 <_sk_callback_hsw+0x27f>
.byte 196,66,45,172,221 // vfnmadd213ps %ymm13,%ymm10,%ymm11
- .byte 196,98,125,24,37,33,35,0,0 // vbroadcastss 0x2321(%rip),%ymm12 # 3fcc <_sk_callback_hsw+0x283>
+ .byte 196,98,125,24,37,33,35,0,0 // vbroadcastss 0x2321(%rip),%ymm12 # 3fc8 <_sk_callback_hsw+0x283>
.byte 196,65,44,88,212 // vaddps %ymm12,%ymm10,%ymm10
- .byte 196,98,125,24,37,23,35,0,0 // vbroadcastss 0x2317(%rip),%ymm12 # 3fd0 <_sk_callback_hsw+0x287>
+ .byte 196,98,125,24,37,23,35,0,0 // vbroadcastss 0x2317(%rip),%ymm12 # 3fcc <_sk_callback_hsw+0x287>
.byte 196,65,28,94,210 // vdivps %ymm10,%ymm12,%ymm10
.byte 196,65,36,92,210 // vsubps %ymm10,%ymm11,%ymm10
.byte 196,193,116,89,202 // vmulps %ymm10,%ymm1,%ymm1
.byte 196,99,125,8,209,1 // vroundps $0x1,%ymm1,%ymm10
.byte 196,65,116,92,210 // vsubps %ymm10,%ymm1,%ymm10
- .byte 196,98,125,24,29,248,34,0,0 // vbroadcastss 0x22f8(%rip),%ymm11 # 3fd4 <_sk_callback_hsw+0x28b>
+ .byte 196,98,125,24,29,248,34,0,0 // vbroadcastss 0x22f8(%rip),%ymm11 # 3fd0 <_sk_callback_hsw+0x28b>
.byte 196,193,116,88,203 // vaddps %ymm11,%ymm1,%ymm1
- .byte 196,98,125,24,29,238,34,0,0 // vbroadcastss 0x22ee(%rip),%ymm11 # 3fd8 <_sk_callback_hsw+0x28f>
+ .byte 196,98,125,24,29,238,34,0,0 // vbroadcastss 0x22ee(%rip),%ymm11 # 3fd4 <_sk_callback_hsw+0x28f>
.byte 196,98,45,172,217 // vfnmadd213ps %ymm1,%ymm10,%ymm11
- .byte 196,226,125,24,13,228,34,0,0 // vbroadcastss 0x22e4(%rip),%ymm1 # 3fdc <_sk_callback_hsw+0x293>
+ .byte 196,226,125,24,13,228,34,0,0 // vbroadcastss 0x22e4(%rip),%ymm1 # 3fd8 <_sk_callback_hsw+0x293>
.byte 196,193,116,92,202 // vsubps %ymm10,%ymm1,%ymm1
- .byte 196,98,125,24,21,218,34,0,0 // vbroadcastss 0x22da(%rip),%ymm10 # 3fe0 <_sk_callback_hsw+0x297>
+ .byte 196,98,125,24,21,218,34,0,0 // vbroadcastss 0x22da(%rip),%ymm10 # 3fdc <_sk_callback_hsw+0x297>
.byte 197,172,94,201 // vdivps %ymm1,%ymm10,%ymm1
.byte 197,164,88,201 // vaddps %ymm1,%ymm11,%ymm1
- .byte 196,98,125,24,21,205,34,0,0 // vbroadcastss 0x22cd(%rip),%ymm10 # 3fe4 <_sk_callback_hsw+0x29b>
+ .byte 196,98,125,24,21,205,34,0,0 // vbroadcastss 0x22cd(%rip),%ymm10 # 3fe0 <_sk_callback_hsw+0x29b>
.byte 196,193,116,89,202 // vmulps %ymm10,%ymm1,%ymm1
.byte 197,253,91,201 // vcvtps2dq %ymm1,%ymm1
.byte 196,98,125,24,80,20 // vbroadcastss 0x14(%rax),%ymm10
@@ -9380,7 +9378,7 @@ _sk_parametric_g_hsw:
.byte 196,195,117,74,201,128 // vblendvps %ymm8,%ymm9,%ymm1,%ymm1
.byte 196,65,60,87,192 // vxorps %ymm8,%ymm8,%ymm8
.byte 196,193,116,95,200 // vmaxps %ymm8,%ymm1,%ymm1
- .byte 196,98,125,24,5,164,34,0,0 // vbroadcastss 0x22a4(%rip),%ymm8 # 3fe8 <_sk_callback_hsw+0x29f>
+ .byte 196,98,125,24,5,164,34,0,0 // vbroadcastss 0x22a4(%rip),%ymm8 # 3fe4 <_sk_callback_hsw+0x29f>
.byte 196,193,116,93,200 // vminps %ymm8,%ymm1,%ymm1
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 255,224 // jmpq *%rax
@@ -9400,33 +9398,33 @@ _sk_parametric_b_hsw:
.byte 196,66,109,168,211 // vfmadd213ps %ymm11,%ymm2,%ymm10
.byte 196,226,125,24,16 // vbroadcastss (%rax),%ymm2
.byte 196,65,124,91,218 // vcvtdq2ps %ymm10,%ymm11
- .byte 196,98,125,24,37,92,34,0,0 // vbroadcastss 0x225c(%rip),%ymm12 # 3fec <_sk_callback_hsw+0x2a3>
- .byte 196,98,125,24,45,87,34,0,0 // vbroadcastss 0x2257(%rip),%ymm13 # 3ff0 <_sk_callback_hsw+0x2a7>
+ .byte 196,98,125,24,37,92,34,0,0 // vbroadcastss 0x225c(%rip),%ymm12 # 3fe8 <_sk_callback_hsw+0x2a3>
+ .byte 196,98,125,24,45,87,34,0,0 // vbroadcastss 0x2257(%rip),%ymm13 # 3fec <_sk_callback_hsw+0x2a7>
.byte 196,65,44,84,213 // vandps %ymm13,%ymm10,%ymm10
- .byte 196,98,125,24,45,77,34,0,0 // vbroadcastss 0x224d(%rip),%ymm13 # 3ff4 <_sk_callback_hsw+0x2ab>
+ .byte 196,98,125,24,45,77,34,0,0 // vbroadcastss 0x224d(%rip),%ymm13 # 3ff0 <_sk_callback_hsw+0x2ab>
.byte 196,65,44,86,213 // vorps %ymm13,%ymm10,%ymm10
- .byte 196,98,125,24,45,67,34,0,0 // vbroadcastss 0x2243(%rip),%ymm13 # 3ff8 <_sk_callback_hsw+0x2af>
+ .byte 196,98,125,24,45,67,34,0,0 // vbroadcastss 0x2243(%rip),%ymm13 # 3ff4 <_sk_callback_hsw+0x2af>
.byte 196,66,37,184,236 // vfmadd231ps %ymm12,%ymm11,%ymm13
- .byte 196,98,125,24,29,57,34,0,0 // vbroadcastss 0x2239(%rip),%ymm11 # 3ffc <_sk_callback_hsw+0x2b3>
+ .byte 196,98,125,24,29,57,34,0,0 // vbroadcastss 0x2239(%rip),%ymm11 # 3ff8 <_sk_callback_hsw+0x2b3>
.byte 196,66,45,172,221 // vfnmadd213ps %ymm13,%ymm10,%ymm11
- .byte 196,98,125,24,37,47,34,0,0 // vbroadcastss 0x222f(%rip),%ymm12 # 4000 <_sk_callback_hsw+0x2b7>
+ .byte 196,98,125,24,37,47,34,0,0 // vbroadcastss 0x222f(%rip),%ymm12 # 3ffc <_sk_callback_hsw+0x2b7>
.byte 196,65,44,88,212 // vaddps %ymm12,%ymm10,%ymm10
- .byte 196,98,125,24,37,37,34,0,0 // vbroadcastss 0x2225(%rip),%ymm12 # 4004 <_sk_callback_hsw+0x2bb>
+ .byte 196,98,125,24,37,37,34,0,0 // vbroadcastss 0x2225(%rip),%ymm12 # 4000 <_sk_callback_hsw+0x2bb>
.byte 196,65,28,94,210 // vdivps %ymm10,%ymm12,%ymm10
.byte 196,65,36,92,210 // vsubps %ymm10,%ymm11,%ymm10
.byte 196,193,108,89,210 // vmulps %ymm10,%ymm2,%ymm2
.byte 196,99,125,8,210,1 // vroundps $0x1,%ymm2,%ymm10
.byte 196,65,108,92,210 // vsubps %ymm10,%ymm2,%ymm10
- .byte 196,98,125,24,29,6,34,0,0 // vbroadcastss 0x2206(%rip),%ymm11 # 4008 <_sk_callback_hsw+0x2bf>
+ .byte 196,98,125,24,29,6,34,0,0 // vbroadcastss 0x2206(%rip),%ymm11 # 4004 <_sk_callback_hsw+0x2bf>
.byte 196,193,108,88,211 // vaddps %ymm11,%ymm2,%ymm2
- .byte 196,98,125,24,29,252,33,0,0 // vbroadcastss 0x21fc(%rip),%ymm11 # 400c <_sk_callback_hsw+0x2c3>
+ .byte 196,98,125,24,29,252,33,0,0 // vbroadcastss 0x21fc(%rip),%ymm11 # 4008 <_sk_callback_hsw+0x2c3>
.byte 196,98,45,172,218 // vfnmadd213ps %ymm2,%ymm10,%ymm11
- .byte 196,226,125,24,21,242,33,0,0 // vbroadcastss 0x21f2(%rip),%ymm2 # 4010 <_sk_callback_hsw+0x2c7>
+ .byte 196,226,125,24,21,242,33,0,0 // vbroadcastss 0x21f2(%rip),%ymm2 # 400c <_sk_callback_hsw+0x2c7>
.byte 196,193,108,92,210 // vsubps %ymm10,%ymm2,%ymm2
- .byte 196,98,125,24,21,232,33,0,0 // vbroadcastss 0x21e8(%rip),%ymm10 # 4014 <_sk_callback_hsw+0x2cb>
+ .byte 196,98,125,24,21,232,33,0,0 // vbroadcastss 0x21e8(%rip),%ymm10 # 4010 <_sk_callback_hsw+0x2cb>
.byte 197,172,94,210 // vdivps %ymm2,%ymm10,%ymm2
.byte 197,164,88,210 // vaddps %ymm2,%ymm11,%ymm2
- .byte 196,98,125,24,21,219,33,0,0 // vbroadcastss 0x21db(%rip),%ymm10 # 4018 <_sk_callback_hsw+0x2cf>
+ .byte 196,98,125,24,21,219,33,0,0 // vbroadcastss 0x21db(%rip),%ymm10 # 4014 <_sk_callback_hsw+0x2cf>
.byte 196,193,108,89,210 // vmulps %ymm10,%ymm2,%ymm2
.byte 197,253,91,210 // vcvtps2dq %ymm2,%ymm2
.byte 196,98,125,24,80,20 // vbroadcastss 0x14(%rax),%ymm10
@@ -9434,7 +9432,7 @@ _sk_parametric_b_hsw:
.byte 196,195,109,74,209,128 // vblendvps %ymm8,%ymm9,%ymm2,%ymm2
.byte 196,65,60,87,192 // vxorps %ymm8,%ymm8,%ymm8
.byte 196,193,108,95,208 // vmaxps %ymm8,%ymm2,%ymm2
- .byte 196,98,125,24,5,178,33,0,0 // vbroadcastss 0x21b2(%rip),%ymm8 # 401c <_sk_callback_hsw+0x2d3>
+ .byte 196,98,125,24,5,178,33,0,0 // vbroadcastss 0x21b2(%rip),%ymm8 # 4018 <_sk_callback_hsw+0x2d3>
.byte 196,193,108,93,208 // vminps %ymm8,%ymm2,%ymm2
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 255,224 // jmpq *%rax
@@ -9454,33 +9452,33 @@ _sk_parametric_a_hsw:
.byte 196,66,101,168,211 // vfmadd213ps %ymm11,%ymm3,%ymm10
.byte 196,226,125,24,24 // vbroadcastss (%rax),%ymm3
.byte 196,65,124,91,218 // vcvtdq2ps %ymm10,%ymm11
- .byte 196,98,125,24,37,106,33,0,0 // vbroadcastss 0x216a(%rip),%ymm12 # 4020 <_sk_callback_hsw+0x2d7>
- .byte 196,98,125,24,45,101,33,0,0 // vbroadcastss 0x2165(%rip),%ymm13 # 4024 <_sk_callback_hsw+0x2db>
+ .byte 196,98,125,24,37,106,33,0,0 // vbroadcastss 0x216a(%rip),%ymm12 # 401c <_sk_callback_hsw+0x2d7>
+ .byte 196,98,125,24,45,101,33,0,0 // vbroadcastss 0x2165(%rip),%ymm13 # 4020 <_sk_callback_hsw+0x2db>
.byte 196,65,44,84,213 // vandps %ymm13,%ymm10,%ymm10
- .byte 196,98,125,24,45,91,33,0,0 // vbroadcastss 0x215b(%rip),%ymm13 # 4028 <_sk_callback_hsw+0x2df>
+ .byte 196,98,125,24,45,91,33,0,0 // vbroadcastss 0x215b(%rip),%ymm13 # 4024 <_sk_callback_hsw+0x2df>
.byte 196,65,44,86,213 // vorps %ymm13,%ymm10,%ymm10
- .byte 196,98,125,24,45,81,33,0,0 // vbroadcastss 0x2151(%rip),%ymm13 # 402c <_sk_callback_hsw+0x2e3>
+ .byte 196,98,125,24,45,81,33,0,0 // vbroadcastss 0x2151(%rip),%ymm13 # 4028 <_sk_callback_hsw+0x2e3>
.byte 196,66,37,184,236 // vfmadd231ps %ymm12,%ymm11,%ymm13
- .byte 196,98,125,24,29,71,33,0,0 // vbroadcastss 0x2147(%rip),%ymm11 # 4030 <_sk_callback_hsw+0x2e7>
+ .byte 196,98,125,24,29,71,33,0,0 // vbroadcastss 0x2147(%rip),%ymm11 # 402c <_sk_callback_hsw+0x2e7>
.byte 196,66,45,172,221 // vfnmadd213ps %ymm13,%ymm10,%ymm11
- .byte 196,98,125,24,37,61,33,0,0 // vbroadcastss 0x213d(%rip),%ymm12 # 4034 <_sk_callback_hsw+0x2eb>
+ .byte 196,98,125,24,37,61,33,0,0 // vbroadcastss 0x213d(%rip),%ymm12 # 4030 <_sk_callback_hsw+0x2eb>
.byte 196,65,44,88,212 // vaddps %ymm12,%ymm10,%ymm10
- .byte 196,98,125,24,37,51,33,0,0 // vbroadcastss 0x2133(%rip),%ymm12 # 4038 <_sk_callback_hsw+0x2ef>
+ .byte 196,98,125,24,37,51,33,0,0 // vbroadcastss 0x2133(%rip),%ymm12 # 4034 <_sk_callback_hsw+0x2ef>
.byte 196,65,28,94,210 // vdivps %ymm10,%ymm12,%ymm10
.byte 196,65,36,92,210 // vsubps %ymm10,%ymm11,%ymm10
.byte 196,193,100,89,218 // vmulps %ymm10,%ymm3,%ymm3
.byte 196,99,125,8,211,1 // vroundps $0x1,%ymm3,%ymm10
.byte 196,65,100,92,210 // vsubps %ymm10,%ymm3,%ymm10
- .byte 196,98,125,24,29,20,33,0,0 // vbroadcastss 0x2114(%rip),%ymm11 # 403c <_sk_callback_hsw+0x2f3>
+ .byte 196,98,125,24,29,20,33,0,0 // vbroadcastss 0x2114(%rip),%ymm11 # 4038 <_sk_callback_hsw+0x2f3>
.byte 196,193,100,88,219 // vaddps %ymm11,%ymm3,%ymm3
- .byte 196,98,125,24,29,10,33,0,0 // vbroadcastss 0x210a(%rip),%ymm11 # 4040 <_sk_callback_hsw+0x2f7>
+ .byte 196,98,125,24,29,10,33,0,0 // vbroadcastss 0x210a(%rip),%ymm11 # 403c <_sk_callback_hsw+0x2f7>
.byte 196,98,45,172,219 // vfnmadd213ps %ymm3,%ymm10,%ymm11
- .byte 196,226,125,24,29,0,33,0,0 // vbroadcastss 0x2100(%rip),%ymm3 # 4044 <_sk_callback_hsw+0x2fb>
+ .byte 196,226,125,24,29,0,33,0,0 // vbroadcastss 0x2100(%rip),%ymm3 # 4040 <_sk_callback_hsw+0x2fb>
.byte 196,193,100,92,218 // vsubps %ymm10,%ymm3,%ymm3
- .byte 196,98,125,24,21,246,32,0,0 // vbroadcastss 0x20f6(%rip),%ymm10 # 4048 <_sk_callback_hsw+0x2ff>
+ .byte 196,98,125,24,21,246,32,0,0 // vbroadcastss 0x20f6(%rip),%ymm10 # 4044 <_sk_callback_hsw+0x2ff>
.byte 197,172,94,219 // vdivps %ymm3,%ymm10,%ymm3
.byte 197,164,88,219 // vaddps %ymm3,%ymm11,%ymm3
- .byte 196,98,125,24,21,233,32,0,0 // vbroadcastss 0x20e9(%rip),%ymm10 # 404c <_sk_callback_hsw+0x303>
+ .byte 196,98,125,24,21,233,32,0,0 // vbroadcastss 0x20e9(%rip),%ymm10 # 4048 <_sk_callback_hsw+0x303>
.byte 196,193,100,89,218 // vmulps %ymm10,%ymm3,%ymm3
.byte 197,253,91,219 // vcvtps2dq %ymm3,%ymm3
.byte 196,98,125,24,80,20 // vbroadcastss 0x14(%rax),%ymm10
@@ -9488,7 +9486,7 @@ _sk_parametric_a_hsw:
.byte 196,195,101,74,217,128 // vblendvps %ymm8,%ymm9,%ymm3,%ymm3
.byte 196,65,60,87,192 // vxorps %ymm8,%ymm8,%ymm8
.byte 196,193,100,95,216 // vmaxps %ymm8,%ymm3,%ymm3
- .byte 196,98,125,24,5,192,32,0,0 // vbroadcastss 0x20c0(%rip),%ymm8 # 4050 <_sk_callback_hsw+0x307>
+ .byte 196,98,125,24,5,192,32,0,0 // vbroadcastss 0x20c0(%rip),%ymm8 # 404c <_sk_callback_hsw+0x307>
.byte 196,193,100,93,216 // vminps %ymm8,%ymm3,%ymm3
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 255,224 // jmpq *%rax
@@ -9497,26 +9495,26 @@ HIDDEN _sk_lab_to_xyz_hsw
.globl _sk_lab_to_xyz_hsw
FUNCTION(_sk_lab_to_xyz_hsw)
_sk_lab_to_xyz_hsw:
- .byte 196,98,125,24,5,178,32,0,0 // vbroadcastss 0x20b2(%rip),%ymm8 # 4054 <_sk_callback_hsw+0x30b>
- .byte 196,98,125,24,13,173,32,0,0 // vbroadcastss 0x20ad(%rip),%ymm9 # 4058 <_sk_callback_hsw+0x30f>
- .byte 196,98,125,24,21,168,32,0,0 // vbroadcastss 0x20a8(%rip),%ymm10 # 405c <_sk_callback_hsw+0x313>
+ .byte 196,98,125,24,5,178,32,0,0 // vbroadcastss 0x20b2(%rip),%ymm8 # 4050 <_sk_callback_hsw+0x30b>
+ .byte 196,98,125,24,13,173,32,0,0 // vbroadcastss 0x20ad(%rip),%ymm9 # 4054 <_sk_callback_hsw+0x30f>
+ .byte 196,98,125,24,21,168,32,0,0 // vbroadcastss 0x20a8(%rip),%ymm10 # 4058 <_sk_callback_hsw+0x313>
.byte 196,194,53,168,202 // vfmadd213ps %ymm10,%ymm9,%ymm1
.byte 196,194,53,168,210 // vfmadd213ps %ymm10,%ymm9,%ymm2
- .byte 196,98,125,24,13,153,32,0,0 // vbroadcastss 0x2099(%rip),%ymm9 # 4060 <_sk_callback_hsw+0x317>
+ .byte 196,98,125,24,13,153,32,0,0 // vbroadcastss 0x2099(%rip),%ymm9 # 405c <_sk_callback_hsw+0x317>
.byte 196,66,125,184,200 // vfmadd231ps %ymm8,%ymm0,%ymm9
- .byte 196,226,125,24,5,143,32,0,0 // vbroadcastss 0x208f(%rip),%ymm0 # 4064 <_sk_callback_hsw+0x31b>
+ .byte 196,226,125,24,5,143,32,0,0 // vbroadcastss 0x208f(%rip),%ymm0 # 4060 <_sk_callback_hsw+0x31b>
.byte 197,180,89,192 // vmulps %ymm0,%ymm9,%ymm0
- .byte 196,98,125,24,5,134,32,0,0 // vbroadcastss 0x2086(%rip),%ymm8 # 4068 <_sk_callback_hsw+0x31f>
+ .byte 196,98,125,24,5,134,32,0,0 // vbroadcastss 0x2086(%rip),%ymm8 # 4064 <_sk_callback_hsw+0x31f>
.byte 196,98,117,168,192 // vfmadd213ps %ymm0,%ymm1,%ymm8
- .byte 196,98,125,24,13,124,32,0,0 // vbroadcastss 0x207c(%rip),%ymm9 # 406c <_sk_callback_hsw+0x323>
+ .byte 196,98,125,24,13,124,32,0,0 // vbroadcastss 0x207c(%rip),%ymm9 # 4068 <_sk_callback_hsw+0x323>
.byte 196,98,109,172,200 // vfnmadd213ps %ymm0,%ymm2,%ymm9
.byte 196,193,60,89,200 // vmulps %ymm8,%ymm8,%ymm1
.byte 197,188,89,201 // vmulps %ymm1,%ymm8,%ymm1
- .byte 196,226,125,24,21,105,32,0,0 // vbroadcastss 0x2069(%rip),%ymm2 # 4070 <_sk_callback_hsw+0x327>
+ .byte 196,226,125,24,21,105,32,0,0 // vbroadcastss 0x2069(%rip),%ymm2 # 406c <_sk_callback_hsw+0x327>
.byte 197,108,194,209,1 // vcmpltps %ymm1,%ymm2,%ymm10
- .byte 196,98,125,24,29,95,32,0,0 // vbroadcastss 0x205f(%rip),%ymm11 # 4074 <_sk_callback_hsw+0x32b>
+ .byte 196,98,125,24,29,95,32,0,0 // vbroadcastss 0x205f(%rip),%ymm11 # 4070 <_sk_callback_hsw+0x32b>
.byte 196,65,60,88,195 // vaddps %ymm11,%ymm8,%ymm8
- .byte 196,98,125,24,37,85,32,0,0 // vbroadcastss 0x2055(%rip),%ymm12 # 4078 <_sk_callback_hsw+0x32f>
+ .byte 196,98,125,24,37,85,32,0,0 // vbroadcastss 0x2055(%rip),%ymm12 # 4074 <_sk_callback_hsw+0x32f>
.byte 196,65,60,89,196 // vmulps %ymm12,%ymm8,%ymm8
.byte 196,99,61,74,193,160 // vblendvps %ymm10,%ymm1,%ymm8,%ymm8
.byte 197,252,89,200 // vmulps %ymm0,%ymm0,%ymm1
@@ -9531,9 +9529,9 @@ _sk_lab_to_xyz_hsw:
.byte 196,65,52,88,203 // vaddps %ymm11,%ymm9,%ymm9
.byte 196,65,52,89,204 // vmulps %ymm12,%ymm9,%ymm9
.byte 196,227,53,74,208,32 // vblendvps %ymm2,%ymm0,%ymm9,%ymm2
- .byte 196,226,125,24,5,10,32,0,0 // vbroadcastss 0x200a(%rip),%ymm0 # 407c <_sk_callback_hsw+0x333>
+ .byte 196,226,125,24,5,10,32,0,0 // vbroadcastss 0x200a(%rip),%ymm0 # 4078 <_sk_callback_hsw+0x333>
.byte 197,188,89,192 // vmulps %ymm0,%ymm8,%ymm0
- .byte 196,98,125,24,5,1,32,0,0 // vbroadcastss 0x2001(%rip),%ymm8 # 4080 <_sk_callback_hsw+0x337>
+ .byte 196,98,125,24,5,1,32,0,0 // vbroadcastss 0x2001(%rip),%ymm8 # 407c <_sk_callback_hsw+0x337>
.byte 196,193,108,89,208 // vmulps %ymm8,%ymm2,%ymm2
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 255,224 // jmpq *%rax
@@ -9547,11 +9545,11 @@ _sk_load_a8_hsw:
.byte 72,139,0 // mov (%rax),%rax
.byte 72,1,248 // add %rdi,%rax
.byte 77,133,192 // test %r8,%r8
- .byte 117,45 // jne 20c5 <_sk_load_a8_hsw+0x3d>
+ .byte 117,45 // jne 20c1 <_sk_load_a8_hsw+0x3d>
.byte 197,250,126,0 // vmovq (%rax),%xmm0
.byte 196,226,125,49,192 // vpmovzxbd %xmm0,%ymm0
.byte 197,252,91,192 // vcvtdq2ps %ymm0,%ymm0
- .byte 196,226,125,24,13,214,31,0,0 // vbroadcastss 0x1fd6(%rip),%ymm1 # 4084 <_sk_callback_hsw+0x33b>
+ .byte 196,226,125,24,13,214,31,0,0 // vbroadcastss 0x1fd6(%rip),%ymm1 # 4080 <_sk_callback_hsw+0x33b>
.byte 197,252,89,217 // vmulps %ymm1,%ymm0,%ymm3
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 197,252,87,192 // vxorps %ymm0,%ymm0,%ymm0
@@ -9568,9 +9566,9 @@ _sk_load_a8_hsw:
.byte 77,9,217 // or %r11,%r9
.byte 72,131,193,8 // add $0x8,%rcx
.byte 73,255,202 // dec %r10
- .byte 117,234 // jne 20cd <_sk_load_a8_hsw+0x45>
+ .byte 117,234 // jne 20c9 <_sk_load_a8_hsw+0x45>
.byte 196,193,249,110,193 // vmovq %r9,%xmm0
- .byte 235,178 // jmp 209c <_sk_load_a8_hsw+0x14>
+ .byte 235,178 // jmp 2098 <_sk_load_a8_hsw+0x14>
HIDDEN _sk_gather_a8_hsw
.globl _sk_gather_a8_hsw
@@ -9616,7 +9614,7 @@ _sk_gather_a8_hsw:
.byte 196,227,121,32,192,7 // vpinsrb $0x7,%eax,%xmm0,%xmm0
.byte 196,226,125,49,192 // vpmovzxbd %xmm0,%ymm0
.byte 197,252,91,192 // vcvtdq2ps %ymm0,%ymm0
- .byte 196,226,125,24,13,225,30,0,0 // vbroadcastss 0x1ee1(%rip),%ymm1 # 4088 <_sk_callback_hsw+0x33f>
+ .byte 196,226,125,24,13,225,30,0,0 // vbroadcastss 0x1ee1(%rip),%ymm1 # 4084 <_sk_callback_hsw+0x33f>
.byte 197,252,89,217 // vmulps %ymm1,%ymm0,%ymm3
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 197,252,87,192 // vxorps %ymm0,%ymm0,%ymm0
@@ -9634,14 +9632,14 @@ FUNCTION(_sk_store_a8_hsw)
_sk_store_a8_hsw:
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 76,139,16 // mov (%rax),%r10
- .byte 196,98,125,24,5,188,30,0,0 // vbroadcastss 0x1ebc(%rip),%ymm8 # 408c <_sk_callback_hsw+0x343>
+ .byte 196,98,125,24,5,188,30,0,0 // vbroadcastss 0x1ebc(%rip),%ymm8 # 4088 <_sk_callback_hsw+0x343>
.byte 196,65,100,89,192 // vmulps %ymm8,%ymm3,%ymm8
.byte 196,65,125,91,192 // vcvtps2dq %ymm8,%ymm8
.byte 196,67,125,25,193,1 // vextractf128 $0x1,%ymm8,%xmm9
.byte 196,66,57,43,193 // vpackusdw %xmm9,%xmm8,%xmm8
.byte 196,65,57,103,192 // vpackuswb %xmm8,%xmm8,%xmm8
.byte 72,133,201 // test %rcx,%rcx
- .byte 117,10 // jne 21f9 <_sk_store_a8_hsw+0x37>
+ .byte 117,10 // jne 21f5 <_sk_store_a8_hsw+0x37>
.byte 196,65,123,17,4,58 // vmovsd %xmm8,(%r10,%rdi,1)
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 255,224 // jmpq *%rax
@@ -9649,10 +9647,10 @@ _sk_store_a8_hsw:
.byte 65,128,224,7 // and $0x7,%r8b
.byte 65,254,200 // dec %r8b
.byte 65,128,248,6 // cmp $0x6,%r8b
- .byte 119,236 // ja 21f5 <_sk_store_a8_hsw+0x33>
+ .byte 119,236 // ja 21f1 <_sk_store_a8_hsw+0x33>
.byte 196,66,121,48,192 // vpmovzxbw %xmm8,%xmm8
.byte 69,15,182,192 // movzbl %r8b,%r8d
- .byte 76,141,13,67,0,0,0 // lea 0x43(%rip),%r9 # 225c <_sk_store_a8_hsw+0x9a>
+ .byte 76,141,13,67,0,0,0 // lea 0x43(%rip),%r9 # 2258 <_sk_store_a8_hsw+0x9a>
.byte 75,99,4,129 // movslq (%r9,%r8,4),%rax
.byte 76,1,200 // add %r9,%rax
.byte 255,224 // jmpq *%rax
@@ -9663,7 +9661,7 @@ _sk_store_a8_hsw:
.byte 196,67,121,20,68,58,2,4 // vpextrb $0x4,%xmm8,0x2(%r10,%rdi,1)
.byte 196,67,121,20,68,58,1,2 // vpextrb $0x2,%xmm8,0x1(%r10,%rdi,1)
.byte 196,67,121,20,4,58,0 // vpextrb $0x0,%xmm8,(%r10,%rdi,1)
- .byte 235,154 // jmp 21f5 <_sk_store_a8_hsw+0x33>
+ .byte 235,154 // jmp 21f1 <_sk_store_a8_hsw+0x33>
.byte 144 // nop
.byte 246,255 // idiv %bh
.byte 255 // (bad)
@@ -9697,14 +9695,14 @@ _sk_load_g8_hsw:
.byte 72,139,0 // mov (%rax),%rax
.byte 72,1,248 // add %rdi,%rax
.byte 77,133,192 // test %r8,%r8
- .byte 117,50 // jne 22ba <_sk_load_g8_hsw+0x42>
+ .byte 117,50 // jne 22b6 <_sk_load_g8_hsw+0x42>
.byte 197,250,126,0 // vmovq (%rax),%xmm0
.byte 196,226,125,49,192 // vpmovzxbd %xmm0,%ymm0
.byte 197,252,91,192 // vcvtdq2ps %ymm0,%ymm0
- .byte 196,226,125,24,13,242,29,0,0 // vbroadcastss 0x1df2(%rip),%ymm1 # 4090 <_sk_callback_hsw+0x347>
+ .byte 196,226,125,24,13,242,29,0,0 // vbroadcastss 0x1df2(%rip),%ymm1 # 408c <_sk_callback_hsw+0x347>
.byte 197,252,89,193 // vmulps %ymm1,%ymm0,%ymm0
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 196,226,125,24,29,231,29,0,0 // vbroadcastss 0x1de7(%rip),%ymm3 # 4094 <_sk_callback_hsw+0x34b>
+ .byte 196,226,125,24,29,231,29,0,0 // vbroadcastss 0x1de7(%rip),%ymm3 # 4090 <_sk_callback_hsw+0x34b>
.byte 76,137,193 // mov %r8,%rcx
.byte 197,252,40,200 // vmovaps %ymm0,%ymm1
.byte 197,252,40,208 // vmovaps %ymm0,%ymm2
@@ -9718,9 +9716,9 @@ _sk_load_g8_hsw:
.byte 77,9,217 // or %r11,%r9
.byte 72,131,193,8 // add $0x8,%rcx
.byte 73,255,202 // dec %r10
- .byte 117,234 // jne 22c2 <_sk_load_g8_hsw+0x4a>
+ .byte 117,234 // jne 22be <_sk_load_g8_hsw+0x4a>
.byte 196,193,249,110,193 // vmovq %r9,%xmm0
- .byte 235,173 // jmp 228c <_sk_load_g8_hsw+0x14>
+ .byte 235,173 // jmp 2288 <_sk_load_g8_hsw+0x14>
HIDDEN _sk_gather_g8_hsw
.globl _sk_gather_g8_hsw
@@ -9766,10 +9764,10 @@ _sk_gather_g8_hsw:
.byte 196,227,121,32,192,7 // vpinsrb $0x7,%eax,%xmm0,%xmm0
.byte 196,226,125,49,192 // vpmovzxbd %xmm0,%ymm0
.byte 197,252,91,192 // vcvtdq2ps %ymm0,%ymm0
- .byte 196,226,125,24,13,252,28,0,0 // vbroadcastss 0x1cfc(%rip),%ymm1 # 4098 <_sk_callback_hsw+0x34f>
+ .byte 196,226,125,24,13,252,28,0,0 // vbroadcastss 0x1cfc(%rip),%ymm1 # 4094 <_sk_callback_hsw+0x34f>
.byte 197,252,89,193 // vmulps %ymm1,%ymm0,%ymm0
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 196,226,125,24,29,241,28,0,0 // vbroadcastss 0x1cf1(%rip),%ymm3 # 409c <_sk_callback_hsw+0x353>
+ .byte 196,226,125,24,29,241,28,0,0 // vbroadcastss 0x1cf1(%rip),%ymm3 # 4098 <_sk_callback_hsw+0x353>
.byte 197,252,40,200 // vmovaps %ymm0,%ymm1
.byte 197,252,40,208 // vmovaps %ymm0,%ymm2
.byte 91 // pop %rbx
@@ -9785,9 +9783,9 @@ _sk_gather_i8_hsw:
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 73,137,192 // mov %rax,%r8
.byte 77,133,192 // test %r8,%r8
- .byte 116,5 // je 23cb <_sk_gather_i8_hsw+0xf>
+ .byte 116,5 // je 23c7 <_sk_gather_i8_hsw+0xf>
.byte 76,137,192 // mov %r8,%rax
- .byte 235,2 // jmp 23cd <_sk_gather_i8_hsw+0x11>
+ .byte 235,2 // jmp 23c9 <_sk_gather_i8_hsw+0x11>
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 65,87 // push %r15
.byte 65,86 // push %r14
@@ -9825,14 +9823,14 @@ _sk_gather_i8_hsw:
.byte 73,139,64,8 // mov 0x8(%r8),%rax
.byte 197,245,118,201 // vpcmpeqd %ymm1,%ymm1,%ymm1
.byte 196,226,117,144,28,128 // vpgatherdd %ymm1,(%rax,%ymm0,4),%ymm3
- .byte 197,229,219,5,5,30,0,0 // vpand 0x1e05(%rip),%ymm3,%ymm0 # 4280 <_sk_callback_hsw+0x537>
+ .byte 197,229,219,5,9,30,0,0 // vpand 0x1e09(%rip),%ymm3,%ymm0 # 4280 <_sk_callback_hsw+0x53b>
.byte 197,252,91,192 // vcvtdq2ps %ymm0,%ymm0
- .byte 196,98,125,24,5,24,28,0,0 // vbroadcastss 0x1c18(%rip),%ymm8 # 40a0 <_sk_callback_hsw+0x357>
+ .byte 196,98,125,24,5,24,28,0,0 // vbroadcastss 0x1c18(%rip),%ymm8 # 409c <_sk_callback_hsw+0x357>
.byte 196,193,124,89,192 // vmulps %ymm8,%ymm0,%ymm0
- .byte 196,226,101,0,13,10,30,0,0 // vpshufb 0x1e0a(%rip),%ymm3,%ymm1 # 42a0 <_sk_callback_hsw+0x557>
+ .byte 196,226,101,0,13,14,30,0,0 // vpshufb 0x1e0e(%rip),%ymm3,%ymm1 # 42a0 <_sk_callback_hsw+0x55b>
.byte 197,252,91,201 // vcvtdq2ps %ymm1,%ymm1
.byte 196,193,116,89,200 // vmulps %ymm8,%ymm1,%ymm1
- .byte 196,226,101,0,21,24,30,0,0 // vpshufb 0x1e18(%rip),%ymm3,%ymm2 # 42c0 <_sk_callback_hsw+0x577>
+ .byte 196,226,101,0,21,28,30,0,0 // vpshufb 0x1e1c(%rip),%ymm3,%ymm2 # 42c0 <_sk_callback_hsw+0x57b>
.byte 197,252,91,210 // vcvtdq2ps %ymm2,%ymm2
.byte 196,193,108,89,208 // vmulps %ymm8,%ymm2,%ymm2
.byte 197,229,114,211,24 // vpsrld $0x18,%ymm3,%ymm3
@@ -9853,35 +9851,35 @@ _sk_load_565_hsw:
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 76,139,16 // mov (%rax),%r10
.byte 72,133,201 // test %rcx,%rcx
- .byte 117,114 // jne 2548 <_sk_load_565_hsw+0x7c>
+ .byte 117,114 // jne 2544 <_sk_load_565_hsw+0x7c>
.byte 196,193,122,111,4,122 // vmovdqu (%r10,%rdi,2),%xmm0
.byte 196,226,125,51,208 // vpmovzxwd %xmm0,%ymm2
- .byte 196,226,125,88,5,186,27,0,0 // vpbroadcastd 0x1bba(%rip),%ymm0 # 40a4 <_sk_callback_hsw+0x35b>
+ .byte 196,226,125,88,5,186,27,0,0 // vpbroadcastd 0x1bba(%rip),%ymm0 # 40a0 <_sk_callback_hsw+0x35b>
.byte 197,237,219,192 // vpand %ymm0,%ymm2,%ymm0
.byte 197,252,91,192 // vcvtdq2ps %ymm0,%ymm0
- .byte 196,226,125,24,13,173,27,0,0 // vbroadcastss 0x1bad(%rip),%ymm1 # 40a8 <_sk_callback_hsw+0x35f>
+ .byte 196,226,125,24,13,173,27,0,0 // vbroadcastss 0x1bad(%rip),%ymm1 # 40a4 <_sk_callback_hsw+0x35f>
.byte 197,252,89,193 // vmulps %ymm1,%ymm0,%ymm0
- .byte 196,226,125,88,13,164,27,0,0 // vpbroadcastd 0x1ba4(%rip),%ymm1 # 40ac <_sk_callback_hsw+0x363>
+ .byte 196,226,125,88,13,164,27,0,0 // vpbroadcastd 0x1ba4(%rip),%ymm1 # 40a8 <_sk_callback_hsw+0x363>
.byte 197,237,219,201 // vpand %ymm1,%ymm2,%ymm1
.byte 197,252,91,201 // vcvtdq2ps %ymm1,%ymm1
- .byte 196,226,125,24,29,151,27,0,0 // vbroadcastss 0x1b97(%rip),%ymm3 # 40b0 <_sk_callback_hsw+0x367>
+ .byte 196,226,125,24,29,151,27,0,0 // vbroadcastss 0x1b97(%rip),%ymm3 # 40ac <_sk_callback_hsw+0x367>
.byte 197,244,89,203 // vmulps %ymm3,%ymm1,%ymm1
- .byte 196,226,125,88,29,142,27,0,0 // vpbroadcastd 0x1b8e(%rip),%ymm3 # 40b4 <_sk_callback_hsw+0x36b>
+ .byte 196,226,125,88,29,142,27,0,0 // vpbroadcastd 0x1b8e(%rip),%ymm3 # 40b0 <_sk_callback_hsw+0x36b>
.byte 197,237,219,211 // vpand %ymm3,%ymm2,%ymm2
.byte 197,252,91,210 // vcvtdq2ps %ymm2,%ymm2
- .byte 196,226,125,24,29,129,27,0,0 // vbroadcastss 0x1b81(%rip),%ymm3 # 40b8 <_sk_callback_hsw+0x36f>
+ .byte 196,226,125,24,29,129,27,0,0 // vbroadcastss 0x1b81(%rip),%ymm3 # 40b4 <_sk_callback_hsw+0x36f>
.byte 197,236,89,211 // vmulps %ymm3,%ymm2,%ymm2
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 196,226,125,24,29,118,27,0,0 // vbroadcastss 0x1b76(%rip),%ymm3 # 40bc <_sk_callback_hsw+0x373>
+ .byte 196,226,125,24,29,118,27,0,0 // vbroadcastss 0x1b76(%rip),%ymm3 # 40b8 <_sk_callback_hsw+0x373>
.byte 255,224 // jmpq *%rax
.byte 65,137,200 // mov %ecx,%r8d
.byte 65,128,224,7 // and $0x7,%r8b
.byte 197,249,239,192 // vpxor %xmm0,%xmm0,%xmm0
.byte 65,254,200 // dec %r8b
.byte 65,128,248,6 // cmp $0x6,%r8b
- .byte 119,128 // ja 24dc <_sk_load_565_hsw+0x10>
+ .byte 119,128 // ja 24d8 <_sk_load_565_hsw+0x10>
.byte 69,15,182,192 // movzbl %r8b,%r8d
- .byte 76,141,13,73,0,0,0 // lea 0x49(%rip),%r9 # 25b0 <_sk_load_565_hsw+0xe4>
+ .byte 76,141,13,73,0,0,0 // lea 0x49(%rip),%r9 # 25ac <_sk_load_565_hsw+0xe4>
.byte 75,99,4,129 // movslq (%r9,%r8,4),%rax
.byte 76,1,200 // add %r9,%rax
.byte 255,224 // jmpq *%rax
@@ -9893,7 +9891,7 @@ _sk_load_565_hsw:
.byte 196,193,121,196,68,122,4,2 // vpinsrw $0x2,0x4(%r10,%rdi,2),%xmm0,%xmm0
.byte 196,193,121,196,68,122,2,1 // vpinsrw $0x1,0x2(%r10,%rdi,2),%xmm0,%xmm0
.byte 196,193,121,196,4,122,0 // vpinsrw $0x0,(%r10,%rdi,2),%xmm0,%xmm0
- .byte 233,44,255,255,255 // jmpq 24dc <_sk_load_565_hsw+0x10>
+ .byte 233,44,255,255,255 // jmpq 24d8 <_sk_load_565_hsw+0x10>
.byte 244 // hlt
.byte 255 // (bad)
.byte 255 // (bad)
@@ -9963,23 +9961,23 @@ _sk_gather_565_hsw:
.byte 65,15,183,4,88 // movzwl (%r8,%rbx,2),%eax
.byte 197,249,196,192,7 // vpinsrw $0x7,%eax,%xmm0,%xmm0
.byte 196,226,125,51,208 // vpmovzxwd %xmm0,%ymm2
- .byte 196,226,125,88,5,57,26,0,0 // vpbroadcastd 0x1a39(%rip),%ymm0 # 40c0 <_sk_callback_hsw+0x377>
+ .byte 196,226,125,88,5,57,26,0,0 // vpbroadcastd 0x1a39(%rip),%ymm0 # 40bc <_sk_callback_hsw+0x377>
.byte 197,237,219,192 // vpand %ymm0,%ymm2,%ymm0
.byte 197,252,91,192 // vcvtdq2ps %ymm0,%ymm0
- .byte 196,226,125,24,13,44,26,0,0 // vbroadcastss 0x1a2c(%rip),%ymm1 # 40c4 <_sk_callback_hsw+0x37b>
+ .byte 196,226,125,24,13,44,26,0,0 // vbroadcastss 0x1a2c(%rip),%ymm1 # 40c0 <_sk_callback_hsw+0x37b>
.byte 197,252,89,193 // vmulps %ymm1,%ymm0,%ymm0
- .byte 196,226,125,88,13,35,26,0,0 // vpbroadcastd 0x1a23(%rip),%ymm1 # 40c8 <_sk_callback_hsw+0x37f>
+ .byte 196,226,125,88,13,35,26,0,0 // vpbroadcastd 0x1a23(%rip),%ymm1 # 40c4 <_sk_callback_hsw+0x37f>
.byte 197,237,219,201 // vpand %ymm1,%ymm2,%ymm1
.byte 197,252,91,201 // vcvtdq2ps %ymm1,%ymm1
- .byte 196,226,125,24,29,22,26,0,0 // vbroadcastss 0x1a16(%rip),%ymm3 # 40cc <_sk_callback_hsw+0x383>
+ .byte 196,226,125,24,29,22,26,0,0 // vbroadcastss 0x1a16(%rip),%ymm3 # 40c8 <_sk_callback_hsw+0x383>
.byte 197,244,89,203 // vmulps %ymm3,%ymm1,%ymm1
- .byte 196,226,125,88,29,13,26,0,0 // vpbroadcastd 0x1a0d(%rip),%ymm3 # 40d0 <_sk_callback_hsw+0x387>
+ .byte 196,226,125,88,29,13,26,0,0 // vpbroadcastd 0x1a0d(%rip),%ymm3 # 40cc <_sk_callback_hsw+0x387>
.byte 197,237,219,211 // vpand %ymm3,%ymm2,%ymm2
.byte 197,252,91,210 // vcvtdq2ps %ymm2,%ymm2
- .byte 196,226,125,24,29,0,26,0,0 // vbroadcastss 0x1a00(%rip),%ymm3 # 40d4 <_sk_callback_hsw+0x38b>
+ .byte 196,226,125,24,29,0,26,0,0 // vbroadcastss 0x1a00(%rip),%ymm3 # 40d0 <_sk_callback_hsw+0x38b>
.byte 197,236,89,211 // vmulps %ymm3,%ymm2,%ymm2
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 196,226,125,24,29,245,25,0,0 // vbroadcastss 0x19f5(%rip),%ymm3 # 40d8 <_sk_callback_hsw+0x38f>
+ .byte 196,226,125,24,29,245,25,0,0 // vbroadcastss 0x19f5(%rip),%ymm3 # 40d4 <_sk_callback_hsw+0x38f>
.byte 91 // pop %rbx
.byte 65,92 // pop %r12
.byte 65,94 // pop %r14
@@ -9992,11 +9990,11 @@ FUNCTION(_sk_store_565_hsw)
_sk_store_565_hsw:
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 76,139,16 // mov (%rax),%r10
- .byte 196,98,125,24,5,226,25,0,0 // vbroadcastss 0x19e2(%rip),%ymm8 # 40dc <_sk_callback_hsw+0x393>
+ .byte 196,98,125,24,5,226,25,0,0 // vbroadcastss 0x19e2(%rip),%ymm8 # 40d8 <_sk_callback_hsw+0x393>
.byte 196,65,124,89,200 // vmulps %ymm8,%ymm0,%ymm9
.byte 196,65,125,91,201 // vcvtps2dq %ymm9,%ymm9
.byte 196,193,53,114,241,11 // vpslld $0xb,%ymm9,%ymm9
- .byte 196,98,125,24,21,205,25,0,0 // vbroadcastss 0x19cd(%rip),%ymm10 # 40e0 <_sk_callback_hsw+0x397>
+ .byte 196,98,125,24,21,205,25,0,0 // vbroadcastss 0x19cd(%rip),%ymm10 # 40dc <_sk_callback_hsw+0x397>
.byte 196,65,116,89,210 // vmulps %ymm10,%ymm1,%ymm10
.byte 196,65,125,91,210 // vcvtps2dq %ymm10,%ymm10
.byte 196,193,45,114,242,5 // vpslld $0x5,%ymm10,%ymm10
@@ -10007,7 +10005,7 @@ _sk_store_565_hsw:
.byte 196,67,125,57,193,1 // vextracti128 $0x1,%ymm8,%xmm9
.byte 196,66,57,43,193 // vpackusdw %xmm9,%xmm8,%xmm8
.byte 72,133,201 // test %rcx,%rcx
- .byte 117,10 // jne 2751 <_sk_store_565_hsw+0x65>
+ .byte 117,10 // jne 274d <_sk_store_565_hsw+0x65>
.byte 196,65,122,127,4,122 // vmovdqu %xmm8,(%r10,%rdi,2)
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 255,224 // jmpq *%rax
@@ -10015,9 +10013,9 @@ _sk_store_565_hsw:
.byte 65,128,224,7 // and $0x7,%r8b
.byte 65,254,200 // dec %r8b
.byte 65,128,248,6 // cmp $0x6,%r8b
- .byte 119,236 // ja 274d <_sk_store_565_hsw+0x61>
+ .byte 119,236 // ja 2749 <_sk_store_565_hsw+0x61>
.byte 69,15,182,192 // movzbl %r8b,%r8d
- .byte 76,141,13,68,0,0,0 // lea 0x44(%rip),%r9 # 27b0 <_sk_store_565_hsw+0xc4>
+ .byte 76,141,13,68,0,0,0 // lea 0x44(%rip),%r9 # 27ac <_sk_store_565_hsw+0xc4>
.byte 75,99,4,129 // movslq (%r9,%r8,4),%rax
.byte 76,1,200 // add %r9,%rax
.byte 255,224 // jmpq *%rax
@@ -10028,7 +10026,7 @@ _sk_store_565_hsw:
.byte 196,67,121,21,68,122,4,2 // vpextrw $0x2,%xmm8,0x4(%r10,%rdi,2)
.byte 196,67,121,21,68,122,2,1 // vpextrw $0x1,%xmm8,0x2(%r10,%rdi,2)
.byte 196,67,121,21,4,122,0 // vpextrw $0x0,%xmm8,(%r10,%rdi,2)
- .byte 235,159 // jmp 274d <_sk_store_565_hsw+0x61>
+ .byte 235,159 // jmp 2749 <_sk_store_565_hsw+0x61>
.byte 102,144 // xchg %ax,%ax
.byte 245 // cmc
.byte 255 // (bad)
@@ -10061,28 +10059,28 @@ _sk_load_4444_hsw:
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 76,139,16 // mov (%rax),%r10
.byte 72,133,201 // test %rcx,%rcx
- .byte 15,133,138,0,0,0 // jne 2864 <_sk_load_4444_hsw+0x98>
+ .byte 15,133,138,0,0,0 // jne 2860 <_sk_load_4444_hsw+0x98>
.byte 196,193,122,111,4,122 // vmovdqu (%r10,%rdi,2),%xmm0
.byte 196,226,125,51,216 // vpmovzxwd %xmm0,%ymm3
- .byte 196,226,125,88,5,246,24,0,0 // vpbroadcastd 0x18f6(%rip),%ymm0 # 40e4 <_sk_callback_hsw+0x39b>
+ .byte 196,226,125,88,5,246,24,0,0 // vpbroadcastd 0x18f6(%rip),%ymm0 # 40e0 <_sk_callback_hsw+0x39b>
.byte 197,229,219,192 // vpand %ymm0,%ymm3,%ymm0
.byte 197,252,91,192 // vcvtdq2ps %ymm0,%ymm0
- .byte 196,226,125,24,13,233,24,0,0 // vbroadcastss 0x18e9(%rip),%ymm1 # 40e8 <_sk_callback_hsw+0x39f>
+ .byte 196,226,125,24,13,233,24,0,0 // vbroadcastss 0x18e9(%rip),%ymm1 # 40e4 <_sk_callback_hsw+0x39f>
.byte 197,252,89,193 // vmulps %ymm1,%ymm0,%ymm0
- .byte 196,226,125,88,13,224,24,0,0 // vpbroadcastd 0x18e0(%rip),%ymm1 # 40ec <_sk_callback_hsw+0x3a3>
+ .byte 196,226,125,88,13,224,24,0,0 // vpbroadcastd 0x18e0(%rip),%ymm1 # 40e8 <_sk_callback_hsw+0x3a3>
.byte 197,229,219,201 // vpand %ymm1,%ymm3,%ymm1
.byte 197,252,91,201 // vcvtdq2ps %ymm1,%ymm1
- .byte 196,226,125,24,21,211,24,0,0 // vbroadcastss 0x18d3(%rip),%ymm2 # 40f0 <_sk_callback_hsw+0x3a7>
+ .byte 196,226,125,24,21,211,24,0,0 // vbroadcastss 0x18d3(%rip),%ymm2 # 40ec <_sk_callback_hsw+0x3a7>
.byte 197,244,89,202 // vmulps %ymm2,%ymm1,%ymm1
- .byte 196,226,125,88,21,202,24,0,0 // vpbroadcastd 0x18ca(%rip),%ymm2 # 40f4 <_sk_callback_hsw+0x3ab>
+ .byte 196,226,125,88,21,202,24,0,0 // vpbroadcastd 0x18ca(%rip),%ymm2 # 40f0 <_sk_callback_hsw+0x3ab>
.byte 197,229,219,210 // vpand %ymm2,%ymm3,%ymm2
.byte 197,252,91,210 // vcvtdq2ps %ymm2,%ymm2
- .byte 196,98,125,24,5,189,24,0,0 // vbroadcastss 0x18bd(%rip),%ymm8 # 40f8 <_sk_callback_hsw+0x3af>
+ .byte 196,98,125,24,5,189,24,0,0 // vbroadcastss 0x18bd(%rip),%ymm8 # 40f4 <_sk_callback_hsw+0x3af>
.byte 196,193,108,89,208 // vmulps %ymm8,%ymm2,%ymm2
- .byte 196,98,125,88,5,179,24,0,0 // vpbroadcastd 0x18b3(%rip),%ymm8 # 40fc <_sk_callback_hsw+0x3b3>
+ .byte 196,98,125,88,5,179,24,0,0 // vpbroadcastd 0x18b3(%rip),%ymm8 # 40f8 <_sk_callback_hsw+0x3b3>
.byte 196,193,101,219,216 // vpand %ymm8,%ymm3,%ymm3
.byte 197,252,91,219 // vcvtdq2ps %ymm3,%ymm3
- .byte 196,98,125,24,5,165,24,0,0 // vbroadcastss 0x18a5(%rip),%ymm8 # 4100 <_sk_callback_hsw+0x3b7>
+ .byte 196,98,125,24,5,165,24,0,0 // vbroadcastss 0x18a5(%rip),%ymm8 # 40fc <_sk_callback_hsw+0x3b7>
.byte 196,193,100,89,216 // vmulps %ymm8,%ymm3,%ymm3
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 255,224 // jmpq *%rax
@@ -10091,9 +10089,9 @@ _sk_load_4444_hsw:
.byte 197,249,239,192 // vpxor %xmm0,%xmm0,%xmm0
.byte 65,254,200 // dec %r8b
.byte 65,128,248,6 // cmp $0x6,%r8b
- .byte 15,135,100,255,255,255 // ja 27e0 <_sk_load_4444_hsw+0x14>
+ .byte 15,135,100,255,255,255 // ja 27dc <_sk_load_4444_hsw+0x14>
.byte 69,15,182,192 // movzbl %r8b,%r8d
- .byte 76,141,13,73,0,0,0 // lea 0x49(%rip),%r9 # 28d0 <_sk_load_4444_hsw+0x104>
+ .byte 76,141,13,73,0,0,0 // lea 0x49(%rip),%r9 # 28cc <_sk_load_4444_hsw+0x104>
.byte 75,99,4,129 // movslq (%r9,%r8,4),%rax
.byte 76,1,200 // add %r9,%rax
.byte 255,224 // jmpq *%rax
@@ -10105,7 +10103,7 @@ _sk_load_4444_hsw:
.byte 196,193,121,196,68,122,4,2 // vpinsrw $0x2,0x4(%r10,%rdi,2),%xmm0,%xmm0
.byte 196,193,121,196,68,122,2,1 // vpinsrw $0x1,0x2(%r10,%rdi,2),%xmm0,%xmm0
.byte 196,193,121,196,4,122,0 // vpinsrw $0x0,(%r10,%rdi,2),%xmm0,%xmm0
- .byte 233,16,255,255,255 // jmpq 27e0 <_sk_load_4444_hsw+0x14>
+ .byte 233,16,255,255,255 // jmpq 27dc <_sk_load_4444_hsw+0x14>
.byte 244 // hlt
.byte 255 // (bad)
.byte 255 // (bad)
@@ -10175,25 +10173,25 @@ _sk_gather_4444_hsw:
.byte 65,15,183,4,88 // movzwl (%r8,%rbx,2),%eax
.byte 197,249,196,192,7 // vpinsrw $0x7,%eax,%xmm0,%xmm0
.byte 196,226,125,51,216 // vpmovzxwd %xmm0,%ymm3
- .byte 196,226,125,88,5,93,23,0,0 // vpbroadcastd 0x175d(%rip),%ymm0 # 4104 <_sk_callback_hsw+0x3bb>
+ .byte 196,226,125,88,5,93,23,0,0 // vpbroadcastd 0x175d(%rip),%ymm0 # 4100 <_sk_callback_hsw+0x3bb>
.byte 197,229,219,192 // vpand %ymm0,%ymm3,%ymm0
.byte 197,252,91,192 // vcvtdq2ps %ymm0,%ymm0
- .byte 196,226,125,24,13,80,23,0,0 // vbroadcastss 0x1750(%rip),%ymm1 # 4108 <_sk_callback_hsw+0x3bf>
+ .byte 196,226,125,24,13,80,23,0,0 // vbroadcastss 0x1750(%rip),%ymm1 # 4104 <_sk_callback_hsw+0x3bf>
.byte 197,252,89,193 // vmulps %ymm1,%ymm0,%ymm0
- .byte 196,226,125,88,13,71,23,0,0 // vpbroadcastd 0x1747(%rip),%ymm1 # 410c <_sk_callback_hsw+0x3c3>
+ .byte 196,226,125,88,13,71,23,0,0 // vpbroadcastd 0x1747(%rip),%ymm1 # 4108 <_sk_callback_hsw+0x3c3>
.byte 197,229,219,201 // vpand %ymm1,%ymm3,%ymm1
.byte 197,252,91,201 // vcvtdq2ps %ymm1,%ymm1
- .byte 196,226,125,24,21,58,23,0,0 // vbroadcastss 0x173a(%rip),%ymm2 # 4110 <_sk_callback_hsw+0x3c7>
+ .byte 196,226,125,24,21,58,23,0,0 // vbroadcastss 0x173a(%rip),%ymm2 # 410c <_sk_callback_hsw+0x3c7>
.byte 197,244,89,202 // vmulps %ymm2,%ymm1,%ymm1
- .byte 196,226,125,88,21,49,23,0,0 // vpbroadcastd 0x1731(%rip),%ymm2 # 4114 <_sk_callback_hsw+0x3cb>
+ .byte 196,226,125,88,21,49,23,0,0 // vpbroadcastd 0x1731(%rip),%ymm2 # 4110 <_sk_callback_hsw+0x3cb>
.byte 197,229,219,210 // vpand %ymm2,%ymm3,%ymm2
.byte 197,252,91,210 // vcvtdq2ps %ymm2,%ymm2
- .byte 196,98,125,24,5,36,23,0,0 // vbroadcastss 0x1724(%rip),%ymm8 # 4118 <_sk_callback_hsw+0x3cf>
+ .byte 196,98,125,24,5,36,23,0,0 // vbroadcastss 0x1724(%rip),%ymm8 # 4114 <_sk_callback_hsw+0x3cf>
.byte 196,193,108,89,208 // vmulps %ymm8,%ymm2,%ymm2
- .byte 196,98,125,88,5,26,23,0,0 // vpbroadcastd 0x171a(%rip),%ymm8 # 411c <_sk_callback_hsw+0x3d3>
+ .byte 196,98,125,88,5,26,23,0,0 // vpbroadcastd 0x171a(%rip),%ymm8 # 4118 <_sk_callback_hsw+0x3d3>
.byte 196,193,101,219,216 // vpand %ymm8,%ymm3,%ymm3
.byte 197,252,91,219 // vcvtdq2ps %ymm3,%ymm3
- .byte 196,98,125,24,5,12,23,0,0 // vbroadcastss 0x170c(%rip),%ymm8 # 4120 <_sk_callback_hsw+0x3d7>
+ .byte 196,98,125,24,5,12,23,0,0 // vbroadcastss 0x170c(%rip),%ymm8 # 411c <_sk_callback_hsw+0x3d7>
.byte 196,193,100,89,216 // vmulps %ymm8,%ymm3,%ymm3
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 91 // pop %rbx
@@ -10208,7 +10206,7 @@ FUNCTION(_sk_store_4444_hsw)
_sk_store_4444_hsw:
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 76,139,16 // mov (%rax),%r10
- .byte 196,98,125,24,5,242,22,0,0 // vbroadcastss 0x16f2(%rip),%ymm8 # 4124 <_sk_callback_hsw+0x3db>
+ .byte 196,98,125,24,5,242,22,0,0 // vbroadcastss 0x16f2(%rip),%ymm8 # 4120 <_sk_callback_hsw+0x3db>
.byte 196,65,124,89,200 // vmulps %ymm8,%ymm0,%ymm9
.byte 196,65,125,91,201 // vcvtps2dq %ymm9,%ymm9
.byte 196,193,53,114,241,12 // vpslld $0xc,%ymm9,%ymm9
@@ -10226,7 +10224,7 @@ _sk_store_4444_hsw:
.byte 196,67,125,57,193,1 // vextracti128 $0x1,%ymm8,%xmm9
.byte 196,66,57,43,193 // vpackusdw %xmm9,%xmm8,%xmm8
.byte 72,133,201 // test %rcx,%rcx
- .byte 117,10 // jne 2a95 <_sk_store_4444_hsw+0x71>
+ .byte 117,10 // jne 2a91 <_sk_store_4444_hsw+0x71>
.byte 196,65,122,127,4,122 // vmovdqu %xmm8,(%r10,%rdi,2)
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 255,224 // jmpq *%rax
@@ -10234,9 +10232,9 @@ _sk_store_4444_hsw:
.byte 65,128,224,7 // and $0x7,%r8b
.byte 65,254,200 // dec %r8b
.byte 65,128,248,6 // cmp $0x6,%r8b
- .byte 119,236 // ja 2a91 <_sk_store_4444_hsw+0x6d>
+ .byte 119,236 // ja 2a8d <_sk_store_4444_hsw+0x6d>
.byte 69,15,182,192 // movzbl %r8b,%r8d
- .byte 76,141,13,68,0,0,0 // lea 0x44(%rip),%r9 # 2af4 <_sk_store_4444_hsw+0xd0>
+ .byte 76,141,13,68,0,0,0 // lea 0x44(%rip),%r9 # 2af0 <_sk_store_4444_hsw+0xd0>
.byte 75,99,4,129 // movslq (%r9,%r8,4),%rax
.byte 76,1,200 // add %r9,%rax
.byte 255,224 // jmpq *%rax
@@ -10247,7 +10245,7 @@ _sk_store_4444_hsw:
.byte 196,67,121,21,68,122,4,2 // vpextrw $0x2,%xmm8,0x4(%r10,%rdi,2)
.byte 196,67,121,21,68,122,2,1 // vpextrw $0x1,%xmm8,0x2(%r10,%rdi,2)
.byte 196,67,121,21,4,122,0 // vpextrw $0x0,%xmm8,(%r10,%rdi,2)
- .byte 235,159 // jmp 2a91 <_sk_store_4444_hsw+0x6d>
+ .byte 235,159 // jmp 2a8d <_sk_store_4444_hsw+0x6d>
.byte 102,144 // xchg %ax,%ax
.byte 245 // cmc
.byte 255 // (bad)
@@ -10282,16 +10280,16 @@ _sk_load_8888_hsw:
.byte 76,141,12,189,0,0,0,0 // lea 0x0(,%rdi,4),%r9
.byte 76,3,8 // add (%rax),%r9
.byte 77,133,192 // test %r8,%r8
- .byte 117,88 // jne 2b7d <_sk_load_8888_hsw+0x6d>
+ .byte 117,88 // jne 2b79 <_sk_load_8888_hsw+0x6d>
.byte 196,193,126,111,25 // vmovdqu (%r9),%ymm3
- .byte 197,229,219,5,174,23,0,0 // vpand 0x17ae(%rip),%ymm3,%ymm0 # 42e0 <_sk_callback_hsw+0x597>
+ .byte 197,229,219,5,178,23,0,0 // vpand 0x17b2(%rip),%ymm3,%ymm0 # 42e0 <_sk_callback_hsw+0x59b>
.byte 197,252,91,192 // vcvtdq2ps %ymm0,%ymm0
- .byte 196,98,125,24,5,233,21,0,0 // vbroadcastss 0x15e9(%rip),%ymm8 # 4128 <_sk_callback_hsw+0x3df>
+ .byte 196,98,125,24,5,233,21,0,0 // vbroadcastss 0x15e9(%rip),%ymm8 # 4124 <_sk_callback_hsw+0x3df>
.byte 196,193,124,89,192 // vmulps %ymm8,%ymm0,%ymm0
- .byte 196,226,101,0,13,179,23,0,0 // vpshufb 0x17b3(%rip),%ymm3,%ymm1 # 4300 <_sk_callback_hsw+0x5b7>
+ .byte 196,226,101,0,13,183,23,0,0 // vpshufb 0x17b7(%rip),%ymm3,%ymm1 # 4300 <_sk_callback_hsw+0x5bb>
.byte 197,252,91,201 // vcvtdq2ps %ymm1,%ymm1
.byte 196,193,116,89,200 // vmulps %ymm8,%ymm1,%ymm1
- .byte 196,226,101,0,21,193,23,0,0 // vpshufb 0x17c1(%rip),%ymm3,%ymm2 # 4320 <_sk_callback_hsw+0x5d7>
+ .byte 196,226,101,0,21,197,23,0,0 // vpshufb 0x17c5(%rip),%ymm3,%ymm2 # 4320 <_sk_callback_hsw+0x5db>
.byte 197,252,91,210 // vcvtdq2ps %ymm2,%ymm2
.byte 196,193,108,89,208 // vmulps %ymm8,%ymm2,%ymm2
.byte 197,229,114,211,24 // vpsrld $0x18,%ymm3,%ymm3
@@ -10308,7 +10306,7 @@ _sk_load_8888_hsw:
.byte 196,225,249,110,192 // vmovq %rax,%xmm0
.byte 196,226,125,33,192 // vpmovsxbd %xmm0,%ymm0
.byte 196,194,125,140,25 // vpmaskmovd (%r9),%ymm0,%ymm3
- .byte 235,135 // jmp 2b2a <_sk_load_8888_hsw+0x1a>
+ .byte 235,135 // jmp 2b26 <_sk_load_8888_hsw+0x1a>
HIDDEN _sk_gather_8888_hsw
.globl _sk_gather_8888_hsw
@@ -10323,14 +10321,14 @@ _sk_gather_8888_hsw:
.byte 197,245,254,192 // vpaddd %ymm0,%ymm1,%ymm0
.byte 197,245,118,201 // vpcmpeqd %ymm1,%ymm1,%ymm1
.byte 196,194,117,144,28,128 // vpgatherdd %ymm1,(%r8,%ymm0,4),%ymm3
- .byte 197,229,219,5,111,23,0,0 // vpand 0x176f(%rip),%ymm3,%ymm0 # 4340 <_sk_callback_hsw+0x5f7>
+ .byte 197,229,219,5,115,23,0,0 // vpand 0x1773(%rip),%ymm3,%ymm0 # 4340 <_sk_callback_hsw+0x5fb>
.byte 197,252,91,192 // vcvtdq2ps %ymm0,%ymm0
- .byte 196,98,125,24,5,78,21,0,0 // vbroadcastss 0x154e(%rip),%ymm8 # 412c <_sk_callback_hsw+0x3e3>
+ .byte 196,98,125,24,5,78,21,0,0 // vbroadcastss 0x154e(%rip),%ymm8 # 4128 <_sk_callback_hsw+0x3e3>
.byte 196,193,124,89,192 // vmulps %ymm8,%ymm0,%ymm0
- .byte 196,226,101,0,13,116,23,0,0 // vpshufb 0x1774(%rip),%ymm3,%ymm1 # 4360 <_sk_callback_hsw+0x617>
+ .byte 196,226,101,0,13,120,23,0,0 // vpshufb 0x1778(%rip),%ymm3,%ymm1 # 4360 <_sk_callback_hsw+0x61b>
.byte 197,252,91,201 // vcvtdq2ps %ymm1,%ymm1
.byte 196,193,116,89,200 // vmulps %ymm8,%ymm1,%ymm1
- .byte 196,226,101,0,21,130,23,0,0 // vpshufb 0x1782(%rip),%ymm3,%ymm2 # 4380 <_sk_callback_hsw+0x637>
+ .byte 196,226,101,0,21,134,23,0,0 // vpshufb 0x1786(%rip),%ymm3,%ymm2 # 4380 <_sk_callback_hsw+0x63b>
.byte 197,252,91,210 // vcvtdq2ps %ymm2,%ymm2
.byte 196,193,108,89,208 // vmulps %ymm8,%ymm2,%ymm2
.byte 197,229,114,211,24 // vpsrld $0x18,%ymm3,%ymm3
@@ -10347,7 +10345,7 @@ _sk_store_8888_hsw:
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 76,141,12,189,0,0,0,0 // lea 0x0(,%rdi,4),%r9
.byte 76,3,8 // add (%rax),%r9
- .byte 196,98,125,24,5,254,20,0,0 // vbroadcastss 0x14fe(%rip),%ymm8 # 4130 <_sk_callback_hsw+0x3e7>
+ .byte 196,98,125,24,5,254,20,0,0 // vbroadcastss 0x14fe(%rip),%ymm8 # 412c <_sk_callback_hsw+0x3e7>
.byte 196,65,124,89,200 // vmulps %ymm8,%ymm0,%ymm9
.byte 196,65,125,91,201 // vcvtps2dq %ymm9,%ymm9
.byte 196,65,116,89,208 // vmulps %ymm8,%ymm1,%ymm10
@@ -10363,7 +10361,7 @@ _sk_store_8888_hsw:
.byte 196,65,45,235,192 // vpor %ymm8,%ymm10,%ymm8
.byte 196,65,53,235,192 // vpor %ymm8,%ymm9,%ymm8
.byte 77,133,192 // test %r8,%r8
- .byte 117,12 // jne 2c8c <_sk_store_8888_hsw+0x73>
+ .byte 117,12 // jne 2c88 <_sk_store_8888_hsw+0x73>
.byte 196,65,126,127,1 // vmovdqu %ymm8,(%r9)
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 76,137,193 // mov %r8,%rcx
@@ -10376,7 +10374,7 @@ _sk_store_8888_hsw:
.byte 196,97,249,110,200 // vmovq %rax,%xmm9
.byte 196,66,125,33,201 // vpmovsxbd %xmm9,%ymm9
.byte 196,66,53,142,1 // vpmaskmovd %ymm8,%ymm9,(%r9)
- .byte 235,211 // jmp 2c85 <_sk_store_8888_hsw+0x6c>
+ .byte 235,211 // jmp 2c81 <_sk_store_8888_hsw+0x6c>
HIDDEN _sk_load_f16_hsw
.globl _sk_load_f16_hsw
@@ -10385,7 +10383,7 @@ _sk_load_f16_hsw:
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 72,139,0 // mov (%rax),%rax
.byte 72,133,201 // test %rcx,%rcx
- .byte 117,97 // jne 2d1d <_sk_load_f16_hsw+0x6b>
+ .byte 117,97 // jne 2d19 <_sk_load_f16_hsw+0x6b>
.byte 197,121,16,4,248 // vmovupd (%rax,%rdi,8),%xmm8
.byte 197,249,16,84,248,16 // vmovupd 0x10(%rax,%rdi,8),%xmm2
.byte 197,249,16,92,248,32 // vmovupd 0x20(%rax,%rdi,8),%xmm3
@@ -10411,29 +10409,29 @@ _sk_load_f16_hsw:
.byte 197,123,16,4,248 // vmovsd (%rax,%rdi,8),%xmm8
.byte 196,65,49,239,201 // vpxor %xmm9,%xmm9,%xmm9
.byte 72,131,249,1 // cmp $0x1,%rcx
- .byte 116,79 // je 2d7c <_sk_load_f16_hsw+0xca>
+ .byte 116,79 // je 2d78 <_sk_load_f16_hsw+0xca>
.byte 197,57,22,68,248,8 // vmovhpd 0x8(%rax,%rdi,8),%xmm8,%xmm8
.byte 72,131,249,3 // cmp $0x3,%rcx
- .byte 114,67 // jb 2d7c <_sk_load_f16_hsw+0xca>
+ .byte 114,67 // jb 2d78 <_sk_load_f16_hsw+0xca>
.byte 197,251,16,84,248,16 // vmovsd 0x10(%rax,%rdi,8),%xmm2
.byte 72,131,249,3 // cmp $0x3,%rcx
- .byte 116,68 // je 2d89 <_sk_load_f16_hsw+0xd7>
+ .byte 116,68 // je 2d85 <_sk_load_f16_hsw+0xd7>
.byte 197,233,22,84,248,24 // vmovhpd 0x18(%rax,%rdi,8),%xmm2,%xmm2
.byte 72,131,249,5 // cmp $0x5,%rcx
- .byte 114,56 // jb 2d89 <_sk_load_f16_hsw+0xd7>
+ .byte 114,56 // jb 2d85 <_sk_load_f16_hsw+0xd7>
.byte 197,251,16,92,248,32 // vmovsd 0x20(%rax,%rdi,8),%xmm3
.byte 72,131,249,5 // cmp $0x5,%rcx
- .byte 15,132,114,255,255,255 // je 2cd3 <_sk_load_f16_hsw+0x21>
+ .byte 15,132,114,255,255,255 // je 2ccf <_sk_load_f16_hsw+0x21>
.byte 197,225,22,92,248,40 // vmovhpd 0x28(%rax,%rdi,8),%xmm3,%xmm3
.byte 72,131,249,7 // cmp $0x7,%rcx
- .byte 15,130,98,255,255,255 // jb 2cd3 <_sk_load_f16_hsw+0x21>
+ .byte 15,130,98,255,255,255 // jb 2ccf <_sk_load_f16_hsw+0x21>
.byte 197,122,126,76,248,48 // vmovq 0x30(%rax,%rdi,8),%xmm9
- .byte 233,87,255,255,255 // jmpq 2cd3 <_sk_load_f16_hsw+0x21>
+ .byte 233,87,255,255,255 // jmpq 2ccf <_sk_load_f16_hsw+0x21>
.byte 197,225,87,219 // vxorpd %xmm3,%xmm3,%xmm3
.byte 197,233,87,210 // vxorpd %xmm2,%xmm2,%xmm2
- .byte 233,74,255,255,255 // jmpq 2cd3 <_sk_load_f16_hsw+0x21>
+ .byte 233,74,255,255,255 // jmpq 2ccf <_sk_load_f16_hsw+0x21>
.byte 197,225,87,219 // vxorpd %xmm3,%xmm3,%xmm3
- .byte 233,65,255,255,255 // jmpq 2cd3 <_sk_load_f16_hsw+0x21>
+ .byte 233,65,255,255,255 // jmpq 2ccf <_sk_load_f16_hsw+0x21>
HIDDEN _sk_gather_f16_hsw
.globl _sk_gather_f16_hsw
@@ -10491,7 +10489,7 @@ _sk_store_f16_hsw:
.byte 196,65,57,98,205 // vpunpckldq %xmm13,%xmm8,%xmm9
.byte 196,65,57,106,197 // vpunpckhdq %xmm13,%xmm8,%xmm8
.byte 72,133,201 // test %rcx,%rcx
- .byte 117,27 // jne 2e81 <_sk_store_f16_hsw+0x65>
+ .byte 117,27 // jne 2e7d <_sk_store_f16_hsw+0x65>
.byte 197,120,17,28,248 // vmovups %xmm11,(%rax,%rdi,8)
.byte 197,120,17,84,248,16 // vmovups %xmm10,0x10(%rax,%rdi,8)
.byte 197,120,17,76,248,32 // vmovups %xmm9,0x20(%rax,%rdi,8)
@@ -10500,22 +10498,22 @@ _sk_store_f16_hsw:
.byte 255,224 // jmpq *%rax
.byte 197,121,214,28,248 // vmovq %xmm11,(%rax,%rdi,8)
.byte 72,131,249,1 // cmp $0x1,%rcx
- .byte 116,241 // je 2e7d <_sk_store_f16_hsw+0x61>
+ .byte 116,241 // je 2e79 <_sk_store_f16_hsw+0x61>
.byte 197,121,23,92,248,8 // vmovhpd %xmm11,0x8(%rax,%rdi,8)
.byte 72,131,249,3 // cmp $0x3,%rcx
- .byte 114,229 // jb 2e7d <_sk_store_f16_hsw+0x61>
+ .byte 114,229 // jb 2e79 <_sk_store_f16_hsw+0x61>
.byte 197,121,214,84,248,16 // vmovq %xmm10,0x10(%rax,%rdi,8)
- .byte 116,221 // je 2e7d <_sk_store_f16_hsw+0x61>
+ .byte 116,221 // je 2e79 <_sk_store_f16_hsw+0x61>
.byte 197,121,23,84,248,24 // vmovhpd %xmm10,0x18(%rax,%rdi,8)
.byte 72,131,249,5 // cmp $0x5,%rcx
- .byte 114,209 // jb 2e7d <_sk_store_f16_hsw+0x61>
+ .byte 114,209 // jb 2e79 <_sk_store_f16_hsw+0x61>
.byte 197,121,214,76,248,32 // vmovq %xmm9,0x20(%rax,%rdi,8)
- .byte 116,201 // je 2e7d <_sk_store_f16_hsw+0x61>
+ .byte 116,201 // je 2e79 <_sk_store_f16_hsw+0x61>
.byte 197,121,23,76,248,40 // vmovhpd %xmm9,0x28(%rax,%rdi,8)
.byte 72,131,249,7 // cmp $0x7,%rcx
- .byte 114,189 // jb 2e7d <_sk_store_f16_hsw+0x61>
+ .byte 114,189 // jb 2e79 <_sk_store_f16_hsw+0x61>
.byte 197,121,214,68,248,48 // vmovq %xmm8,0x30(%rax,%rdi,8)
- .byte 235,181 // jmp 2e7d <_sk_store_f16_hsw+0x61>
+ .byte 235,181 // jmp 2e79 <_sk_store_f16_hsw+0x61>
HIDDEN _sk_load_u16_be_hsw
.globl _sk_load_u16_be_hsw
@@ -10525,7 +10523,7 @@ _sk_load_u16_be_hsw:
.byte 76,139,0 // mov (%rax),%r8
.byte 72,141,4,189,0,0,0,0 // lea 0x0(,%rdi,4),%rax
.byte 72,133,201 // test %rcx,%rcx
- .byte 15,133,204,0,0,0 // jne 2faa <_sk_load_u16_be_hsw+0xe2>
+ .byte 15,133,204,0,0,0 // jne 2fa6 <_sk_load_u16_be_hsw+0xe2>
.byte 196,65,121,16,4,64 // vmovupd (%r8,%rax,2),%xmm8
.byte 196,193,121,16,84,64,16 // vmovupd 0x10(%r8,%rax,2),%xmm2
.byte 196,193,121,16,92,64,32 // vmovupd 0x20(%r8,%rax,2),%xmm3
@@ -10544,7 +10542,7 @@ _sk_load_u16_be_hsw:
.byte 197,241,235,192 // vpor %xmm0,%xmm1,%xmm0
.byte 196,226,125,51,192 // vpmovzxwd %xmm0,%ymm0
.byte 197,252,91,192 // vcvtdq2ps %ymm0,%ymm0
- .byte 196,98,125,24,21,245,17,0,0 // vbroadcastss 0x11f5(%rip),%ymm10 # 4134 <_sk_callback_hsw+0x3eb>
+ .byte 196,98,125,24,21,245,17,0,0 // vbroadcastss 0x11f5(%rip),%ymm10 # 4130 <_sk_callback_hsw+0x3eb>
.byte 196,193,124,89,194 // vmulps %ymm10,%ymm0,%ymm0
.byte 197,185,109,202 // vpunpckhqdq %xmm2,%xmm8,%xmm1
.byte 197,233,113,241,8 // vpsllw $0x8,%xmm1,%xmm2
@@ -10572,29 +10570,29 @@ _sk_load_u16_be_hsw:
.byte 196,65,123,16,4,64 // vmovsd (%r8,%rax,2),%xmm8
.byte 196,65,49,239,201 // vpxor %xmm9,%xmm9,%xmm9
.byte 72,131,249,1 // cmp $0x1,%rcx
- .byte 116,85 // je 3010 <_sk_load_u16_be_hsw+0x148>
+ .byte 116,85 // je 300c <_sk_load_u16_be_hsw+0x148>
.byte 196,65,57,22,68,64,8 // vmovhpd 0x8(%r8,%rax,2),%xmm8,%xmm8
.byte 72,131,249,3 // cmp $0x3,%rcx
- .byte 114,72 // jb 3010 <_sk_load_u16_be_hsw+0x148>
+ .byte 114,72 // jb 300c <_sk_load_u16_be_hsw+0x148>
.byte 196,193,123,16,84,64,16 // vmovsd 0x10(%r8,%rax,2),%xmm2
.byte 72,131,249,3 // cmp $0x3,%rcx
- .byte 116,72 // je 301d <_sk_load_u16_be_hsw+0x155>
+ .byte 116,72 // je 3019 <_sk_load_u16_be_hsw+0x155>
.byte 196,193,105,22,84,64,24 // vmovhpd 0x18(%r8,%rax,2),%xmm2,%xmm2
.byte 72,131,249,5 // cmp $0x5,%rcx
- .byte 114,59 // jb 301d <_sk_load_u16_be_hsw+0x155>
+ .byte 114,59 // jb 3019 <_sk_load_u16_be_hsw+0x155>
.byte 196,193,123,16,92,64,32 // vmovsd 0x20(%r8,%rax,2),%xmm3
.byte 72,131,249,5 // cmp $0x5,%rcx
- .byte 15,132,6,255,255,255 // je 2ef9 <_sk_load_u16_be_hsw+0x31>
+ .byte 15,132,6,255,255,255 // je 2ef5 <_sk_load_u16_be_hsw+0x31>
.byte 196,193,97,22,92,64,40 // vmovhpd 0x28(%r8,%rax,2),%xmm3,%xmm3
.byte 72,131,249,7 // cmp $0x7,%rcx
- .byte 15,130,245,254,255,255 // jb 2ef9 <_sk_load_u16_be_hsw+0x31>
+ .byte 15,130,245,254,255,255 // jb 2ef5 <_sk_load_u16_be_hsw+0x31>
.byte 196,65,122,126,76,64,48 // vmovq 0x30(%r8,%rax,2),%xmm9
- .byte 233,233,254,255,255 // jmpq 2ef9 <_sk_load_u16_be_hsw+0x31>
+ .byte 233,233,254,255,255 // jmpq 2ef5 <_sk_load_u16_be_hsw+0x31>
.byte 197,225,87,219 // vxorpd %xmm3,%xmm3,%xmm3
.byte 197,233,87,210 // vxorpd %xmm2,%xmm2,%xmm2
- .byte 233,220,254,255,255 // jmpq 2ef9 <_sk_load_u16_be_hsw+0x31>
+ .byte 233,220,254,255,255 // jmpq 2ef5 <_sk_load_u16_be_hsw+0x31>
.byte 197,225,87,219 // vxorpd %xmm3,%xmm3,%xmm3
- .byte 233,211,254,255,255 // jmpq 2ef9 <_sk_load_u16_be_hsw+0x31>
+ .byte 233,211,254,255,255 // jmpq 2ef5 <_sk_load_u16_be_hsw+0x31>
HIDDEN _sk_load_rgb_u16_be_hsw
.globl _sk_load_rgb_u16_be_hsw
@@ -10604,7 +10602,7 @@ _sk_load_rgb_u16_be_hsw:
.byte 76,139,0 // mov (%rax),%r8
.byte 72,141,4,127 // lea (%rdi,%rdi,2),%rax
.byte 72,133,201 // test %rcx,%rcx
- .byte 15,133,204,0,0,0 // jne 3104 <_sk_load_rgb_u16_be_hsw+0xde>
+ .byte 15,133,204,0,0,0 // jne 3100 <_sk_load_rgb_u16_be_hsw+0xde>
.byte 196,193,122,111,4,64 // vmovdqu (%r8,%rax,2),%xmm0
.byte 196,193,122,111,84,64,12 // vmovdqu 0xc(%r8,%rax,2),%xmm2
.byte 196,193,122,111,76,64,24 // vmovdqu 0x18(%r8,%rax,2),%xmm1
@@ -10628,7 +10626,7 @@ _sk_load_rgb_u16_be_hsw:
.byte 197,241,235,192 // vpor %xmm0,%xmm1,%xmm0
.byte 196,226,125,51,192 // vpmovzxwd %xmm0,%ymm0
.byte 197,252,91,192 // vcvtdq2ps %ymm0,%ymm0
- .byte 196,98,125,24,21,134,16,0,0 // vbroadcastss 0x1086(%rip),%ymm10 # 4138 <_sk_callback_hsw+0x3ef>
+ .byte 196,98,125,24,21,134,16,0,0 // vbroadcastss 0x1086(%rip),%ymm10 # 4134 <_sk_callback_hsw+0x3ef>
.byte 196,193,124,89,194 // vmulps %ymm10,%ymm0,%ymm0
.byte 197,185,109,202 // vpunpckhqdq %xmm2,%xmm8,%xmm1
.byte 197,233,113,241,8 // vpsllw $0x8,%xmm1,%xmm2
@@ -10645,41 +10643,41 @@ _sk_load_rgb_u16_be_hsw:
.byte 197,252,91,210 // vcvtdq2ps %ymm2,%ymm2
.byte 196,193,108,89,210 // vmulps %ymm10,%ymm2,%ymm2
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 196,226,125,24,29,58,16,0,0 // vbroadcastss 0x103a(%rip),%ymm3 # 413c <_sk_callback_hsw+0x3f3>
+ .byte 196,226,125,24,29,58,16,0,0 // vbroadcastss 0x103a(%rip),%ymm3 # 4138 <_sk_callback_hsw+0x3f3>
.byte 255,224 // jmpq *%rax
.byte 196,193,121,110,4,64 // vmovd (%r8,%rax,2),%xmm0
.byte 196,193,121,196,68,64,4,2 // vpinsrw $0x2,0x4(%r8,%rax,2),%xmm0,%xmm0
.byte 72,131,249,1 // cmp $0x1,%rcx
- .byte 117,5 // jne 311d <_sk_load_rgb_u16_be_hsw+0xf7>
- .byte 233,79,255,255,255 // jmpq 306c <_sk_load_rgb_u16_be_hsw+0x46>
+ .byte 117,5 // jne 3119 <_sk_load_rgb_u16_be_hsw+0xf7>
+ .byte 233,79,255,255,255 // jmpq 3068 <_sk_load_rgb_u16_be_hsw+0x46>
.byte 196,193,121,110,76,64,6 // vmovd 0x6(%r8,%rax,2),%xmm1
.byte 196,65,113,196,68,64,10,2 // vpinsrw $0x2,0xa(%r8,%rax,2),%xmm1,%xmm8
.byte 72,131,249,3 // cmp $0x3,%rcx
- .byte 114,26 // jb 314c <_sk_load_rgb_u16_be_hsw+0x126>
+ .byte 114,26 // jb 3148 <_sk_load_rgb_u16_be_hsw+0x126>
.byte 196,193,121,110,76,64,12 // vmovd 0xc(%r8,%rax,2),%xmm1
.byte 196,193,113,196,84,64,16,2 // vpinsrw $0x2,0x10(%r8,%rax,2),%xmm1,%xmm2
.byte 72,131,249,3 // cmp $0x3,%rcx
- .byte 117,10 // jne 3151 <_sk_load_rgb_u16_be_hsw+0x12b>
- .byte 233,32,255,255,255 // jmpq 306c <_sk_load_rgb_u16_be_hsw+0x46>
- .byte 233,27,255,255,255 // jmpq 306c <_sk_load_rgb_u16_be_hsw+0x46>
+ .byte 117,10 // jne 314d <_sk_load_rgb_u16_be_hsw+0x12b>
+ .byte 233,32,255,255,255 // jmpq 3068 <_sk_load_rgb_u16_be_hsw+0x46>
+ .byte 233,27,255,255,255 // jmpq 3068 <_sk_load_rgb_u16_be_hsw+0x46>
.byte 196,193,121,110,76,64,18 // vmovd 0x12(%r8,%rax,2),%xmm1
.byte 196,65,113,196,76,64,22,2 // vpinsrw $0x2,0x16(%r8,%rax,2),%xmm1,%xmm9
.byte 72,131,249,5 // cmp $0x5,%rcx
- .byte 114,26 // jb 3180 <_sk_load_rgb_u16_be_hsw+0x15a>
+ .byte 114,26 // jb 317c <_sk_load_rgb_u16_be_hsw+0x15a>
.byte 196,193,121,110,76,64,24 // vmovd 0x18(%r8,%rax,2),%xmm1
.byte 196,193,113,196,76,64,28,2 // vpinsrw $0x2,0x1c(%r8,%rax,2),%xmm1,%xmm1
.byte 72,131,249,5 // cmp $0x5,%rcx
- .byte 117,10 // jne 3185 <_sk_load_rgb_u16_be_hsw+0x15f>
- .byte 233,236,254,255,255 // jmpq 306c <_sk_load_rgb_u16_be_hsw+0x46>
- .byte 233,231,254,255,255 // jmpq 306c <_sk_load_rgb_u16_be_hsw+0x46>
+ .byte 117,10 // jne 3181 <_sk_load_rgb_u16_be_hsw+0x15f>
+ .byte 233,236,254,255,255 // jmpq 3068 <_sk_load_rgb_u16_be_hsw+0x46>
+ .byte 233,231,254,255,255 // jmpq 3068 <_sk_load_rgb_u16_be_hsw+0x46>
.byte 196,193,121,110,92,64,30 // vmovd 0x1e(%r8,%rax,2),%xmm3
.byte 196,65,97,196,92,64,34,2 // vpinsrw $0x2,0x22(%r8,%rax,2),%xmm3,%xmm11
.byte 72,131,249,7 // cmp $0x7,%rcx
- .byte 114,20 // jb 31ae <_sk_load_rgb_u16_be_hsw+0x188>
+ .byte 114,20 // jb 31aa <_sk_load_rgb_u16_be_hsw+0x188>
.byte 196,193,121,110,92,64,36 // vmovd 0x24(%r8,%rax,2),%xmm3
.byte 196,193,97,196,92,64,40,2 // vpinsrw $0x2,0x28(%r8,%rax,2),%xmm3,%xmm3
- .byte 233,190,254,255,255 // jmpq 306c <_sk_load_rgb_u16_be_hsw+0x46>
- .byte 233,185,254,255,255 // jmpq 306c <_sk_load_rgb_u16_be_hsw+0x46>
+ .byte 233,190,254,255,255 // jmpq 3068 <_sk_load_rgb_u16_be_hsw+0x46>
+ .byte 233,185,254,255,255 // jmpq 3068 <_sk_load_rgb_u16_be_hsw+0x46>
HIDDEN _sk_store_u16_be_hsw
.globl _sk_store_u16_be_hsw
@@ -10688,7 +10686,7 @@ _sk_store_u16_be_hsw:
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 76,139,0 // mov (%rax),%r8
.byte 72,141,4,189,0,0,0,0 // lea 0x0(,%rdi,4),%rax
- .byte 196,98,125,24,5,119,15,0,0 // vbroadcastss 0xf77(%rip),%ymm8 # 4140 <_sk_callback_hsw+0x3f7>
+ .byte 196,98,125,24,5,119,15,0,0 // vbroadcastss 0xf77(%rip),%ymm8 # 413c <_sk_callback_hsw+0x3f7>
.byte 196,65,124,89,200 // vmulps %ymm8,%ymm0,%ymm9
.byte 196,65,125,91,201 // vcvtps2dq %ymm9,%ymm9
.byte 196,67,125,25,202,1 // vextractf128 $0x1,%ymm9,%xmm10
@@ -10726,7 +10724,7 @@ _sk_store_u16_be_hsw:
.byte 196,65,17,98,200 // vpunpckldq %xmm8,%xmm13,%xmm9
.byte 196,65,17,106,192 // vpunpckhdq %xmm8,%xmm13,%xmm8
.byte 72,133,201 // test %rcx,%rcx
- .byte 117,31 // jne 32ad <_sk_store_u16_be_hsw+0xfa>
+ .byte 117,31 // jne 32a9 <_sk_store_u16_be_hsw+0xfa>
.byte 196,65,120,17,28,64 // vmovups %xmm11,(%r8,%rax,2)
.byte 196,65,120,17,84,64,16 // vmovups %xmm10,0x10(%r8,%rax,2)
.byte 196,65,120,17,76,64,32 // vmovups %xmm9,0x20(%r8,%rax,2)
@@ -10735,22 +10733,22 @@ _sk_store_u16_be_hsw:
.byte 255,224 // jmpq *%rax
.byte 196,65,121,214,28,64 // vmovq %xmm11,(%r8,%rax,2)
.byte 72,131,249,1 // cmp $0x1,%rcx
- .byte 116,240 // je 32a9 <_sk_store_u16_be_hsw+0xf6>
+ .byte 116,240 // je 32a5 <_sk_store_u16_be_hsw+0xf6>
.byte 196,65,121,23,92,64,8 // vmovhpd %xmm11,0x8(%r8,%rax,2)
.byte 72,131,249,3 // cmp $0x3,%rcx
- .byte 114,227 // jb 32a9 <_sk_store_u16_be_hsw+0xf6>
+ .byte 114,227 // jb 32a5 <_sk_store_u16_be_hsw+0xf6>
.byte 196,65,121,214,84,64,16 // vmovq %xmm10,0x10(%r8,%rax,2)
- .byte 116,218 // je 32a9 <_sk_store_u16_be_hsw+0xf6>
+ .byte 116,218 // je 32a5 <_sk_store_u16_be_hsw+0xf6>
.byte 196,65,121,23,84,64,24 // vmovhpd %xmm10,0x18(%r8,%rax,2)
.byte 72,131,249,5 // cmp $0x5,%rcx
- .byte 114,205 // jb 32a9 <_sk_store_u16_be_hsw+0xf6>
+ .byte 114,205 // jb 32a5 <_sk_store_u16_be_hsw+0xf6>
.byte 196,65,121,214,76,64,32 // vmovq %xmm9,0x20(%r8,%rax,2)
- .byte 116,196 // je 32a9 <_sk_store_u16_be_hsw+0xf6>
+ .byte 116,196 // je 32a5 <_sk_store_u16_be_hsw+0xf6>
.byte 196,65,121,23,76,64,40 // vmovhpd %xmm9,0x28(%r8,%rax,2)
.byte 72,131,249,7 // cmp $0x7,%rcx
- .byte 114,183 // jb 32a9 <_sk_store_u16_be_hsw+0xf6>
+ .byte 114,183 // jb 32a5 <_sk_store_u16_be_hsw+0xf6>
.byte 196,65,121,214,68,64,48 // vmovq %xmm8,0x30(%r8,%rax,2)
- .byte 235,174 // jmp 32a9 <_sk_store_u16_be_hsw+0xf6>
+ .byte 235,174 // jmp 32a5 <_sk_store_u16_be_hsw+0xf6>
HIDDEN _sk_load_f32_hsw
.globl _sk_load_f32_hsw
@@ -10758,10 +10756,10 @@ FUNCTION(_sk_load_f32_hsw)
_sk_load_f32_hsw:
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 72,131,249,7 // cmp $0x7,%rcx
- .byte 119,110 // ja 3371 <_sk_load_f32_hsw+0x76>
+ .byte 119,110 // ja 336d <_sk_load_f32_hsw+0x76>
.byte 76,139,0 // mov (%rax),%r8
.byte 76,141,12,189,0,0,0,0 // lea 0x0(,%rdi,4),%r9
- .byte 76,141,21,135,0,0,0 // lea 0x87(%rip),%r10 # 339c <_sk_load_f32_hsw+0xa1>
+ .byte 76,141,21,135,0,0,0 // lea 0x87(%rip),%r10 # 3398 <_sk_load_f32_hsw+0xa1>
.byte 73,99,4,138 // movslq (%r10,%rcx,4),%rax
.byte 76,1,208 // add %r10,%rax
.byte 255,224 // jmpq *%rax
@@ -10822,7 +10820,7 @@ _sk_store_f32_hsw:
.byte 196,65,37,20,196 // vunpcklpd %ymm12,%ymm11,%ymm8
.byte 196,65,37,21,220 // vunpckhpd %ymm12,%ymm11,%ymm11
.byte 72,133,201 // test %rcx,%rcx
- .byte 117,55 // jne 3429 <_sk_store_f32_hsw+0x6d>
+ .byte 117,55 // jne 3425 <_sk_store_f32_hsw+0x6d>
.byte 196,67,45,24,225,1 // vinsertf128 $0x1,%xmm9,%ymm10,%ymm12
.byte 196,67,61,24,235,1 // vinsertf128 $0x1,%xmm11,%ymm8,%ymm13
.byte 196,67,45,6,201,49 // vperm2f128 $0x31,%ymm9,%ymm10,%ymm9
@@ -10835,22 +10833,22 @@ _sk_store_f32_hsw:
.byte 255,224 // jmpq *%rax
.byte 196,65,121,17,20,128 // vmovupd %xmm10,(%r8,%rax,4)
.byte 72,131,249,1 // cmp $0x1,%rcx
- .byte 116,240 // je 3425 <_sk_store_f32_hsw+0x69>
+ .byte 116,240 // je 3421 <_sk_store_f32_hsw+0x69>
.byte 196,65,121,17,76,128,16 // vmovupd %xmm9,0x10(%r8,%rax,4)
.byte 72,131,249,3 // cmp $0x3,%rcx
- .byte 114,227 // jb 3425 <_sk_store_f32_hsw+0x69>
+ .byte 114,227 // jb 3421 <_sk_store_f32_hsw+0x69>
.byte 196,65,121,17,68,128,32 // vmovupd %xmm8,0x20(%r8,%rax,4)
- .byte 116,218 // je 3425 <_sk_store_f32_hsw+0x69>
+ .byte 116,218 // je 3421 <_sk_store_f32_hsw+0x69>
.byte 196,65,121,17,92,128,48 // vmovupd %xmm11,0x30(%r8,%rax,4)
.byte 72,131,249,5 // cmp $0x5,%rcx
- .byte 114,205 // jb 3425 <_sk_store_f32_hsw+0x69>
+ .byte 114,205 // jb 3421 <_sk_store_f32_hsw+0x69>
.byte 196,67,125,25,84,128,64,1 // vextractf128 $0x1,%ymm10,0x40(%r8,%rax,4)
- .byte 116,195 // je 3425 <_sk_store_f32_hsw+0x69>
+ .byte 116,195 // je 3421 <_sk_store_f32_hsw+0x69>
.byte 196,67,125,25,76,128,80,1 // vextractf128 $0x1,%ymm9,0x50(%r8,%rax,4)
.byte 72,131,249,7 // cmp $0x7,%rcx
- .byte 114,181 // jb 3425 <_sk_store_f32_hsw+0x69>
+ .byte 114,181 // jb 3421 <_sk_store_f32_hsw+0x69>
.byte 196,67,125,25,68,128,96,1 // vextractf128 $0x1,%ymm8,0x60(%r8,%rax,4)
- .byte 235,171 // jmp 3425 <_sk_store_f32_hsw+0x69>
+ .byte 235,171 // jmp 3421 <_sk_store_f32_hsw+0x69>
HIDDEN _sk_clamp_x_hsw
.globl _sk_clamp_x_hsw
@@ -10960,11 +10958,11 @@ HIDDEN _sk_luminance_to_alpha_hsw
.globl _sk_luminance_to_alpha_hsw
FUNCTION(_sk_luminance_to_alpha_hsw)
_sk_luminance_to_alpha_hsw:
- .byte 196,226,125,24,29,145,11,0,0 // vbroadcastss 0xb91(%rip),%ymm3 # 4144 <_sk_callback_hsw+0x3fb>
- .byte 196,98,125,24,5,140,11,0,0 // vbroadcastss 0xb8c(%rip),%ymm8 # 4148 <_sk_callback_hsw+0x3ff>
+ .byte 196,226,125,24,29,145,11,0,0 // vbroadcastss 0xb91(%rip),%ymm3 # 4140 <_sk_callback_hsw+0x3fb>
+ .byte 196,98,125,24,5,140,11,0,0 // vbroadcastss 0xb8c(%rip),%ymm8 # 4144 <_sk_callback_hsw+0x3ff>
.byte 196,193,116,89,200 // vmulps %ymm8,%ymm1,%ymm1
.byte 196,226,125,184,203 // vfmadd231ps %ymm3,%ymm0,%ymm1
- .byte 196,226,125,24,29,125,11,0,0 // vbroadcastss 0xb7d(%rip),%ymm3 # 414c <_sk_callback_hsw+0x403>
+ .byte 196,226,125,24,29,125,11,0,0 // vbroadcastss 0xb7d(%rip),%ymm3 # 4148 <_sk_callback_hsw+0x403>
.byte 196,226,109,168,217 // vfmadd213ps %ymm1,%ymm2,%ymm3
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 197,252,87,192 // vxorps %ymm0,%ymm0,%ymm0
@@ -11109,7 +11107,7 @@ _sk_linear_gradient_hsw:
.byte 196,98,125,24,72,28 // vbroadcastss 0x1c(%rax),%ymm9
.byte 76,139,0 // mov (%rax),%r8
.byte 77,133,192 // test %r8,%r8
- .byte 15,132,143,0,0,0 // je 38a7 <_sk_linear_gradient_hsw+0xb5>
+ .byte 15,132,143,0,0,0 // je 38a3 <_sk_linear_gradient_hsw+0xb5>
.byte 72,139,64,8 // mov 0x8(%rax),%rax
.byte 72,131,192,32 // add $0x20,%rax
.byte 196,65,28,87,228 // vxorps %ymm12,%ymm12,%ymm12
@@ -11136,8 +11134,8 @@ _sk_linear_gradient_hsw:
.byte 196,67,13,74,201,208 // vblendvps %ymm13,%ymm9,%ymm14,%ymm9
.byte 72,131,192,36 // add $0x24,%rax
.byte 73,255,200 // dec %r8
- .byte 117,140 // jne 3831 <_sk_linear_gradient_hsw+0x3f>
- .byte 235,17 // jmp 38b8 <_sk_linear_gradient_hsw+0xc6>
+ .byte 117,140 // jne 382d <_sk_linear_gradient_hsw+0x3f>
+ .byte 235,17 // jmp 38b4 <_sk_linear_gradient_hsw+0xc6>
.byte 197,244,87,201 // vxorps %ymm1,%ymm1,%ymm1
.byte 197,236,87,210 // vxorps %ymm2,%ymm2,%ymm2
.byte 197,228,87,219 // vxorps %ymm3,%ymm3,%ymm3
@@ -11184,24 +11182,24 @@ _sk_xy_to_polar_unit_hsw:
.byte 196,65,52,95,226 // vmaxps %ymm10,%ymm9,%ymm12
.byte 196,65,36,94,220 // vdivps %ymm12,%ymm11,%ymm11
.byte 196,65,36,89,227 // vmulps %ymm11,%ymm11,%ymm12
- .byte 196,98,125,24,45,253,7,0,0 // vbroadcastss 0x7fd(%rip),%ymm13 # 4150 <_sk_callback_hsw+0x407>
- .byte 196,98,125,24,53,248,7,0,0 // vbroadcastss 0x7f8(%rip),%ymm14 # 4154 <_sk_callback_hsw+0x40b>
+ .byte 196,98,125,24,45,253,7,0,0 // vbroadcastss 0x7fd(%rip),%ymm13 # 414c <_sk_callback_hsw+0x407>
+ .byte 196,98,125,24,53,248,7,0,0 // vbroadcastss 0x7f8(%rip),%ymm14 # 4150 <_sk_callback_hsw+0x40b>
.byte 196,66,29,184,245 // vfmadd231ps %ymm13,%ymm12,%ymm14
- .byte 196,98,125,24,45,238,7,0,0 // vbroadcastss 0x7ee(%rip),%ymm13 # 4158 <_sk_callback_hsw+0x40f>
+ .byte 196,98,125,24,45,238,7,0,0 // vbroadcastss 0x7ee(%rip),%ymm13 # 4154 <_sk_callback_hsw+0x40f>
.byte 196,66,29,184,238 // vfmadd231ps %ymm14,%ymm12,%ymm13
- .byte 196,98,125,24,53,228,7,0,0 // vbroadcastss 0x7e4(%rip),%ymm14 # 415c <_sk_callback_hsw+0x413>
+ .byte 196,98,125,24,53,228,7,0,0 // vbroadcastss 0x7e4(%rip),%ymm14 # 4158 <_sk_callback_hsw+0x413>
.byte 196,66,29,184,245 // vfmadd231ps %ymm13,%ymm12,%ymm14
.byte 196,65,36,89,222 // vmulps %ymm14,%ymm11,%ymm11
.byte 196,65,52,194,202,1 // vcmpltps %ymm10,%ymm9,%ymm9
- .byte 196,98,125,24,21,207,7,0,0 // vbroadcastss 0x7cf(%rip),%ymm10 # 4160 <_sk_callback_hsw+0x417>
+ .byte 196,98,125,24,21,207,7,0,0 // vbroadcastss 0x7cf(%rip),%ymm10 # 415c <_sk_callback_hsw+0x417>
.byte 196,65,44,92,211 // vsubps %ymm11,%ymm10,%ymm10
.byte 196,67,37,74,202,144 // vblendvps %ymm9,%ymm10,%ymm11,%ymm9
.byte 196,193,124,194,192,1 // vcmpltps %ymm8,%ymm0,%ymm0
- .byte 196,98,125,24,21,185,7,0,0 // vbroadcastss 0x7b9(%rip),%ymm10 # 4164 <_sk_callback_hsw+0x41b>
+ .byte 196,98,125,24,21,185,7,0,0 // vbroadcastss 0x7b9(%rip),%ymm10 # 4160 <_sk_callback_hsw+0x41b>
.byte 196,65,44,92,209 // vsubps %ymm9,%ymm10,%ymm10
.byte 196,195,53,74,194,0 // vblendvps %ymm0,%ymm10,%ymm9,%ymm0
.byte 196,65,116,194,200,1 // vcmpltps %ymm8,%ymm1,%ymm9
- .byte 196,98,125,24,21,163,7,0,0 // vbroadcastss 0x7a3(%rip),%ymm10 # 4168 <_sk_callback_hsw+0x41f>
+ .byte 196,98,125,24,21,163,7,0,0 // vbroadcastss 0x7a3(%rip),%ymm10 # 4164 <_sk_callback_hsw+0x41f>
.byte 197,44,92,208 // vsubps %ymm0,%ymm10,%ymm10
.byte 196,195,125,74,194,144 // vblendvps %ymm9,%ymm10,%ymm0,%ymm0
.byte 196,65,124,194,200,3 // vcmpunordps %ymm8,%ymm0,%ymm9
@@ -11214,7 +11212,7 @@ HIDDEN _sk_save_xy_hsw
FUNCTION(_sk_save_xy_hsw)
_sk_save_xy_hsw:
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 196,98,125,24,5,130,7,0,0 // vbroadcastss 0x782(%rip),%ymm8 # 416c <_sk_callback_hsw+0x423>
+ .byte 196,98,125,24,5,130,7,0,0 // vbroadcastss 0x782(%rip),%ymm8 # 4168 <_sk_callback_hsw+0x423>
.byte 196,65,124,88,200 // vaddps %ymm8,%ymm0,%ymm9
.byte 196,67,125,8,209,1 // vroundps $0x1,%ymm9,%ymm10
.byte 196,65,52,92,202 // vsubps %ymm10,%ymm9,%ymm9
@@ -11248,9 +11246,9 @@ HIDDEN _sk_bilinear_nx_hsw
FUNCTION(_sk_bilinear_nx_hsw)
_sk_bilinear_nx_hsw:
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 196,226,125,24,5,22,7,0,0 // vbroadcastss 0x716(%rip),%ymm0 # 4170 <_sk_callback_hsw+0x427>
+ .byte 196,226,125,24,5,22,7,0,0 // vbroadcastss 0x716(%rip),%ymm0 # 416c <_sk_callback_hsw+0x427>
.byte 197,252,88,0 // vaddps (%rax),%ymm0,%ymm0
- .byte 196,98,125,24,5,13,7,0,0 // vbroadcastss 0x70d(%rip),%ymm8 # 4174 <_sk_callback_hsw+0x42b>
+ .byte 196,98,125,24,5,13,7,0,0 // vbroadcastss 0x70d(%rip),%ymm8 # 4170 <_sk_callback_hsw+0x42b>
.byte 197,60,92,64,64 // vsubps 0x40(%rax),%ymm8,%ymm8
.byte 197,124,17,128,128,0,0,0 // vmovups %ymm8,0x80(%rax)
.byte 72,173 // lods %ds:(%rsi),%rax
@@ -11261,7 +11259,7 @@ HIDDEN _sk_bilinear_px_hsw
FUNCTION(_sk_bilinear_px_hsw)
_sk_bilinear_px_hsw:
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 196,226,125,24,5,245,6,0,0 // vbroadcastss 0x6f5(%rip),%ymm0 # 4178 <_sk_callback_hsw+0x42f>
+ .byte 196,226,125,24,5,245,6,0,0 // vbroadcastss 0x6f5(%rip),%ymm0 # 4174 <_sk_callback_hsw+0x42f>
.byte 197,252,88,0 // vaddps (%rax),%ymm0,%ymm0
.byte 197,124,16,64,64 // vmovups 0x40(%rax),%ymm8
.byte 197,124,17,128,128,0,0,0 // vmovups %ymm8,0x80(%rax)
@@ -11273,9 +11271,9 @@ HIDDEN _sk_bilinear_ny_hsw
FUNCTION(_sk_bilinear_ny_hsw)
_sk_bilinear_ny_hsw:
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 196,226,125,24,13,217,6,0,0 // vbroadcastss 0x6d9(%rip),%ymm1 # 417c <_sk_callback_hsw+0x433>
+ .byte 196,226,125,24,13,217,6,0,0 // vbroadcastss 0x6d9(%rip),%ymm1 # 4178 <_sk_callback_hsw+0x433>
.byte 197,244,88,72,32 // vaddps 0x20(%rax),%ymm1,%ymm1
- .byte 196,98,125,24,5,207,6,0,0 // vbroadcastss 0x6cf(%rip),%ymm8 # 4180 <_sk_callback_hsw+0x437>
+ .byte 196,98,125,24,5,207,6,0,0 // vbroadcastss 0x6cf(%rip),%ymm8 # 417c <_sk_callback_hsw+0x437>
.byte 197,60,92,64,96 // vsubps 0x60(%rax),%ymm8,%ymm8
.byte 197,124,17,128,160,0,0,0 // vmovups %ymm8,0xa0(%rax)
.byte 72,173 // lods %ds:(%rsi),%rax
@@ -11286,7 +11284,7 @@ HIDDEN _sk_bilinear_py_hsw
FUNCTION(_sk_bilinear_py_hsw)
_sk_bilinear_py_hsw:
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 196,226,125,24,13,183,6,0,0 // vbroadcastss 0x6b7(%rip),%ymm1 # 4184 <_sk_callback_hsw+0x43b>
+ .byte 196,226,125,24,13,183,6,0,0 // vbroadcastss 0x6b7(%rip),%ymm1 # 4180 <_sk_callback_hsw+0x43b>
.byte 197,244,88,72,32 // vaddps 0x20(%rax),%ymm1,%ymm1
.byte 197,124,16,64,96 // vmovups 0x60(%rax),%ymm8
.byte 197,124,17,128,160,0,0,0 // vmovups %ymm8,0xa0(%rax)
@@ -11298,13 +11296,13 @@ HIDDEN _sk_bicubic_n3x_hsw
FUNCTION(_sk_bicubic_n3x_hsw)
_sk_bicubic_n3x_hsw:
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 196,226,125,24,5,154,6,0,0 // vbroadcastss 0x69a(%rip),%ymm0 # 4188 <_sk_callback_hsw+0x43f>
+ .byte 196,226,125,24,5,154,6,0,0 // vbroadcastss 0x69a(%rip),%ymm0 # 4184 <_sk_callback_hsw+0x43f>
.byte 197,252,88,0 // vaddps (%rax),%ymm0,%ymm0
- .byte 196,98,125,24,5,145,6,0,0 // vbroadcastss 0x691(%rip),%ymm8 # 418c <_sk_callback_hsw+0x443>
+ .byte 196,98,125,24,5,145,6,0,0 // vbroadcastss 0x691(%rip),%ymm8 # 4188 <_sk_callback_hsw+0x443>
.byte 197,60,92,64,64 // vsubps 0x40(%rax),%ymm8,%ymm8
.byte 196,65,60,89,200 // vmulps %ymm8,%ymm8,%ymm9
- .byte 196,98,125,24,21,130,6,0,0 // vbroadcastss 0x682(%rip),%ymm10 # 4190 <_sk_callback_hsw+0x447>
- .byte 196,98,125,24,29,125,6,0,0 // vbroadcastss 0x67d(%rip),%ymm11 # 4194 <_sk_callback_hsw+0x44b>
+ .byte 196,98,125,24,21,130,6,0,0 // vbroadcastss 0x682(%rip),%ymm10 # 418c <_sk_callback_hsw+0x447>
+ .byte 196,98,125,24,29,125,6,0,0 // vbroadcastss 0x67d(%rip),%ymm11 # 4190 <_sk_callback_hsw+0x44b>
.byte 196,66,61,168,218 // vfmadd213ps %ymm10,%ymm8,%ymm11
.byte 196,65,36,89,193 // vmulps %ymm9,%ymm11,%ymm8
.byte 197,124,17,128,128,0,0,0 // vmovups %ymm8,0x80(%rax)
@@ -11316,16 +11314,16 @@ HIDDEN _sk_bicubic_n1x_hsw
FUNCTION(_sk_bicubic_n1x_hsw)
_sk_bicubic_n1x_hsw:
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 196,226,125,24,5,96,6,0,0 // vbroadcastss 0x660(%rip),%ymm0 # 4198 <_sk_callback_hsw+0x44f>
+ .byte 196,226,125,24,5,96,6,0,0 // vbroadcastss 0x660(%rip),%ymm0 # 4194 <_sk_callback_hsw+0x44f>
.byte 197,252,88,0 // vaddps (%rax),%ymm0,%ymm0
- .byte 196,98,125,24,5,87,6,0,0 // vbroadcastss 0x657(%rip),%ymm8 # 419c <_sk_callback_hsw+0x453>
+ .byte 196,98,125,24,5,87,6,0,0 // vbroadcastss 0x657(%rip),%ymm8 # 4198 <_sk_callback_hsw+0x453>
.byte 197,60,92,64,64 // vsubps 0x40(%rax),%ymm8,%ymm8
- .byte 196,98,125,24,13,77,6,0,0 // vbroadcastss 0x64d(%rip),%ymm9 # 41a0 <_sk_callback_hsw+0x457>
- .byte 196,98,125,24,21,72,6,0,0 // vbroadcastss 0x648(%rip),%ymm10 # 41a4 <_sk_callback_hsw+0x45b>
+ .byte 196,98,125,24,13,77,6,0,0 // vbroadcastss 0x64d(%rip),%ymm9 # 419c <_sk_callback_hsw+0x457>
+ .byte 196,98,125,24,21,72,6,0,0 // vbroadcastss 0x648(%rip),%ymm10 # 41a0 <_sk_callback_hsw+0x45b>
.byte 196,66,61,168,209 // vfmadd213ps %ymm9,%ymm8,%ymm10
- .byte 196,98,125,24,13,62,6,0,0 // vbroadcastss 0x63e(%rip),%ymm9 # 41a8 <_sk_callback_hsw+0x45f>
+ .byte 196,98,125,24,13,62,6,0,0 // vbroadcastss 0x63e(%rip),%ymm9 # 41a4 <_sk_callback_hsw+0x45f>
.byte 196,66,61,184,202 // vfmadd231ps %ymm10,%ymm8,%ymm9
- .byte 196,98,125,24,21,52,6,0,0 // vbroadcastss 0x634(%rip),%ymm10 # 41ac <_sk_callback_hsw+0x463>
+ .byte 196,98,125,24,21,52,6,0,0 // vbroadcastss 0x634(%rip),%ymm10 # 41a8 <_sk_callback_hsw+0x463>
.byte 196,66,61,184,209 // vfmadd231ps %ymm9,%ymm8,%ymm10
.byte 197,124,17,144,128,0,0,0 // vmovups %ymm10,0x80(%rax)
.byte 72,173 // lods %ds:(%rsi),%rax
@@ -11336,14 +11334,14 @@ HIDDEN _sk_bicubic_p1x_hsw
FUNCTION(_sk_bicubic_p1x_hsw)
_sk_bicubic_p1x_hsw:
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 196,98,125,24,5,28,6,0,0 // vbroadcastss 0x61c(%rip),%ymm8 # 41b0 <_sk_callback_hsw+0x467>
+ .byte 196,98,125,24,5,28,6,0,0 // vbroadcastss 0x61c(%rip),%ymm8 # 41ac <_sk_callback_hsw+0x467>
.byte 197,188,88,0 // vaddps (%rax),%ymm8,%ymm0
.byte 197,124,16,72,64 // vmovups 0x40(%rax),%ymm9
- .byte 196,98,125,24,21,14,6,0,0 // vbroadcastss 0x60e(%rip),%ymm10 # 41b4 <_sk_callback_hsw+0x46b>
- .byte 196,98,125,24,29,9,6,0,0 // vbroadcastss 0x609(%rip),%ymm11 # 41b8 <_sk_callback_hsw+0x46f>
+ .byte 196,98,125,24,21,14,6,0,0 // vbroadcastss 0x60e(%rip),%ymm10 # 41b0 <_sk_callback_hsw+0x46b>
+ .byte 196,98,125,24,29,9,6,0,0 // vbroadcastss 0x609(%rip),%ymm11 # 41b4 <_sk_callback_hsw+0x46f>
.byte 196,66,53,168,218 // vfmadd213ps %ymm10,%ymm9,%ymm11
.byte 196,66,53,168,216 // vfmadd213ps %ymm8,%ymm9,%ymm11
- .byte 196,98,125,24,5,250,5,0,0 // vbroadcastss 0x5fa(%rip),%ymm8 # 41bc <_sk_callback_hsw+0x473>
+ .byte 196,98,125,24,5,250,5,0,0 // vbroadcastss 0x5fa(%rip),%ymm8 # 41b8 <_sk_callback_hsw+0x473>
.byte 196,66,53,184,195 // vfmadd231ps %ymm11,%ymm9,%ymm8
.byte 197,124,17,128,128,0,0,0 // vmovups %ymm8,0x80(%rax)
.byte 72,173 // lods %ds:(%rsi),%rax
@@ -11354,12 +11352,12 @@ HIDDEN _sk_bicubic_p3x_hsw
FUNCTION(_sk_bicubic_p3x_hsw)
_sk_bicubic_p3x_hsw:
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 196,226,125,24,5,226,5,0,0 // vbroadcastss 0x5e2(%rip),%ymm0 # 41c0 <_sk_callback_hsw+0x477>
+ .byte 196,226,125,24,5,226,5,0,0 // vbroadcastss 0x5e2(%rip),%ymm0 # 41bc <_sk_callback_hsw+0x477>
.byte 197,252,88,0 // vaddps (%rax),%ymm0,%ymm0
.byte 197,124,16,64,64 // vmovups 0x40(%rax),%ymm8
.byte 196,65,60,89,200 // vmulps %ymm8,%ymm8,%ymm9
- .byte 196,98,125,24,21,207,5,0,0 // vbroadcastss 0x5cf(%rip),%ymm10 # 41c4 <_sk_callback_hsw+0x47b>
- .byte 196,98,125,24,29,202,5,0,0 // vbroadcastss 0x5ca(%rip),%ymm11 # 41c8 <_sk_callback_hsw+0x47f>
+ .byte 196,98,125,24,21,207,5,0,0 // vbroadcastss 0x5cf(%rip),%ymm10 # 41c0 <_sk_callback_hsw+0x47b>
+ .byte 196,98,125,24,29,202,5,0,0 // vbroadcastss 0x5ca(%rip),%ymm11 # 41c4 <_sk_callback_hsw+0x47f>
.byte 196,66,61,168,218 // vfmadd213ps %ymm10,%ymm8,%ymm11
.byte 196,65,52,89,195 // vmulps %ymm11,%ymm9,%ymm8
.byte 197,124,17,128,128,0,0,0 // vmovups %ymm8,0x80(%rax)
@@ -11371,13 +11369,13 @@ HIDDEN _sk_bicubic_n3y_hsw
FUNCTION(_sk_bicubic_n3y_hsw)
_sk_bicubic_n3y_hsw:
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 196,226,125,24,13,173,5,0,0 // vbroadcastss 0x5ad(%rip),%ymm1 # 41cc <_sk_callback_hsw+0x483>
+ .byte 196,226,125,24,13,173,5,0,0 // vbroadcastss 0x5ad(%rip),%ymm1 # 41c8 <_sk_callback_hsw+0x483>
.byte 197,244,88,72,32 // vaddps 0x20(%rax),%ymm1,%ymm1
- .byte 196,98,125,24,5,163,5,0,0 // vbroadcastss 0x5a3(%rip),%ymm8 # 41d0 <_sk_callback_hsw+0x487>
+ .byte 196,98,125,24,5,163,5,0,0 // vbroadcastss 0x5a3(%rip),%ymm8 # 41cc <_sk_callback_hsw+0x487>
.byte 197,60,92,64,96 // vsubps 0x60(%rax),%ymm8,%ymm8
.byte 196,65,60,89,200 // vmulps %ymm8,%ymm8,%ymm9
- .byte 196,98,125,24,21,148,5,0,0 // vbroadcastss 0x594(%rip),%ymm10 # 41d4 <_sk_callback_hsw+0x48b>
- .byte 196,98,125,24,29,143,5,0,0 // vbroadcastss 0x58f(%rip),%ymm11 # 41d8 <_sk_callback_hsw+0x48f>
+ .byte 196,98,125,24,21,148,5,0,0 // vbroadcastss 0x594(%rip),%ymm10 # 41d0 <_sk_callback_hsw+0x48b>
+ .byte 196,98,125,24,29,143,5,0,0 // vbroadcastss 0x58f(%rip),%ymm11 # 41d4 <_sk_callback_hsw+0x48f>
.byte 196,66,61,168,218 // vfmadd213ps %ymm10,%ymm8,%ymm11
.byte 196,65,36,89,193 // vmulps %ymm9,%ymm11,%ymm8
.byte 197,124,17,128,160,0,0,0 // vmovups %ymm8,0xa0(%rax)
@@ -11389,16 +11387,16 @@ HIDDEN _sk_bicubic_n1y_hsw
FUNCTION(_sk_bicubic_n1y_hsw)
_sk_bicubic_n1y_hsw:
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 196,226,125,24,13,114,5,0,0 // vbroadcastss 0x572(%rip),%ymm1 # 41dc <_sk_callback_hsw+0x493>
+ .byte 196,226,125,24,13,114,5,0,0 // vbroadcastss 0x572(%rip),%ymm1 # 41d8 <_sk_callback_hsw+0x493>
.byte 197,244,88,72,32 // vaddps 0x20(%rax),%ymm1,%ymm1
- .byte 196,98,125,24,5,104,5,0,0 // vbroadcastss 0x568(%rip),%ymm8 # 41e0 <_sk_callback_hsw+0x497>
+ .byte 196,98,125,24,5,104,5,0,0 // vbroadcastss 0x568(%rip),%ymm8 # 41dc <_sk_callback_hsw+0x497>
.byte 197,60,92,64,96 // vsubps 0x60(%rax),%ymm8,%ymm8
- .byte 196,98,125,24,13,94,5,0,0 // vbroadcastss 0x55e(%rip),%ymm9 # 41e4 <_sk_callback_hsw+0x49b>
- .byte 196,98,125,24,21,89,5,0,0 // vbroadcastss 0x559(%rip),%ymm10 # 41e8 <_sk_callback_hsw+0x49f>
+ .byte 196,98,125,24,13,94,5,0,0 // vbroadcastss 0x55e(%rip),%ymm9 # 41e0 <_sk_callback_hsw+0x49b>
+ .byte 196,98,125,24,21,89,5,0,0 // vbroadcastss 0x559(%rip),%ymm10 # 41e4 <_sk_callback_hsw+0x49f>
.byte 196,66,61,168,209 // vfmadd213ps %ymm9,%ymm8,%ymm10
- .byte 196,98,125,24,13,79,5,0,0 // vbroadcastss 0x54f(%rip),%ymm9 # 41ec <_sk_callback_hsw+0x4a3>
+ .byte 196,98,125,24,13,79,5,0,0 // vbroadcastss 0x54f(%rip),%ymm9 # 41e8 <_sk_callback_hsw+0x4a3>
.byte 196,66,61,184,202 // vfmadd231ps %ymm10,%ymm8,%ymm9
- .byte 196,98,125,24,21,69,5,0,0 // vbroadcastss 0x545(%rip),%ymm10 # 41f0 <_sk_callback_hsw+0x4a7>
+ .byte 196,98,125,24,21,69,5,0,0 // vbroadcastss 0x545(%rip),%ymm10 # 41ec <_sk_callback_hsw+0x4a7>
.byte 196,66,61,184,209 // vfmadd231ps %ymm9,%ymm8,%ymm10
.byte 197,124,17,144,160,0,0,0 // vmovups %ymm10,0xa0(%rax)
.byte 72,173 // lods %ds:(%rsi),%rax
@@ -11409,14 +11407,14 @@ HIDDEN _sk_bicubic_p1y_hsw
FUNCTION(_sk_bicubic_p1y_hsw)
_sk_bicubic_p1y_hsw:
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 196,98,125,24,5,45,5,0,0 // vbroadcastss 0x52d(%rip),%ymm8 # 41f4 <_sk_callback_hsw+0x4ab>
+ .byte 196,98,125,24,5,45,5,0,0 // vbroadcastss 0x52d(%rip),%ymm8 # 41f0 <_sk_callback_hsw+0x4ab>
.byte 197,188,88,72,32 // vaddps 0x20(%rax),%ymm8,%ymm1
.byte 197,124,16,72,96 // vmovups 0x60(%rax),%ymm9
- .byte 196,98,125,24,21,30,5,0,0 // vbroadcastss 0x51e(%rip),%ymm10 # 41f8 <_sk_callback_hsw+0x4af>
- .byte 196,98,125,24,29,25,5,0,0 // vbroadcastss 0x519(%rip),%ymm11 # 41fc <_sk_callback_hsw+0x4b3>
+ .byte 196,98,125,24,21,30,5,0,0 // vbroadcastss 0x51e(%rip),%ymm10 # 41f4 <_sk_callback_hsw+0x4af>
+ .byte 196,98,125,24,29,25,5,0,0 // vbroadcastss 0x519(%rip),%ymm11 # 41f8 <_sk_callback_hsw+0x4b3>
.byte 196,66,53,168,218 // vfmadd213ps %ymm10,%ymm9,%ymm11
.byte 196,66,53,168,216 // vfmadd213ps %ymm8,%ymm9,%ymm11
- .byte 196,98,125,24,5,10,5,0,0 // vbroadcastss 0x50a(%rip),%ymm8 # 4200 <_sk_callback_hsw+0x4b7>
+ .byte 196,98,125,24,5,10,5,0,0 // vbroadcastss 0x50a(%rip),%ymm8 # 41fc <_sk_callback_hsw+0x4b7>
.byte 196,66,53,184,195 // vfmadd231ps %ymm11,%ymm9,%ymm8
.byte 197,124,17,128,160,0,0,0 // vmovups %ymm8,0xa0(%rax)
.byte 72,173 // lods %ds:(%rsi),%rax
@@ -11427,12 +11425,12 @@ HIDDEN _sk_bicubic_p3y_hsw
FUNCTION(_sk_bicubic_p3y_hsw)
_sk_bicubic_p3y_hsw:
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 196,226,125,24,13,242,4,0,0 // vbroadcastss 0x4f2(%rip),%ymm1 # 4204 <_sk_callback_hsw+0x4bb>
+ .byte 196,226,125,24,13,242,4,0,0 // vbroadcastss 0x4f2(%rip),%ymm1 # 4200 <_sk_callback_hsw+0x4bb>
.byte 197,244,88,72,32 // vaddps 0x20(%rax),%ymm1,%ymm1
.byte 197,124,16,64,96 // vmovups 0x60(%rax),%ymm8
.byte 196,65,60,89,200 // vmulps %ymm8,%ymm8,%ymm9
- .byte 196,98,125,24,21,222,4,0,0 // vbroadcastss 0x4de(%rip),%ymm10 # 4208 <_sk_callback_hsw+0x4bf>
- .byte 196,98,125,24,29,217,4,0,0 // vbroadcastss 0x4d9(%rip),%ymm11 # 420c <_sk_callback_hsw+0x4c3>
+ .byte 196,98,125,24,21,222,4,0,0 // vbroadcastss 0x4de(%rip),%ymm10 # 4204 <_sk_callback_hsw+0x4bf>
+ .byte 196,98,125,24,29,217,4,0,0 // vbroadcastss 0x4d9(%rip),%ymm11 # 4208 <_sk_callback_hsw+0x4c3>
.byte 196,66,61,168,218 // vfmadd213ps %ymm10,%ymm8,%ymm11
.byte 196,65,52,89,195 // vmulps %ymm11,%ymm9,%ymm8
.byte 197,124,17,128,160,0,0,0 // vmovups %ymm8,0xa0(%rax)
@@ -11525,11 +11523,10 @@ BALIGN4
.byte 0,0 // add %al,(%rax)
.byte 2,0 // add (%rax),%al
.byte 0,0 // add %al,(%rax)
- .byte 33,8 // and %ecx,(%rax)
- .byte 130 // (bad)
- .byte 60,0 // cmp $0x0,%al
.byte 0,0 // add %al,(%rax)
- .byte 191,0,0,128,63 // mov $0x3f800000,%edi
+ .byte 128,60,0,0 // cmpb $0x0,(%rax,%rax,1)
+ .byte 252 // cld
+ .byte 190,0,0,128,63 // mov $0x3f800000,%esi
.byte 0,0 // add %al,(%rax)
.byte 128,63,0 // cmpb $0x0,(%rdi)
.byte 0,128,63,0,0,128 // add %al,-0x7fffffc1(%rax)
@@ -11601,7 +11598,7 @@ BALIGN4
.byte 190,129,128,128,59 // mov $0x3b808081,%esi
.byte 129,128,128,59,0,248,0,0,8,33 // addl $0x21080000,-0x7ffc480(%rax)
.byte 132,55 // test %dh,(%rdi)
- .byte 224,7 // loopne 3f61 <.literal4+0xf1>
+ .byte 224,7 // loopne 3f5d <.literal4+0xf1>
.byte 0,0 // add %al,(%rax)
.byte 33,8 // and %ecx,(%rax)
.byte 2,58 // add (%rdx),%bh
@@ -11615,10 +11612,10 @@ BALIGN4
.byte 129,128,128,59,129,128,128,59,0,0 // addl $0x3b80,-0x7f7ec480(%rax)
.byte 0,52,255 // add %dh,(%rdi,%rdi,8)
.byte 255 // (bad)
- .byte 127,0 // jg 3f8c <.literal4+0x11c>
+ .byte 127,0 // jg 3f88 <.literal4+0x11c>
.byte 0,0 // add %al,(%rax)
.byte 0,63 // add %bh,(%rdi)
- .byte 119,115 // ja 4005 <.literal4+0x195>
+ .byte 119,115 // ja 4001 <.literal4+0x195>
.byte 248 // clc
.byte 194,117,191 // retq $0xbf75
.byte 191,63,249,68,180 // mov $0xb444f93f,%edi
@@ -11632,10 +11629,10 @@ BALIGN4
.byte 0,128,63,0,0,0 // add %al,0x3f(%rax)
.byte 52,255 // xor $0xff,%al
.byte 255 // (bad)
- .byte 127,0 // jg 3fc0 <.literal4+0x150>
+ .byte 127,0 // jg 3fbc <.literal4+0x150>
.byte 0,0 // add %al,(%rax)
.byte 0,63 // add %bh,(%rdi)
- .byte 119,115 // ja 4039 <.literal4+0x1c9>
+ .byte 119,115 // ja 4035 <.literal4+0x1c9>
.byte 248 // clc
.byte 194,117,191 // retq $0xbf75
.byte 191,63,249,68,180 // mov $0xb444f93f,%edi
@@ -11649,10 +11646,10 @@ BALIGN4
.byte 0,128,63,0,0,0 // add %al,0x3f(%rax)
.byte 52,255 // xor $0xff,%al
.byte 255 // (bad)
- .byte 127,0 // jg 3ff4 <.literal4+0x184>
+ .byte 127,0 // jg 3ff0 <.literal4+0x184>
.byte 0,0 // add %al,(%rax)
.byte 0,63 // add %bh,(%rdi)
- .byte 119,115 // ja 406d <.literal4+0x1fd>
+ .byte 119,115 // ja 4069 <.literal4+0x1fd>
.byte 248 // clc
.byte 194,117,191 // retq $0xbf75
.byte 191,63,249,68,180 // mov $0xb444f93f,%edi
@@ -11666,10 +11663,10 @@ BALIGN4
.byte 0,128,63,0,0,0 // add %al,0x3f(%rax)
.byte 52,255 // xor $0xff,%al
.byte 255 // (bad)
- .byte 127,0 // jg 4028 <.literal4+0x1b8>
+ .byte 127,0 // jg 4024 <.literal4+0x1b8>
.byte 0,0 // add %al,(%rax)
.byte 0,63 // add %bh,(%rdi)
- .byte 119,115 // ja 40a1 <.literal4+0x231>
+ .byte 119,115 // ja 409d <.literal4+0x231>
.byte 248 // clc
.byte 194,117,191 // retq $0xbf75
.byte 191,63,249,68,180 // mov $0xb444f93f,%edi
@@ -11682,7 +11679,7 @@ BALIGN4
.byte 0,75,0 // add %cl,0x0(%rbx)
.byte 0,128,63,0,0,200 // add %al,-0x37ffffc1(%rax)
.byte 66,0,0 // rex.X add %al,(%rax)
- .byte 127,67 // jg 409f <.literal4+0x22f>
+ .byte 127,67 // jg 409b <.literal4+0x22f>
.byte 0,0 // add %al,(%rax)
.byte 0,195 // add %al,%bl
.byte 0,0 // add %al,(%rax)
@@ -11694,10 +11691,10 @@ BALIGN4
.byte 190,80,128,3,62 // mov $0x3e038050,%esi
.byte 31 // (bad)
.byte 215 // xlat %ds:(%rbx)
- .byte 118,63 // jbe 40bf <.literal4+0x24f>
+ .byte 118,63 // jbe 40bb <.literal4+0x24f>
.byte 246,64,83,63 // testb $0x3f,0x53(%rax)
.byte 129,128,128,59,129,128,128,59,0,0 // addl $0x3b80,-0x7f7ec480(%rax)
- .byte 127,67 // jg 40d3 <.literal4+0x263>
+ .byte 127,67 // jg 40cf <.literal4+0x263>
.byte 129,128,128,59,0,0,128,63,129,128 // addl $0x80813f80,0x3b80(%rax)
.byte 128,59,0 // cmpb $0x0,(%rbx)
.byte 0,128,63,129,128,128 // add %al,-0x7f7f7ec1(%rax)
@@ -11706,7 +11703,7 @@ BALIGN4
.byte 0,0 // add %al,(%rax)
.byte 8,33 // or %ah,(%rcx)
.byte 132,55 // test %dh,(%rdi)
- .byte 224,7 // loopne 40b5 <.literal4+0x245>
+ .byte 224,7 // loopne 40b1 <.literal4+0x245>
.byte 0,0 // add %al,(%rax)
.byte 33,8 // and %ecx,(%rax)
.byte 2,58 // add (%rdx),%bh
@@ -11718,7 +11715,7 @@ BALIGN4
.byte 0,0 // add %al,(%rax)
.byte 8,33 // or %ah,(%rcx)
.byte 132,55 // test %dh,(%rdi)
- .byte 224,7 // loopne 40d1 <.literal4+0x261>
+ .byte 224,7 // loopne 40cd <.literal4+0x261>
.byte 0,0 // add %al,(%rax)
.byte 33,8 // and %ecx,(%rax)
.byte 2,58 // add (%rdx),%bh
@@ -11729,7 +11726,7 @@ BALIGN4
.byte 0,0 // add %al,(%rax)
.byte 248 // clc
.byte 65,0,0 // add %al,(%r8)
- .byte 124,66 // jl 4126 <.literal4+0x2b6>
+ .byte 124,66 // jl 4122 <.literal4+0x2b6>
.byte 0,240 // add %dh,%al
.byte 0,0 // add %al,(%rax)
.byte 137,136,136,55,0,15 // mov %ecx,0xf003788(%rax)
@@ -11747,9 +11744,9 @@ BALIGN4
.byte 137,136,136,59,15,0 // mov %ecx,0xf3b88(%rax)
.byte 0,0 // add %al,(%rax)
.byte 137,136,136,61,0,0 // mov %ecx,0x3d88(%rax)
- .byte 112,65 // jo 4169 <.literal4+0x2f9>
+ .byte 112,65 // jo 4165 <.literal4+0x2f9>
.byte 129,128,128,59,129,128,128,59,0,0 // addl $0x3b80,-0x7f7ec480(%rax)
- .byte 127,67 // jg 4177 <.literal4+0x307>
+ .byte 127,67 // jg 4173 <.literal4+0x307>
.byte 128,0,128 // addb $0x80,(%rax)
.byte 55 // (bad)
.byte 128,0,128 // addb $0x80,(%rax)
@@ -11757,7 +11754,7 @@ BALIGN4
.byte 0,0 // add %al,(%rax)
.byte 128,63,0 // cmpb $0x0,(%rdi)
.byte 255 // (bad)
- .byte 127,71 // jg 418b <.literal4+0x31b>
+ .byte 127,71 // jg 4187 <.literal4+0x31b>
.byte 208 // (bad)
.byte 179,89 // mov $0x59,%bl
.byte 62,89 // ds pop %rcx
@@ -11854,16 +11851,16 @@ BALIGN32
.byte 0,0 // add %al,(%rax)
.byte 1,255 // add %edi,%edi
.byte 255 // (bad)
- .byte 255,5,255,255,255,9 // incl 0x9ffffff(%rip) # a004248 <_sk_callback_hsw+0xa0004ff>
+ .byte 255,5,255,255,255,9 // incl 0x9ffffff(%rip) # a004248 <_sk_callback_hsw+0xa000503>
.byte 255 // (bad)
.byte 255 // (bad)
- .byte 255,13,255,255,255,17 // decl 0x11ffffff(%rip) # 12004250 <_sk_callback_hsw+0x12000507>
+ .byte 255,13,255,255,255,17 // decl 0x11ffffff(%rip) # 12004250 <_sk_callback_hsw+0x1200050b>
.byte 255 // (bad)
.byte 255 // (bad)
- .byte 255,21,255,255,255,25 // callq *0x19ffffff(%rip) # 1a004258 <_sk_callback_hsw+0x1a00050f>
+ .byte 255,21,255,255,255,25 // callq *0x19ffffff(%rip) # 1a004258 <_sk_callback_hsw+0x1a000513>
.byte 255 // (bad)
.byte 255 // (bad)
- .byte 255,29,255,255,255,2 // lcall *0x2ffffff(%rip) # 3004260 <_sk_callback_hsw+0x3000517>
+ .byte 255,29,255,255,255,2 // lcall *0x2ffffff(%rip) # 3004260 <_sk_callback_hsw+0x300051b>
.byte 255 // (bad)
.byte 255 // (bad)
.byte 255,6 // incl (%rsi)
@@ -11906,16 +11903,16 @@ BALIGN32
.byte 0,0 // add %al,(%rax)
.byte 1,255 // add %edi,%edi
.byte 255 // (bad)
- .byte 255,5,255,255,255,9 // incl 0x9ffffff(%rip) # a0042a8 <_sk_callback_hsw+0xa00055f>
+ .byte 255,5,255,255,255,9 // incl 0x9ffffff(%rip) # a0042a8 <_sk_callback_hsw+0xa000563>
.byte 255 // (bad)
.byte 255 // (bad)
- .byte 255,13,255,255,255,17 // decl 0x11ffffff(%rip) # 120042b0 <_sk_callback_hsw+0x12000567>
+ .byte 255,13,255,255,255,17 // decl 0x11ffffff(%rip) # 120042b0 <_sk_callback_hsw+0x1200056b>
.byte 255 // (bad)
.byte 255 // (bad)
- .byte 255,21,255,255,255,25 // callq *0x19ffffff(%rip) # 1a0042b8 <_sk_callback_hsw+0x1a00056f>
+ .byte 255,21,255,255,255,25 // callq *0x19ffffff(%rip) # 1a0042b8 <_sk_callback_hsw+0x1a000573>
.byte 255 // (bad)
.byte 255 // (bad)
- .byte 255,29,255,255,255,2 // lcall *0x2ffffff(%rip) # 30042c0 <_sk_callback_hsw+0x3000577>
+ .byte 255,29,255,255,255,2 // lcall *0x2ffffff(%rip) # 30042c0 <_sk_callback_hsw+0x300057b>
.byte 255 // (bad)
.byte 255 // (bad)
.byte 255,6 // incl (%rsi)
@@ -11958,16 +11955,16 @@ BALIGN32
.byte 0,0 // add %al,(%rax)
.byte 1,255 // add %edi,%edi
.byte 255 // (bad)
- .byte 255,5,255,255,255,9 // incl 0x9ffffff(%rip) # a004308 <_sk_callback_hsw+0xa0005bf>
+ .byte 255,5,255,255,255,9 // incl 0x9ffffff(%rip) # a004308 <_sk_callback_hsw+0xa0005c3>
.byte 255 // (bad)
.byte 255 // (bad)
- .byte 255,13,255,255,255,17 // decl 0x11ffffff(%rip) # 12004310 <_sk_callback_hsw+0x120005c7>
+ .byte 255,13,255,255,255,17 // decl 0x11ffffff(%rip) # 12004310 <_sk_callback_hsw+0x120005cb>
.byte 255 // (bad)
.byte 255 // (bad)
- .byte 255,21,255,255,255,25 // callq *0x19ffffff(%rip) # 1a004318 <_sk_callback_hsw+0x1a0005cf>
+ .byte 255,21,255,255,255,25 // callq *0x19ffffff(%rip) # 1a004318 <_sk_callback_hsw+0x1a0005d3>
.byte 255 // (bad)
.byte 255 // (bad)
- .byte 255,29,255,255,255,2 // lcall *0x2ffffff(%rip) # 3004320 <_sk_callback_hsw+0x30005d7>
+ .byte 255,29,255,255,255,2 // lcall *0x2ffffff(%rip) # 3004320 <_sk_callback_hsw+0x30005db>
.byte 255 // (bad)
.byte 255 // (bad)
.byte 255,6 // incl (%rsi)
@@ -12010,16 +12007,16 @@ BALIGN32
.byte 0,0 // add %al,(%rax)
.byte 1,255 // add %edi,%edi
.byte 255 // (bad)
- .byte 255,5,255,255,255,9 // incl 0x9ffffff(%rip) # a004368 <_sk_callback_hsw+0xa00061f>
+ .byte 255,5,255,255,255,9 // incl 0x9ffffff(%rip) # a004368 <_sk_callback_hsw+0xa000623>
.byte 255 // (bad)
.byte 255 // (bad)
- .byte 255,13,255,255,255,17 // decl 0x11ffffff(%rip) # 12004370 <_sk_callback_hsw+0x12000627>
+ .byte 255,13,255,255,255,17 // decl 0x11ffffff(%rip) # 12004370 <_sk_callback_hsw+0x1200062b>
.byte 255 // (bad)
.byte 255 // (bad)
- .byte 255,21,255,255,255,25 // callq *0x19ffffff(%rip) # 1a004378 <_sk_callback_hsw+0x1a00062f>
+ .byte 255,21,255,255,255,25 // callq *0x19ffffff(%rip) # 1a004378 <_sk_callback_hsw+0x1a000633>
.byte 255 // (bad)
.byte 255 // (bad)
- .byte 255,29,255,255,255,2 // lcall *0x2ffffff(%rip) # 3004380 <_sk_callback_hsw+0x3000637>
+ .byte 255,29,255,255,255,2 // lcall *0x2ffffff(%rip) # 3004380 <_sk_callback_hsw+0x300063b>
.byte 255 // (bad)
.byte 255 // (bad)
.byte 255,6 // incl (%rsi)
@@ -12140,14 +12137,14 @@ _sk_seed_shader_avx:
.byte 197,249,112,192,0 // vpshufd $0x0,%xmm0,%xmm0
.byte 196,227,125,24,192,1 // vinsertf128 $0x1,%xmm0,%ymm0,%ymm0
.byte 197,252,91,192 // vcvtdq2ps %ymm0,%ymm0
- .byte 196,226,125,24,13,207,84,0,0 // vbroadcastss 0x54cf(%rip),%ymm1 # 5598 <_sk_callback_avx+0x125>
+ .byte 196,226,125,24,13,203,84,0,0 // vbroadcastss 0x54cb(%rip),%ymm1 # 5594 <_sk_callback_avx+0x125>
.byte 197,252,88,193 // vaddps %ymm1,%ymm0,%ymm0
.byte 197,252,88,2 // vaddps (%rdx),%ymm0,%ymm0
.byte 196,226,125,24,16 // vbroadcastss (%rax),%ymm2
.byte 197,252,91,210 // vcvtdq2ps %ymm2,%ymm2
.byte 197,236,88,201 // vaddps %ymm1,%ymm2,%ymm1
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 196,226,125,24,21,179,84,0,0 // vbroadcastss 0x54b3(%rip),%ymm2 # 559c <_sk_callback_avx+0x129>
+ .byte 196,226,125,24,21,175,84,0,0 // vbroadcastss 0x54af(%rip),%ymm2 # 5598 <_sk_callback_avx+0x129>
.byte 197,228,87,219 // vxorps %ymm3,%ymm3,%ymm3
.byte 197,220,87,228 // vxorps %ymm4,%ymm4,%ymm4
.byte 197,212,87,237 // vxorps %ymm5,%ymm5,%ymm5
@@ -12169,7 +12166,7 @@ _sk_dither_avx:
.byte 76,139,0 // mov (%rax),%r8
.byte 196,66,125,24,8 // vbroadcastss (%r8),%ymm9
.byte 196,65,60,87,209 // vxorps %ymm9,%ymm8,%ymm10
- .byte 196,98,125,24,29,107,84,0,0 // vbroadcastss 0x546b(%rip),%ymm11 # 55a0 <_sk_callback_avx+0x12d>
+ .byte 196,98,125,24,29,103,84,0,0 // vbroadcastss 0x5467(%rip),%ymm11 # 559c <_sk_callback_avx+0x12d>
.byte 196,65,44,84,203 // vandps %ymm11,%ymm10,%ymm9
.byte 196,193,25,114,241,5 // vpslld $0x5,%xmm9,%xmm12
.byte 196,67,125,25,201,1 // vextractf128 $0x1,%ymm9,%xmm9
@@ -12180,8 +12177,8 @@ _sk_dither_avx:
.byte 196,67,125,25,219,1 // vextractf128 $0x1,%ymm11,%xmm11
.byte 196,193,33,114,243,4 // vpslld $0x4,%xmm11,%xmm11
.byte 196,67,29,24,219,1 // vinsertf128 $0x1,%xmm11,%ymm12,%ymm11
- .byte 196,98,125,24,37,44,84,0,0 // vbroadcastss 0x542c(%rip),%ymm12 # 55a4 <_sk_callback_avx+0x131>
- .byte 196,98,125,24,45,39,84,0,0 // vbroadcastss 0x5427(%rip),%ymm13 # 55a8 <_sk_callback_avx+0x135>
+ .byte 196,98,125,24,37,40,84,0,0 // vbroadcastss 0x5428(%rip),%ymm12 # 55a0 <_sk_callback_avx+0x131>
+ .byte 196,98,125,24,45,35,84,0,0 // vbroadcastss 0x5423(%rip),%ymm13 # 55a4 <_sk_callback_avx+0x135>
.byte 196,65,44,84,245 // vandps %ymm13,%ymm10,%ymm14
.byte 196,193,1,114,246,2 // vpslld $0x2,%xmm14,%xmm15
.byte 196,67,125,25,246,1 // vextractf128 $0x1,%ymm14,%xmm14
@@ -12208,13 +12205,12 @@ _sk_dither_avx:
.byte 196,65,60,86,193 // vorps %ymm9,%ymm8,%ymm8
.byte 196,65,60,86,194 // vorps %ymm10,%ymm8,%ymm8
.byte 196,65,124,91,192 // vcvtdq2ps %ymm8,%ymm8
- .byte 196,98,125,24,13,146,83,0,0 // vbroadcastss 0x5392(%rip),%ymm9 # 55ac <_sk_callback_avx+0x139>
+ .byte 196,98,125,24,13,142,83,0,0 // vbroadcastss 0x538e(%rip),%ymm9 # 55a8 <_sk_callback_avx+0x139>
.byte 196,65,60,89,193 // vmulps %ymm9,%ymm8,%ymm8
- .byte 196,98,125,24,13,136,83,0,0 // vbroadcastss 0x5388(%rip),%ymm9 # 55b0 <_sk_callback_avx+0x13d>
+ .byte 196,98,125,24,13,132,83,0,0 // vbroadcastss 0x5384(%rip),%ymm9 # 55ac <_sk_callback_avx+0x13d>
.byte 196,65,60,88,193 // vaddps %ymm9,%ymm8,%ymm8
.byte 196,98,125,24,72,8 // vbroadcastss 0x8(%rax),%ymm9
.byte 196,65,52,89,192 // vmulps %ymm8,%ymm9,%ymm8
- .byte 197,60,89,195 // vmulps %ymm3,%ymm8,%ymm8
.byte 197,188,88,192 // vaddps %ymm0,%ymm8,%ymm0
.byte 197,188,88,201 // vaddps %ymm1,%ymm8,%ymm1
.byte 197,188,88,210 // vaddps %ymm2,%ymm8,%ymm2
@@ -12249,7 +12245,7 @@ HIDDEN _sk_srcatop_avx
FUNCTION(_sk_srcatop_avx)
_sk_srcatop_avx:
.byte 197,252,89,199 // vmulps %ymm7,%ymm0,%ymm0
- .byte 196,98,125,24,5,42,83,0,0 // vbroadcastss 0x532a(%rip),%ymm8 # 55b4 <_sk_callback_avx+0x141>
+ .byte 196,98,125,24,5,42,83,0,0 // vbroadcastss 0x532a(%rip),%ymm8 # 55b0 <_sk_callback_avx+0x141>
.byte 197,60,92,195 // vsubps %ymm3,%ymm8,%ymm8
.byte 197,60,89,204 // vmulps %ymm4,%ymm8,%ymm9
.byte 197,180,88,192 // vaddps %ymm0,%ymm9,%ymm0
@@ -12270,7 +12266,7 @@ HIDDEN _sk_dstatop_avx
FUNCTION(_sk_dstatop_avx)
_sk_dstatop_avx:
.byte 197,100,89,196 // vmulps %ymm4,%ymm3,%ymm8
- .byte 196,98,125,24,13,236,82,0,0 // vbroadcastss 0x52ec(%rip),%ymm9 # 55b8 <_sk_callback_avx+0x145>
+ .byte 196,98,125,24,13,236,82,0,0 // vbroadcastss 0x52ec(%rip),%ymm9 # 55b4 <_sk_callback_avx+0x145>
.byte 197,52,92,207 // vsubps %ymm7,%ymm9,%ymm9
.byte 197,180,89,192 // vmulps %ymm0,%ymm9,%ymm0
.byte 197,188,88,192 // vaddps %ymm0,%ymm8,%ymm0
@@ -12312,7 +12308,7 @@ HIDDEN _sk_srcout_avx
.globl _sk_srcout_avx
FUNCTION(_sk_srcout_avx)
_sk_srcout_avx:
- .byte 196,98,125,24,5,139,82,0,0 // vbroadcastss 0x528b(%rip),%ymm8 # 55bc <_sk_callback_avx+0x149>
+ .byte 196,98,125,24,5,139,82,0,0 // vbroadcastss 0x528b(%rip),%ymm8 # 55b8 <_sk_callback_avx+0x149>
.byte 197,60,92,199 // vsubps %ymm7,%ymm8,%ymm8
.byte 197,188,89,192 // vmulps %ymm0,%ymm8,%ymm0
.byte 197,188,89,201 // vmulps %ymm1,%ymm8,%ymm1
@@ -12325,7 +12321,7 @@ HIDDEN _sk_dstout_avx
.globl _sk_dstout_avx
FUNCTION(_sk_dstout_avx)
_sk_dstout_avx:
- .byte 196,226,125,24,5,110,82,0,0 // vbroadcastss 0x526e(%rip),%ymm0 # 55c0 <_sk_callback_avx+0x14d>
+ .byte 196,226,125,24,5,110,82,0,0 // vbroadcastss 0x526e(%rip),%ymm0 # 55bc <_sk_callback_avx+0x14d>
.byte 197,252,92,219 // vsubps %ymm3,%ymm0,%ymm3
.byte 197,228,89,196 // vmulps %ymm4,%ymm3,%ymm0
.byte 197,228,89,205 // vmulps %ymm5,%ymm3,%ymm1
@@ -12338,7 +12334,7 @@ HIDDEN _sk_srcover_avx
.globl _sk_srcover_avx
FUNCTION(_sk_srcover_avx)
_sk_srcover_avx:
- .byte 196,98,125,24,5,81,82,0,0 // vbroadcastss 0x5251(%rip),%ymm8 # 55c4 <_sk_callback_avx+0x151>
+ .byte 196,98,125,24,5,81,82,0,0 // vbroadcastss 0x5251(%rip),%ymm8 # 55c0 <_sk_callback_avx+0x151>
.byte 197,60,92,195 // vsubps %ymm3,%ymm8,%ymm8
.byte 197,60,89,204 // vmulps %ymm4,%ymm8,%ymm9
.byte 197,180,88,192 // vaddps %ymm0,%ymm9,%ymm0
@@ -12355,7 +12351,7 @@ HIDDEN _sk_dstover_avx
.globl _sk_dstover_avx
FUNCTION(_sk_dstover_avx)
_sk_dstover_avx:
- .byte 196,98,125,24,5,36,82,0,0 // vbroadcastss 0x5224(%rip),%ymm8 # 55c8 <_sk_callback_avx+0x155>
+ .byte 196,98,125,24,5,36,82,0,0 // vbroadcastss 0x5224(%rip),%ymm8 # 55c4 <_sk_callback_avx+0x155>
.byte 197,60,92,199 // vsubps %ymm7,%ymm8,%ymm8
.byte 197,188,89,192 // vmulps %ymm0,%ymm8,%ymm0
.byte 197,252,88,196 // vaddps %ymm4,%ymm0,%ymm0
@@ -12383,7 +12379,7 @@ HIDDEN _sk_multiply_avx
.globl _sk_multiply_avx
FUNCTION(_sk_multiply_avx)
_sk_multiply_avx:
- .byte 196,98,125,24,5,227,81,0,0 // vbroadcastss 0x51e3(%rip),%ymm8 # 55cc <_sk_callback_avx+0x159>
+ .byte 196,98,125,24,5,227,81,0,0 // vbroadcastss 0x51e3(%rip),%ymm8 # 55c8 <_sk_callback_avx+0x159>
.byte 197,60,92,207 // vsubps %ymm7,%ymm8,%ymm9
.byte 197,52,89,208 // vmulps %ymm0,%ymm9,%ymm10
.byte 197,60,92,195 // vsubps %ymm3,%ymm8,%ymm8
@@ -12443,7 +12439,7 @@ HIDDEN _sk_xor__avx
.globl _sk_xor__avx
FUNCTION(_sk_xor__avx)
_sk_xor__avx:
- .byte 196,98,125,24,5,50,81,0,0 // vbroadcastss 0x5132(%rip),%ymm8 # 55d0 <_sk_callback_avx+0x15d>
+ .byte 196,98,125,24,5,50,81,0,0 // vbroadcastss 0x5132(%rip),%ymm8 # 55cc <_sk_callback_avx+0x15d>
.byte 197,60,92,207 // vsubps %ymm7,%ymm8,%ymm9
.byte 197,180,89,192 // vmulps %ymm0,%ymm9,%ymm0
.byte 197,60,92,195 // vsubps %ymm3,%ymm8,%ymm8
@@ -12480,7 +12476,7 @@ _sk_darken_avx:
.byte 197,100,89,206 // vmulps %ymm6,%ymm3,%ymm9
.byte 196,193,108,95,209 // vmaxps %ymm9,%ymm2,%ymm2
.byte 197,188,92,210 // vsubps %ymm2,%ymm8,%ymm2
- .byte 196,98,125,24,5,178,80,0,0 // vbroadcastss 0x50b2(%rip),%ymm8 # 55d4 <_sk_callback_avx+0x161>
+ .byte 196,98,125,24,5,178,80,0,0 // vbroadcastss 0x50b2(%rip),%ymm8 # 55d0 <_sk_callback_avx+0x161>
.byte 197,60,92,195 // vsubps %ymm3,%ymm8,%ymm8
.byte 197,60,89,199 // vmulps %ymm7,%ymm8,%ymm8
.byte 197,188,88,219 // vaddps %ymm3,%ymm8,%ymm3
@@ -12506,7 +12502,7 @@ _sk_lighten_avx:
.byte 197,100,89,206 // vmulps %ymm6,%ymm3,%ymm9
.byte 196,193,108,93,209 // vminps %ymm9,%ymm2,%ymm2
.byte 197,188,92,210 // vsubps %ymm2,%ymm8,%ymm2
- .byte 196,98,125,24,5,94,80,0,0 // vbroadcastss 0x505e(%rip),%ymm8 # 55d8 <_sk_callback_avx+0x165>
+ .byte 196,98,125,24,5,94,80,0,0 // vbroadcastss 0x505e(%rip),%ymm8 # 55d4 <_sk_callback_avx+0x165>
.byte 197,60,92,195 // vsubps %ymm3,%ymm8,%ymm8
.byte 197,60,89,199 // vmulps %ymm7,%ymm8,%ymm8
.byte 197,188,88,219 // vaddps %ymm3,%ymm8,%ymm3
@@ -12535,7 +12531,7 @@ _sk_difference_avx:
.byte 196,193,108,93,209 // vminps %ymm9,%ymm2,%ymm2
.byte 197,236,88,210 // vaddps %ymm2,%ymm2,%ymm2
.byte 197,188,92,210 // vsubps %ymm2,%ymm8,%ymm2
- .byte 196,98,125,24,5,254,79,0,0 // vbroadcastss 0x4ffe(%rip),%ymm8 # 55dc <_sk_callback_avx+0x169>
+ .byte 196,98,125,24,5,254,79,0,0 // vbroadcastss 0x4ffe(%rip),%ymm8 # 55d8 <_sk_callback_avx+0x169>
.byte 197,60,92,195 // vsubps %ymm3,%ymm8,%ymm8
.byte 197,60,89,199 // vmulps %ymm7,%ymm8,%ymm8
.byte 197,188,88,219 // vaddps %ymm3,%ymm8,%ymm3
@@ -12558,7 +12554,7 @@ _sk_exclusion_avx:
.byte 197,236,89,214 // vmulps %ymm6,%ymm2,%ymm2
.byte 197,236,88,210 // vaddps %ymm2,%ymm2,%ymm2
.byte 197,188,92,210 // vsubps %ymm2,%ymm8,%ymm2
- .byte 196,98,125,24,5,185,79,0,0 // vbroadcastss 0x4fb9(%rip),%ymm8 # 55e0 <_sk_callback_avx+0x16d>
+ .byte 196,98,125,24,5,185,79,0,0 // vbroadcastss 0x4fb9(%rip),%ymm8 # 55dc <_sk_callback_avx+0x16d>
.byte 197,60,92,195 // vsubps %ymm3,%ymm8,%ymm8
.byte 197,60,89,199 // vmulps %ymm7,%ymm8,%ymm8
.byte 197,188,88,219 // vaddps %ymm3,%ymm8,%ymm3
@@ -12569,7 +12565,7 @@ HIDDEN _sk_colorburn_avx
.globl _sk_colorburn_avx
FUNCTION(_sk_colorburn_avx)
_sk_colorburn_avx:
- .byte 196,98,125,24,5,164,79,0,0 // vbroadcastss 0x4fa4(%rip),%ymm8 # 55e4 <_sk_callback_avx+0x171>
+ .byte 196,98,125,24,5,164,79,0,0 // vbroadcastss 0x4fa4(%rip),%ymm8 # 55e0 <_sk_callback_avx+0x171>
.byte 197,60,92,207 // vsubps %ymm7,%ymm8,%ymm9
.byte 197,52,89,216 // vmulps %ymm0,%ymm9,%ymm11
.byte 196,65,44,87,210 // vxorps %ymm10,%ymm10,%ymm10
@@ -12631,7 +12627,7 @@ HIDDEN _sk_colordodge_avx
FUNCTION(_sk_colordodge_avx)
_sk_colordodge_avx:
.byte 196,65,60,87,192 // vxorps %ymm8,%ymm8,%ymm8
- .byte 196,98,125,24,13,160,78,0,0 // vbroadcastss 0x4ea0(%rip),%ymm9 # 55e8 <_sk_callback_avx+0x175>
+ .byte 196,98,125,24,13,160,78,0,0 // vbroadcastss 0x4ea0(%rip),%ymm9 # 55e4 <_sk_callback_avx+0x175>
.byte 197,52,92,215 // vsubps %ymm7,%ymm9,%ymm10
.byte 197,44,89,216 // vmulps %ymm0,%ymm10,%ymm11
.byte 197,52,92,203 // vsubps %ymm3,%ymm9,%ymm9
@@ -12688,7 +12684,7 @@ HIDDEN _sk_hardlight_avx
.globl _sk_hardlight_avx
FUNCTION(_sk_hardlight_avx)
_sk_hardlight_avx:
- .byte 196,98,125,24,5,178,77,0,0 // vbroadcastss 0x4db2(%rip),%ymm8 # 55ec <_sk_callback_avx+0x179>
+ .byte 196,98,125,24,5,178,77,0,0 // vbroadcastss 0x4db2(%rip),%ymm8 # 55e8 <_sk_callback_avx+0x179>
.byte 197,60,92,215 // vsubps %ymm7,%ymm8,%ymm10
.byte 197,44,89,200 // vmulps %ymm0,%ymm10,%ymm9
.byte 197,60,92,195 // vsubps %ymm3,%ymm8,%ymm8
@@ -12743,7 +12739,7 @@ HIDDEN _sk_overlay_avx
.globl _sk_overlay_avx
FUNCTION(_sk_overlay_avx)
_sk_overlay_avx:
- .byte 196,98,125,24,5,219,76,0,0 // vbroadcastss 0x4cdb(%rip),%ymm8 # 55f0 <_sk_callback_avx+0x17d>
+ .byte 196,98,125,24,5,219,76,0,0 // vbroadcastss 0x4cdb(%rip),%ymm8 # 55ec <_sk_callback_avx+0x17d>
.byte 197,60,92,215 // vsubps %ymm7,%ymm8,%ymm10
.byte 197,44,89,200 // vmulps %ymm0,%ymm10,%ymm9
.byte 197,60,92,195 // vsubps %ymm3,%ymm8,%ymm8
@@ -12809,10 +12805,10 @@ _sk_softlight_avx:
.byte 196,65,60,88,192 // vaddps %ymm8,%ymm8,%ymm8
.byte 196,65,60,89,216 // vmulps %ymm8,%ymm8,%ymm11
.byte 196,65,60,88,195 // vaddps %ymm11,%ymm8,%ymm8
- .byte 196,98,125,24,29,210,75,0,0 // vbroadcastss 0x4bd2(%rip),%ymm11 # 55f8 <_sk_callback_avx+0x185>
+ .byte 196,98,125,24,29,210,75,0,0 // vbroadcastss 0x4bd2(%rip),%ymm11 # 55f4 <_sk_callback_avx+0x185>
.byte 196,65,28,88,235 // vaddps %ymm11,%ymm12,%ymm13
.byte 196,65,20,89,192 // vmulps %ymm8,%ymm13,%ymm8
- .byte 196,98,125,24,45,195,75,0,0 // vbroadcastss 0x4bc3(%rip),%ymm13 # 55fc <_sk_callback_avx+0x189>
+ .byte 196,98,125,24,45,195,75,0,0 // vbroadcastss 0x4bc3(%rip),%ymm13 # 55f8 <_sk_callback_avx+0x189>
.byte 196,65,28,89,245 // vmulps %ymm13,%ymm12,%ymm14
.byte 196,65,12,88,192 // vaddps %ymm8,%ymm14,%ymm8
.byte 196,65,124,82,244 // vrsqrtps %ymm12,%ymm14
@@ -12823,7 +12819,7 @@ _sk_softlight_avx:
.byte 197,4,194,255,2 // vcmpleps %ymm7,%ymm15,%ymm15
.byte 196,67,13,74,240,240 // vblendvps %ymm15,%ymm8,%ymm14,%ymm14
.byte 197,116,88,249 // vaddps %ymm1,%ymm1,%ymm15
- .byte 196,98,125,24,5,129,75,0,0 // vbroadcastss 0x4b81(%rip),%ymm8 # 55f4 <_sk_callback_avx+0x181>
+ .byte 196,98,125,24,5,129,75,0,0 // vbroadcastss 0x4b81(%rip),%ymm8 # 55f0 <_sk_callback_avx+0x181>
.byte 196,65,60,92,228 // vsubps %ymm12,%ymm8,%ymm12
.byte 197,132,92,195 // vsubps %ymm3,%ymm15,%ymm0
.byte 196,65,124,89,228 // vmulps %ymm12,%ymm0,%ymm12
@@ -12930,7 +12926,7 @@ HIDDEN _sk_clamp_1_avx
.globl _sk_clamp_1_avx
FUNCTION(_sk_clamp_1_avx)
_sk_clamp_1_avx:
- .byte 196,98,125,24,5,209,73,0,0 // vbroadcastss 0x49d1(%rip),%ymm8 # 5600 <_sk_callback_avx+0x18d>
+ .byte 196,98,125,24,5,209,73,0,0 // vbroadcastss 0x49d1(%rip),%ymm8 # 55fc <_sk_callback_avx+0x18d>
.byte 196,193,124,93,192 // vminps %ymm8,%ymm0,%ymm0
.byte 196,193,116,93,200 // vminps %ymm8,%ymm1,%ymm1
.byte 196,193,108,93,208 // vminps %ymm8,%ymm2,%ymm2
@@ -12942,7 +12938,7 @@ HIDDEN _sk_clamp_a_avx
.globl _sk_clamp_a_avx
FUNCTION(_sk_clamp_a_avx)
_sk_clamp_a_avx:
- .byte 196,98,125,24,5,180,73,0,0 // vbroadcastss 0x49b4(%rip),%ymm8 # 5604 <_sk_callback_avx+0x191>
+ .byte 196,98,125,24,5,180,73,0,0 // vbroadcastss 0x49b4(%rip),%ymm8 # 5600 <_sk_callback_avx+0x191>
.byte 196,193,100,93,216 // vminps %ymm8,%ymm3,%ymm3
.byte 197,252,93,195 // vminps %ymm3,%ymm0,%ymm0
.byte 197,244,93,203 // vminps %ymm3,%ymm1,%ymm1
@@ -13028,7 +13024,7 @@ FUNCTION(_sk_unpremul_avx)
_sk_unpremul_avx:
.byte 196,65,60,87,192 // vxorps %ymm8,%ymm8,%ymm8
.byte 196,65,100,194,200,0 // vcmpeqps %ymm8,%ymm3,%ymm9
- .byte 196,98,125,24,21,252,72,0,0 // vbroadcastss 0x48fc(%rip),%ymm10 # 5608 <_sk_callback_avx+0x195>
+ .byte 196,98,125,24,21,252,72,0,0 // vbroadcastss 0x48fc(%rip),%ymm10 # 5604 <_sk_callback_avx+0x195>
.byte 197,44,94,211 // vdivps %ymm3,%ymm10,%ymm10
.byte 196,67,45,74,192,144 // vblendvps %ymm9,%ymm8,%ymm10,%ymm8
.byte 197,188,89,192 // vmulps %ymm0,%ymm8,%ymm0
@@ -13041,17 +13037,17 @@ HIDDEN _sk_from_srgb_avx
.globl _sk_from_srgb_avx
FUNCTION(_sk_from_srgb_avx)
_sk_from_srgb_avx:
- .byte 196,98,125,24,5,221,72,0,0 // vbroadcastss 0x48dd(%rip),%ymm8 # 560c <_sk_callback_avx+0x199>
+ .byte 196,98,125,24,5,221,72,0,0 // vbroadcastss 0x48dd(%rip),%ymm8 # 5608 <_sk_callback_avx+0x199>
.byte 196,65,124,89,200 // vmulps %ymm8,%ymm0,%ymm9
.byte 197,124,89,208 // vmulps %ymm0,%ymm0,%ymm10
- .byte 196,98,125,24,29,207,72,0,0 // vbroadcastss 0x48cf(%rip),%ymm11 # 5610 <_sk_callback_avx+0x19d>
+ .byte 196,98,125,24,29,207,72,0,0 // vbroadcastss 0x48cf(%rip),%ymm11 # 560c <_sk_callback_avx+0x19d>
.byte 196,65,124,89,227 // vmulps %ymm11,%ymm0,%ymm12
- .byte 196,98,125,24,45,197,72,0,0 // vbroadcastss 0x48c5(%rip),%ymm13 # 5614 <_sk_callback_avx+0x1a1>
+ .byte 196,98,125,24,45,197,72,0,0 // vbroadcastss 0x48c5(%rip),%ymm13 # 5610 <_sk_callback_avx+0x1a1>
.byte 196,65,28,88,229 // vaddps %ymm13,%ymm12,%ymm12
.byte 196,65,44,89,212 // vmulps %ymm12,%ymm10,%ymm10
- .byte 196,98,125,24,37,182,72,0,0 // vbroadcastss 0x48b6(%rip),%ymm12 # 5618 <_sk_callback_avx+0x1a5>
+ .byte 196,98,125,24,37,182,72,0,0 // vbroadcastss 0x48b6(%rip),%ymm12 # 5614 <_sk_callback_avx+0x1a5>
.byte 196,65,44,88,212 // vaddps %ymm12,%ymm10,%ymm10
- .byte 196,98,125,24,53,172,72,0,0 // vbroadcastss 0x48ac(%rip),%ymm14 # 561c <_sk_callback_avx+0x1a9>
+ .byte 196,98,125,24,53,172,72,0,0 // vbroadcastss 0x48ac(%rip),%ymm14 # 5618 <_sk_callback_avx+0x1a9>
.byte 196,193,124,194,198,1 // vcmpltps %ymm14,%ymm0,%ymm0
.byte 196,195,45,74,193,0 // vblendvps %ymm0,%ymm9,%ymm10,%ymm0
.byte 196,65,116,89,200 // vmulps %ymm8,%ymm1,%ymm9
@@ -13080,18 +13076,18 @@ _sk_to_srgb_avx:
.byte 197,124,82,192 // vrsqrtps %ymm0,%ymm8
.byte 196,65,124,83,200 // vrcpps %ymm8,%ymm9
.byte 196,65,124,82,208 // vrsqrtps %ymm8,%ymm10
- .byte 196,98,125,24,5,55,72,0,0 // vbroadcastss 0x4837(%rip),%ymm8 # 5620 <_sk_callback_avx+0x1ad>
+ .byte 196,98,125,24,5,55,72,0,0 // vbroadcastss 0x4837(%rip),%ymm8 # 561c <_sk_callback_avx+0x1ad>
.byte 196,65,124,89,216 // vmulps %ymm8,%ymm0,%ymm11
- .byte 196,98,125,24,37,45,72,0,0 // vbroadcastss 0x482d(%rip),%ymm12 # 5624 <_sk_callback_avx+0x1b1>
+ .byte 196,98,125,24,37,45,72,0,0 // vbroadcastss 0x482d(%rip),%ymm12 # 5620 <_sk_callback_avx+0x1b1>
.byte 196,65,52,89,204 // vmulps %ymm12,%ymm9,%ymm9
- .byte 196,98,125,24,45,35,72,0,0 // vbroadcastss 0x4823(%rip),%ymm13 # 5628 <_sk_callback_avx+0x1b5>
+ .byte 196,98,125,24,45,35,72,0,0 // vbroadcastss 0x4823(%rip),%ymm13 # 5624 <_sk_callback_avx+0x1b5>
.byte 196,65,52,88,205 // vaddps %ymm13,%ymm9,%ymm9
- .byte 196,98,125,24,53,25,72,0,0 // vbroadcastss 0x4819(%rip),%ymm14 # 562c <_sk_callback_avx+0x1b9>
+ .byte 196,98,125,24,53,25,72,0,0 // vbroadcastss 0x4819(%rip),%ymm14 # 5628 <_sk_callback_avx+0x1b9>
.byte 196,65,44,89,214 // vmulps %ymm14,%ymm10,%ymm10
.byte 196,65,44,88,201 // vaddps %ymm9,%ymm10,%ymm9
- .byte 196,98,125,24,21,10,72,0,0 // vbroadcastss 0x480a(%rip),%ymm10 # 5630 <_sk_callback_avx+0x1bd>
+ .byte 196,98,125,24,21,10,72,0,0 // vbroadcastss 0x480a(%rip),%ymm10 # 562c <_sk_callback_avx+0x1bd>
.byte 196,65,44,93,201 // vminps %ymm9,%ymm10,%ymm9
- .byte 196,98,125,24,61,0,72,0,0 // vbroadcastss 0x4800(%rip),%ymm15 # 5634 <_sk_callback_avx+0x1c1>
+ .byte 196,98,125,24,61,0,72,0,0 // vbroadcastss 0x4800(%rip),%ymm15 # 5630 <_sk_callback_avx+0x1c1>
.byte 196,193,124,194,199,1 // vcmpltps %ymm15,%ymm0,%ymm0
.byte 196,195,53,74,195,0 // vblendvps %ymm0,%ymm11,%ymm9,%ymm0
.byte 197,124,82,201 // vrsqrtps %ymm1,%ymm9
@@ -13128,7 +13124,7 @@ _sk_rgb_to_hsl_avx:
.byte 197,124,93,201 // vminps %ymm1,%ymm0,%ymm9
.byte 197,52,93,202 // vminps %ymm2,%ymm9,%ymm9
.byte 196,65,60,92,209 // vsubps %ymm9,%ymm8,%ymm10
- .byte 196,98,125,24,29,102,71,0,0 // vbroadcastss 0x4766(%rip),%ymm11 # 5638 <_sk_callback_avx+0x1c5>
+ .byte 196,98,125,24,29,102,71,0,0 // vbroadcastss 0x4766(%rip),%ymm11 # 5634 <_sk_callback_avx+0x1c5>
.byte 196,65,36,94,218 // vdivps %ymm10,%ymm11,%ymm11
.byte 197,116,92,226 // vsubps %ymm2,%ymm1,%ymm12
.byte 196,65,28,89,227 // vmulps %ymm11,%ymm12,%ymm12
@@ -13138,19 +13134,19 @@ _sk_rgb_to_hsl_avx:
.byte 196,193,108,89,211 // vmulps %ymm11,%ymm2,%ymm2
.byte 197,252,92,201 // vsubps %ymm1,%ymm0,%ymm1
.byte 196,193,116,89,203 // vmulps %ymm11,%ymm1,%ymm1
- .byte 196,98,125,24,29,63,71,0,0 // vbroadcastss 0x473f(%rip),%ymm11 # 5644 <_sk_callback_avx+0x1d1>
+ .byte 196,98,125,24,29,63,71,0,0 // vbroadcastss 0x473f(%rip),%ymm11 # 5640 <_sk_callback_avx+0x1d1>
.byte 196,193,116,88,203 // vaddps %ymm11,%ymm1,%ymm1
- .byte 196,98,125,24,29,45,71,0,0 // vbroadcastss 0x472d(%rip),%ymm11 # 5640 <_sk_callback_avx+0x1cd>
+ .byte 196,98,125,24,29,45,71,0,0 // vbroadcastss 0x472d(%rip),%ymm11 # 563c <_sk_callback_avx+0x1cd>
.byte 196,193,108,88,211 // vaddps %ymm11,%ymm2,%ymm2
.byte 196,227,117,74,202,224 // vblendvps %ymm14,%ymm2,%ymm1,%ymm1
- .byte 196,226,125,24,21,21,71,0,0 // vbroadcastss 0x4715(%rip),%ymm2 # 563c <_sk_callback_avx+0x1c9>
+ .byte 196,226,125,24,21,21,71,0,0 // vbroadcastss 0x4715(%rip),%ymm2 # 5638 <_sk_callback_avx+0x1c9>
.byte 196,65,12,87,246 // vxorps %ymm14,%ymm14,%ymm14
.byte 196,227,13,74,210,208 // vblendvps %ymm13,%ymm2,%ymm14,%ymm2
.byte 197,188,194,192,0 // vcmpeqps %ymm0,%ymm8,%ymm0
.byte 196,193,108,88,212 // vaddps %ymm12,%ymm2,%ymm2
.byte 196,227,117,74,194,0 // vblendvps %ymm0,%ymm2,%ymm1,%ymm0
.byte 196,193,60,88,201 // vaddps %ymm9,%ymm8,%ymm1
- .byte 196,98,125,24,37,252,70,0,0 // vbroadcastss 0x46fc(%rip),%ymm12 # 564c <_sk_callback_avx+0x1d9>
+ .byte 196,98,125,24,37,252,70,0,0 // vbroadcastss 0x46fc(%rip),%ymm12 # 5648 <_sk_callback_avx+0x1d9>
.byte 196,193,116,89,212 // vmulps %ymm12,%ymm1,%ymm2
.byte 197,28,194,226,1 // vcmpltps %ymm2,%ymm12,%ymm12
.byte 196,65,36,92,216 // vsubps %ymm8,%ymm11,%ymm11
@@ -13160,7 +13156,7 @@ _sk_rgb_to_hsl_avx:
.byte 197,172,94,201 // vdivps %ymm1,%ymm10,%ymm1
.byte 196,195,125,74,198,128 // vblendvps %ymm8,%ymm14,%ymm0,%ymm0
.byte 196,195,117,74,206,128 // vblendvps %ymm8,%ymm14,%ymm1,%ymm1
- .byte 196,98,125,24,5,191,70,0,0 // vbroadcastss 0x46bf(%rip),%ymm8 # 5648 <_sk_callback_avx+0x1d5>
+ .byte 196,98,125,24,5,191,70,0,0 // vbroadcastss 0x46bf(%rip),%ymm8 # 5644 <_sk_callback_avx+0x1d5>
.byte 196,193,124,89,192 // vmulps %ymm8,%ymm0,%ymm0
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 255,224 // jmpq *%rax
@@ -13177,7 +13173,7 @@ _sk_hsl_to_rgb_avx:
.byte 197,252,17,92,36,128 // vmovups %ymm3,-0x80(%rsp)
.byte 197,252,40,225 // vmovaps %ymm1,%ymm4
.byte 197,252,40,216 // vmovaps %ymm0,%ymm3
- .byte 196,98,125,24,5,140,70,0,0 // vbroadcastss 0x468c(%rip),%ymm8 # 5650 <_sk_callback_avx+0x1dd>
+ .byte 196,98,125,24,5,140,70,0,0 // vbroadcastss 0x468c(%rip),%ymm8 # 564c <_sk_callback_avx+0x1dd>
.byte 197,60,194,202,2 // vcmpleps %ymm2,%ymm8,%ymm9
.byte 197,92,89,210 // vmulps %ymm2,%ymm4,%ymm10
.byte 196,65,92,92,218 // vsubps %ymm10,%ymm4,%ymm11
@@ -13185,23 +13181,23 @@ _sk_hsl_to_rgb_avx:
.byte 197,52,88,210 // vaddps %ymm2,%ymm9,%ymm10
.byte 197,108,88,202 // vaddps %ymm2,%ymm2,%ymm9
.byte 196,65,52,92,202 // vsubps %ymm10,%ymm9,%ymm9
- .byte 196,98,125,24,29,102,70,0,0 // vbroadcastss 0x4666(%rip),%ymm11 # 5654 <_sk_callback_avx+0x1e1>
+ .byte 196,98,125,24,29,102,70,0,0 // vbroadcastss 0x4666(%rip),%ymm11 # 5650 <_sk_callback_avx+0x1e1>
.byte 196,65,100,88,219 // vaddps %ymm11,%ymm3,%ymm11
.byte 196,67,125,8,227,1 // vroundps $0x1,%ymm11,%ymm12
.byte 196,65,36,92,252 // vsubps %ymm12,%ymm11,%ymm15
.byte 196,65,44,92,217 // vsubps %ymm9,%ymm10,%ymm11
- .byte 196,98,125,24,37,80,70,0,0 // vbroadcastss 0x4650(%rip),%ymm12 # 565c <_sk_callback_avx+0x1e9>
+ .byte 196,98,125,24,37,80,70,0,0 // vbroadcastss 0x4650(%rip),%ymm12 # 5658 <_sk_callback_avx+0x1e9>
.byte 196,193,4,89,196 // vmulps %ymm12,%ymm15,%ymm0
- .byte 196,98,125,24,45,70,70,0,0 // vbroadcastss 0x4646(%rip),%ymm13 # 5660 <_sk_callback_avx+0x1ed>
+ .byte 196,98,125,24,45,70,70,0,0 // vbroadcastss 0x4646(%rip),%ymm13 # 565c <_sk_callback_avx+0x1ed>
.byte 197,20,92,240 // vsubps %ymm0,%ymm13,%ymm14
.byte 196,65,36,89,246 // vmulps %ymm14,%ymm11,%ymm14
.byte 196,65,52,88,246 // vaddps %ymm14,%ymm9,%ymm14
- .byte 196,226,125,24,13,39,70,0,0 // vbroadcastss 0x4627(%rip),%ymm1 # 5658 <_sk_callback_avx+0x1e5>
+ .byte 196,226,125,24,13,39,70,0,0 // vbroadcastss 0x4627(%rip),%ymm1 # 5654 <_sk_callback_avx+0x1e5>
.byte 196,193,116,194,255,2 // vcmpleps %ymm15,%ymm1,%ymm7
.byte 196,195,13,74,249,112 // vblendvps %ymm7,%ymm9,%ymm14,%ymm7
.byte 196,65,60,194,247,2 // vcmpleps %ymm15,%ymm8,%ymm14
.byte 196,227,45,74,255,224 // vblendvps %ymm14,%ymm7,%ymm10,%ymm7
- .byte 196,98,125,24,53,18,70,0,0 // vbroadcastss 0x4612(%rip),%ymm14 # 5664 <_sk_callback_avx+0x1f1>
+ .byte 196,98,125,24,53,18,70,0,0 // vbroadcastss 0x4612(%rip),%ymm14 # 5660 <_sk_callback_avx+0x1f1>
.byte 196,65,12,194,255,2 // vcmpleps %ymm15,%ymm14,%ymm15
.byte 196,193,124,89,195 // vmulps %ymm11,%ymm0,%ymm0
.byte 197,180,88,192 // vaddps %ymm0,%ymm9,%ymm0
@@ -13220,7 +13216,7 @@ _sk_hsl_to_rgb_avx:
.byte 197,164,89,247 // vmulps %ymm7,%ymm11,%ymm6
.byte 197,180,88,246 // vaddps %ymm6,%ymm9,%ymm6
.byte 196,227,77,74,237,0 // vblendvps %ymm0,%ymm5,%ymm6,%ymm5
- .byte 196,226,125,24,5,180,69,0,0 // vbroadcastss 0x45b4(%rip),%ymm0 # 5668 <_sk_callback_avx+0x1f5>
+ .byte 196,226,125,24,5,180,69,0,0 // vbroadcastss 0x45b4(%rip),%ymm0 # 5664 <_sk_callback_avx+0x1f5>
.byte 197,228,88,192 // vaddps %ymm0,%ymm3,%ymm0
.byte 196,227,125,8,216,1 // vroundps $0x1,%ymm0,%ymm3
.byte 197,252,92,195 // vsubps %ymm3,%ymm0,%ymm0
@@ -13272,14 +13268,14 @@ _sk_scale_u8_avx:
.byte 72,139,0 // mov (%rax),%rax
.byte 72,1,248 // add %rdi,%rax
.byte 77,133,192 // test %r8,%r8
- .byte 117,68 // jne 11ab <_sk_scale_u8_avx+0x54>
+ .byte 117,68 // jne 11a7 <_sk_scale_u8_avx+0x54>
.byte 197,122,126,0 // vmovq (%rax),%xmm8
.byte 196,66,121,49,200 // vpmovzxbd %xmm8,%xmm9
.byte 196,67,121,4,192,229 // vpermilps $0xe5,%xmm8,%xmm8
.byte 196,66,121,49,192 // vpmovzxbd %xmm8,%xmm8
.byte 196,67,53,24,192,1 // vinsertf128 $0x1,%xmm8,%ymm9,%ymm8
.byte 196,65,124,91,192 // vcvtdq2ps %ymm8,%ymm8
- .byte 196,98,125,24,13,221,68,0,0 // vbroadcastss 0x44dd(%rip),%ymm9 # 566c <_sk_callback_avx+0x1f9>
+ .byte 196,98,125,24,13,221,68,0,0 // vbroadcastss 0x44dd(%rip),%ymm9 # 5668 <_sk_callback_avx+0x1f9>
.byte 196,65,60,89,193 // vmulps %ymm9,%ymm8,%ymm8
.byte 197,188,89,192 // vmulps %ymm0,%ymm8,%ymm0
.byte 197,188,89,201 // vmulps %ymm1,%ymm8,%ymm1
@@ -13297,9 +13293,9 @@ _sk_scale_u8_avx:
.byte 77,9,217 // or %r11,%r9
.byte 72,131,193,8 // add $0x8,%rcx
.byte 73,255,202 // dec %r10
- .byte 117,234 // jne 11b3 <_sk_scale_u8_avx+0x5c>
+ .byte 117,234 // jne 11af <_sk_scale_u8_avx+0x5c>
.byte 196,65,249,110,193 // vmovq %r9,%xmm8
- .byte 235,155 // jmp 116b <_sk_scale_u8_avx+0x14>
+ .byte 235,155 // jmp 1167 <_sk_scale_u8_avx+0x14>
HIDDEN _sk_lerp_1_float_avx
.globl _sk_lerp_1_float_avx
@@ -13331,14 +13327,14 @@ _sk_lerp_u8_avx:
.byte 72,139,0 // mov (%rax),%rax
.byte 72,1,248 // add %rdi,%rax
.byte 77,133,192 // test %r8,%r8
- .byte 117,104 // jne 1287 <_sk_lerp_u8_avx+0x78>
+ .byte 117,104 // jne 1283 <_sk_lerp_u8_avx+0x78>
.byte 197,122,126,0 // vmovq (%rax),%xmm8
.byte 196,66,121,49,200 // vpmovzxbd %xmm8,%xmm9
.byte 196,67,121,4,192,229 // vpermilps $0xe5,%xmm8,%xmm8
.byte 196,66,121,49,192 // vpmovzxbd %xmm8,%xmm8
.byte 196,67,53,24,192,1 // vinsertf128 $0x1,%xmm8,%ymm9,%ymm8
.byte 196,65,124,91,192 // vcvtdq2ps %ymm8,%ymm8
- .byte 196,98,125,24,13,41,68,0,0 // vbroadcastss 0x4429(%rip),%ymm9 # 5670 <_sk_callback_avx+0x1fd>
+ .byte 196,98,125,24,13,41,68,0,0 // vbroadcastss 0x4429(%rip),%ymm9 # 566c <_sk_callback_avx+0x1fd>
.byte 196,65,60,89,193 // vmulps %ymm9,%ymm8,%ymm8
.byte 197,252,92,196 // vsubps %ymm4,%ymm0,%ymm0
.byte 196,193,124,89,192 // vmulps %ymm8,%ymm0,%ymm0
@@ -13364,9 +13360,9 @@ _sk_lerp_u8_avx:
.byte 77,9,217 // or %r11,%r9
.byte 72,131,193,8 // add $0x8,%rcx
.byte 73,255,202 // dec %r10
- .byte 117,234 // jne 128f <_sk_lerp_u8_avx+0x80>
+ .byte 117,234 // jne 128b <_sk_lerp_u8_avx+0x80>
.byte 196,65,249,110,193 // vmovq %r9,%xmm8
- .byte 233,116,255,255,255 // jmpq 1223 <_sk_lerp_u8_avx+0x14>
+ .byte 233,116,255,255,255 // jmpq 121f <_sk_lerp_u8_avx+0x14>
HIDDEN _sk_lerp_565_avx
.globl _sk_lerp_565_avx
@@ -13375,26 +13371,26 @@ _sk_lerp_565_avx:
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 76,139,16 // mov (%rax),%r10
.byte 72,133,201 // test %rcx,%rcx
- .byte 15,133,174,0,0,0 // jne 136b <_sk_lerp_565_avx+0xbc>
+ .byte 15,133,174,0,0,0 // jne 1367 <_sk_lerp_565_avx+0xbc>
.byte 196,65,122,111,4,122 // vmovdqu (%r10,%rdi,2),%xmm8
.byte 197,225,239,219 // vpxor %xmm3,%xmm3,%xmm3
.byte 197,185,105,219 // vpunpckhwd %xmm3,%xmm8,%xmm3
.byte 196,66,121,51,192 // vpmovzxwd %xmm8,%xmm8
.byte 196,227,61,24,219,1 // vinsertf128 $0x1,%xmm3,%ymm8,%ymm3
- .byte 196,98,125,24,5,149,67,0,0 // vbroadcastss 0x4395(%rip),%ymm8 # 5674 <_sk_callback_avx+0x201>
+ .byte 196,98,125,24,5,149,67,0,0 // vbroadcastss 0x4395(%rip),%ymm8 # 5670 <_sk_callback_avx+0x201>
.byte 196,65,100,84,192 // vandps %ymm8,%ymm3,%ymm8
.byte 196,65,124,91,192 // vcvtdq2ps %ymm8,%ymm8
- .byte 196,98,125,24,13,134,67,0,0 // vbroadcastss 0x4386(%rip),%ymm9 # 5678 <_sk_callback_avx+0x205>
+ .byte 196,98,125,24,13,134,67,0,0 // vbroadcastss 0x4386(%rip),%ymm9 # 5674 <_sk_callback_avx+0x205>
.byte 196,65,60,89,193 // vmulps %ymm9,%ymm8,%ymm8
- .byte 196,98,125,24,13,124,67,0,0 // vbroadcastss 0x437c(%rip),%ymm9 # 567c <_sk_callback_avx+0x209>
+ .byte 196,98,125,24,13,124,67,0,0 // vbroadcastss 0x437c(%rip),%ymm9 # 5678 <_sk_callback_avx+0x209>
.byte 196,65,100,84,201 // vandps %ymm9,%ymm3,%ymm9
.byte 196,65,124,91,201 // vcvtdq2ps %ymm9,%ymm9
- .byte 196,98,125,24,21,109,67,0,0 // vbroadcastss 0x436d(%rip),%ymm10 # 5680 <_sk_callback_avx+0x20d>
+ .byte 196,98,125,24,21,109,67,0,0 // vbroadcastss 0x436d(%rip),%ymm10 # 567c <_sk_callback_avx+0x20d>
.byte 196,65,52,89,202 // vmulps %ymm10,%ymm9,%ymm9
- .byte 196,98,125,24,21,99,67,0,0 // vbroadcastss 0x4363(%rip),%ymm10 # 5684 <_sk_callback_avx+0x211>
+ .byte 196,98,125,24,21,99,67,0,0 // vbroadcastss 0x4363(%rip),%ymm10 # 5680 <_sk_callback_avx+0x211>
.byte 196,193,100,84,218 // vandps %ymm10,%ymm3,%ymm3
.byte 197,252,91,219 // vcvtdq2ps %ymm3,%ymm3
- .byte 196,98,125,24,21,85,67,0,0 // vbroadcastss 0x4355(%rip),%ymm10 # 5688 <_sk_callback_avx+0x215>
+ .byte 196,98,125,24,21,85,67,0,0 // vbroadcastss 0x4355(%rip),%ymm10 # 5684 <_sk_callback_avx+0x215>
.byte 196,193,100,89,218 // vmulps %ymm10,%ymm3,%ymm3
.byte 197,252,92,196 // vsubps %ymm4,%ymm0,%ymm0
.byte 196,193,124,89,192 // vmulps %ymm8,%ymm0,%ymm0
@@ -13406,16 +13402,16 @@ _sk_lerp_565_avx:
.byte 197,236,89,211 // vmulps %ymm3,%ymm2,%ymm2
.byte 197,236,88,214 // vaddps %ymm6,%ymm2,%ymm2
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 196,226,125,24,29,35,67,0,0 // vbroadcastss 0x4323(%rip),%ymm3 # 568c <_sk_callback_avx+0x219>
+ .byte 196,226,125,24,29,35,67,0,0 // vbroadcastss 0x4323(%rip),%ymm3 # 5688 <_sk_callback_avx+0x219>
.byte 255,224 // jmpq *%rax
.byte 65,137,200 // mov %ecx,%r8d
.byte 65,128,224,7 // and $0x7,%r8b
.byte 196,65,57,239,192 // vpxor %xmm8,%xmm8,%xmm8
.byte 65,254,200 // dec %r8b
.byte 65,128,248,6 // cmp $0x6,%r8b
- .byte 15,135,63,255,255,255 // ja 12c3 <_sk_lerp_565_avx+0x14>
+ .byte 15,135,63,255,255,255 // ja 12bf <_sk_lerp_565_avx+0x14>
.byte 69,15,182,192 // movzbl %r8b,%r8d
- .byte 76,141,13,73,0,0,0 // lea 0x49(%rip),%r9 # 13d8 <_sk_lerp_565_avx+0x129>
+ .byte 76,141,13,73,0,0,0 // lea 0x49(%rip),%r9 # 13d4 <_sk_lerp_565_avx+0x129>
.byte 75,99,4,129 // movslq (%r9,%r8,4),%rax
.byte 76,1,200 // add %r9,%rax
.byte 255,224 // jmpq *%rax
@@ -13427,7 +13423,7 @@ _sk_lerp_565_avx:
.byte 196,65,57,196,68,122,4,2 // vpinsrw $0x2,0x4(%r10,%rdi,2),%xmm8,%xmm8
.byte 196,65,57,196,68,122,2,1 // vpinsrw $0x1,0x2(%r10,%rdi,2),%xmm8,%xmm8
.byte 196,65,57,196,4,122,0 // vpinsrw $0x0,(%r10,%rdi,2),%xmm8,%xmm8
- .byte 233,235,254,255,255 // jmpq 12c3 <_sk_lerp_565_avx+0x14>
+ .byte 233,235,254,255,255 // jmpq 12bf <_sk_lerp_565_avx+0x14>
.byte 244 // hlt
.byte 255 // (bad)
.byte 255 // (bad)
@@ -13459,7 +13455,7 @@ _sk_load_tables_avx:
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 76,139,0 // mov (%rax),%r8
.byte 72,133,201 // test %rcx,%rcx
- .byte 15,133,26,2,0,0 // jne 161c <_sk_load_tables_avx+0x228>
+ .byte 15,133,26,2,0,0 // jne 1618 <_sk_load_tables_avx+0x228>
.byte 196,65,124,16,4,184 // vmovups (%r8,%rdi,4),%ymm8
.byte 85 // push %rbp
.byte 65,87 // push %r15
@@ -13467,7 +13463,7 @@ _sk_load_tables_avx:
.byte 65,85 // push %r13
.byte 65,84 // push %r12
.byte 83 // push %rbx
- .byte 197,124,40,13,70,69,0,0 // vmovaps 0x4546(%rip),%ymm9 # 5960 <_sk_callback_avx+0x4ed>
+ .byte 197,124,40,13,74,69,0,0 // vmovaps 0x454a(%rip),%ymm9 # 5960 <_sk_callback_avx+0x4f1>
.byte 196,193,60,84,193 // vandps %ymm9,%ymm8,%ymm0
.byte 196,193,249,126,193 // vmovq %xmm0,%r9
.byte 69,137,203 // mov %r9d,%r11d
@@ -13559,7 +13555,7 @@ _sk_load_tables_avx:
.byte 196,193,97,114,210,24 // vpsrld $0x18,%xmm10,%xmm3
.byte 196,227,61,24,219,1 // vinsertf128 $0x1,%xmm3,%ymm8,%ymm3
.byte 197,252,91,219 // vcvtdq2ps %ymm3,%ymm3
- .byte 196,98,125,24,5,135,64,0,0 // vbroadcastss 0x4087(%rip),%ymm8 # 5690 <_sk_callback_avx+0x21d>
+ .byte 196,98,125,24,5,135,64,0,0 // vbroadcastss 0x4087(%rip),%ymm8 # 568c <_sk_callback_avx+0x21d>
.byte 196,193,100,89,216 // vmulps %ymm8,%ymm3,%ymm3
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 91 // pop %rbx
@@ -13574,9 +13570,9 @@ _sk_load_tables_avx:
.byte 196,65,60,87,192 // vxorps %ymm8,%ymm8,%ymm8
.byte 65,254,201 // dec %r9b
.byte 65,128,249,6 // cmp $0x6,%r9b
- .byte 15,135,211,253,255,255 // ja 1408 <_sk_load_tables_avx+0x14>
+ .byte 15,135,211,253,255,255 // ja 1404 <_sk_load_tables_avx+0x14>
.byte 69,15,182,201 // movzbl %r9b,%r9d
- .byte 76,141,21,140,0,0,0 // lea 0x8c(%rip),%r10 # 16cc <_sk_load_tables_avx+0x2d8>
+ .byte 76,141,21,140,0,0,0 // lea 0x8c(%rip),%r10 # 16c8 <_sk_load_tables_avx+0x2d8>
.byte 79,99,12,138 // movslq (%r10,%r9,4),%r9
.byte 77,1,209 // add %r10,%r9
.byte 65,255,225 // jmpq *%r9
@@ -13599,7 +13595,7 @@ _sk_load_tables_avx:
.byte 196,99,61,12,192,15 // vblendps $0xf,%ymm0,%ymm8,%ymm8
.byte 196,195,57,34,4,184,0 // vpinsrd $0x0,(%r8,%rdi,4),%xmm8,%xmm0
.byte 196,99,61,12,192,15 // vblendps $0xf,%ymm0,%ymm8,%ymm8
- .byte 233,62,253,255,255 // jmpq 1408 <_sk_load_tables_avx+0x14>
+ .byte 233,62,253,255,255 // jmpq 1404 <_sk_load_tables_avx+0x14>
.byte 102,144 // xchg %ax,%ax
.byte 236 // in (%dx),%al
.byte 255 // (bad)
@@ -13617,7 +13613,7 @@ _sk_load_tables_avx:
.byte 255 // (bad)
.byte 255 // (bad)
.byte 255 // (bad)
- .byte 126,255 // jle 16e5 <_sk_load_tables_avx+0x2f1>
+ .byte 126,255 // jle 16e1 <_sk_load_tables_avx+0x2f1>
.byte 255 // (bad)
.byte 255 // .byte 0xff
@@ -13629,7 +13625,7 @@ _sk_load_tables_u16_be_avx:
.byte 76,139,0 // mov (%rax),%r8
.byte 76,141,12,189,0,0,0,0 // lea 0x0(,%rdi,4),%r9
.byte 72,133,201 // test %rcx,%rcx
- .byte 15,133,113,2,0,0 // jne 196f <_sk_load_tables_u16_be_avx+0x287>
+ .byte 15,133,113,2,0,0 // jne 196b <_sk_load_tables_u16_be_avx+0x287>
.byte 196,1,121,16,4,72 // vmovupd (%r8,%r9,2),%xmm8
.byte 196,129,121,16,84,72,16 // vmovupd 0x10(%r8,%r9,2),%xmm2
.byte 196,129,121,16,92,72,32 // vmovupd 0x20(%r8,%r9,2),%xmm3
@@ -13651,7 +13647,7 @@ _sk_load_tables_u16_be_avx:
.byte 197,177,108,208 // vpunpcklqdq %xmm0,%xmm9,%xmm2
.byte 197,177,109,200 // vpunpckhqdq %xmm0,%xmm9,%xmm1
.byte 196,65,57,108,212 // vpunpcklqdq %xmm12,%xmm8,%xmm10
- .byte 197,121,111,29,134,66,0,0 // vmovdqa 0x4286(%rip),%xmm11 # 59e0 <_sk_callback_avx+0x56d>
+ .byte 197,121,111,29,138,66,0,0 // vmovdqa 0x428a(%rip),%xmm11 # 59e0 <_sk_callback_avx+0x571>
.byte 196,193,105,219,195 // vpand %xmm11,%xmm2,%xmm0
.byte 196,65,49,239,201 // vpxor %xmm9,%xmm9,%xmm9
.byte 196,193,121,105,209 // vpunpckhwd %xmm9,%xmm0,%xmm2
@@ -13750,7 +13746,7 @@ _sk_load_tables_u16_be_avx:
.byte 196,226,121,51,219 // vpmovzxwd %xmm3,%xmm3
.byte 196,195,101,24,216,1 // vinsertf128 $0x1,%xmm8,%ymm3,%ymm3
.byte 197,252,91,219 // vcvtdq2ps %ymm3,%ymm3
- .byte 196,98,125,24,5,56,61,0,0 // vbroadcastss 0x3d38(%rip),%ymm8 # 5694 <_sk_callback_avx+0x221>
+ .byte 196,98,125,24,5,56,61,0,0 // vbroadcastss 0x3d38(%rip),%ymm8 # 5690 <_sk_callback_avx+0x221>
.byte 196,193,100,89,216 // vmulps %ymm8,%ymm3,%ymm3
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 91 // pop %rbx
@@ -13763,29 +13759,29 @@ _sk_load_tables_u16_be_avx:
.byte 196,1,123,16,4,72 // vmovsd (%r8,%r9,2),%xmm8
.byte 196,65,49,239,201 // vpxor %xmm9,%xmm9,%xmm9
.byte 72,131,249,1 // cmp $0x1,%rcx
- .byte 116,85 // je 19d5 <_sk_load_tables_u16_be_avx+0x2ed>
+ .byte 116,85 // je 19d1 <_sk_load_tables_u16_be_avx+0x2ed>
.byte 196,1,57,22,68,72,8 // vmovhpd 0x8(%r8,%r9,2),%xmm8,%xmm8
.byte 72,131,249,3 // cmp $0x3,%rcx
- .byte 114,72 // jb 19d5 <_sk_load_tables_u16_be_avx+0x2ed>
+ .byte 114,72 // jb 19d1 <_sk_load_tables_u16_be_avx+0x2ed>
.byte 196,129,123,16,84,72,16 // vmovsd 0x10(%r8,%r9,2),%xmm2
.byte 72,131,249,3 // cmp $0x3,%rcx
- .byte 116,72 // je 19e2 <_sk_load_tables_u16_be_avx+0x2fa>
+ .byte 116,72 // je 19de <_sk_load_tables_u16_be_avx+0x2fa>
.byte 196,129,105,22,84,72,24 // vmovhpd 0x18(%r8,%r9,2),%xmm2,%xmm2
.byte 72,131,249,5 // cmp $0x5,%rcx
- .byte 114,59 // jb 19e2 <_sk_load_tables_u16_be_avx+0x2fa>
+ .byte 114,59 // jb 19de <_sk_load_tables_u16_be_avx+0x2fa>
.byte 196,129,123,16,92,72,32 // vmovsd 0x20(%r8,%r9,2),%xmm3
.byte 72,131,249,5 // cmp $0x5,%rcx
- .byte 15,132,97,253,255,255 // je 1719 <_sk_load_tables_u16_be_avx+0x31>
+ .byte 15,132,97,253,255,255 // je 1715 <_sk_load_tables_u16_be_avx+0x31>
.byte 196,129,97,22,92,72,40 // vmovhpd 0x28(%r8,%r9,2),%xmm3,%xmm3
.byte 72,131,249,7 // cmp $0x7,%rcx
- .byte 15,130,80,253,255,255 // jb 1719 <_sk_load_tables_u16_be_avx+0x31>
+ .byte 15,130,80,253,255,255 // jb 1715 <_sk_load_tables_u16_be_avx+0x31>
.byte 196,1,122,126,76,72,48 // vmovq 0x30(%r8,%r9,2),%xmm9
- .byte 233,68,253,255,255 // jmpq 1719 <_sk_load_tables_u16_be_avx+0x31>
+ .byte 233,68,253,255,255 // jmpq 1715 <_sk_load_tables_u16_be_avx+0x31>
.byte 197,225,87,219 // vxorpd %xmm3,%xmm3,%xmm3
.byte 197,233,87,210 // vxorpd %xmm2,%xmm2,%xmm2
- .byte 233,55,253,255,255 // jmpq 1719 <_sk_load_tables_u16_be_avx+0x31>
+ .byte 233,55,253,255,255 // jmpq 1715 <_sk_load_tables_u16_be_avx+0x31>
.byte 197,225,87,219 // vxorpd %xmm3,%xmm3,%xmm3
- .byte 233,46,253,255,255 // jmpq 1719 <_sk_load_tables_u16_be_avx+0x31>
+ .byte 233,46,253,255,255 // jmpq 1715 <_sk_load_tables_u16_be_avx+0x31>
HIDDEN _sk_load_tables_rgb_u16_be_avx
.globl _sk_load_tables_rgb_u16_be_avx
@@ -13795,7 +13791,7 @@ _sk_load_tables_rgb_u16_be_avx:
.byte 76,139,0 // mov (%rax),%r8
.byte 76,141,12,127 // lea (%rdi,%rdi,2),%r9
.byte 72,133,201 // test %rcx,%rcx
- .byte 15,133,93,2,0,0 // jne 1c5a <_sk_load_tables_rgb_u16_be_avx+0x26f>
+ .byte 15,133,93,2,0,0 // jne 1c56 <_sk_load_tables_rgb_u16_be_avx+0x26f>
.byte 196,129,122,111,4,72 // vmovdqu (%r8,%r9,2),%xmm0
.byte 196,129,122,111,84,72,12 // vmovdqu 0xc(%r8,%r9,2),%xmm2
.byte 196,129,122,111,76,72,24 // vmovdqu 0x18(%r8,%r9,2),%xmm1
@@ -13822,7 +13818,7 @@ _sk_load_tables_rgb_u16_be_avx:
.byte 197,185,108,202 // vpunpcklqdq %xmm2,%xmm8,%xmm1
.byte 197,185,109,210 // vpunpckhqdq %xmm2,%xmm8,%xmm2
.byte 197,121,108,195 // vpunpcklqdq %xmm3,%xmm0,%xmm8
- .byte 197,121,111,13,127,63,0,0 // vmovdqa 0x3f7f(%rip),%xmm9 # 59f0 <_sk_callback_avx+0x57d>
+ .byte 197,121,111,13,131,63,0,0 // vmovdqa 0x3f83(%rip),%xmm9 # 59f0 <_sk_callback_avx+0x581>
.byte 196,193,113,219,193 // vpand %xmm9,%xmm1,%xmm0
.byte 196,65,41,239,210 // vpxor %xmm10,%xmm10,%xmm10
.byte 196,193,121,105,202 // vpunpckhwd %xmm10,%xmm0,%xmm1
@@ -13914,7 +13910,7 @@ _sk_load_tables_rgb_u16_be_avx:
.byte 196,227,105,33,211,48 // vinsertps $0x30,%xmm3,%xmm2,%xmm2
.byte 196,195,109,24,208,1 // vinsertf128 $0x1,%xmm8,%ymm2,%ymm2
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 196,226,125,24,29,74,58,0,0 // vbroadcastss 0x3a4a(%rip),%ymm3 # 5698 <_sk_callback_avx+0x225>
+ .byte 196,226,125,24,29,74,58,0,0 // vbroadcastss 0x3a4a(%rip),%ymm3 # 5694 <_sk_callback_avx+0x225>
.byte 91 // pop %rbx
.byte 65,92 // pop %r12
.byte 65,93 // pop %r13
@@ -13925,36 +13921,36 @@ _sk_load_tables_rgb_u16_be_avx:
.byte 196,129,121,110,4,72 // vmovd (%r8,%r9,2),%xmm0
.byte 196,129,121,196,68,72,4,2 // vpinsrw $0x2,0x4(%r8,%r9,2),%xmm0,%xmm0
.byte 72,131,249,1 // cmp $0x1,%rcx
- .byte 117,5 // jne 1c73 <_sk_load_tables_rgb_u16_be_avx+0x288>
- .byte 233,190,253,255,255 // jmpq 1a31 <_sk_load_tables_rgb_u16_be_avx+0x46>
+ .byte 117,5 // jne 1c6f <_sk_load_tables_rgb_u16_be_avx+0x288>
+ .byte 233,190,253,255,255 // jmpq 1a2d <_sk_load_tables_rgb_u16_be_avx+0x46>
.byte 196,129,121,110,76,72,6 // vmovd 0x6(%r8,%r9,2),%xmm1
.byte 196,1,113,196,68,72,10,2 // vpinsrw $0x2,0xa(%r8,%r9,2),%xmm1,%xmm8
.byte 72,131,249,3 // cmp $0x3,%rcx
- .byte 114,26 // jb 1ca2 <_sk_load_tables_rgb_u16_be_avx+0x2b7>
+ .byte 114,26 // jb 1c9e <_sk_load_tables_rgb_u16_be_avx+0x2b7>
.byte 196,129,121,110,76,72,12 // vmovd 0xc(%r8,%r9,2),%xmm1
.byte 196,129,113,196,84,72,16,2 // vpinsrw $0x2,0x10(%r8,%r9,2),%xmm1,%xmm2
.byte 72,131,249,3 // cmp $0x3,%rcx
- .byte 117,10 // jne 1ca7 <_sk_load_tables_rgb_u16_be_avx+0x2bc>
- .byte 233,143,253,255,255 // jmpq 1a31 <_sk_load_tables_rgb_u16_be_avx+0x46>
- .byte 233,138,253,255,255 // jmpq 1a31 <_sk_load_tables_rgb_u16_be_avx+0x46>
+ .byte 117,10 // jne 1ca3 <_sk_load_tables_rgb_u16_be_avx+0x2bc>
+ .byte 233,143,253,255,255 // jmpq 1a2d <_sk_load_tables_rgb_u16_be_avx+0x46>
+ .byte 233,138,253,255,255 // jmpq 1a2d <_sk_load_tables_rgb_u16_be_avx+0x46>
.byte 196,129,121,110,76,72,18 // vmovd 0x12(%r8,%r9,2),%xmm1
.byte 196,1,113,196,76,72,22,2 // vpinsrw $0x2,0x16(%r8,%r9,2),%xmm1,%xmm9
.byte 72,131,249,5 // cmp $0x5,%rcx
- .byte 114,26 // jb 1cd6 <_sk_load_tables_rgb_u16_be_avx+0x2eb>
+ .byte 114,26 // jb 1cd2 <_sk_load_tables_rgb_u16_be_avx+0x2eb>
.byte 196,129,121,110,76,72,24 // vmovd 0x18(%r8,%r9,2),%xmm1
.byte 196,129,113,196,76,72,28,2 // vpinsrw $0x2,0x1c(%r8,%r9,2),%xmm1,%xmm1
.byte 72,131,249,5 // cmp $0x5,%rcx
- .byte 117,10 // jne 1cdb <_sk_load_tables_rgb_u16_be_avx+0x2f0>
- .byte 233,91,253,255,255 // jmpq 1a31 <_sk_load_tables_rgb_u16_be_avx+0x46>
- .byte 233,86,253,255,255 // jmpq 1a31 <_sk_load_tables_rgb_u16_be_avx+0x46>
+ .byte 117,10 // jne 1cd7 <_sk_load_tables_rgb_u16_be_avx+0x2f0>
+ .byte 233,91,253,255,255 // jmpq 1a2d <_sk_load_tables_rgb_u16_be_avx+0x46>
+ .byte 233,86,253,255,255 // jmpq 1a2d <_sk_load_tables_rgb_u16_be_avx+0x46>
.byte 196,129,121,110,92,72,30 // vmovd 0x1e(%r8,%r9,2),%xmm3
.byte 196,1,97,196,92,72,34,2 // vpinsrw $0x2,0x22(%r8,%r9,2),%xmm3,%xmm11
.byte 72,131,249,7 // cmp $0x7,%rcx
- .byte 114,20 // jb 1d04 <_sk_load_tables_rgb_u16_be_avx+0x319>
+ .byte 114,20 // jb 1d00 <_sk_load_tables_rgb_u16_be_avx+0x319>
.byte 196,129,121,110,92,72,36 // vmovd 0x24(%r8,%r9,2),%xmm3
.byte 196,129,97,196,92,72,40,2 // vpinsrw $0x2,0x28(%r8,%r9,2),%xmm3,%xmm3
- .byte 233,45,253,255,255 // jmpq 1a31 <_sk_load_tables_rgb_u16_be_avx+0x46>
- .byte 233,40,253,255,255 // jmpq 1a31 <_sk_load_tables_rgb_u16_be_avx+0x46>
+ .byte 233,45,253,255,255 // jmpq 1a2d <_sk_load_tables_rgb_u16_be_avx+0x46>
+ .byte 233,40,253,255,255 // jmpq 1a2d <_sk_load_tables_rgb_u16_be_avx+0x46>
HIDDEN _sk_byte_tables_avx
.globl _sk_byte_tables_avx
@@ -13967,7 +13963,7 @@ _sk_byte_tables_avx:
.byte 65,84 // push %r12
.byte 83 // push %rbx
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 196,98,125,24,5,126,57,0,0 // vbroadcastss 0x397e(%rip),%ymm8 # 569c <_sk_callback_avx+0x229>
+ .byte 196,98,125,24,5,126,57,0,0 // vbroadcastss 0x397e(%rip),%ymm8 # 5698 <_sk_callback_avx+0x229>
.byte 196,193,124,89,192 // vmulps %ymm8,%ymm0,%ymm0
.byte 197,253,91,192 // vcvtps2dq %ymm0,%ymm0
.byte 196,195,249,22,192,1 // vpextrq $0x1,%xmm0,%r8
@@ -14004,7 +14000,7 @@ _sk_byte_tables_avx:
.byte 196,226,121,49,192 // vpmovzxbd %xmm0,%xmm0
.byte 196,227,53,24,192,1 // vinsertf128 $0x1,%xmm0,%ymm9,%ymm0
.byte 197,252,91,192 // vcvtdq2ps %ymm0,%ymm0
- .byte 196,98,125,24,13,204,56,0,0 // vbroadcastss 0x38cc(%rip),%ymm9 # 56a0 <_sk_callback_avx+0x22d>
+ .byte 196,98,125,24,13,204,56,0,0 // vbroadcastss 0x38cc(%rip),%ymm9 # 569c <_sk_callback_avx+0x22d>
.byte 196,193,124,89,193 // vmulps %ymm9,%ymm0,%ymm0
.byte 196,193,116,89,200 // vmulps %ymm8,%ymm1,%ymm1
.byte 197,253,91,201 // vcvtps2dq %ymm1,%ymm1
@@ -14166,7 +14162,7 @@ _sk_byte_tables_rgb_avx:
.byte 196,226,121,49,192 // vpmovzxbd %xmm0,%xmm0
.byte 196,227,53,24,192,1 // vinsertf128 $0x1,%xmm0,%ymm9,%ymm0
.byte 197,252,91,192 // vcvtdq2ps %ymm0,%ymm0
- .byte 196,98,125,24,13,242,53,0,0 // vbroadcastss 0x35f2(%rip),%ymm9 # 56a4 <_sk_callback_avx+0x231>
+ .byte 196,98,125,24,13,242,53,0,0 // vbroadcastss 0x35f2(%rip),%ymm9 # 56a0 <_sk_callback_avx+0x231>
.byte 196,193,124,89,193 // vmulps %ymm9,%ymm0,%ymm0
.byte 197,188,89,201 // vmulps %ymm1,%ymm8,%ymm1
.byte 197,253,91,201 // vcvtps2dq %ymm1,%ymm1
@@ -14463,36 +14459,36 @@ _sk_parametric_r_avx:
.byte 196,193,124,88,195 // vaddps %ymm11,%ymm0,%ymm0
.byte 196,98,125,24,16 // vbroadcastss (%rax),%ymm10
.byte 197,124,91,216 // vcvtdq2ps %ymm0,%ymm11
- .byte 196,98,125,24,37,80,49,0,0 // vbroadcastss 0x3150(%rip),%ymm12 # 56a8 <_sk_callback_avx+0x235>
+ .byte 196,98,125,24,37,80,49,0,0 // vbroadcastss 0x3150(%rip),%ymm12 # 56a4 <_sk_callback_avx+0x235>
.byte 196,65,36,89,220 // vmulps %ymm12,%ymm11,%ymm11
- .byte 196,98,125,24,37,70,49,0,0 // vbroadcastss 0x3146(%rip),%ymm12 # 56ac <_sk_callback_avx+0x239>
+ .byte 196,98,125,24,37,70,49,0,0 // vbroadcastss 0x3146(%rip),%ymm12 # 56a8 <_sk_callback_avx+0x239>
.byte 196,193,124,84,196 // vandps %ymm12,%ymm0,%ymm0
- .byte 196,98,125,24,37,60,49,0,0 // vbroadcastss 0x313c(%rip),%ymm12 # 56b0 <_sk_callback_avx+0x23d>
+ .byte 196,98,125,24,37,60,49,0,0 // vbroadcastss 0x313c(%rip),%ymm12 # 56ac <_sk_callback_avx+0x23d>
.byte 196,193,124,86,196 // vorps %ymm12,%ymm0,%ymm0
- .byte 196,98,125,24,37,50,49,0,0 // vbroadcastss 0x3132(%rip),%ymm12 # 56b4 <_sk_callback_avx+0x241>
+ .byte 196,98,125,24,37,50,49,0,0 // vbroadcastss 0x3132(%rip),%ymm12 # 56b0 <_sk_callback_avx+0x241>
.byte 196,65,36,88,220 // vaddps %ymm12,%ymm11,%ymm11
- .byte 196,98,125,24,37,40,49,0,0 // vbroadcastss 0x3128(%rip),%ymm12 # 56b8 <_sk_callback_avx+0x245>
+ .byte 196,98,125,24,37,40,49,0,0 // vbroadcastss 0x3128(%rip),%ymm12 # 56b4 <_sk_callback_avx+0x245>
.byte 196,65,124,89,228 // vmulps %ymm12,%ymm0,%ymm12
.byte 196,65,36,92,220 // vsubps %ymm12,%ymm11,%ymm11
- .byte 196,98,125,24,37,25,49,0,0 // vbroadcastss 0x3119(%rip),%ymm12 # 56bc <_sk_callback_avx+0x249>
+ .byte 196,98,125,24,37,25,49,0,0 // vbroadcastss 0x3119(%rip),%ymm12 # 56b8 <_sk_callback_avx+0x249>
.byte 196,193,124,88,196 // vaddps %ymm12,%ymm0,%ymm0
- .byte 196,98,125,24,37,15,49,0,0 // vbroadcastss 0x310f(%rip),%ymm12 # 56c0 <_sk_callback_avx+0x24d>
+ .byte 196,98,125,24,37,15,49,0,0 // vbroadcastss 0x310f(%rip),%ymm12 # 56bc <_sk_callback_avx+0x24d>
.byte 197,156,94,192 // vdivps %ymm0,%ymm12,%ymm0
.byte 197,164,92,192 // vsubps %ymm0,%ymm11,%ymm0
.byte 197,172,89,192 // vmulps %ymm0,%ymm10,%ymm0
.byte 196,99,125,8,208,1 // vroundps $0x1,%ymm0,%ymm10
.byte 196,65,124,92,210 // vsubps %ymm10,%ymm0,%ymm10
- .byte 196,98,125,24,29,243,48,0,0 // vbroadcastss 0x30f3(%rip),%ymm11 # 56c4 <_sk_callback_avx+0x251>
+ .byte 196,98,125,24,29,243,48,0,0 // vbroadcastss 0x30f3(%rip),%ymm11 # 56c0 <_sk_callback_avx+0x251>
.byte 196,193,124,88,195 // vaddps %ymm11,%ymm0,%ymm0
- .byte 196,98,125,24,29,233,48,0,0 // vbroadcastss 0x30e9(%rip),%ymm11 # 56c8 <_sk_callback_avx+0x255>
+ .byte 196,98,125,24,29,233,48,0,0 // vbroadcastss 0x30e9(%rip),%ymm11 # 56c4 <_sk_callback_avx+0x255>
.byte 196,65,44,89,219 // vmulps %ymm11,%ymm10,%ymm11
.byte 196,193,124,92,195 // vsubps %ymm11,%ymm0,%ymm0
- .byte 196,98,125,24,29,218,48,0,0 // vbroadcastss 0x30da(%rip),%ymm11 # 56cc <_sk_callback_avx+0x259>
+ .byte 196,98,125,24,29,218,48,0,0 // vbroadcastss 0x30da(%rip),%ymm11 # 56c8 <_sk_callback_avx+0x259>
.byte 196,65,36,92,210 // vsubps %ymm10,%ymm11,%ymm10
- .byte 196,98,125,24,29,208,48,0,0 // vbroadcastss 0x30d0(%rip),%ymm11 # 56d0 <_sk_callback_avx+0x25d>
+ .byte 196,98,125,24,29,208,48,0,0 // vbroadcastss 0x30d0(%rip),%ymm11 # 56cc <_sk_callback_avx+0x25d>
.byte 196,65,36,94,210 // vdivps %ymm10,%ymm11,%ymm10
.byte 196,193,124,88,194 // vaddps %ymm10,%ymm0,%ymm0
- .byte 196,98,125,24,21,193,48,0,0 // vbroadcastss 0x30c1(%rip),%ymm10 # 56d4 <_sk_callback_avx+0x261>
+ .byte 196,98,125,24,21,193,48,0,0 // vbroadcastss 0x30c1(%rip),%ymm10 # 56d0 <_sk_callback_avx+0x261>
.byte 196,193,124,89,194 // vmulps %ymm10,%ymm0,%ymm0
.byte 197,253,91,192 // vcvtps2dq %ymm0,%ymm0
.byte 196,98,125,24,80,20 // vbroadcastss 0x14(%rax),%ymm10
@@ -14500,7 +14496,7 @@ _sk_parametric_r_avx:
.byte 196,195,125,74,193,128 // vblendvps %ymm8,%ymm9,%ymm0,%ymm0
.byte 196,65,60,87,192 // vxorps %ymm8,%ymm8,%ymm8
.byte 196,193,124,95,192 // vmaxps %ymm8,%ymm0,%ymm0
- .byte 196,98,125,24,5,152,48,0,0 // vbroadcastss 0x3098(%rip),%ymm8 # 56d8 <_sk_callback_avx+0x265>
+ .byte 196,98,125,24,5,152,48,0,0 // vbroadcastss 0x3098(%rip),%ymm8 # 56d4 <_sk_callback_avx+0x265>
.byte 196,193,124,93,192 // vminps %ymm8,%ymm0,%ymm0
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 255,224 // jmpq *%rax
@@ -14522,36 +14518,36 @@ _sk_parametric_g_avx:
.byte 196,193,116,88,203 // vaddps %ymm11,%ymm1,%ymm1
.byte 196,98,125,24,16 // vbroadcastss (%rax),%ymm10
.byte 197,124,91,217 // vcvtdq2ps %ymm1,%ymm11
- .byte 196,98,125,24,37,73,48,0,0 // vbroadcastss 0x3049(%rip),%ymm12 # 56dc <_sk_callback_avx+0x269>
+ .byte 196,98,125,24,37,73,48,0,0 // vbroadcastss 0x3049(%rip),%ymm12 # 56d8 <_sk_callback_avx+0x269>
.byte 196,65,36,89,220 // vmulps %ymm12,%ymm11,%ymm11
- .byte 196,98,125,24,37,63,48,0,0 // vbroadcastss 0x303f(%rip),%ymm12 # 56e0 <_sk_callback_avx+0x26d>
+ .byte 196,98,125,24,37,63,48,0,0 // vbroadcastss 0x303f(%rip),%ymm12 # 56dc <_sk_callback_avx+0x26d>
.byte 196,193,116,84,204 // vandps %ymm12,%ymm1,%ymm1
- .byte 196,98,125,24,37,53,48,0,0 // vbroadcastss 0x3035(%rip),%ymm12 # 56e4 <_sk_callback_avx+0x271>
+ .byte 196,98,125,24,37,53,48,0,0 // vbroadcastss 0x3035(%rip),%ymm12 # 56e0 <_sk_callback_avx+0x271>
.byte 196,193,116,86,204 // vorps %ymm12,%ymm1,%ymm1
- .byte 196,98,125,24,37,43,48,0,0 // vbroadcastss 0x302b(%rip),%ymm12 # 56e8 <_sk_callback_avx+0x275>
+ .byte 196,98,125,24,37,43,48,0,0 // vbroadcastss 0x302b(%rip),%ymm12 # 56e4 <_sk_callback_avx+0x275>
.byte 196,65,36,88,220 // vaddps %ymm12,%ymm11,%ymm11
- .byte 196,98,125,24,37,33,48,0,0 // vbroadcastss 0x3021(%rip),%ymm12 # 56ec <_sk_callback_avx+0x279>
+ .byte 196,98,125,24,37,33,48,0,0 // vbroadcastss 0x3021(%rip),%ymm12 # 56e8 <_sk_callback_avx+0x279>
.byte 196,65,116,89,228 // vmulps %ymm12,%ymm1,%ymm12
.byte 196,65,36,92,220 // vsubps %ymm12,%ymm11,%ymm11
- .byte 196,98,125,24,37,18,48,0,0 // vbroadcastss 0x3012(%rip),%ymm12 # 56f0 <_sk_callback_avx+0x27d>
+ .byte 196,98,125,24,37,18,48,0,0 // vbroadcastss 0x3012(%rip),%ymm12 # 56ec <_sk_callback_avx+0x27d>
.byte 196,193,116,88,204 // vaddps %ymm12,%ymm1,%ymm1
- .byte 196,98,125,24,37,8,48,0,0 // vbroadcastss 0x3008(%rip),%ymm12 # 56f4 <_sk_callback_avx+0x281>
+ .byte 196,98,125,24,37,8,48,0,0 // vbroadcastss 0x3008(%rip),%ymm12 # 56f0 <_sk_callback_avx+0x281>
.byte 197,156,94,201 // vdivps %ymm1,%ymm12,%ymm1
.byte 197,164,92,201 // vsubps %ymm1,%ymm11,%ymm1
.byte 197,172,89,201 // vmulps %ymm1,%ymm10,%ymm1
.byte 196,99,125,8,209,1 // vroundps $0x1,%ymm1,%ymm10
.byte 196,65,116,92,210 // vsubps %ymm10,%ymm1,%ymm10
- .byte 196,98,125,24,29,236,47,0,0 // vbroadcastss 0x2fec(%rip),%ymm11 # 56f8 <_sk_callback_avx+0x285>
+ .byte 196,98,125,24,29,236,47,0,0 // vbroadcastss 0x2fec(%rip),%ymm11 # 56f4 <_sk_callback_avx+0x285>
.byte 196,193,116,88,203 // vaddps %ymm11,%ymm1,%ymm1
- .byte 196,98,125,24,29,226,47,0,0 // vbroadcastss 0x2fe2(%rip),%ymm11 # 56fc <_sk_callback_avx+0x289>
+ .byte 196,98,125,24,29,226,47,0,0 // vbroadcastss 0x2fe2(%rip),%ymm11 # 56f8 <_sk_callback_avx+0x289>
.byte 196,65,44,89,219 // vmulps %ymm11,%ymm10,%ymm11
.byte 196,193,116,92,203 // vsubps %ymm11,%ymm1,%ymm1
- .byte 196,98,125,24,29,211,47,0,0 // vbroadcastss 0x2fd3(%rip),%ymm11 # 5700 <_sk_callback_avx+0x28d>
+ .byte 196,98,125,24,29,211,47,0,0 // vbroadcastss 0x2fd3(%rip),%ymm11 # 56fc <_sk_callback_avx+0x28d>
.byte 196,65,36,92,210 // vsubps %ymm10,%ymm11,%ymm10
- .byte 196,98,125,24,29,201,47,0,0 // vbroadcastss 0x2fc9(%rip),%ymm11 # 5704 <_sk_callback_avx+0x291>
+ .byte 196,98,125,24,29,201,47,0,0 // vbroadcastss 0x2fc9(%rip),%ymm11 # 5700 <_sk_callback_avx+0x291>
.byte 196,65,36,94,210 // vdivps %ymm10,%ymm11,%ymm10
.byte 196,193,116,88,202 // vaddps %ymm10,%ymm1,%ymm1
- .byte 196,98,125,24,21,186,47,0,0 // vbroadcastss 0x2fba(%rip),%ymm10 # 5708 <_sk_callback_avx+0x295>
+ .byte 196,98,125,24,21,186,47,0,0 // vbroadcastss 0x2fba(%rip),%ymm10 # 5704 <_sk_callback_avx+0x295>
.byte 196,193,116,89,202 // vmulps %ymm10,%ymm1,%ymm1
.byte 197,253,91,201 // vcvtps2dq %ymm1,%ymm1
.byte 196,98,125,24,80,20 // vbroadcastss 0x14(%rax),%ymm10
@@ -14559,7 +14555,7 @@ _sk_parametric_g_avx:
.byte 196,195,117,74,201,128 // vblendvps %ymm8,%ymm9,%ymm1,%ymm1
.byte 196,65,60,87,192 // vxorps %ymm8,%ymm8,%ymm8
.byte 196,193,116,95,200 // vmaxps %ymm8,%ymm1,%ymm1
- .byte 196,98,125,24,5,145,47,0,0 // vbroadcastss 0x2f91(%rip),%ymm8 # 570c <_sk_callback_avx+0x299>
+ .byte 196,98,125,24,5,145,47,0,0 // vbroadcastss 0x2f91(%rip),%ymm8 # 5708 <_sk_callback_avx+0x299>
.byte 196,193,116,93,200 // vminps %ymm8,%ymm1,%ymm1
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 255,224 // jmpq *%rax
@@ -14581,36 +14577,36 @@ _sk_parametric_b_avx:
.byte 196,193,108,88,211 // vaddps %ymm11,%ymm2,%ymm2
.byte 196,98,125,24,16 // vbroadcastss (%rax),%ymm10
.byte 197,124,91,218 // vcvtdq2ps %ymm2,%ymm11
- .byte 196,98,125,24,37,66,47,0,0 // vbroadcastss 0x2f42(%rip),%ymm12 # 5710 <_sk_callback_avx+0x29d>
+ .byte 196,98,125,24,37,66,47,0,0 // vbroadcastss 0x2f42(%rip),%ymm12 # 570c <_sk_callback_avx+0x29d>
.byte 196,65,36,89,220 // vmulps %ymm12,%ymm11,%ymm11
- .byte 196,98,125,24,37,56,47,0,0 // vbroadcastss 0x2f38(%rip),%ymm12 # 5714 <_sk_callback_avx+0x2a1>
+ .byte 196,98,125,24,37,56,47,0,0 // vbroadcastss 0x2f38(%rip),%ymm12 # 5710 <_sk_callback_avx+0x2a1>
.byte 196,193,108,84,212 // vandps %ymm12,%ymm2,%ymm2
- .byte 196,98,125,24,37,46,47,0,0 // vbroadcastss 0x2f2e(%rip),%ymm12 # 5718 <_sk_callback_avx+0x2a5>
+ .byte 196,98,125,24,37,46,47,0,0 // vbroadcastss 0x2f2e(%rip),%ymm12 # 5714 <_sk_callback_avx+0x2a5>
.byte 196,193,108,86,212 // vorps %ymm12,%ymm2,%ymm2
- .byte 196,98,125,24,37,36,47,0,0 // vbroadcastss 0x2f24(%rip),%ymm12 # 571c <_sk_callback_avx+0x2a9>
+ .byte 196,98,125,24,37,36,47,0,0 // vbroadcastss 0x2f24(%rip),%ymm12 # 5718 <_sk_callback_avx+0x2a9>
.byte 196,65,36,88,220 // vaddps %ymm12,%ymm11,%ymm11
- .byte 196,98,125,24,37,26,47,0,0 // vbroadcastss 0x2f1a(%rip),%ymm12 # 5720 <_sk_callback_avx+0x2ad>
+ .byte 196,98,125,24,37,26,47,0,0 // vbroadcastss 0x2f1a(%rip),%ymm12 # 571c <_sk_callback_avx+0x2ad>
.byte 196,65,108,89,228 // vmulps %ymm12,%ymm2,%ymm12
.byte 196,65,36,92,220 // vsubps %ymm12,%ymm11,%ymm11
- .byte 196,98,125,24,37,11,47,0,0 // vbroadcastss 0x2f0b(%rip),%ymm12 # 5724 <_sk_callback_avx+0x2b1>
+ .byte 196,98,125,24,37,11,47,0,0 // vbroadcastss 0x2f0b(%rip),%ymm12 # 5720 <_sk_callback_avx+0x2b1>
.byte 196,193,108,88,212 // vaddps %ymm12,%ymm2,%ymm2
- .byte 196,98,125,24,37,1,47,0,0 // vbroadcastss 0x2f01(%rip),%ymm12 # 5728 <_sk_callback_avx+0x2b5>
+ .byte 196,98,125,24,37,1,47,0,0 // vbroadcastss 0x2f01(%rip),%ymm12 # 5724 <_sk_callback_avx+0x2b5>
.byte 197,156,94,210 // vdivps %ymm2,%ymm12,%ymm2
.byte 197,164,92,210 // vsubps %ymm2,%ymm11,%ymm2
.byte 197,172,89,210 // vmulps %ymm2,%ymm10,%ymm2
.byte 196,99,125,8,210,1 // vroundps $0x1,%ymm2,%ymm10
.byte 196,65,108,92,210 // vsubps %ymm10,%ymm2,%ymm10
- .byte 196,98,125,24,29,229,46,0,0 // vbroadcastss 0x2ee5(%rip),%ymm11 # 572c <_sk_callback_avx+0x2b9>
+ .byte 196,98,125,24,29,229,46,0,0 // vbroadcastss 0x2ee5(%rip),%ymm11 # 5728 <_sk_callback_avx+0x2b9>
.byte 196,193,108,88,211 // vaddps %ymm11,%ymm2,%ymm2
- .byte 196,98,125,24,29,219,46,0,0 // vbroadcastss 0x2edb(%rip),%ymm11 # 5730 <_sk_callback_avx+0x2bd>
+ .byte 196,98,125,24,29,219,46,0,0 // vbroadcastss 0x2edb(%rip),%ymm11 # 572c <_sk_callback_avx+0x2bd>
.byte 196,65,44,89,219 // vmulps %ymm11,%ymm10,%ymm11
.byte 196,193,108,92,211 // vsubps %ymm11,%ymm2,%ymm2
- .byte 196,98,125,24,29,204,46,0,0 // vbroadcastss 0x2ecc(%rip),%ymm11 # 5734 <_sk_callback_avx+0x2c1>
+ .byte 196,98,125,24,29,204,46,0,0 // vbroadcastss 0x2ecc(%rip),%ymm11 # 5730 <_sk_callback_avx+0x2c1>
.byte 196,65,36,92,210 // vsubps %ymm10,%ymm11,%ymm10
- .byte 196,98,125,24,29,194,46,0,0 // vbroadcastss 0x2ec2(%rip),%ymm11 # 5738 <_sk_callback_avx+0x2c5>
+ .byte 196,98,125,24,29,194,46,0,0 // vbroadcastss 0x2ec2(%rip),%ymm11 # 5734 <_sk_callback_avx+0x2c5>
.byte 196,65,36,94,210 // vdivps %ymm10,%ymm11,%ymm10
.byte 196,193,108,88,210 // vaddps %ymm10,%ymm2,%ymm2
- .byte 196,98,125,24,21,179,46,0,0 // vbroadcastss 0x2eb3(%rip),%ymm10 # 573c <_sk_callback_avx+0x2c9>
+ .byte 196,98,125,24,21,179,46,0,0 // vbroadcastss 0x2eb3(%rip),%ymm10 # 5738 <_sk_callback_avx+0x2c9>
.byte 196,193,108,89,210 // vmulps %ymm10,%ymm2,%ymm2
.byte 197,253,91,210 // vcvtps2dq %ymm2,%ymm2
.byte 196,98,125,24,80,20 // vbroadcastss 0x14(%rax),%ymm10
@@ -14618,7 +14614,7 @@ _sk_parametric_b_avx:
.byte 196,195,109,74,209,128 // vblendvps %ymm8,%ymm9,%ymm2,%ymm2
.byte 196,65,60,87,192 // vxorps %ymm8,%ymm8,%ymm8
.byte 196,193,108,95,208 // vmaxps %ymm8,%ymm2,%ymm2
- .byte 196,98,125,24,5,138,46,0,0 // vbroadcastss 0x2e8a(%rip),%ymm8 # 5740 <_sk_callback_avx+0x2cd>
+ .byte 196,98,125,24,5,138,46,0,0 // vbroadcastss 0x2e8a(%rip),%ymm8 # 573c <_sk_callback_avx+0x2cd>
.byte 196,193,108,93,208 // vminps %ymm8,%ymm2,%ymm2
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 255,224 // jmpq *%rax
@@ -14640,36 +14636,36 @@ _sk_parametric_a_avx:
.byte 196,193,100,88,219 // vaddps %ymm11,%ymm3,%ymm3
.byte 196,98,125,24,16 // vbroadcastss (%rax),%ymm10
.byte 197,124,91,219 // vcvtdq2ps %ymm3,%ymm11
- .byte 196,98,125,24,37,59,46,0,0 // vbroadcastss 0x2e3b(%rip),%ymm12 # 5744 <_sk_callback_avx+0x2d1>
+ .byte 196,98,125,24,37,59,46,0,0 // vbroadcastss 0x2e3b(%rip),%ymm12 # 5740 <_sk_callback_avx+0x2d1>
.byte 196,65,36,89,220 // vmulps %ymm12,%ymm11,%ymm11
- .byte 196,98,125,24,37,49,46,0,0 // vbroadcastss 0x2e31(%rip),%ymm12 # 5748 <_sk_callback_avx+0x2d5>
+ .byte 196,98,125,24,37,49,46,0,0 // vbroadcastss 0x2e31(%rip),%ymm12 # 5744 <_sk_callback_avx+0x2d5>
.byte 196,193,100,84,220 // vandps %ymm12,%ymm3,%ymm3
- .byte 196,98,125,24,37,39,46,0,0 // vbroadcastss 0x2e27(%rip),%ymm12 # 574c <_sk_callback_avx+0x2d9>
+ .byte 196,98,125,24,37,39,46,0,0 // vbroadcastss 0x2e27(%rip),%ymm12 # 5748 <_sk_callback_avx+0x2d9>
.byte 196,193,100,86,220 // vorps %ymm12,%ymm3,%ymm3
- .byte 196,98,125,24,37,29,46,0,0 // vbroadcastss 0x2e1d(%rip),%ymm12 # 5750 <_sk_callback_avx+0x2dd>
+ .byte 196,98,125,24,37,29,46,0,0 // vbroadcastss 0x2e1d(%rip),%ymm12 # 574c <_sk_callback_avx+0x2dd>
.byte 196,65,36,88,220 // vaddps %ymm12,%ymm11,%ymm11
- .byte 196,98,125,24,37,19,46,0,0 // vbroadcastss 0x2e13(%rip),%ymm12 # 5754 <_sk_callback_avx+0x2e1>
+ .byte 196,98,125,24,37,19,46,0,0 // vbroadcastss 0x2e13(%rip),%ymm12 # 5750 <_sk_callback_avx+0x2e1>
.byte 196,65,100,89,228 // vmulps %ymm12,%ymm3,%ymm12
.byte 196,65,36,92,220 // vsubps %ymm12,%ymm11,%ymm11
- .byte 196,98,125,24,37,4,46,0,0 // vbroadcastss 0x2e04(%rip),%ymm12 # 5758 <_sk_callback_avx+0x2e5>
+ .byte 196,98,125,24,37,4,46,0,0 // vbroadcastss 0x2e04(%rip),%ymm12 # 5754 <_sk_callback_avx+0x2e5>
.byte 196,193,100,88,220 // vaddps %ymm12,%ymm3,%ymm3
- .byte 196,98,125,24,37,250,45,0,0 // vbroadcastss 0x2dfa(%rip),%ymm12 # 575c <_sk_callback_avx+0x2e9>
+ .byte 196,98,125,24,37,250,45,0,0 // vbroadcastss 0x2dfa(%rip),%ymm12 # 5758 <_sk_callback_avx+0x2e9>
.byte 197,156,94,219 // vdivps %ymm3,%ymm12,%ymm3
.byte 197,164,92,219 // vsubps %ymm3,%ymm11,%ymm3
.byte 197,172,89,219 // vmulps %ymm3,%ymm10,%ymm3
.byte 196,99,125,8,211,1 // vroundps $0x1,%ymm3,%ymm10
.byte 196,65,100,92,210 // vsubps %ymm10,%ymm3,%ymm10
- .byte 196,98,125,24,29,222,45,0,0 // vbroadcastss 0x2dde(%rip),%ymm11 # 5760 <_sk_callback_avx+0x2ed>
+ .byte 196,98,125,24,29,222,45,0,0 // vbroadcastss 0x2dde(%rip),%ymm11 # 575c <_sk_callback_avx+0x2ed>
.byte 196,193,100,88,219 // vaddps %ymm11,%ymm3,%ymm3
- .byte 196,98,125,24,29,212,45,0,0 // vbroadcastss 0x2dd4(%rip),%ymm11 # 5764 <_sk_callback_avx+0x2f1>
+ .byte 196,98,125,24,29,212,45,0,0 // vbroadcastss 0x2dd4(%rip),%ymm11 # 5760 <_sk_callback_avx+0x2f1>
.byte 196,65,44,89,219 // vmulps %ymm11,%ymm10,%ymm11
.byte 196,193,100,92,219 // vsubps %ymm11,%ymm3,%ymm3
- .byte 196,98,125,24,29,197,45,0,0 // vbroadcastss 0x2dc5(%rip),%ymm11 # 5768 <_sk_callback_avx+0x2f5>
+ .byte 196,98,125,24,29,197,45,0,0 // vbroadcastss 0x2dc5(%rip),%ymm11 # 5764 <_sk_callback_avx+0x2f5>
.byte 196,65,36,92,210 // vsubps %ymm10,%ymm11,%ymm10
- .byte 196,98,125,24,29,187,45,0,0 // vbroadcastss 0x2dbb(%rip),%ymm11 # 576c <_sk_callback_avx+0x2f9>
+ .byte 196,98,125,24,29,187,45,0,0 // vbroadcastss 0x2dbb(%rip),%ymm11 # 5768 <_sk_callback_avx+0x2f9>
.byte 196,65,36,94,210 // vdivps %ymm10,%ymm11,%ymm10
.byte 196,193,100,88,218 // vaddps %ymm10,%ymm3,%ymm3
- .byte 196,98,125,24,21,172,45,0,0 // vbroadcastss 0x2dac(%rip),%ymm10 # 5770 <_sk_callback_avx+0x2fd>
+ .byte 196,98,125,24,21,172,45,0,0 // vbroadcastss 0x2dac(%rip),%ymm10 # 576c <_sk_callback_avx+0x2fd>
.byte 196,193,100,89,218 // vmulps %ymm10,%ymm3,%ymm3
.byte 197,253,91,219 // vcvtps2dq %ymm3,%ymm3
.byte 196,98,125,24,80,20 // vbroadcastss 0x14(%rax),%ymm10
@@ -14677,7 +14673,7 @@ _sk_parametric_a_avx:
.byte 196,195,101,74,217,128 // vblendvps %ymm8,%ymm9,%ymm3,%ymm3
.byte 196,65,60,87,192 // vxorps %ymm8,%ymm8,%ymm8
.byte 196,193,100,95,216 // vmaxps %ymm8,%ymm3,%ymm3
- .byte 196,98,125,24,5,131,45,0,0 // vbroadcastss 0x2d83(%rip),%ymm8 # 5774 <_sk_callback_avx+0x301>
+ .byte 196,98,125,24,5,131,45,0,0 // vbroadcastss 0x2d83(%rip),%ymm8 # 5770 <_sk_callback_avx+0x301>
.byte 196,193,100,93,216 // vminps %ymm8,%ymm3,%ymm3
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 255,224 // jmpq *%rax
@@ -14686,31 +14682,31 @@ HIDDEN _sk_lab_to_xyz_avx
.globl _sk_lab_to_xyz_avx
FUNCTION(_sk_lab_to_xyz_avx)
_sk_lab_to_xyz_avx:
- .byte 196,98,125,24,5,117,45,0,0 // vbroadcastss 0x2d75(%rip),%ymm8 # 5778 <_sk_callback_avx+0x305>
+ .byte 196,98,125,24,5,117,45,0,0 // vbroadcastss 0x2d75(%rip),%ymm8 # 5774 <_sk_callback_avx+0x305>
.byte 196,193,124,89,192 // vmulps %ymm8,%ymm0,%ymm0
- .byte 196,98,125,24,5,107,45,0,0 // vbroadcastss 0x2d6b(%rip),%ymm8 # 577c <_sk_callback_avx+0x309>
+ .byte 196,98,125,24,5,107,45,0,0 // vbroadcastss 0x2d6b(%rip),%ymm8 # 5778 <_sk_callback_avx+0x309>
.byte 196,193,116,89,200 // vmulps %ymm8,%ymm1,%ymm1
- .byte 196,98,125,24,13,97,45,0,0 // vbroadcastss 0x2d61(%rip),%ymm9 # 5780 <_sk_callback_avx+0x30d>
+ .byte 196,98,125,24,13,97,45,0,0 // vbroadcastss 0x2d61(%rip),%ymm9 # 577c <_sk_callback_avx+0x30d>
.byte 196,193,116,88,201 // vaddps %ymm9,%ymm1,%ymm1
.byte 196,193,108,89,208 // vmulps %ymm8,%ymm2,%ymm2
.byte 196,193,108,88,209 // vaddps %ymm9,%ymm2,%ymm2
- .byte 196,98,125,24,5,77,45,0,0 // vbroadcastss 0x2d4d(%rip),%ymm8 # 5784 <_sk_callback_avx+0x311>
+ .byte 196,98,125,24,5,77,45,0,0 // vbroadcastss 0x2d4d(%rip),%ymm8 # 5780 <_sk_callback_avx+0x311>
.byte 196,193,124,88,192 // vaddps %ymm8,%ymm0,%ymm0
- .byte 196,98,125,24,5,67,45,0,0 // vbroadcastss 0x2d43(%rip),%ymm8 # 5788 <_sk_callback_avx+0x315>
+ .byte 196,98,125,24,5,67,45,0,0 // vbroadcastss 0x2d43(%rip),%ymm8 # 5784 <_sk_callback_avx+0x315>
.byte 196,193,124,89,192 // vmulps %ymm8,%ymm0,%ymm0
- .byte 196,98,125,24,5,57,45,0,0 // vbroadcastss 0x2d39(%rip),%ymm8 # 578c <_sk_callback_avx+0x319>
+ .byte 196,98,125,24,5,57,45,0,0 // vbroadcastss 0x2d39(%rip),%ymm8 # 5788 <_sk_callback_avx+0x319>
.byte 196,193,116,89,200 // vmulps %ymm8,%ymm1,%ymm1
.byte 197,252,88,201 // vaddps %ymm1,%ymm0,%ymm1
- .byte 196,98,125,24,5,43,45,0,0 // vbroadcastss 0x2d2b(%rip),%ymm8 # 5790 <_sk_callback_avx+0x31d>
+ .byte 196,98,125,24,5,43,45,0,0 // vbroadcastss 0x2d2b(%rip),%ymm8 # 578c <_sk_callback_avx+0x31d>
.byte 196,193,108,89,208 // vmulps %ymm8,%ymm2,%ymm2
.byte 197,252,92,210 // vsubps %ymm2,%ymm0,%ymm2
.byte 197,116,89,193 // vmulps %ymm1,%ymm1,%ymm8
.byte 196,65,116,89,192 // vmulps %ymm8,%ymm1,%ymm8
- .byte 196,98,125,24,13,20,45,0,0 // vbroadcastss 0x2d14(%rip),%ymm9 # 5794 <_sk_callback_avx+0x321>
+ .byte 196,98,125,24,13,20,45,0,0 // vbroadcastss 0x2d14(%rip),%ymm9 # 5790 <_sk_callback_avx+0x321>
.byte 196,65,52,194,208,1 // vcmpltps %ymm8,%ymm9,%ymm10
- .byte 196,98,125,24,29,9,45,0,0 // vbroadcastss 0x2d09(%rip),%ymm11 # 5798 <_sk_callback_avx+0x325>
+ .byte 196,98,125,24,29,9,45,0,0 // vbroadcastss 0x2d09(%rip),%ymm11 # 5794 <_sk_callback_avx+0x325>
.byte 196,193,116,88,203 // vaddps %ymm11,%ymm1,%ymm1
- .byte 196,98,125,24,37,255,44,0,0 // vbroadcastss 0x2cff(%rip),%ymm12 # 579c <_sk_callback_avx+0x329>
+ .byte 196,98,125,24,37,255,44,0,0 // vbroadcastss 0x2cff(%rip),%ymm12 # 5798 <_sk_callback_avx+0x329>
.byte 196,193,116,89,204 // vmulps %ymm12,%ymm1,%ymm1
.byte 196,67,117,74,192,160 // vblendvps %ymm10,%ymm8,%ymm1,%ymm8
.byte 197,252,89,200 // vmulps %ymm0,%ymm0,%ymm1
@@ -14725,9 +14721,9 @@ _sk_lab_to_xyz_avx:
.byte 196,193,108,88,211 // vaddps %ymm11,%ymm2,%ymm2
.byte 196,193,108,89,212 // vmulps %ymm12,%ymm2,%ymm2
.byte 196,227,109,74,208,144 // vblendvps %ymm9,%ymm0,%ymm2,%ymm2
- .byte 196,226,125,24,5,181,44,0,0 // vbroadcastss 0x2cb5(%rip),%ymm0 # 57a0 <_sk_callback_avx+0x32d>
+ .byte 196,226,125,24,5,181,44,0,0 // vbroadcastss 0x2cb5(%rip),%ymm0 # 579c <_sk_callback_avx+0x32d>
.byte 197,188,89,192 // vmulps %ymm0,%ymm8,%ymm0
- .byte 196,98,125,24,5,172,44,0,0 // vbroadcastss 0x2cac(%rip),%ymm8 # 57a4 <_sk_callback_avx+0x331>
+ .byte 196,98,125,24,5,172,44,0,0 // vbroadcastss 0x2cac(%rip),%ymm8 # 57a0 <_sk_callback_avx+0x331>
.byte 196,193,108,89,208 // vmulps %ymm8,%ymm2,%ymm2
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 255,224 // jmpq *%rax
@@ -14741,14 +14737,14 @@ _sk_load_a8_avx:
.byte 72,139,0 // mov (%rax),%rax
.byte 72,1,248 // add %rdi,%rax
.byte 77,133,192 // test %r8,%r8
- .byte 117,62 // jne 2b4f <_sk_load_a8_avx+0x4e>
+ .byte 117,62 // jne 2b4b <_sk_load_a8_avx+0x4e>
.byte 197,250,126,0 // vmovq (%rax),%xmm0
.byte 196,226,121,49,200 // vpmovzxbd %xmm0,%xmm1
.byte 196,227,121,4,192,229 // vpermilps $0xe5,%xmm0,%xmm0
.byte 196,226,121,49,192 // vpmovzxbd %xmm0,%xmm0
.byte 196,227,117,24,192,1 // vinsertf128 $0x1,%xmm0,%ymm1,%ymm0
.byte 197,252,91,192 // vcvtdq2ps %ymm0,%ymm0
- .byte 196,226,125,24,13,112,44,0,0 // vbroadcastss 0x2c70(%rip),%ymm1 # 57a8 <_sk_callback_avx+0x335>
+ .byte 196,226,125,24,13,112,44,0,0 // vbroadcastss 0x2c70(%rip),%ymm1 # 57a4 <_sk_callback_avx+0x335>
.byte 197,252,89,217 // vmulps %ymm1,%ymm0,%ymm3
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 197,252,87,192 // vxorps %ymm0,%ymm0,%ymm0
@@ -14765,9 +14761,9 @@ _sk_load_a8_avx:
.byte 77,9,217 // or %r11,%r9
.byte 72,131,193,8 // add $0x8,%rcx
.byte 73,255,202 // dec %r10
- .byte 117,234 // jne 2b57 <_sk_load_a8_avx+0x56>
+ .byte 117,234 // jne 2b53 <_sk_load_a8_avx+0x56>
.byte 196,193,249,110,193 // vmovq %r9,%xmm0
- .byte 235,161 // jmp 2b15 <_sk_load_a8_avx+0x14>
+ .byte 235,161 // jmp 2b11 <_sk_load_a8_avx+0x14>
HIDDEN _sk_gather_a8_avx
.globl _sk_gather_a8_avx
@@ -14817,7 +14813,7 @@ _sk_gather_a8_avx:
.byte 196,226,121,49,201 // vpmovzxbd %xmm1,%xmm1
.byte 196,227,125,24,193,1 // vinsertf128 $0x1,%xmm1,%ymm0,%ymm0
.byte 197,252,91,192 // vcvtdq2ps %ymm0,%ymm0
- .byte 196,226,125,24,13,101,43,0,0 // vbroadcastss 0x2b65(%rip),%ymm1 # 57ac <_sk_callback_avx+0x339>
+ .byte 196,226,125,24,13,101,43,0,0 // vbroadcastss 0x2b65(%rip),%ymm1 # 57a8 <_sk_callback_avx+0x339>
.byte 197,252,89,217 // vmulps %ymm1,%ymm0,%ymm3
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 197,252,87,192 // vxorps %ymm0,%ymm0,%ymm0
@@ -14835,14 +14831,14 @@ FUNCTION(_sk_store_a8_avx)
_sk_store_a8_avx:
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 76,139,16 // mov (%rax),%r10
- .byte 196,98,125,24,5,64,43,0,0 // vbroadcastss 0x2b40(%rip),%ymm8 # 57b0 <_sk_callback_avx+0x33d>
+ .byte 196,98,125,24,5,64,43,0,0 // vbroadcastss 0x2b40(%rip),%ymm8 # 57ac <_sk_callback_avx+0x33d>
.byte 196,65,100,89,192 // vmulps %ymm8,%ymm3,%ymm8
.byte 196,65,125,91,192 // vcvtps2dq %ymm8,%ymm8
.byte 196,67,125,25,193,1 // vextractf128 $0x1,%ymm8,%xmm9
.byte 196,66,57,43,193 // vpackusdw %xmm9,%xmm8,%xmm8
.byte 196,65,57,103,192 // vpackuswb %xmm8,%xmm8,%xmm8
.byte 72,133,201 // test %rcx,%rcx
- .byte 117,10 // jne 2c99 <_sk_store_a8_avx+0x37>
+ .byte 117,10 // jne 2c95 <_sk_store_a8_avx+0x37>
.byte 196,65,123,17,4,58 // vmovsd %xmm8,(%r10,%rdi,1)
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 255,224 // jmpq *%rax
@@ -14850,10 +14846,10 @@ _sk_store_a8_avx:
.byte 65,128,224,7 // and $0x7,%r8b
.byte 65,254,200 // dec %r8b
.byte 65,128,248,6 // cmp $0x6,%r8b
- .byte 119,236 // ja 2c95 <_sk_store_a8_avx+0x33>
+ .byte 119,236 // ja 2c91 <_sk_store_a8_avx+0x33>
.byte 196,66,121,48,192 // vpmovzxbw %xmm8,%xmm8
.byte 69,15,182,192 // movzbl %r8b,%r8d
- .byte 76,141,13,67,0,0,0 // lea 0x43(%rip),%r9 # 2cfc <_sk_store_a8_avx+0x9a>
+ .byte 76,141,13,67,0,0,0 // lea 0x43(%rip),%r9 # 2cf8 <_sk_store_a8_avx+0x9a>
.byte 75,99,4,129 // movslq (%r9,%r8,4),%rax
.byte 76,1,200 // add %r9,%rax
.byte 255,224 // jmpq *%rax
@@ -14864,7 +14860,7 @@ _sk_store_a8_avx:
.byte 196,67,121,20,68,58,2,4 // vpextrb $0x4,%xmm8,0x2(%r10,%rdi,1)
.byte 196,67,121,20,68,58,1,2 // vpextrb $0x2,%xmm8,0x1(%r10,%rdi,1)
.byte 196,67,121,20,4,58,0 // vpextrb $0x0,%xmm8,(%r10,%rdi,1)
- .byte 235,154 // jmp 2c95 <_sk_store_a8_avx+0x33>
+ .byte 235,154 // jmp 2c91 <_sk_store_a8_avx+0x33>
.byte 144 // nop
.byte 246,255 // idiv %bh
.byte 255 // (bad)
@@ -14898,17 +14894,17 @@ _sk_load_g8_avx:
.byte 72,139,0 // mov (%rax),%rax
.byte 72,1,248 // add %rdi,%rax
.byte 77,133,192 // test %r8,%r8
- .byte 117,67 // jne 2d6b <_sk_load_g8_avx+0x53>
+ .byte 117,67 // jne 2d67 <_sk_load_g8_avx+0x53>
.byte 197,250,126,0 // vmovq (%rax),%xmm0
.byte 196,226,121,49,200 // vpmovzxbd %xmm0,%xmm1
.byte 196,227,121,4,192,229 // vpermilps $0xe5,%xmm0,%xmm0
.byte 196,226,121,49,192 // vpmovzxbd %xmm0,%xmm0
.byte 196,227,117,24,192,1 // vinsertf128 $0x1,%xmm0,%ymm1,%ymm0
.byte 197,252,91,192 // vcvtdq2ps %ymm0,%ymm0
- .byte 196,226,125,24,13,101,42,0,0 // vbroadcastss 0x2a65(%rip),%ymm1 # 57b4 <_sk_callback_avx+0x341>
+ .byte 196,226,125,24,13,101,42,0,0 // vbroadcastss 0x2a65(%rip),%ymm1 # 57b0 <_sk_callback_avx+0x341>
.byte 197,252,89,193 // vmulps %ymm1,%ymm0,%ymm0
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 196,226,125,24,29,90,42,0,0 // vbroadcastss 0x2a5a(%rip),%ymm3 # 57b8 <_sk_callback_avx+0x345>
+ .byte 196,226,125,24,29,90,42,0,0 // vbroadcastss 0x2a5a(%rip),%ymm3 # 57b4 <_sk_callback_avx+0x345>
.byte 76,137,193 // mov %r8,%rcx
.byte 197,252,40,200 // vmovaps %ymm0,%ymm1
.byte 197,252,40,208 // vmovaps %ymm0,%ymm2
@@ -14922,9 +14918,9 @@ _sk_load_g8_avx:
.byte 77,9,217 // or %r11,%r9
.byte 72,131,193,8 // add $0x8,%rcx
.byte 73,255,202 // dec %r10
- .byte 117,234 // jne 2d73 <_sk_load_g8_avx+0x5b>
+ .byte 117,234 // jne 2d6f <_sk_load_g8_avx+0x5b>
.byte 196,193,249,110,193 // vmovq %r9,%xmm0
- .byte 235,156 // jmp 2d2c <_sk_load_g8_avx+0x14>
+ .byte 235,156 // jmp 2d28 <_sk_load_g8_avx+0x14>
HIDDEN _sk_gather_g8_avx
.globl _sk_gather_g8_avx
@@ -14974,10 +14970,10 @@ _sk_gather_g8_avx:
.byte 196,226,121,49,201 // vpmovzxbd %xmm1,%xmm1
.byte 196,227,125,24,193,1 // vinsertf128 $0x1,%xmm1,%ymm0,%ymm0
.byte 197,252,91,192 // vcvtdq2ps %ymm0,%ymm0
- .byte 196,226,125,24,13,89,41,0,0 // vbroadcastss 0x2959(%rip),%ymm1 # 57bc <_sk_callback_avx+0x349>
+ .byte 196,226,125,24,13,89,41,0,0 // vbroadcastss 0x2959(%rip),%ymm1 # 57b8 <_sk_callback_avx+0x349>
.byte 197,252,89,193 // vmulps %ymm1,%ymm0,%ymm0
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 196,226,125,24,29,78,41,0,0 // vbroadcastss 0x294e(%rip),%ymm3 # 57c0 <_sk_callback_avx+0x34d>
+ .byte 196,226,125,24,29,78,41,0,0 // vbroadcastss 0x294e(%rip),%ymm3 # 57bc <_sk_callback_avx+0x34d>
.byte 197,252,40,200 // vmovaps %ymm0,%ymm1
.byte 197,252,40,208 // vmovaps %ymm0,%ymm2
.byte 91 // pop %rbx
@@ -14993,9 +14989,9 @@ _sk_gather_i8_avx:
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 73,137,192 // mov %rax,%r8
.byte 77,133,192 // test %r8,%r8
- .byte 116,5 // je 2e92 <_sk_gather_i8_avx+0xf>
+ .byte 116,5 // je 2e8e <_sk_gather_i8_avx+0xf>
.byte 76,137,192 // mov %r8,%rax
- .byte 235,2 // jmp 2e94 <_sk_gather_i8_avx+0x11>
+ .byte 235,2 // jmp 2e90 <_sk_gather_i8_avx+0x11>
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 65,87 // push %r15
.byte 65,86 // push %r14
@@ -15057,10 +15053,10 @@ _sk_gather_i8_avx:
.byte 196,163,121,34,4,163,2 // vpinsrd $0x2,(%rbx,%r12,4),%xmm0,%xmm0
.byte 196,163,121,34,28,19,3 // vpinsrd $0x3,(%rbx,%r10,1),%xmm0,%xmm3
.byte 196,227,61,24,195,1 // vinsertf128 $0x1,%xmm3,%ymm8,%ymm0
- .byte 197,124,40,21,194,41,0,0 // vmovaps 0x29c2(%rip),%ymm10 # 5980 <_sk_callback_avx+0x50d>
+ .byte 197,124,40,21,198,41,0,0 // vmovaps 0x29c6(%rip),%ymm10 # 5980 <_sk_callback_avx+0x511>
.byte 196,193,124,84,194 // vandps %ymm10,%ymm0,%ymm0
.byte 197,252,91,192 // vcvtdq2ps %ymm0,%ymm0
- .byte 196,98,125,24,13,244,39,0,0 // vbroadcastss 0x27f4(%rip),%ymm9 # 57c4 <_sk_callback_avx+0x351>
+ .byte 196,98,125,24,13,244,39,0,0 // vbroadcastss 0x27f4(%rip),%ymm9 # 57c0 <_sk_callback_avx+0x351>
.byte 196,193,124,89,193 // vmulps %ymm9,%ymm0,%ymm0
.byte 196,193,113,114,208,8 // vpsrld $0x8,%xmm8,%xmm1
.byte 197,233,114,211,8 // vpsrld $0x8,%xmm3,%xmm2
@@ -15094,38 +15090,38 @@ _sk_load_565_avx:
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 76,139,16 // mov (%rax),%r10
.byte 72,133,201 // test %rcx,%rcx
- .byte 15,133,128,0,0,0 // jne 30c8 <_sk_load_565_avx+0x8e>
+ .byte 15,133,128,0,0,0 // jne 30c4 <_sk_load_565_avx+0x8e>
.byte 196,193,122,111,4,122 // vmovdqu (%r10,%rdi,2),%xmm0
.byte 197,241,239,201 // vpxor %xmm1,%xmm1,%xmm1
.byte 197,249,105,201 // vpunpckhwd %xmm1,%xmm0,%xmm1
.byte 196,226,121,51,192 // vpmovzxwd %xmm0,%xmm0
.byte 196,227,125,24,209,1 // vinsertf128 $0x1,%xmm1,%ymm0,%ymm2
- .byte 196,226,125,24,5,94,39,0,0 // vbroadcastss 0x275e(%rip),%ymm0 # 57c8 <_sk_callback_avx+0x355>
+ .byte 196,226,125,24,5,94,39,0,0 // vbroadcastss 0x275e(%rip),%ymm0 # 57c4 <_sk_callback_avx+0x355>
.byte 197,236,84,192 // vandps %ymm0,%ymm2,%ymm0
.byte 197,252,91,192 // vcvtdq2ps %ymm0,%ymm0
- .byte 196,226,125,24,13,81,39,0,0 // vbroadcastss 0x2751(%rip),%ymm1 # 57cc <_sk_callback_avx+0x359>
+ .byte 196,226,125,24,13,81,39,0,0 // vbroadcastss 0x2751(%rip),%ymm1 # 57c8 <_sk_callback_avx+0x359>
.byte 197,252,89,193 // vmulps %ymm1,%ymm0,%ymm0
- .byte 196,226,125,24,13,72,39,0,0 // vbroadcastss 0x2748(%rip),%ymm1 # 57d0 <_sk_callback_avx+0x35d>
+ .byte 196,226,125,24,13,72,39,0,0 // vbroadcastss 0x2748(%rip),%ymm1 # 57cc <_sk_callback_avx+0x35d>
.byte 197,236,84,201 // vandps %ymm1,%ymm2,%ymm1
.byte 197,252,91,201 // vcvtdq2ps %ymm1,%ymm1
- .byte 196,226,125,24,29,59,39,0,0 // vbroadcastss 0x273b(%rip),%ymm3 # 57d4 <_sk_callback_avx+0x361>
+ .byte 196,226,125,24,29,59,39,0,0 // vbroadcastss 0x273b(%rip),%ymm3 # 57d0 <_sk_callback_avx+0x361>
.byte 197,244,89,203 // vmulps %ymm3,%ymm1,%ymm1
- .byte 196,226,125,24,29,50,39,0,0 // vbroadcastss 0x2732(%rip),%ymm3 # 57d8 <_sk_callback_avx+0x365>
+ .byte 196,226,125,24,29,50,39,0,0 // vbroadcastss 0x2732(%rip),%ymm3 # 57d4 <_sk_callback_avx+0x365>
.byte 197,236,84,211 // vandps %ymm3,%ymm2,%ymm2
.byte 197,252,91,210 // vcvtdq2ps %ymm2,%ymm2
- .byte 196,226,125,24,29,37,39,0,0 // vbroadcastss 0x2725(%rip),%ymm3 # 57dc <_sk_callback_avx+0x369>
+ .byte 196,226,125,24,29,37,39,0,0 // vbroadcastss 0x2725(%rip),%ymm3 # 57d8 <_sk_callback_avx+0x369>
.byte 197,236,89,211 // vmulps %ymm3,%ymm2,%ymm2
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 196,226,125,24,29,26,39,0,0 // vbroadcastss 0x271a(%rip),%ymm3 # 57e0 <_sk_callback_avx+0x36d>
+ .byte 196,226,125,24,29,26,39,0,0 // vbroadcastss 0x271a(%rip),%ymm3 # 57dc <_sk_callback_avx+0x36d>
.byte 255,224 // jmpq *%rax
.byte 65,137,200 // mov %ecx,%r8d
.byte 65,128,224,7 // and $0x7,%r8b
.byte 197,249,239,192 // vpxor %xmm0,%xmm0,%xmm0
.byte 65,254,200 // dec %r8b
.byte 65,128,248,6 // cmp $0x6,%r8b
- .byte 15,135,110,255,255,255 // ja 304e <_sk_load_565_avx+0x14>
+ .byte 15,135,110,255,255,255 // ja 304a <_sk_load_565_avx+0x14>
.byte 69,15,182,192 // movzbl %r8b,%r8d
- .byte 76,141,13,73,0,0,0 // lea 0x49(%rip),%r9 # 3134 <_sk_load_565_avx+0xfa>
+ .byte 76,141,13,73,0,0,0 // lea 0x49(%rip),%r9 # 3130 <_sk_load_565_avx+0xfa>
.byte 75,99,4,129 // movslq (%r9,%r8,4),%rax
.byte 76,1,200 // add %r9,%rax
.byte 255,224 // jmpq *%rax
@@ -15137,7 +15133,7 @@ _sk_load_565_avx:
.byte 196,193,121,196,68,122,4,2 // vpinsrw $0x2,0x4(%r10,%rdi,2),%xmm0,%xmm0
.byte 196,193,121,196,68,122,2,1 // vpinsrw $0x1,0x2(%r10,%rdi,2),%xmm0,%xmm0
.byte 196,193,121,196,4,122,0 // vpinsrw $0x0,(%r10,%rdi,2),%xmm0,%xmm0
- .byte 233,26,255,255,255 // jmpq 304e <_sk_load_565_avx+0x14>
+ .byte 233,26,255,255,255 // jmpq 304a <_sk_load_565_avx+0x14>
.byte 244 // hlt
.byte 255 // (bad)
.byte 255 // (bad)
@@ -15215,23 +15211,23 @@ _sk_gather_565_avx:
.byte 197,249,105,201 // vpunpckhwd %xmm1,%xmm0,%xmm1
.byte 196,226,121,51,192 // vpmovzxwd %xmm0,%xmm0
.byte 196,227,125,24,209,1 // vinsertf128 $0x1,%xmm1,%ymm0,%ymm2
- .byte 196,226,125,24,5,186,37,0,0 // vbroadcastss 0x25ba(%rip),%ymm0 # 57e4 <_sk_callback_avx+0x371>
+ .byte 196,226,125,24,5,186,37,0,0 // vbroadcastss 0x25ba(%rip),%ymm0 # 57e0 <_sk_callback_avx+0x371>
.byte 197,236,84,192 // vandps %ymm0,%ymm2,%ymm0
.byte 197,252,91,192 // vcvtdq2ps %ymm0,%ymm0
- .byte 196,226,125,24,13,173,37,0,0 // vbroadcastss 0x25ad(%rip),%ymm1 # 57e8 <_sk_callback_avx+0x375>
+ .byte 196,226,125,24,13,173,37,0,0 // vbroadcastss 0x25ad(%rip),%ymm1 # 57e4 <_sk_callback_avx+0x375>
.byte 197,252,89,193 // vmulps %ymm1,%ymm0,%ymm0
- .byte 196,226,125,24,13,164,37,0,0 // vbroadcastss 0x25a4(%rip),%ymm1 # 57ec <_sk_callback_avx+0x379>
+ .byte 196,226,125,24,13,164,37,0,0 // vbroadcastss 0x25a4(%rip),%ymm1 # 57e8 <_sk_callback_avx+0x379>
.byte 197,236,84,201 // vandps %ymm1,%ymm2,%ymm1
.byte 197,252,91,201 // vcvtdq2ps %ymm1,%ymm1
- .byte 196,226,125,24,29,151,37,0,0 // vbroadcastss 0x2597(%rip),%ymm3 # 57f0 <_sk_callback_avx+0x37d>
+ .byte 196,226,125,24,29,151,37,0,0 // vbroadcastss 0x2597(%rip),%ymm3 # 57ec <_sk_callback_avx+0x37d>
.byte 197,244,89,203 // vmulps %ymm3,%ymm1,%ymm1
- .byte 196,226,125,24,29,142,37,0,0 // vbroadcastss 0x258e(%rip),%ymm3 # 57f4 <_sk_callback_avx+0x381>
+ .byte 196,226,125,24,29,142,37,0,0 // vbroadcastss 0x258e(%rip),%ymm3 # 57f0 <_sk_callback_avx+0x381>
.byte 197,236,84,211 // vandps %ymm3,%ymm2,%ymm2
.byte 197,252,91,210 // vcvtdq2ps %ymm2,%ymm2
- .byte 196,226,125,24,29,129,37,0,0 // vbroadcastss 0x2581(%rip),%ymm3 # 57f8 <_sk_callback_avx+0x385>
+ .byte 196,226,125,24,29,129,37,0,0 // vbroadcastss 0x2581(%rip),%ymm3 # 57f4 <_sk_callback_avx+0x385>
.byte 197,236,89,211 // vmulps %ymm3,%ymm2,%ymm2
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 196,226,125,24,29,118,37,0,0 // vbroadcastss 0x2576(%rip),%ymm3 # 57fc <_sk_callback_avx+0x389>
+ .byte 196,226,125,24,29,118,37,0,0 // vbroadcastss 0x2576(%rip),%ymm3 # 57f8 <_sk_callback_avx+0x389>
.byte 91 // pop %rbx
.byte 65,92 // pop %r12
.byte 65,94 // pop %r14
@@ -15245,14 +15241,14 @@ FUNCTION(_sk_store_565_avx)
_sk_store_565_avx:
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 76,139,16 // mov (%rax),%r10
- .byte 196,98,125,24,5,98,37,0,0 // vbroadcastss 0x2562(%rip),%ymm8 # 5800 <_sk_callback_avx+0x38d>
+ .byte 196,98,125,24,5,98,37,0,0 // vbroadcastss 0x2562(%rip),%ymm8 # 57fc <_sk_callback_avx+0x38d>
.byte 196,65,124,89,200 // vmulps %ymm8,%ymm0,%ymm9
.byte 196,65,125,91,201 // vcvtps2dq %ymm9,%ymm9
.byte 196,193,41,114,241,11 // vpslld $0xb,%xmm9,%xmm10
.byte 196,67,125,25,201,1 // vextractf128 $0x1,%ymm9,%xmm9
.byte 196,193,49,114,241,11 // vpslld $0xb,%xmm9,%xmm9
.byte 196,67,45,24,201,1 // vinsertf128 $0x1,%xmm9,%ymm10,%ymm9
- .byte 196,98,125,24,21,59,37,0,0 // vbroadcastss 0x253b(%rip),%ymm10 # 5804 <_sk_callback_avx+0x391>
+ .byte 196,98,125,24,21,59,37,0,0 // vbroadcastss 0x253b(%rip),%ymm10 # 5800 <_sk_callback_avx+0x391>
.byte 196,65,116,89,210 // vmulps %ymm10,%ymm1,%ymm10
.byte 196,65,125,91,210 // vcvtps2dq %ymm10,%ymm10
.byte 196,193,33,114,242,5 // vpslld $0x5,%xmm10,%xmm11
@@ -15266,7 +15262,7 @@ _sk_store_565_avx:
.byte 196,67,125,25,193,1 // vextractf128 $0x1,%ymm8,%xmm9
.byte 196,66,57,43,193 // vpackusdw %xmm9,%xmm8,%xmm8
.byte 72,133,201 // test %rcx,%rcx
- .byte 117,10 // jne 3319 <_sk_store_565_avx+0x89>
+ .byte 117,10 // jne 3315 <_sk_store_565_avx+0x89>
.byte 196,65,122,127,4,122 // vmovdqu %xmm8,(%r10,%rdi,2)
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 255,224 // jmpq *%rax
@@ -15274,9 +15270,9 @@ _sk_store_565_avx:
.byte 65,128,224,7 // and $0x7,%r8b
.byte 65,254,200 // dec %r8b
.byte 65,128,248,6 // cmp $0x6,%r8b
- .byte 119,236 // ja 3315 <_sk_store_565_avx+0x85>
+ .byte 119,236 // ja 3311 <_sk_store_565_avx+0x85>
.byte 69,15,182,192 // movzbl %r8b,%r8d
- .byte 76,141,13,68,0,0,0 // lea 0x44(%rip),%r9 # 3378 <_sk_store_565_avx+0xe8>
+ .byte 76,141,13,68,0,0,0 // lea 0x44(%rip),%r9 # 3374 <_sk_store_565_avx+0xe8>
.byte 75,99,4,129 // movslq (%r9,%r8,4),%rax
.byte 76,1,200 // add %r9,%rax
.byte 255,224 // jmpq *%rax
@@ -15287,7 +15283,7 @@ _sk_store_565_avx:
.byte 196,67,121,21,68,122,4,2 // vpextrw $0x2,%xmm8,0x4(%r10,%rdi,2)
.byte 196,67,121,21,68,122,2,1 // vpextrw $0x1,%xmm8,0x2(%r10,%rdi,2)
.byte 196,67,121,21,4,122,0 // vpextrw $0x0,%xmm8,(%r10,%rdi,2)
- .byte 235,159 // jmp 3315 <_sk_store_565_avx+0x85>
+ .byte 235,159 // jmp 3311 <_sk_store_565_avx+0x85>
.byte 102,144 // xchg %ax,%ax
.byte 245 // cmc
.byte 255 // (bad)
@@ -15320,31 +15316,31 @@ _sk_load_4444_avx:
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 76,139,16 // mov (%rax),%r10
.byte 72,133,201 // test %rcx,%rcx
- .byte 15,133,152,0,0,0 // jne 343a <_sk_load_4444_avx+0xa6>
+ .byte 15,133,152,0,0,0 // jne 3436 <_sk_load_4444_avx+0xa6>
.byte 196,193,122,111,4,122 // vmovdqu (%r10,%rdi,2),%xmm0
.byte 197,241,239,201 // vpxor %xmm1,%xmm1,%xmm1
.byte 197,249,105,201 // vpunpckhwd %xmm1,%xmm0,%xmm1
.byte 196,226,121,51,192 // vpmovzxwd %xmm0,%xmm0
.byte 196,227,125,24,217,1 // vinsertf128 $0x1,%xmm1,%ymm0,%ymm3
- .byte 196,226,125,24,5,68,36,0,0 // vbroadcastss 0x2444(%rip),%ymm0 # 5808 <_sk_callback_avx+0x395>
+ .byte 196,226,125,24,5,68,36,0,0 // vbroadcastss 0x2444(%rip),%ymm0 # 5804 <_sk_callback_avx+0x395>
.byte 197,228,84,192 // vandps %ymm0,%ymm3,%ymm0
.byte 197,252,91,192 // vcvtdq2ps %ymm0,%ymm0
- .byte 196,226,125,24,13,55,36,0,0 // vbroadcastss 0x2437(%rip),%ymm1 # 580c <_sk_callback_avx+0x399>
+ .byte 196,226,125,24,13,55,36,0,0 // vbroadcastss 0x2437(%rip),%ymm1 # 5808 <_sk_callback_avx+0x399>
.byte 197,252,89,193 // vmulps %ymm1,%ymm0,%ymm0
- .byte 196,226,125,24,13,46,36,0,0 // vbroadcastss 0x242e(%rip),%ymm1 # 5810 <_sk_callback_avx+0x39d>
+ .byte 196,226,125,24,13,46,36,0,0 // vbroadcastss 0x242e(%rip),%ymm1 # 580c <_sk_callback_avx+0x39d>
.byte 197,228,84,201 // vandps %ymm1,%ymm3,%ymm1
.byte 197,252,91,201 // vcvtdq2ps %ymm1,%ymm1
- .byte 196,226,125,24,21,33,36,0,0 // vbroadcastss 0x2421(%rip),%ymm2 # 5814 <_sk_callback_avx+0x3a1>
+ .byte 196,226,125,24,21,33,36,0,0 // vbroadcastss 0x2421(%rip),%ymm2 # 5810 <_sk_callback_avx+0x3a1>
.byte 197,244,89,202 // vmulps %ymm2,%ymm1,%ymm1
- .byte 196,226,125,24,21,24,36,0,0 // vbroadcastss 0x2418(%rip),%ymm2 # 5818 <_sk_callback_avx+0x3a5>
+ .byte 196,226,125,24,21,24,36,0,0 // vbroadcastss 0x2418(%rip),%ymm2 # 5814 <_sk_callback_avx+0x3a5>
.byte 197,228,84,210 // vandps %ymm2,%ymm3,%ymm2
.byte 197,252,91,210 // vcvtdq2ps %ymm2,%ymm2
- .byte 196,98,125,24,5,11,36,0,0 // vbroadcastss 0x240b(%rip),%ymm8 # 581c <_sk_callback_avx+0x3a9>
+ .byte 196,98,125,24,5,11,36,0,0 // vbroadcastss 0x240b(%rip),%ymm8 # 5818 <_sk_callback_avx+0x3a9>
.byte 196,193,108,89,208 // vmulps %ymm8,%ymm2,%ymm2
- .byte 196,98,125,24,5,1,36,0,0 // vbroadcastss 0x2401(%rip),%ymm8 # 5820 <_sk_callback_avx+0x3ad>
+ .byte 196,98,125,24,5,1,36,0,0 // vbroadcastss 0x2401(%rip),%ymm8 # 581c <_sk_callback_avx+0x3ad>
.byte 196,193,100,84,216 // vandps %ymm8,%ymm3,%ymm3
.byte 197,252,91,219 // vcvtdq2ps %ymm3,%ymm3
- .byte 196,98,125,24,5,243,35,0,0 // vbroadcastss 0x23f3(%rip),%ymm8 # 5824 <_sk_callback_avx+0x3b1>
+ .byte 196,98,125,24,5,243,35,0,0 // vbroadcastss 0x23f3(%rip),%ymm8 # 5820 <_sk_callback_avx+0x3b1>
.byte 196,193,100,89,216 // vmulps %ymm8,%ymm3,%ymm3
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 255,224 // jmpq *%rax
@@ -15353,9 +15349,9 @@ _sk_load_4444_avx:
.byte 197,249,239,192 // vpxor %xmm0,%xmm0,%xmm0
.byte 65,254,200 // dec %r8b
.byte 65,128,248,6 // cmp $0x6,%r8b
- .byte 15,135,86,255,255,255 // ja 33a8 <_sk_load_4444_avx+0x14>
+ .byte 15,135,86,255,255,255 // ja 33a4 <_sk_load_4444_avx+0x14>
.byte 69,15,182,192 // movzbl %r8b,%r8d
- .byte 76,141,13,75,0,0,0 // lea 0x4b(%rip),%r9 # 34a8 <_sk_load_4444_avx+0x114>
+ .byte 76,141,13,75,0,0,0 // lea 0x4b(%rip),%r9 # 34a4 <_sk_load_4444_avx+0x114>
.byte 75,99,4,129 // movslq (%r9,%r8,4),%rax
.byte 76,1,200 // add %r9,%rax
.byte 255,224 // jmpq *%rax
@@ -15367,7 +15363,7 @@ _sk_load_4444_avx:
.byte 196,193,121,196,68,122,4,2 // vpinsrw $0x2,0x4(%r10,%rdi,2),%xmm0,%xmm0
.byte 196,193,121,196,68,122,2,1 // vpinsrw $0x1,0x2(%r10,%rdi,2),%xmm0,%xmm0
.byte 196,193,121,196,4,122,0 // vpinsrw $0x0,(%r10,%rdi,2),%xmm0,%xmm0
- .byte 233,2,255,255,255 // jmpq 33a8 <_sk_load_4444_avx+0x14>
+ .byte 233,2,255,255,255 // jmpq 33a4 <_sk_load_4444_avx+0x14>
.byte 102,144 // xchg %ax,%ax
.byte 242,255 // repnz (bad)
.byte 255 // (bad)
@@ -15446,25 +15442,25 @@ _sk_gather_4444_avx:
.byte 197,249,105,201 // vpunpckhwd %xmm1,%xmm0,%xmm1
.byte 196,226,121,51,192 // vpmovzxwd %xmm0,%xmm0
.byte 196,227,125,24,217,1 // vinsertf128 $0x1,%xmm1,%ymm0,%ymm3
- .byte 196,226,125,24,5,138,34,0,0 // vbroadcastss 0x228a(%rip),%ymm0 # 5828 <_sk_callback_avx+0x3b5>
+ .byte 196,226,125,24,5,138,34,0,0 // vbroadcastss 0x228a(%rip),%ymm0 # 5824 <_sk_callback_avx+0x3b5>
.byte 197,228,84,192 // vandps %ymm0,%ymm3,%ymm0
.byte 197,252,91,192 // vcvtdq2ps %ymm0,%ymm0
- .byte 196,226,125,24,13,125,34,0,0 // vbroadcastss 0x227d(%rip),%ymm1 # 582c <_sk_callback_avx+0x3b9>
+ .byte 196,226,125,24,13,125,34,0,0 // vbroadcastss 0x227d(%rip),%ymm1 # 5828 <_sk_callback_avx+0x3b9>
.byte 197,252,89,193 // vmulps %ymm1,%ymm0,%ymm0
- .byte 196,226,125,24,13,116,34,0,0 // vbroadcastss 0x2274(%rip),%ymm1 # 5830 <_sk_callback_avx+0x3bd>
+ .byte 196,226,125,24,13,116,34,0,0 // vbroadcastss 0x2274(%rip),%ymm1 # 582c <_sk_callback_avx+0x3bd>
.byte 197,228,84,201 // vandps %ymm1,%ymm3,%ymm1
.byte 197,252,91,201 // vcvtdq2ps %ymm1,%ymm1
- .byte 196,226,125,24,21,103,34,0,0 // vbroadcastss 0x2267(%rip),%ymm2 # 5834 <_sk_callback_avx+0x3c1>
+ .byte 196,226,125,24,21,103,34,0,0 // vbroadcastss 0x2267(%rip),%ymm2 # 5830 <_sk_callback_avx+0x3c1>
.byte 197,244,89,202 // vmulps %ymm2,%ymm1,%ymm1
- .byte 196,226,125,24,21,94,34,0,0 // vbroadcastss 0x225e(%rip),%ymm2 # 5838 <_sk_callback_avx+0x3c5>
+ .byte 196,226,125,24,21,94,34,0,0 // vbroadcastss 0x225e(%rip),%ymm2 # 5834 <_sk_callback_avx+0x3c5>
.byte 197,228,84,210 // vandps %ymm2,%ymm3,%ymm2
.byte 197,252,91,210 // vcvtdq2ps %ymm2,%ymm2
- .byte 196,98,125,24,5,81,34,0,0 // vbroadcastss 0x2251(%rip),%ymm8 # 583c <_sk_callback_avx+0x3c9>
+ .byte 196,98,125,24,5,81,34,0,0 // vbroadcastss 0x2251(%rip),%ymm8 # 5838 <_sk_callback_avx+0x3c9>
.byte 196,193,108,89,208 // vmulps %ymm8,%ymm2,%ymm2
- .byte 196,98,125,24,5,71,34,0,0 // vbroadcastss 0x2247(%rip),%ymm8 # 5840 <_sk_callback_avx+0x3cd>
+ .byte 196,98,125,24,5,71,34,0,0 // vbroadcastss 0x2247(%rip),%ymm8 # 583c <_sk_callback_avx+0x3cd>
.byte 196,193,100,84,216 // vandps %ymm8,%ymm3,%ymm3
.byte 197,252,91,219 // vcvtdq2ps %ymm3,%ymm3
- .byte 196,98,125,24,5,57,34,0,0 // vbroadcastss 0x2239(%rip),%ymm8 # 5844 <_sk_callback_avx+0x3d1>
+ .byte 196,98,125,24,5,57,34,0,0 // vbroadcastss 0x2239(%rip),%ymm8 # 5840 <_sk_callback_avx+0x3d1>
.byte 196,193,100,89,216 // vmulps %ymm8,%ymm3,%ymm3
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 91 // pop %rbx
@@ -15480,7 +15476,7 @@ FUNCTION(_sk_store_4444_avx)
_sk_store_4444_avx:
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 76,139,16 // mov (%rax),%r10
- .byte 196,98,125,24,5,30,34,0,0 // vbroadcastss 0x221e(%rip),%ymm8 # 5848 <_sk_callback_avx+0x3d5>
+ .byte 196,98,125,24,5,30,34,0,0 // vbroadcastss 0x221e(%rip),%ymm8 # 5844 <_sk_callback_avx+0x3d5>
.byte 196,65,124,89,200 // vmulps %ymm8,%ymm0,%ymm9
.byte 196,65,125,91,201 // vcvtps2dq %ymm9,%ymm9
.byte 196,193,41,114,241,12 // vpslld $0xc,%xmm9,%xmm10
@@ -15507,7 +15503,7 @@ _sk_store_4444_avx:
.byte 196,67,125,25,193,1 // vextractf128 $0x1,%ymm8,%xmm9
.byte 196,66,57,43,193 // vpackusdw %xmm9,%xmm8,%xmm8
.byte 72,133,201 // test %rcx,%rcx
- .byte 117,10 // jne 36c3 <_sk_store_4444_avx+0xa7>
+ .byte 117,10 // jne 36bf <_sk_store_4444_avx+0xa7>
.byte 196,65,122,127,4,122 // vmovdqu %xmm8,(%r10,%rdi,2)
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 255,224 // jmpq *%rax
@@ -15515,9 +15511,9 @@ _sk_store_4444_avx:
.byte 65,128,224,7 // and $0x7,%r8b
.byte 65,254,200 // dec %r8b
.byte 65,128,248,6 // cmp $0x6,%r8b
- .byte 119,236 // ja 36bf <_sk_store_4444_avx+0xa3>
+ .byte 119,236 // ja 36bb <_sk_store_4444_avx+0xa3>
.byte 69,15,182,192 // movzbl %r8b,%r8d
- .byte 76,141,13,66,0,0,0 // lea 0x42(%rip),%r9 # 3720 <_sk_store_4444_avx+0x104>
+ .byte 76,141,13,66,0,0,0 // lea 0x42(%rip),%r9 # 371c <_sk_store_4444_avx+0x104>
.byte 75,99,4,129 // movslq (%r9,%r8,4),%rax
.byte 76,1,200 // add %r9,%rax
.byte 255,224 // jmpq *%rax
@@ -15528,7 +15524,7 @@ _sk_store_4444_avx:
.byte 196,67,121,21,68,122,4,2 // vpextrw $0x2,%xmm8,0x4(%r10,%rdi,2)
.byte 196,67,121,21,68,122,2,1 // vpextrw $0x1,%xmm8,0x2(%r10,%rdi,2)
.byte 196,67,121,21,4,122,0 // vpextrw $0x0,%xmm8,(%r10,%rdi,2)
- .byte 235,159 // jmp 36bf <_sk_store_4444_avx+0xa3>
+ .byte 235,159 // jmp 36bb <_sk_store_4444_avx+0xa3>
.byte 247,255 // idiv %edi
.byte 255 // (bad)
.byte 255 // (bad)
@@ -15559,12 +15555,12 @@ _sk_load_8888_avx:
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 76,139,16 // mov (%rax),%r10
.byte 72,133,201 // test %rcx,%rcx
- .byte 15,133,135,0,0,0 // jne 37d1 <_sk_load_8888_avx+0x95>
+ .byte 15,133,135,0,0,0 // jne 37cd <_sk_load_8888_avx+0x95>
.byte 196,65,124,16,12,186 // vmovups (%r10,%rdi,4),%ymm9
- .byte 197,124,40,21,72,34,0,0 // vmovaps 0x2248(%rip),%ymm10 # 59a0 <_sk_callback_avx+0x52d>
+ .byte 197,124,40,21,76,34,0,0 // vmovaps 0x224c(%rip),%ymm10 # 59a0 <_sk_callback_avx+0x531>
.byte 196,193,52,84,194 // vandps %ymm10,%ymm9,%ymm0
.byte 197,252,91,192 // vcvtdq2ps %ymm0,%ymm0
- .byte 196,98,125,24,5,226,32,0,0 // vbroadcastss 0x20e2(%rip),%ymm8 # 584c <_sk_callback_avx+0x3d9>
+ .byte 196,98,125,24,5,226,32,0,0 // vbroadcastss 0x20e2(%rip),%ymm8 # 5848 <_sk_callback_avx+0x3d9>
.byte 196,193,124,89,192 // vmulps %ymm8,%ymm0,%ymm0
.byte 196,193,113,114,209,8 // vpsrld $0x8,%xmm9,%xmm1
.byte 196,99,125,25,203,1 // vextractf128 $0x1,%ymm9,%xmm3
@@ -15591,9 +15587,9 @@ _sk_load_8888_avx:
.byte 196,65,52,87,201 // vxorps %ymm9,%ymm9,%ymm9
.byte 65,254,200 // dec %r8b
.byte 65,128,248,6 // cmp $0x6,%r8b
- .byte 15,135,102,255,255,255 // ja 3750 <_sk_load_8888_avx+0x14>
+ .byte 15,135,102,255,255,255 // ja 374c <_sk_load_8888_avx+0x14>
.byte 69,15,182,192 // movzbl %r8b,%r8d
- .byte 76,141,13,139,0,0,0 // lea 0x8b(%rip),%r9 # 3880 <_sk_load_8888_avx+0x144>
+ .byte 76,141,13,139,0,0,0 // lea 0x8b(%rip),%r9 # 387c <_sk_load_8888_avx+0x144>
.byte 75,99,4,129 // movslq (%r9,%r8,4),%rax
.byte 76,1,200 // add %r9,%rax
.byte 255,224 // jmpq *%rax
@@ -15616,7 +15612,7 @@ _sk_load_8888_avx:
.byte 196,99,53,12,200,15 // vblendps $0xf,%ymm0,%ymm9,%ymm9
.byte 196,195,49,34,4,186,0 // vpinsrd $0x0,(%r10,%rdi,4),%xmm9,%xmm0
.byte 196,99,53,12,200,15 // vblendps $0xf,%ymm0,%ymm9,%ymm9
- .byte 233,210,254,255,255 // jmpq 3750 <_sk_load_8888_avx+0x14>
+ .byte 233,210,254,255,255 // jmpq 374c <_sk_load_8888_avx+0x14>
.byte 102,144 // xchg %ax,%ax
.byte 236 // in (%dx),%al
.byte 255 // (bad)
@@ -15634,7 +15630,7 @@ _sk_load_8888_avx:
.byte 255 // (bad)
.byte 255 // (bad)
.byte 255 // (bad)
- .byte 126,255 // jle 3899 <_sk_load_8888_avx+0x15d>
+ .byte 126,255 // jle 3895 <_sk_load_8888_avx+0x15d>
.byte 255 // (bad)
.byte 255 // .byte 0xff
@@ -15679,10 +15675,10 @@ _sk_gather_8888_avx:
.byte 196,131,121,34,4,152,2 // vpinsrd $0x2,(%r8,%r11,4),%xmm0,%xmm0
.byte 196,131,121,34,28,144,3 // vpinsrd $0x3,(%r8,%r10,4),%xmm0,%xmm3
.byte 196,227,61,24,195,1 // vinsertf128 $0x1,%xmm3,%ymm8,%ymm0
- .byte 197,124,40,21,114,32,0,0 // vmovaps 0x2072(%rip),%ymm10 # 59c0 <_sk_callback_avx+0x54d>
+ .byte 197,124,40,21,118,32,0,0 // vmovaps 0x2076(%rip),%ymm10 # 59c0 <_sk_callback_avx+0x551>
.byte 196,193,124,84,194 // vandps %ymm10,%ymm0,%ymm0
.byte 197,252,91,192 // vcvtdq2ps %ymm0,%ymm0
- .byte 196,98,125,24,13,240,30,0,0 // vbroadcastss 0x1ef0(%rip),%ymm9 # 5850 <_sk_callback_avx+0x3dd>
+ .byte 196,98,125,24,13,240,30,0,0 // vbroadcastss 0x1ef0(%rip),%ymm9 # 584c <_sk_callback_avx+0x3dd>
.byte 196,193,124,89,193 // vmulps %ymm9,%ymm0,%ymm0
.byte 196,193,113,114,208,8 // vpsrld $0x8,%xmm8,%xmm1
.byte 197,233,114,211,8 // vpsrld $0x8,%xmm3,%xmm2
@@ -15714,7 +15710,7 @@ FUNCTION(_sk_store_8888_avx)
_sk_store_8888_avx:
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 76,139,16 // mov (%rax),%r10
- .byte 196,98,125,24,5,126,30,0,0 // vbroadcastss 0x1e7e(%rip),%ymm8 # 5854 <_sk_callback_avx+0x3e1>
+ .byte 196,98,125,24,5,126,30,0,0 // vbroadcastss 0x1e7e(%rip),%ymm8 # 5850 <_sk_callback_avx+0x3e1>
.byte 196,65,124,89,200 // vmulps %ymm8,%ymm0,%ymm9
.byte 196,65,125,91,201 // vcvtps2dq %ymm9,%ymm9
.byte 196,65,116,89,208 // vmulps %ymm8,%ymm1,%ymm10
@@ -15739,7 +15735,7 @@ _sk_store_8888_avx:
.byte 196,65,45,86,192 // vorpd %ymm8,%ymm10,%ymm8
.byte 196,65,53,86,192 // vorpd %ymm8,%ymm9,%ymm8
.byte 72,133,201 // test %rcx,%rcx
- .byte 117,10 // jne 3a64 <_sk_store_8888_avx+0x9c>
+ .byte 117,10 // jne 3a60 <_sk_store_8888_avx+0x9c>
.byte 196,65,124,17,4,186 // vmovups %ymm8,(%r10,%rdi,4)
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 255,224 // jmpq *%rax
@@ -15747,9 +15743,9 @@ _sk_store_8888_avx:
.byte 65,128,224,7 // and $0x7,%r8b
.byte 65,254,200 // dec %r8b
.byte 65,128,248,6 // cmp $0x6,%r8b
- .byte 119,236 // ja 3a60 <_sk_store_8888_avx+0x98>
+ .byte 119,236 // ja 3a5c <_sk_store_8888_avx+0x98>
.byte 69,15,182,192 // movzbl %r8b,%r8d
- .byte 76,141,13,85,0,0,0 // lea 0x55(%rip),%r9 # 3ad4 <_sk_store_8888_avx+0x10c>
+ .byte 76,141,13,85,0,0,0 // lea 0x55(%rip),%r9 # 3ad0 <_sk_store_8888_avx+0x10c>
.byte 75,99,4,129 // movslq (%r9,%r8,4),%rax
.byte 76,1,200 // add %r9,%rax
.byte 255,224 // jmpq *%rax
@@ -15763,7 +15759,7 @@ _sk_store_8888_avx:
.byte 196,67,121,22,68,186,8,2 // vpextrd $0x2,%xmm8,0x8(%r10,%rdi,4)
.byte 196,67,121,22,68,186,4,1 // vpextrd $0x1,%xmm8,0x4(%r10,%rdi,4)
.byte 196,65,121,126,4,186 // vmovd %xmm8,(%r10,%rdi,4)
- .byte 235,143 // jmp 3a60 <_sk_store_8888_avx+0x98>
+ .byte 235,143 // jmp 3a5c <_sk_store_8888_avx+0x98>
.byte 15,31,0 // nopl (%rax)
.byte 245 // cmc
.byte 255 // (bad)
@@ -15801,7 +15797,7 @@ _sk_load_f16_avx:
.byte 197,252,17,116,36,192 // vmovups %ymm6,-0x40(%rsp)
.byte 197,252,17,108,36,160 // vmovups %ymm5,-0x60(%rsp)
.byte 197,254,127,100,36,128 // vmovdqu %ymm4,-0x80(%rsp)
- .byte 15,133,141,2,0,0 // jne 3da7 <_sk_load_f16_avx+0x2b7>
+ .byte 15,133,141,2,0,0 // jne 3da3 <_sk_load_f16_avx+0x2b7>
.byte 197,121,16,4,248 // vmovupd (%rax,%rdi,8),%xmm8
.byte 197,249,16,84,248,16 // vmovupd 0x10(%rax,%rdi,8),%xmm2
.byte 197,249,16,76,248,32 // vmovupd 0x20(%rax,%rdi,8),%xmm1
@@ -15819,13 +15815,13 @@ _sk_load_f16_avx:
.byte 197,249,105,201 // vpunpckhwd %xmm1,%xmm0,%xmm1
.byte 196,226,121,51,192 // vpmovzxwd %xmm0,%xmm0
.byte 196,227,125,24,193,1 // vinsertf128 $0x1,%xmm1,%ymm0,%ymm0
- .byte 196,98,125,24,37,229,28,0,0 // vbroadcastss 0x1ce5(%rip),%ymm12 # 5858 <_sk_callback_avx+0x3e5>
+ .byte 196,98,125,24,37,229,28,0,0 // vbroadcastss 0x1ce5(%rip),%ymm12 # 5854 <_sk_callback_avx+0x3e5>
.byte 196,193,124,84,204 // vandps %ymm12,%ymm0,%ymm1
.byte 197,252,87,193 // vxorps %ymm1,%ymm0,%ymm0
.byte 196,195,125,25,198,1 // vextractf128 $0x1,%ymm0,%xmm14
- .byte 196,98,121,24,29,209,28,0,0 // vbroadcastss 0x1cd1(%rip),%xmm11 # 585c <_sk_callback_avx+0x3e9>
+ .byte 196,98,121,24,29,209,28,0,0 // vbroadcastss 0x1cd1(%rip),%xmm11 # 5858 <_sk_callback_avx+0x3e9>
.byte 196,193,8,87,219 // vxorps %xmm11,%xmm14,%xmm3
- .byte 196,98,121,24,45,199,28,0,0 // vbroadcastss 0x1cc7(%rip),%xmm13 # 5860 <_sk_callback_avx+0x3ed>
+ .byte 196,98,121,24,45,199,28,0,0 // vbroadcastss 0x1cc7(%rip),%xmm13 # 585c <_sk_callback_avx+0x3ed>
.byte 197,145,102,219 // vpcmpgtd %xmm3,%xmm13,%xmm3
.byte 196,65,120,87,211 // vxorps %xmm11,%xmm0,%xmm10
.byte 196,65,17,102,210 // vpcmpgtd %xmm10,%xmm13,%xmm10
@@ -15839,7 +15835,7 @@ _sk_load_f16_avx:
.byte 196,227,125,24,195,1 // vinsertf128 $0x1,%xmm3,%ymm0,%ymm0
.byte 197,252,86,193 // vorps %ymm1,%ymm0,%ymm0
.byte 196,227,125,25,193,1 // vextractf128 $0x1,%ymm0,%xmm1
- .byte 196,226,121,24,29,125,28,0,0 // vbroadcastss 0x1c7d(%rip),%xmm3 # 5864 <_sk_callback_avx+0x3f1>
+ .byte 196,226,121,24,29,125,28,0,0 // vbroadcastss 0x1c7d(%rip),%xmm3 # 5860 <_sk_callback_avx+0x3f1>
.byte 197,241,254,203 // vpaddd %xmm3,%xmm1,%xmm1
.byte 197,249,254,195 // vpaddd %xmm3,%xmm0,%xmm0
.byte 196,227,125,24,193,1 // vinsertf128 $0x1,%xmm1,%ymm0,%ymm0
@@ -15932,29 +15928,29 @@ _sk_load_f16_avx:
.byte 197,123,16,4,248 // vmovsd (%rax,%rdi,8),%xmm8
.byte 196,65,49,239,201 // vpxor %xmm9,%xmm9,%xmm9
.byte 72,131,249,1 // cmp $0x1,%rcx
- .byte 116,79 // je 3e06 <_sk_load_f16_avx+0x316>
+ .byte 116,79 // je 3e02 <_sk_load_f16_avx+0x316>
.byte 197,57,22,68,248,8 // vmovhpd 0x8(%rax,%rdi,8),%xmm8,%xmm8
.byte 72,131,249,3 // cmp $0x3,%rcx
- .byte 114,67 // jb 3e06 <_sk_load_f16_avx+0x316>
+ .byte 114,67 // jb 3e02 <_sk_load_f16_avx+0x316>
.byte 197,251,16,84,248,16 // vmovsd 0x10(%rax,%rdi,8),%xmm2
.byte 72,131,249,3 // cmp $0x3,%rcx
- .byte 116,68 // je 3e13 <_sk_load_f16_avx+0x323>
+ .byte 116,68 // je 3e0f <_sk_load_f16_avx+0x323>
.byte 197,233,22,84,248,24 // vmovhpd 0x18(%rax,%rdi,8),%xmm2,%xmm2
.byte 72,131,249,5 // cmp $0x5,%rcx
- .byte 114,56 // jb 3e13 <_sk_load_f16_avx+0x323>
+ .byte 114,56 // jb 3e0f <_sk_load_f16_avx+0x323>
.byte 197,251,16,76,248,32 // vmovsd 0x20(%rax,%rdi,8),%xmm1
.byte 72,131,249,5 // cmp $0x5,%rcx
- .byte 15,132,70,253,255,255 // je 3b31 <_sk_load_f16_avx+0x41>
+ .byte 15,132,70,253,255,255 // je 3b2d <_sk_load_f16_avx+0x41>
.byte 197,241,22,76,248,40 // vmovhpd 0x28(%rax,%rdi,8),%xmm1,%xmm1
.byte 72,131,249,7 // cmp $0x7,%rcx
- .byte 15,130,54,253,255,255 // jb 3b31 <_sk_load_f16_avx+0x41>
+ .byte 15,130,54,253,255,255 // jb 3b2d <_sk_load_f16_avx+0x41>
.byte 197,122,126,76,248,48 // vmovq 0x30(%rax,%rdi,8),%xmm9
- .byte 233,43,253,255,255 // jmpq 3b31 <_sk_load_f16_avx+0x41>
+ .byte 233,43,253,255,255 // jmpq 3b2d <_sk_load_f16_avx+0x41>
.byte 197,241,87,201 // vxorpd %xmm1,%xmm1,%xmm1
.byte 197,233,87,210 // vxorpd %xmm2,%xmm2,%xmm2
- .byte 233,30,253,255,255 // jmpq 3b31 <_sk_load_f16_avx+0x41>
+ .byte 233,30,253,255,255 // jmpq 3b2d <_sk_load_f16_avx+0x41>
.byte 197,241,87,201 // vxorpd %xmm1,%xmm1,%xmm1
- .byte 233,21,253,255,255 // jmpq 3b31 <_sk_load_f16_avx+0x41>
+ .byte 233,21,253,255,255 // jmpq 3b2d <_sk_load_f16_avx+0x41>
HIDDEN _sk_gather_f16_avx
.globl _sk_gather_f16_avx
@@ -16018,13 +16014,13 @@ _sk_gather_f16_avx:
.byte 197,249,105,210 // vpunpckhwd %xmm2,%xmm0,%xmm2
.byte 196,226,121,51,192 // vpmovzxwd %xmm0,%xmm0
.byte 196,227,125,24,194,1 // vinsertf128 $0x1,%xmm2,%ymm0,%ymm0
- .byte 196,98,125,24,37,65,25,0,0 // vbroadcastss 0x1941(%rip),%ymm12 # 5868 <_sk_callback_avx+0x3f5>
+ .byte 196,98,125,24,37,65,25,0,0 // vbroadcastss 0x1941(%rip),%ymm12 # 5864 <_sk_callback_avx+0x3f5>
.byte 196,193,124,84,212 // vandps %ymm12,%ymm0,%ymm2
.byte 197,252,87,194 // vxorps %ymm2,%ymm0,%ymm0
.byte 196,195,125,25,198,1 // vextractf128 $0x1,%ymm0,%xmm14
- .byte 196,98,121,24,29,45,25,0,0 // vbroadcastss 0x192d(%rip),%xmm11 # 586c <_sk_callback_avx+0x3f9>
+ .byte 196,98,121,24,29,45,25,0,0 // vbroadcastss 0x192d(%rip),%xmm11 # 5868 <_sk_callback_avx+0x3f9>
.byte 196,193,8,87,219 // vxorps %xmm11,%xmm14,%xmm3
- .byte 196,98,121,24,45,35,25,0,0 // vbroadcastss 0x1923(%rip),%xmm13 # 5870 <_sk_callback_avx+0x3fd>
+ .byte 196,98,121,24,45,35,25,0,0 // vbroadcastss 0x1923(%rip),%xmm13 # 586c <_sk_callback_avx+0x3fd>
.byte 197,145,102,219 // vpcmpgtd %xmm3,%xmm13,%xmm3
.byte 196,65,120,87,211 // vxorps %xmm11,%xmm0,%xmm10
.byte 196,65,17,102,210 // vpcmpgtd %xmm10,%xmm13,%xmm10
@@ -16038,7 +16034,7 @@ _sk_gather_f16_avx:
.byte 196,227,125,24,195,1 // vinsertf128 $0x1,%xmm3,%ymm0,%ymm0
.byte 197,252,86,194 // vorps %ymm2,%ymm0,%ymm0
.byte 196,227,125,25,194,1 // vextractf128 $0x1,%ymm0,%xmm2
- .byte 196,226,121,24,29,217,24,0,0 // vbroadcastss 0x18d9(%rip),%xmm3 # 5874 <_sk_callback_avx+0x401>
+ .byte 196,226,121,24,29,217,24,0,0 // vbroadcastss 0x18d9(%rip),%xmm3 # 5870 <_sk_callback_avx+0x401>
.byte 197,233,254,211 // vpaddd %xmm3,%xmm2,%xmm2
.byte 197,249,254,195 // vpaddd %xmm3,%xmm0,%xmm0
.byte 196,227,125,24,194,1 // vinsertf128 $0x1,%xmm2,%ymm0,%ymm0
@@ -16142,12 +16138,12 @@ _sk_store_f16_avx:
.byte 197,252,17,52,36 // vmovups %ymm6,(%rsp)
.byte 197,252,17,108,36,224 // vmovups %ymm5,-0x20(%rsp)
.byte 197,252,17,100,36,192 // vmovups %ymm4,-0x40(%rsp)
- .byte 196,98,125,24,13,242,22,0,0 // vbroadcastss 0x16f2(%rip),%ymm9 # 5878 <_sk_callback_avx+0x405>
+ .byte 196,98,125,24,13,242,22,0,0 // vbroadcastss 0x16f2(%rip),%ymm9 # 5874 <_sk_callback_avx+0x405>
.byte 196,65,124,84,209 // vandps %ymm9,%ymm0,%ymm10
.byte 197,252,17,68,36,128 // vmovups %ymm0,-0x80(%rsp)
.byte 196,65,124,87,218 // vxorps %ymm10,%ymm0,%ymm11
.byte 196,67,125,25,220,1 // vextractf128 $0x1,%ymm11,%xmm12
- .byte 196,98,121,24,5,215,22,0,0 // vbroadcastss 0x16d7(%rip),%xmm8 # 587c <_sk_callback_avx+0x409>
+ .byte 196,98,121,24,5,215,22,0,0 // vbroadcastss 0x16d7(%rip),%xmm8 # 5878 <_sk_callback_avx+0x409>
.byte 196,65,57,102,236 // vpcmpgtd %xmm12,%xmm8,%xmm13
.byte 196,65,57,102,243 // vpcmpgtd %xmm11,%xmm8,%xmm14
.byte 196,67,13,24,237,1 // vinsertf128 $0x1,%xmm13,%ymm14,%ymm13
@@ -16157,7 +16153,7 @@ _sk_store_f16_avx:
.byte 196,67,13,24,242,1 // vinsertf128 $0x1,%xmm10,%ymm14,%ymm14
.byte 196,193,33,114,211,13 // vpsrld $0xd,%xmm11,%xmm11
.byte 196,193,25,114,212,13 // vpsrld $0xd,%xmm12,%xmm12
- .byte 196,98,125,24,21,158,22,0,0 // vbroadcastss 0x169e(%rip),%ymm10 # 5880 <_sk_callback_avx+0x40d>
+ .byte 196,98,125,24,21,158,22,0,0 // vbroadcastss 0x169e(%rip),%ymm10 # 587c <_sk_callback_avx+0x40d>
.byte 196,65,12,86,242 // vorps %ymm10,%ymm14,%ymm14
.byte 196,67,125,25,247,1 // vextractf128 $0x1,%ymm14,%xmm15
.byte 196,65,1,254,228 // vpaddd %xmm12,%xmm15,%xmm12
@@ -16239,7 +16235,7 @@ _sk_store_f16_avx:
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 72,139,0 // mov (%rax),%rax
.byte 72,133,201 // test %rcx,%rcx
- .byte 117,66 // jne 43c0 <_sk_store_f16_avx+0x25e>
+ .byte 117,66 // jne 43bc <_sk_store_f16_avx+0x25e>
.byte 197,120,17,28,248 // vmovups %xmm11,(%rax,%rdi,8)
.byte 197,120,17,84,248,16 // vmovups %xmm10,0x10(%rax,%rdi,8)
.byte 197,120,17,76,248,32 // vmovups %xmm9,0x20(%rax,%rdi,8)
@@ -16255,22 +16251,22 @@ _sk_store_f16_avx:
.byte 255,224 // jmpq *%rax
.byte 197,121,214,28,248 // vmovq %xmm11,(%rax,%rdi,8)
.byte 72,131,249,1 // cmp $0x1,%rcx
- .byte 116,202 // je 4395 <_sk_store_f16_avx+0x233>
+ .byte 116,202 // je 4391 <_sk_store_f16_avx+0x233>
.byte 197,121,23,92,248,8 // vmovhpd %xmm11,0x8(%rax,%rdi,8)
.byte 72,131,249,3 // cmp $0x3,%rcx
- .byte 114,190 // jb 4395 <_sk_store_f16_avx+0x233>
+ .byte 114,190 // jb 4391 <_sk_store_f16_avx+0x233>
.byte 197,121,214,84,248,16 // vmovq %xmm10,0x10(%rax,%rdi,8)
- .byte 116,182 // je 4395 <_sk_store_f16_avx+0x233>
+ .byte 116,182 // je 4391 <_sk_store_f16_avx+0x233>
.byte 197,121,23,84,248,24 // vmovhpd %xmm10,0x18(%rax,%rdi,8)
.byte 72,131,249,5 // cmp $0x5,%rcx
- .byte 114,170 // jb 4395 <_sk_store_f16_avx+0x233>
+ .byte 114,170 // jb 4391 <_sk_store_f16_avx+0x233>
.byte 197,121,214,76,248,32 // vmovq %xmm9,0x20(%rax,%rdi,8)
- .byte 116,162 // je 4395 <_sk_store_f16_avx+0x233>
+ .byte 116,162 // je 4391 <_sk_store_f16_avx+0x233>
.byte 197,121,23,76,248,40 // vmovhpd %xmm9,0x28(%rax,%rdi,8)
.byte 72,131,249,7 // cmp $0x7,%rcx
- .byte 114,150 // jb 4395 <_sk_store_f16_avx+0x233>
+ .byte 114,150 // jb 4391 <_sk_store_f16_avx+0x233>
.byte 197,121,214,68,248,48 // vmovq %xmm8,0x30(%rax,%rdi,8)
- .byte 235,142 // jmp 4395 <_sk_store_f16_avx+0x233>
+ .byte 235,142 // jmp 4391 <_sk_store_f16_avx+0x233>
HIDDEN _sk_load_u16_be_avx
.globl _sk_load_u16_be_avx
@@ -16280,7 +16276,7 @@ _sk_load_u16_be_avx:
.byte 76,139,0 // mov (%rax),%r8
.byte 72,141,4,189,0,0,0,0 // lea 0x0(,%rdi,4),%rax
.byte 72,133,201 // test %rcx,%rcx
- .byte 15,133,253,0,0,0 // jne 451a <_sk_load_u16_be_avx+0x113>
+ .byte 15,133,253,0,0,0 // jne 4516 <_sk_load_u16_be_avx+0x113>
.byte 196,65,121,16,4,64 // vmovupd (%r8,%rax,2),%xmm8
.byte 196,193,121,16,84,64,16 // vmovupd 0x10(%r8,%rax,2),%xmm2
.byte 196,193,121,16,92,64,32 // vmovupd 0x20(%r8,%rax,2),%xmm3
@@ -16302,7 +16298,7 @@ _sk_load_u16_be_avx:
.byte 196,226,121,51,192 // vpmovzxwd %xmm0,%xmm0
.byte 196,227,125,24,193,1 // vinsertf128 $0x1,%xmm1,%ymm0,%ymm0
.byte 197,252,91,192 // vcvtdq2ps %ymm0,%ymm0
- .byte 196,98,125,24,29,246,19,0,0 // vbroadcastss 0x13f6(%rip),%ymm11 # 5884 <_sk_callback_avx+0x411>
+ .byte 196,98,125,24,29,246,19,0,0 // vbroadcastss 0x13f6(%rip),%ymm11 # 5880 <_sk_callback_avx+0x411>
.byte 196,193,124,89,195 // vmulps %ymm11,%ymm0,%ymm0
.byte 197,177,109,202 // vpunpckhqdq %xmm2,%xmm9,%xmm1
.byte 197,233,113,241,8 // vpsllw $0x8,%xmm1,%xmm2
@@ -16336,29 +16332,29 @@ _sk_load_u16_be_avx:
.byte 196,65,123,16,4,64 // vmovsd (%r8,%rax,2),%xmm8
.byte 196,65,49,239,201 // vpxor %xmm9,%xmm9,%xmm9
.byte 72,131,249,1 // cmp $0x1,%rcx
- .byte 116,85 // je 4580 <_sk_load_u16_be_avx+0x179>
+ .byte 116,85 // je 457c <_sk_load_u16_be_avx+0x179>
.byte 196,65,57,22,68,64,8 // vmovhpd 0x8(%r8,%rax,2),%xmm8,%xmm8
.byte 72,131,249,3 // cmp $0x3,%rcx
- .byte 114,72 // jb 4580 <_sk_load_u16_be_avx+0x179>
+ .byte 114,72 // jb 457c <_sk_load_u16_be_avx+0x179>
.byte 196,193,123,16,84,64,16 // vmovsd 0x10(%r8,%rax,2),%xmm2
.byte 72,131,249,3 // cmp $0x3,%rcx
- .byte 116,72 // je 458d <_sk_load_u16_be_avx+0x186>
+ .byte 116,72 // je 4589 <_sk_load_u16_be_avx+0x186>
.byte 196,193,105,22,84,64,24 // vmovhpd 0x18(%r8,%rax,2),%xmm2,%xmm2
.byte 72,131,249,5 // cmp $0x5,%rcx
- .byte 114,59 // jb 458d <_sk_load_u16_be_avx+0x186>
+ .byte 114,59 // jb 4589 <_sk_load_u16_be_avx+0x186>
.byte 196,193,123,16,92,64,32 // vmovsd 0x20(%r8,%rax,2),%xmm3
.byte 72,131,249,5 // cmp $0x5,%rcx
- .byte 15,132,213,254,255,255 // je 4438 <_sk_load_u16_be_avx+0x31>
+ .byte 15,132,213,254,255,255 // je 4434 <_sk_load_u16_be_avx+0x31>
.byte 196,193,97,22,92,64,40 // vmovhpd 0x28(%r8,%rax,2),%xmm3,%xmm3
.byte 72,131,249,7 // cmp $0x7,%rcx
- .byte 15,130,196,254,255,255 // jb 4438 <_sk_load_u16_be_avx+0x31>
+ .byte 15,130,196,254,255,255 // jb 4434 <_sk_load_u16_be_avx+0x31>
.byte 196,65,122,126,76,64,48 // vmovq 0x30(%r8,%rax,2),%xmm9
- .byte 233,184,254,255,255 // jmpq 4438 <_sk_load_u16_be_avx+0x31>
+ .byte 233,184,254,255,255 // jmpq 4434 <_sk_load_u16_be_avx+0x31>
.byte 197,225,87,219 // vxorpd %xmm3,%xmm3,%xmm3
.byte 197,233,87,210 // vxorpd %xmm2,%xmm2,%xmm2
- .byte 233,171,254,255,255 // jmpq 4438 <_sk_load_u16_be_avx+0x31>
+ .byte 233,171,254,255,255 // jmpq 4434 <_sk_load_u16_be_avx+0x31>
.byte 197,225,87,219 // vxorpd %xmm3,%xmm3,%xmm3
- .byte 233,162,254,255,255 // jmpq 4438 <_sk_load_u16_be_avx+0x31>
+ .byte 233,162,254,255,255 // jmpq 4434 <_sk_load_u16_be_avx+0x31>
HIDDEN _sk_load_rgb_u16_be_avx
.globl _sk_load_rgb_u16_be_avx
@@ -16368,7 +16364,7 @@ _sk_load_rgb_u16_be_avx:
.byte 76,139,0 // mov (%rax),%r8
.byte 72,141,4,127 // lea (%rdi,%rdi,2),%rax
.byte 72,133,201 // test %rcx,%rcx
- .byte 15,133,243,0,0,0 // jne 469b <_sk_load_rgb_u16_be_avx+0x105>
+ .byte 15,133,243,0,0,0 // jne 4697 <_sk_load_rgb_u16_be_avx+0x105>
.byte 196,193,122,111,4,64 // vmovdqu (%r8,%rax,2),%xmm0
.byte 196,193,122,111,84,64,12 // vmovdqu 0xc(%r8,%rax,2),%xmm2
.byte 196,193,122,111,76,64,24 // vmovdqu 0x18(%r8,%rax,2),%xmm1
@@ -16395,7 +16391,7 @@ _sk_load_rgb_u16_be_avx:
.byte 196,226,121,51,192 // vpmovzxwd %xmm0,%xmm0
.byte 196,227,125,24,193,1 // vinsertf128 $0x1,%xmm1,%ymm0,%ymm0
.byte 197,252,91,192 // vcvtdq2ps %ymm0,%ymm0
- .byte 196,98,125,24,29,86,18,0,0 // vbroadcastss 0x1256(%rip),%ymm11 # 5888 <_sk_callback_avx+0x415>
+ .byte 196,98,125,24,29,86,18,0,0 // vbroadcastss 0x1256(%rip),%ymm11 # 5884 <_sk_callback_avx+0x415>
.byte 196,193,124,89,195 // vmulps %ymm11,%ymm0,%ymm0
.byte 197,185,109,202 // vpunpckhqdq %xmm2,%xmm8,%xmm1
.byte 197,233,113,241,8 // vpsllw $0x8,%xmm1,%xmm2
@@ -16416,41 +16412,41 @@ _sk_load_rgb_u16_be_avx:
.byte 197,252,91,210 // vcvtdq2ps %ymm2,%ymm2
.byte 196,193,108,89,211 // vmulps %ymm11,%ymm2,%ymm2
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 196,226,125,24,29,243,17,0,0 // vbroadcastss 0x11f3(%rip),%ymm3 # 588c <_sk_callback_avx+0x419>
+ .byte 196,226,125,24,29,243,17,0,0 // vbroadcastss 0x11f3(%rip),%ymm3 # 5888 <_sk_callback_avx+0x419>
.byte 255,224 // jmpq *%rax
.byte 196,193,121,110,4,64 // vmovd (%r8,%rax,2),%xmm0
.byte 196,193,121,196,68,64,4,2 // vpinsrw $0x2,0x4(%r8,%rax,2),%xmm0,%xmm0
.byte 72,131,249,1 // cmp $0x1,%rcx
- .byte 117,5 // jne 46b4 <_sk_load_rgb_u16_be_avx+0x11e>
- .byte 233,40,255,255,255 // jmpq 45dc <_sk_load_rgb_u16_be_avx+0x46>
+ .byte 117,5 // jne 46b0 <_sk_load_rgb_u16_be_avx+0x11e>
+ .byte 233,40,255,255,255 // jmpq 45d8 <_sk_load_rgb_u16_be_avx+0x46>
.byte 196,193,121,110,76,64,6 // vmovd 0x6(%r8,%rax,2),%xmm1
.byte 196,65,113,196,68,64,10,2 // vpinsrw $0x2,0xa(%r8,%rax,2),%xmm1,%xmm8
.byte 72,131,249,3 // cmp $0x3,%rcx
- .byte 114,26 // jb 46e3 <_sk_load_rgb_u16_be_avx+0x14d>
+ .byte 114,26 // jb 46df <_sk_load_rgb_u16_be_avx+0x14d>
.byte 196,193,121,110,76,64,12 // vmovd 0xc(%r8,%rax,2),%xmm1
.byte 196,193,113,196,84,64,16,2 // vpinsrw $0x2,0x10(%r8,%rax,2),%xmm1,%xmm2
.byte 72,131,249,3 // cmp $0x3,%rcx
- .byte 117,10 // jne 46e8 <_sk_load_rgb_u16_be_avx+0x152>
- .byte 233,249,254,255,255 // jmpq 45dc <_sk_load_rgb_u16_be_avx+0x46>
- .byte 233,244,254,255,255 // jmpq 45dc <_sk_load_rgb_u16_be_avx+0x46>
+ .byte 117,10 // jne 46e4 <_sk_load_rgb_u16_be_avx+0x152>
+ .byte 233,249,254,255,255 // jmpq 45d8 <_sk_load_rgb_u16_be_avx+0x46>
+ .byte 233,244,254,255,255 // jmpq 45d8 <_sk_load_rgb_u16_be_avx+0x46>
.byte 196,193,121,110,76,64,18 // vmovd 0x12(%r8,%rax,2),%xmm1
.byte 196,65,113,196,76,64,22,2 // vpinsrw $0x2,0x16(%r8,%rax,2),%xmm1,%xmm9
.byte 72,131,249,5 // cmp $0x5,%rcx
- .byte 114,26 // jb 4717 <_sk_load_rgb_u16_be_avx+0x181>
+ .byte 114,26 // jb 4713 <_sk_load_rgb_u16_be_avx+0x181>
.byte 196,193,121,110,76,64,24 // vmovd 0x18(%r8,%rax,2),%xmm1
.byte 196,193,113,196,76,64,28,2 // vpinsrw $0x2,0x1c(%r8,%rax,2),%xmm1,%xmm1
.byte 72,131,249,5 // cmp $0x5,%rcx
- .byte 117,10 // jne 471c <_sk_load_rgb_u16_be_avx+0x186>
- .byte 233,197,254,255,255 // jmpq 45dc <_sk_load_rgb_u16_be_avx+0x46>
- .byte 233,192,254,255,255 // jmpq 45dc <_sk_load_rgb_u16_be_avx+0x46>
+ .byte 117,10 // jne 4718 <_sk_load_rgb_u16_be_avx+0x186>
+ .byte 233,197,254,255,255 // jmpq 45d8 <_sk_load_rgb_u16_be_avx+0x46>
+ .byte 233,192,254,255,255 // jmpq 45d8 <_sk_load_rgb_u16_be_avx+0x46>
.byte 196,193,121,110,92,64,30 // vmovd 0x1e(%r8,%rax,2),%xmm3
.byte 196,65,97,196,92,64,34,2 // vpinsrw $0x2,0x22(%r8,%rax,2),%xmm3,%xmm11
.byte 72,131,249,7 // cmp $0x7,%rcx
- .byte 114,20 // jb 4745 <_sk_load_rgb_u16_be_avx+0x1af>
+ .byte 114,20 // jb 4741 <_sk_load_rgb_u16_be_avx+0x1af>
.byte 196,193,121,110,92,64,36 // vmovd 0x24(%r8,%rax,2),%xmm3
.byte 196,193,97,196,92,64,40,2 // vpinsrw $0x2,0x28(%r8,%rax,2),%xmm3,%xmm3
- .byte 233,151,254,255,255 // jmpq 45dc <_sk_load_rgb_u16_be_avx+0x46>
- .byte 233,146,254,255,255 // jmpq 45dc <_sk_load_rgb_u16_be_avx+0x46>
+ .byte 233,151,254,255,255 // jmpq 45d8 <_sk_load_rgb_u16_be_avx+0x46>
+ .byte 233,146,254,255,255 // jmpq 45d8 <_sk_load_rgb_u16_be_avx+0x46>
HIDDEN _sk_store_u16_be_avx
.globl _sk_store_u16_be_avx
@@ -16459,7 +16455,7 @@ _sk_store_u16_be_avx:
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 76,139,0 // mov (%rax),%r8
.byte 72,141,4,189,0,0,0,0 // lea 0x0(,%rdi,4),%rax
- .byte 196,98,125,24,5,48,17,0,0 // vbroadcastss 0x1130(%rip),%ymm8 # 5890 <_sk_callback_avx+0x41d>
+ .byte 196,98,125,24,5,48,17,0,0 // vbroadcastss 0x1130(%rip),%ymm8 # 588c <_sk_callback_avx+0x41d>
.byte 196,65,124,89,200 // vmulps %ymm8,%ymm0,%ymm9
.byte 196,65,125,91,201 // vcvtps2dq %ymm9,%ymm9
.byte 196,67,125,25,202,1 // vextractf128 $0x1,%ymm9,%xmm10
@@ -16497,7 +16493,7 @@ _sk_store_u16_be_avx:
.byte 196,65,17,98,200 // vpunpckldq %xmm8,%xmm13,%xmm9
.byte 196,65,17,106,192 // vpunpckhdq %xmm8,%xmm13,%xmm8
.byte 72,133,201 // test %rcx,%rcx
- .byte 117,31 // jne 4844 <_sk_store_u16_be_avx+0xfa>
+ .byte 117,31 // jne 4840 <_sk_store_u16_be_avx+0xfa>
.byte 196,65,120,17,28,64 // vmovups %xmm11,(%r8,%rax,2)
.byte 196,65,120,17,84,64,16 // vmovups %xmm10,0x10(%r8,%rax,2)
.byte 196,65,120,17,76,64,32 // vmovups %xmm9,0x20(%r8,%rax,2)
@@ -16506,22 +16502,22 @@ _sk_store_u16_be_avx:
.byte 255,224 // jmpq *%rax
.byte 196,65,121,214,28,64 // vmovq %xmm11,(%r8,%rax,2)
.byte 72,131,249,1 // cmp $0x1,%rcx
- .byte 116,240 // je 4840 <_sk_store_u16_be_avx+0xf6>
+ .byte 116,240 // je 483c <_sk_store_u16_be_avx+0xf6>
.byte 196,65,121,23,92,64,8 // vmovhpd %xmm11,0x8(%r8,%rax,2)
.byte 72,131,249,3 // cmp $0x3,%rcx
- .byte 114,227 // jb 4840 <_sk_store_u16_be_avx+0xf6>
+ .byte 114,227 // jb 483c <_sk_store_u16_be_avx+0xf6>
.byte 196,65,121,214,84,64,16 // vmovq %xmm10,0x10(%r8,%rax,2)
- .byte 116,218 // je 4840 <_sk_store_u16_be_avx+0xf6>
+ .byte 116,218 // je 483c <_sk_store_u16_be_avx+0xf6>
.byte 196,65,121,23,84,64,24 // vmovhpd %xmm10,0x18(%r8,%rax,2)
.byte 72,131,249,5 // cmp $0x5,%rcx
- .byte 114,205 // jb 4840 <_sk_store_u16_be_avx+0xf6>
+ .byte 114,205 // jb 483c <_sk_store_u16_be_avx+0xf6>
.byte 196,65,121,214,76,64,32 // vmovq %xmm9,0x20(%r8,%rax,2)
- .byte 116,196 // je 4840 <_sk_store_u16_be_avx+0xf6>
+ .byte 116,196 // je 483c <_sk_store_u16_be_avx+0xf6>
.byte 196,65,121,23,76,64,40 // vmovhpd %xmm9,0x28(%r8,%rax,2)
.byte 72,131,249,7 // cmp $0x7,%rcx
- .byte 114,183 // jb 4840 <_sk_store_u16_be_avx+0xf6>
+ .byte 114,183 // jb 483c <_sk_store_u16_be_avx+0xf6>
.byte 196,65,121,214,68,64,48 // vmovq %xmm8,0x30(%r8,%rax,2)
- .byte 235,174 // jmp 4840 <_sk_store_u16_be_avx+0xf6>
+ .byte 235,174 // jmp 483c <_sk_store_u16_be_avx+0xf6>
HIDDEN _sk_load_f32_avx
.globl _sk_load_f32_avx
@@ -16529,10 +16525,10 @@ FUNCTION(_sk_load_f32_avx)
_sk_load_f32_avx:
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 72,131,249,7 // cmp $0x7,%rcx
- .byte 119,110 // ja 4908 <_sk_load_f32_avx+0x76>
+ .byte 119,110 // ja 4904 <_sk_load_f32_avx+0x76>
.byte 76,139,0 // mov (%rax),%r8
.byte 76,141,12,189,0,0,0,0 // lea 0x0(,%rdi,4),%r9
- .byte 76,141,21,132,0,0,0 // lea 0x84(%rip),%r10 # 4930 <_sk_load_f32_avx+0x9e>
+ .byte 76,141,21,132,0,0,0 // lea 0x84(%rip),%r10 # 492c <_sk_load_f32_avx+0x9e>
.byte 73,99,4,138 // movslq (%r10,%rcx,4),%rax
.byte 76,1,208 // add %r10,%rax
.byte 255,224 // jmpq *%rax
@@ -16591,7 +16587,7 @@ _sk_store_f32_avx:
.byte 196,65,37,20,196 // vunpcklpd %ymm12,%ymm11,%ymm8
.byte 196,65,37,21,220 // vunpckhpd %ymm12,%ymm11,%ymm11
.byte 72,133,201 // test %rcx,%rcx
- .byte 117,55 // jne 49bd <_sk_store_f32_avx+0x6d>
+ .byte 117,55 // jne 49b9 <_sk_store_f32_avx+0x6d>
.byte 196,67,45,24,225,1 // vinsertf128 $0x1,%xmm9,%ymm10,%ymm12
.byte 196,67,61,24,235,1 // vinsertf128 $0x1,%xmm11,%ymm8,%ymm13
.byte 196,67,45,6,201,49 // vperm2f128 $0x31,%ymm9,%ymm10,%ymm9
@@ -16604,22 +16600,22 @@ _sk_store_f32_avx:
.byte 255,224 // jmpq *%rax
.byte 196,65,121,17,20,128 // vmovupd %xmm10,(%r8,%rax,4)
.byte 72,131,249,1 // cmp $0x1,%rcx
- .byte 116,240 // je 49b9 <_sk_store_f32_avx+0x69>
+ .byte 116,240 // je 49b5 <_sk_store_f32_avx+0x69>
.byte 196,65,121,17,76,128,16 // vmovupd %xmm9,0x10(%r8,%rax,4)
.byte 72,131,249,3 // cmp $0x3,%rcx
- .byte 114,227 // jb 49b9 <_sk_store_f32_avx+0x69>
+ .byte 114,227 // jb 49b5 <_sk_store_f32_avx+0x69>
.byte 196,65,121,17,68,128,32 // vmovupd %xmm8,0x20(%r8,%rax,4)
- .byte 116,218 // je 49b9 <_sk_store_f32_avx+0x69>
+ .byte 116,218 // je 49b5 <_sk_store_f32_avx+0x69>
.byte 196,65,121,17,92,128,48 // vmovupd %xmm11,0x30(%r8,%rax,4)
.byte 72,131,249,5 // cmp $0x5,%rcx
- .byte 114,205 // jb 49b9 <_sk_store_f32_avx+0x69>
+ .byte 114,205 // jb 49b5 <_sk_store_f32_avx+0x69>
.byte 196,67,125,25,84,128,64,1 // vextractf128 $0x1,%ymm10,0x40(%r8,%rax,4)
- .byte 116,195 // je 49b9 <_sk_store_f32_avx+0x69>
+ .byte 116,195 // je 49b5 <_sk_store_f32_avx+0x69>
.byte 196,67,125,25,76,128,80,1 // vextractf128 $0x1,%ymm9,0x50(%r8,%rax,4)
.byte 72,131,249,7 // cmp $0x7,%rcx
- .byte 114,181 // jb 49b9 <_sk_store_f32_avx+0x69>
+ .byte 114,181 // jb 49b5 <_sk_store_f32_avx+0x69>
.byte 196,67,125,25,68,128,96,1 // vextractf128 $0x1,%ymm8,0x60(%r8,%rax,4)
- .byte 235,171 // jmp 49b9 <_sk_store_f32_avx+0x69>
+ .byte 235,171 // jmp 49b5 <_sk_store_f32_avx+0x69>
HIDDEN _sk_clamp_x_avx
.globl _sk_clamp_x_avx
@@ -16755,12 +16751,12 @@ HIDDEN _sk_luminance_to_alpha_avx
.globl _sk_luminance_to_alpha_avx
FUNCTION(_sk_luminance_to_alpha_avx)
_sk_luminance_to_alpha_avx:
- .byte 196,226,125,24,29,187,12,0,0 // vbroadcastss 0xcbb(%rip),%ymm3 # 5894 <_sk_callback_avx+0x421>
+ .byte 196,226,125,24,29,187,12,0,0 // vbroadcastss 0xcbb(%rip),%ymm3 # 5890 <_sk_callback_avx+0x421>
.byte 197,252,89,195 // vmulps %ymm3,%ymm0,%ymm0
- .byte 196,226,125,24,29,178,12,0,0 // vbroadcastss 0xcb2(%rip),%ymm3 # 5898 <_sk_callback_avx+0x425>
+ .byte 196,226,125,24,29,178,12,0,0 // vbroadcastss 0xcb2(%rip),%ymm3 # 5894 <_sk_callback_avx+0x425>
.byte 197,244,89,203 // vmulps %ymm3,%ymm1,%ymm1
.byte 197,252,88,193 // vaddps %ymm1,%ymm0,%ymm0
- .byte 196,226,125,24,13,165,12,0,0 // vbroadcastss 0xca5(%rip),%ymm1 # 589c <_sk_callback_avx+0x429>
+ .byte 196,226,125,24,13,165,12,0,0 // vbroadcastss 0xca5(%rip),%ymm1 # 5898 <_sk_callback_avx+0x429>
.byte 197,236,89,201 // vmulps %ymm1,%ymm2,%ymm1
.byte 197,252,88,217 // vaddps %ymm1,%ymm0,%ymm3
.byte 72,173 // lods %ds:(%rsi),%rax
@@ -16938,7 +16934,7 @@ _sk_linear_gradient_avx:
.byte 196,226,125,24,88,28 // vbroadcastss 0x1c(%rax),%ymm3
.byte 76,139,0 // mov (%rax),%r8
.byte 77,133,192 // test %r8,%r8
- .byte 15,132,146,0,0,0 // je 4f4d <_sk_linear_gradient_avx+0xb8>
+ .byte 15,132,146,0,0,0 // je 4f49 <_sk_linear_gradient_avx+0xb8>
.byte 72,139,64,8 // mov 0x8(%rax),%rax
.byte 72,131,192,32 // add $0x20,%rax
.byte 196,65,28,87,228 // vxorps %ymm12,%ymm12,%ymm12
@@ -16965,8 +16961,8 @@ _sk_linear_gradient_avx:
.byte 196,227,13,74,219,208 // vblendvps %ymm13,%ymm3,%ymm14,%ymm3
.byte 72,131,192,36 // add $0x24,%rax
.byte 73,255,200 // dec %r8
- .byte 117,140 // jne 4ed7 <_sk_linear_gradient_avx+0x42>
- .byte 235,20 // jmp 4f61 <_sk_linear_gradient_avx+0xcc>
+ .byte 117,140 // jne 4ed3 <_sk_linear_gradient_avx+0x42>
+ .byte 235,20 // jmp 4f5d <_sk_linear_gradient_avx+0xcc>
.byte 196,65,36,87,219 // vxorps %ymm11,%ymm11,%ymm11
.byte 196,65,44,87,210 // vxorps %ymm10,%ymm10,%ymm10
.byte 196,65,52,87,201 // vxorps %ymm9,%ymm9,%ymm9
@@ -17021,27 +17017,27 @@ _sk_xy_to_polar_unit_avx:
.byte 196,65,52,95,226 // vmaxps %ymm10,%ymm9,%ymm12
.byte 196,65,36,94,220 // vdivps %ymm12,%ymm11,%ymm11
.byte 196,65,36,89,227 // vmulps %ymm11,%ymm11,%ymm12
- .byte 196,98,125,24,45,138,8,0,0 // vbroadcastss 0x88a(%rip),%ymm13 # 58a0 <_sk_callback_avx+0x42d>
+ .byte 196,98,125,24,45,138,8,0,0 // vbroadcastss 0x88a(%rip),%ymm13 # 589c <_sk_callback_avx+0x42d>
.byte 196,65,28,89,237 // vmulps %ymm13,%ymm12,%ymm13
- .byte 196,98,125,24,53,128,8,0,0 // vbroadcastss 0x880(%rip),%ymm14 # 58a4 <_sk_callback_avx+0x431>
+ .byte 196,98,125,24,53,128,8,0,0 // vbroadcastss 0x880(%rip),%ymm14 # 58a0 <_sk_callback_avx+0x431>
.byte 196,65,20,88,238 // vaddps %ymm14,%ymm13,%ymm13
.byte 196,65,28,89,237 // vmulps %ymm13,%ymm12,%ymm13
- .byte 196,98,125,24,53,113,8,0,0 // vbroadcastss 0x871(%rip),%ymm14 # 58a8 <_sk_callback_avx+0x435>
+ .byte 196,98,125,24,53,113,8,0,0 // vbroadcastss 0x871(%rip),%ymm14 # 58a4 <_sk_callback_avx+0x435>
.byte 196,65,20,88,238 // vaddps %ymm14,%ymm13,%ymm13
.byte 196,65,28,89,229 // vmulps %ymm13,%ymm12,%ymm12
- .byte 196,98,125,24,45,98,8,0,0 // vbroadcastss 0x862(%rip),%ymm13 # 58ac <_sk_callback_avx+0x439>
+ .byte 196,98,125,24,45,98,8,0,0 // vbroadcastss 0x862(%rip),%ymm13 # 58a8 <_sk_callback_avx+0x439>
.byte 196,65,28,88,229 // vaddps %ymm13,%ymm12,%ymm12
.byte 196,65,36,89,220 // vmulps %ymm12,%ymm11,%ymm11
.byte 196,65,52,194,202,1 // vcmpltps %ymm10,%ymm9,%ymm9
- .byte 196,98,125,24,21,77,8,0,0 // vbroadcastss 0x84d(%rip),%ymm10 # 58b0 <_sk_callback_avx+0x43d>
+ .byte 196,98,125,24,21,77,8,0,0 // vbroadcastss 0x84d(%rip),%ymm10 # 58ac <_sk_callback_avx+0x43d>
.byte 196,65,44,92,211 // vsubps %ymm11,%ymm10,%ymm10
.byte 196,67,37,74,202,144 // vblendvps %ymm9,%ymm10,%ymm11,%ymm9
.byte 196,193,124,194,192,1 // vcmpltps %ymm8,%ymm0,%ymm0
- .byte 196,98,125,24,21,55,8,0,0 // vbroadcastss 0x837(%rip),%ymm10 # 58b4 <_sk_callback_avx+0x441>
+ .byte 196,98,125,24,21,55,8,0,0 // vbroadcastss 0x837(%rip),%ymm10 # 58b0 <_sk_callback_avx+0x441>
.byte 196,65,44,92,209 // vsubps %ymm9,%ymm10,%ymm10
.byte 196,195,53,74,194,0 // vblendvps %ymm0,%ymm10,%ymm9,%ymm0
.byte 196,65,116,194,200,1 // vcmpltps %ymm8,%ymm1,%ymm9
- .byte 196,98,125,24,21,33,8,0,0 // vbroadcastss 0x821(%rip),%ymm10 # 58b8 <_sk_callback_avx+0x445>
+ .byte 196,98,125,24,21,33,8,0,0 // vbroadcastss 0x821(%rip),%ymm10 # 58b4 <_sk_callback_avx+0x445>
.byte 197,44,92,208 // vsubps %ymm0,%ymm10,%ymm10
.byte 196,195,125,74,194,144 // vblendvps %ymm9,%ymm10,%ymm0,%ymm0
.byte 196,65,124,194,200,3 // vcmpunordps %ymm8,%ymm0,%ymm9
@@ -17054,7 +17050,7 @@ HIDDEN _sk_save_xy_avx
FUNCTION(_sk_save_xy_avx)
_sk_save_xy_avx:
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 196,98,125,24,5,0,8,0,0 // vbroadcastss 0x800(%rip),%ymm8 # 58bc <_sk_callback_avx+0x449>
+ .byte 196,98,125,24,5,0,8,0,0 // vbroadcastss 0x800(%rip),%ymm8 # 58b8 <_sk_callback_avx+0x449>
.byte 196,65,124,88,200 // vaddps %ymm8,%ymm0,%ymm9
.byte 196,67,125,8,209,1 // vroundps $0x1,%ymm9,%ymm10
.byte 196,65,52,92,202 // vsubps %ymm10,%ymm9,%ymm9
@@ -17091,9 +17087,9 @@ HIDDEN _sk_bilinear_nx_avx
FUNCTION(_sk_bilinear_nx_avx)
_sk_bilinear_nx_avx:
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 196,226,125,24,5,140,7,0,0 // vbroadcastss 0x78c(%rip),%ymm0 # 58c0 <_sk_callback_avx+0x44d>
+ .byte 196,226,125,24,5,140,7,0,0 // vbroadcastss 0x78c(%rip),%ymm0 # 58bc <_sk_callback_avx+0x44d>
.byte 197,252,88,0 // vaddps (%rax),%ymm0,%ymm0
- .byte 196,98,125,24,5,131,7,0,0 // vbroadcastss 0x783(%rip),%ymm8 # 58c4 <_sk_callback_avx+0x451>
+ .byte 196,98,125,24,5,131,7,0,0 // vbroadcastss 0x783(%rip),%ymm8 # 58c0 <_sk_callback_avx+0x451>
.byte 197,60,92,64,64 // vsubps 0x40(%rax),%ymm8,%ymm8
.byte 197,124,17,128,128,0,0,0 // vmovups %ymm8,0x80(%rax)
.byte 72,173 // lods %ds:(%rsi),%rax
@@ -17104,7 +17100,7 @@ HIDDEN _sk_bilinear_px_avx
FUNCTION(_sk_bilinear_px_avx)
_sk_bilinear_px_avx:
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 196,226,125,24,5,107,7,0,0 // vbroadcastss 0x76b(%rip),%ymm0 # 58c8 <_sk_callback_avx+0x455>
+ .byte 196,226,125,24,5,107,7,0,0 // vbroadcastss 0x76b(%rip),%ymm0 # 58c4 <_sk_callback_avx+0x455>
.byte 197,252,88,0 // vaddps (%rax),%ymm0,%ymm0
.byte 197,124,16,64,64 // vmovups 0x40(%rax),%ymm8
.byte 197,124,17,128,128,0,0,0 // vmovups %ymm8,0x80(%rax)
@@ -17116,9 +17112,9 @@ HIDDEN _sk_bilinear_ny_avx
FUNCTION(_sk_bilinear_ny_avx)
_sk_bilinear_ny_avx:
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 196,226,125,24,13,79,7,0,0 // vbroadcastss 0x74f(%rip),%ymm1 # 58cc <_sk_callback_avx+0x459>
+ .byte 196,226,125,24,13,79,7,0,0 // vbroadcastss 0x74f(%rip),%ymm1 # 58c8 <_sk_callback_avx+0x459>
.byte 197,244,88,72,32 // vaddps 0x20(%rax),%ymm1,%ymm1
- .byte 196,98,125,24,5,69,7,0,0 // vbroadcastss 0x745(%rip),%ymm8 # 58d0 <_sk_callback_avx+0x45d>
+ .byte 196,98,125,24,5,69,7,0,0 // vbroadcastss 0x745(%rip),%ymm8 # 58cc <_sk_callback_avx+0x45d>
.byte 197,60,92,64,96 // vsubps 0x60(%rax),%ymm8,%ymm8
.byte 197,124,17,128,160,0,0,0 // vmovups %ymm8,0xa0(%rax)
.byte 72,173 // lods %ds:(%rsi),%rax
@@ -17129,7 +17125,7 @@ HIDDEN _sk_bilinear_py_avx
FUNCTION(_sk_bilinear_py_avx)
_sk_bilinear_py_avx:
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 196,226,125,24,13,45,7,0,0 // vbroadcastss 0x72d(%rip),%ymm1 # 58d4 <_sk_callback_avx+0x461>
+ .byte 196,226,125,24,13,45,7,0,0 // vbroadcastss 0x72d(%rip),%ymm1 # 58d0 <_sk_callback_avx+0x461>
.byte 197,244,88,72,32 // vaddps 0x20(%rax),%ymm1,%ymm1
.byte 197,124,16,64,96 // vmovups 0x60(%rax),%ymm8
.byte 197,124,17,128,160,0,0,0 // vmovups %ymm8,0xa0(%rax)
@@ -17141,14 +17137,14 @@ HIDDEN _sk_bicubic_n3x_avx
FUNCTION(_sk_bicubic_n3x_avx)
_sk_bicubic_n3x_avx:
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 196,226,125,24,5,16,7,0,0 // vbroadcastss 0x710(%rip),%ymm0 # 58d8 <_sk_callback_avx+0x465>
+ .byte 196,226,125,24,5,16,7,0,0 // vbroadcastss 0x710(%rip),%ymm0 # 58d4 <_sk_callback_avx+0x465>
.byte 197,252,88,0 // vaddps (%rax),%ymm0,%ymm0
- .byte 196,98,125,24,5,7,7,0,0 // vbroadcastss 0x707(%rip),%ymm8 # 58dc <_sk_callback_avx+0x469>
+ .byte 196,98,125,24,5,7,7,0,0 // vbroadcastss 0x707(%rip),%ymm8 # 58d8 <_sk_callback_avx+0x469>
.byte 197,60,92,64,64 // vsubps 0x40(%rax),%ymm8,%ymm8
.byte 196,65,60,89,200 // vmulps %ymm8,%ymm8,%ymm9
- .byte 196,98,125,24,21,248,6,0,0 // vbroadcastss 0x6f8(%rip),%ymm10 # 58e0 <_sk_callback_avx+0x46d>
+ .byte 196,98,125,24,21,248,6,0,0 // vbroadcastss 0x6f8(%rip),%ymm10 # 58dc <_sk_callback_avx+0x46d>
.byte 196,65,60,89,194 // vmulps %ymm10,%ymm8,%ymm8
- .byte 196,98,125,24,21,238,6,0,0 // vbroadcastss 0x6ee(%rip),%ymm10 # 58e4 <_sk_callback_avx+0x471>
+ .byte 196,98,125,24,21,238,6,0,0 // vbroadcastss 0x6ee(%rip),%ymm10 # 58e0 <_sk_callback_avx+0x471>
.byte 196,65,60,88,194 // vaddps %ymm10,%ymm8,%ymm8
.byte 196,65,52,89,192 // vmulps %ymm8,%ymm9,%ymm8
.byte 197,124,17,128,128,0,0,0 // vmovups %ymm8,0x80(%rax)
@@ -17160,19 +17156,19 @@ HIDDEN _sk_bicubic_n1x_avx
FUNCTION(_sk_bicubic_n1x_avx)
_sk_bicubic_n1x_avx:
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 196,226,125,24,5,209,6,0,0 // vbroadcastss 0x6d1(%rip),%ymm0 # 58e8 <_sk_callback_avx+0x475>
+ .byte 196,226,125,24,5,209,6,0,0 // vbroadcastss 0x6d1(%rip),%ymm0 # 58e4 <_sk_callback_avx+0x475>
.byte 197,252,88,0 // vaddps (%rax),%ymm0,%ymm0
- .byte 196,98,125,24,5,200,6,0,0 // vbroadcastss 0x6c8(%rip),%ymm8 # 58ec <_sk_callback_avx+0x479>
+ .byte 196,98,125,24,5,200,6,0,0 // vbroadcastss 0x6c8(%rip),%ymm8 # 58e8 <_sk_callback_avx+0x479>
.byte 197,60,92,64,64 // vsubps 0x40(%rax),%ymm8,%ymm8
- .byte 196,98,125,24,13,190,6,0,0 // vbroadcastss 0x6be(%rip),%ymm9 # 58f0 <_sk_callback_avx+0x47d>
+ .byte 196,98,125,24,13,190,6,0,0 // vbroadcastss 0x6be(%rip),%ymm9 # 58ec <_sk_callback_avx+0x47d>
.byte 196,65,60,89,201 // vmulps %ymm9,%ymm8,%ymm9
- .byte 196,98,125,24,21,180,6,0,0 // vbroadcastss 0x6b4(%rip),%ymm10 # 58f4 <_sk_callback_avx+0x481>
+ .byte 196,98,125,24,21,180,6,0,0 // vbroadcastss 0x6b4(%rip),%ymm10 # 58f0 <_sk_callback_avx+0x481>
.byte 196,65,52,88,202 // vaddps %ymm10,%ymm9,%ymm9
.byte 196,65,60,89,201 // vmulps %ymm9,%ymm8,%ymm9
- .byte 196,98,125,24,21,165,6,0,0 // vbroadcastss 0x6a5(%rip),%ymm10 # 58f8 <_sk_callback_avx+0x485>
+ .byte 196,98,125,24,21,165,6,0,0 // vbroadcastss 0x6a5(%rip),%ymm10 # 58f4 <_sk_callback_avx+0x485>
.byte 196,65,52,88,202 // vaddps %ymm10,%ymm9,%ymm9
.byte 196,65,60,89,193 // vmulps %ymm9,%ymm8,%ymm8
- .byte 196,98,125,24,13,150,6,0,0 // vbroadcastss 0x696(%rip),%ymm9 # 58fc <_sk_callback_avx+0x489>
+ .byte 196,98,125,24,13,150,6,0,0 // vbroadcastss 0x696(%rip),%ymm9 # 58f8 <_sk_callback_avx+0x489>
.byte 196,65,60,88,193 // vaddps %ymm9,%ymm8,%ymm8
.byte 197,124,17,128,128,0,0,0 // vmovups %ymm8,0x80(%rax)
.byte 72,173 // lods %ds:(%rsi),%rax
@@ -17183,17 +17179,17 @@ HIDDEN _sk_bicubic_p1x_avx
FUNCTION(_sk_bicubic_p1x_avx)
_sk_bicubic_p1x_avx:
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 196,98,125,24,5,126,6,0,0 // vbroadcastss 0x67e(%rip),%ymm8 # 5900 <_sk_callback_avx+0x48d>
+ .byte 196,98,125,24,5,126,6,0,0 // vbroadcastss 0x67e(%rip),%ymm8 # 58fc <_sk_callback_avx+0x48d>
.byte 197,188,88,0 // vaddps (%rax),%ymm8,%ymm0
.byte 197,124,16,72,64 // vmovups 0x40(%rax),%ymm9
- .byte 196,98,125,24,21,112,6,0,0 // vbroadcastss 0x670(%rip),%ymm10 # 5904 <_sk_callback_avx+0x491>
+ .byte 196,98,125,24,21,112,6,0,0 // vbroadcastss 0x670(%rip),%ymm10 # 5900 <_sk_callback_avx+0x491>
.byte 196,65,52,89,210 // vmulps %ymm10,%ymm9,%ymm10
- .byte 196,98,125,24,29,102,6,0,0 // vbroadcastss 0x666(%rip),%ymm11 # 5908 <_sk_callback_avx+0x495>
+ .byte 196,98,125,24,29,102,6,0,0 // vbroadcastss 0x666(%rip),%ymm11 # 5904 <_sk_callback_avx+0x495>
.byte 196,65,44,88,211 // vaddps %ymm11,%ymm10,%ymm10
.byte 196,65,52,89,210 // vmulps %ymm10,%ymm9,%ymm10
.byte 196,65,44,88,192 // vaddps %ymm8,%ymm10,%ymm8
.byte 196,65,52,89,192 // vmulps %ymm8,%ymm9,%ymm8
- .byte 196,98,125,24,13,77,6,0,0 // vbroadcastss 0x64d(%rip),%ymm9 # 590c <_sk_callback_avx+0x499>
+ .byte 196,98,125,24,13,77,6,0,0 // vbroadcastss 0x64d(%rip),%ymm9 # 5908 <_sk_callback_avx+0x499>
.byte 196,65,60,88,193 // vaddps %ymm9,%ymm8,%ymm8
.byte 197,124,17,128,128,0,0,0 // vmovups %ymm8,0x80(%rax)
.byte 72,173 // lods %ds:(%rsi),%rax
@@ -17204,13 +17200,13 @@ HIDDEN _sk_bicubic_p3x_avx
FUNCTION(_sk_bicubic_p3x_avx)
_sk_bicubic_p3x_avx:
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 196,226,125,24,5,53,6,0,0 // vbroadcastss 0x635(%rip),%ymm0 # 5910 <_sk_callback_avx+0x49d>
+ .byte 196,226,125,24,5,53,6,0,0 // vbroadcastss 0x635(%rip),%ymm0 # 590c <_sk_callback_avx+0x49d>
.byte 197,252,88,0 // vaddps (%rax),%ymm0,%ymm0
.byte 197,124,16,64,64 // vmovups 0x40(%rax),%ymm8
.byte 196,65,60,89,200 // vmulps %ymm8,%ymm8,%ymm9
- .byte 196,98,125,24,21,34,6,0,0 // vbroadcastss 0x622(%rip),%ymm10 # 5914 <_sk_callback_avx+0x4a1>
+ .byte 196,98,125,24,21,34,6,0,0 // vbroadcastss 0x622(%rip),%ymm10 # 5910 <_sk_callback_avx+0x4a1>
.byte 196,65,60,89,194 // vmulps %ymm10,%ymm8,%ymm8
- .byte 196,98,125,24,21,24,6,0,0 // vbroadcastss 0x618(%rip),%ymm10 # 5918 <_sk_callback_avx+0x4a5>
+ .byte 196,98,125,24,21,24,6,0,0 // vbroadcastss 0x618(%rip),%ymm10 # 5914 <_sk_callback_avx+0x4a5>
.byte 196,65,60,88,194 // vaddps %ymm10,%ymm8,%ymm8
.byte 196,65,52,89,192 // vmulps %ymm8,%ymm9,%ymm8
.byte 197,124,17,128,128,0,0,0 // vmovups %ymm8,0x80(%rax)
@@ -17222,14 +17218,14 @@ HIDDEN _sk_bicubic_n3y_avx
FUNCTION(_sk_bicubic_n3y_avx)
_sk_bicubic_n3y_avx:
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 196,226,125,24,13,251,5,0,0 // vbroadcastss 0x5fb(%rip),%ymm1 # 591c <_sk_callback_avx+0x4a9>
+ .byte 196,226,125,24,13,251,5,0,0 // vbroadcastss 0x5fb(%rip),%ymm1 # 5918 <_sk_callback_avx+0x4a9>
.byte 197,244,88,72,32 // vaddps 0x20(%rax),%ymm1,%ymm1
- .byte 196,98,125,24,5,241,5,0,0 // vbroadcastss 0x5f1(%rip),%ymm8 # 5920 <_sk_callback_avx+0x4ad>
+ .byte 196,98,125,24,5,241,5,0,0 // vbroadcastss 0x5f1(%rip),%ymm8 # 591c <_sk_callback_avx+0x4ad>
.byte 197,60,92,64,96 // vsubps 0x60(%rax),%ymm8,%ymm8
.byte 196,65,60,89,200 // vmulps %ymm8,%ymm8,%ymm9
- .byte 196,98,125,24,21,226,5,0,0 // vbroadcastss 0x5e2(%rip),%ymm10 # 5924 <_sk_callback_avx+0x4b1>
+ .byte 196,98,125,24,21,226,5,0,0 // vbroadcastss 0x5e2(%rip),%ymm10 # 5920 <_sk_callback_avx+0x4b1>
.byte 196,65,60,89,194 // vmulps %ymm10,%ymm8,%ymm8
- .byte 196,98,125,24,21,216,5,0,0 // vbroadcastss 0x5d8(%rip),%ymm10 # 5928 <_sk_callback_avx+0x4b5>
+ .byte 196,98,125,24,21,216,5,0,0 // vbroadcastss 0x5d8(%rip),%ymm10 # 5924 <_sk_callback_avx+0x4b5>
.byte 196,65,60,88,194 // vaddps %ymm10,%ymm8,%ymm8
.byte 196,65,52,89,192 // vmulps %ymm8,%ymm9,%ymm8
.byte 197,124,17,128,160,0,0,0 // vmovups %ymm8,0xa0(%rax)
@@ -17241,19 +17237,19 @@ HIDDEN _sk_bicubic_n1y_avx
FUNCTION(_sk_bicubic_n1y_avx)
_sk_bicubic_n1y_avx:
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 196,226,125,24,13,187,5,0,0 // vbroadcastss 0x5bb(%rip),%ymm1 # 592c <_sk_callback_avx+0x4b9>
+ .byte 196,226,125,24,13,187,5,0,0 // vbroadcastss 0x5bb(%rip),%ymm1 # 5928 <_sk_callback_avx+0x4b9>
.byte 197,244,88,72,32 // vaddps 0x20(%rax),%ymm1,%ymm1
- .byte 196,98,125,24,5,177,5,0,0 // vbroadcastss 0x5b1(%rip),%ymm8 # 5930 <_sk_callback_avx+0x4bd>
+ .byte 196,98,125,24,5,177,5,0,0 // vbroadcastss 0x5b1(%rip),%ymm8 # 592c <_sk_callback_avx+0x4bd>
.byte 197,60,92,64,96 // vsubps 0x60(%rax),%ymm8,%ymm8
- .byte 196,98,125,24,13,167,5,0,0 // vbroadcastss 0x5a7(%rip),%ymm9 # 5934 <_sk_callback_avx+0x4c1>
+ .byte 196,98,125,24,13,167,5,0,0 // vbroadcastss 0x5a7(%rip),%ymm9 # 5930 <_sk_callback_avx+0x4c1>
.byte 196,65,60,89,201 // vmulps %ymm9,%ymm8,%ymm9
- .byte 196,98,125,24,21,157,5,0,0 // vbroadcastss 0x59d(%rip),%ymm10 # 5938 <_sk_callback_avx+0x4c5>
+ .byte 196,98,125,24,21,157,5,0,0 // vbroadcastss 0x59d(%rip),%ymm10 # 5934 <_sk_callback_avx+0x4c5>
.byte 196,65,52,88,202 // vaddps %ymm10,%ymm9,%ymm9
.byte 196,65,60,89,201 // vmulps %ymm9,%ymm8,%ymm9
- .byte 196,98,125,24,21,142,5,0,0 // vbroadcastss 0x58e(%rip),%ymm10 # 593c <_sk_callback_avx+0x4c9>
+ .byte 196,98,125,24,21,142,5,0,0 // vbroadcastss 0x58e(%rip),%ymm10 # 5938 <_sk_callback_avx+0x4c9>
.byte 196,65,52,88,202 // vaddps %ymm10,%ymm9,%ymm9
.byte 196,65,60,89,193 // vmulps %ymm9,%ymm8,%ymm8
- .byte 196,98,125,24,13,127,5,0,0 // vbroadcastss 0x57f(%rip),%ymm9 # 5940 <_sk_callback_avx+0x4cd>
+ .byte 196,98,125,24,13,127,5,0,0 // vbroadcastss 0x57f(%rip),%ymm9 # 593c <_sk_callback_avx+0x4cd>
.byte 196,65,60,88,193 // vaddps %ymm9,%ymm8,%ymm8
.byte 197,124,17,128,160,0,0,0 // vmovups %ymm8,0xa0(%rax)
.byte 72,173 // lods %ds:(%rsi),%rax
@@ -17264,17 +17260,17 @@ HIDDEN _sk_bicubic_p1y_avx
FUNCTION(_sk_bicubic_p1y_avx)
_sk_bicubic_p1y_avx:
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 196,98,125,24,5,103,5,0,0 // vbroadcastss 0x567(%rip),%ymm8 # 5944 <_sk_callback_avx+0x4d1>
+ .byte 196,98,125,24,5,103,5,0,0 // vbroadcastss 0x567(%rip),%ymm8 # 5940 <_sk_callback_avx+0x4d1>
.byte 197,188,88,72,32 // vaddps 0x20(%rax),%ymm8,%ymm1
.byte 197,124,16,72,96 // vmovups 0x60(%rax),%ymm9
- .byte 196,98,125,24,21,88,5,0,0 // vbroadcastss 0x558(%rip),%ymm10 # 5948 <_sk_callback_avx+0x4d5>
+ .byte 196,98,125,24,21,88,5,0,0 // vbroadcastss 0x558(%rip),%ymm10 # 5944 <_sk_callback_avx+0x4d5>
.byte 196,65,52,89,210 // vmulps %ymm10,%ymm9,%ymm10
- .byte 196,98,125,24,29,78,5,0,0 // vbroadcastss 0x54e(%rip),%ymm11 # 594c <_sk_callback_avx+0x4d9>
+ .byte 196,98,125,24,29,78,5,0,0 // vbroadcastss 0x54e(%rip),%ymm11 # 5948 <_sk_callback_avx+0x4d9>
.byte 196,65,44,88,211 // vaddps %ymm11,%ymm10,%ymm10
.byte 196,65,52,89,210 // vmulps %ymm10,%ymm9,%ymm10
.byte 196,65,44,88,192 // vaddps %ymm8,%ymm10,%ymm8
.byte 196,65,52,89,192 // vmulps %ymm8,%ymm9,%ymm8
- .byte 196,98,125,24,13,53,5,0,0 // vbroadcastss 0x535(%rip),%ymm9 # 5950 <_sk_callback_avx+0x4dd>
+ .byte 196,98,125,24,13,53,5,0,0 // vbroadcastss 0x535(%rip),%ymm9 # 594c <_sk_callback_avx+0x4dd>
.byte 196,65,60,88,193 // vaddps %ymm9,%ymm8,%ymm8
.byte 197,124,17,128,160,0,0,0 // vmovups %ymm8,0xa0(%rax)
.byte 72,173 // lods %ds:(%rsi),%rax
@@ -17285,13 +17281,13 @@ HIDDEN _sk_bicubic_p3y_avx
FUNCTION(_sk_bicubic_p3y_avx)
_sk_bicubic_p3y_avx:
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 196,226,125,24,13,29,5,0,0 // vbroadcastss 0x51d(%rip),%ymm1 # 5954 <_sk_callback_avx+0x4e1>
+ .byte 196,226,125,24,13,29,5,0,0 // vbroadcastss 0x51d(%rip),%ymm1 # 5950 <_sk_callback_avx+0x4e1>
.byte 197,244,88,72,32 // vaddps 0x20(%rax),%ymm1,%ymm1
.byte 197,124,16,64,96 // vmovups 0x60(%rax),%ymm8
.byte 196,65,60,89,200 // vmulps %ymm8,%ymm8,%ymm9
- .byte 196,98,125,24,21,9,5,0,0 // vbroadcastss 0x509(%rip),%ymm10 # 5958 <_sk_callback_avx+0x4e5>
+ .byte 196,98,125,24,21,9,5,0,0 // vbroadcastss 0x509(%rip),%ymm10 # 5954 <_sk_callback_avx+0x4e5>
.byte 196,65,60,89,194 // vmulps %ymm10,%ymm8,%ymm8
- .byte 196,98,125,24,21,255,4,0,0 // vbroadcastss 0x4ff(%rip),%ymm10 # 595c <_sk_callback_avx+0x4e9>
+ .byte 196,98,125,24,21,255,4,0,0 // vbroadcastss 0x4ff(%rip),%ymm10 # 5958 <_sk_callback_avx+0x4e9>
.byte 196,65,60,88,194 // vaddps %ymm10,%ymm8,%ymm8
.byte 196,65,52,89,192 // vmulps %ymm8,%ymm9,%ymm8
.byte 197,124,17,128,160,0,0,0 // vmovups %ymm8,0xa0(%rax)
@@ -17384,11 +17380,10 @@ BALIGN4
.byte 0,0 // add %al,(%rax)
.byte 2,0 // add (%rax),%al
.byte 0,0 // add %al,(%rax)
- .byte 33,8 // and %ecx,(%rax)
- .byte 130 // (bad)
- .byte 60,0 // cmp $0x0,%al
.byte 0,0 // add %al,(%rax)
- .byte 191,0,0,128,63 // mov $0x3f800000,%edi
+ .byte 128,60,0,0 // cmpb $0x0,(%rax,%rax,1)
+ .byte 252 // cld
+ .byte 190,0,0,128,63 // mov $0x3f800000,%esi
.byte 0,0 // add %al,(%rax)
.byte 128,63,0 // cmpb $0x0,(%rdi)
.byte 0,128,63,0,0,128 // add %al,-0x7fffffc1(%rax)
@@ -17460,7 +17455,7 @@ BALIGN4
.byte 190,129,128,128,59 // mov $0x3b808081,%esi
.byte 129,128,128,59,0,248,0,0,8,33 // addl $0x21080000,-0x7ffc480(%rax)
.byte 132,55 // test %dh,(%rdi)
- .byte 224,7 // loopne 5685 <.literal4+0xed>
+ .byte 224,7 // loopne 5681 <.literal4+0xed>
.byte 0,0 // add %al,(%rax)
.byte 33,8 // and %ecx,(%rax)
.byte 2,58 // add (%rdx),%bh
@@ -17474,10 +17469,10 @@ BALIGN4
.byte 129,128,128,59,129,128,128,59,0,0 // addl $0x3b80,-0x7f7ec480(%rax)
.byte 0,52,255 // add %dh,(%rdi,%rdi,8)
.byte 255 // (bad)
- .byte 127,0 // jg 56b0 <.literal4+0x118>
+ .byte 127,0 // jg 56ac <.literal4+0x118>
.byte 0,0 // add %al,(%rax)
.byte 0,63 // add %bh,(%rdi)
- .byte 119,115 // ja 5729 <.literal4+0x191>
+ .byte 119,115 // ja 5725 <.literal4+0x191>
.byte 248 // clc
.byte 194,117,191 // retq $0xbf75
.byte 191,63,249,68,180 // mov $0xb444f93f,%edi
@@ -17491,10 +17486,10 @@ BALIGN4
.byte 0,128,63,0,0,0 // add %al,0x3f(%rax)
.byte 52,255 // xor $0xff,%al
.byte 255 // (bad)
- .byte 127,0 // jg 56e4 <.literal4+0x14c>
+ .byte 127,0 // jg 56e0 <.literal4+0x14c>
.byte 0,0 // add %al,(%rax)
.byte 0,63 // add %bh,(%rdi)
- .byte 119,115 // ja 575d <.literal4+0x1c5>
+ .byte 119,115 // ja 5759 <.literal4+0x1c5>
.byte 248 // clc
.byte 194,117,191 // retq $0xbf75
.byte 191,63,249,68,180 // mov $0xb444f93f,%edi
@@ -17508,10 +17503,10 @@ BALIGN4
.byte 0,128,63,0,0,0 // add %al,0x3f(%rax)
.byte 52,255 // xor $0xff,%al
.byte 255 // (bad)
- .byte 127,0 // jg 5718 <.literal4+0x180>
+ .byte 127,0 // jg 5714 <.literal4+0x180>
.byte 0,0 // add %al,(%rax)
.byte 0,63 // add %bh,(%rdi)
- .byte 119,115 // ja 5791 <.literal4+0x1f9>
+ .byte 119,115 // ja 578d <.literal4+0x1f9>
.byte 248 // clc
.byte 194,117,191 // retq $0xbf75
.byte 191,63,249,68,180 // mov $0xb444f93f,%edi
@@ -17525,10 +17520,10 @@ BALIGN4
.byte 0,128,63,0,0,0 // add %al,0x3f(%rax)
.byte 52,255 // xor $0xff,%al
.byte 255 // (bad)
- .byte 127,0 // jg 574c <.literal4+0x1b4>
+ .byte 127,0 // jg 5748 <.literal4+0x1b4>
.byte 0,0 // add %al,(%rax)
.byte 0,63 // add %bh,(%rdi)
- .byte 119,115 // ja 57c5 <.literal4+0x22d>
+ .byte 119,115 // ja 57c1 <.literal4+0x22d>
.byte 248 // clc
.byte 194,117,191 // retq $0xbf75
.byte 191,63,249,68,180 // mov $0xb444f93f,%edi
@@ -17541,7 +17536,7 @@ BALIGN4
.byte 0,75,0 // add %cl,0x0(%rbx)
.byte 0,128,63,0,0,200 // add %al,-0x37ffffc1(%rax)
.byte 66,0,0 // rex.X add %al,(%rax)
- .byte 127,67 // jg 57c3 <.literal4+0x22b>
+ .byte 127,67 // jg 57bf <.literal4+0x22b>
.byte 0,0 // add %al,(%rax)
.byte 0,195 // add %al,%bl
.byte 0,0 // add %al,(%rax)
@@ -17553,10 +17548,10 @@ BALIGN4
.byte 190,80,128,3,62 // mov $0x3e038050,%esi
.byte 31 // (bad)
.byte 215 // xlat %ds:(%rbx)
- .byte 118,63 // jbe 57e3 <.literal4+0x24b>
+ .byte 118,63 // jbe 57df <.literal4+0x24b>
.byte 246,64,83,63 // testb $0x3f,0x53(%rax)
.byte 129,128,128,59,129,128,128,59,0,0 // addl $0x3b80,-0x7f7ec480(%rax)
- .byte 127,67 // jg 57f7 <.literal4+0x25f>
+ .byte 127,67 // jg 57f3 <.literal4+0x25f>
.byte 129,128,128,59,0,0,128,63,129,128 // addl $0x80813f80,0x3b80(%rax)
.byte 128,59,0 // cmpb $0x0,(%rbx)
.byte 0,128,63,129,128,128 // add %al,-0x7f7f7ec1(%rax)
@@ -17565,7 +17560,7 @@ BALIGN4
.byte 0,0 // add %al,(%rax)
.byte 8,33 // or %ah,(%rcx)
.byte 132,55 // test %dh,(%rdi)
- .byte 224,7 // loopne 57d9 <.literal4+0x241>
+ .byte 224,7 // loopne 57d5 <.literal4+0x241>
.byte 0,0 // add %al,(%rax)
.byte 33,8 // and %ecx,(%rax)
.byte 2,58 // add (%rdx),%bh
@@ -17577,7 +17572,7 @@ BALIGN4
.byte 0,0 // add %al,(%rax)
.byte 8,33 // or %ah,(%rcx)
.byte 132,55 // test %dh,(%rdi)
- .byte 224,7 // loopne 57f5 <.literal4+0x25d>
+ .byte 224,7 // loopne 57f1 <.literal4+0x25d>
.byte 0,0 // add %al,(%rax)
.byte 33,8 // and %ecx,(%rax)
.byte 2,58 // add (%rdx),%bh
@@ -17588,7 +17583,7 @@ BALIGN4
.byte 0,0 // add %al,(%rax)
.byte 248 // clc
.byte 65,0,0 // add %al,(%r8)
- .byte 124,66 // jl 584a <.literal4+0x2b2>
+ .byte 124,66 // jl 5846 <.literal4+0x2b2>
.byte 0,240 // add %dh,%al
.byte 0,0 // add %al,(%rax)
.byte 137,136,136,55,0,15 // mov %ecx,0xf003788(%rax)
@@ -17606,9 +17601,9 @@ BALIGN4
.byte 137,136,136,59,15,0 // mov %ecx,0xf3b88(%rax)
.byte 0,0 // add %al,(%rax)
.byte 137,136,136,61,0,0 // mov %ecx,0x3d88(%rax)
- .byte 112,65 // jo 588d <.literal4+0x2f5>
+ .byte 112,65 // jo 5889 <.literal4+0x2f5>
.byte 129,128,128,59,129,128,128,59,0,0 // addl $0x3b80,-0x7f7ec480(%rax)
- .byte 127,67 // jg 589b <.literal4+0x303>
+ .byte 127,67 // jg 5897 <.literal4+0x303>
.byte 0,128,0,0,0,0 // add %al,0x0(%rax)
.byte 0,128,0,4,0,128 // add %al,-0x7ffffc00(%rax)
.byte 0,0 // add %al,(%rax)
@@ -17624,7 +17619,7 @@ BALIGN4
.byte 0,128,55,0,0,128 // add %al,-0x7fffffc9(%rax)
.byte 63 // (bad)
.byte 0,255 // add %bh,%bh
- .byte 127,71 // jg 58db <.literal4+0x343>
+ .byte 127,71 // jg 58d7 <.literal4+0x343>
.byte 208 // (bad)
.byte 179,89 // mov $0x59,%bl
.byte 62,89 // ds pop %rcx
@@ -17851,7 +17846,7 @@ _sk_seed_shader_sse41:
.byte 102,15,110,199 // movd %edi,%xmm0
.byte 102,15,112,192,0 // pshufd $0x0,%xmm0,%xmm0
.byte 15,91,200 // cvtdq2ps %xmm0,%xmm1
- .byte 15,40,21,68,58,0,0 // movaps 0x3a44(%rip),%xmm2 # 3ac0 <_sk_callback_sse41+0xdc>
+ .byte 15,40,21,68,58,0,0 // movaps 0x3a44(%rip),%xmm2 # 3ac0 <_sk_callback_sse41+0xe0>
.byte 15,88,202 // addps %xmm2,%xmm1
.byte 15,16,2 // movups (%rdx),%xmm0
.byte 15,88,193 // addps %xmm1,%xmm0
@@ -17860,7 +17855,7 @@ _sk_seed_shader_sse41:
.byte 15,91,201 // cvtdq2ps %xmm1,%xmm1
.byte 15,88,202 // addps %xmm2,%xmm1
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 15,40,21,51,58,0,0 // movaps 0x3a33(%rip),%xmm2 # 3ad0 <_sk_callback_sse41+0xec>
+ .byte 15,40,21,51,58,0,0 // movaps 0x3a33(%rip),%xmm2 # 3ad0 <_sk_callback_sse41+0xf0>
.byte 15,87,219 // xorps %xmm3,%xmm3
.byte 15,87,228 // xorps %xmm4,%xmm4
.byte 15,87,237 // xorps %xmm5,%xmm5
@@ -17883,14 +17878,14 @@ _sk_dither_sse41:
.byte 102,68,15,110,1 // movd (%rcx),%xmm8
.byte 102,69,15,112,192,0 // pshufd $0x0,%xmm8,%xmm8
.byte 102,69,15,239,193 // pxor %xmm9,%xmm8
- .byte 102,68,15,111,21,248,57,0,0 // movdqa 0x39f8(%rip),%xmm10 # 3ae0 <_sk_callback_sse41+0xfc>
+ .byte 102,68,15,111,21,248,57,0,0 // movdqa 0x39f8(%rip),%xmm10 # 3ae0 <_sk_callback_sse41+0x100>
.byte 102,69,15,111,216 // movdqa %xmm8,%xmm11
.byte 102,69,15,219,218 // pand %xmm10,%xmm11
.byte 102,65,15,114,243,5 // pslld $0x5,%xmm11
.byte 102,69,15,219,209 // pand %xmm9,%xmm10
.byte 102,65,15,114,242,4 // pslld $0x4,%xmm10
- .byte 102,68,15,111,37,228,57,0,0 // movdqa 0x39e4(%rip),%xmm12 # 3af0 <_sk_callback_sse41+0x10c>
- .byte 102,68,15,111,45,235,57,0,0 // movdqa 0x39eb(%rip),%xmm13 # 3b00 <_sk_callback_sse41+0x11c>
+ .byte 102,68,15,111,37,228,57,0,0 // movdqa 0x39e4(%rip),%xmm12 # 3af0 <_sk_callback_sse41+0x110>
+ .byte 102,68,15,111,45,235,57,0,0 // movdqa 0x39eb(%rip),%xmm13 # 3b00 <_sk_callback_sse41+0x120>
.byte 102,69,15,111,240 // movdqa %xmm8,%xmm14
.byte 102,69,15,219,245 // pand %xmm13,%xmm14
.byte 102,65,15,114,246,2 // pslld $0x2,%xmm14
@@ -17906,12 +17901,11 @@ _sk_dither_sse41:
.byte 102,69,15,235,245 // por %xmm13,%xmm14
.byte 102,69,15,235,240 // por %xmm8,%xmm14
.byte 69,15,91,198 // cvtdq2ps %xmm14,%xmm8
- .byte 68,15,89,5,166,57,0,0 // mulps 0x39a6(%rip),%xmm8 # 3b10 <_sk_callback_sse41+0x12c>
- .byte 68,15,88,5,174,57,0,0 // addps 0x39ae(%rip),%xmm8 # 3b20 <_sk_callback_sse41+0x13c>
+ .byte 68,15,89,5,166,57,0,0 // mulps 0x39a6(%rip),%xmm8 # 3b10 <_sk_callback_sse41+0x130>
+ .byte 68,15,88,5,174,57,0,0 // addps 0x39ae(%rip),%xmm8 # 3b20 <_sk_callback_sse41+0x140>
.byte 243,68,15,16,72,8 // movss 0x8(%rax),%xmm9
.byte 69,15,198,201,0 // shufps $0x0,%xmm9,%xmm9
.byte 69,15,89,200 // mulps %xmm8,%xmm9
- .byte 68,15,89,203 // mulps %xmm3,%xmm9
.byte 65,15,88,193 // addps %xmm9,%xmm0
.byte 65,15,88,201 // addps %xmm9,%xmm1
.byte 65,15,88,209 // addps %xmm9,%xmm2
@@ -17950,7 +17944,7 @@ HIDDEN _sk_srcatop_sse41
FUNCTION(_sk_srcatop_sse41)
_sk_srcatop_sse41:
.byte 15,89,199 // mulps %xmm7,%xmm0
- .byte 68,15,40,5,87,57,0,0 // movaps 0x3957(%rip),%xmm8 # 3b30 <_sk_callback_sse41+0x14c>
+ .byte 68,15,40,5,91,57,0,0 // movaps 0x395b(%rip),%xmm8 # 3b30 <_sk_callback_sse41+0x150>
.byte 68,15,92,195 // subps %xmm3,%xmm8
.byte 69,15,40,200 // movaps %xmm8,%xmm9
.byte 68,15,89,204 // mulps %xmm4,%xmm9
@@ -17975,7 +17969,7 @@ FUNCTION(_sk_dstatop_sse41)
_sk_dstatop_sse41:
.byte 68,15,40,195 // movaps %xmm3,%xmm8
.byte 68,15,89,196 // mulps %xmm4,%xmm8
- .byte 68,15,40,13,26,57,0,0 // movaps 0x391a(%rip),%xmm9 # 3b40 <_sk_callback_sse41+0x15c>
+ .byte 68,15,40,13,30,57,0,0 // movaps 0x391e(%rip),%xmm9 # 3b40 <_sk_callback_sse41+0x160>
.byte 68,15,92,207 // subps %xmm7,%xmm9
.byte 65,15,89,193 // mulps %xmm9,%xmm0
.byte 65,15,88,192 // addps %xmm8,%xmm0
@@ -18022,7 +18016,7 @@ HIDDEN _sk_srcout_sse41
.globl _sk_srcout_sse41
FUNCTION(_sk_srcout_sse41)
_sk_srcout_sse41:
- .byte 68,15,40,5,190,56,0,0 // movaps 0x38be(%rip),%xmm8 # 3b50 <_sk_callback_sse41+0x16c>
+ .byte 68,15,40,5,194,56,0,0 // movaps 0x38c2(%rip),%xmm8 # 3b50 <_sk_callback_sse41+0x170>
.byte 68,15,92,199 // subps %xmm7,%xmm8
.byte 65,15,89,192 // mulps %xmm8,%xmm0
.byte 65,15,89,200 // mulps %xmm8,%xmm1
@@ -18035,7 +18029,7 @@ HIDDEN _sk_dstout_sse41
.globl _sk_dstout_sse41
FUNCTION(_sk_dstout_sse41)
_sk_dstout_sse41:
- .byte 68,15,40,5,174,56,0,0 // movaps 0x38ae(%rip),%xmm8 # 3b60 <_sk_callback_sse41+0x17c>
+ .byte 68,15,40,5,178,56,0,0 // movaps 0x38b2(%rip),%xmm8 # 3b60 <_sk_callback_sse41+0x180>
.byte 68,15,92,195 // subps %xmm3,%xmm8
.byte 65,15,40,192 // movaps %xmm8,%xmm0
.byte 15,89,196 // mulps %xmm4,%xmm0
@@ -18052,7 +18046,7 @@ HIDDEN _sk_srcover_sse41
.globl _sk_srcover_sse41
FUNCTION(_sk_srcover_sse41)
_sk_srcover_sse41:
- .byte 68,15,40,5,145,56,0,0 // movaps 0x3891(%rip),%xmm8 # 3b70 <_sk_callback_sse41+0x18c>
+ .byte 68,15,40,5,149,56,0,0 // movaps 0x3895(%rip),%xmm8 # 3b70 <_sk_callback_sse41+0x190>
.byte 68,15,92,195 // subps %xmm3,%xmm8
.byte 69,15,40,200 // movaps %xmm8,%xmm9
.byte 68,15,89,204 // mulps %xmm4,%xmm9
@@ -18072,7 +18066,7 @@ HIDDEN _sk_dstover_sse41
.globl _sk_dstover_sse41
FUNCTION(_sk_dstover_sse41)
_sk_dstover_sse41:
- .byte 68,15,40,5,101,56,0,0 // movaps 0x3865(%rip),%xmm8 # 3b80 <_sk_callback_sse41+0x19c>
+ .byte 68,15,40,5,105,56,0,0 // movaps 0x3869(%rip),%xmm8 # 3b80 <_sk_callback_sse41+0x1a0>
.byte 68,15,92,199 // subps %xmm7,%xmm8
.byte 65,15,89,192 // mulps %xmm8,%xmm0
.byte 15,88,196 // addps %xmm4,%xmm0
@@ -18100,7 +18094,7 @@ HIDDEN _sk_multiply_sse41
.globl _sk_multiply_sse41
FUNCTION(_sk_multiply_sse41)
_sk_multiply_sse41:
- .byte 68,15,40,5,57,56,0,0 // movaps 0x3839(%rip),%xmm8 # 3b90 <_sk_callback_sse41+0x1ac>
+ .byte 68,15,40,5,61,56,0,0 // movaps 0x383d(%rip),%xmm8 # 3b90 <_sk_callback_sse41+0x1b0>
.byte 69,15,40,200 // movaps %xmm8,%xmm9
.byte 68,15,92,207 // subps %xmm7,%xmm9
.byte 69,15,40,209 // movaps %xmm9,%xmm10
@@ -18176,7 +18170,7 @@ HIDDEN _sk_xor__sse41
FUNCTION(_sk_xor__sse41)
_sk_xor__sse41:
.byte 68,15,40,195 // movaps %xmm3,%xmm8
- .byte 15,40,29,106,55,0,0 // movaps 0x376a(%rip),%xmm3 # 3ba0 <_sk_callback_sse41+0x1bc>
+ .byte 15,40,29,110,55,0,0 // movaps 0x376e(%rip),%xmm3 # 3ba0 <_sk_callback_sse41+0x1c0>
.byte 68,15,40,203 // movaps %xmm3,%xmm9
.byte 68,15,92,207 // subps %xmm7,%xmm9
.byte 65,15,89,193 // mulps %xmm9,%xmm0
@@ -18224,7 +18218,7 @@ _sk_darken_sse41:
.byte 68,15,89,206 // mulps %xmm6,%xmm9
.byte 65,15,95,209 // maxps %xmm9,%xmm2
.byte 68,15,92,194 // subps %xmm2,%xmm8
- .byte 15,40,21,213,54,0,0 // movaps 0x36d5(%rip),%xmm2 # 3bb0 <_sk_callback_sse41+0x1cc>
+ .byte 15,40,21,217,54,0,0 // movaps 0x36d9(%rip),%xmm2 # 3bb0 <_sk_callback_sse41+0x1d0>
.byte 15,92,211 // subps %xmm3,%xmm2
.byte 15,89,215 // mulps %xmm7,%xmm2
.byte 15,88,218 // addps %xmm2,%xmm3
@@ -18258,7 +18252,7 @@ _sk_lighten_sse41:
.byte 68,15,89,206 // mulps %xmm6,%xmm9
.byte 65,15,93,209 // minps %xmm9,%xmm2
.byte 68,15,92,194 // subps %xmm2,%xmm8
- .byte 15,40,21,122,54,0,0 // movaps 0x367a(%rip),%xmm2 # 3bc0 <_sk_callback_sse41+0x1dc>
+ .byte 15,40,21,126,54,0,0 // movaps 0x367e(%rip),%xmm2 # 3bc0 <_sk_callback_sse41+0x1e0>
.byte 15,92,211 // subps %xmm3,%xmm2
.byte 15,89,215 // mulps %xmm7,%xmm2
.byte 15,88,218 // addps %xmm2,%xmm3
@@ -18295,7 +18289,7 @@ _sk_difference_sse41:
.byte 65,15,93,209 // minps %xmm9,%xmm2
.byte 15,88,210 // addps %xmm2,%xmm2
.byte 68,15,92,194 // subps %xmm2,%xmm8
- .byte 15,40,21,20,54,0,0 // movaps 0x3614(%rip),%xmm2 # 3bd0 <_sk_callback_sse41+0x1ec>
+ .byte 15,40,21,24,54,0,0 // movaps 0x3618(%rip),%xmm2 # 3bd0 <_sk_callback_sse41+0x1f0>
.byte 15,92,211 // subps %xmm3,%xmm2
.byte 15,89,215 // mulps %xmm7,%xmm2
.byte 15,88,218 // addps %xmm2,%xmm3
@@ -18322,7 +18316,7 @@ _sk_exclusion_sse41:
.byte 15,89,214 // mulps %xmm6,%xmm2
.byte 15,88,210 // addps %xmm2,%xmm2
.byte 68,15,92,202 // subps %xmm2,%xmm9
- .byte 15,40,13,213,53,0,0 // movaps 0x35d5(%rip),%xmm1 # 3be0 <_sk_callback_sse41+0x1fc>
+ .byte 15,40,13,217,53,0,0 // movaps 0x35d9(%rip),%xmm1 # 3be0 <_sk_callback_sse41+0x200>
.byte 15,92,203 // subps %xmm3,%xmm1
.byte 15,89,207 // mulps %xmm7,%xmm1
.byte 15,88,217 // addps %xmm1,%xmm3
@@ -18336,7 +18330,7 @@ HIDDEN _sk_colorburn_sse41
FUNCTION(_sk_colorburn_sse41)
_sk_colorburn_sse41:
.byte 68,15,40,192 // movaps %xmm0,%xmm8
- .byte 68,15,40,21,196,53,0,0 // movaps 0x35c4(%rip),%xmm10 # 3bf0 <_sk_callback_sse41+0x20c>
+ .byte 68,15,40,21,200,53,0,0 // movaps 0x35c8(%rip),%xmm10 # 3bf0 <_sk_callback_sse41+0x210>
.byte 69,15,40,218 // movaps %xmm10,%xmm11
.byte 68,15,92,223 // subps %xmm7,%xmm11
.byte 69,15,40,203 // movaps %xmm11,%xmm9
@@ -18418,7 +18412,7 @@ HIDDEN _sk_colordodge_sse41
FUNCTION(_sk_colordodge_sse41)
_sk_colordodge_sse41:
.byte 68,15,40,192 // movaps %xmm0,%xmm8
- .byte 68,15,40,21,162,52,0,0 // movaps 0x34a2(%rip),%xmm10 # 3c00 <_sk_callback_sse41+0x21c>
+ .byte 68,15,40,21,166,52,0,0 // movaps 0x34a6(%rip),%xmm10 # 3c00 <_sk_callback_sse41+0x220>
.byte 69,15,40,218 // movaps %xmm10,%xmm11
.byte 68,15,92,223 // subps %xmm7,%xmm11
.byte 69,15,40,227 // movaps %xmm11,%xmm12
@@ -18500,7 +18494,7 @@ _sk_hardlight_sse41:
.byte 15,40,244 // movaps %xmm4,%xmm6
.byte 15,40,227 // movaps %xmm3,%xmm4
.byte 68,15,40,200 // movaps %xmm0,%xmm9
- .byte 68,15,40,21,123,51,0,0 // movaps 0x337b(%rip),%xmm10 # 3c10 <_sk_callback_sse41+0x22c>
+ .byte 68,15,40,21,127,51,0,0 // movaps 0x337f(%rip),%xmm10 # 3c10 <_sk_callback_sse41+0x230>
.byte 65,15,40,234 // movaps %xmm10,%xmm5
.byte 15,92,239 // subps %xmm7,%xmm5
.byte 15,40,197 // movaps %xmm5,%xmm0
@@ -18583,7 +18577,7 @@ FUNCTION(_sk_overlay_sse41)
_sk_overlay_sse41:
.byte 68,15,40,201 // movaps %xmm1,%xmm9
.byte 68,15,40,240 // movaps %xmm0,%xmm14
- .byte 68,15,40,21,96,50,0,0 // movaps 0x3260(%rip),%xmm10 # 3c20 <_sk_callback_sse41+0x23c>
+ .byte 68,15,40,21,100,50,0,0 // movaps 0x3264(%rip),%xmm10 # 3c20 <_sk_callback_sse41+0x240>
.byte 69,15,40,218 // movaps %xmm10,%xmm11
.byte 68,15,92,223 // subps %xmm7,%xmm11
.byte 65,15,40,195 // movaps %xmm11,%xmm0
@@ -18668,7 +18662,7 @@ _sk_softlight_sse41:
.byte 15,40,198 // movaps %xmm6,%xmm0
.byte 15,94,199 // divps %xmm7,%xmm0
.byte 65,15,84,193 // andps %xmm9,%xmm0
- .byte 15,40,13,55,49,0,0 // movaps 0x3137(%rip),%xmm1 # 3c30 <_sk_callback_sse41+0x24c>
+ .byte 15,40,13,59,49,0,0 // movaps 0x313b(%rip),%xmm1 # 3c30 <_sk_callback_sse41+0x250>
.byte 68,15,40,209 // movaps %xmm1,%xmm10
.byte 68,15,92,208 // subps %xmm0,%xmm10
.byte 68,15,40,240 // movaps %xmm0,%xmm14
@@ -18681,10 +18675,10 @@ _sk_softlight_sse41:
.byte 15,40,208 // movaps %xmm0,%xmm2
.byte 15,89,210 // mulps %xmm2,%xmm2
.byte 15,88,208 // addps %xmm0,%xmm2
- .byte 68,15,40,45,21,49,0,0 // movaps 0x3115(%rip),%xmm13 # 3c40 <_sk_callback_sse41+0x25c>
+ .byte 68,15,40,45,25,49,0,0 // movaps 0x3119(%rip),%xmm13 # 3c40 <_sk_callback_sse41+0x260>
.byte 69,15,88,245 // addps %xmm13,%xmm14
.byte 68,15,89,242 // mulps %xmm2,%xmm14
- .byte 68,15,40,37,21,49,0,0 // movaps 0x3115(%rip),%xmm12 # 3c50 <_sk_callback_sse41+0x26c>
+ .byte 68,15,40,37,25,49,0,0 // movaps 0x3119(%rip),%xmm12 # 3c50 <_sk_callback_sse41+0x270>
.byte 69,15,89,252 // mulps %xmm12,%xmm15
.byte 69,15,88,254 // addps %xmm14,%xmm15
.byte 15,40,198 // movaps %xmm6,%xmm0
@@ -18832,7 +18826,7 @@ HIDDEN _sk_clamp_1_sse41
.globl _sk_clamp_1_sse41
FUNCTION(_sk_clamp_1_sse41)
_sk_clamp_1_sse41:
- .byte 68,15,40,5,39,47,0,0 // movaps 0x2f27(%rip),%xmm8 # 3c60 <_sk_callback_sse41+0x27c>
+ .byte 68,15,40,5,43,47,0,0 // movaps 0x2f2b(%rip),%xmm8 # 3c60 <_sk_callback_sse41+0x280>
.byte 65,15,93,192 // minps %xmm8,%xmm0
.byte 65,15,93,200 // minps %xmm8,%xmm1
.byte 65,15,93,208 // minps %xmm8,%xmm2
@@ -18844,7 +18838,7 @@ HIDDEN _sk_clamp_a_sse41
.globl _sk_clamp_a_sse41
FUNCTION(_sk_clamp_a_sse41)
_sk_clamp_a_sse41:
- .byte 15,93,29,28,47,0,0 // minps 0x2f1c(%rip),%xmm3 # 3c70 <_sk_callback_sse41+0x28c>
+ .byte 15,93,29,32,47,0,0 // minps 0x2f20(%rip),%xmm3 # 3c70 <_sk_callback_sse41+0x290>
.byte 15,93,195 // minps %xmm3,%xmm0
.byte 15,93,203 // minps %xmm3,%xmm1
.byte 15,93,211 // minps %xmm3,%xmm2
@@ -18931,7 +18925,7 @@ HIDDEN _sk_unpremul_sse41
FUNCTION(_sk_unpremul_sse41)
_sk_unpremul_sse41:
.byte 69,15,87,192 // xorps %xmm8,%xmm8
- .byte 68,15,40,13,135,46,0,0 // movaps 0x2e87(%rip),%xmm9 # 3c80 <_sk_callback_sse41+0x29c>
+ .byte 68,15,40,13,139,46,0,0 // movaps 0x2e8b(%rip),%xmm9 # 3c80 <_sk_callback_sse41+0x2a0>
.byte 68,15,94,203 // divps %xmm3,%xmm9
.byte 68,15,194,195,4 // cmpneqps %xmm3,%xmm8
.byte 69,15,84,193 // andps %xmm9,%xmm8
@@ -18945,20 +18939,20 @@ HIDDEN _sk_from_srgb_sse41
.globl _sk_from_srgb_sse41
FUNCTION(_sk_from_srgb_sse41)
_sk_from_srgb_sse41:
- .byte 68,15,40,29,114,46,0,0 // movaps 0x2e72(%rip),%xmm11 # 3c90 <_sk_callback_sse41+0x2ac>
+ .byte 68,15,40,29,118,46,0,0 // movaps 0x2e76(%rip),%xmm11 # 3c90 <_sk_callback_sse41+0x2b0>
.byte 68,15,40,200 // movaps %xmm0,%xmm9
.byte 69,15,89,203 // mulps %xmm11,%xmm9
.byte 68,15,40,208 // movaps %xmm0,%xmm10
.byte 69,15,89,210 // mulps %xmm10,%xmm10
- .byte 68,15,40,37,106,46,0,0 // movaps 0x2e6a(%rip),%xmm12 # 3ca0 <_sk_callback_sse41+0x2bc>
+ .byte 68,15,40,37,110,46,0,0 // movaps 0x2e6e(%rip),%xmm12 # 3ca0 <_sk_callback_sse41+0x2c0>
.byte 68,15,40,192 // movaps %xmm0,%xmm8
.byte 69,15,89,196 // mulps %xmm12,%xmm8
- .byte 68,15,40,45,106,46,0,0 // movaps 0x2e6a(%rip),%xmm13 # 3cb0 <_sk_callback_sse41+0x2cc>
+ .byte 68,15,40,45,110,46,0,0 // movaps 0x2e6e(%rip),%xmm13 # 3cb0 <_sk_callback_sse41+0x2d0>
.byte 69,15,88,197 // addps %xmm13,%xmm8
.byte 69,15,89,194 // mulps %xmm10,%xmm8
- .byte 68,15,40,53,106,46,0,0 // movaps 0x2e6a(%rip),%xmm14 # 3cc0 <_sk_callback_sse41+0x2dc>
+ .byte 68,15,40,53,110,46,0,0 // movaps 0x2e6e(%rip),%xmm14 # 3cc0 <_sk_callback_sse41+0x2e0>
.byte 69,15,88,198 // addps %xmm14,%xmm8
- .byte 68,15,40,61,110,46,0,0 // movaps 0x2e6e(%rip),%xmm15 # 3cd0 <_sk_callback_sse41+0x2ec>
+ .byte 68,15,40,61,114,46,0,0 // movaps 0x2e72(%rip),%xmm15 # 3cd0 <_sk_callback_sse41+0x2f0>
.byte 65,15,194,199,1 // cmpltps %xmm15,%xmm0
.byte 102,69,15,56,20,193 // blendvps %xmm0,%xmm9,%xmm8
.byte 68,15,40,209 // movaps %xmm1,%xmm10
@@ -19003,20 +18997,20 @@ _sk_to_srgb_sse41:
.byte 68,15,82,192 // rsqrtps %xmm0,%xmm8
.byte 69,15,83,200 // rcpps %xmm8,%xmm9
.byte 69,15,82,208 // rsqrtps %xmm8,%xmm10
- .byte 68,15,40,29,222,45,0,0 // movaps 0x2dde(%rip),%xmm11 # 3ce0 <_sk_callback_sse41+0x2fc>
+ .byte 68,15,40,29,226,45,0,0 // movaps 0x2de2(%rip),%xmm11 # 3ce0 <_sk_callback_sse41+0x300>
.byte 15,40,200 // movaps %xmm0,%xmm1
.byte 65,15,89,203 // mulps %xmm11,%xmm1
- .byte 68,15,40,37,223,45,0,0 // movaps 0x2ddf(%rip),%xmm12 # 3cf0 <_sk_callback_sse41+0x30c>
+ .byte 68,15,40,37,227,45,0,0 // movaps 0x2de3(%rip),%xmm12 # 3cf0 <_sk_callback_sse41+0x310>
.byte 69,15,89,204 // mulps %xmm12,%xmm9
- .byte 68,15,40,45,227,45,0,0 // movaps 0x2de3(%rip),%xmm13 # 3d00 <_sk_callback_sse41+0x31c>
+ .byte 68,15,40,45,231,45,0,0 // movaps 0x2de7(%rip),%xmm13 # 3d00 <_sk_callback_sse41+0x320>
.byte 69,15,88,205 // addps %xmm13,%xmm9
- .byte 68,15,40,53,231,45,0,0 // movaps 0x2de7(%rip),%xmm14 # 3d10 <_sk_callback_sse41+0x32c>
+ .byte 68,15,40,53,235,45,0,0 // movaps 0x2deb(%rip),%xmm14 # 3d10 <_sk_callback_sse41+0x330>
.byte 69,15,89,214 // mulps %xmm14,%xmm10
.byte 69,15,88,209 // addps %xmm9,%xmm10
- .byte 68,15,40,5,231,45,0,0 // movaps 0x2de7(%rip),%xmm8 # 3d20 <_sk_callback_sse41+0x33c>
+ .byte 68,15,40,5,235,45,0,0 // movaps 0x2deb(%rip),%xmm8 # 3d20 <_sk_callback_sse41+0x340>
.byte 69,15,40,200 // movaps %xmm8,%xmm9
.byte 69,15,93,202 // minps %xmm10,%xmm9
- .byte 68,15,40,61,231,45,0,0 // movaps 0x2de7(%rip),%xmm15 # 3d30 <_sk_callback_sse41+0x34c>
+ .byte 68,15,40,61,235,45,0,0 // movaps 0x2deb(%rip),%xmm15 # 3d30 <_sk_callback_sse41+0x350>
.byte 65,15,194,199,1 // cmpltps %xmm15,%xmm0
.byte 102,68,15,56,20,201 // blendvps %xmm0,%xmm1,%xmm9
.byte 15,82,194 // rsqrtps %xmm2,%xmm0
@@ -19070,7 +19064,7 @@ _sk_rgb_to_hsl_sse41:
.byte 68,15,93,226 // minps %xmm2,%xmm12
.byte 65,15,40,203 // movaps %xmm11,%xmm1
.byte 65,15,92,204 // subps %xmm12,%xmm1
- .byte 68,15,40,53,56,45,0,0 // movaps 0x2d38(%rip),%xmm14 # 3d40 <_sk_callback_sse41+0x35c>
+ .byte 68,15,40,53,60,45,0,0 // movaps 0x2d3c(%rip),%xmm14 # 3d40 <_sk_callback_sse41+0x360>
.byte 68,15,94,241 // divps %xmm1,%xmm14
.byte 69,15,40,211 // movaps %xmm11,%xmm10
.byte 69,15,194,208,0 // cmpeqps %xmm8,%xmm10
@@ -19079,27 +19073,27 @@ _sk_rgb_to_hsl_sse41:
.byte 65,15,89,198 // mulps %xmm14,%xmm0
.byte 69,15,40,249 // movaps %xmm9,%xmm15
.byte 68,15,194,250,1 // cmpltps %xmm2,%xmm15
- .byte 68,15,84,61,31,45,0,0 // andps 0x2d1f(%rip),%xmm15 # 3d50 <_sk_callback_sse41+0x36c>
+ .byte 68,15,84,61,35,45,0,0 // andps 0x2d23(%rip),%xmm15 # 3d50 <_sk_callback_sse41+0x370>
.byte 68,15,88,248 // addps %xmm0,%xmm15
.byte 65,15,40,195 // movaps %xmm11,%xmm0
.byte 65,15,194,193,0 // cmpeqps %xmm9,%xmm0
.byte 65,15,92,208 // subps %xmm8,%xmm2
.byte 65,15,89,214 // mulps %xmm14,%xmm2
- .byte 68,15,40,45,18,45,0,0 // movaps 0x2d12(%rip),%xmm13 # 3d60 <_sk_callback_sse41+0x37c>
+ .byte 68,15,40,45,22,45,0,0 // movaps 0x2d16(%rip),%xmm13 # 3d60 <_sk_callback_sse41+0x380>
.byte 65,15,88,213 // addps %xmm13,%xmm2
.byte 69,15,92,193 // subps %xmm9,%xmm8
.byte 69,15,89,198 // mulps %xmm14,%xmm8
- .byte 68,15,88,5,14,45,0,0 // addps 0x2d0e(%rip),%xmm8 # 3d70 <_sk_callback_sse41+0x38c>
+ .byte 68,15,88,5,18,45,0,0 // addps 0x2d12(%rip),%xmm8 # 3d70 <_sk_callback_sse41+0x390>
.byte 102,68,15,56,20,194 // blendvps %xmm0,%xmm2,%xmm8
.byte 65,15,40,194 // movaps %xmm10,%xmm0
.byte 102,69,15,56,20,199 // blendvps %xmm0,%xmm15,%xmm8
- .byte 68,15,89,5,6,45,0,0 // mulps 0x2d06(%rip),%xmm8 # 3d80 <_sk_callback_sse41+0x39c>
+ .byte 68,15,89,5,10,45,0,0 // mulps 0x2d0a(%rip),%xmm8 # 3d80 <_sk_callback_sse41+0x3a0>
.byte 69,15,40,203 // movaps %xmm11,%xmm9
.byte 69,15,194,204,4 // cmpneqps %xmm12,%xmm9
.byte 69,15,84,193 // andps %xmm9,%xmm8
.byte 69,15,92,235 // subps %xmm11,%xmm13
.byte 69,15,88,220 // addps %xmm12,%xmm11
- .byte 15,40,5,250,44,0,0 // movaps 0x2cfa(%rip),%xmm0 # 3d90 <_sk_callback_sse41+0x3ac>
+ .byte 15,40,5,254,44,0,0 // movaps 0x2cfe(%rip),%xmm0 # 3d90 <_sk_callback_sse41+0x3b0>
.byte 65,15,40,211 // movaps %xmm11,%xmm2
.byte 15,89,208 // mulps %xmm0,%xmm2
.byte 15,194,194,1 // cmpltps %xmm2,%xmm0
@@ -19121,7 +19115,7 @@ _sk_hsl_to_rgb_sse41:
.byte 15,41,100,36,184 // movaps %xmm4,-0x48(%rsp)
.byte 15,41,92,36,168 // movaps %xmm3,-0x58(%rsp)
.byte 68,15,40,208 // movaps %xmm0,%xmm10
- .byte 68,15,40,13,192,44,0,0 // movaps 0x2cc0(%rip),%xmm9 # 3da0 <_sk_callback_sse41+0x3bc>
+ .byte 68,15,40,13,196,44,0,0 // movaps 0x2cc4(%rip),%xmm9 # 3da0 <_sk_callback_sse41+0x3c0>
.byte 65,15,40,193 // movaps %xmm9,%xmm0
.byte 15,194,194,2 // cmpleps %xmm2,%xmm0
.byte 15,40,217 // movaps %xmm1,%xmm3
@@ -19134,19 +19128,19 @@ _sk_hsl_to_rgb_sse41:
.byte 15,41,84,36,152 // movaps %xmm2,-0x68(%rsp)
.byte 69,15,88,192 // addps %xmm8,%xmm8
.byte 68,15,92,197 // subps %xmm5,%xmm8
- .byte 68,15,40,53,155,44,0,0 // movaps 0x2c9b(%rip),%xmm14 # 3db0 <_sk_callback_sse41+0x3cc>
+ .byte 68,15,40,53,159,44,0,0 // movaps 0x2c9f(%rip),%xmm14 # 3db0 <_sk_callback_sse41+0x3d0>
.byte 69,15,88,242 // addps %xmm10,%xmm14
.byte 102,65,15,58,8,198,1 // roundps $0x1,%xmm14,%xmm0
.byte 68,15,92,240 // subps %xmm0,%xmm14
- .byte 68,15,40,29,148,44,0,0 // movaps 0x2c94(%rip),%xmm11 # 3dc0 <_sk_callback_sse41+0x3dc>
+ .byte 68,15,40,29,152,44,0,0 // movaps 0x2c98(%rip),%xmm11 # 3dc0 <_sk_callback_sse41+0x3e0>
.byte 65,15,40,195 // movaps %xmm11,%xmm0
.byte 65,15,194,198,2 // cmpleps %xmm14,%xmm0
.byte 15,40,245 // movaps %xmm5,%xmm6
.byte 65,15,92,240 // subps %xmm8,%xmm6
- .byte 15,40,61,141,44,0,0 // movaps 0x2c8d(%rip),%xmm7 # 3dd0 <_sk_callback_sse41+0x3ec>
+ .byte 15,40,61,145,44,0,0 // movaps 0x2c91(%rip),%xmm7 # 3dd0 <_sk_callback_sse41+0x3f0>
.byte 69,15,40,238 // movaps %xmm14,%xmm13
.byte 68,15,89,239 // mulps %xmm7,%xmm13
- .byte 15,40,29,142,44,0,0 // movaps 0x2c8e(%rip),%xmm3 # 3de0 <_sk_callback_sse41+0x3fc>
+ .byte 15,40,29,146,44,0,0 // movaps 0x2c92(%rip),%xmm3 # 3de0 <_sk_callback_sse41+0x400>
.byte 68,15,40,227 // movaps %xmm3,%xmm12
.byte 69,15,92,229 // subps %xmm13,%xmm12
.byte 68,15,89,230 // mulps %xmm6,%xmm12
@@ -19156,7 +19150,7 @@ _sk_hsl_to_rgb_sse41:
.byte 65,15,194,198,2 // cmpleps %xmm14,%xmm0
.byte 68,15,40,253 // movaps %xmm5,%xmm15
.byte 102,69,15,56,20,252 // blendvps %xmm0,%xmm12,%xmm15
- .byte 68,15,40,37,109,44,0,0 // movaps 0x2c6d(%rip),%xmm12 # 3df0 <_sk_callback_sse41+0x40c>
+ .byte 68,15,40,37,113,44,0,0 // movaps 0x2c71(%rip),%xmm12 # 3df0 <_sk_callback_sse41+0x410>
.byte 65,15,40,196 // movaps %xmm12,%xmm0
.byte 65,15,194,198,2 // cmpleps %xmm14,%xmm0
.byte 68,15,89,238 // mulps %xmm6,%xmm13
@@ -19190,7 +19184,7 @@ _sk_hsl_to_rgb_sse41:
.byte 65,15,40,198 // movaps %xmm14,%xmm0
.byte 15,40,84,36,152 // movaps -0x68(%rsp),%xmm2
.byte 102,15,56,20,202 // blendvps %xmm0,%xmm2,%xmm1
- .byte 68,15,88,21,229,43,0,0 // addps 0x2be5(%rip),%xmm10 # 3e00 <_sk_callback_sse41+0x41c>
+ .byte 68,15,88,21,233,43,0,0 // addps 0x2be9(%rip),%xmm10 # 3e00 <_sk_callback_sse41+0x420>
.byte 102,65,15,58,8,194,1 // roundps $0x1,%xmm10,%xmm0
.byte 68,15,92,208 // subps %xmm0,%xmm10
.byte 69,15,194,218,2 // cmpleps %xmm10,%xmm11
@@ -19242,7 +19236,7 @@ _sk_scale_u8_sse41:
.byte 72,139,0 // mov (%rax),%rax
.byte 102,68,15,56,49,4,56 // pmovzxbd (%rax,%rdi,1),%xmm8
.byte 69,15,91,192 // cvtdq2ps %xmm8,%xmm8
- .byte 68,15,89,5,66,43,0,0 // mulps 0x2b42(%rip),%xmm8 # 3e10 <_sk_callback_sse41+0x42c>
+ .byte 68,15,89,5,70,43,0,0 // mulps 0x2b46(%rip),%xmm8 # 3e10 <_sk_callback_sse41+0x430>
.byte 65,15,89,192 // mulps %xmm8,%xmm0
.byte 65,15,89,200 // mulps %xmm8,%xmm1
.byte 65,15,89,208 // mulps %xmm8,%xmm2
@@ -19280,7 +19274,7 @@ _sk_lerp_u8_sse41:
.byte 72,139,0 // mov (%rax),%rax
.byte 102,68,15,56,49,4,56 // pmovzxbd (%rax,%rdi,1),%xmm8
.byte 69,15,91,192 // cvtdq2ps %xmm8,%xmm8
- .byte 68,15,89,5,238,42,0,0 // mulps 0x2aee(%rip),%xmm8 # 3e20 <_sk_callback_sse41+0x43c>
+ .byte 68,15,89,5,242,42,0,0 // mulps 0x2af2(%rip),%xmm8 # 3e20 <_sk_callback_sse41+0x440>
.byte 15,92,196 // subps %xmm4,%xmm0
.byte 65,15,89,192 // mulps %xmm8,%xmm0
.byte 15,88,196 // addps %xmm4,%xmm0
@@ -19303,17 +19297,17 @@ _sk_lerp_565_sse41:
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 72,139,0 // mov (%rax),%rax
.byte 102,68,15,56,51,4,120 // pmovzxwd (%rax,%rdi,2),%xmm8
- .byte 102,15,111,29,190,42,0,0 // movdqa 0x2abe(%rip),%xmm3 # 3e30 <_sk_callback_sse41+0x44c>
+ .byte 102,15,111,29,194,42,0,0 // movdqa 0x2ac2(%rip),%xmm3 # 3e30 <_sk_callback_sse41+0x450>
.byte 102,65,15,219,216 // pand %xmm8,%xmm3
.byte 68,15,91,203 // cvtdq2ps %xmm3,%xmm9
- .byte 68,15,89,13,189,42,0,0 // mulps 0x2abd(%rip),%xmm9 # 3e40 <_sk_callback_sse41+0x45c>
- .byte 102,15,111,29,197,42,0,0 // movdqa 0x2ac5(%rip),%xmm3 # 3e50 <_sk_callback_sse41+0x46c>
+ .byte 68,15,89,13,193,42,0,0 // mulps 0x2ac1(%rip),%xmm9 # 3e40 <_sk_callback_sse41+0x460>
+ .byte 102,15,111,29,201,42,0,0 // movdqa 0x2ac9(%rip),%xmm3 # 3e50 <_sk_callback_sse41+0x470>
.byte 102,65,15,219,216 // pand %xmm8,%xmm3
.byte 15,91,219 // cvtdq2ps %xmm3,%xmm3
- .byte 15,89,29,198,42,0,0 // mulps 0x2ac6(%rip),%xmm3 # 3e60 <_sk_callback_sse41+0x47c>
- .byte 102,68,15,219,5,205,42,0,0 // pand 0x2acd(%rip),%xmm8 # 3e70 <_sk_callback_sse41+0x48c>
+ .byte 15,89,29,202,42,0,0 // mulps 0x2aca(%rip),%xmm3 # 3e60 <_sk_callback_sse41+0x480>
+ .byte 102,68,15,219,5,209,42,0,0 // pand 0x2ad1(%rip),%xmm8 # 3e70 <_sk_callback_sse41+0x490>
.byte 69,15,91,192 // cvtdq2ps %xmm8,%xmm8
- .byte 68,15,89,5,209,42,0,0 // mulps 0x2ad1(%rip),%xmm8 # 3e80 <_sk_callback_sse41+0x49c>
+ .byte 68,15,89,5,213,42,0,0 // mulps 0x2ad5(%rip),%xmm8 # 3e80 <_sk_callback_sse41+0x4a0>
.byte 15,92,196 // subps %xmm4,%xmm0
.byte 65,15,89,193 // mulps %xmm9,%xmm0
.byte 15,88,196 // addps %xmm4,%xmm0
@@ -19324,7 +19318,7 @@ _sk_lerp_565_sse41:
.byte 65,15,89,208 // mulps %xmm8,%xmm2
.byte 15,88,214 // addps %xmm6,%xmm2
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 15,40,29,187,42,0,0 // movaps 0x2abb(%rip),%xmm3 # 3e90 <_sk_callback_sse41+0x4ac>
+ .byte 15,40,29,191,42,0,0 // movaps 0x2abf(%rip),%xmm3 # 3e90 <_sk_callback_sse41+0x4b0>
.byte 255,224 // jmpq *%rax
HIDDEN _sk_load_tables_sse41
@@ -19335,7 +19329,7 @@ _sk_load_tables_sse41:
.byte 76,139,0 // mov (%rax),%r8
.byte 76,139,72,8 // mov 0x8(%rax),%r9
.byte 243,69,15,111,4,184 // movdqu (%r8,%rdi,4),%xmm8
- .byte 102,15,111,5,178,42,0,0 // movdqa 0x2ab2(%rip),%xmm0 # 3ea0 <_sk_callback_sse41+0x4bc>
+ .byte 102,15,111,5,182,42,0,0 // movdqa 0x2ab6(%rip),%xmm0 # 3ea0 <_sk_callback_sse41+0x4c0>
.byte 102,65,15,219,192 // pand %xmm8,%xmm0
.byte 102,73,15,58,22,192,1 // pextrq $0x1,%xmm0,%r8
.byte 102,72,15,126,193 // movq %xmm0,%rcx
@@ -19350,7 +19344,7 @@ _sk_load_tables_sse41:
.byte 102,15,58,33,193,48 // insertps $0x30,%xmm1,%xmm0
.byte 76,139,64,16 // mov 0x10(%rax),%r8
.byte 102,65,15,111,200 // movdqa %xmm8,%xmm1
- .byte 102,15,56,0,13,109,42,0,0 // pshufb 0x2a6d(%rip),%xmm1 # 3eb0 <_sk_callback_sse41+0x4cc>
+ .byte 102,15,56,0,13,113,42,0,0 // pshufb 0x2a71(%rip),%xmm1 # 3eb0 <_sk_callback_sse41+0x4d0>
.byte 102,73,15,58,22,201,1 // pextrq $0x1,%xmm1,%r9
.byte 102,72,15,126,201 // movq %xmm1,%rcx
.byte 68,15,182,209 // movzbl %cl,%r10d
@@ -19365,7 +19359,7 @@ _sk_load_tables_sse41:
.byte 102,15,58,33,202,48 // insertps $0x30,%xmm2,%xmm1
.byte 76,139,64,24 // mov 0x18(%rax),%r8
.byte 102,65,15,111,208 // movdqa %xmm8,%xmm2
- .byte 102,15,56,0,21,41,42,0,0 // pshufb 0x2a29(%rip),%xmm2 # 3ec0 <_sk_callback_sse41+0x4dc>
+ .byte 102,15,56,0,21,45,42,0,0 // pshufb 0x2a2d(%rip),%xmm2 # 3ec0 <_sk_callback_sse41+0x4e0>
.byte 102,72,15,58,22,209,1 // pextrq $0x1,%xmm2,%rcx
.byte 102,72,15,126,208 // movq %xmm2,%rax
.byte 68,15,182,200 // movzbl %al,%r9d
@@ -19380,7 +19374,7 @@ _sk_load_tables_sse41:
.byte 102,15,58,33,211,48 // insertps $0x30,%xmm3,%xmm2
.byte 102,65,15,114,208,24 // psrld $0x18,%xmm8
.byte 65,15,91,216 // cvtdq2ps %xmm8,%xmm3
- .byte 15,89,29,230,41,0,0 // mulps 0x29e6(%rip),%xmm3 # 3ed0 <_sk_callback_sse41+0x4ec>
+ .byte 15,89,29,234,41,0,0 // mulps 0x29ea(%rip),%xmm3 # 3ed0 <_sk_callback_sse41+0x4f0>
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 255,224 // jmpq *%rax
@@ -19399,7 +19393,7 @@ _sk_load_tables_u16_be_sse41:
.byte 102,65,15,111,201 // movdqa %xmm9,%xmm1
.byte 102,15,97,200 // punpcklwd %xmm0,%xmm1
.byte 102,68,15,105,200 // punpckhwd %xmm0,%xmm9
- .byte 102,68,15,111,5,185,41,0,0 // movdqa 0x29b9(%rip),%xmm8 # 3ee0 <_sk_callback_sse41+0x4fc>
+ .byte 102,68,15,111,5,189,41,0,0 // movdqa 0x29bd(%rip),%xmm8 # 3ee0 <_sk_callback_sse41+0x500>
.byte 102,15,111,193 // movdqa %xmm1,%xmm0
.byte 102,65,15,219,192 // pand %xmm8,%xmm0
.byte 102,15,56,51,192 // pmovzxwd %xmm0,%xmm0
@@ -19416,7 +19410,7 @@ _sk_load_tables_u16_be_sse41:
.byte 243,67,15,16,20,8 // movss (%r8,%r9,1),%xmm2
.byte 102,15,58,33,194,48 // insertps $0x30,%xmm2,%xmm0
.byte 76,139,64,16 // mov 0x10(%rax),%r8
- .byte 102,15,56,0,13,108,41,0,0 // pshufb 0x296c(%rip),%xmm1 # 3ef0 <_sk_callback_sse41+0x50c>
+ .byte 102,15,56,0,13,112,41,0,0 // pshufb 0x2970(%rip),%xmm1 # 3ef0 <_sk_callback_sse41+0x510>
.byte 102,15,56,51,201 // pmovzxwd %xmm1,%xmm1
.byte 102,73,15,58,22,201,1 // pextrq $0x1,%xmm1,%r9
.byte 102,72,15,126,201 // movq %xmm1,%rcx
@@ -19452,7 +19446,7 @@ _sk_load_tables_u16_be_sse41:
.byte 102,65,15,235,216 // por %xmm8,%xmm3
.byte 102,15,56,51,219 // pmovzxwd %xmm3,%xmm3
.byte 15,91,219 // cvtdq2ps %xmm3,%xmm3
- .byte 15,89,29,186,40,0,0 // mulps 0x28ba(%rip),%xmm3 # 3f00 <_sk_callback_sse41+0x51c>
+ .byte 15,89,29,190,40,0,0 // mulps 0x28be(%rip),%xmm3 # 3f00 <_sk_callback_sse41+0x520>
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 255,224 // jmpq *%rax
@@ -19474,7 +19468,7 @@ _sk_load_tables_rgb_u16_be_sse41:
.byte 102,68,15,97,200 // punpcklwd %xmm0,%xmm9
.byte 102,15,111,202 // movdqa %xmm2,%xmm1
.byte 102,65,15,97,201 // punpcklwd %xmm9,%xmm1
- .byte 102,68,15,111,5,124,40,0,0 // movdqa 0x287c(%rip),%xmm8 # 3f10 <_sk_callback_sse41+0x52c>
+ .byte 102,68,15,111,5,128,40,0,0 // movdqa 0x2880(%rip),%xmm8 # 3f10 <_sk_callback_sse41+0x530>
.byte 102,15,111,193 // movdqa %xmm1,%xmm0
.byte 102,65,15,219,192 // pand %xmm8,%xmm0
.byte 102,15,56,51,192 // pmovzxwd %xmm0,%xmm0
@@ -19491,7 +19485,7 @@ _sk_load_tables_rgb_u16_be_sse41:
.byte 243,67,15,16,28,8 // movss (%r8,%r9,1),%xmm3
.byte 102,15,58,33,195,48 // insertps $0x30,%xmm3,%xmm0
.byte 76,139,64,16 // mov 0x10(%rax),%r8
- .byte 102,15,56,0,13,47,40,0,0 // pshufb 0x282f(%rip),%xmm1 # 3f20 <_sk_callback_sse41+0x53c>
+ .byte 102,15,56,0,13,51,40,0,0 // pshufb 0x2833(%rip),%xmm1 # 3f20 <_sk_callback_sse41+0x540>
.byte 102,15,56,51,201 // pmovzxwd %xmm1,%xmm1
.byte 102,73,15,58,22,201,1 // pextrq $0x1,%xmm1,%r9
.byte 102,72,15,126,201 // movq %xmm1,%rcx
@@ -19522,7 +19516,7 @@ _sk_load_tables_rgb_u16_be_sse41:
.byte 243,65,15,16,28,8 // movss (%r8,%rcx,1),%xmm3
.byte 102,15,58,33,211,48 // insertps $0x30,%xmm3,%xmm2
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 15,40,29,154,39,0,0 // movaps 0x279a(%rip),%xmm3 # 3f30 <_sk_callback_sse41+0x54c>
+ .byte 15,40,29,158,39,0,0 // movaps 0x279e(%rip),%xmm3 # 3f30 <_sk_callback_sse41+0x550>
.byte 255,224 // jmpq *%rax
HIDDEN _sk_byte_tables_sse41
@@ -19532,7 +19526,7 @@ _sk_byte_tables_sse41:
.byte 65,86 // push %r14
.byte 83 // push %rbx
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 68,15,40,5,155,39,0,0 // movaps 0x279b(%rip),%xmm8 # 3f40 <_sk_callback_sse41+0x55c>
+ .byte 68,15,40,5,159,39,0,0 // movaps 0x279f(%rip),%xmm8 # 3f40 <_sk_callback_sse41+0x560>
.byte 65,15,89,192 // mulps %xmm8,%xmm0
.byte 102,15,91,192 // cvtps2dq %xmm0,%xmm0
.byte 102,72,15,58,22,193,1 // pextrq $0x1,%xmm0,%rcx
@@ -19551,7 +19545,7 @@ _sk_byte_tables_sse41:
.byte 102,15,58,32,193,3 // pinsrb $0x3,%ecx,%xmm0
.byte 102,15,56,49,192 // pmovzxbd %xmm0,%xmm0
.byte 15,91,192 // cvtdq2ps %xmm0,%xmm0
- .byte 68,15,40,13,76,39,0,0 // movaps 0x274c(%rip),%xmm9 # 3f50 <_sk_callback_sse41+0x56c>
+ .byte 68,15,40,13,80,39,0,0 // movaps 0x2750(%rip),%xmm9 # 3f50 <_sk_callback_sse41+0x570>
.byte 65,15,89,193 // mulps %xmm9,%xmm0
.byte 65,15,89,200 // mulps %xmm8,%xmm1
.byte 102,15,91,201 // cvtps2dq %xmm1,%xmm1
@@ -19642,7 +19636,7 @@ _sk_byte_tables_rgb_sse41:
.byte 102,15,58,32,193,3 // pinsrb $0x3,%ecx,%xmm0
.byte 102,15,56,49,192 // pmovzxbd %xmm0,%xmm0
.byte 15,91,192 // cvtdq2ps %xmm0,%xmm0
- .byte 68,15,40,13,212,37,0,0 // movaps 0x25d4(%rip),%xmm9 # 3f60 <_sk_callback_sse41+0x57c>
+ .byte 68,15,40,13,216,37,0,0 // movaps 0x25d8(%rip),%xmm9 # 3f60 <_sk_callback_sse41+0x580>
.byte 65,15,89,193 // mulps %xmm9,%xmm0
.byte 65,15,89,200 // mulps %xmm8,%xmm1
.byte 102,15,91,201 // cvtps2dq %xmm1,%xmm1
@@ -19819,31 +19813,31 @@ _sk_parametric_r_sse41:
.byte 69,15,88,208 // addps %xmm8,%xmm10
.byte 69,15,198,219,0 // shufps $0x0,%xmm11,%xmm11
.byte 69,15,91,194 // cvtdq2ps %xmm10,%xmm8
- .byte 68,15,89,5,43,35,0,0 // mulps 0x232b(%rip),%xmm8 # 3f70 <_sk_callback_sse41+0x58c>
- .byte 68,15,84,21,51,35,0,0 // andps 0x2333(%rip),%xmm10 # 3f80 <_sk_callback_sse41+0x59c>
- .byte 68,15,86,21,59,35,0,0 // orps 0x233b(%rip),%xmm10 # 3f90 <_sk_callback_sse41+0x5ac>
- .byte 68,15,88,5,67,35,0,0 // addps 0x2343(%rip),%xmm8 # 3fa0 <_sk_callback_sse41+0x5bc>
- .byte 68,15,40,37,75,35,0,0 // movaps 0x234b(%rip),%xmm12 # 3fb0 <_sk_callback_sse41+0x5cc>
+ .byte 68,15,89,5,47,35,0,0 // mulps 0x232f(%rip),%xmm8 # 3f70 <_sk_callback_sse41+0x590>
+ .byte 68,15,84,21,55,35,0,0 // andps 0x2337(%rip),%xmm10 # 3f80 <_sk_callback_sse41+0x5a0>
+ .byte 68,15,86,21,63,35,0,0 // orps 0x233f(%rip),%xmm10 # 3f90 <_sk_callback_sse41+0x5b0>
+ .byte 68,15,88,5,71,35,0,0 // addps 0x2347(%rip),%xmm8 # 3fa0 <_sk_callback_sse41+0x5c0>
+ .byte 68,15,40,37,79,35,0,0 // movaps 0x234f(%rip),%xmm12 # 3fb0 <_sk_callback_sse41+0x5d0>
.byte 69,15,89,226 // mulps %xmm10,%xmm12
.byte 69,15,92,196 // subps %xmm12,%xmm8
- .byte 68,15,88,21,75,35,0,0 // addps 0x234b(%rip),%xmm10 # 3fc0 <_sk_callback_sse41+0x5dc>
- .byte 68,15,40,37,83,35,0,0 // movaps 0x2353(%rip),%xmm12 # 3fd0 <_sk_callback_sse41+0x5ec>
+ .byte 68,15,88,21,79,35,0,0 // addps 0x234f(%rip),%xmm10 # 3fc0 <_sk_callback_sse41+0x5e0>
+ .byte 68,15,40,37,87,35,0,0 // movaps 0x2357(%rip),%xmm12 # 3fd0 <_sk_callback_sse41+0x5f0>
.byte 69,15,94,226 // divps %xmm10,%xmm12
.byte 69,15,92,196 // subps %xmm12,%xmm8
.byte 69,15,89,195 // mulps %xmm11,%xmm8
.byte 102,69,15,58,8,208,1 // roundps $0x1,%xmm8,%xmm10
.byte 69,15,40,216 // movaps %xmm8,%xmm11
.byte 69,15,92,218 // subps %xmm10,%xmm11
- .byte 68,15,88,5,64,35,0,0 // addps 0x2340(%rip),%xmm8 # 3fe0 <_sk_callback_sse41+0x5fc>
- .byte 68,15,40,21,72,35,0,0 // movaps 0x2348(%rip),%xmm10 # 3ff0 <_sk_callback_sse41+0x60c>
+ .byte 68,15,88,5,68,35,0,0 // addps 0x2344(%rip),%xmm8 # 3fe0 <_sk_callback_sse41+0x600>
+ .byte 68,15,40,21,76,35,0,0 // movaps 0x234c(%rip),%xmm10 # 3ff0 <_sk_callback_sse41+0x610>
.byte 69,15,89,211 // mulps %xmm11,%xmm10
.byte 69,15,92,194 // subps %xmm10,%xmm8
- .byte 68,15,40,21,72,35,0,0 // movaps 0x2348(%rip),%xmm10 # 4000 <_sk_callback_sse41+0x61c>
+ .byte 68,15,40,21,76,35,0,0 // movaps 0x234c(%rip),%xmm10 # 4000 <_sk_callback_sse41+0x620>
.byte 69,15,92,211 // subps %xmm11,%xmm10
- .byte 68,15,40,29,76,35,0,0 // movaps 0x234c(%rip),%xmm11 # 4010 <_sk_callback_sse41+0x62c>
+ .byte 68,15,40,29,80,35,0,0 // movaps 0x2350(%rip),%xmm11 # 4010 <_sk_callback_sse41+0x630>
.byte 69,15,94,218 // divps %xmm10,%xmm11
.byte 69,15,88,216 // addps %xmm8,%xmm11
- .byte 68,15,89,29,76,35,0,0 // mulps 0x234c(%rip),%xmm11 # 4020 <_sk_callback_sse41+0x63c>
+ .byte 68,15,89,29,80,35,0,0 // mulps 0x2350(%rip),%xmm11 # 4020 <_sk_callback_sse41+0x640>
.byte 102,69,15,91,211 // cvtps2dq %xmm11,%xmm10
.byte 243,68,15,16,64,20 // movss 0x14(%rax),%xmm8
.byte 69,15,198,192,0 // shufps $0x0,%xmm8,%xmm8
@@ -19851,7 +19845,7 @@ _sk_parametric_r_sse41:
.byte 102,69,15,56,20,193 // blendvps %xmm0,%xmm9,%xmm8
.byte 15,87,192 // xorps %xmm0,%xmm0
.byte 68,15,95,192 // maxps %xmm0,%xmm8
- .byte 68,15,93,5,51,35,0,0 // minps 0x2333(%rip),%xmm8 # 4030 <_sk_callback_sse41+0x64c>
+ .byte 68,15,93,5,55,35,0,0 // minps 0x2337(%rip),%xmm8 # 4030 <_sk_callback_sse41+0x650>
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 65,15,40,192 // movaps %xmm8,%xmm0
.byte 255,224 // jmpq *%rax
@@ -19881,31 +19875,31 @@ _sk_parametric_g_sse41:
.byte 68,15,88,217 // addps %xmm1,%xmm11
.byte 69,15,198,210,0 // shufps $0x0,%xmm10,%xmm10
.byte 69,15,91,227 // cvtdq2ps %xmm11,%xmm12
- .byte 68,15,89,37,212,34,0,0 // mulps 0x22d4(%rip),%xmm12 # 4040 <_sk_callback_sse41+0x65c>
- .byte 68,15,84,29,220,34,0,0 // andps 0x22dc(%rip),%xmm11 # 4050 <_sk_callback_sse41+0x66c>
- .byte 68,15,86,29,228,34,0,0 // orps 0x22e4(%rip),%xmm11 # 4060 <_sk_callback_sse41+0x67c>
- .byte 68,15,88,37,236,34,0,0 // addps 0x22ec(%rip),%xmm12 # 4070 <_sk_callback_sse41+0x68c>
- .byte 15,40,13,245,34,0,0 // movaps 0x22f5(%rip),%xmm1 # 4080 <_sk_callback_sse41+0x69c>
+ .byte 68,15,89,37,216,34,0,0 // mulps 0x22d8(%rip),%xmm12 # 4040 <_sk_callback_sse41+0x660>
+ .byte 68,15,84,29,224,34,0,0 // andps 0x22e0(%rip),%xmm11 # 4050 <_sk_callback_sse41+0x670>
+ .byte 68,15,86,29,232,34,0,0 // orps 0x22e8(%rip),%xmm11 # 4060 <_sk_callback_sse41+0x680>
+ .byte 68,15,88,37,240,34,0,0 // addps 0x22f0(%rip),%xmm12 # 4070 <_sk_callback_sse41+0x690>
+ .byte 15,40,13,249,34,0,0 // movaps 0x22f9(%rip),%xmm1 # 4080 <_sk_callback_sse41+0x6a0>
.byte 65,15,89,203 // mulps %xmm11,%xmm1
.byte 68,15,92,225 // subps %xmm1,%xmm12
- .byte 68,15,88,29,245,34,0,0 // addps 0x22f5(%rip),%xmm11 # 4090 <_sk_callback_sse41+0x6ac>
- .byte 15,40,13,254,34,0,0 // movaps 0x22fe(%rip),%xmm1 # 40a0 <_sk_callback_sse41+0x6bc>
+ .byte 68,15,88,29,249,34,0,0 // addps 0x22f9(%rip),%xmm11 # 4090 <_sk_callback_sse41+0x6b0>
+ .byte 15,40,13,2,35,0,0 // movaps 0x2302(%rip),%xmm1 # 40a0 <_sk_callback_sse41+0x6c0>
.byte 65,15,94,203 // divps %xmm11,%xmm1
.byte 68,15,92,225 // subps %xmm1,%xmm12
.byte 69,15,89,226 // mulps %xmm10,%xmm12
.byte 102,69,15,58,8,212,1 // roundps $0x1,%xmm12,%xmm10
.byte 69,15,40,220 // movaps %xmm12,%xmm11
.byte 69,15,92,218 // subps %xmm10,%xmm11
- .byte 68,15,88,37,235,34,0,0 // addps 0x22eb(%rip),%xmm12 # 40b0 <_sk_callback_sse41+0x6cc>
- .byte 15,40,13,244,34,0,0 // movaps 0x22f4(%rip),%xmm1 # 40c0 <_sk_callback_sse41+0x6dc>
+ .byte 68,15,88,37,239,34,0,0 // addps 0x22ef(%rip),%xmm12 # 40b0 <_sk_callback_sse41+0x6d0>
+ .byte 15,40,13,248,34,0,0 // movaps 0x22f8(%rip),%xmm1 # 40c0 <_sk_callback_sse41+0x6e0>
.byte 65,15,89,203 // mulps %xmm11,%xmm1
.byte 68,15,92,225 // subps %xmm1,%xmm12
- .byte 68,15,40,21,244,34,0,0 // movaps 0x22f4(%rip),%xmm10 # 40d0 <_sk_callback_sse41+0x6ec>
+ .byte 68,15,40,21,248,34,0,0 // movaps 0x22f8(%rip),%xmm10 # 40d0 <_sk_callback_sse41+0x6f0>
.byte 69,15,92,211 // subps %xmm11,%xmm10
- .byte 15,40,13,249,34,0,0 // movaps 0x22f9(%rip),%xmm1 # 40e0 <_sk_callback_sse41+0x6fc>
+ .byte 15,40,13,253,34,0,0 // movaps 0x22fd(%rip),%xmm1 # 40e0 <_sk_callback_sse41+0x700>
.byte 65,15,94,202 // divps %xmm10,%xmm1
.byte 65,15,88,204 // addps %xmm12,%xmm1
- .byte 15,89,13,250,34,0,0 // mulps 0x22fa(%rip),%xmm1 # 40f0 <_sk_callback_sse41+0x70c>
+ .byte 15,89,13,254,34,0,0 // mulps 0x22fe(%rip),%xmm1 # 40f0 <_sk_callback_sse41+0x710>
.byte 102,68,15,91,209 // cvtps2dq %xmm1,%xmm10
.byte 243,15,16,72,20 // movss 0x14(%rax),%xmm1
.byte 15,198,201,0 // shufps $0x0,%xmm1,%xmm1
@@ -19913,7 +19907,7 @@ _sk_parametric_g_sse41:
.byte 102,65,15,56,20,201 // blendvps %xmm0,%xmm9,%xmm1
.byte 15,87,192 // xorps %xmm0,%xmm0
.byte 15,95,200 // maxps %xmm0,%xmm1
- .byte 15,93,13,229,34,0,0 // minps 0x22e5(%rip),%xmm1 # 4100 <_sk_callback_sse41+0x71c>
+ .byte 15,93,13,233,34,0,0 // minps 0x22e9(%rip),%xmm1 # 4100 <_sk_callback_sse41+0x720>
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 65,15,40,192 // movaps %xmm8,%xmm0
.byte 255,224 // jmpq *%rax
@@ -19943,31 +19937,31 @@ _sk_parametric_b_sse41:
.byte 68,15,88,218 // addps %xmm2,%xmm11
.byte 69,15,198,210,0 // shufps $0x0,%xmm10,%xmm10
.byte 69,15,91,227 // cvtdq2ps %xmm11,%xmm12
- .byte 68,15,89,37,134,34,0,0 // mulps 0x2286(%rip),%xmm12 # 4110 <_sk_callback_sse41+0x72c>
- .byte 68,15,84,29,142,34,0,0 // andps 0x228e(%rip),%xmm11 # 4120 <_sk_callback_sse41+0x73c>
- .byte 68,15,86,29,150,34,0,0 // orps 0x2296(%rip),%xmm11 # 4130 <_sk_callback_sse41+0x74c>
- .byte 68,15,88,37,158,34,0,0 // addps 0x229e(%rip),%xmm12 # 4140 <_sk_callback_sse41+0x75c>
- .byte 15,40,21,167,34,0,0 // movaps 0x22a7(%rip),%xmm2 # 4150 <_sk_callback_sse41+0x76c>
+ .byte 68,15,89,37,138,34,0,0 // mulps 0x228a(%rip),%xmm12 # 4110 <_sk_callback_sse41+0x730>
+ .byte 68,15,84,29,146,34,0,0 // andps 0x2292(%rip),%xmm11 # 4120 <_sk_callback_sse41+0x740>
+ .byte 68,15,86,29,154,34,0,0 // orps 0x229a(%rip),%xmm11 # 4130 <_sk_callback_sse41+0x750>
+ .byte 68,15,88,37,162,34,0,0 // addps 0x22a2(%rip),%xmm12 # 4140 <_sk_callback_sse41+0x760>
+ .byte 15,40,21,171,34,0,0 // movaps 0x22ab(%rip),%xmm2 # 4150 <_sk_callback_sse41+0x770>
.byte 65,15,89,211 // mulps %xmm11,%xmm2
.byte 68,15,92,226 // subps %xmm2,%xmm12
- .byte 68,15,88,29,167,34,0,0 // addps 0x22a7(%rip),%xmm11 # 4160 <_sk_callback_sse41+0x77c>
- .byte 15,40,21,176,34,0,0 // movaps 0x22b0(%rip),%xmm2 # 4170 <_sk_callback_sse41+0x78c>
+ .byte 68,15,88,29,171,34,0,0 // addps 0x22ab(%rip),%xmm11 # 4160 <_sk_callback_sse41+0x780>
+ .byte 15,40,21,180,34,0,0 // movaps 0x22b4(%rip),%xmm2 # 4170 <_sk_callback_sse41+0x790>
.byte 65,15,94,211 // divps %xmm11,%xmm2
.byte 68,15,92,226 // subps %xmm2,%xmm12
.byte 69,15,89,226 // mulps %xmm10,%xmm12
.byte 102,69,15,58,8,212,1 // roundps $0x1,%xmm12,%xmm10
.byte 69,15,40,220 // movaps %xmm12,%xmm11
.byte 69,15,92,218 // subps %xmm10,%xmm11
- .byte 68,15,88,37,157,34,0,0 // addps 0x229d(%rip),%xmm12 # 4180 <_sk_callback_sse41+0x79c>
- .byte 15,40,21,166,34,0,0 // movaps 0x22a6(%rip),%xmm2 # 4190 <_sk_callback_sse41+0x7ac>
+ .byte 68,15,88,37,161,34,0,0 // addps 0x22a1(%rip),%xmm12 # 4180 <_sk_callback_sse41+0x7a0>
+ .byte 15,40,21,170,34,0,0 // movaps 0x22aa(%rip),%xmm2 # 4190 <_sk_callback_sse41+0x7b0>
.byte 65,15,89,211 // mulps %xmm11,%xmm2
.byte 68,15,92,226 // subps %xmm2,%xmm12
- .byte 68,15,40,21,166,34,0,0 // movaps 0x22a6(%rip),%xmm10 # 41a0 <_sk_callback_sse41+0x7bc>
+ .byte 68,15,40,21,170,34,0,0 // movaps 0x22aa(%rip),%xmm10 # 41a0 <_sk_callback_sse41+0x7c0>
.byte 69,15,92,211 // subps %xmm11,%xmm10
- .byte 15,40,21,171,34,0,0 // movaps 0x22ab(%rip),%xmm2 # 41b0 <_sk_callback_sse41+0x7cc>
+ .byte 15,40,21,175,34,0,0 // movaps 0x22af(%rip),%xmm2 # 41b0 <_sk_callback_sse41+0x7d0>
.byte 65,15,94,210 // divps %xmm10,%xmm2
.byte 65,15,88,212 // addps %xmm12,%xmm2
- .byte 15,89,21,172,34,0,0 // mulps 0x22ac(%rip),%xmm2 # 41c0 <_sk_callback_sse41+0x7dc>
+ .byte 15,89,21,176,34,0,0 // mulps 0x22b0(%rip),%xmm2 # 41c0 <_sk_callback_sse41+0x7e0>
.byte 102,68,15,91,210 // cvtps2dq %xmm2,%xmm10
.byte 243,15,16,80,20 // movss 0x14(%rax),%xmm2
.byte 15,198,210,0 // shufps $0x0,%xmm2,%xmm2
@@ -19975,7 +19969,7 @@ _sk_parametric_b_sse41:
.byte 102,65,15,56,20,209 // blendvps %xmm0,%xmm9,%xmm2
.byte 15,87,192 // xorps %xmm0,%xmm0
.byte 15,95,208 // maxps %xmm0,%xmm2
- .byte 15,93,21,151,34,0,0 // minps 0x2297(%rip),%xmm2 # 41d0 <_sk_callback_sse41+0x7ec>
+ .byte 15,93,21,155,34,0,0 // minps 0x229b(%rip),%xmm2 # 41d0 <_sk_callback_sse41+0x7f0>
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 65,15,40,192 // movaps %xmm8,%xmm0
.byte 255,224 // jmpq *%rax
@@ -20005,31 +19999,31 @@ _sk_parametric_a_sse41:
.byte 68,15,88,219 // addps %xmm3,%xmm11
.byte 69,15,198,210,0 // shufps $0x0,%xmm10,%xmm10
.byte 69,15,91,227 // cvtdq2ps %xmm11,%xmm12
- .byte 68,15,89,37,56,34,0,0 // mulps 0x2238(%rip),%xmm12 # 41e0 <_sk_callback_sse41+0x7fc>
- .byte 68,15,84,29,64,34,0,0 // andps 0x2240(%rip),%xmm11 # 41f0 <_sk_callback_sse41+0x80c>
- .byte 68,15,86,29,72,34,0,0 // orps 0x2248(%rip),%xmm11 # 4200 <_sk_callback_sse41+0x81c>
- .byte 68,15,88,37,80,34,0,0 // addps 0x2250(%rip),%xmm12 # 4210 <_sk_callback_sse41+0x82c>
- .byte 15,40,29,89,34,0,0 // movaps 0x2259(%rip),%xmm3 # 4220 <_sk_callback_sse41+0x83c>
+ .byte 68,15,89,37,60,34,0,0 // mulps 0x223c(%rip),%xmm12 # 41e0 <_sk_callback_sse41+0x800>
+ .byte 68,15,84,29,68,34,0,0 // andps 0x2244(%rip),%xmm11 # 41f0 <_sk_callback_sse41+0x810>
+ .byte 68,15,86,29,76,34,0,0 // orps 0x224c(%rip),%xmm11 # 4200 <_sk_callback_sse41+0x820>
+ .byte 68,15,88,37,84,34,0,0 // addps 0x2254(%rip),%xmm12 # 4210 <_sk_callback_sse41+0x830>
+ .byte 15,40,29,93,34,0,0 // movaps 0x225d(%rip),%xmm3 # 4220 <_sk_callback_sse41+0x840>
.byte 65,15,89,219 // mulps %xmm11,%xmm3
.byte 68,15,92,227 // subps %xmm3,%xmm12
- .byte 68,15,88,29,89,34,0,0 // addps 0x2259(%rip),%xmm11 # 4230 <_sk_callback_sse41+0x84c>
- .byte 15,40,29,98,34,0,0 // movaps 0x2262(%rip),%xmm3 # 4240 <_sk_callback_sse41+0x85c>
+ .byte 68,15,88,29,93,34,0,0 // addps 0x225d(%rip),%xmm11 # 4230 <_sk_callback_sse41+0x850>
+ .byte 15,40,29,102,34,0,0 // movaps 0x2266(%rip),%xmm3 # 4240 <_sk_callback_sse41+0x860>
.byte 65,15,94,219 // divps %xmm11,%xmm3
.byte 68,15,92,227 // subps %xmm3,%xmm12
.byte 69,15,89,226 // mulps %xmm10,%xmm12
.byte 102,69,15,58,8,212,1 // roundps $0x1,%xmm12,%xmm10
.byte 69,15,40,220 // movaps %xmm12,%xmm11
.byte 69,15,92,218 // subps %xmm10,%xmm11
- .byte 68,15,88,37,79,34,0,0 // addps 0x224f(%rip),%xmm12 # 4250 <_sk_callback_sse41+0x86c>
- .byte 15,40,29,88,34,0,0 // movaps 0x2258(%rip),%xmm3 # 4260 <_sk_callback_sse41+0x87c>
+ .byte 68,15,88,37,83,34,0,0 // addps 0x2253(%rip),%xmm12 # 4250 <_sk_callback_sse41+0x870>
+ .byte 15,40,29,92,34,0,0 // movaps 0x225c(%rip),%xmm3 # 4260 <_sk_callback_sse41+0x880>
.byte 65,15,89,219 // mulps %xmm11,%xmm3
.byte 68,15,92,227 // subps %xmm3,%xmm12
- .byte 68,15,40,21,88,34,0,0 // movaps 0x2258(%rip),%xmm10 # 4270 <_sk_callback_sse41+0x88c>
+ .byte 68,15,40,21,92,34,0,0 // movaps 0x225c(%rip),%xmm10 # 4270 <_sk_callback_sse41+0x890>
.byte 69,15,92,211 // subps %xmm11,%xmm10
- .byte 15,40,29,93,34,0,0 // movaps 0x225d(%rip),%xmm3 # 4280 <_sk_callback_sse41+0x89c>
+ .byte 15,40,29,97,34,0,0 // movaps 0x2261(%rip),%xmm3 # 4280 <_sk_callback_sse41+0x8a0>
.byte 65,15,94,218 // divps %xmm10,%xmm3
.byte 65,15,88,220 // addps %xmm12,%xmm3
- .byte 15,89,29,94,34,0,0 // mulps 0x225e(%rip),%xmm3 # 4290 <_sk_callback_sse41+0x8ac>
+ .byte 15,89,29,98,34,0,0 // mulps 0x2262(%rip),%xmm3 # 4290 <_sk_callback_sse41+0x8b0>
.byte 102,68,15,91,211 // cvtps2dq %xmm3,%xmm10
.byte 243,15,16,88,20 // movss 0x14(%rax),%xmm3
.byte 15,198,219,0 // shufps $0x0,%xmm3,%xmm3
@@ -20037,7 +20031,7 @@ _sk_parametric_a_sse41:
.byte 102,65,15,56,20,217 // blendvps %xmm0,%xmm9,%xmm3
.byte 15,87,192 // xorps %xmm0,%xmm0
.byte 15,95,216 // maxps %xmm0,%xmm3
- .byte 15,93,29,73,34,0,0 // minps 0x2249(%rip),%xmm3 # 42a0 <_sk_callback_sse41+0x8bc>
+ .byte 15,93,29,77,34,0,0 // minps 0x224d(%rip),%xmm3 # 42a0 <_sk_callback_sse41+0x8c0>
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 65,15,40,192 // movaps %xmm8,%xmm0
.byte 255,224 // jmpq *%rax
@@ -20047,29 +20041,29 @@ HIDDEN _sk_lab_to_xyz_sse41
FUNCTION(_sk_lab_to_xyz_sse41)
_sk_lab_to_xyz_sse41:
.byte 68,15,40,192 // movaps %xmm0,%xmm8
- .byte 68,15,89,5,69,34,0,0 // mulps 0x2245(%rip),%xmm8 # 42b0 <_sk_callback_sse41+0x8cc>
- .byte 68,15,40,13,77,34,0,0 // movaps 0x224d(%rip),%xmm9 # 42c0 <_sk_callback_sse41+0x8dc>
+ .byte 68,15,89,5,73,34,0,0 // mulps 0x2249(%rip),%xmm8 # 42b0 <_sk_callback_sse41+0x8d0>
+ .byte 68,15,40,13,81,34,0,0 // movaps 0x2251(%rip),%xmm9 # 42c0 <_sk_callback_sse41+0x8e0>
.byte 65,15,89,201 // mulps %xmm9,%xmm1
- .byte 15,40,5,82,34,0,0 // movaps 0x2252(%rip),%xmm0 # 42d0 <_sk_callback_sse41+0x8ec>
+ .byte 15,40,5,86,34,0,0 // movaps 0x2256(%rip),%xmm0 # 42d0 <_sk_callback_sse41+0x8f0>
.byte 15,88,200 // addps %xmm0,%xmm1
.byte 65,15,89,209 // mulps %xmm9,%xmm2
.byte 15,88,208 // addps %xmm0,%xmm2
- .byte 68,15,88,5,80,34,0,0 // addps 0x2250(%rip),%xmm8 # 42e0 <_sk_callback_sse41+0x8fc>
- .byte 68,15,89,5,88,34,0,0 // mulps 0x2258(%rip),%xmm8 # 42f0 <_sk_callback_sse41+0x90c>
- .byte 15,89,13,97,34,0,0 // mulps 0x2261(%rip),%xmm1 # 4300 <_sk_callback_sse41+0x91c>
+ .byte 68,15,88,5,84,34,0,0 // addps 0x2254(%rip),%xmm8 # 42e0 <_sk_callback_sse41+0x900>
+ .byte 68,15,89,5,92,34,0,0 // mulps 0x225c(%rip),%xmm8 # 42f0 <_sk_callback_sse41+0x910>
+ .byte 15,89,13,101,34,0,0 // mulps 0x2265(%rip),%xmm1 # 4300 <_sk_callback_sse41+0x920>
.byte 65,15,88,200 // addps %xmm8,%xmm1
- .byte 15,89,21,102,34,0,0 // mulps 0x2266(%rip),%xmm2 # 4310 <_sk_callback_sse41+0x92c>
+ .byte 15,89,21,106,34,0,0 // mulps 0x226a(%rip),%xmm2 # 4310 <_sk_callback_sse41+0x930>
.byte 69,15,40,208 // movaps %xmm8,%xmm10
.byte 68,15,92,210 // subps %xmm2,%xmm10
.byte 68,15,40,217 // movaps %xmm1,%xmm11
.byte 69,15,89,219 // mulps %xmm11,%xmm11
.byte 68,15,89,217 // mulps %xmm1,%xmm11
- .byte 68,15,40,13,90,34,0,0 // movaps 0x225a(%rip),%xmm9 # 4320 <_sk_callback_sse41+0x93c>
+ .byte 68,15,40,13,94,34,0,0 // movaps 0x225e(%rip),%xmm9 # 4320 <_sk_callback_sse41+0x940>
.byte 65,15,40,193 // movaps %xmm9,%xmm0
.byte 65,15,194,195,1 // cmpltps %xmm11,%xmm0
- .byte 15,40,21,90,34,0,0 // movaps 0x225a(%rip),%xmm2 # 4330 <_sk_callback_sse41+0x94c>
+ .byte 15,40,21,94,34,0,0 // movaps 0x225e(%rip),%xmm2 # 4330 <_sk_callback_sse41+0x950>
.byte 15,88,202 // addps %xmm2,%xmm1
- .byte 68,15,40,37,95,34,0,0 // movaps 0x225f(%rip),%xmm12 # 4340 <_sk_callback_sse41+0x95c>
+ .byte 68,15,40,37,99,34,0,0 // movaps 0x2263(%rip),%xmm12 # 4340 <_sk_callback_sse41+0x960>
.byte 65,15,89,204 // mulps %xmm12,%xmm1
.byte 102,65,15,56,20,203 // blendvps %xmm0,%xmm11,%xmm1
.byte 69,15,40,216 // movaps %xmm8,%xmm11
@@ -20088,8 +20082,8 @@ _sk_lab_to_xyz_sse41:
.byte 65,15,89,212 // mulps %xmm12,%xmm2
.byte 65,15,40,193 // movaps %xmm9,%xmm0
.byte 102,65,15,56,20,211 // blendvps %xmm0,%xmm11,%xmm2
- .byte 15,89,13,24,34,0,0 // mulps 0x2218(%rip),%xmm1 # 4350 <_sk_callback_sse41+0x96c>
- .byte 15,89,21,33,34,0,0 // mulps 0x2221(%rip),%xmm2 # 4360 <_sk_callback_sse41+0x97c>
+ .byte 15,89,13,28,34,0,0 // mulps 0x221c(%rip),%xmm1 # 4350 <_sk_callback_sse41+0x970>
+ .byte 15,89,21,37,34,0,0 // mulps 0x2225(%rip),%xmm2 # 4360 <_sk_callback_sse41+0x980>
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 15,40,193 // movaps %xmm1,%xmm0
.byte 65,15,40,200 // movaps %xmm8,%xmm1
@@ -20103,7 +20097,7 @@ _sk_load_a8_sse41:
.byte 72,139,0 // mov (%rax),%rax
.byte 102,15,56,49,4,56 // pmovzxbd (%rax,%rdi,1),%xmm0
.byte 15,91,216 // cvtdq2ps %xmm0,%xmm3
- .byte 15,89,29,17,34,0,0 // mulps 0x2211(%rip),%xmm3 # 4370 <_sk_callback_sse41+0x98c>
+ .byte 15,89,29,21,34,0,0 // mulps 0x2215(%rip),%xmm3 # 4370 <_sk_callback_sse41+0x990>
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 15,87,192 // xorps %xmm0,%xmm0
.byte 15,87,201 // xorps %xmm1,%xmm1
@@ -20136,7 +20130,7 @@ _sk_gather_a8_sse41:
.byte 102,15,58,32,192,3 // pinsrb $0x3,%eax,%xmm0
.byte 102,15,56,49,192 // pmovzxbd %xmm0,%xmm0
.byte 15,91,216 // cvtdq2ps %xmm0,%xmm3
- .byte 15,89,29,165,33,0,0 // mulps 0x21a5(%rip),%xmm3 # 4380 <_sk_callback_sse41+0x99c>
+ .byte 15,89,29,169,33,0,0 // mulps 0x21a9(%rip),%xmm3 # 4380 <_sk_callback_sse41+0x9a0>
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 15,87,192 // xorps %xmm0,%xmm0
.byte 102,15,239,201 // pxor %xmm1,%xmm1
@@ -20149,7 +20143,7 @@ FUNCTION(_sk_store_a8_sse41)
_sk_store_a8_sse41:
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 72,139,0 // mov (%rax),%rax
- .byte 68,15,40,5,153,33,0,0 // movaps 0x2199(%rip),%xmm8 # 4390 <_sk_callback_sse41+0x9ac>
+ .byte 68,15,40,5,157,33,0,0 // movaps 0x219d(%rip),%xmm8 # 4390 <_sk_callback_sse41+0x9b0>
.byte 68,15,89,195 // mulps %xmm3,%xmm8
.byte 102,69,15,91,192 // cvtps2dq %xmm8,%xmm8
.byte 102,69,15,56,43,192 // packusdw %xmm8,%xmm8
@@ -20166,9 +20160,9 @@ _sk_load_g8_sse41:
.byte 72,139,0 // mov (%rax),%rax
.byte 102,15,56,49,4,56 // pmovzxbd (%rax,%rdi,1),%xmm0
.byte 15,91,192 // cvtdq2ps %xmm0,%xmm0
- .byte 15,89,5,118,33,0,0 // mulps 0x2176(%rip),%xmm0 # 43a0 <_sk_callback_sse41+0x9bc>
+ .byte 15,89,5,122,33,0,0 // mulps 0x217a(%rip),%xmm0 # 43a0 <_sk_callback_sse41+0x9c0>
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 15,40,29,125,33,0,0 // movaps 0x217d(%rip),%xmm3 # 43b0 <_sk_callback_sse41+0x9cc>
+ .byte 15,40,29,129,33,0,0 // movaps 0x2181(%rip),%xmm3 # 43b0 <_sk_callback_sse41+0x9d0>
.byte 15,40,200 // movaps %xmm0,%xmm1
.byte 15,40,208 // movaps %xmm0,%xmm2
.byte 255,224 // jmpq *%rax
@@ -20199,9 +20193,9 @@ _sk_gather_g8_sse41:
.byte 102,15,58,32,192,3 // pinsrb $0x3,%eax,%xmm0
.byte 102,15,56,49,192 // pmovzxbd %xmm0,%xmm0
.byte 15,91,192 // cvtdq2ps %xmm0,%xmm0
- .byte 15,89,5,22,33,0,0 // mulps 0x2116(%rip),%xmm0 # 43c0 <_sk_callback_sse41+0x9dc>
+ .byte 15,89,5,26,33,0,0 // mulps 0x211a(%rip),%xmm0 # 43c0 <_sk_callback_sse41+0x9e0>
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 15,40,29,29,33,0,0 // movaps 0x211d(%rip),%xmm3 # 43d0 <_sk_callback_sse41+0x9ec>
+ .byte 15,40,29,33,33,0,0 // movaps 0x2121(%rip),%xmm3 # 43d0 <_sk_callback_sse41+0x9f0>
.byte 15,40,200 // movaps %xmm0,%xmm1
.byte 15,40,208 // movaps %xmm0,%xmm2
.byte 255,224 // jmpq *%rax
@@ -20213,9 +20207,9 @@ _sk_gather_i8_sse41:
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 73,137,192 // mov %rax,%r8
.byte 77,133,192 // test %r8,%r8
- .byte 116,5 // je 22ca <_sk_gather_i8_sse41+0xf>
+ .byte 116,5 // je 22c6 <_sk_gather_i8_sse41+0xf>
.byte 76,137,192 // mov %r8,%rax
- .byte 235,2 // jmp 22cc <_sk_gather_i8_sse41+0x11>
+ .byte 235,2 // jmp 22c8 <_sk_gather_i8_sse41+0x11>
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 76,139,16 // mov (%rax),%r10
.byte 243,15,91,201 // cvttps2dq %xmm1,%xmm1
@@ -20246,17 +20240,17 @@ _sk_gather_i8_sse41:
.byte 102,15,58,34,28,8,1 // pinsrd $0x1,(%rax,%rcx,1),%xmm3
.byte 102,66,15,58,34,28,144,2 // pinsrd $0x2,(%rax,%r10,4),%xmm3
.byte 102,66,15,58,34,28,8,3 // pinsrd $0x3,(%rax,%r9,1),%xmm3
- .byte 102,15,111,5,116,32,0,0 // movdqa 0x2074(%rip),%xmm0 # 43e0 <_sk_callback_sse41+0x9fc>
+ .byte 102,15,111,5,120,32,0,0 // movdqa 0x2078(%rip),%xmm0 # 43e0 <_sk_callback_sse41+0xa00>
.byte 102,15,219,195 // pand %xmm3,%xmm0
.byte 15,91,192 // cvtdq2ps %xmm0,%xmm0
- .byte 68,15,40,5,117,32,0,0 // movaps 0x2075(%rip),%xmm8 # 43f0 <_sk_callback_sse41+0xa0c>
+ .byte 68,15,40,5,121,32,0,0 // movaps 0x2079(%rip),%xmm8 # 43f0 <_sk_callback_sse41+0xa10>
.byte 65,15,89,192 // mulps %xmm8,%xmm0
.byte 102,15,111,203 // movdqa %xmm3,%xmm1
- .byte 102,15,56,0,13,116,32,0,0 // pshufb 0x2074(%rip),%xmm1 # 4400 <_sk_callback_sse41+0xa1c>
+ .byte 102,15,56,0,13,120,32,0,0 // pshufb 0x2078(%rip),%xmm1 # 4400 <_sk_callback_sse41+0xa20>
.byte 15,91,201 // cvtdq2ps %xmm1,%xmm1
.byte 65,15,89,200 // mulps %xmm8,%xmm1
.byte 102,15,111,211 // movdqa %xmm3,%xmm2
- .byte 102,15,56,0,21,112,32,0,0 // pshufb 0x2070(%rip),%xmm2 # 4410 <_sk_callback_sse41+0xa2c>
+ .byte 102,15,56,0,21,116,32,0,0 // pshufb 0x2074(%rip),%xmm2 # 4410 <_sk_callback_sse41+0xa30>
.byte 15,91,210 // cvtdq2ps %xmm2,%xmm2
.byte 65,15,89,208 // mulps %xmm8,%xmm2
.byte 102,15,114,211,24 // psrld $0x18,%xmm3
@@ -20272,19 +20266,19 @@ _sk_load_565_sse41:
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 72,139,0 // mov (%rax),%rax
.byte 102,15,56,51,20,120 // pmovzxwd (%rax,%rdi,2),%xmm2
- .byte 102,15,111,5,86,32,0,0 // movdqa 0x2056(%rip),%xmm0 # 4420 <_sk_callback_sse41+0xa3c>
+ .byte 102,15,111,5,90,32,0,0 // movdqa 0x205a(%rip),%xmm0 # 4420 <_sk_callback_sse41+0xa40>
.byte 102,15,219,194 // pand %xmm2,%xmm0
.byte 15,91,192 // cvtdq2ps %xmm0,%xmm0
- .byte 15,89,5,88,32,0,0 // mulps 0x2058(%rip),%xmm0 # 4430 <_sk_callback_sse41+0xa4c>
- .byte 102,15,111,13,96,32,0,0 // movdqa 0x2060(%rip),%xmm1 # 4440 <_sk_callback_sse41+0xa5c>
+ .byte 15,89,5,92,32,0,0 // mulps 0x205c(%rip),%xmm0 # 4430 <_sk_callback_sse41+0xa50>
+ .byte 102,15,111,13,100,32,0,0 // movdqa 0x2064(%rip),%xmm1 # 4440 <_sk_callback_sse41+0xa60>
.byte 102,15,219,202 // pand %xmm2,%xmm1
.byte 15,91,201 // cvtdq2ps %xmm1,%xmm1
- .byte 15,89,13,98,32,0,0 // mulps 0x2062(%rip),%xmm1 # 4450 <_sk_callback_sse41+0xa6c>
- .byte 102,15,219,21,106,32,0,0 // pand 0x206a(%rip),%xmm2 # 4460 <_sk_callback_sse41+0xa7c>
+ .byte 15,89,13,102,32,0,0 // mulps 0x2066(%rip),%xmm1 # 4450 <_sk_callback_sse41+0xa70>
+ .byte 102,15,219,21,110,32,0,0 // pand 0x206e(%rip),%xmm2 # 4460 <_sk_callback_sse41+0xa80>
.byte 15,91,210 // cvtdq2ps %xmm2,%xmm2
- .byte 15,89,21,112,32,0,0 // mulps 0x2070(%rip),%xmm2 # 4470 <_sk_callback_sse41+0xa8c>
+ .byte 15,89,21,116,32,0,0 // mulps 0x2074(%rip),%xmm2 # 4470 <_sk_callback_sse41+0xa90>
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 15,40,29,119,32,0,0 // movaps 0x2077(%rip),%xmm3 # 4480 <_sk_callback_sse41+0xa9c>
+ .byte 15,40,29,123,32,0,0 // movaps 0x207b(%rip),%xmm3 # 4480 <_sk_callback_sse41+0xaa0>
.byte 255,224 // jmpq *%rax
HIDDEN _sk_gather_565_sse41
@@ -20312,19 +20306,19 @@ _sk_gather_565_sse41:
.byte 65,15,183,4,65 // movzwl (%r9,%rax,2),%eax
.byte 102,15,196,192,3 // pinsrw $0x3,%eax,%xmm0
.byte 102,15,56,51,208 // pmovzxwd %xmm0,%xmm2
- .byte 102,15,111,5,28,32,0,0 // movdqa 0x201c(%rip),%xmm0 # 4490 <_sk_callback_sse41+0xaac>
+ .byte 102,15,111,5,32,32,0,0 // movdqa 0x2020(%rip),%xmm0 # 4490 <_sk_callback_sse41+0xab0>
.byte 102,15,219,194 // pand %xmm2,%xmm0
.byte 15,91,192 // cvtdq2ps %xmm0,%xmm0
- .byte 15,89,5,30,32,0,0 // mulps 0x201e(%rip),%xmm0 # 44a0 <_sk_callback_sse41+0xabc>
- .byte 102,15,111,13,38,32,0,0 // movdqa 0x2026(%rip),%xmm1 # 44b0 <_sk_callback_sse41+0xacc>
+ .byte 15,89,5,34,32,0,0 // mulps 0x2022(%rip),%xmm0 # 44a0 <_sk_callback_sse41+0xac0>
+ .byte 102,15,111,13,42,32,0,0 // movdqa 0x202a(%rip),%xmm1 # 44b0 <_sk_callback_sse41+0xad0>
.byte 102,15,219,202 // pand %xmm2,%xmm1
.byte 15,91,201 // cvtdq2ps %xmm1,%xmm1
- .byte 15,89,13,40,32,0,0 // mulps 0x2028(%rip),%xmm1 # 44c0 <_sk_callback_sse41+0xadc>
- .byte 102,15,219,21,48,32,0,0 // pand 0x2030(%rip),%xmm2 # 44d0 <_sk_callback_sse41+0xaec>
+ .byte 15,89,13,44,32,0,0 // mulps 0x202c(%rip),%xmm1 # 44c0 <_sk_callback_sse41+0xae0>
+ .byte 102,15,219,21,52,32,0,0 // pand 0x2034(%rip),%xmm2 # 44d0 <_sk_callback_sse41+0xaf0>
.byte 15,91,210 // cvtdq2ps %xmm2,%xmm2
- .byte 15,89,21,54,32,0,0 // mulps 0x2036(%rip),%xmm2 # 44e0 <_sk_callback_sse41+0xafc>
+ .byte 15,89,21,58,32,0,0 // mulps 0x203a(%rip),%xmm2 # 44e0 <_sk_callback_sse41+0xb00>
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 15,40,29,61,32,0,0 // movaps 0x203d(%rip),%xmm3 # 44f0 <_sk_callback_sse41+0xb0c>
+ .byte 15,40,29,65,32,0,0 // movaps 0x2041(%rip),%xmm3 # 44f0 <_sk_callback_sse41+0xb10>
.byte 255,224 // jmpq *%rax
HIDDEN _sk_store_565_sse41
@@ -20333,12 +20327,12 @@ FUNCTION(_sk_store_565_sse41)
_sk_store_565_sse41:
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 72,139,0 // mov (%rax),%rax
- .byte 68,15,40,5,62,32,0,0 // movaps 0x203e(%rip),%xmm8 # 4500 <_sk_callback_sse41+0xb1c>
+ .byte 68,15,40,5,66,32,0,0 // movaps 0x2042(%rip),%xmm8 # 4500 <_sk_callback_sse41+0xb20>
.byte 68,15,40,200 // movaps %xmm0,%xmm9
.byte 69,15,89,200 // mulps %xmm8,%xmm9
.byte 102,69,15,91,201 // cvtps2dq %xmm9,%xmm9
.byte 102,65,15,114,241,11 // pslld $0xb,%xmm9
- .byte 68,15,40,21,51,32,0,0 // movaps 0x2033(%rip),%xmm10 # 4510 <_sk_callback_sse41+0xb2c>
+ .byte 68,15,40,21,55,32,0,0 // movaps 0x2037(%rip),%xmm10 # 4510 <_sk_callback_sse41+0xb30>
.byte 68,15,89,209 // mulps %xmm1,%xmm10
.byte 102,69,15,91,210 // cvtps2dq %xmm10,%xmm10
.byte 102,65,15,114,242,5 // pslld $0x5,%xmm10
@@ -20358,21 +20352,21 @@ _sk_load_4444_sse41:
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 72,139,0 // mov (%rax),%rax
.byte 102,15,56,51,28,120 // pmovzxwd (%rax,%rdi,2),%xmm3
- .byte 102,15,111,5,254,31,0,0 // movdqa 0x1ffe(%rip),%xmm0 # 4520 <_sk_callback_sse41+0xb3c>
+ .byte 102,15,111,5,2,32,0,0 // movdqa 0x2002(%rip),%xmm0 # 4520 <_sk_callback_sse41+0xb40>
.byte 102,15,219,195 // pand %xmm3,%xmm0
.byte 15,91,192 // cvtdq2ps %xmm0,%xmm0
- .byte 15,89,5,0,32,0,0 // mulps 0x2000(%rip),%xmm0 # 4530 <_sk_callback_sse41+0xb4c>
- .byte 102,15,111,13,8,32,0,0 // movdqa 0x2008(%rip),%xmm1 # 4540 <_sk_callback_sse41+0xb5c>
+ .byte 15,89,5,4,32,0,0 // mulps 0x2004(%rip),%xmm0 # 4530 <_sk_callback_sse41+0xb50>
+ .byte 102,15,111,13,12,32,0,0 // movdqa 0x200c(%rip),%xmm1 # 4540 <_sk_callback_sse41+0xb60>
.byte 102,15,219,203 // pand %xmm3,%xmm1
.byte 15,91,201 // cvtdq2ps %xmm1,%xmm1
- .byte 15,89,13,10,32,0,0 // mulps 0x200a(%rip),%xmm1 # 4550 <_sk_callback_sse41+0xb6c>
- .byte 102,15,111,21,18,32,0,0 // movdqa 0x2012(%rip),%xmm2 # 4560 <_sk_callback_sse41+0xb7c>
+ .byte 15,89,13,14,32,0,0 // mulps 0x200e(%rip),%xmm1 # 4550 <_sk_callback_sse41+0xb70>
+ .byte 102,15,111,21,22,32,0,0 // movdqa 0x2016(%rip),%xmm2 # 4560 <_sk_callback_sse41+0xb80>
.byte 102,15,219,211 // pand %xmm3,%xmm2
.byte 15,91,210 // cvtdq2ps %xmm2,%xmm2
- .byte 15,89,21,20,32,0,0 // mulps 0x2014(%rip),%xmm2 # 4570 <_sk_callback_sse41+0xb8c>
- .byte 102,15,219,29,28,32,0,0 // pand 0x201c(%rip),%xmm3 # 4580 <_sk_callback_sse41+0xb9c>
+ .byte 15,89,21,24,32,0,0 // mulps 0x2018(%rip),%xmm2 # 4570 <_sk_callback_sse41+0xb90>
+ .byte 102,15,219,29,32,32,0,0 // pand 0x2020(%rip),%xmm3 # 4580 <_sk_callback_sse41+0xba0>
.byte 15,91,219 // cvtdq2ps %xmm3,%xmm3
- .byte 15,89,29,34,32,0,0 // mulps 0x2022(%rip),%xmm3 # 4590 <_sk_callback_sse41+0xbac>
+ .byte 15,89,29,38,32,0,0 // mulps 0x2026(%rip),%xmm3 # 4590 <_sk_callback_sse41+0xbb0>
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 255,224 // jmpq *%rax
@@ -20401,21 +20395,21 @@ _sk_gather_4444_sse41:
.byte 65,15,183,4,65 // movzwl (%r9,%rax,2),%eax
.byte 102,15,196,192,3 // pinsrw $0x3,%eax,%xmm0
.byte 102,15,56,51,216 // pmovzxwd %xmm0,%xmm3
- .byte 102,15,111,5,197,31,0,0 // movdqa 0x1fc5(%rip),%xmm0 # 45a0 <_sk_callback_sse41+0xbbc>
+ .byte 102,15,111,5,201,31,0,0 // movdqa 0x1fc9(%rip),%xmm0 # 45a0 <_sk_callback_sse41+0xbc0>
.byte 102,15,219,195 // pand %xmm3,%xmm0
.byte 15,91,192 // cvtdq2ps %xmm0,%xmm0
- .byte 15,89,5,199,31,0,0 // mulps 0x1fc7(%rip),%xmm0 # 45b0 <_sk_callback_sse41+0xbcc>
- .byte 102,15,111,13,207,31,0,0 // movdqa 0x1fcf(%rip),%xmm1 # 45c0 <_sk_callback_sse41+0xbdc>
+ .byte 15,89,5,203,31,0,0 // mulps 0x1fcb(%rip),%xmm0 # 45b0 <_sk_callback_sse41+0xbd0>
+ .byte 102,15,111,13,211,31,0,0 // movdqa 0x1fd3(%rip),%xmm1 # 45c0 <_sk_callback_sse41+0xbe0>
.byte 102,15,219,203 // pand %xmm3,%xmm1
.byte 15,91,201 // cvtdq2ps %xmm1,%xmm1
- .byte 15,89,13,209,31,0,0 // mulps 0x1fd1(%rip),%xmm1 # 45d0 <_sk_callback_sse41+0xbec>
- .byte 102,15,111,21,217,31,0,0 // movdqa 0x1fd9(%rip),%xmm2 # 45e0 <_sk_callback_sse41+0xbfc>
+ .byte 15,89,13,213,31,0,0 // mulps 0x1fd5(%rip),%xmm1 # 45d0 <_sk_callback_sse41+0xbf0>
+ .byte 102,15,111,21,221,31,0,0 // movdqa 0x1fdd(%rip),%xmm2 # 45e0 <_sk_callback_sse41+0xc00>
.byte 102,15,219,211 // pand %xmm3,%xmm2
.byte 15,91,210 // cvtdq2ps %xmm2,%xmm2
- .byte 15,89,21,219,31,0,0 // mulps 0x1fdb(%rip),%xmm2 # 45f0 <_sk_callback_sse41+0xc0c>
- .byte 102,15,219,29,227,31,0,0 // pand 0x1fe3(%rip),%xmm3 # 4600 <_sk_callback_sse41+0xc1c>
+ .byte 15,89,21,223,31,0,0 // mulps 0x1fdf(%rip),%xmm2 # 45f0 <_sk_callback_sse41+0xc10>
+ .byte 102,15,219,29,231,31,0,0 // pand 0x1fe7(%rip),%xmm3 # 4600 <_sk_callback_sse41+0xc20>
.byte 15,91,219 // cvtdq2ps %xmm3,%xmm3
- .byte 15,89,29,233,31,0,0 // mulps 0x1fe9(%rip),%xmm3 # 4610 <_sk_callback_sse41+0xc2c>
+ .byte 15,89,29,237,31,0,0 // mulps 0x1fed(%rip),%xmm3 # 4610 <_sk_callback_sse41+0xc30>
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 255,224 // jmpq *%rax
@@ -20425,7 +20419,7 @@ FUNCTION(_sk_store_4444_sse41)
_sk_store_4444_sse41:
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 72,139,0 // mov (%rax),%rax
- .byte 68,15,40,5,232,31,0,0 // movaps 0x1fe8(%rip),%xmm8 # 4620 <_sk_callback_sse41+0xc3c>
+ .byte 68,15,40,5,236,31,0,0 // movaps 0x1fec(%rip),%xmm8 # 4620 <_sk_callback_sse41+0xc40>
.byte 68,15,40,200 // movaps %xmm0,%xmm9
.byte 69,15,89,200 // mulps %xmm8,%xmm9
.byte 102,69,15,91,201 // cvtps2dq %xmm9,%xmm9
@@ -20455,17 +20449,17 @@ _sk_load_8888_sse41:
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 72,139,0 // mov (%rax),%rax
.byte 15,16,28,184 // movups (%rax,%rdi,4),%xmm3
- .byte 15,40,5,135,31,0,0 // movaps 0x1f87(%rip),%xmm0 # 4630 <_sk_callback_sse41+0xc4c>
+ .byte 15,40,5,139,31,0,0 // movaps 0x1f8b(%rip),%xmm0 # 4630 <_sk_callback_sse41+0xc50>
.byte 15,84,195 // andps %xmm3,%xmm0
.byte 15,91,192 // cvtdq2ps %xmm0,%xmm0
- .byte 68,15,40,5,137,31,0,0 // movaps 0x1f89(%rip),%xmm8 # 4640 <_sk_callback_sse41+0xc5c>
+ .byte 68,15,40,5,141,31,0,0 // movaps 0x1f8d(%rip),%xmm8 # 4640 <_sk_callback_sse41+0xc60>
.byte 65,15,89,192 // mulps %xmm8,%xmm0
.byte 15,40,203 // movaps %xmm3,%xmm1
- .byte 102,15,56,0,13,137,31,0,0 // pshufb 0x1f89(%rip),%xmm1 # 4650 <_sk_callback_sse41+0xc6c>
+ .byte 102,15,56,0,13,141,31,0,0 // pshufb 0x1f8d(%rip),%xmm1 # 4650 <_sk_callback_sse41+0xc70>
.byte 15,91,201 // cvtdq2ps %xmm1,%xmm1
.byte 65,15,89,200 // mulps %xmm8,%xmm1
.byte 15,40,211 // movaps %xmm3,%xmm2
- .byte 102,15,56,0,21,134,31,0,0 // pshufb 0x1f86(%rip),%xmm2 # 4660 <_sk_callback_sse41+0xc7c>
+ .byte 102,15,56,0,21,138,31,0,0 // pshufb 0x1f8a(%rip),%xmm2 # 4660 <_sk_callback_sse41+0xc80>
.byte 15,91,210 // cvtdq2ps %xmm2,%xmm2
.byte 65,15,89,208 // mulps %xmm8,%xmm2
.byte 102,15,114,211,24 // psrld $0x18,%xmm3
@@ -20496,17 +20490,17 @@ _sk_gather_8888_sse41:
.byte 102,65,15,58,34,28,129,1 // pinsrd $0x1,(%r9,%rax,4),%xmm3
.byte 102,67,15,58,34,28,145,2 // pinsrd $0x2,(%r9,%r10,4),%xmm3
.byte 102,65,15,58,34,28,137,3 // pinsrd $0x3,(%r9,%rcx,4),%xmm3
- .byte 102,15,111,5,31,31,0,0 // movdqa 0x1f1f(%rip),%xmm0 # 4670 <_sk_callback_sse41+0xc8c>
+ .byte 102,15,111,5,35,31,0,0 // movdqa 0x1f23(%rip),%xmm0 # 4670 <_sk_callback_sse41+0xc90>
.byte 102,15,219,195 // pand %xmm3,%xmm0
.byte 15,91,192 // cvtdq2ps %xmm0,%xmm0
- .byte 68,15,40,5,32,31,0,0 // movaps 0x1f20(%rip),%xmm8 # 4680 <_sk_callback_sse41+0xc9c>
+ .byte 68,15,40,5,36,31,0,0 // movaps 0x1f24(%rip),%xmm8 # 4680 <_sk_callback_sse41+0xca0>
.byte 65,15,89,192 // mulps %xmm8,%xmm0
.byte 102,15,111,203 // movdqa %xmm3,%xmm1
- .byte 102,15,56,0,13,31,31,0,0 // pshufb 0x1f1f(%rip),%xmm1 # 4690 <_sk_callback_sse41+0xcac>
+ .byte 102,15,56,0,13,35,31,0,0 // pshufb 0x1f23(%rip),%xmm1 # 4690 <_sk_callback_sse41+0xcb0>
.byte 15,91,201 // cvtdq2ps %xmm1,%xmm1
.byte 65,15,89,200 // mulps %xmm8,%xmm1
.byte 102,15,111,211 // movdqa %xmm3,%xmm2
- .byte 102,15,56,0,21,27,31,0,0 // pshufb 0x1f1b(%rip),%xmm2 # 46a0 <_sk_callback_sse41+0xcbc>
+ .byte 102,15,56,0,21,31,31,0,0 // pshufb 0x1f1f(%rip),%xmm2 # 46a0 <_sk_callback_sse41+0xcc0>
.byte 15,91,210 // cvtdq2ps %xmm2,%xmm2
.byte 65,15,89,208 // mulps %xmm8,%xmm2
.byte 102,15,114,211,24 // psrld $0x18,%xmm3
@@ -20521,7 +20515,7 @@ FUNCTION(_sk_store_8888_sse41)
_sk_store_8888_sse41:
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 72,139,0 // mov (%rax),%rax
- .byte 68,15,40,5,7,31,0,0 // movaps 0x1f07(%rip),%xmm8 # 46b0 <_sk_callback_sse41+0xccc>
+ .byte 68,15,40,5,11,31,0,0 // movaps 0x1f0b(%rip),%xmm8 # 46b0 <_sk_callback_sse41+0xcd0>
.byte 68,15,40,200 // movaps %xmm0,%xmm9
.byte 69,15,89,200 // mulps %xmm8,%xmm9
.byte 102,69,15,91,201 // cvtps2dq %xmm9,%xmm9
@@ -20558,18 +20552,18 @@ _sk_load_f16_sse41:
.byte 102,68,15,97,216 // punpcklwd %xmm0,%xmm11
.byte 102,68,15,105,200 // punpckhwd %xmm0,%xmm9
.byte 102,65,15,56,51,203 // pmovzxwd %xmm11,%xmm1
- .byte 102,68,15,111,5,128,30,0,0 // movdqa 0x1e80(%rip),%xmm8 # 46c0 <_sk_callback_sse41+0xcdc>
+ .byte 102,68,15,111,5,132,30,0,0 // movdqa 0x1e84(%rip),%xmm8 # 46c0 <_sk_callback_sse41+0xce0>
.byte 102,15,111,209 // movdqa %xmm1,%xmm2
.byte 102,65,15,219,208 // pand %xmm8,%xmm2
.byte 102,15,239,202 // pxor %xmm2,%xmm1
- .byte 102,15,111,29,123,30,0,0 // movdqa 0x1e7b(%rip),%xmm3 # 46d0 <_sk_callback_sse41+0xcec>
+ .byte 102,15,111,29,127,30,0,0 // movdqa 0x1e7f(%rip),%xmm3 # 46d0 <_sk_callback_sse41+0xcf0>
.byte 102,15,114,242,16 // pslld $0x10,%xmm2
.byte 102,15,111,193 // movdqa %xmm1,%xmm0
.byte 102,15,56,63,195 // pmaxud %xmm3,%xmm0
.byte 102,15,118,193 // pcmpeqd %xmm1,%xmm0
.byte 102,15,114,241,13 // pslld $0xd,%xmm1
.byte 102,15,235,202 // por %xmm2,%xmm1
- .byte 102,68,15,111,21,103,30,0,0 // movdqa 0x1e67(%rip),%xmm10 # 46e0 <_sk_callback_sse41+0xcfc>
+ .byte 102,68,15,111,21,107,30,0,0 // movdqa 0x1e6b(%rip),%xmm10 # 46e0 <_sk_callback_sse41+0xd00>
.byte 102,65,15,254,202 // paddd %xmm10,%xmm1
.byte 102,15,219,193 // pand %xmm1,%xmm0
.byte 102,65,15,115,219,8 // psrldq $0x8,%xmm11
@@ -20642,18 +20636,18 @@ _sk_gather_f16_sse41:
.byte 102,68,15,97,218 // punpcklwd %xmm2,%xmm11
.byte 102,68,15,105,202 // punpckhwd %xmm2,%xmm9
.byte 102,65,15,56,51,203 // pmovzxwd %xmm11,%xmm1
- .byte 102,68,15,111,5,37,29,0,0 // movdqa 0x1d25(%rip),%xmm8 # 46f0 <_sk_callback_sse41+0xd0c>
+ .byte 102,68,15,111,5,41,29,0,0 // movdqa 0x1d29(%rip),%xmm8 # 46f0 <_sk_callback_sse41+0xd10>
.byte 102,15,111,209 // movdqa %xmm1,%xmm2
.byte 102,65,15,219,208 // pand %xmm8,%xmm2
.byte 102,15,239,202 // pxor %xmm2,%xmm1
- .byte 102,15,111,29,32,29,0,0 // movdqa 0x1d20(%rip),%xmm3 # 4700 <_sk_callback_sse41+0xd1c>
+ .byte 102,15,111,29,36,29,0,0 // movdqa 0x1d24(%rip),%xmm3 # 4700 <_sk_callback_sse41+0xd20>
.byte 102,15,114,242,16 // pslld $0x10,%xmm2
.byte 102,15,111,193 // movdqa %xmm1,%xmm0
.byte 102,15,56,63,195 // pmaxud %xmm3,%xmm0
.byte 102,15,118,193 // pcmpeqd %xmm1,%xmm0
.byte 102,15,114,241,13 // pslld $0xd,%xmm1
.byte 102,15,235,202 // por %xmm2,%xmm1
- .byte 102,68,15,111,21,12,29,0,0 // movdqa 0x1d0c(%rip),%xmm10 # 4710 <_sk_callback_sse41+0xd2c>
+ .byte 102,68,15,111,21,16,29,0,0 // movdqa 0x1d10(%rip),%xmm10 # 4710 <_sk_callback_sse41+0xd30>
.byte 102,65,15,254,202 // paddd %xmm10,%xmm1
.byte 102,15,219,193 // pand %xmm1,%xmm0
.byte 102,65,15,115,219,8 // psrldq $0x8,%xmm11
@@ -20701,17 +20695,17 @@ FUNCTION(_sk_store_f16_sse41)
_sk_store_f16_sse41:
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 72,139,0 // mov (%rax),%rax
- .byte 102,68,15,111,21,66,28,0,0 // movdqa 0x1c42(%rip),%xmm10 # 4720 <_sk_callback_sse41+0xd3c>
+ .byte 102,68,15,111,21,70,28,0,0 // movdqa 0x1c46(%rip),%xmm10 # 4720 <_sk_callback_sse41+0xd40>
.byte 102,68,15,111,224 // movdqa %xmm0,%xmm12
.byte 102,68,15,111,232 // movdqa %xmm0,%xmm13
.byte 102,69,15,219,234 // pand %xmm10,%xmm13
.byte 102,69,15,239,229 // pxor %xmm13,%xmm12
- .byte 102,68,15,111,13,53,28,0,0 // movdqa 0x1c35(%rip),%xmm9 # 4730 <_sk_callback_sse41+0xd4c>
+ .byte 102,68,15,111,13,57,28,0,0 // movdqa 0x1c39(%rip),%xmm9 # 4730 <_sk_callback_sse41+0xd50>
.byte 102,65,15,114,213,16 // psrld $0x10,%xmm13
.byte 102,69,15,111,193 // movdqa %xmm9,%xmm8
.byte 102,69,15,102,196 // pcmpgtd %xmm12,%xmm8
.byte 102,65,15,114,212,13 // psrld $0xd,%xmm12
- .byte 102,68,15,111,29,38,28,0,0 // movdqa 0x1c26(%rip),%xmm11 # 4740 <_sk_callback_sse41+0xd5c>
+ .byte 102,68,15,111,29,42,28,0,0 // movdqa 0x1c2a(%rip),%xmm11 # 4740 <_sk_callback_sse41+0xd60>
.byte 102,69,15,235,235 // por %xmm11,%xmm13
.byte 102,69,15,254,236 // paddd %xmm12,%xmm13
.byte 102,69,15,223,197 // pandn %xmm13,%xmm8
@@ -20781,7 +20775,7 @@ _sk_load_u16_be_sse41:
.byte 102,15,235,200 // por %xmm0,%xmm1
.byte 102,15,56,51,193 // pmovzxwd %xmm1,%xmm0
.byte 15,91,192 // cvtdq2ps %xmm0,%xmm0
- .byte 68,15,40,5,245,26,0,0 // movaps 0x1af5(%rip),%xmm8 # 4750 <_sk_callback_sse41+0xd6c>
+ .byte 68,15,40,5,249,26,0,0 // movaps 0x1af9(%rip),%xmm8 # 4750 <_sk_callback_sse41+0xd70>
.byte 65,15,89,192 // mulps %xmm8,%xmm0
.byte 102,15,111,203 // movdqa %xmm3,%xmm1
.byte 102,15,113,241,8 // psllw $0x8,%xmm1
@@ -20833,7 +20827,7 @@ _sk_load_rgb_u16_be_sse41:
.byte 102,15,235,193 // por %xmm1,%xmm0
.byte 102,15,56,51,192 // pmovzxwd %xmm0,%xmm0
.byte 15,91,192 // cvtdq2ps %xmm0,%xmm0
- .byte 68,15,40,5,54,26,0,0 // movaps 0x1a36(%rip),%xmm8 # 4760 <_sk_callback_sse41+0xd7c>
+ .byte 68,15,40,5,58,26,0,0 // movaps 0x1a3a(%rip),%xmm8 # 4760 <_sk_callback_sse41+0xd80>
.byte 65,15,89,192 // mulps %xmm8,%xmm0
.byte 102,15,111,203 // movdqa %xmm3,%xmm1
.byte 102,15,113,241,8 // psllw $0x8,%xmm1
@@ -20850,7 +20844,7 @@ _sk_load_rgb_u16_be_sse41:
.byte 15,91,210 // cvtdq2ps %xmm2,%xmm2
.byte 65,15,89,208 // mulps %xmm8,%xmm2
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 15,40,29,253,25,0,0 // movaps 0x19fd(%rip),%xmm3 # 4770 <_sk_callback_sse41+0xd8c>
+ .byte 15,40,29,1,26,0,0 // movaps 0x1a01(%rip),%xmm3 # 4770 <_sk_callback_sse41+0xd90>
.byte 255,224 // jmpq *%rax
HIDDEN _sk_store_u16_be_sse41
@@ -20859,7 +20853,7 @@ FUNCTION(_sk_store_u16_be_sse41)
_sk_store_u16_be_sse41:
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 72,139,0 // mov (%rax),%rax
- .byte 68,15,40,13,254,25,0,0 // movaps 0x19fe(%rip),%xmm9 # 4780 <_sk_callback_sse41+0xd9c>
+ .byte 68,15,40,13,2,26,0,0 // movaps 0x1a02(%rip),%xmm9 # 4780 <_sk_callback_sse41+0xda0>
.byte 68,15,40,192 // movaps %xmm0,%xmm8
.byte 69,15,89,193 // mulps %xmm9,%xmm8
.byte 102,69,15,91,192 // cvtps2dq %xmm8,%xmm8
@@ -21082,10 +21076,10 @@ HIDDEN _sk_luminance_to_alpha_sse41
FUNCTION(_sk_luminance_to_alpha_sse41)
_sk_luminance_to_alpha_sse41:
.byte 15,40,218 // movaps %xmm2,%xmm3
- .byte 15,89,5,28,23,0,0 // mulps 0x171c(%rip),%xmm0 # 4790 <_sk_callback_sse41+0xdac>
- .byte 15,89,13,37,23,0,0 // mulps 0x1725(%rip),%xmm1 # 47a0 <_sk_callback_sse41+0xdbc>
+ .byte 15,89,5,32,23,0,0 // mulps 0x1720(%rip),%xmm0 # 4790 <_sk_callback_sse41+0xdb0>
+ .byte 15,89,13,41,23,0,0 // mulps 0x1729(%rip),%xmm1 # 47a0 <_sk_callback_sse41+0xdc0>
.byte 15,88,200 // addps %xmm0,%xmm1
- .byte 15,89,29,43,23,0,0 // mulps 0x172b(%rip),%xmm3 # 47b0 <_sk_callback_sse41+0xdcc>
+ .byte 15,89,29,47,23,0,0 // mulps 0x172f(%rip),%xmm3 # 47b0 <_sk_callback_sse41+0xdd0>
.byte 15,88,217 // addps %xmm1,%xmm3
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 15,87,192 // xorps %xmm0,%xmm0
@@ -21318,7 +21312,7 @@ _sk_linear_gradient_sse41:
.byte 69,15,198,237,0 // shufps $0x0,%xmm13,%xmm13
.byte 72,139,8 // mov (%rax),%rcx
.byte 72,133,201 // test %rcx,%rcx
- .byte 15,132,254,0,0,0 // je 3527 <_sk_linear_gradient_sse41+0x138>
+ .byte 15,132,254,0,0,0 // je 3523 <_sk_linear_gradient_sse41+0x138>
.byte 15,41,100,36,168 // movaps %xmm4,-0x58(%rsp)
.byte 15,41,108,36,184 // movaps %xmm5,-0x48(%rsp)
.byte 15,41,116,36,200 // movaps %xmm6,-0x38(%rsp)
@@ -21368,12 +21362,12 @@ _sk_linear_gradient_sse41:
.byte 15,40,196 // movaps %xmm4,%xmm0
.byte 72,131,192,36 // add $0x24,%rax
.byte 72,255,201 // dec %rcx
- .byte 15,133,65,255,255,255 // jne 3452 <_sk_linear_gradient_sse41+0x63>
+ .byte 15,133,65,255,255,255 // jne 344e <_sk_linear_gradient_sse41+0x63>
.byte 15,40,124,36,216 // movaps -0x28(%rsp),%xmm7
.byte 15,40,116,36,200 // movaps -0x38(%rsp),%xmm6
.byte 15,40,108,36,184 // movaps -0x48(%rsp),%xmm5
.byte 15,40,100,36,168 // movaps -0x58(%rsp),%xmm4
- .byte 235,13 // jmp 3534 <_sk_linear_gradient_sse41+0x145>
+ .byte 235,13 // jmp 3530 <_sk_linear_gradient_sse41+0x145>
.byte 15,87,201 // xorps %xmm1,%xmm1
.byte 15,87,210 // xorps %xmm2,%xmm2
.byte 15,87,219 // xorps %xmm3,%xmm3
@@ -21442,26 +21436,26 @@ _sk_xy_to_polar_unit_sse41:
.byte 69,15,94,226 // divps %xmm10,%xmm12
.byte 69,15,40,236 // movaps %xmm12,%xmm13
.byte 69,15,89,237 // mulps %xmm13,%xmm13
- .byte 68,15,40,21,180,17,0,0 // movaps 0x11b4(%rip),%xmm10 # 47c0 <_sk_callback_sse41+0xddc>
+ .byte 68,15,40,21,184,17,0,0 // movaps 0x11b8(%rip),%xmm10 # 47c0 <_sk_callback_sse41+0xde0>
.byte 69,15,89,213 // mulps %xmm13,%xmm10
- .byte 68,15,88,21,184,17,0,0 // addps 0x11b8(%rip),%xmm10 # 47d0 <_sk_callback_sse41+0xdec>
+ .byte 68,15,88,21,188,17,0,0 // addps 0x11bc(%rip),%xmm10 # 47d0 <_sk_callback_sse41+0xdf0>
.byte 69,15,89,213 // mulps %xmm13,%xmm10
- .byte 68,15,88,21,188,17,0,0 // addps 0x11bc(%rip),%xmm10 # 47e0 <_sk_callback_sse41+0xdfc>
+ .byte 68,15,88,21,192,17,0,0 // addps 0x11c0(%rip),%xmm10 # 47e0 <_sk_callback_sse41+0xe00>
.byte 69,15,89,213 // mulps %xmm13,%xmm10
- .byte 68,15,88,21,192,17,0,0 // addps 0x11c0(%rip),%xmm10 # 47f0 <_sk_callback_sse41+0xe0c>
+ .byte 68,15,88,21,196,17,0,0 // addps 0x11c4(%rip),%xmm10 # 47f0 <_sk_callback_sse41+0xe10>
.byte 69,15,89,212 // mulps %xmm12,%xmm10
.byte 65,15,194,195,1 // cmpltps %xmm11,%xmm0
- .byte 68,15,40,29,191,17,0,0 // movaps 0x11bf(%rip),%xmm11 # 4800 <_sk_callback_sse41+0xe1c>
+ .byte 68,15,40,29,195,17,0,0 // movaps 0x11c3(%rip),%xmm11 # 4800 <_sk_callback_sse41+0xe20>
.byte 69,15,92,218 // subps %xmm10,%xmm11
.byte 102,69,15,56,20,211 // blendvps %xmm0,%xmm11,%xmm10
.byte 69,15,194,200,1 // cmpltps %xmm8,%xmm9
- .byte 68,15,40,29,184,17,0,0 // movaps 0x11b8(%rip),%xmm11 # 4810 <_sk_callback_sse41+0xe2c>
+ .byte 68,15,40,29,188,17,0,0 // movaps 0x11bc(%rip),%xmm11 # 4810 <_sk_callback_sse41+0xe30>
.byte 69,15,92,218 // subps %xmm10,%xmm11
.byte 65,15,40,193 // movaps %xmm9,%xmm0
.byte 102,69,15,56,20,211 // blendvps %xmm0,%xmm11,%xmm10
.byte 15,40,193 // movaps %xmm1,%xmm0
.byte 65,15,194,192,1 // cmpltps %xmm8,%xmm0
- .byte 68,15,40,13,170,17,0,0 // movaps 0x11aa(%rip),%xmm9 # 4820 <_sk_callback_sse41+0xe3c>
+ .byte 68,15,40,13,174,17,0,0 // movaps 0x11ae(%rip),%xmm9 # 4820 <_sk_callback_sse41+0xe40>
.byte 69,15,92,202 // subps %xmm10,%xmm9
.byte 102,69,15,56,20,209 // blendvps %xmm0,%xmm9,%xmm10
.byte 69,15,194,194,7 // cmpordps %xmm10,%xmm8
@@ -21475,7 +21469,7 @@ HIDDEN _sk_save_xy_sse41
FUNCTION(_sk_save_xy_sse41)
_sk_save_xy_sse41:
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 68,15,40,5,149,17,0,0 // movaps 0x1195(%rip),%xmm8 # 4830 <_sk_callback_sse41+0xe4c>
+ .byte 68,15,40,5,153,17,0,0 // movaps 0x1199(%rip),%xmm8 # 4830 <_sk_callback_sse41+0xe50>
.byte 15,17,0 // movups %xmm0,(%rax)
.byte 68,15,40,200 // movaps %xmm0,%xmm9
.byte 69,15,88,200 // addps %xmm8,%xmm9
@@ -21519,8 +21513,8 @@ _sk_bilinear_nx_sse41:
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 15,16,0 // movups (%rax),%xmm0
.byte 68,15,16,64,64 // movups 0x40(%rax),%xmm8
- .byte 15,88,5,23,17,0,0 // addps 0x1117(%rip),%xmm0 # 4840 <_sk_callback_sse41+0xe5c>
- .byte 68,15,40,13,31,17,0,0 // movaps 0x111f(%rip),%xmm9 # 4850 <_sk_callback_sse41+0xe6c>
+ .byte 15,88,5,27,17,0,0 // addps 0x111b(%rip),%xmm0 # 4840 <_sk_callback_sse41+0xe60>
+ .byte 68,15,40,13,35,17,0,0 // movaps 0x1123(%rip),%xmm9 # 4850 <_sk_callback_sse41+0xe70>
.byte 69,15,92,200 // subps %xmm8,%xmm9
.byte 68,15,17,136,128,0,0,0 // movups %xmm9,0x80(%rax)
.byte 72,173 // lods %ds:(%rsi),%rax
@@ -21533,7 +21527,7 @@ _sk_bilinear_px_sse41:
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 15,16,0 // movups (%rax),%xmm0
.byte 68,15,16,64,64 // movups 0x40(%rax),%xmm8
- .byte 15,88,5,14,17,0,0 // addps 0x110e(%rip),%xmm0 # 4860 <_sk_callback_sse41+0xe7c>
+ .byte 15,88,5,18,17,0,0 // addps 0x1112(%rip),%xmm0 # 4860 <_sk_callback_sse41+0xe80>
.byte 68,15,17,128,128,0,0,0 // movups %xmm8,0x80(%rax)
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 255,224 // jmpq *%rax
@@ -21545,8 +21539,8 @@ _sk_bilinear_ny_sse41:
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 15,16,72,32 // movups 0x20(%rax),%xmm1
.byte 68,15,16,64,96 // movups 0x60(%rax),%xmm8
- .byte 15,88,13,0,17,0,0 // addps 0x1100(%rip),%xmm1 # 4870 <_sk_callback_sse41+0xe8c>
- .byte 68,15,40,13,8,17,0,0 // movaps 0x1108(%rip),%xmm9 # 4880 <_sk_callback_sse41+0xe9c>
+ .byte 15,88,13,4,17,0,0 // addps 0x1104(%rip),%xmm1 # 4870 <_sk_callback_sse41+0xe90>
+ .byte 68,15,40,13,12,17,0,0 // movaps 0x110c(%rip),%xmm9 # 4880 <_sk_callback_sse41+0xea0>
.byte 69,15,92,200 // subps %xmm8,%xmm9
.byte 68,15,17,136,160,0,0,0 // movups %xmm9,0xa0(%rax)
.byte 72,173 // lods %ds:(%rsi),%rax
@@ -21559,7 +21553,7 @@ _sk_bilinear_py_sse41:
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 15,16,72,32 // movups 0x20(%rax),%xmm1
.byte 68,15,16,64,96 // movups 0x60(%rax),%xmm8
- .byte 15,88,13,246,16,0,0 // addps 0x10f6(%rip),%xmm1 # 4890 <_sk_callback_sse41+0xeac>
+ .byte 15,88,13,250,16,0,0 // addps 0x10fa(%rip),%xmm1 # 4890 <_sk_callback_sse41+0xeb0>
.byte 68,15,17,128,160,0,0,0 // movups %xmm8,0xa0(%rax)
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 255,224 // jmpq *%rax
@@ -21571,13 +21565,13 @@ _sk_bicubic_n3x_sse41:
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 15,16,0 // movups (%rax),%xmm0
.byte 68,15,16,64,64 // movups 0x40(%rax),%xmm8
- .byte 15,88,5,233,16,0,0 // addps 0x10e9(%rip),%xmm0 # 48a0 <_sk_callback_sse41+0xebc>
- .byte 68,15,40,13,241,16,0,0 // movaps 0x10f1(%rip),%xmm9 # 48b0 <_sk_callback_sse41+0xecc>
+ .byte 15,88,5,237,16,0,0 // addps 0x10ed(%rip),%xmm0 # 48a0 <_sk_callback_sse41+0xec0>
+ .byte 68,15,40,13,245,16,0,0 // movaps 0x10f5(%rip),%xmm9 # 48b0 <_sk_callback_sse41+0xed0>
.byte 69,15,92,200 // subps %xmm8,%xmm9
.byte 69,15,40,193 // movaps %xmm9,%xmm8
.byte 69,15,89,192 // mulps %xmm8,%xmm8
- .byte 68,15,89,13,237,16,0,0 // mulps 0x10ed(%rip),%xmm9 # 48c0 <_sk_callback_sse41+0xedc>
- .byte 68,15,88,13,245,16,0,0 // addps 0x10f5(%rip),%xmm9 # 48d0 <_sk_callback_sse41+0xeec>
+ .byte 68,15,89,13,241,16,0,0 // mulps 0x10f1(%rip),%xmm9 # 48c0 <_sk_callback_sse41+0xee0>
+ .byte 68,15,88,13,249,16,0,0 // addps 0x10f9(%rip),%xmm9 # 48d0 <_sk_callback_sse41+0xef0>
.byte 69,15,89,200 // mulps %xmm8,%xmm9
.byte 68,15,17,136,128,0,0,0 // movups %xmm9,0x80(%rax)
.byte 72,173 // lods %ds:(%rsi),%rax
@@ -21590,16 +21584,16 @@ _sk_bicubic_n1x_sse41:
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 15,16,0 // movups (%rax),%xmm0
.byte 68,15,16,64,64 // movups 0x40(%rax),%xmm8
- .byte 15,88,5,228,16,0,0 // addps 0x10e4(%rip),%xmm0 # 48e0 <_sk_callback_sse41+0xefc>
- .byte 68,15,40,13,236,16,0,0 // movaps 0x10ec(%rip),%xmm9 # 48f0 <_sk_callback_sse41+0xf0c>
+ .byte 15,88,5,232,16,0,0 // addps 0x10e8(%rip),%xmm0 # 48e0 <_sk_callback_sse41+0xf00>
+ .byte 68,15,40,13,240,16,0,0 // movaps 0x10f0(%rip),%xmm9 # 48f0 <_sk_callback_sse41+0xf10>
.byte 69,15,92,200 // subps %xmm8,%xmm9
- .byte 68,15,40,5,240,16,0,0 // movaps 0x10f0(%rip),%xmm8 # 4900 <_sk_callback_sse41+0xf1c>
+ .byte 68,15,40,5,244,16,0,0 // movaps 0x10f4(%rip),%xmm8 # 4900 <_sk_callback_sse41+0xf20>
.byte 69,15,89,193 // mulps %xmm9,%xmm8
- .byte 68,15,88,5,244,16,0,0 // addps 0x10f4(%rip),%xmm8 # 4910 <_sk_callback_sse41+0xf2c>
+ .byte 68,15,88,5,248,16,0,0 // addps 0x10f8(%rip),%xmm8 # 4910 <_sk_callback_sse41+0xf30>
.byte 69,15,89,193 // mulps %xmm9,%xmm8
- .byte 68,15,88,5,248,16,0,0 // addps 0x10f8(%rip),%xmm8 # 4920 <_sk_callback_sse41+0xf3c>
+ .byte 68,15,88,5,252,16,0,0 // addps 0x10fc(%rip),%xmm8 # 4920 <_sk_callback_sse41+0xf40>
.byte 69,15,89,193 // mulps %xmm9,%xmm8
- .byte 68,15,88,5,252,16,0,0 // addps 0x10fc(%rip),%xmm8 # 4930 <_sk_callback_sse41+0xf4c>
+ .byte 68,15,88,5,0,17,0,0 // addps 0x1100(%rip),%xmm8 # 4930 <_sk_callback_sse41+0xf50>
.byte 68,15,17,128,128,0,0,0 // movups %xmm8,0x80(%rax)
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 255,224 // jmpq *%rax
@@ -21609,17 +21603,17 @@ HIDDEN _sk_bicubic_p1x_sse41
FUNCTION(_sk_bicubic_p1x_sse41)
_sk_bicubic_p1x_sse41:
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 68,15,40,5,246,16,0,0 // movaps 0x10f6(%rip),%xmm8 # 4940 <_sk_callback_sse41+0xf5c>
+ .byte 68,15,40,5,250,16,0,0 // movaps 0x10fa(%rip),%xmm8 # 4940 <_sk_callback_sse41+0xf60>
.byte 15,16,0 // movups (%rax),%xmm0
.byte 68,15,16,72,64 // movups 0x40(%rax),%xmm9
.byte 65,15,88,192 // addps %xmm8,%xmm0
- .byte 68,15,40,21,242,16,0,0 // movaps 0x10f2(%rip),%xmm10 # 4950 <_sk_callback_sse41+0xf6c>
+ .byte 68,15,40,21,246,16,0,0 // movaps 0x10f6(%rip),%xmm10 # 4950 <_sk_callback_sse41+0xf70>
.byte 69,15,89,209 // mulps %xmm9,%xmm10
- .byte 68,15,88,21,246,16,0,0 // addps 0x10f6(%rip),%xmm10 # 4960 <_sk_callback_sse41+0xf7c>
+ .byte 68,15,88,21,250,16,0,0 // addps 0x10fa(%rip),%xmm10 # 4960 <_sk_callback_sse41+0xf80>
.byte 69,15,89,209 // mulps %xmm9,%xmm10
.byte 69,15,88,208 // addps %xmm8,%xmm10
.byte 69,15,89,209 // mulps %xmm9,%xmm10
- .byte 68,15,88,21,242,16,0,0 // addps 0x10f2(%rip),%xmm10 # 4970 <_sk_callback_sse41+0xf8c>
+ .byte 68,15,88,21,246,16,0,0 // addps 0x10f6(%rip),%xmm10 # 4970 <_sk_callback_sse41+0xf90>
.byte 68,15,17,144,128,0,0,0 // movups %xmm10,0x80(%rax)
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 255,224 // jmpq *%rax
@@ -21631,11 +21625,11 @@ _sk_bicubic_p3x_sse41:
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 15,16,0 // movups (%rax),%xmm0
.byte 68,15,16,64,64 // movups 0x40(%rax),%xmm8
- .byte 15,88,5,229,16,0,0 // addps 0x10e5(%rip),%xmm0 # 4980 <_sk_callback_sse41+0xf9c>
+ .byte 15,88,5,233,16,0,0 // addps 0x10e9(%rip),%xmm0 # 4980 <_sk_callback_sse41+0xfa0>
.byte 69,15,40,200 // movaps %xmm8,%xmm9
.byte 69,15,89,201 // mulps %xmm9,%xmm9
- .byte 68,15,89,5,229,16,0,0 // mulps 0x10e5(%rip),%xmm8 # 4990 <_sk_callback_sse41+0xfac>
- .byte 68,15,88,5,237,16,0,0 // addps 0x10ed(%rip),%xmm8 # 49a0 <_sk_callback_sse41+0xfbc>
+ .byte 68,15,89,5,233,16,0,0 // mulps 0x10e9(%rip),%xmm8 # 4990 <_sk_callback_sse41+0xfb0>
+ .byte 68,15,88,5,241,16,0,0 // addps 0x10f1(%rip),%xmm8 # 49a0 <_sk_callback_sse41+0xfc0>
.byte 69,15,89,193 // mulps %xmm9,%xmm8
.byte 68,15,17,128,128,0,0,0 // movups %xmm8,0x80(%rax)
.byte 72,173 // lods %ds:(%rsi),%rax
@@ -21648,13 +21642,13 @@ _sk_bicubic_n3y_sse41:
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 15,16,72,32 // movups 0x20(%rax),%xmm1
.byte 68,15,16,64,96 // movups 0x60(%rax),%xmm8
- .byte 15,88,13,219,16,0,0 // addps 0x10db(%rip),%xmm1 # 49b0 <_sk_callback_sse41+0xfcc>
- .byte 68,15,40,13,227,16,0,0 // movaps 0x10e3(%rip),%xmm9 # 49c0 <_sk_callback_sse41+0xfdc>
+ .byte 15,88,13,223,16,0,0 // addps 0x10df(%rip),%xmm1 # 49b0 <_sk_callback_sse41+0xfd0>
+ .byte 68,15,40,13,231,16,0,0 // movaps 0x10e7(%rip),%xmm9 # 49c0 <_sk_callback_sse41+0xfe0>
.byte 69,15,92,200 // subps %xmm8,%xmm9
.byte 69,15,40,193 // movaps %xmm9,%xmm8
.byte 69,15,89,192 // mulps %xmm8,%xmm8
- .byte 68,15,89,13,223,16,0,0 // mulps 0x10df(%rip),%xmm9 # 49d0 <_sk_callback_sse41+0xfec>
- .byte 68,15,88,13,231,16,0,0 // addps 0x10e7(%rip),%xmm9 # 49e0 <_sk_callback_sse41+0xffc>
+ .byte 68,15,89,13,227,16,0,0 // mulps 0x10e3(%rip),%xmm9 # 49d0 <_sk_callback_sse41+0xff0>
+ .byte 68,15,88,13,235,16,0,0 // addps 0x10eb(%rip),%xmm9 # 49e0 <_sk_callback_sse41+0x1000>
.byte 69,15,89,200 // mulps %xmm8,%xmm9
.byte 68,15,17,136,160,0,0,0 // movups %xmm9,0xa0(%rax)
.byte 72,173 // lods %ds:(%rsi),%rax
@@ -21667,16 +21661,16 @@ _sk_bicubic_n1y_sse41:
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 15,16,72,32 // movups 0x20(%rax),%xmm1
.byte 68,15,16,64,96 // movups 0x60(%rax),%xmm8
- .byte 15,88,13,213,16,0,0 // addps 0x10d5(%rip),%xmm1 # 49f0 <_sk_callback_sse41+0x100c>
- .byte 68,15,40,13,221,16,0,0 // movaps 0x10dd(%rip),%xmm9 # 4a00 <_sk_callback_sse41+0x101c>
+ .byte 15,88,13,217,16,0,0 // addps 0x10d9(%rip),%xmm1 # 49f0 <_sk_callback_sse41+0x1010>
+ .byte 68,15,40,13,225,16,0,0 // movaps 0x10e1(%rip),%xmm9 # 4a00 <_sk_callback_sse41+0x1020>
.byte 69,15,92,200 // subps %xmm8,%xmm9
- .byte 68,15,40,5,225,16,0,0 // movaps 0x10e1(%rip),%xmm8 # 4a10 <_sk_callback_sse41+0x102c>
+ .byte 68,15,40,5,229,16,0,0 // movaps 0x10e5(%rip),%xmm8 # 4a10 <_sk_callback_sse41+0x1030>
.byte 69,15,89,193 // mulps %xmm9,%xmm8
- .byte 68,15,88,5,229,16,0,0 // addps 0x10e5(%rip),%xmm8 # 4a20 <_sk_callback_sse41+0x103c>
+ .byte 68,15,88,5,233,16,0,0 // addps 0x10e9(%rip),%xmm8 # 4a20 <_sk_callback_sse41+0x1040>
.byte 69,15,89,193 // mulps %xmm9,%xmm8
- .byte 68,15,88,5,233,16,0,0 // addps 0x10e9(%rip),%xmm8 # 4a30 <_sk_callback_sse41+0x104c>
+ .byte 68,15,88,5,237,16,0,0 // addps 0x10ed(%rip),%xmm8 # 4a30 <_sk_callback_sse41+0x1050>
.byte 69,15,89,193 // mulps %xmm9,%xmm8
- .byte 68,15,88,5,237,16,0,0 // addps 0x10ed(%rip),%xmm8 # 4a40 <_sk_callback_sse41+0x105c>
+ .byte 68,15,88,5,241,16,0,0 // addps 0x10f1(%rip),%xmm8 # 4a40 <_sk_callback_sse41+0x1060>
.byte 68,15,17,128,160,0,0,0 // movups %xmm8,0xa0(%rax)
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 255,224 // jmpq *%rax
@@ -21686,17 +21680,17 @@ HIDDEN _sk_bicubic_p1y_sse41
FUNCTION(_sk_bicubic_p1y_sse41)
_sk_bicubic_p1y_sse41:
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 68,15,40,5,231,16,0,0 // movaps 0x10e7(%rip),%xmm8 # 4a50 <_sk_callback_sse41+0x106c>
+ .byte 68,15,40,5,235,16,0,0 // movaps 0x10eb(%rip),%xmm8 # 4a50 <_sk_callback_sse41+0x1070>
.byte 15,16,72,32 // movups 0x20(%rax),%xmm1
.byte 68,15,16,72,96 // movups 0x60(%rax),%xmm9
.byte 65,15,88,200 // addps %xmm8,%xmm1
- .byte 68,15,40,21,226,16,0,0 // movaps 0x10e2(%rip),%xmm10 # 4a60 <_sk_callback_sse41+0x107c>
+ .byte 68,15,40,21,230,16,0,0 // movaps 0x10e6(%rip),%xmm10 # 4a60 <_sk_callback_sse41+0x1080>
.byte 69,15,89,209 // mulps %xmm9,%xmm10
- .byte 68,15,88,21,230,16,0,0 // addps 0x10e6(%rip),%xmm10 # 4a70 <_sk_callback_sse41+0x108c>
+ .byte 68,15,88,21,234,16,0,0 // addps 0x10ea(%rip),%xmm10 # 4a70 <_sk_callback_sse41+0x1090>
.byte 69,15,89,209 // mulps %xmm9,%xmm10
.byte 69,15,88,208 // addps %xmm8,%xmm10
.byte 69,15,89,209 // mulps %xmm9,%xmm10
- .byte 68,15,88,21,226,16,0,0 // addps 0x10e2(%rip),%xmm10 # 4a80 <_sk_callback_sse41+0x109c>
+ .byte 68,15,88,21,230,16,0,0 // addps 0x10e6(%rip),%xmm10 # 4a80 <_sk_callback_sse41+0x10a0>
.byte 68,15,17,144,160,0,0,0 // movups %xmm10,0xa0(%rax)
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 255,224 // jmpq *%rax
@@ -21708,11 +21702,11 @@ _sk_bicubic_p3y_sse41:
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 15,16,72,32 // movups 0x20(%rax),%xmm1
.byte 68,15,16,64,96 // movups 0x60(%rax),%xmm8
- .byte 15,88,13,212,16,0,0 // addps 0x10d4(%rip),%xmm1 # 4a90 <_sk_callback_sse41+0x10ac>
+ .byte 15,88,13,216,16,0,0 // addps 0x10d8(%rip),%xmm1 # 4a90 <_sk_callback_sse41+0x10b0>
.byte 69,15,40,200 // movaps %xmm8,%xmm9
.byte 69,15,89,201 // mulps %xmm9,%xmm9
- .byte 68,15,89,5,212,16,0,0 // mulps 0x10d4(%rip),%xmm8 # 4aa0 <_sk_callback_sse41+0x10bc>
- .byte 68,15,88,5,220,16,0,0 // addps 0x10dc(%rip),%xmm8 # 4ab0 <_sk_callback_sse41+0x10cc>
+ .byte 68,15,89,5,216,16,0,0 // mulps 0x10d8(%rip),%xmm8 # 4aa0 <_sk_callback_sse41+0x10c0>
+ .byte 68,15,88,5,224,16,0,0 // addps 0x10e0(%rip),%xmm8 # 4ab0 <_sk_callback_sse41+0x10d0>
.byte 69,15,89,193 // mulps %xmm9,%xmm8
.byte 68,15,17,128,160,0,0,0 // movups %xmm8,0xa0(%rax)
.byte 72,173 // lods %ds:(%rsi),%rax
@@ -21825,15 +21819,16 @@ BALIGN16
.byte 0,0 // add %al,(%rax)
.byte 2,0 // add (%rax),%al
.byte 0,0 // add %al,(%rax)
- .byte 33,8 // and %ecx,(%rax)
- .byte 130 // (bad)
- .byte 60,33 // cmp $0x21,%al
- .byte 8,130,60,33,8,130 // or %al,-0x7df7dec4(%rdx)
- .byte 60,33 // cmp $0x21,%al
- .byte 8,130,60,0,0,0 // or %al,0x3c(%rdx)
- .byte 191,0,0,0,191 // mov $0xbf000000,%edi
.byte 0,0 // add %al,(%rax)
- .byte 0,191,0,0,0,191 // add %bh,-0x41000000(%rdi)
+ .byte 128,60,0,0 // cmpb $0x0,(%rax,%rax,1)
+ .byte 128,60,0,0 // cmpb $0x0,(%rax,%rax,1)
+ .byte 128,60,0,0 // cmpb $0x0,(%rax,%rax,1)
+ .byte 128,60,0,0 // cmpb $0x0,(%rax,%rax,1)
+ .byte 252 // cld
+ .byte 190,0,0,252,190 // mov $0xbefc0000,%esi
+ .byte 0,0 // add %al,(%rax)
+ .byte 252 // cld
+ .byte 190,0,0,252,190 // mov $0xbefc0000,%esi
.byte 0,0 // add %al,(%rax)
.byte 128,63,0 // cmpb $0x0,(%rdi)
.byte 0,128,63,0,0,128 // add %al,-0x7fffffc1(%rax)
@@ -22199,10 +22194,10 @@ BALIGN16
.byte 0,1 // add %al,(%rcx)
.byte 255 // (bad)
.byte 255 // (bad)
- .byte 255,5,255,255,255,9 // incl 0x9ffffff(%rip) # a003eb8 <_sk_callback_sse41+0xa0004d4>
+ .byte 255,5,255,255,255,9 // incl 0x9ffffff(%rip) # a003eb8 <_sk_callback_sse41+0xa0004d8>
.byte 255 // (bad)
.byte 255 // (bad)
- .byte 255,13,255,255,255,2 // decl 0x2ffffff(%rip) # 3003ec0 <_sk_callback_sse41+0x30004dc>
+ .byte 255,13,255,255,255,2 // decl 0x2ffffff(%rip) # 3003ec0 <_sk_callback_sse41+0x30004e0>
.byte 255 // (bad)
.byte 255 // (bad)
.byte 255,6 // incl (%rsi)
@@ -22317,7 +22312,7 @@ BALIGN16
.byte 249 // stc
.byte 68,180,62 // rex.R mov $0x3e,%spl
.byte 163,233,220,63,163,233,220,63,163 // movabs %eax,0xa33fdce9a33fdce9
- .byte 233,220,63,163,233 // jmpq ffffffffe9a37fba <_sk_callback_sse41+0xffffffffe9a345d6>
+ .byte 233,220,63,163,233 // jmpq ffffffffe9a37fba <_sk_callback_sse41+0xffffffffe9a345da>
.byte 220,63 // fdivrl (%rdi)
.byte 81 // push %rcx
.byte 140,242 // mov %?,%edx
@@ -22413,7 +22408,7 @@ BALIGN16
.byte 249 // stc
.byte 68,180,62 // rex.R mov $0x3e,%spl
.byte 163,233,220,63,163,233,220,63,163 // movabs %eax,0xa33fdce9a33fdce9
- .byte 233,220,63,163,233 // jmpq ffffffffe9a3808a <_sk_callback_sse41+0xffffffffe9a346a6>
+ .byte 233,220,63,163,233 // jmpq ffffffffe9a3808a <_sk_callback_sse41+0xffffffffe9a346aa>
.byte 220,63 // fdivrl (%rdi)
.byte 81 // push %rcx
.byte 140,242 // mov %?,%edx
@@ -22509,7 +22504,7 @@ BALIGN16
.byte 249 // stc
.byte 68,180,62 // rex.R mov $0x3e,%spl
.byte 163,233,220,63,163,233,220,63,163 // movabs %eax,0xa33fdce9a33fdce9
- .byte 233,220,63,163,233 // jmpq ffffffffe9a3815a <_sk_callback_sse41+0xffffffffe9a34776>
+ .byte 233,220,63,163,233 // jmpq ffffffffe9a3815a <_sk_callback_sse41+0xffffffffe9a3477a>
.byte 220,63 // fdivrl (%rdi)
.byte 81 // push %rcx
.byte 140,242 // mov %?,%edx
@@ -22605,7 +22600,7 @@ BALIGN16
.byte 249 // stc
.byte 68,180,62 // rex.R mov $0x3e,%spl
.byte 163,233,220,63,163,233,220,63,163 // movabs %eax,0xa33fdce9a33fdce9
- .byte 233,220,63,163,233 // jmpq ffffffffe9a3822a <_sk_callback_sse41+0xffffffffe9a34846>
+ .byte 233,220,63,163,233 // jmpq ffffffffe9a3822a <_sk_callback_sse41+0xffffffffe9a3484a>
.byte 220,63 // fdivrl (%rdi)
.byte 81 // push %rcx
.byte 140,242 // mov %?,%edx
@@ -22763,7 +22758,7 @@ BALIGN16
.byte 5,255,255,255,9 // add $0x9ffffff,%eax
.byte 255 // (bad)
.byte 255 // (bad)
- .byte 255,13,255,255,255,2 // decl 0x2ffffff(%rip) # 3004410 <_sk_callback_sse41+0x3000a2c>
+ .byte 255,13,255,255,255,2 // decl 0x2ffffff(%rip) # 3004410 <_sk_callback_sse41+0x3000a30>
.byte 255 // (bad)
.byte 255 // (bad)
.byte 255,6 // incl (%rsi)
@@ -23005,7 +23000,7 @@ BALIGN16
.byte 5,255,255,255,9 // add $0x9ffffff,%eax
.byte 255 // (bad)
.byte 255 // (bad)
- .byte 255,13,255,255,255,2 // decl 0x2ffffff(%rip) # 3004660 <_sk_callback_sse41+0x3000c7c>
+ .byte 255,13,255,255,255,2 // decl 0x2ffffff(%rip) # 3004660 <_sk_callback_sse41+0x3000c80>
.byte 255 // (bad)
.byte 255 // (bad)
.byte 255,6 // incl (%rsi)
@@ -23032,7 +23027,7 @@ BALIGN16
.byte 5,255,255,255,9 // add $0x9ffffff,%eax
.byte 255 // (bad)
.byte 255 // (bad)
- .byte 255,13,255,255,255,2 // decl 0x2ffffff(%rip) # 30046a0 <_sk_callback_sse41+0x3000cbc>
+ .byte 255,13,255,255,255,2 // decl 0x2ffffff(%rip) # 30046a0 <_sk_callback_sse41+0x3000cc0>
.byte 255 // (bad)
.byte 255 // (bad)
.byte 255,6 // incl (%rsi)
@@ -23307,7 +23302,7 @@ BALIGN16
.byte 0,0 // add %al,(%rax)
.byte 0,63 // add %bh,(%rdi)
.byte 57,142,99,61,57,142 // cmp %ecx,-0x71c6c29d(%rsi)
- .byte 99,61,57,142,99,61 // movslq 0x3d638e39(%rip),%edi # 3d63d775 <_sk_callback_sse41+0x3d639d91>
+ .byte 99,61,57,142,99,61 // movslq 0x3d638e39(%rip),%edi # 3d63d775 <_sk_callback_sse41+0x3d639d95>
.byte 57,142,99,61,0,0 // cmp %ecx,0x3d63(%rsi)
.byte 0,63 // add %bh,(%rdi)
.byte 0,0 // add %al,(%rax)
@@ -23333,7 +23328,7 @@ BALIGN16
.byte 0,192 // add %al,%al
.byte 63 // (bad)
.byte 57,142,99,61,57,142 // cmp %ecx,-0x71c6c29d(%rsi)
- .byte 99,61,57,142,99,61 // movslq 0x3d638e39(%rip),%edi # 3d63d7b5 <_sk_callback_sse41+0x3d639dd1>
+ .byte 99,61,57,142,99,61 // movslq 0x3d638e39(%rip),%edi # 3d63d7b5 <_sk_callback_sse41+0x3d639dd5>
.byte 57,142,99,61,0,0 // cmp %ecx,0x3d63(%rsi)
.byte 192,63,0 // sarb $0x0,(%rdi)
.byte 0,192 // add %al,%al
@@ -23417,7 +23412,7 @@ BALIGN16
.byte 0,0 // add %al,(%rax)
.byte 0,63 // add %bh,(%rdi)
.byte 57,142,99,61,57,142 // cmp %ecx,-0x71c6c29d(%rsi)
- .byte 99,61,57,142,99,61 // movslq 0x3d638e39(%rip),%edi # 3d63d885 <_sk_callback_sse41+0x3d639ea1>
+ .byte 99,61,57,142,99,61 // movslq 0x3d638e39(%rip),%edi # 3d63d885 <_sk_callback_sse41+0x3d639ea5>
.byte 57,142,99,61,0,0 // cmp %ecx,0x3d63(%rsi)
.byte 0,63 // add %bh,(%rdi)
.byte 0,0 // add %al,(%rax)
@@ -23443,7 +23438,7 @@ BALIGN16
.byte 0,192 // add %al,%al
.byte 63 // (bad)
.byte 57,142,99,61,57,142 // cmp %ecx,-0x71c6c29d(%rsi)
- .byte 99,61,57,142,99,61 // movslq 0x3d638e39(%rip),%edi # 3d63d8c5 <_sk_callback_sse41+0x3d639ee1>
+ .byte 99,61,57,142,99,61 // movslq 0x3d638e39(%rip),%edi # 3d63d8c5 <_sk_callback_sse41+0x3d639ee5>
.byte 57,142,99,61,0,0 // cmp %ecx,0x3d63(%rsi)
.byte 192,63,0 // sarb $0x0,(%rdi)
.byte 0,192 // add %al,%al
@@ -23454,11 +23449,11 @@ BALIGN16
.byte 63 // (bad)
.byte 114,28 // jb 4abe <.literal16+0xffe>
.byte 199 // (bad)
- .byte 62,114,28 // jb,pt 4ac2 <_sk_callback_sse41+0x10de>
+ .byte 62,114,28 // jb,pt 4ac2 <_sk_callback_sse41+0x10e2>
.byte 199 // (bad)
- .byte 62,114,28 // jb,pt 4ac6 <_sk_callback_sse41+0x10e2>
+ .byte 62,114,28 // jb,pt 4ac6 <_sk_callback_sse41+0x10e6>
.byte 199 // (bad)
- .byte 62,114,28 // jb,pt 4aca <_sk_callback_sse41+0x10e6>
+ .byte 62,114,28 // jb,pt 4aca <_sk_callback_sse41+0x10ea>
.byte 199 // (bad)
.byte 62,171 // ds stos %eax,%es:(%rdi)
.byte 170 // stos %al,%es:(%rdi)
@@ -23528,7 +23523,7 @@ _sk_seed_shader_sse2:
.byte 102,15,110,199 // movd %edi,%xmm0
.byte 102,15,112,192,0 // pshufd $0x0,%xmm0,%xmm0
.byte 15,91,200 // cvtdq2ps %xmm0,%xmm1
- .byte 15,40,21,196,62,0,0 // movaps 0x3ec4(%rip),%xmm2 # 3f40 <_sk_callback_sse2+0xe0>
+ .byte 15,40,21,196,62,0,0 // movaps 0x3ec4(%rip),%xmm2 # 3f40 <_sk_callback_sse2+0xe4>
.byte 15,88,202 // addps %xmm2,%xmm1
.byte 15,16,2 // movups (%rdx),%xmm0
.byte 15,88,193 // addps %xmm1,%xmm0
@@ -23537,7 +23532,7 @@ _sk_seed_shader_sse2:
.byte 15,91,201 // cvtdq2ps %xmm1,%xmm1
.byte 15,88,202 // addps %xmm2,%xmm1
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 15,40,21,179,62,0,0 // movaps 0x3eb3(%rip),%xmm2 # 3f50 <_sk_callback_sse2+0xf0>
+ .byte 15,40,21,179,62,0,0 // movaps 0x3eb3(%rip),%xmm2 # 3f50 <_sk_callback_sse2+0xf4>
.byte 15,87,219 // xorps %xmm3,%xmm3
.byte 15,87,228 // xorps %xmm4,%xmm4
.byte 15,87,237 // xorps %xmm5,%xmm5
@@ -23560,14 +23555,14 @@ _sk_dither_sse2:
.byte 102,68,15,110,1 // movd (%rcx),%xmm8
.byte 102,69,15,112,192,0 // pshufd $0x0,%xmm8,%xmm8
.byte 102,69,15,239,193 // pxor %xmm9,%xmm8
- .byte 102,68,15,111,21,120,62,0,0 // movdqa 0x3e78(%rip),%xmm10 # 3f60 <_sk_callback_sse2+0x100>
+ .byte 102,68,15,111,21,120,62,0,0 // movdqa 0x3e78(%rip),%xmm10 # 3f60 <_sk_callback_sse2+0x104>
.byte 102,69,15,111,216 // movdqa %xmm8,%xmm11
.byte 102,69,15,219,218 // pand %xmm10,%xmm11
.byte 102,65,15,114,243,5 // pslld $0x5,%xmm11
.byte 102,69,15,219,209 // pand %xmm9,%xmm10
.byte 102,65,15,114,242,4 // pslld $0x4,%xmm10
- .byte 102,68,15,111,37,100,62,0,0 // movdqa 0x3e64(%rip),%xmm12 # 3f70 <_sk_callback_sse2+0x110>
- .byte 102,68,15,111,45,107,62,0,0 // movdqa 0x3e6b(%rip),%xmm13 # 3f80 <_sk_callback_sse2+0x120>
+ .byte 102,68,15,111,37,100,62,0,0 // movdqa 0x3e64(%rip),%xmm12 # 3f70 <_sk_callback_sse2+0x114>
+ .byte 102,68,15,111,45,107,62,0,0 // movdqa 0x3e6b(%rip),%xmm13 # 3f80 <_sk_callback_sse2+0x124>
.byte 102,69,15,111,240 // movdqa %xmm8,%xmm14
.byte 102,69,15,219,245 // pand %xmm13,%xmm14
.byte 102,65,15,114,246,2 // pslld $0x2,%xmm14
@@ -23583,12 +23578,11 @@ _sk_dither_sse2:
.byte 102,69,15,235,245 // por %xmm13,%xmm14
.byte 102,69,15,235,240 // por %xmm8,%xmm14
.byte 69,15,91,198 // cvtdq2ps %xmm14,%xmm8
- .byte 68,15,89,5,38,62,0,0 // mulps 0x3e26(%rip),%xmm8 # 3f90 <_sk_callback_sse2+0x130>
- .byte 68,15,88,5,46,62,0,0 // addps 0x3e2e(%rip),%xmm8 # 3fa0 <_sk_callback_sse2+0x140>
+ .byte 68,15,89,5,38,62,0,0 // mulps 0x3e26(%rip),%xmm8 # 3f90 <_sk_callback_sse2+0x134>
+ .byte 68,15,88,5,46,62,0,0 // addps 0x3e2e(%rip),%xmm8 # 3fa0 <_sk_callback_sse2+0x144>
.byte 243,68,15,16,72,8 // movss 0x8(%rax),%xmm9
.byte 69,15,198,201,0 // shufps $0x0,%xmm9,%xmm9
.byte 69,15,89,200 // mulps %xmm8,%xmm9
- .byte 68,15,89,203 // mulps %xmm3,%xmm9
.byte 65,15,88,193 // addps %xmm9,%xmm0
.byte 65,15,88,201 // addps %xmm9,%xmm1
.byte 65,15,88,209 // addps %xmm9,%xmm2
@@ -23627,7 +23621,7 @@ HIDDEN _sk_srcatop_sse2
FUNCTION(_sk_srcatop_sse2)
_sk_srcatop_sse2:
.byte 15,89,199 // mulps %xmm7,%xmm0
- .byte 68,15,40,5,215,61,0,0 // movaps 0x3dd7(%rip),%xmm8 # 3fb0 <_sk_callback_sse2+0x150>
+ .byte 68,15,40,5,219,61,0,0 // movaps 0x3ddb(%rip),%xmm8 # 3fb0 <_sk_callback_sse2+0x154>
.byte 68,15,92,195 // subps %xmm3,%xmm8
.byte 69,15,40,200 // movaps %xmm8,%xmm9
.byte 68,15,89,204 // mulps %xmm4,%xmm9
@@ -23652,7 +23646,7 @@ FUNCTION(_sk_dstatop_sse2)
_sk_dstatop_sse2:
.byte 68,15,40,195 // movaps %xmm3,%xmm8
.byte 68,15,89,196 // mulps %xmm4,%xmm8
- .byte 68,15,40,13,154,61,0,0 // movaps 0x3d9a(%rip),%xmm9 # 3fc0 <_sk_callback_sse2+0x160>
+ .byte 68,15,40,13,158,61,0,0 // movaps 0x3d9e(%rip),%xmm9 # 3fc0 <_sk_callback_sse2+0x164>
.byte 68,15,92,207 // subps %xmm7,%xmm9
.byte 65,15,89,193 // mulps %xmm9,%xmm0
.byte 65,15,88,192 // addps %xmm8,%xmm0
@@ -23699,7 +23693,7 @@ HIDDEN _sk_srcout_sse2
.globl _sk_srcout_sse2
FUNCTION(_sk_srcout_sse2)
_sk_srcout_sse2:
- .byte 68,15,40,5,62,61,0,0 // movaps 0x3d3e(%rip),%xmm8 # 3fd0 <_sk_callback_sse2+0x170>
+ .byte 68,15,40,5,66,61,0,0 // movaps 0x3d42(%rip),%xmm8 # 3fd0 <_sk_callback_sse2+0x174>
.byte 68,15,92,199 // subps %xmm7,%xmm8
.byte 65,15,89,192 // mulps %xmm8,%xmm0
.byte 65,15,89,200 // mulps %xmm8,%xmm1
@@ -23712,7 +23706,7 @@ HIDDEN _sk_dstout_sse2
.globl _sk_dstout_sse2
FUNCTION(_sk_dstout_sse2)
_sk_dstout_sse2:
- .byte 68,15,40,5,46,61,0,0 // movaps 0x3d2e(%rip),%xmm8 # 3fe0 <_sk_callback_sse2+0x180>
+ .byte 68,15,40,5,50,61,0,0 // movaps 0x3d32(%rip),%xmm8 # 3fe0 <_sk_callback_sse2+0x184>
.byte 68,15,92,195 // subps %xmm3,%xmm8
.byte 65,15,40,192 // movaps %xmm8,%xmm0
.byte 15,89,196 // mulps %xmm4,%xmm0
@@ -23729,7 +23723,7 @@ HIDDEN _sk_srcover_sse2
.globl _sk_srcover_sse2
FUNCTION(_sk_srcover_sse2)
_sk_srcover_sse2:
- .byte 68,15,40,5,17,61,0,0 // movaps 0x3d11(%rip),%xmm8 # 3ff0 <_sk_callback_sse2+0x190>
+ .byte 68,15,40,5,21,61,0,0 // movaps 0x3d15(%rip),%xmm8 # 3ff0 <_sk_callback_sse2+0x194>
.byte 68,15,92,195 // subps %xmm3,%xmm8
.byte 69,15,40,200 // movaps %xmm8,%xmm9
.byte 68,15,89,204 // mulps %xmm4,%xmm9
@@ -23749,7 +23743,7 @@ HIDDEN _sk_dstover_sse2
.globl _sk_dstover_sse2
FUNCTION(_sk_dstover_sse2)
_sk_dstover_sse2:
- .byte 68,15,40,5,229,60,0,0 // movaps 0x3ce5(%rip),%xmm8 # 4000 <_sk_callback_sse2+0x1a0>
+ .byte 68,15,40,5,233,60,0,0 // movaps 0x3ce9(%rip),%xmm8 # 4000 <_sk_callback_sse2+0x1a4>
.byte 68,15,92,199 // subps %xmm7,%xmm8
.byte 65,15,89,192 // mulps %xmm8,%xmm0
.byte 15,88,196 // addps %xmm4,%xmm0
@@ -23777,7 +23771,7 @@ HIDDEN _sk_multiply_sse2
.globl _sk_multiply_sse2
FUNCTION(_sk_multiply_sse2)
_sk_multiply_sse2:
- .byte 68,15,40,5,185,60,0,0 // movaps 0x3cb9(%rip),%xmm8 # 4010 <_sk_callback_sse2+0x1b0>
+ .byte 68,15,40,5,189,60,0,0 // movaps 0x3cbd(%rip),%xmm8 # 4010 <_sk_callback_sse2+0x1b4>
.byte 69,15,40,200 // movaps %xmm8,%xmm9
.byte 68,15,92,207 // subps %xmm7,%xmm9
.byte 69,15,40,209 // movaps %xmm9,%xmm10
@@ -23853,7 +23847,7 @@ HIDDEN _sk_xor__sse2
FUNCTION(_sk_xor__sse2)
_sk_xor__sse2:
.byte 68,15,40,195 // movaps %xmm3,%xmm8
- .byte 15,40,29,234,59,0,0 // movaps 0x3bea(%rip),%xmm3 # 4020 <_sk_callback_sse2+0x1c0>
+ .byte 15,40,29,238,59,0,0 // movaps 0x3bee(%rip),%xmm3 # 4020 <_sk_callback_sse2+0x1c4>
.byte 68,15,40,203 // movaps %xmm3,%xmm9
.byte 68,15,92,207 // subps %xmm7,%xmm9
.byte 65,15,89,193 // mulps %xmm9,%xmm0
@@ -23901,7 +23895,7 @@ _sk_darken_sse2:
.byte 68,15,89,206 // mulps %xmm6,%xmm9
.byte 65,15,95,209 // maxps %xmm9,%xmm2
.byte 68,15,92,194 // subps %xmm2,%xmm8
- .byte 15,40,21,85,59,0,0 // movaps 0x3b55(%rip),%xmm2 # 4030 <_sk_callback_sse2+0x1d0>
+ .byte 15,40,21,89,59,0,0 // movaps 0x3b59(%rip),%xmm2 # 4030 <_sk_callback_sse2+0x1d4>
.byte 15,92,211 // subps %xmm3,%xmm2
.byte 15,89,215 // mulps %xmm7,%xmm2
.byte 15,88,218 // addps %xmm2,%xmm3
@@ -23935,7 +23929,7 @@ _sk_lighten_sse2:
.byte 68,15,89,206 // mulps %xmm6,%xmm9
.byte 65,15,93,209 // minps %xmm9,%xmm2
.byte 68,15,92,194 // subps %xmm2,%xmm8
- .byte 15,40,21,250,58,0,0 // movaps 0x3afa(%rip),%xmm2 # 4040 <_sk_callback_sse2+0x1e0>
+ .byte 15,40,21,254,58,0,0 // movaps 0x3afe(%rip),%xmm2 # 4040 <_sk_callback_sse2+0x1e4>
.byte 15,92,211 // subps %xmm3,%xmm2
.byte 15,89,215 // mulps %xmm7,%xmm2
.byte 15,88,218 // addps %xmm2,%xmm3
@@ -23972,7 +23966,7 @@ _sk_difference_sse2:
.byte 65,15,93,209 // minps %xmm9,%xmm2
.byte 15,88,210 // addps %xmm2,%xmm2
.byte 68,15,92,194 // subps %xmm2,%xmm8
- .byte 15,40,21,148,58,0,0 // movaps 0x3a94(%rip),%xmm2 # 4050 <_sk_callback_sse2+0x1f0>
+ .byte 15,40,21,152,58,0,0 // movaps 0x3a98(%rip),%xmm2 # 4050 <_sk_callback_sse2+0x1f4>
.byte 15,92,211 // subps %xmm3,%xmm2
.byte 15,89,215 // mulps %xmm7,%xmm2
.byte 15,88,218 // addps %xmm2,%xmm3
@@ -23999,7 +23993,7 @@ _sk_exclusion_sse2:
.byte 15,89,214 // mulps %xmm6,%xmm2
.byte 15,88,210 // addps %xmm2,%xmm2
.byte 68,15,92,202 // subps %xmm2,%xmm9
- .byte 15,40,13,85,58,0,0 // movaps 0x3a55(%rip),%xmm1 # 4060 <_sk_callback_sse2+0x200>
+ .byte 15,40,13,89,58,0,0 // movaps 0x3a59(%rip),%xmm1 # 4060 <_sk_callback_sse2+0x204>
.byte 15,92,203 // subps %xmm3,%xmm1
.byte 15,89,207 // mulps %xmm7,%xmm1
.byte 15,88,217 // addps %xmm1,%xmm3
@@ -24013,7 +24007,7 @@ HIDDEN _sk_colorburn_sse2
FUNCTION(_sk_colorburn_sse2)
_sk_colorburn_sse2:
.byte 68,15,40,192 // movaps %xmm0,%xmm8
- .byte 68,15,40,21,68,58,0,0 // movaps 0x3a44(%rip),%xmm10 # 4070 <_sk_callback_sse2+0x210>
+ .byte 68,15,40,21,72,58,0,0 // movaps 0x3a48(%rip),%xmm10 # 4070 <_sk_callback_sse2+0x214>
.byte 69,15,40,202 // movaps %xmm10,%xmm9
.byte 68,15,92,207 // subps %xmm7,%xmm9
.byte 69,15,40,217 // movaps %xmm9,%xmm11
@@ -24107,7 +24101,7 @@ HIDDEN _sk_colordodge_sse2
FUNCTION(_sk_colordodge_sse2)
_sk_colordodge_sse2:
.byte 68,15,40,200 // movaps %xmm0,%xmm9
- .byte 68,15,40,21,250,56,0,0 // movaps 0x38fa(%rip),%xmm10 # 4080 <_sk_callback_sse2+0x220>
+ .byte 68,15,40,21,254,56,0,0 // movaps 0x38fe(%rip),%xmm10 # 4080 <_sk_callback_sse2+0x224>
.byte 69,15,40,218 // movaps %xmm10,%xmm11
.byte 68,15,92,223 // subps %xmm7,%xmm11
.byte 69,15,40,227 // movaps %xmm11,%xmm12
@@ -24201,7 +24195,7 @@ _sk_hardlight_sse2:
.byte 15,41,116,36,232 // movaps %xmm6,-0x18(%rsp)
.byte 15,40,245 // movaps %xmm5,%xmm6
.byte 15,40,236 // movaps %xmm4,%xmm5
- .byte 68,15,40,29,175,55,0,0 // movaps 0x37af(%rip),%xmm11 # 4090 <_sk_callback_sse2+0x230>
+ .byte 68,15,40,29,179,55,0,0 // movaps 0x37b3(%rip),%xmm11 # 4090 <_sk_callback_sse2+0x234>
.byte 69,15,40,211 // movaps %xmm11,%xmm10
.byte 68,15,92,215 // subps %xmm7,%xmm10
.byte 69,15,40,194 // movaps %xmm10,%xmm8
@@ -24289,7 +24283,7 @@ FUNCTION(_sk_overlay_sse2)
_sk_overlay_sse2:
.byte 68,15,40,193 // movaps %xmm1,%xmm8
.byte 68,15,40,232 // movaps %xmm0,%xmm13
- .byte 68,15,40,13,125,54,0,0 // movaps 0x367d(%rip),%xmm9 # 40a0 <_sk_callback_sse2+0x240>
+ .byte 68,15,40,13,129,54,0,0 // movaps 0x3681(%rip),%xmm9 # 40a0 <_sk_callback_sse2+0x244>
.byte 69,15,40,209 // movaps %xmm9,%xmm10
.byte 68,15,92,215 // subps %xmm7,%xmm10
.byte 69,15,40,218 // movaps %xmm10,%xmm11
@@ -24380,7 +24374,7 @@ _sk_softlight_sse2:
.byte 68,15,40,213 // movaps %xmm5,%xmm10
.byte 68,15,94,215 // divps %xmm7,%xmm10
.byte 69,15,84,212 // andps %xmm12,%xmm10
- .byte 68,15,40,13,58,53,0,0 // movaps 0x353a(%rip),%xmm9 # 40b0 <_sk_callback_sse2+0x250>
+ .byte 68,15,40,13,62,53,0,0 // movaps 0x353e(%rip),%xmm9 # 40b0 <_sk_callback_sse2+0x254>
.byte 69,15,40,249 // movaps %xmm9,%xmm15
.byte 69,15,92,250 // subps %xmm10,%xmm15
.byte 69,15,40,218 // movaps %xmm10,%xmm11
@@ -24393,10 +24387,10 @@ _sk_softlight_sse2:
.byte 65,15,40,194 // movaps %xmm10,%xmm0
.byte 15,89,192 // mulps %xmm0,%xmm0
.byte 65,15,88,194 // addps %xmm10,%xmm0
- .byte 68,15,40,53,20,53,0,0 // movaps 0x3514(%rip),%xmm14 # 40c0 <_sk_callback_sse2+0x260>
+ .byte 68,15,40,53,24,53,0,0 // movaps 0x3518(%rip),%xmm14 # 40c0 <_sk_callback_sse2+0x264>
.byte 69,15,88,222 // addps %xmm14,%xmm11
.byte 68,15,89,216 // mulps %xmm0,%xmm11
- .byte 68,15,40,21,20,53,0,0 // movaps 0x3514(%rip),%xmm10 # 40d0 <_sk_callback_sse2+0x270>
+ .byte 68,15,40,21,24,53,0,0 // movaps 0x3518(%rip),%xmm10 # 40d0 <_sk_callback_sse2+0x274>
.byte 69,15,89,234 // mulps %xmm10,%xmm13
.byte 69,15,88,235 // addps %xmm11,%xmm13
.byte 15,88,228 // addps %xmm4,%xmm4
@@ -24548,7 +24542,7 @@ HIDDEN _sk_clamp_1_sse2
.globl _sk_clamp_1_sse2
FUNCTION(_sk_clamp_1_sse2)
_sk_clamp_1_sse2:
- .byte 68,15,40,5,35,51,0,0 // movaps 0x3323(%rip),%xmm8 # 40e0 <_sk_callback_sse2+0x280>
+ .byte 68,15,40,5,39,51,0,0 // movaps 0x3327(%rip),%xmm8 # 40e0 <_sk_callback_sse2+0x284>
.byte 65,15,93,192 // minps %xmm8,%xmm0
.byte 65,15,93,200 // minps %xmm8,%xmm1
.byte 65,15,93,208 // minps %xmm8,%xmm2
@@ -24560,7 +24554,7 @@ HIDDEN _sk_clamp_a_sse2
.globl _sk_clamp_a_sse2
FUNCTION(_sk_clamp_a_sse2)
_sk_clamp_a_sse2:
- .byte 15,93,29,24,51,0,0 // minps 0x3318(%rip),%xmm3 # 40f0 <_sk_callback_sse2+0x290>
+ .byte 15,93,29,28,51,0,0 // minps 0x331c(%rip),%xmm3 # 40f0 <_sk_callback_sse2+0x294>
.byte 15,93,195 // minps %xmm3,%xmm0
.byte 15,93,203 // minps %xmm3,%xmm1
.byte 15,93,211 // minps %xmm3,%xmm2
@@ -24647,7 +24641,7 @@ HIDDEN _sk_unpremul_sse2
FUNCTION(_sk_unpremul_sse2)
_sk_unpremul_sse2:
.byte 69,15,87,192 // xorps %xmm8,%xmm8
- .byte 68,15,40,13,131,50,0,0 // movaps 0x3283(%rip),%xmm9 # 4100 <_sk_callback_sse2+0x2a0>
+ .byte 68,15,40,13,135,50,0,0 // movaps 0x3287(%rip),%xmm9 # 4100 <_sk_callback_sse2+0x2a4>
.byte 68,15,94,203 // divps %xmm3,%xmm9
.byte 68,15,194,195,4 // cmpneqps %xmm3,%xmm8
.byte 69,15,84,193 // andps %xmm9,%xmm8
@@ -24661,20 +24655,20 @@ HIDDEN _sk_from_srgb_sse2
.globl _sk_from_srgb_sse2
FUNCTION(_sk_from_srgb_sse2)
_sk_from_srgb_sse2:
- .byte 68,15,40,5,110,50,0,0 // movaps 0x326e(%rip),%xmm8 # 4110 <_sk_callback_sse2+0x2b0>
+ .byte 68,15,40,5,114,50,0,0 // movaps 0x3272(%rip),%xmm8 # 4110 <_sk_callback_sse2+0x2b4>
.byte 68,15,40,232 // movaps %xmm0,%xmm13
.byte 69,15,89,232 // mulps %xmm8,%xmm13
.byte 68,15,40,216 // movaps %xmm0,%xmm11
.byte 69,15,89,219 // mulps %xmm11,%xmm11
- .byte 68,15,40,13,102,50,0,0 // movaps 0x3266(%rip),%xmm9 # 4120 <_sk_callback_sse2+0x2c0>
+ .byte 68,15,40,13,106,50,0,0 // movaps 0x326a(%rip),%xmm9 # 4120 <_sk_callback_sse2+0x2c4>
.byte 68,15,40,240 // movaps %xmm0,%xmm14
.byte 69,15,89,241 // mulps %xmm9,%xmm14
- .byte 68,15,40,21,102,50,0,0 // movaps 0x3266(%rip),%xmm10 # 4130 <_sk_callback_sse2+0x2d0>
+ .byte 68,15,40,21,106,50,0,0 // movaps 0x326a(%rip),%xmm10 # 4130 <_sk_callback_sse2+0x2d4>
.byte 69,15,88,242 // addps %xmm10,%xmm14
.byte 69,15,89,243 // mulps %xmm11,%xmm14
- .byte 68,15,40,29,102,50,0,0 // movaps 0x3266(%rip),%xmm11 # 4140 <_sk_callback_sse2+0x2e0>
+ .byte 68,15,40,29,106,50,0,0 // movaps 0x326a(%rip),%xmm11 # 4140 <_sk_callback_sse2+0x2e4>
.byte 69,15,88,243 // addps %xmm11,%xmm14
- .byte 68,15,40,37,106,50,0,0 // movaps 0x326a(%rip),%xmm12 # 4150 <_sk_callback_sse2+0x2f0>
+ .byte 68,15,40,37,110,50,0,0 // movaps 0x326e(%rip),%xmm12 # 4150 <_sk_callback_sse2+0x2f4>
.byte 65,15,194,196,1 // cmpltps %xmm12,%xmm0
.byte 68,15,84,232 // andps %xmm0,%xmm13
.byte 65,15,85,198 // andnps %xmm14,%xmm0
@@ -24713,20 +24707,20 @@ _sk_to_srgb_sse2:
.byte 68,15,82,192 // rsqrtps %xmm0,%xmm8
.byte 69,15,83,200 // rcpps %xmm8,%xmm9
.byte 69,15,82,232 // rsqrtps %xmm8,%xmm13
- .byte 68,15,40,5,239,49,0,0 // movaps 0x31ef(%rip),%xmm8 # 4160 <_sk_callback_sse2+0x300>
+ .byte 68,15,40,5,243,49,0,0 // movaps 0x31f3(%rip),%xmm8 # 4160 <_sk_callback_sse2+0x304>
.byte 68,15,40,240 // movaps %xmm0,%xmm14
.byte 69,15,89,240 // mulps %xmm8,%xmm14
- .byte 68,15,40,21,239,49,0,0 // movaps 0x31ef(%rip),%xmm10 # 4170 <_sk_callback_sse2+0x310>
+ .byte 68,15,40,21,243,49,0,0 // movaps 0x31f3(%rip),%xmm10 # 4170 <_sk_callback_sse2+0x314>
.byte 69,15,89,202 // mulps %xmm10,%xmm9
- .byte 68,15,40,29,243,49,0,0 // movaps 0x31f3(%rip),%xmm11 # 4180 <_sk_callback_sse2+0x320>
+ .byte 68,15,40,29,247,49,0,0 // movaps 0x31f7(%rip),%xmm11 # 4180 <_sk_callback_sse2+0x324>
.byte 69,15,88,203 // addps %xmm11,%xmm9
- .byte 68,15,40,37,247,49,0,0 // movaps 0x31f7(%rip),%xmm12 # 4190 <_sk_callback_sse2+0x330>
+ .byte 68,15,40,37,251,49,0,0 // movaps 0x31fb(%rip),%xmm12 # 4190 <_sk_callback_sse2+0x334>
.byte 69,15,89,236 // mulps %xmm12,%xmm13
.byte 69,15,88,233 // addps %xmm9,%xmm13
- .byte 68,15,40,13,247,49,0,0 // movaps 0x31f7(%rip),%xmm9 # 41a0 <_sk_callback_sse2+0x340>
+ .byte 68,15,40,13,251,49,0,0 // movaps 0x31fb(%rip),%xmm9 # 41a0 <_sk_callback_sse2+0x344>
.byte 69,15,40,249 // movaps %xmm9,%xmm15
.byte 69,15,93,253 // minps %xmm13,%xmm15
- .byte 68,15,40,45,247,49,0,0 // movaps 0x31f7(%rip),%xmm13 # 41b0 <_sk_callback_sse2+0x350>
+ .byte 68,15,40,45,251,49,0,0 // movaps 0x31fb(%rip),%xmm13 # 41b0 <_sk_callback_sse2+0x354>
.byte 65,15,194,197,1 // cmpltps %xmm13,%xmm0
.byte 68,15,84,240 // andps %xmm0,%xmm14
.byte 65,15,85,199 // andnps %xmm15,%xmm0
@@ -24776,7 +24770,7 @@ _sk_rgb_to_hsl_sse2:
.byte 68,15,93,218 // minps %xmm2,%xmm11
.byte 65,15,40,202 // movaps %xmm10,%xmm1
.byte 65,15,92,203 // subps %xmm11,%xmm1
- .byte 68,15,40,45,80,49,0,0 // movaps 0x3150(%rip),%xmm13 # 41c0 <_sk_callback_sse2+0x360>
+ .byte 68,15,40,45,84,49,0,0 // movaps 0x3154(%rip),%xmm13 # 41c0 <_sk_callback_sse2+0x364>
.byte 68,15,94,233 // divps %xmm1,%xmm13
.byte 65,15,40,194 // movaps %xmm10,%xmm0
.byte 65,15,194,192,0 // cmpeqps %xmm8,%xmm0
@@ -24785,30 +24779,30 @@ _sk_rgb_to_hsl_sse2:
.byte 69,15,89,229 // mulps %xmm13,%xmm12
.byte 69,15,40,241 // movaps %xmm9,%xmm14
.byte 68,15,194,242,1 // cmpltps %xmm2,%xmm14
- .byte 68,15,84,53,54,49,0,0 // andps 0x3136(%rip),%xmm14 # 41d0 <_sk_callback_sse2+0x370>
+ .byte 68,15,84,53,58,49,0,0 // andps 0x313a(%rip),%xmm14 # 41d0 <_sk_callback_sse2+0x374>
.byte 69,15,88,244 // addps %xmm12,%xmm14
.byte 69,15,40,250 // movaps %xmm10,%xmm15
.byte 69,15,194,249,0 // cmpeqps %xmm9,%xmm15
.byte 65,15,92,208 // subps %xmm8,%xmm2
.byte 65,15,89,213 // mulps %xmm13,%xmm2
- .byte 68,15,40,37,41,49,0,0 // movaps 0x3129(%rip),%xmm12 # 41e0 <_sk_callback_sse2+0x380>
+ .byte 68,15,40,37,45,49,0,0 // movaps 0x312d(%rip),%xmm12 # 41e0 <_sk_callback_sse2+0x384>
.byte 65,15,88,212 // addps %xmm12,%xmm2
.byte 69,15,92,193 // subps %xmm9,%xmm8
.byte 69,15,89,197 // mulps %xmm13,%xmm8
- .byte 68,15,88,5,37,49,0,0 // addps 0x3125(%rip),%xmm8 # 41f0 <_sk_callback_sse2+0x390>
+ .byte 68,15,88,5,41,49,0,0 // addps 0x3129(%rip),%xmm8 # 41f0 <_sk_callback_sse2+0x394>
.byte 65,15,84,215 // andps %xmm15,%xmm2
.byte 69,15,85,248 // andnps %xmm8,%xmm15
.byte 68,15,86,250 // orps %xmm2,%xmm15
.byte 68,15,84,240 // andps %xmm0,%xmm14
.byte 65,15,85,199 // andnps %xmm15,%xmm0
.byte 65,15,86,198 // orps %xmm14,%xmm0
- .byte 15,89,5,22,49,0,0 // mulps 0x3116(%rip),%xmm0 # 4200 <_sk_callback_sse2+0x3a0>
+ .byte 15,89,5,26,49,0,0 // mulps 0x311a(%rip),%xmm0 # 4200 <_sk_callback_sse2+0x3a4>
.byte 69,15,40,194 // movaps %xmm10,%xmm8
.byte 69,15,194,195,4 // cmpneqps %xmm11,%xmm8
.byte 65,15,84,192 // andps %xmm8,%xmm0
.byte 69,15,92,226 // subps %xmm10,%xmm12
.byte 69,15,88,211 // addps %xmm11,%xmm10
- .byte 68,15,40,13,9,49,0,0 // movaps 0x3109(%rip),%xmm9 # 4210 <_sk_callback_sse2+0x3b0>
+ .byte 68,15,40,13,13,49,0,0 // movaps 0x310d(%rip),%xmm9 # 4210 <_sk_callback_sse2+0x3b4>
.byte 65,15,40,210 // movaps %xmm10,%xmm2
.byte 65,15,89,209 // mulps %xmm9,%xmm2
.byte 68,15,194,202,1 // cmpltps %xmm2,%xmm9
@@ -24832,7 +24826,7 @@ _sk_hsl_to_rgb_sse2:
.byte 15,41,92,36,168 // movaps %xmm3,-0x58(%rsp)
.byte 68,15,40,218 // movaps %xmm2,%xmm11
.byte 15,40,240 // movaps %xmm0,%xmm6
- .byte 68,15,40,13,200,48,0,0 // movaps 0x30c8(%rip),%xmm9 # 4220 <_sk_callback_sse2+0x3c0>
+ .byte 68,15,40,13,204,48,0,0 // movaps 0x30cc(%rip),%xmm9 # 4220 <_sk_callback_sse2+0x3c4>
.byte 69,15,40,209 // movaps %xmm9,%xmm10
.byte 69,15,194,211,2 // cmpleps %xmm11,%xmm10
.byte 15,40,193 // movaps %xmm1,%xmm0
@@ -24849,28 +24843,28 @@ _sk_hsl_to_rgb_sse2:
.byte 69,15,88,211 // addps %xmm11,%xmm10
.byte 69,15,88,219 // addps %xmm11,%xmm11
.byte 69,15,92,218 // subps %xmm10,%xmm11
- .byte 15,40,5,145,48,0,0 // movaps 0x3091(%rip),%xmm0 # 4230 <_sk_callback_sse2+0x3d0>
+ .byte 15,40,5,149,48,0,0 // movaps 0x3095(%rip),%xmm0 # 4230 <_sk_callback_sse2+0x3d4>
.byte 15,88,198 // addps %xmm6,%xmm0
.byte 243,15,91,200 // cvttps2dq %xmm0,%xmm1
.byte 15,91,201 // cvtdq2ps %xmm1,%xmm1
.byte 15,40,216 // movaps %xmm0,%xmm3
.byte 15,194,217,1 // cmpltps %xmm1,%xmm3
- .byte 15,84,29,137,48,0,0 // andps 0x3089(%rip),%xmm3 # 4240 <_sk_callback_sse2+0x3e0>
+ .byte 15,84,29,141,48,0,0 // andps 0x308d(%rip),%xmm3 # 4240 <_sk_callback_sse2+0x3e4>
.byte 15,92,203 // subps %xmm3,%xmm1
.byte 15,92,193 // subps %xmm1,%xmm0
- .byte 68,15,40,45,139,48,0,0 // movaps 0x308b(%rip),%xmm13 # 4250 <_sk_callback_sse2+0x3f0>
+ .byte 68,15,40,45,143,48,0,0 // movaps 0x308f(%rip),%xmm13 # 4250 <_sk_callback_sse2+0x3f4>
.byte 69,15,40,197 // movaps %xmm13,%xmm8
.byte 68,15,194,192,2 // cmpleps %xmm0,%xmm8
.byte 69,15,40,242 // movaps %xmm10,%xmm14
.byte 69,15,92,243 // subps %xmm11,%xmm14
.byte 65,15,40,217 // movaps %xmm9,%xmm3
.byte 15,194,216,2 // cmpleps %xmm0,%xmm3
- .byte 15,40,21,155,48,0,0 // movaps 0x309b(%rip),%xmm2 # 4280 <_sk_callback_sse2+0x420>
+ .byte 15,40,21,159,48,0,0 // movaps 0x309f(%rip),%xmm2 # 4280 <_sk_callback_sse2+0x424>
.byte 68,15,40,250 // movaps %xmm2,%xmm15
.byte 68,15,194,248,2 // cmpleps %xmm0,%xmm15
- .byte 15,40,13,107,48,0,0 // movaps 0x306b(%rip),%xmm1 # 4260 <_sk_callback_sse2+0x400>
+ .byte 15,40,13,111,48,0,0 // movaps 0x306f(%rip),%xmm1 # 4260 <_sk_callback_sse2+0x404>
.byte 15,89,193 // mulps %xmm1,%xmm0
- .byte 15,40,45,113,48,0,0 // movaps 0x3071(%rip),%xmm5 # 4270 <_sk_callback_sse2+0x410>
+ .byte 15,40,45,117,48,0,0 // movaps 0x3075(%rip),%xmm5 # 4270 <_sk_callback_sse2+0x414>
.byte 15,40,229 // movaps %xmm5,%xmm4
.byte 15,92,224 // subps %xmm0,%xmm4
.byte 65,15,89,230 // mulps %xmm14,%xmm4
@@ -24893,7 +24887,7 @@ _sk_hsl_to_rgb_sse2:
.byte 15,91,192 // cvtdq2ps %xmm0,%xmm0
.byte 15,40,222 // movaps %xmm6,%xmm3
.byte 15,194,216,1 // cmpltps %xmm0,%xmm3
- .byte 15,84,29,230,47,0,0 // andps 0x2fe6(%rip),%xmm3 # 4240 <_sk_callback_sse2+0x3e0>
+ .byte 15,84,29,234,47,0,0 // andps 0x2fea(%rip),%xmm3 # 4240 <_sk_callback_sse2+0x3e4>
.byte 15,92,195 // subps %xmm3,%xmm0
.byte 68,15,40,230 // movaps %xmm6,%xmm12
.byte 68,15,92,224 // subps %xmm0,%xmm12
@@ -24923,12 +24917,12 @@ _sk_hsl_to_rgb_sse2:
.byte 15,40,124,36,136 // movaps -0x78(%rsp),%xmm7
.byte 15,40,231 // movaps %xmm7,%xmm4
.byte 15,85,227 // andnps %xmm3,%xmm4
- .byte 15,88,53,190,47,0,0 // addps 0x2fbe(%rip),%xmm6 # 4290 <_sk_callback_sse2+0x430>
+ .byte 15,88,53,194,47,0,0 // addps 0x2fc2(%rip),%xmm6 # 4290 <_sk_callback_sse2+0x434>
.byte 243,15,91,198 // cvttps2dq %xmm6,%xmm0
.byte 15,91,192 // cvtdq2ps %xmm0,%xmm0
.byte 15,40,222 // movaps %xmm6,%xmm3
.byte 15,194,216,1 // cmpltps %xmm0,%xmm3
- .byte 15,84,29,89,47,0,0 // andps 0x2f59(%rip),%xmm3 # 4240 <_sk_callback_sse2+0x3e0>
+ .byte 15,84,29,93,47,0,0 // andps 0x2f5d(%rip),%xmm3 # 4240 <_sk_callback_sse2+0x3e4>
.byte 15,92,195 // subps %xmm3,%xmm0
.byte 15,92,240 // subps %xmm0,%xmm6
.byte 15,89,206 // mulps %xmm6,%xmm1
@@ -24992,7 +24986,7 @@ _sk_scale_u8_sse2:
.byte 102,69,15,96,193 // punpcklbw %xmm9,%xmm8
.byte 102,69,15,97,193 // punpcklwd %xmm9,%xmm8
.byte 69,15,91,192 // cvtdq2ps %xmm8,%xmm8
- .byte 68,15,89,5,231,46,0,0 // mulps 0x2ee7(%rip),%xmm8 # 42a0 <_sk_callback_sse2+0x440>
+ .byte 68,15,89,5,235,46,0,0 // mulps 0x2eeb(%rip),%xmm8 # 42a0 <_sk_callback_sse2+0x444>
.byte 65,15,89,192 // mulps %xmm8,%xmm0
.byte 65,15,89,200 // mulps %xmm8,%xmm1
.byte 65,15,89,208 // mulps %xmm8,%xmm2
@@ -25033,7 +25027,7 @@ _sk_lerp_u8_sse2:
.byte 102,69,15,96,193 // punpcklbw %xmm9,%xmm8
.byte 102,69,15,97,193 // punpcklwd %xmm9,%xmm8
.byte 69,15,91,192 // cvtdq2ps %xmm8,%xmm8
- .byte 68,15,89,5,133,46,0,0 // mulps 0x2e85(%rip),%xmm8 # 42b0 <_sk_callback_sse2+0x450>
+ .byte 68,15,89,5,137,46,0,0 // mulps 0x2e89(%rip),%xmm8 # 42b0 <_sk_callback_sse2+0x454>
.byte 15,92,196 // subps %xmm4,%xmm0
.byte 65,15,89,192 // mulps %xmm8,%xmm0
.byte 15,88,196 // addps %xmm4,%xmm0
@@ -25058,17 +25052,17 @@ _sk_lerp_565_sse2:
.byte 243,68,15,126,4,120 // movq (%rax,%rdi,2),%xmm8
.byte 102,15,239,219 // pxor %xmm3,%xmm3
.byte 102,68,15,97,195 // punpcklwd %xmm3,%xmm8
- .byte 102,15,111,29,77,46,0,0 // movdqa 0x2e4d(%rip),%xmm3 # 42c0 <_sk_callback_sse2+0x460>
+ .byte 102,15,111,29,81,46,0,0 // movdqa 0x2e51(%rip),%xmm3 # 42c0 <_sk_callback_sse2+0x464>
.byte 102,65,15,219,216 // pand %xmm8,%xmm3
.byte 68,15,91,203 // cvtdq2ps %xmm3,%xmm9
- .byte 68,15,89,13,76,46,0,0 // mulps 0x2e4c(%rip),%xmm9 # 42d0 <_sk_callback_sse2+0x470>
- .byte 102,15,111,29,84,46,0,0 // movdqa 0x2e54(%rip),%xmm3 # 42e0 <_sk_callback_sse2+0x480>
+ .byte 68,15,89,13,80,46,0,0 // mulps 0x2e50(%rip),%xmm9 # 42d0 <_sk_callback_sse2+0x474>
+ .byte 102,15,111,29,88,46,0,0 // movdqa 0x2e58(%rip),%xmm3 # 42e0 <_sk_callback_sse2+0x484>
.byte 102,65,15,219,216 // pand %xmm8,%xmm3
.byte 15,91,219 // cvtdq2ps %xmm3,%xmm3
- .byte 15,89,29,85,46,0,0 // mulps 0x2e55(%rip),%xmm3 # 42f0 <_sk_callback_sse2+0x490>
- .byte 102,68,15,219,5,92,46,0,0 // pand 0x2e5c(%rip),%xmm8 # 4300 <_sk_callback_sse2+0x4a0>
+ .byte 15,89,29,89,46,0,0 // mulps 0x2e59(%rip),%xmm3 # 42f0 <_sk_callback_sse2+0x494>
+ .byte 102,68,15,219,5,96,46,0,0 // pand 0x2e60(%rip),%xmm8 # 4300 <_sk_callback_sse2+0x4a4>
.byte 69,15,91,192 // cvtdq2ps %xmm8,%xmm8
- .byte 68,15,89,5,96,46,0,0 // mulps 0x2e60(%rip),%xmm8 # 4310 <_sk_callback_sse2+0x4b0>
+ .byte 68,15,89,5,100,46,0,0 // mulps 0x2e64(%rip),%xmm8 # 4310 <_sk_callback_sse2+0x4b4>
.byte 15,92,196 // subps %xmm4,%xmm0
.byte 65,15,89,193 // mulps %xmm9,%xmm0
.byte 15,88,196 // addps %xmm4,%xmm0
@@ -25079,7 +25073,7 @@ _sk_lerp_565_sse2:
.byte 65,15,89,208 // mulps %xmm8,%xmm2
.byte 15,88,214 // addps %xmm6,%xmm2
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 15,40,29,74,46,0,0 // movaps 0x2e4a(%rip),%xmm3 # 4320 <_sk_callback_sse2+0x4c0>
+ .byte 15,40,29,78,46,0,0 // movaps 0x2e4e(%rip),%xmm3 # 4320 <_sk_callback_sse2+0x4c4>
.byte 255,224 // jmpq *%rax
HIDDEN _sk_load_tables_sse2
@@ -25090,7 +25084,7 @@ _sk_load_tables_sse2:
.byte 76,139,0 // mov (%rax),%r8
.byte 76,139,72,8 // mov 0x8(%rax),%r9
.byte 243,69,15,111,12,184 // movdqu (%r8,%rdi,4),%xmm9
- .byte 102,68,15,111,5,64,46,0,0 // movdqa 0x2e40(%rip),%xmm8 # 4330 <_sk_callback_sse2+0x4d0>
+ .byte 102,68,15,111,5,68,46,0,0 // movdqa 0x2e44(%rip),%xmm8 # 4330 <_sk_callback_sse2+0x4d4>
.byte 102,65,15,111,193 // movdqa %xmm9,%xmm0
.byte 102,65,15,219,192 // pand %xmm8,%xmm0
.byte 102,15,112,200,78 // pshufd $0x4e,%xmm0,%xmm1
@@ -25145,7 +25139,7 @@ _sk_load_tables_sse2:
.byte 65,15,20,208 // unpcklps %xmm8,%xmm2
.byte 102,65,15,114,209,24 // psrld $0x18,%xmm9
.byte 65,15,91,217 // cvtdq2ps %xmm9,%xmm3
- .byte 15,89,29,77,45,0,0 // mulps 0x2d4d(%rip),%xmm3 # 4340 <_sk_callback_sse2+0x4e0>
+ .byte 15,89,29,81,45,0,0 // mulps 0x2d51(%rip),%xmm3 # 4340 <_sk_callback_sse2+0x4e4>
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 255,224 // jmpq *%rax
@@ -25164,7 +25158,7 @@ _sk_load_tables_u16_be_sse2:
.byte 102,65,15,111,201 // movdqa %xmm9,%xmm1
.byte 102,15,97,200 // punpcklwd %xmm0,%xmm1
.byte 102,68,15,105,200 // punpckhwd %xmm0,%xmm9
- .byte 102,68,15,111,21,32,45,0,0 // movdqa 0x2d20(%rip),%xmm10 # 4350 <_sk_callback_sse2+0x4f0>
+ .byte 102,68,15,111,21,36,45,0,0 // movdqa 0x2d24(%rip),%xmm10 # 4350 <_sk_callback_sse2+0x4f4>
.byte 102,15,111,193 // movdqa %xmm1,%xmm0
.byte 102,65,15,219,194 // pand %xmm10,%xmm0
.byte 102,69,15,239,192 // pxor %xmm8,%xmm8
@@ -25225,7 +25219,7 @@ _sk_load_tables_u16_be_sse2:
.byte 102,65,15,235,217 // por %xmm9,%xmm3
.byte 102,65,15,97,216 // punpcklwd %xmm8,%xmm3
.byte 15,91,219 // cvtdq2ps %xmm3,%xmm3
- .byte 15,89,29,15,44,0,0 // mulps 0x2c0f(%rip),%xmm3 # 4360 <_sk_callback_sse2+0x500>
+ .byte 15,89,29,19,44,0,0 // mulps 0x2c13(%rip),%xmm3 # 4360 <_sk_callback_sse2+0x504>
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 255,224 // jmpq *%rax
@@ -25247,7 +25241,7 @@ _sk_load_tables_rgb_u16_be_sse2:
.byte 102,68,15,97,208 // punpcklwd %xmm0,%xmm10
.byte 102,65,15,111,195 // movdqa %xmm11,%xmm0
.byte 102,65,15,97,194 // punpcklwd %xmm10,%xmm0
- .byte 102,68,15,111,5,207,43,0,0 // movdqa 0x2bcf(%rip),%xmm8 # 4370 <_sk_callback_sse2+0x510>
+ .byte 102,68,15,111,5,211,43,0,0 // movdqa 0x2bd3(%rip),%xmm8 # 4370 <_sk_callback_sse2+0x514>
.byte 102,15,112,200,78 // pshufd $0x4e,%xmm0,%xmm1
.byte 102,65,15,219,192 // pand %xmm8,%xmm0
.byte 102,69,15,239,201 // pxor %xmm9,%xmm9
@@ -25302,7 +25296,7 @@ _sk_load_tables_rgb_u16_be_sse2:
.byte 15,20,211 // unpcklps %xmm3,%xmm2
.byte 65,15,20,208 // unpcklps %xmm8,%xmm2
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 15,40,29,222,42,0,0 // movaps 0x2ade(%rip),%xmm3 # 4380 <_sk_callback_sse2+0x520>
+ .byte 15,40,29,226,42,0,0 // movaps 0x2ae2(%rip),%xmm3 # 4380 <_sk_callback_sse2+0x524>
.byte 255,224 // jmpq *%rax
HIDDEN _sk_byte_tables_sse2
@@ -25312,7 +25306,7 @@ _sk_byte_tables_sse2:
.byte 65,86 // push %r14
.byte 83 // push %rbx
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 68,15,40,5,223,42,0,0 // movaps 0x2adf(%rip),%xmm8 # 4390 <_sk_callback_sse2+0x530>
+ .byte 68,15,40,5,227,42,0,0 // movaps 0x2ae3(%rip),%xmm8 # 4390 <_sk_callback_sse2+0x534>
.byte 65,15,89,192 // mulps %xmm8,%xmm0
.byte 102,15,91,192 // cvtps2dq %xmm0,%xmm0
.byte 102,72,15,126,193 // movq %xmm0,%rcx
@@ -25339,7 +25333,7 @@ _sk_byte_tables_sse2:
.byte 102,65,15,96,193 // punpcklbw %xmm9,%xmm0
.byte 102,65,15,97,193 // punpcklwd %xmm9,%xmm0
.byte 15,91,192 // cvtdq2ps %xmm0,%xmm0
- .byte 68,15,40,21,124,42,0,0 // movaps 0x2a7c(%rip),%xmm10 # 43a0 <_sk_callback_sse2+0x540>
+ .byte 68,15,40,21,128,42,0,0 // movaps 0x2a80(%rip),%xmm10 # 43a0 <_sk_callback_sse2+0x544>
.byte 65,15,89,194 // mulps %xmm10,%xmm0
.byte 65,15,89,200 // mulps %xmm8,%xmm1
.byte 102,15,91,201 // cvtps2dq %xmm1,%xmm1
@@ -25455,7 +25449,7 @@ _sk_byte_tables_rgb_sse2:
.byte 102,65,15,96,193 // punpcklbw %xmm9,%xmm0
.byte 102,65,15,97,193 // punpcklwd %xmm9,%xmm0
.byte 15,91,192 // cvtdq2ps %xmm0,%xmm0
- .byte 68,15,40,21,207,40,0,0 // movaps 0x28cf(%rip),%xmm10 # 43b0 <_sk_callback_sse2+0x550>
+ .byte 68,15,40,21,211,40,0,0 // movaps 0x28d3(%rip),%xmm10 # 43b0 <_sk_callback_sse2+0x554>
.byte 65,15,89,194 // mulps %xmm10,%xmm0
.byte 65,15,89,200 // mulps %xmm8,%xmm1
.byte 102,15,91,201 // cvtps2dq %xmm1,%xmm1
@@ -25652,15 +25646,15 @@ _sk_parametric_r_sse2:
.byte 69,15,88,209 // addps %xmm9,%xmm10
.byte 69,15,198,219,0 // shufps $0x0,%xmm11,%xmm11
.byte 69,15,91,202 // cvtdq2ps %xmm10,%xmm9
- .byte 68,15,89,13,14,38,0,0 // mulps 0x260e(%rip),%xmm9 # 43c0 <_sk_callback_sse2+0x560>
- .byte 68,15,84,21,22,38,0,0 // andps 0x2616(%rip),%xmm10 # 43d0 <_sk_callback_sse2+0x570>
- .byte 68,15,86,21,30,38,0,0 // orps 0x261e(%rip),%xmm10 # 43e0 <_sk_callback_sse2+0x580>
- .byte 68,15,88,13,38,38,0,0 // addps 0x2626(%rip),%xmm9 # 43f0 <_sk_callback_sse2+0x590>
- .byte 68,15,40,37,46,38,0,0 // movaps 0x262e(%rip),%xmm12 # 4400 <_sk_callback_sse2+0x5a0>
+ .byte 68,15,89,13,18,38,0,0 // mulps 0x2612(%rip),%xmm9 # 43c0 <_sk_callback_sse2+0x564>
+ .byte 68,15,84,21,26,38,0,0 // andps 0x261a(%rip),%xmm10 # 43d0 <_sk_callback_sse2+0x574>
+ .byte 68,15,86,21,34,38,0,0 // orps 0x2622(%rip),%xmm10 # 43e0 <_sk_callback_sse2+0x584>
+ .byte 68,15,88,13,42,38,0,0 // addps 0x262a(%rip),%xmm9 # 43f0 <_sk_callback_sse2+0x594>
+ .byte 68,15,40,37,50,38,0,0 // movaps 0x2632(%rip),%xmm12 # 4400 <_sk_callback_sse2+0x5a4>
.byte 69,15,89,226 // mulps %xmm10,%xmm12
.byte 69,15,92,204 // subps %xmm12,%xmm9
- .byte 68,15,88,21,46,38,0,0 // addps 0x262e(%rip),%xmm10 # 4410 <_sk_callback_sse2+0x5b0>
- .byte 68,15,40,37,54,38,0,0 // movaps 0x2636(%rip),%xmm12 # 4420 <_sk_callback_sse2+0x5c0>
+ .byte 68,15,88,21,50,38,0,0 // addps 0x2632(%rip),%xmm10 # 4410 <_sk_callback_sse2+0x5b4>
+ .byte 68,15,40,37,58,38,0,0 // movaps 0x263a(%rip),%xmm12 # 4420 <_sk_callback_sse2+0x5c4>
.byte 69,15,94,226 // divps %xmm10,%xmm12
.byte 69,15,92,204 // subps %xmm12,%xmm9
.byte 69,15,89,203 // mulps %xmm11,%xmm9
@@ -25668,22 +25662,22 @@ _sk_parametric_r_sse2:
.byte 69,15,91,226 // cvtdq2ps %xmm10,%xmm12
.byte 69,15,40,233 // movaps %xmm9,%xmm13
.byte 69,15,194,236,1 // cmpltps %xmm12,%xmm13
- .byte 68,15,40,21,32,38,0,0 // movaps 0x2620(%rip),%xmm10 # 4430 <_sk_callback_sse2+0x5d0>
+ .byte 68,15,40,21,36,38,0,0 // movaps 0x2624(%rip),%xmm10 # 4430 <_sk_callback_sse2+0x5d4>
.byte 69,15,84,234 // andps %xmm10,%xmm13
.byte 69,15,87,219 // xorps %xmm11,%xmm11
.byte 69,15,92,229 // subps %xmm13,%xmm12
.byte 69,15,40,233 // movaps %xmm9,%xmm13
.byte 69,15,92,236 // subps %xmm12,%xmm13
- .byte 68,15,88,13,20,38,0,0 // addps 0x2614(%rip),%xmm9 # 4440 <_sk_callback_sse2+0x5e0>
- .byte 68,15,40,37,28,38,0,0 // movaps 0x261c(%rip),%xmm12 # 4450 <_sk_callback_sse2+0x5f0>
+ .byte 68,15,88,13,24,38,0,0 // addps 0x2618(%rip),%xmm9 # 4440 <_sk_callback_sse2+0x5e4>
+ .byte 68,15,40,37,32,38,0,0 // movaps 0x2620(%rip),%xmm12 # 4450 <_sk_callback_sse2+0x5f4>
.byte 69,15,89,229 // mulps %xmm13,%xmm12
.byte 69,15,92,204 // subps %xmm12,%xmm9
- .byte 68,15,40,37,28,38,0,0 // movaps 0x261c(%rip),%xmm12 # 4460 <_sk_callback_sse2+0x600>
+ .byte 68,15,40,37,32,38,0,0 // movaps 0x2620(%rip),%xmm12 # 4460 <_sk_callback_sse2+0x604>
.byte 69,15,92,229 // subps %xmm13,%xmm12
- .byte 68,15,40,45,32,38,0,0 // movaps 0x2620(%rip),%xmm13 # 4470 <_sk_callback_sse2+0x610>
+ .byte 68,15,40,45,36,38,0,0 // movaps 0x2624(%rip),%xmm13 # 4470 <_sk_callback_sse2+0x614>
.byte 69,15,94,236 // divps %xmm12,%xmm13
.byte 69,15,88,233 // addps %xmm9,%xmm13
- .byte 68,15,89,45,32,38,0,0 // mulps 0x2620(%rip),%xmm13 # 4480 <_sk_callback_sse2+0x620>
+ .byte 68,15,89,45,36,38,0,0 // mulps 0x2624(%rip),%xmm13 # 4480 <_sk_callback_sse2+0x624>
.byte 102,69,15,91,205 // cvtps2dq %xmm13,%xmm9
.byte 243,68,15,16,96,20 // movss 0x14(%rax),%xmm12
.byte 69,15,198,228,0 // shufps $0x0,%xmm12,%xmm12
@@ -25719,15 +25713,15 @@ _sk_parametric_g_sse2:
.byte 69,15,88,209 // addps %xmm9,%xmm10
.byte 69,15,198,219,0 // shufps $0x0,%xmm11,%xmm11
.byte 69,15,91,202 // cvtdq2ps %xmm10,%xmm9
- .byte 68,15,89,13,160,37,0,0 // mulps 0x25a0(%rip),%xmm9 # 4490 <_sk_callback_sse2+0x630>
- .byte 68,15,84,21,168,37,0,0 // andps 0x25a8(%rip),%xmm10 # 44a0 <_sk_callback_sse2+0x640>
- .byte 68,15,86,21,176,37,0,0 // orps 0x25b0(%rip),%xmm10 # 44b0 <_sk_callback_sse2+0x650>
- .byte 68,15,88,13,184,37,0,0 // addps 0x25b8(%rip),%xmm9 # 44c0 <_sk_callback_sse2+0x660>
- .byte 68,15,40,37,192,37,0,0 // movaps 0x25c0(%rip),%xmm12 # 44d0 <_sk_callback_sse2+0x670>
+ .byte 68,15,89,13,164,37,0,0 // mulps 0x25a4(%rip),%xmm9 # 4490 <_sk_callback_sse2+0x634>
+ .byte 68,15,84,21,172,37,0,0 // andps 0x25ac(%rip),%xmm10 # 44a0 <_sk_callback_sse2+0x644>
+ .byte 68,15,86,21,180,37,0,0 // orps 0x25b4(%rip),%xmm10 # 44b0 <_sk_callback_sse2+0x654>
+ .byte 68,15,88,13,188,37,0,0 // addps 0x25bc(%rip),%xmm9 # 44c0 <_sk_callback_sse2+0x664>
+ .byte 68,15,40,37,196,37,0,0 // movaps 0x25c4(%rip),%xmm12 # 44d0 <_sk_callback_sse2+0x674>
.byte 69,15,89,226 // mulps %xmm10,%xmm12
.byte 69,15,92,204 // subps %xmm12,%xmm9
- .byte 68,15,88,21,192,37,0,0 // addps 0x25c0(%rip),%xmm10 # 44e0 <_sk_callback_sse2+0x680>
- .byte 68,15,40,37,200,37,0,0 // movaps 0x25c8(%rip),%xmm12 # 44f0 <_sk_callback_sse2+0x690>
+ .byte 68,15,88,21,196,37,0,0 // addps 0x25c4(%rip),%xmm10 # 44e0 <_sk_callback_sse2+0x684>
+ .byte 68,15,40,37,204,37,0,0 // movaps 0x25cc(%rip),%xmm12 # 44f0 <_sk_callback_sse2+0x694>
.byte 69,15,94,226 // divps %xmm10,%xmm12
.byte 69,15,92,204 // subps %xmm12,%xmm9
.byte 69,15,89,203 // mulps %xmm11,%xmm9
@@ -25735,22 +25729,22 @@ _sk_parametric_g_sse2:
.byte 69,15,91,226 // cvtdq2ps %xmm10,%xmm12
.byte 69,15,40,233 // movaps %xmm9,%xmm13
.byte 69,15,194,236,1 // cmpltps %xmm12,%xmm13
- .byte 68,15,40,21,178,37,0,0 // movaps 0x25b2(%rip),%xmm10 # 4500 <_sk_callback_sse2+0x6a0>
+ .byte 68,15,40,21,182,37,0,0 // movaps 0x25b6(%rip),%xmm10 # 4500 <_sk_callback_sse2+0x6a4>
.byte 69,15,84,234 // andps %xmm10,%xmm13
.byte 69,15,87,219 // xorps %xmm11,%xmm11
.byte 69,15,92,229 // subps %xmm13,%xmm12
.byte 69,15,40,233 // movaps %xmm9,%xmm13
.byte 69,15,92,236 // subps %xmm12,%xmm13
- .byte 68,15,88,13,166,37,0,0 // addps 0x25a6(%rip),%xmm9 # 4510 <_sk_callback_sse2+0x6b0>
- .byte 68,15,40,37,174,37,0,0 // movaps 0x25ae(%rip),%xmm12 # 4520 <_sk_callback_sse2+0x6c0>
+ .byte 68,15,88,13,170,37,0,0 // addps 0x25aa(%rip),%xmm9 # 4510 <_sk_callback_sse2+0x6b4>
+ .byte 68,15,40,37,178,37,0,0 // movaps 0x25b2(%rip),%xmm12 # 4520 <_sk_callback_sse2+0x6c4>
.byte 69,15,89,229 // mulps %xmm13,%xmm12
.byte 69,15,92,204 // subps %xmm12,%xmm9
- .byte 68,15,40,37,174,37,0,0 // movaps 0x25ae(%rip),%xmm12 # 4530 <_sk_callback_sse2+0x6d0>
+ .byte 68,15,40,37,178,37,0,0 // movaps 0x25b2(%rip),%xmm12 # 4530 <_sk_callback_sse2+0x6d4>
.byte 69,15,92,229 // subps %xmm13,%xmm12
- .byte 68,15,40,45,178,37,0,0 // movaps 0x25b2(%rip),%xmm13 # 4540 <_sk_callback_sse2+0x6e0>
+ .byte 68,15,40,45,182,37,0,0 // movaps 0x25b6(%rip),%xmm13 # 4540 <_sk_callback_sse2+0x6e4>
.byte 69,15,94,236 // divps %xmm12,%xmm13
.byte 69,15,88,233 // addps %xmm9,%xmm13
- .byte 68,15,89,45,178,37,0,0 // mulps 0x25b2(%rip),%xmm13 # 4550 <_sk_callback_sse2+0x6f0>
+ .byte 68,15,89,45,182,37,0,0 // mulps 0x25b6(%rip),%xmm13 # 4550 <_sk_callback_sse2+0x6f4>
.byte 102,69,15,91,205 // cvtps2dq %xmm13,%xmm9
.byte 243,68,15,16,96,20 // movss 0x14(%rax),%xmm12
.byte 69,15,198,228,0 // shufps $0x0,%xmm12,%xmm12
@@ -25786,15 +25780,15 @@ _sk_parametric_b_sse2:
.byte 69,15,88,209 // addps %xmm9,%xmm10
.byte 69,15,198,219,0 // shufps $0x0,%xmm11,%xmm11
.byte 69,15,91,202 // cvtdq2ps %xmm10,%xmm9
- .byte 68,15,89,13,50,37,0,0 // mulps 0x2532(%rip),%xmm9 # 4560 <_sk_callback_sse2+0x700>
- .byte 68,15,84,21,58,37,0,0 // andps 0x253a(%rip),%xmm10 # 4570 <_sk_callback_sse2+0x710>
- .byte 68,15,86,21,66,37,0,0 // orps 0x2542(%rip),%xmm10 # 4580 <_sk_callback_sse2+0x720>
- .byte 68,15,88,13,74,37,0,0 // addps 0x254a(%rip),%xmm9 # 4590 <_sk_callback_sse2+0x730>
- .byte 68,15,40,37,82,37,0,0 // movaps 0x2552(%rip),%xmm12 # 45a0 <_sk_callback_sse2+0x740>
+ .byte 68,15,89,13,54,37,0,0 // mulps 0x2536(%rip),%xmm9 # 4560 <_sk_callback_sse2+0x704>
+ .byte 68,15,84,21,62,37,0,0 // andps 0x253e(%rip),%xmm10 # 4570 <_sk_callback_sse2+0x714>
+ .byte 68,15,86,21,70,37,0,0 // orps 0x2546(%rip),%xmm10 # 4580 <_sk_callback_sse2+0x724>
+ .byte 68,15,88,13,78,37,0,0 // addps 0x254e(%rip),%xmm9 # 4590 <_sk_callback_sse2+0x734>
+ .byte 68,15,40,37,86,37,0,0 // movaps 0x2556(%rip),%xmm12 # 45a0 <_sk_callback_sse2+0x744>
.byte 69,15,89,226 // mulps %xmm10,%xmm12
.byte 69,15,92,204 // subps %xmm12,%xmm9
- .byte 68,15,88,21,82,37,0,0 // addps 0x2552(%rip),%xmm10 # 45b0 <_sk_callback_sse2+0x750>
- .byte 68,15,40,37,90,37,0,0 // movaps 0x255a(%rip),%xmm12 # 45c0 <_sk_callback_sse2+0x760>
+ .byte 68,15,88,21,86,37,0,0 // addps 0x2556(%rip),%xmm10 # 45b0 <_sk_callback_sse2+0x754>
+ .byte 68,15,40,37,94,37,0,0 // movaps 0x255e(%rip),%xmm12 # 45c0 <_sk_callback_sse2+0x764>
.byte 69,15,94,226 // divps %xmm10,%xmm12
.byte 69,15,92,204 // subps %xmm12,%xmm9
.byte 69,15,89,203 // mulps %xmm11,%xmm9
@@ -25802,22 +25796,22 @@ _sk_parametric_b_sse2:
.byte 69,15,91,226 // cvtdq2ps %xmm10,%xmm12
.byte 69,15,40,233 // movaps %xmm9,%xmm13
.byte 69,15,194,236,1 // cmpltps %xmm12,%xmm13
- .byte 68,15,40,21,68,37,0,0 // movaps 0x2544(%rip),%xmm10 # 45d0 <_sk_callback_sse2+0x770>
+ .byte 68,15,40,21,72,37,0,0 // movaps 0x2548(%rip),%xmm10 # 45d0 <_sk_callback_sse2+0x774>
.byte 69,15,84,234 // andps %xmm10,%xmm13
.byte 69,15,87,219 // xorps %xmm11,%xmm11
.byte 69,15,92,229 // subps %xmm13,%xmm12
.byte 69,15,40,233 // movaps %xmm9,%xmm13
.byte 69,15,92,236 // subps %xmm12,%xmm13
- .byte 68,15,88,13,56,37,0,0 // addps 0x2538(%rip),%xmm9 # 45e0 <_sk_callback_sse2+0x780>
- .byte 68,15,40,37,64,37,0,0 // movaps 0x2540(%rip),%xmm12 # 45f0 <_sk_callback_sse2+0x790>
+ .byte 68,15,88,13,60,37,0,0 // addps 0x253c(%rip),%xmm9 # 45e0 <_sk_callback_sse2+0x784>
+ .byte 68,15,40,37,68,37,0,0 // movaps 0x2544(%rip),%xmm12 # 45f0 <_sk_callback_sse2+0x794>
.byte 69,15,89,229 // mulps %xmm13,%xmm12
.byte 69,15,92,204 // subps %xmm12,%xmm9
- .byte 68,15,40,37,64,37,0,0 // movaps 0x2540(%rip),%xmm12 # 4600 <_sk_callback_sse2+0x7a0>
+ .byte 68,15,40,37,68,37,0,0 // movaps 0x2544(%rip),%xmm12 # 4600 <_sk_callback_sse2+0x7a4>
.byte 69,15,92,229 // subps %xmm13,%xmm12
- .byte 68,15,40,45,68,37,0,0 // movaps 0x2544(%rip),%xmm13 # 4610 <_sk_callback_sse2+0x7b0>
+ .byte 68,15,40,45,72,37,0,0 // movaps 0x2548(%rip),%xmm13 # 4610 <_sk_callback_sse2+0x7b4>
.byte 69,15,94,236 // divps %xmm12,%xmm13
.byte 69,15,88,233 // addps %xmm9,%xmm13
- .byte 68,15,89,45,68,37,0,0 // mulps 0x2544(%rip),%xmm13 # 4620 <_sk_callback_sse2+0x7c0>
+ .byte 68,15,89,45,72,37,0,0 // mulps 0x2548(%rip),%xmm13 # 4620 <_sk_callback_sse2+0x7c4>
.byte 102,69,15,91,205 // cvtps2dq %xmm13,%xmm9
.byte 243,68,15,16,96,20 // movss 0x14(%rax),%xmm12
.byte 69,15,198,228,0 // shufps $0x0,%xmm12,%xmm12
@@ -25853,15 +25847,15 @@ _sk_parametric_a_sse2:
.byte 69,15,88,209 // addps %xmm9,%xmm10
.byte 69,15,198,219,0 // shufps $0x0,%xmm11,%xmm11
.byte 69,15,91,202 // cvtdq2ps %xmm10,%xmm9
- .byte 68,15,89,13,196,36,0,0 // mulps 0x24c4(%rip),%xmm9 # 4630 <_sk_callback_sse2+0x7d0>
- .byte 68,15,84,21,204,36,0,0 // andps 0x24cc(%rip),%xmm10 # 4640 <_sk_callback_sse2+0x7e0>
- .byte 68,15,86,21,212,36,0,0 // orps 0x24d4(%rip),%xmm10 # 4650 <_sk_callback_sse2+0x7f0>
- .byte 68,15,88,13,220,36,0,0 // addps 0x24dc(%rip),%xmm9 # 4660 <_sk_callback_sse2+0x800>
- .byte 68,15,40,37,228,36,0,0 // movaps 0x24e4(%rip),%xmm12 # 4670 <_sk_callback_sse2+0x810>
+ .byte 68,15,89,13,200,36,0,0 // mulps 0x24c8(%rip),%xmm9 # 4630 <_sk_callback_sse2+0x7d4>
+ .byte 68,15,84,21,208,36,0,0 // andps 0x24d0(%rip),%xmm10 # 4640 <_sk_callback_sse2+0x7e4>
+ .byte 68,15,86,21,216,36,0,0 // orps 0x24d8(%rip),%xmm10 # 4650 <_sk_callback_sse2+0x7f4>
+ .byte 68,15,88,13,224,36,0,0 // addps 0x24e0(%rip),%xmm9 # 4660 <_sk_callback_sse2+0x804>
+ .byte 68,15,40,37,232,36,0,0 // movaps 0x24e8(%rip),%xmm12 # 4670 <_sk_callback_sse2+0x814>
.byte 69,15,89,226 // mulps %xmm10,%xmm12
.byte 69,15,92,204 // subps %xmm12,%xmm9
- .byte 68,15,88,21,228,36,0,0 // addps 0x24e4(%rip),%xmm10 # 4680 <_sk_callback_sse2+0x820>
- .byte 68,15,40,37,236,36,0,0 // movaps 0x24ec(%rip),%xmm12 # 4690 <_sk_callback_sse2+0x830>
+ .byte 68,15,88,21,232,36,0,0 // addps 0x24e8(%rip),%xmm10 # 4680 <_sk_callback_sse2+0x824>
+ .byte 68,15,40,37,240,36,0,0 // movaps 0x24f0(%rip),%xmm12 # 4690 <_sk_callback_sse2+0x834>
.byte 69,15,94,226 // divps %xmm10,%xmm12
.byte 69,15,92,204 // subps %xmm12,%xmm9
.byte 69,15,89,203 // mulps %xmm11,%xmm9
@@ -25869,22 +25863,22 @@ _sk_parametric_a_sse2:
.byte 69,15,91,226 // cvtdq2ps %xmm10,%xmm12
.byte 69,15,40,233 // movaps %xmm9,%xmm13
.byte 69,15,194,236,1 // cmpltps %xmm12,%xmm13
- .byte 68,15,40,21,214,36,0,0 // movaps 0x24d6(%rip),%xmm10 # 46a0 <_sk_callback_sse2+0x840>
+ .byte 68,15,40,21,218,36,0,0 // movaps 0x24da(%rip),%xmm10 # 46a0 <_sk_callback_sse2+0x844>
.byte 69,15,84,234 // andps %xmm10,%xmm13
.byte 69,15,87,219 // xorps %xmm11,%xmm11
.byte 69,15,92,229 // subps %xmm13,%xmm12
.byte 69,15,40,233 // movaps %xmm9,%xmm13
.byte 69,15,92,236 // subps %xmm12,%xmm13
- .byte 68,15,88,13,202,36,0,0 // addps 0x24ca(%rip),%xmm9 # 46b0 <_sk_callback_sse2+0x850>
- .byte 68,15,40,37,210,36,0,0 // movaps 0x24d2(%rip),%xmm12 # 46c0 <_sk_callback_sse2+0x860>
+ .byte 68,15,88,13,206,36,0,0 // addps 0x24ce(%rip),%xmm9 # 46b0 <_sk_callback_sse2+0x854>
+ .byte 68,15,40,37,214,36,0,0 // movaps 0x24d6(%rip),%xmm12 # 46c0 <_sk_callback_sse2+0x864>
.byte 69,15,89,229 // mulps %xmm13,%xmm12
.byte 69,15,92,204 // subps %xmm12,%xmm9
- .byte 68,15,40,37,210,36,0,0 // movaps 0x24d2(%rip),%xmm12 # 46d0 <_sk_callback_sse2+0x870>
+ .byte 68,15,40,37,214,36,0,0 // movaps 0x24d6(%rip),%xmm12 # 46d0 <_sk_callback_sse2+0x874>
.byte 69,15,92,229 // subps %xmm13,%xmm12
- .byte 68,15,40,45,214,36,0,0 // movaps 0x24d6(%rip),%xmm13 # 46e0 <_sk_callback_sse2+0x880>
+ .byte 68,15,40,45,218,36,0,0 // movaps 0x24da(%rip),%xmm13 # 46e0 <_sk_callback_sse2+0x884>
.byte 69,15,94,236 // divps %xmm12,%xmm13
.byte 69,15,88,233 // addps %xmm9,%xmm13
- .byte 68,15,89,45,214,36,0,0 // mulps 0x24d6(%rip),%xmm13 # 46f0 <_sk_callback_sse2+0x890>
+ .byte 68,15,89,45,218,36,0,0 // mulps 0x24da(%rip),%xmm13 # 46f0 <_sk_callback_sse2+0x894>
.byte 102,69,15,91,205 // cvtps2dq %xmm13,%xmm9
.byte 243,68,15,16,96,20 // movss 0x14(%rax),%xmm12
.byte 69,15,198,228,0 // shufps $0x0,%xmm12,%xmm12
@@ -25901,29 +25895,29 @@ HIDDEN _sk_lab_to_xyz_sse2
.globl _sk_lab_to_xyz_sse2
FUNCTION(_sk_lab_to_xyz_sse2)
_sk_lab_to_xyz_sse2:
- .byte 15,89,5,179,36,0,0 // mulps 0x24b3(%rip),%xmm0 # 4700 <_sk_callback_sse2+0x8a0>
- .byte 68,15,40,5,187,36,0,0 // movaps 0x24bb(%rip),%xmm8 # 4710 <_sk_callback_sse2+0x8b0>
+ .byte 15,89,5,183,36,0,0 // mulps 0x24b7(%rip),%xmm0 # 4700 <_sk_callback_sse2+0x8a4>
+ .byte 68,15,40,5,191,36,0,0 // movaps 0x24bf(%rip),%xmm8 # 4710 <_sk_callback_sse2+0x8b4>
.byte 65,15,89,200 // mulps %xmm8,%xmm1
- .byte 68,15,40,13,191,36,0,0 // movaps 0x24bf(%rip),%xmm9 # 4720 <_sk_callback_sse2+0x8c0>
+ .byte 68,15,40,13,195,36,0,0 // movaps 0x24c3(%rip),%xmm9 # 4720 <_sk_callback_sse2+0x8c4>
.byte 65,15,88,201 // addps %xmm9,%xmm1
.byte 65,15,89,208 // mulps %xmm8,%xmm2
.byte 65,15,88,209 // addps %xmm9,%xmm2
- .byte 15,88,5,188,36,0,0 // addps 0x24bc(%rip),%xmm0 # 4730 <_sk_callback_sse2+0x8d0>
- .byte 15,89,5,197,36,0,0 // mulps 0x24c5(%rip),%xmm0 # 4740 <_sk_callback_sse2+0x8e0>
- .byte 15,89,13,206,36,0,0 // mulps 0x24ce(%rip),%xmm1 # 4750 <_sk_callback_sse2+0x8f0>
+ .byte 15,88,5,192,36,0,0 // addps 0x24c0(%rip),%xmm0 # 4730 <_sk_callback_sse2+0x8d4>
+ .byte 15,89,5,201,36,0,0 // mulps 0x24c9(%rip),%xmm0 # 4740 <_sk_callback_sse2+0x8e4>
+ .byte 15,89,13,210,36,0,0 // mulps 0x24d2(%rip),%xmm1 # 4750 <_sk_callback_sse2+0x8f4>
.byte 15,88,200 // addps %xmm0,%xmm1
- .byte 15,89,21,212,36,0,0 // mulps 0x24d4(%rip),%xmm2 # 4760 <_sk_callback_sse2+0x900>
+ .byte 15,89,21,216,36,0,0 // mulps 0x24d8(%rip),%xmm2 # 4760 <_sk_callback_sse2+0x904>
.byte 68,15,40,200 // movaps %xmm0,%xmm9
.byte 68,15,92,202 // subps %xmm2,%xmm9
.byte 68,15,40,225 // movaps %xmm1,%xmm12
.byte 69,15,89,228 // mulps %xmm12,%xmm12
.byte 68,15,89,225 // mulps %xmm1,%xmm12
- .byte 15,40,21,201,36,0,0 // movaps 0x24c9(%rip),%xmm2 # 4770 <_sk_callback_sse2+0x910>
+ .byte 15,40,21,205,36,0,0 // movaps 0x24cd(%rip),%xmm2 # 4770 <_sk_callback_sse2+0x914>
.byte 68,15,40,194 // movaps %xmm2,%xmm8
.byte 69,15,194,196,1 // cmpltps %xmm12,%xmm8
- .byte 68,15,40,21,200,36,0,0 // movaps 0x24c8(%rip),%xmm10 # 4780 <_sk_callback_sse2+0x920>
+ .byte 68,15,40,21,204,36,0,0 // movaps 0x24cc(%rip),%xmm10 # 4780 <_sk_callback_sse2+0x924>
.byte 65,15,88,202 // addps %xmm10,%xmm1
- .byte 68,15,40,29,204,36,0,0 // movaps 0x24cc(%rip),%xmm11 # 4790 <_sk_callback_sse2+0x930>
+ .byte 68,15,40,29,208,36,0,0 // movaps 0x24d0(%rip),%xmm11 # 4790 <_sk_callback_sse2+0x934>
.byte 65,15,89,203 // mulps %xmm11,%xmm1
.byte 69,15,84,224 // andps %xmm8,%xmm12
.byte 68,15,85,193 // andnps %xmm1,%xmm8
@@ -25947,8 +25941,8 @@ _sk_lab_to_xyz_sse2:
.byte 15,84,194 // andps %xmm2,%xmm0
.byte 65,15,85,209 // andnps %xmm9,%xmm2
.byte 15,86,208 // orps %xmm0,%xmm2
- .byte 68,15,89,5,124,36,0,0 // mulps 0x247c(%rip),%xmm8 # 47a0 <_sk_callback_sse2+0x940>
- .byte 15,89,21,133,36,0,0 // mulps 0x2485(%rip),%xmm2 # 47b0 <_sk_callback_sse2+0x950>
+ .byte 68,15,89,5,128,36,0,0 // mulps 0x2480(%rip),%xmm8 # 47a0 <_sk_callback_sse2+0x944>
+ .byte 15,89,21,137,36,0,0 // mulps 0x2489(%rip),%xmm2 # 47b0 <_sk_callback_sse2+0x954>
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 65,15,40,192 // movaps %xmm8,%xmm0
.byte 255,224 // jmpq *%rax
@@ -25964,7 +25958,7 @@ _sk_load_a8_sse2:
.byte 102,15,96,193 // punpcklbw %xmm1,%xmm0
.byte 102,15,97,193 // punpcklwd %xmm1,%xmm0
.byte 15,91,216 // cvtdq2ps %xmm0,%xmm3
- .byte 15,89,29,109,36,0,0 // mulps 0x246d(%rip),%xmm3 # 47c0 <_sk_callback_sse2+0x960>
+ .byte 15,89,29,113,36,0,0 // mulps 0x2471(%rip),%xmm3 # 47c0 <_sk_callback_sse2+0x964>
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 15,87,192 // xorps %xmm0,%xmm0
.byte 102,15,239,201 // pxor %xmm1,%xmm1
@@ -26009,7 +26003,7 @@ _sk_gather_a8_sse2:
.byte 102,15,96,193 // punpcklbw %xmm1,%xmm0
.byte 102,15,97,193 // punpcklwd %xmm1,%xmm0
.byte 15,91,216 // cvtdq2ps %xmm0,%xmm3
- .byte 15,89,29,220,35,0,0 // mulps 0x23dc(%rip),%xmm3 # 47d0 <_sk_callback_sse2+0x970>
+ .byte 15,89,29,224,35,0,0 // mulps 0x23e0(%rip),%xmm3 # 47d0 <_sk_callback_sse2+0x974>
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 15,87,192 // xorps %xmm0,%xmm0
.byte 102,15,239,201 // pxor %xmm1,%xmm1
@@ -26022,7 +26016,7 @@ FUNCTION(_sk_store_a8_sse2)
_sk_store_a8_sse2:
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 72,139,0 // mov (%rax),%rax
- .byte 68,15,40,5,208,35,0,0 // movaps 0x23d0(%rip),%xmm8 # 47e0 <_sk_callback_sse2+0x980>
+ .byte 68,15,40,5,212,35,0,0 // movaps 0x23d4(%rip),%xmm8 # 47e0 <_sk_callback_sse2+0x984>
.byte 68,15,89,195 // mulps %xmm3,%xmm8
.byte 102,69,15,91,192 // cvtps2dq %xmm8,%xmm8
.byte 102,65,15,114,240,16 // pslld $0x10,%xmm8
@@ -26044,9 +26038,9 @@ _sk_load_g8_sse2:
.byte 102,15,96,193 // punpcklbw %xmm1,%xmm0
.byte 102,15,97,193 // punpcklwd %xmm1,%xmm0
.byte 15,91,192 // cvtdq2ps %xmm0,%xmm0
- .byte 15,89,5,151,35,0,0 // mulps 0x2397(%rip),%xmm0 # 47f0 <_sk_callback_sse2+0x990>
+ .byte 15,89,5,155,35,0,0 // mulps 0x239b(%rip),%xmm0 # 47f0 <_sk_callback_sse2+0x994>
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 15,40,29,158,35,0,0 // movaps 0x239e(%rip),%xmm3 # 4800 <_sk_callback_sse2+0x9a0>
+ .byte 15,40,29,162,35,0,0 // movaps 0x23a2(%rip),%xmm3 # 4800 <_sk_callback_sse2+0x9a4>
.byte 15,40,200 // movaps %xmm0,%xmm1
.byte 15,40,208 // movaps %xmm0,%xmm2
.byte 255,224 // jmpq *%rax
@@ -26089,9 +26083,9 @@ _sk_gather_g8_sse2:
.byte 102,15,96,193 // punpcklbw %xmm1,%xmm0
.byte 102,15,97,193 // punpcklwd %xmm1,%xmm0
.byte 15,91,192 // cvtdq2ps %xmm0,%xmm0
- .byte 15,89,5,19,35,0,0 // mulps 0x2313(%rip),%xmm0 # 4810 <_sk_callback_sse2+0x9b0>
+ .byte 15,89,5,23,35,0,0 // mulps 0x2317(%rip),%xmm0 # 4810 <_sk_callback_sse2+0x9b4>
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 15,40,29,26,35,0,0 // movaps 0x231a(%rip),%xmm3 # 4820 <_sk_callback_sse2+0x9c0>
+ .byte 15,40,29,30,35,0,0 // movaps 0x231e(%rip),%xmm3 # 4820 <_sk_callback_sse2+0x9c4>
.byte 15,40,200 // movaps %xmm0,%xmm1
.byte 15,40,208 // movaps %xmm0,%xmm2
.byte 255,224 // jmpq *%rax
@@ -26103,9 +26097,9 @@ _sk_gather_i8_sse2:
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 73,137,192 // mov %rax,%r8
.byte 77,133,192 // test %r8,%r8
- .byte 116,5 // je 251d <_sk_gather_i8_sse2+0xf>
+ .byte 116,5 // je 2519 <_sk_gather_i8_sse2+0xf>
.byte 76,137,192 // mov %r8,%rax
- .byte 235,2 // jmp 251f <_sk_gather_i8_sse2+0x11>
+ .byte 235,2 // jmp 251b <_sk_gather_i8_sse2+0x11>
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 76,139,16 // mov (%rax),%r10
.byte 243,15,91,201 // cvttps2dq %xmm1,%xmm1
@@ -26154,11 +26148,11 @@ _sk_gather_i8_sse2:
.byte 102,67,15,110,12,136 // movd (%r8,%r9,4),%xmm1
.byte 102,68,15,98,201 // punpckldq %xmm1,%xmm9
.byte 102,68,15,98,200 // punpckldq %xmm0,%xmm9
- .byte 102,15,111,21,57,34,0,0 // movdqa 0x2239(%rip),%xmm2 # 4830 <_sk_callback_sse2+0x9d0>
+ .byte 102,15,111,21,61,34,0,0 // movdqa 0x223d(%rip),%xmm2 # 4830 <_sk_callback_sse2+0x9d4>
.byte 102,65,15,111,193 // movdqa %xmm9,%xmm0
.byte 102,15,219,194 // pand %xmm2,%xmm0
.byte 15,91,192 // cvtdq2ps %xmm0,%xmm0
- .byte 68,15,40,5,53,34,0,0 // movaps 0x2235(%rip),%xmm8 # 4840 <_sk_callback_sse2+0x9e0>
+ .byte 68,15,40,5,57,34,0,0 // movaps 0x2239(%rip),%xmm8 # 4840 <_sk_callback_sse2+0x9e4>
.byte 65,15,89,192 // mulps %xmm8,%xmm0
.byte 102,65,15,111,201 // movdqa %xmm9,%xmm1
.byte 102,15,114,209,8 // psrld $0x8,%xmm1
@@ -26185,19 +26179,19 @@ _sk_load_565_sse2:
.byte 243,15,126,20,120 // movq (%rax,%rdi,2),%xmm2
.byte 102,15,239,192 // pxor %xmm0,%xmm0
.byte 102,15,97,208 // punpcklwd %xmm0,%xmm2
- .byte 102,15,111,5,235,33,0,0 // movdqa 0x21eb(%rip),%xmm0 # 4850 <_sk_callback_sse2+0x9f0>
+ .byte 102,15,111,5,239,33,0,0 // movdqa 0x21ef(%rip),%xmm0 # 4850 <_sk_callback_sse2+0x9f4>
.byte 102,15,219,194 // pand %xmm2,%xmm0
.byte 15,91,192 // cvtdq2ps %xmm0,%xmm0
- .byte 15,89,5,237,33,0,0 // mulps 0x21ed(%rip),%xmm0 # 4860 <_sk_callback_sse2+0xa00>
- .byte 102,15,111,13,245,33,0,0 // movdqa 0x21f5(%rip),%xmm1 # 4870 <_sk_callback_sse2+0xa10>
+ .byte 15,89,5,241,33,0,0 // mulps 0x21f1(%rip),%xmm0 # 4860 <_sk_callback_sse2+0xa04>
+ .byte 102,15,111,13,249,33,0,0 // movdqa 0x21f9(%rip),%xmm1 # 4870 <_sk_callback_sse2+0xa14>
.byte 102,15,219,202 // pand %xmm2,%xmm1
.byte 15,91,201 // cvtdq2ps %xmm1,%xmm1
- .byte 15,89,13,247,33,0,0 // mulps 0x21f7(%rip),%xmm1 # 4880 <_sk_callback_sse2+0xa20>
- .byte 102,15,219,21,255,33,0,0 // pand 0x21ff(%rip),%xmm2 # 4890 <_sk_callback_sse2+0xa30>
+ .byte 15,89,13,251,33,0,0 // mulps 0x21fb(%rip),%xmm1 # 4880 <_sk_callback_sse2+0xa24>
+ .byte 102,15,219,21,3,34,0,0 // pand 0x2203(%rip),%xmm2 # 4890 <_sk_callback_sse2+0xa34>
.byte 15,91,210 // cvtdq2ps %xmm2,%xmm2
- .byte 15,89,21,5,34,0,0 // mulps 0x2205(%rip),%xmm2 # 48a0 <_sk_callback_sse2+0xa40>
+ .byte 15,89,21,9,34,0,0 // mulps 0x2209(%rip),%xmm2 # 48a0 <_sk_callback_sse2+0xa44>
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 15,40,29,12,34,0,0 // movaps 0x220c(%rip),%xmm3 # 48b0 <_sk_callback_sse2+0xa50>
+ .byte 15,40,29,16,34,0,0 // movaps 0x2210(%rip),%xmm3 # 48b0 <_sk_callback_sse2+0xa54>
.byte 255,224 // jmpq *%rax
HIDDEN _sk_gather_565_sse2
@@ -26232,19 +26226,19 @@ _sk_gather_565_sse2:
.byte 102,15,196,208,3 // pinsrw $0x3,%eax,%xmm2
.byte 102,15,239,192 // pxor %xmm0,%xmm0
.byte 102,15,97,208 // punpcklwd %xmm0,%xmm2
- .byte 102,15,111,5,149,33,0,0 // movdqa 0x2195(%rip),%xmm0 # 48c0 <_sk_callback_sse2+0xa60>
+ .byte 102,15,111,5,153,33,0,0 // movdqa 0x2199(%rip),%xmm0 # 48c0 <_sk_callback_sse2+0xa64>
.byte 102,15,219,194 // pand %xmm2,%xmm0
.byte 15,91,192 // cvtdq2ps %xmm0,%xmm0
- .byte 15,89,5,151,33,0,0 // mulps 0x2197(%rip),%xmm0 # 48d0 <_sk_callback_sse2+0xa70>
- .byte 102,15,111,13,159,33,0,0 // movdqa 0x219f(%rip),%xmm1 # 48e0 <_sk_callback_sse2+0xa80>
+ .byte 15,89,5,155,33,0,0 // mulps 0x219b(%rip),%xmm0 # 48d0 <_sk_callback_sse2+0xa74>
+ .byte 102,15,111,13,163,33,0,0 // movdqa 0x21a3(%rip),%xmm1 # 48e0 <_sk_callback_sse2+0xa84>
.byte 102,15,219,202 // pand %xmm2,%xmm1
.byte 15,91,201 // cvtdq2ps %xmm1,%xmm1
- .byte 15,89,13,161,33,0,0 // mulps 0x21a1(%rip),%xmm1 # 48f0 <_sk_callback_sse2+0xa90>
- .byte 102,15,219,21,169,33,0,0 // pand 0x21a9(%rip),%xmm2 # 4900 <_sk_callback_sse2+0xaa0>
+ .byte 15,89,13,165,33,0,0 // mulps 0x21a5(%rip),%xmm1 # 48f0 <_sk_callback_sse2+0xa94>
+ .byte 102,15,219,21,173,33,0,0 // pand 0x21ad(%rip),%xmm2 # 4900 <_sk_callback_sse2+0xaa4>
.byte 15,91,210 // cvtdq2ps %xmm2,%xmm2
- .byte 15,89,21,175,33,0,0 // mulps 0x21af(%rip),%xmm2 # 4910 <_sk_callback_sse2+0xab0>
+ .byte 15,89,21,179,33,0,0 // mulps 0x21b3(%rip),%xmm2 # 4910 <_sk_callback_sse2+0xab4>
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 15,40,29,182,33,0,0 // movaps 0x21b6(%rip),%xmm3 # 4920 <_sk_callback_sse2+0xac0>
+ .byte 15,40,29,186,33,0,0 // movaps 0x21ba(%rip),%xmm3 # 4920 <_sk_callback_sse2+0xac4>
.byte 255,224 // jmpq *%rax
HIDDEN _sk_store_565_sse2
@@ -26253,12 +26247,12 @@ FUNCTION(_sk_store_565_sse2)
_sk_store_565_sse2:
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 72,139,0 // mov (%rax),%rax
- .byte 68,15,40,5,183,33,0,0 // movaps 0x21b7(%rip),%xmm8 # 4930 <_sk_callback_sse2+0xad0>
+ .byte 68,15,40,5,187,33,0,0 // movaps 0x21bb(%rip),%xmm8 # 4930 <_sk_callback_sse2+0xad4>
.byte 68,15,40,200 // movaps %xmm0,%xmm9
.byte 69,15,89,200 // mulps %xmm8,%xmm9
.byte 102,69,15,91,201 // cvtps2dq %xmm9,%xmm9
.byte 102,65,15,114,241,11 // pslld $0xb,%xmm9
- .byte 68,15,40,21,172,33,0,0 // movaps 0x21ac(%rip),%xmm10 # 4940 <_sk_callback_sse2+0xae0>
+ .byte 68,15,40,21,176,33,0,0 // movaps 0x21b0(%rip),%xmm10 # 4940 <_sk_callback_sse2+0xae4>
.byte 68,15,89,209 // mulps %xmm1,%xmm10
.byte 102,69,15,91,210 // cvtps2dq %xmm10,%xmm10
.byte 102,65,15,114,242,5 // pslld $0x5,%xmm10
@@ -26282,21 +26276,21 @@ _sk_load_4444_sse2:
.byte 243,15,126,28,120 // movq (%rax,%rdi,2),%xmm3
.byte 102,15,239,192 // pxor %xmm0,%xmm0
.byte 102,15,97,216 // punpcklwd %xmm0,%xmm3
- .byte 102,15,111,5,101,33,0,0 // movdqa 0x2165(%rip),%xmm0 # 4950 <_sk_callback_sse2+0xaf0>
+ .byte 102,15,111,5,105,33,0,0 // movdqa 0x2169(%rip),%xmm0 # 4950 <_sk_callback_sse2+0xaf4>
.byte 102,15,219,195 // pand %xmm3,%xmm0
.byte 15,91,192 // cvtdq2ps %xmm0,%xmm0
- .byte 15,89,5,103,33,0,0 // mulps 0x2167(%rip),%xmm0 # 4960 <_sk_callback_sse2+0xb00>
- .byte 102,15,111,13,111,33,0,0 // movdqa 0x216f(%rip),%xmm1 # 4970 <_sk_callback_sse2+0xb10>
+ .byte 15,89,5,107,33,0,0 // mulps 0x216b(%rip),%xmm0 # 4960 <_sk_callback_sse2+0xb04>
+ .byte 102,15,111,13,115,33,0,0 // movdqa 0x2173(%rip),%xmm1 # 4970 <_sk_callback_sse2+0xb14>
.byte 102,15,219,203 // pand %xmm3,%xmm1
.byte 15,91,201 // cvtdq2ps %xmm1,%xmm1
- .byte 15,89,13,113,33,0,0 // mulps 0x2171(%rip),%xmm1 # 4980 <_sk_callback_sse2+0xb20>
- .byte 102,15,111,21,121,33,0,0 // movdqa 0x2179(%rip),%xmm2 # 4990 <_sk_callback_sse2+0xb30>
+ .byte 15,89,13,117,33,0,0 // mulps 0x2175(%rip),%xmm1 # 4980 <_sk_callback_sse2+0xb24>
+ .byte 102,15,111,21,125,33,0,0 // movdqa 0x217d(%rip),%xmm2 # 4990 <_sk_callback_sse2+0xb34>
.byte 102,15,219,211 // pand %xmm3,%xmm2
.byte 15,91,210 // cvtdq2ps %xmm2,%xmm2
- .byte 15,89,21,123,33,0,0 // mulps 0x217b(%rip),%xmm2 # 49a0 <_sk_callback_sse2+0xb40>
- .byte 102,15,219,29,131,33,0,0 // pand 0x2183(%rip),%xmm3 # 49b0 <_sk_callback_sse2+0xb50>
+ .byte 15,89,21,127,33,0,0 // mulps 0x217f(%rip),%xmm2 # 49a0 <_sk_callback_sse2+0xb44>
+ .byte 102,15,219,29,135,33,0,0 // pand 0x2187(%rip),%xmm3 # 49b0 <_sk_callback_sse2+0xb54>
.byte 15,91,219 // cvtdq2ps %xmm3,%xmm3
- .byte 15,89,29,137,33,0,0 // mulps 0x2189(%rip),%xmm3 # 49c0 <_sk_callback_sse2+0xb60>
+ .byte 15,89,29,141,33,0,0 // mulps 0x218d(%rip),%xmm3 # 49c0 <_sk_callback_sse2+0xb64>
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 255,224 // jmpq *%rax
@@ -26332,21 +26326,21 @@ _sk_gather_4444_sse2:
.byte 102,15,196,216,3 // pinsrw $0x3,%eax,%xmm3
.byte 102,15,239,192 // pxor %xmm0,%xmm0
.byte 102,15,97,216 // punpcklwd %xmm0,%xmm3
- .byte 102,15,111,5,16,33,0,0 // movdqa 0x2110(%rip),%xmm0 # 49d0 <_sk_callback_sse2+0xb70>
+ .byte 102,15,111,5,20,33,0,0 // movdqa 0x2114(%rip),%xmm0 # 49d0 <_sk_callback_sse2+0xb74>
.byte 102,15,219,195 // pand %xmm3,%xmm0
.byte 15,91,192 // cvtdq2ps %xmm0,%xmm0
- .byte 15,89,5,18,33,0,0 // mulps 0x2112(%rip),%xmm0 # 49e0 <_sk_callback_sse2+0xb80>
- .byte 102,15,111,13,26,33,0,0 // movdqa 0x211a(%rip),%xmm1 # 49f0 <_sk_callback_sse2+0xb90>
+ .byte 15,89,5,22,33,0,0 // mulps 0x2116(%rip),%xmm0 # 49e0 <_sk_callback_sse2+0xb84>
+ .byte 102,15,111,13,30,33,0,0 // movdqa 0x211e(%rip),%xmm1 # 49f0 <_sk_callback_sse2+0xb94>
.byte 102,15,219,203 // pand %xmm3,%xmm1
.byte 15,91,201 // cvtdq2ps %xmm1,%xmm1
- .byte 15,89,13,28,33,0,0 // mulps 0x211c(%rip),%xmm1 # 4a00 <_sk_callback_sse2+0xba0>
- .byte 102,15,111,21,36,33,0,0 // movdqa 0x2124(%rip),%xmm2 # 4a10 <_sk_callback_sse2+0xbb0>
+ .byte 15,89,13,32,33,0,0 // mulps 0x2120(%rip),%xmm1 # 4a00 <_sk_callback_sse2+0xba4>
+ .byte 102,15,111,21,40,33,0,0 // movdqa 0x2128(%rip),%xmm2 # 4a10 <_sk_callback_sse2+0xbb4>
.byte 102,15,219,211 // pand %xmm3,%xmm2
.byte 15,91,210 // cvtdq2ps %xmm2,%xmm2
- .byte 15,89,21,38,33,0,0 // mulps 0x2126(%rip),%xmm2 # 4a20 <_sk_callback_sse2+0xbc0>
- .byte 102,15,219,29,46,33,0,0 // pand 0x212e(%rip),%xmm3 # 4a30 <_sk_callback_sse2+0xbd0>
+ .byte 15,89,21,42,33,0,0 // mulps 0x212a(%rip),%xmm2 # 4a20 <_sk_callback_sse2+0xbc4>
+ .byte 102,15,219,29,50,33,0,0 // pand 0x2132(%rip),%xmm3 # 4a30 <_sk_callback_sse2+0xbd4>
.byte 15,91,219 // cvtdq2ps %xmm3,%xmm3
- .byte 15,89,29,52,33,0,0 // mulps 0x2134(%rip),%xmm3 # 4a40 <_sk_callback_sse2+0xbe0>
+ .byte 15,89,29,56,33,0,0 // mulps 0x2138(%rip),%xmm3 # 4a40 <_sk_callback_sse2+0xbe4>
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 255,224 // jmpq *%rax
@@ -26356,7 +26350,7 @@ FUNCTION(_sk_store_4444_sse2)
_sk_store_4444_sse2:
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 72,139,0 // mov (%rax),%rax
- .byte 68,15,40,5,51,33,0,0 // movaps 0x2133(%rip),%xmm8 # 4a50 <_sk_callback_sse2+0xbf0>
+ .byte 68,15,40,5,55,33,0,0 // movaps 0x2137(%rip),%xmm8 # 4a50 <_sk_callback_sse2+0xbf4>
.byte 68,15,40,200 // movaps %xmm0,%xmm9
.byte 69,15,89,200 // mulps %xmm8,%xmm9
.byte 102,69,15,91,201 // cvtps2dq %xmm9,%xmm9
@@ -26388,11 +26382,11 @@ _sk_load_8888_sse2:
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 72,139,0 // mov (%rax),%rax
.byte 68,15,16,12,184 // movups (%rax,%rdi,4),%xmm9
- .byte 15,40,21,198,32,0,0 // movaps 0x20c6(%rip),%xmm2 # 4a60 <_sk_callback_sse2+0xc00>
+ .byte 15,40,21,202,32,0,0 // movaps 0x20ca(%rip),%xmm2 # 4a60 <_sk_callback_sse2+0xc04>
.byte 65,15,40,193 // movaps %xmm9,%xmm0
.byte 15,84,194 // andps %xmm2,%xmm0
.byte 15,91,192 // cvtdq2ps %xmm0,%xmm0
- .byte 68,15,40,5,196,32,0,0 // movaps 0x20c4(%rip),%xmm8 # 4a70 <_sk_callback_sse2+0xc10>
+ .byte 68,15,40,5,200,32,0,0 // movaps 0x20c8(%rip),%xmm8 # 4a70 <_sk_callback_sse2+0xc14>
.byte 65,15,89,192 // mulps %xmm8,%xmm0
.byte 65,15,40,201 // movaps %xmm9,%xmm1
.byte 102,15,114,209,8 // psrld $0x8,%xmm1
@@ -26441,11 +26435,11 @@ _sk_gather_8888_sse2:
.byte 102,67,15,110,12,129 // movd (%r9,%r8,4),%xmm1
.byte 102,68,15,98,201 // punpckldq %xmm1,%xmm9
.byte 102,68,15,98,200 // punpckldq %xmm0,%xmm9
- .byte 102,15,111,21,21,32,0,0 // movdqa 0x2015(%rip),%xmm2 # 4a80 <_sk_callback_sse2+0xc20>
+ .byte 102,15,111,21,25,32,0,0 // movdqa 0x2019(%rip),%xmm2 # 4a80 <_sk_callback_sse2+0xc24>
.byte 102,65,15,111,193 // movdqa %xmm9,%xmm0
.byte 102,15,219,194 // pand %xmm2,%xmm0
.byte 15,91,192 // cvtdq2ps %xmm0,%xmm0
- .byte 68,15,40,5,17,32,0,0 // movaps 0x2011(%rip),%xmm8 # 4a90 <_sk_callback_sse2+0xc30>
+ .byte 68,15,40,5,21,32,0,0 // movaps 0x2015(%rip),%xmm8 # 4a90 <_sk_callback_sse2+0xc34>
.byte 65,15,89,192 // mulps %xmm8,%xmm0
.byte 102,65,15,111,201 // movdqa %xmm9,%xmm1
.byte 102,15,114,209,8 // psrld $0x8,%xmm1
@@ -26469,7 +26463,7 @@ FUNCTION(_sk_store_8888_sse2)
_sk_store_8888_sse2:
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 72,139,0 // mov (%rax),%rax
- .byte 68,15,40,5,212,31,0,0 // movaps 0x1fd4(%rip),%xmm8 # 4aa0 <_sk_callback_sse2+0xc40>
+ .byte 68,15,40,5,216,31,0,0 // movaps 0x1fd8(%rip),%xmm8 # 4aa0 <_sk_callback_sse2+0xc44>
.byte 68,15,40,200 // movaps %xmm0,%xmm9
.byte 69,15,89,200 // mulps %xmm8,%xmm9
.byte 102,69,15,91,201 // cvtps2dq %xmm9,%xmm9
@@ -26508,7 +26502,7 @@ _sk_load_f16_sse2:
.byte 102,69,15,239,210 // pxor %xmm10,%xmm10
.byte 102,65,15,111,206 // movdqa %xmm14,%xmm1
.byte 102,65,15,97,202 // punpcklwd %xmm10,%xmm1
- .byte 102,68,15,111,13,68,31,0,0 // movdqa 0x1f44(%rip),%xmm9 # 4ab0 <_sk_callback_sse2+0xc50>
+ .byte 102,68,15,111,13,72,31,0,0 // movdqa 0x1f48(%rip),%xmm9 # 4ab0 <_sk_callback_sse2+0xc54>
.byte 102,15,111,193 // movdqa %xmm1,%xmm0
.byte 102,65,15,219,193 // pand %xmm9,%xmm0
.byte 102,15,239,200 // pxor %xmm0,%xmm1
@@ -26516,11 +26510,11 @@ _sk_load_f16_sse2:
.byte 102,68,15,111,233 // movdqa %xmm1,%xmm13
.byte 102,65,15,114,245,13 // pslld $0xd,%xmm13
.byte 102,68,15,235,232 // por %xmm0,%xmm13
- .byte 102,68,15,111,29,41,31,0,0 // movdqa 0x1f29(%rip),%xmm11 # 4ac0 <_sk_callback_sse2+0xc60>
+ .byte 102,68,15,111,29,45,31,0,0 // movdqa 0x1f2d(%rip),%xmm11 # 4ac0 <_sk_callback_sse2+0xc64>
.byte 102,69,15,254,235 // paddd %xmm11,%xmm13
- .byte 102,68,15,111,37,43,31,0,0 // movdqa 0x1f2b(%rip),%xmm12 # 4ad0 <_sk_callback_sse2+0xc70>
+ .byte 102,68,15,111,37,47,31,0,0 // movdqa 0x1f2f(%rip),%xmm12 # 4ad0 <_sk_callback_sse2+0xc74>
.byte 102,65,15,239,204 // pxor %xmm12,%xmm1
- .byte 102,15,111,29,46,31,0,0 // movdqa 0x1f2e(%rip),%xmm3 # 4ae0 <_sk_callback_sse2+0xc80>
+ .byte 102,15,111,29,50,31,0,0 // movdqa 0x1f32(%rip),%xmm3 # 4ae0 <_sk_callback_sse2+0xc84>
.byte 102,15,111,195 // movdqa %xmm3,%xmm0
.byte 102,15,102,193 // pcmpgtd %xmm1,%xmm0
.byte 102,65,15,223,197 // pandn %xmm13,%xmm0
@@ -26606,7 +26600,7 @@ _sk_gather_f16_sse2:
.byte 102,69,15,239,210 // pxor %xmm10,%xmm10
.byte 102,65,15,111,206 // movdqa %xmm14,%xmm1
.byte 102,65,15,97,202 // punpcklwd %xmm10,%xmm1
- .byte 102,68,15,111,13,188,29,0,0 // movdqa 0x1dbc(%rip),%xmm9 # 4af0 <_sk_callback_sse2+0xc90>
+ .byte 102,68,15,111,13,192,29,0,0 // movdqa 0x1dc0(%rip),%xmm9 # 4af0 <_sk_callback_sse2+0xc94>
.byte 102,15,111,193 // movdqa %xmm1,%xmm0
.byte 102,65,15,219,193 // pand %xmm9,%xmm0
.byte 102,15,239,200 // pxor %xmm0,%xmm1
@@ -26614,11 +26608,11 @@ _sk_gather_f16_sse2:
.byte 102,68,15,111,233 // movdqa %xmm1,%xmm13
.byte 102,65,15,114,245,13 // pslld $0xd,%xmm13
.byte 102,68,15,235,232 // por %xmm0,%xmm13
- .byte 102,68,15,111,29,161,29,0,0 // movdqa 0x1da1(%rip),%xmm11 # 4b00 <_sk_callback_sse2+0xca0>
+ .byte 102,68,15,111,29,165,29,0,0 // movdqa 0x1da5(%rip),%xmm11 # 4b00 <_sk_callback_sse2+0xca4>
.byte 102,69,15,254,235 // paddd %xmm11,%xmm13
- .byte 102,68,15,111,37,163,29,0,0 // movdqa 0x1da3(%rip),%xmm12 # 4b10 <_sk_callback_sse2+0xcb0>
+ .byte 102,68,15,111,37,167,29,0,0 // movdqa 0x1da7(%rip),%xmm12 # 4b10 <_sk_callback_sse2+0xcb4>
.byte 102,65,15,239,204 // pxor %xmm12,%xmm1
- .byte 102,15,111,29,166,29,0,0 // movdqa 0x1da6(%rip),%xmm3 # 4b20 <_sk_callback_sse2+0xcc0>
+ .byte 102,15,111,29,170,29,0,0 // movdqa 0x1daa(%rip),%xmm3 # 4b20 <_sk_callback_sse2+0xcc4>
.byte 102,15,111,195 // movdqa %xmm3,%xmm0
.byte 102,15,102,193 // pcmpgtd %xmm1,%xmm0
.byte 102,65,15,223,197 // pandn %xmm13,%xmm0
@@ -26671,17 +26665,17 @@ FUNCTION(_sk_store_f16_sse2)
_sk_store_f16_sse2:
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 72,139,0 // mov (%rax),%rax
- .byte 102,68,15,111,21,206,28,0,0 // movdqa 0x1cce(%rip),%xmm10 # 4b30 <_sk_callback_sse2+0xcd0>
+ .byte 102,68,15,111,21,210,28,0,0 // movdqa 0x1cd2(%rip),%xmm10 # 4b30 <_sk_callback_sse2+0xcd4>
.byte 102,68,15,111,224 // movdqa %xmm0,%xmm12
.byte 102,68,15,111,232 // movdqa %xmm0,%xmm13
.byte 102,69,15,219,234 // pand %xmm10,%xmm13
.byte 102,69,15,239,229 // pxor %xmm13,%xmm12
- .byte 102,68,15,111,13,193,28,0,0 // movdqa 0x1cc1(%rip),%xmm9 # 4b40 <_sk_callback_sse2+0xce0>
+ .byte 102,68,15,111,13,197,28,0,0 // movdqa 0x1cc5(%rip),%xmm9 # 4b40 <_sk_callback_sse2+0xce4>
.byte 102,65,15,114,213,16 // psrld $0x10,%xmm13
.byte 102,69,15,111,193 // movdqa %xmm9,%xmm8
.byte 102,69,15,102,196 // pcmpgtd %xmm12,%xmm8
.byte 102,65,15,114,212,13 // psrld $0xd,%xmm12
- .byte 102,68,15,111,29,178,28,0,0 // movdqa 0x1cb2(%rip),%xmm11 # 4b50 <_sk_callback_sse2+0xcf0>
+ .byte 102,68,15,111,29,182,28,0,0 // movdqa 0x1cb6(%rip),%xmm11 # 4b50 <_sk_callback_sse2+0xcf4>
.byte 102,69,15,235,235 // por %xmm11,%xmm13
.byte 102,69,15,254,236 // paddd %xmm12,%xmm13
.byte 102,65,15,114,245,16 // pslld $0x10,%xmm13
@@ -26760,7 +26754,7 @@ _sk_load_u16_be_sse2:
.byte 102,69,15,239,201 // pxor %xmm9,%xmm9
.byte 102,65,15,97,201 // punpcklwd %xmm9,%xmm1
.byte 15,91,193 // cvtdq2ps %xmm1,%xmm0
- .byte 68,15,40,5,80,27,0,0 // movaps 0x1b50(%rip),%xmm8 # 4b60 <_sk_callback_sse2+0xd00>
+ .byte 68,15,40,5,84,27,0,0 // movaps 0x1b54(%rip),%xmm8 # 4b60 <_sk_callback_sse2+0xd04>
.byte 65,15,89,192 // mulps %xmm8,%xmm0
.byte 102,15,111,203 // movdqa %xmm3,%xmm1
.byte 102,15,113,241,8 // psllw $0x8,%xmm1
@@ -26813,7 +26807,7 @@ _sk_load_rgb_u16_be_sse2:
.byte 102,69,15,239,192 // pxor %xmm8,%xmm8
.byte 102,65,15,97,192 // punpcklwd %xmm8,%xmm0
.byte 15,91,192 // cvtdq2ps %xmm0,%xmm0
- .byte 68,15,40,13,140,26,0,0 // movaps 0x1a8c(%rip),%xmm9 # 4b70 <_sk_callback_sse2+0xd10>
+ .byte 68,15,40,13,144,26,0,0 // movaps 0x1a90(%rip),%xmm9 # 4b70 <_sk_callback_sse2+0xd14>
.byte 65,15,89,193 // mulps %xmm9,%xmm0
.byte 102,15,111,203 // movdqa %xmm3,%xmm1
.byte 102,15,113,241,8 // psllw $0x8,%xmm1
@@ -26830,7 +26824,7 @@ _sk_load_rgb_u16_be_sse2:
.byte 15,91,210 // cvtdq2ps %xmm2,%xmm2
.byte 65,15,89,209 // mulps %xmm9,%xmm2
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 15,40,29,83,26,0,0 // movaps 0x1a53(%rip),%xmm3 # 4b80 <_sk_callback_sse2+0xd20>
+ .byte 15,40,29,87,26,0,0 // movaps 0x1a57(%rip),%xmm3 # 4b80 <_sk_callback_sse2+0xd24>
.byte 255,224 // jmpq *%rax
HIDDEN _sk_store_u16_be_sse2
@@ -26839,7 +26833,7 @@ FUNCTION(_sk_store_u16_be_sse2)
_sk_store_u16_be_sse2:
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 72,139,0 // mov (%rax),%rax
- .byte 68,15,40,13,84,26,0,0 // movaps 0x1a54(%rip),%xmm9 # 4b90 <_sk_callback_sse2+0xd30>
+ .byte 68,15,40,13,88,26,0,0 // movaps 0x1a58(%rip),%xmm9 # 4b90 <_sk_callback_sse2+0xd34>
.byte 68,15,40,192 // movaps %xmm0,%xmm8
.byte 69,15,89,193 // mulps %xmm9,%xmm8
.byte 102,69,15,91,192 // cvtps2dq %xmm8,%xmm8
@@ -26989,7 +26983,7 @@ _sk_repeat_x_sse2:
.byte 243,69,15,91,209 // cvttps2dq %xmm9,%xmm10
.byte 69,15,91,210 // cvtdq2ps %xmm10,%xmm10
.byte 69,15,194,202,1 // cmpltps %xmm10,%xmm9
- .byte 68,15,84,13,62,24,0,0 // andps 0x183e(%rip),%xmm9 # 4ba0 <_sk_callback_sse2+0xd40>
+ .byte 68,15,84,13,66,24,0,0 // andps 0x1842(%rip),%xmm9 # 4ba0 <_sk_callback_sse2+0xd44>
.byte 69,15,92,209 // subps %xmm9,%xmm10
.byte 69,15,89,208 // mulps %xmm8,%xmm10
.byte 65,15,92,194 // subps %xmm10,%xmm0
@@ -27011,7 +27005,7 @@ _sk_repeat_y_sse2:
.byte 243,69,15,91,209 // cvttps2dq %xmm9,%xmm10
.byte 69,15,91,210 // cvtdq2ps %xmm10,%xmm10
.byte 69,15,194,202,1 // cmpltps %xmm10,%xmm9
- .byte 68,15,84,13,6,24,0,0 // andps 0x1806(%rip),%xmm9 # 4bb0 <_sk_callback_sse2+0xd50>
+ .byte 68,15,84,13,10,24,0,0 // andps 0x180a(%rip),%xmm9 # 4bb0 <_sk_callback_sse2+0xd54>
.byte 69,15,92,209 // subps %xmm9,%xmm10
.byte 69,15,89,208 // mulps %xmm8,%xmm10
.byte 65,15,92,202 // subps %xmm10,%xmm1
@@ -27037,7 +27031,7 @@ _sk_mirror_x_sse2:
.byte 243,69,15,91,218 // cvttps2dq %xmm10,%xmm11
.byte 69,15,91,219 // cvtdq2ps %xmm11,%xmm11
.byte 69,15,194,211,1 // cmpltps %xmm11,%xmm10
- .byte 68,15,84,21,188,23,0,0 // andps 0x17bc(%rip),%xmm10 # 4bc0 <_sk_callback_sse2+0xd60>
+ .byte 68,15,84,21,192,23,0,0 // andps 0x17c0(%rip),%xmm10 # 4bc0 <_sk_callback_sse2+0xd64>
.byte 69,15,87,228 // xorps %xmm12,%xmm12
.byte 69,15,92,218 // subps %xmm10,%xmm11
.byte 69,15,89,216 // mulps %xmm8,%xmm11
@@ -27067,7 +27061,7 @@ _sk_mirror_y_sse2:
.byte 243,69,15,91,218 // cvttps2dq %xmm10,%xmm11
.byte 69,15,91,219 // cvtdq2ps %xmm11,%xmm11
.byte 69,15,194,211,1 // cmpltps %xmm11,%xmm10
- .byte 68,15,84,21,98,23,0,0 // andps 0x1762(%rip),%xmm10 # 4bd0 <_sk_callback_sse2+0xd70>
+ .byte 68,15,84,21,102,23,0,0 // andps 0x1766(%rip),%xmm10 # 4bd0 <_sk_callback_sse2+0xd74>
.byte 69,15,87,228 // xorps %xmm12,%xmm12
.byte 69,15,92,218 // subps %xmm10,%xmm11
.byte 69,15,89,216 // mulps %xmm8,%xmm11
@@ -27086,10 +27080,10 @@ HIDDEN _sk_luminance_to_alpha_sse2
FUNCTION(_sk_luminance_to_alpha_sse2)
_sk_luminance_to_alpha_sse2:
.byte 15,40,218 // movaps %xmm2,%xmm3
- .byte 15,89,5,58,23,0,0 // mulps 0x173a(%rip),%xmm0 # 4be0 <_sk_callback_sse2+0xd80>
- .byte 15,89,13,67,23,0,0 // mulps 0x1743(%rip),%xmm1 # 4bf0 <_sk_callback_sse2+0xd90>
+ .byte 15,89,5,62,23,0,0 // mulps 0x173e(%rip),%xmm0 # 4be0 <_sk_callback_sse2+0xd84>
+ .byte 15,89,13,71,23,0,0 // mulps 0x1747(%rip),%xmm1 # 4bf0 <_sk_callback_sse2+0xd94>
.byte 15,88,200 // addps %xmm0,%xmm1
- .byte 15,89,29,73,23,0,0 // mulps 0x1749(%rip),%xmm3 # 4c00 <_sk_callback_sse2+0xda0>
+ .byte 15,89,29,77,23,0,0 // mulps 0x174d(%rip),%xmm3 # 4c00 <_sk_callback_sse2+0xda4>
.byte 15,88,217 // addps %xmm1,%xmm3
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 15,87,192 // xorps %xmm0,%xmm0
@@ -27322,7 +27316,7 @@ _sk_linear_gradient_sse2:
.byte 69,15,198,228,0 // shufps $0x0,%xmm12,%xmm12
.byte 72,139,8 // mov (%rax),%rcx
.byte 72,133,201 // test %rcx,%rcx
- .byte 15,132,15,1,0,0 // je 396a <_sk_linear_gradient_sse2+0x149>
+ .byte 15,132,15,1,0,0 // je 3966 <_sk_linear_gradient_sse2+0x149>
.byte 72,139,64,8 // mov 0x8(%rax),%rax
.byte 72,131,192,32 // add $0x20,%rax
.byte 69,15,87,192 // xorps %xmm8,%xmm8
@@ -27383,8 +27377,8 @@ _sk_linear_gradient_sse2:
.byte 69,15,86,231 // orps %xmm15,%xmm12
.byte 72,131,192,36 // add $0x24,%rax
.byte 72,255,201 // dec %rcx
- .byte 15,133,8,255,255,255 // jne 3870 <_sk_linear_gradient_sse2+0x4f>
- .byte 235,13 // jmp 3977 <_sk_linear_gradient_sse2+0x156>
+ .byte 15,133,8,255,255,255 // jne 386c <_sk_linear_gradient_sse2+0x4f>
+ .byte 235,13 // jmp 3973 <_sk_linear_gradient_sse2+0x156>
.byte 15,87,201 // xorps %xmm1,%xmm1
.byte 15,87,210 // xorps %xmm2,%xmm2
.byte 15,87,219 // xorps %xmm3,%xmm3
@@ -27453,29 +27447,29 @@ _sk_xy_to_polar_unit_sse2:
.byte 69,15,94,220 // divps %xmm12,%xmm11
.byte 69,15,40,227 // movaps %xmm11,%xmm12
.byte 69,15,89,228 // mulps %xmm12,%xmm12
- .byte 68,15,40,45,193,17,0,0 // movaps 0x11c1(%rip),%xmm13 # 4c10 <_sk_callback_sse2+0xdb0>
+ .byte 68,15,40,45,197,17,0,0 // movaps 0x11c5(%rip),%xmm13 # 4c10 <_sk_callback_sse2+0xdb4>
.byte 69,15,89,236 // mulps %xmm12,%xmm13
- .byte 68,15,88,45,197,17,0,0 // addps 0x11c5(%rip),%xmm13 # 4c20 <_sk_callback_sse2+0xdc0>
+ .byte 68,15,88,45,201,17,0,0 // addps 0x11c9(%rip),%xmm13 # 4c20 <_sk_callback_sse2+0xdc4>
.byte 69,15,89,236 // mulps %xmm12,%xmm13
- .byte 68,15,88,45,201,17,0,0 // addps 0x11c9(%rip),%xmm13 # 4c30 <_sk_callback_sse2+0xdd0>
+ .byte 68,15,88,45,205,17,0,0 // addps 0x11cd(%rip),%xmm13 # 4c30 <_sk_callback_sse2+0xdd4>
.byte 69,15,89,236 // mulps %xmm12,%xmm13
- .byte 68,15,88,45,205,17,0,0 // addps 0x11cd(%rip),%xmm13 # 4c40 <_sk_callback_sse2+0xde0>
+ .byte 68,15,88,45,209,17,0,0 // addps 0x11d1(%rip),%xmm13 # 4c40 <_sk_callback_sse2+0xde4>
.byte 69,15,89,235 // mulps %xmm11,%xmm13
.byte 69,15,194,202,1 // cmpltps %xmm10,%xmm9
- .byte 68,15,40,21,204,17,0,0 // movaps 0x11cc(%rip),%xmm10 # 4c50 <_sk_callback_sse2+0xdf0>
+ .byte 68,15,40,21,208,17,0,0 // movaps 0x11d0(%rip),%xmm10 # 4c50 <_sk_callback_sse2+0xdf4>
.byte 69,15,92,213 // subps %xmm13,%xmm10
.byte 69,15,84,209 // andps %xmm9,%xmm10
.byte 69,15,85,205 // andnps %xmm13,%xmm9
.byte 69,15,86,202 // orps %xmm10,%xmm9
.byte 68,15,194,192,1 // cmpltps %xmm0,%xmm8
- .byte 68,15,40,21,191,17,0,0 // movaps 0x11bf(%rip),%xmm10 # 4c60 <_sk_callback_sse2+0xe00>
+ .byte 68,15,40,21,195,17,0,0 // movaps 0x11c3(%rip),%xmm10 # 4c60 <_sk_callback_sse2+0xe04>
.byte 69,15,92,209 // subps %xmm9,%xmm10
.byte 69,15,84,208 // andps %xmm8,%xmm10
.byte 69,15,85,193 // andnps %xmm9,%xmm8
.byte 69,15,86,194 // orps %xmm10,%xmm8
.byte 68,15,40,201 // movaps %xmm1,%xmm9
.byte 68,15,194,200,1 // cmpltps %xmm0,%xmm9
- .byte 68,15,40,21,174,17,0,0 // movaps 0x11ae(%rip),%xmm10 # 4c70 <_sk_callback_sse2+0xe10>
+ .byte 68,15,40,21,178,17,0,0 // movaps 0x11b2(%rip),%xmm10 # 4c70 <_sk_callback_sse2+0xe14>
.byte 69,15,92,208 // subps %xmm8,%xmm10
.byte 69,15,84,209 // andps %xmm9,%xmm10
.byte 69,15,85,200 // andnps %xmm8,%xmm9
@@ -27490,7 +27484,7 @@ HIDDEN _sk_save_xy_sse2
FUNCTION(_sk_save_xy_sse2)
_sk_save_xy_sse2:
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 68,15,40,5,151,17,0,0 // movaps 0x1197(%rip),%xmm8 # 4c80 <_sk_callback_sse2+0xe20>
+ .byte 68,15,40,5,155,17,0,0 // movaps 0x119b(%rip),%xmm8 # 4c80 <_sk_callback_sse2+0xe24>
.byte 15,17,0 // movups %xmm0,(%rax)
.byte 68,15,40,200 // movaps %xmm0,%xmm9
.byte 69,15,88,200 // addps %xmm8,%xmm9
@@ -27498,7 +27492,7 @@ _sk_save_xy_sse2:
.byte 69,15,91,210 // cvtdq2ps %xmm10,%xmm10
.byte 69,15,40,217 // movaps %xmm9,%xmm11
.byte 69,15,194,218,1 // cmpltps %xmm10,%xmm11
- .byte 68,15,40,37,130,17,0,0 // movaps 0x1182(%rip),%xmm12 # 4c90 <_sk_callback_sse2+0xe30>
+ .byte 68,15,40,37,134,17,0,0 // movaps 0x1186(%rip),%xmm12 # 4c90 <_sk_callback_sse2+0xe34>
.byte 69,15,84,220 // andps %xmm12,%xmm11
.byte 69,15,92,211 // subps %xmm11,%xmm10
.byte 69,15,92,202 // subps %xmm10,%xmm9
@@ -27545,8 +27539,8 @@ _sk_bilinear_nx_sse2:
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 15,16,0 // movups (%rax),%xmm0
.byte 68,15,16,64,64 // movups 0x40(%rax),%xmm8
- .byte 15,88,5,251,16,0,0 // addps 0x10fb(%rip),%xmm0 # 4ca0 <_sk_callback_sse2+0xe40>
- .byte 68,15,40,13,3,17,0,0 // movaps 0x1103(%rip),%xmm9 # 4cb0 <_sk_callback_sse2+0xe50>
+ .byte 15,88,5,255,16,0,0 // addps 0x10ff(%rip),%xmm0 # 4ca0 <_sk_callback_sse2+0xe44>
+ .byte 68,15,40,13,7,17,0,0 // movaps 0x1107(%rip),%xmm9 # 4cb0 <_sk_callback_sse2+0xe54>
.byte 69,15,92,200 // subps %xmm8,%xmm9
.byte 68,15,17,136,128,0,0,0 // movups %xmm9,0x80(%rax)
.byte 72,173 // lods %ds:(%rsi),%rax
@@ -27559,7 +27553,7 @@ _sk_bilinear_px_sse2:
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 15,16,0 // movups (%rax),%xmm0
.byte 68,15,16,64,64 // movups 0x40(%rax),%xmm8
- .byte 15,88,5,242,16,0,0 // addps 0x10f2(%rip),%xmm0 # 4cc0 <_sk_callback_sse2+0xe60>
+ .byte 15,88,5,246,16,0,0 // addps 0x10f6(%rip),%xmm0 # 4cc0 <_sk_callback_sse2+0xe64>
.byte 68,15,17,128,128,0,0,0 // movups %xmm8,0x80(%rax)
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 255,224 // jmpq *%rax
@@ -27571,8 +27565,8 @@ _sk_bilinear_ny_sse2:
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 15,16,72,32 // movups 0x20(%rax),%xmm1
.byte 68,15,16,64,96 // movups 0x60(%rax),%xmm8
- .byte 15,88,13,228,16,0,0 // addps 0x10e4(%rip),%xmm1 # 4cd0 <_sk_callback_sse2+0xe70>
- .byte 68,15,40,13,236,16,0,0 // movaps 0x10ec(%rip),%xmm9 # 4ce0 <_sk_callback_sse2+0xe80>
+ .byte 15,88,13,232,16,0,0 // addps 0x10e8(%rip),%xmm1 # 4cd0 <_sk_callback_sse2+0xe74>
+ .byte 68,15,40,13,240,16,0,0 // movaps 0x10f0(%rip),%xmm9 # 4ce0 <_sk_callback_sse2+0xe84>
.byte 69,15,92,200 // subps %xmm8,%xmm9
.byte 68,15,17,136,160,0,0,0 // movups %xmm9,0xa0(%rax)
.byte 72,173 // lods %ds:(%rsi),%rax
@@ -27585,7 +27579,7 @@ _sk_bilinear_py_sse2:
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 15,16,72,32 // movups 0x20(%rax),%xmm1
.byte 68,15,16,64,96 // movups 0x60(%rax),%xmm8
- .byte 15,88,13,218,16,0,0 // addps 0x10da(%rip),%xmm1 # 4cf0 <_sk_callback_sse2+0xe90>
+ .byte 15,88,13,222,16,0,0 // addps 0x10de(%rip),%xmm1 # 4cf0 <_sk_callback_sse2+0xe94>
.byte 68,15,17,128,160,0,0,0 // movups %xmm8,0xa0(%rax)
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 255,224 // jmpq *%rax
@@ -27597,13 +27591,13 @@ _sk_bicubic_n3x_sse2:
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 15,16,0 // movups (%rax),%xmm0
.byte 68,15,16,64,64 // movups 0x40(%rax),%xmm8
- .byte 15,88,5,205,16,0,0 // addps 0x10cd(%rip),%xmm0 # 4d00 <_sk_callback_sse2+0xea0>
- .byte 68,15,40,13,213,16,0,0 // movaps 0x10d5(%rip),%xmm9 # 4d10 <_sk_callback_sse2+0xeb0>
+ .byte 15,88,5,209,16,0,0 // addps 0x10d1(%rip),%xmm0 # 4d00 <_sk_callback_sse2+0xea4>
+ .byte 68,15,40,13,217,16,0,0 // movaps 0x10d9(%rip),%xmm9 # 4d10 <_sk_callback_sse2+0xeb4>
.byte 69,15,92,200 // subps %xmm8,%xmm9
.byte 69,15,40,193 // movaps %xmm9,%xmm8
.byte 69,15,89,192 // mulps %xmm8,%xmm8
- .byte 68,15,89,13,209,16,0,0 // mulps 0x10d1(%rip),%xmm9 # 4d20 <_sk_callback_sse2+0xec0>
- .byte 68,15,88,13,217,16,0,0 // addps 0x10d9(%rip),%xmm9 # 4d30 <_sk_callback_sse2+0xed0>
+ .byte 68,15,89,13,213,16,0,0 // mulps 0x10d5(%rip),%xmm9 # 4d20 <_sk_callback_sse2+0xec4>
+ .byte 68,15,88,13,221,16,0,0 // addps 0x10dd(%rip),%xmm9 # 4d30 <_sk_callback_sse2+0xed4>
.byte 69,15,89,200 // mulps %xmm8,%xmm9
.byte 68,15,17,136,128,0,0,0 // movups %xmm9,0x80(%rax)
.byte 72,173 // lods %ds:(%rsi),%rax
@@ -27616,16 +27610,16 @@ _sk_bicubic_n1x_sse2:
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 15,16,0 // movups (%rax),%xmm0
.byte 68,15,16,64,64 // movups 0x40(%rax),%xmm8
- .byte 15,88,5,200,16,0,0 // addps 0x10c8(%rip),%xmm0 # 4d40 <_sk_callback_sse2+0xee0>
- .byte 68,15,40,13,208,16,0,0 // movaps 0x10d0(%rip),%xmm9 # 4d50 <_sk_callback_sse2+0xef0>
+ .byte 15,88,5,204,16,0,0 // addps 0x10cc(%rip),%xmm0 # 4d40 <_sk_callback_sse2+0xee4>
+ .byte 68,15,40,13,212,16,0,0 // movaps 0x10d4(%rip),%xmm9 # 4d50 <_sk_callback_sse2+0xef4>
.byte 69,15,92,200 // subps %xmm8,%xmm9
- .byte 68,15,40,5,212,16,0,0 // movaps 0x10d4(%rip),%xmm8 # 4d60 <_sk_callback_sse2+0xf00>
+ .byte 68,15,40,5,216,16,0,0 // movaps 0x10d8(%rip),%xmm8 # 4d60 <_sk_callback_sse2+0xf04>
.byte 69,15,89,193 // mulps %xmm9,%xmm8
- .byte 68,15,88,5,216,16,0,0 // addps 0x10d8(%rip),%xmm8 # 4d70 <_sk_callback_sse2+0xf10>
+ .byte 68,15,88,5,220,16,0,0 // addps 0x10dc(%rip),%xmm8 # 4d70 <_sk_callback_sse2+0xf14>
.byte 69,15,89,193 // mulps %xmm9,%xmm8
- .byte 68,15,88,5,220,16,0,0 // addps 0x10dc(%rip),%xmm8 # 4d80 <_sk_callback_sse2+0xf20>
+ .byte 68,15,88,5,224,16,0,0 // addps 0x10e0(%rip),%xmm8 # 4d80 <_sk_callback_sse2+0xf24>
.byte 69,15,89,193 // mulps %xmm9,%xmm8
- .byte 68,15,88,5,224,16,0,0 // addps 0x10e0(%rip),%xmm8 # 4d90 <_sk_callback_sse2+0xf30>
+ .byte 68,15,88,5,228,16,0,0 // addps 0x10e4(%rip),%xmm8 # 4d90 <_sk_callback_sse2+0xf34>
.byte 68,15,17,128,128,0,0,0 // movups %xmm8,0x80(%rax)
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 255,224 // jmpq *%rax
@@ -27635,17 +27629,17 @@ HIDDEN _sk_bicubic_p1x_sse2
FUNCTION(_sk_bicubic_p1x_sse2)
_sk_bicubic_p1x_sse2:
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 68,15,40,5,218,16,0,0 // movaps 0x10da(%rip),%xmm8 # 4da0 <_sk_callback_sse2+0xf40>
+ .byte 68,15,40,5,222,16,0,0 // movaps 0x10de(%rip),%xmm8 # 4da0 <_sk_callback_sse2+0xf44>
.byte 15,16,0 // movups (%rax),%xmm0
.byte 68,15,16,72,64 // movups 0x40(%rax),%xmm9
.byte 65,15,88,192 // addps %xmm8,%xmm0
- .byte 68,15,40,21,214,16,0,0 // movaps 0x10d6(%rip),%xmm10 # 4db0 <_sk_callback_sse2+0xf50>
+ .byte 68,15,40,21,218,16,0,0 // movaps 0x10da(%rip),%xmm10 # 4db0 <_sk_callback_sse2+0xf54>
.byte 69,15,89,209 // mulps %xmm9,%xmm10
- .byte 68,15,88,21,218,16,0,0 // addps 0x10da(%rip),%xmm10 # 4dc0 <_sk_callback_sse2+0xf60>
+ .byte 68,15,88,21,222,16,0,0 // addps 0x10de(%rip),%xmm10 # 4dc0 <_sk_callback_sse2+0xf64>
.byte 69,15,89,209 // mulps %xmm9,%xmm10
.byte 69,15,88,208 // addps %xmm8,%xmm10
.byte 69,15,89,209 // mulps %xmm9,%xmm10
- .byte 68,15,88,21,214,16,0,0 // addps 0x10d6(%rip),%xmm10 # 4dd0 <_sk_callback_sse2+0xf70>
+ .byte 68,15,88,21,218,16,0,0 // addps 0x10da(%rip),%xmm10 # 4dd0 <_sk_callback_sse2+0xf74>
.byte 68,15,17,144,128,0,0,0 // movups %xmm10,0x80(%rax)
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 255,224 // jmpq *%rax
@@ -27657,11 +27651,11 @@ _sk_bicubic_p3x_sse2:
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 15,16,0 // movups (%rax),%xmm0
.byte 68,15,16,64,64 // movups 0x40(%rax),%xmm8
- .byte 15,88,5,201,16,0,0 // addps 0x10c9(%rip),%xmm0 # 4de0 <_sk_callback_sse2+0xf80>
+ .byte 15,88,5,205,16,0,0 // addps 0x10cd(%rip),%xmm0 # 4de0 <_sk_callback_sse2+0xf84>
.byte 69,15,40,200 // movaps %xmm8,%xmm9
.byte 69,15,89,201 // mulps %xmm9,%xmm9
- .byte 68,15,89,5,201,16,0,0 // mulps 0x10c9(%rip),%xmm8 # 4df0 <_sk_callback_sse2+0xf90>
- .byte 68,15,88,5,209,16,0,0 // addps 0x10d1(%rip),%xmm8 # 4e00 <_sk_callback_sse2+0xfa0>
+ .byte 68,15,89,5,205,16,0,0 // mulps 0x10cd(%rip),%xmm8 # 4df0 <_sk_callback_sse2+0xf94>
+ .byte 68,15,88,5,213,16,0,0 // addps 0x10d5(%rip),%xmm8 # 4e00 <_sk_callback_sse2+0xfa4>
.byte 69,15,89,193 // mulps %xmm9,%xmm8
.byte 68,15,17,128,128,0,0,0 // movups %xmm8,0x80(%rax)
.byte 72,173 // lods %ds:(%rsi),%rax
@@ -27674,13 +27668,13 @@ _sk_bicubic_n3y_sse2:
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 15,16,72,32 // movups 0x20(%rax),%xmm1
.byte 68,15,16,64,96 // movups 0x60(%rax),%xmm8
- .byte 15,88,13,191,16,0,0 // addps 0x10bf(%rip),%xmm1 # 4e10 <_sk_callback_sse2+0xfb0>
- .byte 68,15,40,13,199,16,0,0 // movaps 0x10c7(%rip),%xmm9 # 4e20 <_sk_callback_sse2+0xfc0>
+ .byte 15,88,13,195,16,0,0 // addps 0x10c3(%rip),%xmm1 # 4e10 <_sk_callback_sse2+0xfb4>
+ .byte 68,15,40,13,203,16,0,0 // movaps 0x10cb(%rip),%xmm9 # 4e20 <_sk_callback_sse2+0xfc4>
.byte 69,15,92,200 // subps %xmm8,%xmm9
.byte 69,15,40,193 // movaps %xmm9,%xmm8
.byte 69,15,89,192 // mulps %xmm8,%xmm8
- .byte 68,15,89,13,195,16,0,0 // mulps 0x10c3(%rip),%xmm9 # 4e30 <_sk_callback_sse2+0xfd0>
- .byte 68,15,88,13,203,16,0,0 // addps 0x10cb(%rip),%xmm9 # 4e40 <_sk_callback_sse2+0xfe0>
+ .byte 68,15,89,13,199,16,0,0 // mulps 0x10c7(%rip),%xmm9 # 4e30 <_sk_callback_sse2+0xfd4>
+ .byte 68,15,88,13,207,16,0,0 // addps 0x10cf(%rip),%xmm9 # 4e40 <_sk_callback_sse2+0xfe4>
.byte 69,15,89,200 // mulps %xmm8,%xmm9
.byte 68,15,17,136,160,0,0,0 // movups %xmm9,0xa0(%rax)
.byte 72,173 // lods %ds:(%rsi),%rax
@@ -27693,16 +27687,16 @@ _sk_bicubic_n1y_sse2:
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 15,16,72,32 // movups 0x20(%rax),%xmm1
.byte 68,15,16,64,96 // movups 0x60(%rax),%xmm8
- .byte 15,88,13,185,16,0,0 // addps 0x10b9(%rip),%xmm1 # 4e50 <_sk_callback_sse2+0xff0>
- .byte 68,15,40,13,193,16,0,0 // movaps 0x10c1(%rip),%xmm9 # 4e60 <_sk_callback_sse2+0x1000>
+ .byte 15,88,13,189,16,0,0 // addps 0x10bd(%rip),%xmm1 # 4e50 <_sk_callback_sse2+0xff4>
+ .byte 68,15,40,13,197,16,0,0 // movaps 0x10c5(%rip),%xmm9 # 4e60 <_sk_callback_sse2+0x1004>
.byte 69,15,92,200 // subps %xmm8,%xmm9
- .byte 68,15,40,5,197,16,0,0 // movaps 0x10c5(%rip),%xmm8 # 4e70 <_sk_callback_sse2+0x1010>
+ .byte 68,15,40,5,201,16,0,0 // movaps 0x10c9(%rip),%xmm8 # 4e70 <_sk_callback_sse2+0x1014>
.byte 69,15,89,193 // mulps %xmm9,%xmm8
- .byte 68,15,88,5,201,16,0,0 // addps 0x10c9(%rip),%xmm8 # 4e80 <_sk_callback_sse2+0x1020>
+ .byte 68,15,88,5,205,16,0,0 // addps 0x10cd(%rip),%xmm8 # 4e80 <_sk_callback_sse2+0x1024>
.byte 69,15,89,193 // mulps %xmm9,%xmm8
- .byte 68,15,88,5,205,16,0,0 // addps 0x10cd(%rip),%xmm8 # 4e90 <_sk_callback_sse2+0x1030>
+ .byte 68,15,88,5,209,16,0,0 // addps 0x10d1(%rip),%xmm8 # 4e90 <_sk_callback_sse2+0x1034>
.byte 69,15,89,193 // mulps %xmm9,%xmm8
- .byte 68,15,88,5,209,16,0,0 // addps 0x10d1(%rip),%xmm8 # 4ea0 <_sk_callback_sse2+0x1040>
+ .byte 68,15,88,5,213,16,0,0 // addps 0x10d5(%rip),%xmm8 # 4ea0 <_sk_callback_sse2+0x1044>
.byte 68,15,17,128,160,0,0,0 // movups %xmm8,0xa0(%rax)
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 255,224 // jmpq *%rax
@@ -27712,17 +27706,17 @@ HIDDEN _sk_bicubic_p1y_sse2
FUNCTION(_sk_bicubic_p1y_sse2)
_sk_bicubic_p1y_sse2:
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 68,15,40,5,203,16,0,0 // movaps 0x10cb(%rip),%xmm8 # 4eb0 <_sk_callback_sse2+0x1050>
+ .byte 68,15,40,5,207,16,0,0 // movaps 0x10cf(%rip),%xmm8 # 4eb0 <_sk_callback_sse2+0x1054>
.byte 15,16,72,32 // movups 0x20(%rax),%xmm1
.byte 68,15,16,72,96 // movups 0x60(%rax),%xmm9
.byte 65,15,88,200 // addps %xmm8,%xmm1
- .byte 68,15,40,21,198,16,0,0 // movaps 0x10c6(%rip),%xmm10 # 4ec0 <_sk_callback_sse2+0x1060>
+ .byte 68,15,40,21,202,16,0,0 // movaps 0x10ca(%rip),%xmm10 # 4ec0 <_sk_callback_sse2+0x1064>
.byte 69,15,89,209 // mulps %xmm9,%xmm10
- .byte 68,15,88,21,202,16,0,0 // addps 0x10ca(%rip),%xmm10 # 4ed0 <_sk_callback_sse2+0x1070>
+ .byte 68,15,88,21,206,16,0,0 // addps 0x10ce(%rip),%xmm10 # 4ed0 <_sk_callback_sse2+0x1074>
.byte 69,15,89,209 // mulps %xmm9,%xmm10
.byte 69,15,88,208 // addps %xmm8,%xmm10
.byte 69,15,89,209 // mulps %xmm9,%xmm10
- .byte 68,15,88,21,198,16,0,0 // addps 0x10c6(%rip),%xmm10 # 4ee0 <_sk_callback_sse2+0x1080>
+ .byte 68,15,88,21,202,16,0,0 // addps 0x10ca(%rip),%xmm10 # 4ee0 <_sk_callback_sse2+0x1084>
.byte 68,15,17,144,160,0,0,0 // movups %xmm10,0xa0(%rax)
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 255,224 // jmpq *%rax
@@ -27734,11 +27728,11 @@ _sk_bicubic_p3y_sse2:
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 15,16,72,32 // movups 0x20(%rax),%xmm1
.byte 68,15,16,64,96 // movups 0x60(%rax),%xmm8
- .byte 15,88,13,184,16,0,0 // addps 0x10b8(%rip),%xmm1 # 4ef0 <_sk_callback_sse2+0x1090>
+ .byte 15,88,13,188,16,0,0 // addps 0x10bc(%rip),%xmm1 # 4ef0 <_sk_callback_sse2+0x1094>
.byte 69,15,40,200 // movaps %xmm8,%xmm9
.byte 69,15,89,201 // mulps %xmm9,%xmm9
- .byte 68,15,89,5,184,16,0,0 // mulps 0x10b8(%rip),%xmm8 # 4f00 <_sk_callback_sse2+0x10a0>
- .byte 68,15,88,5,192,16,0,0 // addps 0x10c0(%rip),%xmm8 # 4f10 <_sk_callback_sse2+0x10b0>
+ .byte 68,15,89,5,188,16,0,0 // mulps 0x10bc(%rip),%xmm8 # 4f00 <_sk_callback_sse2+0x10a4>
+ .byte 68,15,88,5,196,16,0,0 // addps 0x10c4(%rip),%xmm8 # 4f10 <_sk_callback_sse2+0x10b4>
.byte 69,15,89,193 // mulps %xmm9,%xmm8
.byte 68,15,17,128,160,0,0,0 // movups %xmm8,0xa0(%rax)
.byte 72,173 // lods %ds:(%rsi),%rax
@@ -27851,15 +27845,16 @@ BALIGN16
.byte 0,0 // add %al,(%rax)
.byte 2,0 // add (%rax),%al
.byte 0,0 // add %al,(%rax)
- .byte 33,8 // and %ecx,(%rax)
- .byte 130 // (bad)
- .byte 60,33 // cmp $0x21,%al
- .byte 8,130,60,33,8,130 // or %al,-0x7df7dec4(%rdx)
- .byte 60,33 // cmp $0x21,%al
- .byte 8,130,60,0,0,0 // or %al,0x3c(%rdx)
- .byte 191,0,0,0,191 // mov $0xbf000000,%edi
.byte 0,0 // add %al,(%rax)
- .byte 0,191,0,0,0,191 // add %bh,-0x41000000(%rdi)
+ .byte 128,60,0,0 // cmpb $0x0,(%rax,%rax,1)
+ .byte 128,60,0,0 // cmpb $0x0,(%rax,%rax,1)
+ .byte 128,60,0,0 // cmpb $0x0,(%rax,%rax,1)
+ .byte 128,60,0,0 // cmpb $0x0,(%rax,%rax,1)
+ .byte 252 // cld
+ .byte 190,0,0,252,190 // mov $0xbefc0000,%esi
+ .byte 0,0 // add %al,(%rax)
+ .byte 252 // cld
+ .byte 190,0,0,252,190 // mov $0xbefc0000,%esi
.byte 0,0 // add %al,(%rax)
.byte 128,63,0 // cmpb $0x0,(%rdi)
.byte 0,128,63,0,0,128 // add %al,-0x7fffffc1(%rax)
@@ -28319,7 +28314,7 @@ BALIGN16
.byte 249 // stc
.byte 68,180,62 // rex.R mov $0x3e,%spl
.byte 163,233,220,63,163,233,220,63,163 // movabs %eax,0xa33fdce9a33fdce9
- .byte 233,220,63,163,233 // jmpq ffffffffe9a3840a <_sk_callback_sse2+0xffffffffe9a345aa>
+ .byte 233,220,63,163,233 // jmpq ffffffffe9a3840a <_sk_callback_sse2+0xffffffffe9a345ae>
.byte 220,63 // fdivrl (%rdi)
.byte 0,0 // add %al,(%rax)
.byte 128,63,0 // cmpb $0x0,(%rdi)
@@ -28414,7 +28409,7 @@ BALIGN16
.byte 249 // stc
.byte 68,180,62 // rex.R mov $0x3e,%spl
.byte 163,233,220,63,163,233,220,63,163 // movabs %eax,0xa33fdce9a33fdce9
- .byte 233,220,63,163,233 // jmpq ffffffffe9a384da <_sk_callback_sse2+0xffffffffe9a3467a>
+ .byte 233,220,63,163,233 // jmpq ffffffffe9a384da <_sk_callback_sse2+0xffffffffe9a3467e>
.byte 220,63 // fdivrl (%rdi)
.byte 0,0 // add %al,(%rax)
.byte 128,63,0 // cmpb $0x0,(%rdi)
@@ -28509,7 +28504,7 @@ BALIGN16
.byte 249 // stc
.byte 68,180,62 // rex.R mov $0x3e,%spl
.byte 163,233,220,63,163,233,220,63,163 // movabs %eax,0xa33fdce9a33fdce9
- .byte 233,220,63,163,233 // jmpq ffffffffe9a385aa <_sk_callback_sse2+0xffffffffe9a3474a>
+ .byte 233,220,63,163,233 // jmpq ffffffffe9a385aa <_sk_callback_sse2+0xffffffffe9a3474e>
.byte 220,63 // fdivrl (%rdi)
.byte 0,0 // add %al,(%rax)
.byte 128,63,0 // cmpb $0x0,(%rdi)
@@ -28604,7 +28599,7 @@ BALIGN16
.byte 249 // stc
.byte 68,180,62 // rex.R mov $0x3e,%spl
.byte 163,233,220,63,163,233,220,63,163 // movabs %eax,0xa33fdce9a33fdce9
- .byte 233,220,63,163,233 // jmpq ffffffffe9a3867a <_sk_callback_sse2+0xffffffffe9a3481a>
+ .byte 233,220,63,163,233 // jmpq ffffffffe9a3867a <_sk_callback_sse2+0xffffffffe9a3481e>
.byte 220,63 // fdivrl (%rdi)
.byte 0,0 // add %al,(%rax)
.byte 128,63,0 // cmpb $0x0,(%rdi)
@@ -29279,7 +29274,7 @@ BALIGN16
.byte 0,0 // add %al,(%rax)
.byte 0,63 // add %bh,(%rdi)
.byte 57,142,99,61,57,142 // cmp %ecx,-0x71c6c29d(%rsi)
- .byte 99,61,57,142,99,61 // movslq 0x3d638e39(%rip),%edi # 3d63dbd5 <_sk_callback_sse2+0x3d639d75>
+ .byte 99,61,57,142,99,61 // movslq 0x3d638e39(%rip),%edi # 3d63dbd5 <_sk_callback_sse2+0x3d639d79>
.byte 57,142,99,61,0,0 // cmp %ecx,0x3d63(%rsi)
.byte 0,63 // add %bh,(%rdi)
.byte 0,0 // add %al,(%rax)
@@ -29305,7 +29300,7 @@ BALIGN16
.byte 0,192 // add %al,%al
.byte 63 // (bad)
.byte 57,142,99,61,57,142 // cmp %ecx,-0x71c6c29d(%rsi)
- .byte 99,61,57,142,99,61 // movslq 0x3d638e39(%rip),%edi # 3d63dc15 <_sk_callback_sse2+0x3d639db5>
+ .byte 99,61,57,142,99,61 // movslq 0x3d638e39(%rip),%edi # 3d63dc15 <_sk_callback_sse2+0x3d639db9>
.byte 57,142,99,61,0,0 // cmp %ecx,0x3d63(%rsi)
.byte 192,63,0 // sarb $0x0,(%rdi)
.byte 0,192 // add %al,%al
@@ -29389,7 +29384,7 @@ BALIGN16
.byte 0,0 // add %al,(%rax)
.byte 0,63 // add %bh,(%rdi)
.byte 57,142,99,61,57,142 // cmp %ecx,-0x71c6c29d(%rsi)
- .byte 99,61,57,142,99,61 // movslq 0x3d638e39(%rip),%edi # 3d63dce5 <_sk_callback_sse2+0x3d639e85>
+ .byte 99,61,57,142,99,61 // movslq 0x3d638e39(%rip),%edi # 3d63dce5 <_sk_callback_sse2+0x3d639e89>
.byte 57,142,99,61,0,0 // cmp %ecx,0x3d63(%rsi)
.byte 0,63 // add %bh,(%rdi)
.byte 0,0 // add %al,(%rax)
@@ -29415,7 +29410,7 @@ BALIGN16
.byte 0,192 // add %al,%al
.byte 63 // (bad)
.byte 57,142,99,61,57,142 // cmp %ecx,-0x71c6c29d(%rsi)
- .byte 99,61,57,142,99,61 // movslq 0x3d638e39(%rip),%edi # 3d63dd25 <_sk_callback_sse2+0x3d639ec5>
+ .byte 99,61,57,142,99,61 // movslq 0x3d638e39(%rip),%edi # 3d63dd25 <_sk_callback_sse2+0x3d639ec9>
.byte 57,142,99,61,0,0 // cmp %ecx,0x3d63(%rsi)
.byte 192,63,0 // sarb $0x0,(%rdi)
.byte 0,192 // add %al,%al
@@ -29426,11 +29421,11 @@ BALIGN16
.byte 63 // (bad)
.byte 114,28 // jb 4f1e <.literal16+0xfde>
.byte 199 // (bad)
- .byte 62,114,28 // jb,pt 4f22 <_sk_callback_sse2+0x10c2>
+ .byte 62,114,28 // jb,pt 4f22 <_sk_callback_sse2+0x10c6>
.byte 199 // (bad)
- .byte 62,114,28 // jb,pt 4f26 <_sk_callback_sse2+0x10c6>
+ .byte 62,114,28 // jb,pt 4f26 <_sk_callback_sse2+0x10ca>
.byte 199 // (bad)
- .byte 62,114,28 // jb,pt 4f2a <_sk_callback_sse2+0x10ca>
+ .byte 62,114,28 // jb,pt 4f2a <_sk_callback_sse2+0x10ce>
.byte 199 // (bad)
.byte 62,171 // ds stos %eax,%es:(%rdi)
.byte 170 // stos %al,%es:(%rdi)
diff --git a/src/jumper/SkJumper_generated_win.S b/src/jumper/SkJumper_generated_win.S
index 378412e079..74fcd7bb56 100644
--- a/src/jumper/SkJumper_generated_win.S
+++ b/src/jumper/SkJumper_generated_win.S
@@ -106,14 +106,14 @@ _sk_seed_shader_hsw LABEL PROC
DB 197,249,110,199 ; vmovd %edi,%xmm0
DB 196,226,125,88,192 ; vpbroadcastd %xmm0,%ymm0
DB 197,252,91,192 ; vcvtdq2ps %ymm0,%ymm0
- DB 196,226,125,24,13,178,61,0,0 ; vbroadcastss 0x3db2(%rip),%ymm1 # 3f0c <_sk_callback_hsw+0x11b>
+ DB 196,226,125,24,13,174,61,0,0 ; vbroadcastss 0x3dae(%rip),%ymm1 # 3f08 <_sk_callback_hsw+0x11b>
DB 197,252,88,193 ; vaddps %ymm1,%ymm0,%ymm0
DB 197,252,88,2 ; vaddps (%rdx),%ymm0,%ymm0
DB 196,226,125,24,16 ; vbroadcastss (%rax),%ymm2
DB 197,252,91,210 ; vcvtdq2ps %ymm2,%ymm2
DB 197,236,88,201 ; vaddps %ymm1,%ymm2,%ymm1
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,21,150,61,0,0 ; vbroadcastss 0x3d96(%rip),%ymm2 # 3f10 <_sk_callback_hsw+0x11f>
+ DB 196,226,125,24,21,146,61,0,0 ; vbroadcastss 0x3d92(%rip),%ymm2 # 3f0c <_sk_callback_hsw+0x11f>
DB 197,228,87,219 ; vxorps %ymm3,%ymm3,%ymm3
DB 197,220,87,228 ; vxorps %ymm4,%ymm4,%ymm4
DB 197,212,87,237 ; vxorps %ymm5,%ymm5,%ymm5
@@ -132,13 +132,13 @@ _sk_dither_hsw LABEL PROC
DB 76,139,0 ; mov (%rax),%r8
DB 196,66,125,88,8 ; vpbroadcastd (%r8),%ymm9
DB 196,65,61,239,201 ; vpxor %ymm9,%ymm8,%ymm9
- DB 196,98,125,88,21,85,61,0,0 ; vpbroadcastd 0x3d55(%rip),%ymm10 # 3f14 <_sk_callback_hsw+0x123>
+ DB 196,98,125,88,21,81,61,0,0 ; vpbroadcastd 0x3d51(%rip),%ymm10 # 3f10 <_sk_callback_hsw+0x123>
DB 196,65,53,219,218 ; vpand %ymm10,%ymm9,%ymm11
DB 196,193,37,114,243,5 ; vpslld $0x5,%ymm11,%ymm11
DB 196,65,61,219,210 ; vpand %ymm10,%ymm8,%ymm10
DB 196,193,45,114,242,4 ; vpslld $0x4,%ymm10,%ymm10
- DB 196,98,125,88,37,58,61,0,0 ; vpbroadcastd 0x3d3a(%rip),%ymm12 # 3f18 <_sk_callback_hsw+0x127>
- DB 196,98,125,88,45,53,61,0,0 ; vpbroadcastd 0x3d35(%rip),%ymm13 # 3f1c <_sk_callback_hsw+0x12b>
+ DB 196,98,125,88,37,54,61,0,0 ; vpbroadcastd 0x3d36(%rip),%ymm12 # 3f14 <_sk_callback_hsw+0x127>
+ DB 196,98,125,88,45,49,61,0,0 ; vpbroadcastd 0x3d31(%rip),%ymm13 # 3f18 <_sk_callback_hsw+0x12b>
DB 196,65,53,219,245 ; vpand %ymm13,%ymm9,%ymm14
DB 196,193,13,114,246,2 ; vpslld $0x2,%ymm14,%ymm14
DB 196,65,61,219,237 ; vpand %ymm13,%ymm8,%ymm13
@@ -153,12 +153,11 @@ _sk_dither_hsw LABEL PROC
DB 196,65,61,235,194 ; vpor %ymm10,%ymm8,%ymm8
DB 196,65,61,235,193 ; vpor %ymm9,%ymm8,%ymm8
DB 196,65,124,91,192 ; vcvtdq2ps %ymm8,%ymm8
- DB 196,98,125,24,13,231,60,0,0 ; vbroadcastss 0x3ce7(%rip),%ymm9 # 3f20 <_sk_callback_hsw+0x12f>
- DB 196,98,125,24,21,226,60,0,0 ; vbroadcastss 0x3ce2(%rip),%ymm10 # 3f24 <_sk_callback_hsw+0x133>
+ DB 196,98,125,24,13,227,60,0,0 ; vbroadcastss 0x3ce3(%rip),%ymm9 # 3f1c <_sk_callback_hsw+0x12f>
+ DB 196,98,125,24,21,222,60,0,0 ; vbroadcastss 0x3cde(%rip),%ymm10 # 3f20 <_sk_callback_hsw+0x133>
DB 196,66,61,184,209 ; vfmadd231ps %ymm9,%ymm8,%ymm10
DB 196,98,125,24,64,8 ; vbroadcastss 0x8(%rax),%ymm8
DB 196,65,60,89,194 ; vmulps %ymm10,%ymm8,%ymm8
- DB 197,60,89,195 ; vmulps %ymm3,%ymm8,%ymm8
DB 197,188,88,192 ; vaddps %ymm0,%ymm8,%ymm0
DB 197,188,88,201 ; vaddps %ymm1,%ymm8,%ymm1
DB 197,188,88,210 ; vaddps %ymm2,%ymm8,%ymm2
@@ -187,7 +186,7 @@ _sk_clear_hsw LABEL PROC
PUBLIC _sk_srcatop_hsw
_sk_srcatop_hsw LABEL PROC
DB 197,252,89,199 ; vmulps %ymm7,%ymm0,%ymm0
- DB 196,98,125,24,5,132,60,0,0 ; vbroadcastss 0x3c84(%rip),%ymm8 # 3f28 <_sk_callback_hsw+0x137>
+ DB 196,98,125,24,5,132,60,0,0 ; vbroadcastss 0x3c84(%rip),%ymm8 # 3f24 <_sk_callback_hsw+0x137>
DB 197,60,92,195 ; vsubps %ymm3,%ymm8,%ymm8
DB 196,226,61,184,196 ; vfmadd231ps %ymm4,%ymm8,%ymm0
DB 197,244,89,207 ; vmulps %ymm7,%ymm1,%ymm1
@@ -201,7 +200,7 @@ _sk_srcatop_hsw LABEL PROC
PUBLIC _sk_dstatop_hsw
_sk_dstatop_hsw LABEL PROC
- DB 196,98,125,24,5,87,60,0,0 ; vbroadcastss 0x3c57(%rip),%ymm8 # 3f2c <_sk_callback_hsw+0x13b>
+ DB 196,98,125,24,5,87,60,0,0 ; vbroadcastss 0x3c57(%rip),%ymm8 # 3f28 <_sk_callback_hsw+0x13b>
DB 197,60,92,199 ; vsubps %ymm7,%ymm8,%ymm8
DB 197,188,89,192 ; vmulps %ymm0,%ymm8,%ymm0
DB 196,226,101,184,196 ; vfmadd231ps %ymm4,%ymm3,%ymm0
@@ -234,7 +233,7 @@ _sk_dstin_hsw LABEL PROC
PUBLIC _sk_srcout_hsw
_sk_srcout_hsw LABEL PROC
- DB 196,98,125,24,5,254,59,0,0 ; vbroadcastss 0x3bfe(%rip),%ymm8 # 3f30 <_sk_callback_hsw+0x13f>
+ DB 196,98,125,24,5,254,59,0,0 ; vbroadcastss 0x3bfe(%rip),%ymm8 # 3f2c <_sk_callback_hsw+0x13f>
DB 197,60,92,199 ; vsubps %ymm7,%ymm8,%ymm8
DB 197,188,89,192 ; vmulps %ymm0,%ymm8,%ymm0
DB 197,188,89,201 ; vmulps %ymm1,%ymm8,%ymm1
@@ -245,7 +244,7 @@ _sk_srcout_hsw LABEL PROC
PUBLIC _sk_dstout_hsw
_sk_dstout_hsw LABEL PROC
- DB 196,226,125,24,5,225,59,0,0 ; vbroadcastss 0x3be1(%rip),%ymm0 # 3f34 <_sk_callback_hsw+0x143>
+ DB 196,226,125,24,5,225,59,0,0 ; vbroadcastss 0x3be1(%rip),%ymm0 # 3f30 <_sk_callback_hsw+0x143>
DB 197,252,92,219 ; vsubps %ymm3,%ymm0,%ymm3
DB 197,228,89,196 ; vmulps %ymm4,%ymm3,%ymm0
DB 197,228,89,205 ; vmulps %ymm5,%ymm3,%ymm1
@@ -256,7 +255,7 @@ _sk_dstout_hsw LABEL PROC
PUBLIC _sk_srcover_hsw
_sk_srcover_hsw LABEL PROC
- DB 196,98,125,24,5,196,59,0,0 ; vbroadcastss 0x3bc4(%rip),%ymm8 # 3f38 <_sk_callback_hsw+0x147>
+ DB 196,98,125,24,5,196,59,0,0 ; vbroadcastss 0x3bc4(%rip),%ymm8 # 3f34 <_sk_callback_hsw+0x147>
DB 197,60,92,195 ; vsubps %ymm3,%ymm8,%ymm8
DB 196,194,93,184,192 ; vfmadd231ps %ymm8,%ymm4,%ymm0
DB 196,194,85,184,200 ; vfmadd231ps %ymm8,%ymm5,%ymm1
@@ -267,7 +266,7 @@ _sk_srcover_hsw LABEL PROC
PUBLIC _sk_dstover_hsw
_sk_dstover_hsw LABEL PROC
- DB 196,98,125,24,5,163,59,0,0 ; vbroadcastss 0x3ba3(%rip),%ymm8 # 3f3c <_sk_callback_hsw+0x14b>
+ DB 196,98,125,24,5,163,59,0,0 ; vbroadcastss 0x3ba3(%rip),%ymm8 # 3f38 <_sk_callback_hsw+0x14b>
DB 197,60,92,199 ; vsubps %ymm7,%ymm8,%ymm8
DB 196,226,61,168,196 ; vfmadd213ps %ymm4,%ymm8,%ymm0
DB 196,226,61,168,205 ; vfmadd213ps %ymm5,%ymm8,%ymm1
@@ -287,7 +286,7 @@ _sk_modulate_hsw LABEL PROC
PUBLIC _sk_multiply_hsw
_sk_multiply_hsw LABEL PROC
- DB 196,98,125,24,5,110,59,0,0 ; vbroadcastss 0x3b6e(%rip),%ymm8 # 3f40 <_sk_callback_hsw+0x14f>
+ DB 196,98,125,24,5,110,59,0,0 ; vbroadcastss 0x3b6e(%rip),%ymm8 # 3f3c <_sk_callback_hsw+0x14f>
DB 197,60,92,207 ; vsubps %ymm7,%ymm8,%ymm9
DB 197,52,89,208 ; vmulps %ymm0,%ymm9,%ymm10
DB 197,60,92,195 ; vsubps %ymm3,%ymm8,%ymm8
@@ -329,7 +328,7 @@ _sk_screen_hsw LABEL PROC
PUBLIC _sk_xor__hsw
_sk_xor__hsw LABEL PROC
- DB 196,98,125,24,5,233,58,0,0 ; vbroadcastss 0x3ae9(%rip),%ymm8 # 3f44 <_sk_callback_hsw+0x153>
+ DB 196,98,125,24,5,233,58,0,0 ; vbroadcastss 0x3ae9(%rip),%ymm8 # 3f40 <_sk_callback_hsw+0x153>
DB 197,60,92,207 ; vsubps %ymm7,%ymm8,%ymm9
DB 197,180,89,192 ; vmulps %ymm0,%ymm9,%ymm0
DB 197,60,92,195 ; vsubps %ymm3,%ymm8,%ymm8
@@ -361,7 +360,7 @@ _sk_darken_hsw LABEL PROC
DB 197,100,89,206 ; vmulps %ymm6,%ymm3,%ymm9
DB 196,193,108,95,209 ; vmaxps %ymm9,%ymm2,%ymm2
DB 197,188,92,210 ; vsubps %ymm2,%ymm8,%ymm2
- DB 196,98,125,24,5,113,58,0,0 ; vbroadcastss 0x3a71(%rip),%ymm8 # 3f48 <_sk_callback_hsw+0x157>
+ DB 196,98,125,24,5,113,58,0,0 ; vbroadcastss 0x3a71(%rip),%ymm8 # 3f44 <_sk_callback_hsw+0x157>
DB 197,60,92,195 ; vsubps %ymm3,%ymm8,%ymm8
DB 196,194,69,184,216 ; vfmadd231ps %ymm8,%ymm7,%ymm3
DB 72,173 ; lods %ds:(%rsi),%rax
@@ -384,7 +383,7 @@ _sk_lighten_hsw LABEL PROC
DB 197,100,89,206 ; vmulps %ymm6,%ymm3,%ymm9
DB 196,193,108,93,209 ; vminps %ymm9,%ymm2,%ymm2
DB 197,188,92,210 ; vsubps %ymm2,%ymm8,%ymm2
- DB 196,98,125,24,5,32,58,0,0 ; vbroadcastss 0x3a20(%rip),%ymm8 # 3f4c <_sk_callback_hsw+0x15b>
+ DB 196,98,125,24,5,32,58,0,0 ; vbroadcastss 0x3a20(%rip),%ymm8 # 3f48 <_sk_callback_hsw+0x15b>
DB 197,60,92,195 ; vsubps %ymm3,%ymm8,%ymm8
DB 196,194,69,184,216 ; vfmadd231ps %ymm8,%ymm7,%ymm3
DB 72,173 ; lods %ds:(%rsi),%rax
@@ -410,7 +409,7 @@ _sk_difference_hsw LABEL PROC
DB 196,193,108,93,209 ; vminps %ymm9,%ymm2,%ymm2
DB 197,236,88,210 ; vaddps %ymm2,%ymm2,%ymm2
DB 197,188,92,210 ; vsubps %ymm2,%ymm8,%ymm2
- DB 196,98,125,24,5,195,57,0,0 ; vbroadcastss 0x39c3(%rip),%ymm8 # 3f50 <_sk_callback_hsw+0x15f>
+ DB 196,98,125,24,5,195,57,0,0 ; vbroadcastss 0x39c3(%rip),%ymm8 # 3f4c <_sk_callback_hsw+0x15f>
DB 197,60,92,195 ; vsubps %ymm3,%ymm8,%ymm8
DB 196,194,69,184,216 ; vfmadd231ps %ymm8,%ymm7,%ymm3
DB 72,173 ; lods %ds:(%rsi),%rax
@@ -430,7 +429,7 @@ _sk_exclusion_hsw LABEL PROC
DB 197,236,89,214 ; vmulps %ymm6,%ymm2,%ymm2
DB 197,236,88,210 ; vaddps %ymm2,%ymm2,%ymm2
DB 197,188,92,210 ; vsubps %ymm2,%ymm8,%ymm2
- DB 196,98,125,24,5,129,57,0,0 ; vbroadcastss 0x3981(%rip),%ymm8 # 3f54 <_sk_callback_hsw+0x163>
+ DB 196,98,125,24,5,129,57,0,0 ; vbroadcastss 0x3981(%rip),%ymm8 # 3f50 <_sk_callback_hsw+0x163>
DB 197,60,92,195 ; vsubps %ymm3,%ymm8,%ymm8
DB 196,194,69,184,216 ; vfmadd231ps %ymm8,%ymm7,%ymm3
DB 72,173 ; lods %ds:(%rsi),%rax
@@ -438,7 +437,7 @@ _sk_exclusion_hsw LABEL PROC
PUBLIC _sk_colorburn_hsw
_sk_colorburn_hsw LABEL PROC
- DB 196,98,125,24,5,111,57,0,0 ; vbroadcastss 0x396f(%rip),%ymm8 # 3f58 <_sk_callback_hsw+0x167>
+ DB 196,98,125,24,5,111,57,0,0 ; vbroadcastss 0x396f(%rip),%ymm8 # 3f54 <_sk_callback_hsw+0x167>
DB 197,60,92,207 ; vsubps %ymm7,%ymm8,%ymm9
DB 197,52,89,216 ; vmulps %ymm0,%ymm9,%ymm11
DB 196,65,44,87,210 ; vxorps %ymm10,%ymm10,%ymm10
@@ -494,7 +493,7 @@ _sk_colorburn_hsw LABEL PROC
PUBLIC _sk_colordodge_hsw
_sk_colordodge_hsw LABEL PROC
DB 196,65,60,87,192 ; vxorps %ymm8,%ymm8,%ymm8
- DB 196,98,125,24,13,122,56,0,0 ; vbroadcastss 0x387a(%rip),%ymm9 # 3f5c <_sk_callback_hsw+0x16b>
+ DB 196,98,125,24,13,122,56,0,0 ; vbroadcastss 0x387a(%rip),%ymm9 # 3f58 <_sk_callback_hsw+0x16b>
DB 197,52,92,215 ; vsubps %ymm7,%ymm9,%ymm10
DB 197,44,89,216 ; vmulps %ymm0,%ymm10,%ymm11
DB 197,52,92,203 ; vsubps %ymm3,%ymm9,%ymm9
@@ -545,7 +544,7 @@ _sk_colordodge_hsw LABEL PROC
PUBLIC _sk_hardlight_hsw
_sk_hardlight_hsw LABEL PROC
- DB 196,98,125,24,5,155,55,0,0 ; vbroadcastss 0x379b(%rip),%ymm8 # 3f60 <_sk_callback_hsw+0x16f>
+ DB 196,98,125,24,5,155,55,0,0 ; vbroadcastss 0x379b(%rip),%ymm8 # 3f5c <_sk_callback_hsw+0x16f>
DB 197,60,92,215 ; vsubps %ymm7,%ymm8,%ymm10
DB 197,44,89,216 ; vmulps %ymm0,%ymm10,%ymm11
DB 197,60,92,195 ; vsubps %ymm3,%ymm8,%ymm8
@@ -594,7 +593,7 @@ _sk_hardlight_hsw LABEL PROC
PUBLIC _sk_overlay_hsw
_sk_overlay_hsw LABEL PROC
- DB 196,98,125,24,5,211,54,0,0 ; vbroadcastss 0x36d3(%rip),%ymm8 # 3f64 <_sk_callback_hsw+0x173>
+ DB 196,98,125,24,5,211,54,0,0 ; vbroadcastss 0x36d3(%rip),%ymm8 # 3f60 <_sk_callback_hsw+0x173>
DB 197,60,92,215 ; vsubps %ymm7,%ymm8,%ymm10
DB 197,44,89,216 ; vmulps %ymm0,%ymm10,%ymm11
DB 197,60,92,195 ; vsubps %ymm3,%ymm8,%ymm8
@@ -654,10 +653,10 @@ _sk_softlight_hsw LABEL PROC
DB 196,65,20,88,197 ; vaddps %ymm13,%ymm13,%ymm8
DB 196,65,60,88,192 ; vaddps %ymm8,%ymm8,%ymm8
DB 196,66,61,168,192 ; vfmadd213ps %ymm8,%ymm8,%ymm8
- DB 196,98,125,24,29,218,53,0,0 ; vbroadcastss 0x35da(%rip),%ymm11 # 3f6c <_sk_callback_hsw+0x17b>
+ DB 196,98,125,24,29,218,53,0,0 ; vbroadcastss 0x35da(%rip),%ymm11 # 3f68 <_sk_callback_hsw+0x17b>
DB 196,65,20,88,227 ; vaddps %ymm11,%ymm13,%ymm12
DB 196,65,28,89,192 ; vmulps %ymm8,%ymm12,%ymm8
- DB 196,98,125,24,37,203,53,0,0 ; vbroadcastss 0x35cb(%rip),%ymm12 # 3f70 <_sk_callback_hsw+0x17f>
+ DB 196,98,125,24,37,203,53,0,0 ; vbroadcastss 0x35cb(%rip),%ymm12 # 3f6c <_sk_callback_hsw+0x17f>
DB 196,66,21,184,196 ; vfmadd231ps %ymm12,%ymm13,%ymm8
DB 196,65,124,82,245 ; vrsqrtps %ymm13,%ymm14
DB 196,65,124,83,246 ; vrcpps %ymm14,%ymm14
@@ -667,7 +666,7 @@ _sk_softlight_hsw LABEL PROC
DB 197,4,194,255,2 ; vcmpleps %ymm7,%ymm15,%ymm15
DB 196,67,13,74,240,240 ; vblendvps %ymm15,%ymm8,%ymm14,%ymm14
DB 197,116,88,249 ; vaddps %ymm1,%ymm1,%ymm15
- DB 196,98,125,24,5,142,53,0,0 ; vbroadcastss 0x358e(%rip),%ymm8 # 3f68 <_sk_callback_hsw+0x177>
+ DB 196,98,125,24,5,142,53,0,0 ; vbroadcastss 0x358e(%rip),%ymm8 # 3f64 <_sk_callback_hsw+0x177>
DB 196,65,60,92,237 ; vsubps %ymm13,%ymm8,%ymm13
DB 197,132,92,195 ; vsubps %ymm3,%ymm15,%ymm0
DB 196,98,125,168,235 ; vfmadd213ps %ymm3,%ymm0,%ymm13
@@ -757,7 +756,7 @@ _sk_clamp_0_hsw LABEL PROC
PUBLIC _sk_clamp_1_hsw
_sk_clamp_1_hsw LABEL PROC
- DB 196,98,125,24,5,17,52,0,0 ; vbroadcastss 0x3411(%rip),%ymm8 # 3f74 <_sk_callback_hsw+0x183>
+ DB 196,98,125,24,5,17,52,0,0 ; vbroadcastss 0x3411(%rip),%ymm8 # 3f70 <_sk_callback_hsw+0x183>
DB 196,193,124,93,192 ; vminps %ymm8,%ymm0,%ymm0
DB 196,193,116,93,200 ; vminps %ymm8,%ymm1,%ymm1
DB 196,193,108,93,208 ; vminps %ymm8,%ymm2,%ymm2
@@ -767,7 +766,7 @@ _sk_clamp_1_hsw LABEL PROC
PUBLIC _sk_clamp_a_hsw
_sk_clamp_a_hsw LABEL PROC
- DB 196,98,125,24,5,244,51,0,0 ; vbroadcastss 0x33f4(%rip),%ymm8 # 3f78 <_sk_callback_hsw+0x187>
+ DB 196,98,125,24,5,244,51,0,0 ; vbroadcastss 0x33f4(%rip),%ymm8 # 3f74 <_sk_callback_hsw+0x187>
DB 196,193,100,93,216 ; vminps %ymm8,%ymm3,%ymm3
DB 197,252,93,195 ; vminps %ymm3,%ymm0,%ymm0
DB 197,244,93,203 ; vminps %ymm3,%ymm1,%ymm1
@@ -839,7 +838,7 @@ PUBLIC _sk_unpremul_hsw
_sk_unpremul_hsw LABEL PROC
DB 196,65,60,87,192 ; vxorps %ymm8,%ymm8,%ymm8
DB 196,65,100,194,200,0 ; vcmpeqps %ymm8,%ymm3,%ymm9
- DB 196,98,125,24,21,60,51,0,0 ; vbroadcastss 0x333c(%rip),%ymm10 # 3f7c <_sk_callback_hsw+0x18b>
+ DB 196,98,125,24,21,60,51,0,0 ; vbroadcastss 0x333c(%rip),%ymm10 # 3f78 <_sk_callback_hsw+0x18b>
DB 197,44,94,211 ; vdivps %ymm3,%ymm10,%ymm10
DB 196,67,45,74,192,144 ; vblendvps %ymm9,%ymm8,%ymm10,%ymm8
DB 197,188,89,192 ; vmulps %ymm0,%ymm8,%ymm0
@@ -850,16 +849,16 @@ _sk_unpremul_hsw LABEL PROC
PUBLIC _sk_from_srgb_hsw
_sk_from_srgb_hsw LABEL PROC
- DB 196,98,125,24,5,29,51,0,0 ; vbroadcastss 0x331d(%rip),%ymm8 # 3f80 <_sk_callback_hsw+0x18f>
+ DB 196,98,125,24,5,29,51,0,0 ; vbroadcastss 0x331d(%rip),%ymm8 # 3f7c <_sk_callback_hsw+0x18f>
DB 196,65,124,89,200 ; vmulps %ymm8,%ymm0,%ymm9
DB 197,124,89,208 ; vmulps %ymm0,%ymm0,%ymm10
- DB 196,98,125,24,29,15,51,0,0 ; vbroadcastss 0x330f(%rip),%ymm11 # 3f84 <_sk_callback_hsw+0x193>
- DB 196,98,125,24,37,10,51,0,0 ; vbroadcastss 0x330a(%rip),%ymm12 # 3f88 <_sk_callback_hsw+0x197>
+ DB 196,98,125,24,29,15,51,0,0 ; vbroadcastss 0x330f(%rip),%ymm11 # 3f80 <_sk_callback_hsw+0x193>
+ DB 196,98,125,24,37,10,51,0,0 ; vbroadcastss 0x330a(%rip),%ymm12 # 3f84 <_sk_callback_hsw+0x197>
DB 196,65,124,40,236 ; vmovaps %ymm12,%ymm13
DB 196,66,125,168,235 ; vfmadd213ps %ymm11,%ymm0,%ymm13
- DB 196,98,125,24,53,251,50,0,0 ; vbroadcastss 0x32fb(%rip),%ymm14 # 3f8c <_sk_callback_hsw+0x19b>
+ DB 196,98,125,24,53,251,50,0,0 ; vbroadcastss 0x32fb(%rip),%ymm14 # 3f88 <_sk_callback_hsw+0x19b>
DB 196,66,45,168,238 ; vfmadd213ps %ymm14,%ymm10,%ymm13
- DB 196,98,125,24,21,241,50,0,0 ; vbroadcastss 0x32f1(%rip),%ymm10 # 3f90 <_sk_callback_hsw+0x19f>
+ DB 196,98,125,24,21,241,50,0,0 ; vbroadcastss 0x32f1(%rip),%ymm10 # 3f8c <_sk_callback_hsw+0x19f>
DB 196,193,124,194,194,1 ; vcmpltps %ymm10,%ymm0,%ymm0
DB 196,195,21,74,193,0 ; vblendvps %ymm0,%ymm9,%ymm13,%ymm0
DB 196,65,116,89,200 ; vmulps %ymm8,%ymm1,%ymm9
@@ -883,16 +882,16 @@ _sk_to_srgb_hsw LABEL PROC
DB 197,124,82,192 ; vrsqrtps %ymm0,%ymm8
DB 196,65,124,83,200 ; vrcpps %ymm8,%ymm9
DB 196,65,124,82,208 ; vrsqrtps %ymm8,%ymm10
- DB 196,98,125,24,5,139,50,0,0 ; vbroadcastss 0x328b(%rip),%ymm8 # 3f94 <_sk_callback_hsw+0x1a3>
+ DB 196,98,125,24,5,139,50,0,0 ; vbroadcastss 0x328b(%rip),%ymm8 # 3f90 <_sk_callback_hsw+0x1a3>
DB 196,65,124,89,216 ; vmulps %ymm8,%ymm0,%ymm11
- DB 196,98,125,24,37,129,50,0,0 ; vbroadcastss 0x3281(%rip),%ymm12 # 3f98 <_sk_callback_hsw+0x1a7>
- DB 196,98,125,24,45,124,50,0,0 ; vbroadcastss 0x327c(%rip),%ymm13 # 3f9c <_sk_callback_hsw+0x1ab>
+ DB 196,98,125,24,37,129,50,0,0 ; vbroadcastss 0x3281(%rip),%ymm12 # 3f94 <_sk_callback_hsw+0x1a7>
+ DB 196,98,125,24,45,124,50,0,0 ; vbroadcastss 0x327c(%rip),%ymm13 # 3f98 <_sk_callback_hsw+0x1ab>
DB 196,66,21,168,204 ; vfmadd213ps %ymm12,%ymm13,%ymm9
- DB 196,98,125,24,53,114,50,0,0 ; vbroadcastss 0x3272(%rip),%ymm14 # 3fa0 <_sk_callback_hsw+0x1af>
+ DB 196,98,125,24,53,114,50,0,0 ; vbroadcastss 0x3272(%rip),%ymm14 # 3f9c <_sk_callback_hsw+0x1af>
DB 196,66,13,184,202 ; vfmadd231ps %ymm10,%ymm14,%ymm9
- DB 196,98,125,24,21,104,50,0,0 ; vbroadcastss 0x3268(%rip),%ymm10 # 3fa4 <_sk_callback_hsw+0x1b3>
+ DB 196,98,125,24,21,104,50,0,0 ; vbroadcastss 0x3268(%rip),%ymm10 # 3fa0 <_sk_callback_hsw+0x1b3>
DB 196,65,44,93,201 ; vminps %ymm9,%ymm10,%ymm9
- DB 196,98,125,24,61,94,50,0,0 ; vbroadcastss 0x325e(%rip),%ymm15 # 3fa8 <_sk_callback_hsw+0x1b7>
+ DB 196,98,125,24,61,94,50,0,0 ; vbroadcastss 0x325e(%rip),%ymm15 # 3fa4 <_sk_callback_hsw+0x1b7>
DB 196,193,124,194,199,1 ; vcmpltps %ymm15,%ymm0,%ymm0
DB 196,195,53,74,195,0 ; vblendvps %ymm0,%ymm11,%ymm9,%ymm0
DB 197,124,82,201 ; vrsqrtps %ymm1,%ymm9
@@ -923,26 +922,26 @@ _sk_rgb_to_hsl_hsw LABEL PROC
DB 197,124,93,201 ; vminps %ymm1,%ymm0,%ymm9
DB 197,52,93,202 ; vminps %ymm2,%ymm9,%ymm9
DB 196,65,60,92,209 ; vsubps %ymm9,%ymm8,%ymm10
- DB 196,98,125,24,29,216,49,0,0 ; vbroadcastss 0x31d8(%rip),%ymm11 # 3fac <_sk_callback_hsw+0x1bb>
+ DB 196,98,125,24,29,216,49,0,0 ; vbroadcastss 0x31d8(%rip),%ymm11 # 3fa8 <_sk_callback_hsw+0x1bb>
DB 196,65,36,94,218 ; vdivps %ymm10,%ymm11,%ymm11
DB 197,116,92,226 ; vsubps %ymm2,%ymm1,%ymm12
DB 197,116,194,234,1 ; vcmpltps %ymm2,%ymm1,%ymm13
- DB 196,98,125,24,53,197,49,0,0 ; vbroadcastss 0x31c5(%rip),%ymm14 # 3fb0 <_sk_callback_hsw+0x1bf>
+ DB 196,98,125,24,53,197,49,0,0 ; vbroadcastss 0x31c5(%rip),%ymm14 # 3fac <_sk_callback_hsw+0x1bf>
DB 196,65,4,87,255 ; vxorps %ymm15,%ymm15,%ymm15
DB 196,67,5,74,238,208 ; vblendvps %ymm13,%ymm14,%ymm15,%ymm13
DB 196,66,37,168,229 ; vfmadd213ps %ymm13,%ymm11,%ymm12
DB 197,236,92,208 ; vsubps %ymm0,%ymm2,%ymm2
DB 197,124,92,233 ; vsubps %ymm1,%ymm0,%ymm13
- DB 196,98,125,24,53,172,49,0,0 ; vbroadcastss 0x31ac(%rip),%ymm14 # 3fb8 <_sk_callback_hsw+0x1c7>
+ DB 196,98,125,24,53,172,49,0,0 ; vbroadcastss 0x31ac(%rip),%ymm14 # 3fb4 <_sk_callback_hsw+0x1c7>
DB 196,66,37,168,238 ; vfmadd213ps %ymm14,%ymm11,%ymm13
- DB 196,98,125,24,53,154,49,0,0 ; vbroadcastss 0x319a(%rip),%ymm14 # 3fb4 <_sk_callback_hsw+0x1c3>
+ DB 196,98,125,24,53,154,49,0,0 ; vbroadcastss 0x319a(%rip),%ymm14 # 3fb0 <_sk_callback_hsw+0x1c3>
DB 196,194,37,168,214 ; vfmadd213ps %ymm14,%ymm11,%ymm2
DB 197,188,194,201,0 ; vcmpeqps %ymm1,%ymm8,%ymm1
DB 196,227,21,74,202,16 ; vblendvps %ymm1,%ymm2,%ymm13,%ymm1
DB 197,188,194,192,0 ; vcmpeqps %ymm0,%ymm8,%ymm0
DB 196,195,117,74,196,0 ; vblendvps %ymm0,%ymm12,%ymm1,%ymm0
DB 196,193,60,88,201 ; vaddps %ymm9,%ymm8,%ymm1
- DB 196,98,125,24,29,125,49,0,0 ; vbroadcastss 0x317d(%rip),%ymm11 # 3fc0 <_sk_callback_hsw+0x1cf>
+ DB 196,98,125,24,29,125,49,0,0 ; vbroadcastss 0x317d(%rip),%ymm11 # 3fbc <_sk_callback_hsw+0x1cf>
DB 196,193,116,89,211 ; vmulps %ymm11,%ymm1,%ymm2
DB 197,36,194,218,1 ; vcmpltps %ymm2,%ymm11,%ymm11
DB 196,65,12,92,224 ; vsubps %ymm8,%ymm14,%ymm12
@@ -952,7 +951,7 @@ _sk_rgb_to_hsl_hsw LABEL PROC
DB 197,172,94,201 ; vdivps %ymm1,%ymm10,%ymm1
DB 196,195,125,74,199,128 ; vblendvps %ymm8,%ymm15,%ymm0,%ymm0
DB 196,195,117,74,207,128 ; vblendvps %ymm8,%ymm15,%ymm1,%ymm1
- DB 196,98,125,24,5,64,49,0,0 ; vbroadcastss 0x3140(%rip),%ymm8 # 3fbc <_sk_callback_hsw+0x1cb>
+ DB 196,98,125,24,5,64,49,0,0 ; vbroadcastss 0x3140(%rip),%ymm8 # 3fb8 <_sk_callback_hsw+0x1cb>
DB 196,193,124,89,192 ; vmulps %ymm8,%ymm0,%ymm0
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
@@ -967,30 +966,30 @@ _sk_hsl_to_rgb_hsw LABEL PROC
DB 197,252,17,28,36 ; vmovups %ymm3,(%rsp)
DB 197,252,40,233 ; vmovaps %ymm1,%ymm5
DB 197,252,40,224 ; vmovaps %ymm0,%ymm4
- DB 196,98,125,24,5,7,49,0,0 ; vbroadcastss 0x3107(%rip),%ymm8 # 3fc4 <_sk_callback_hsw+0x1d3>
+ DB 196,98,125,24,5,7,49,0,0 ; vbroadcastss 0x3107(%rip),%ymm8 # 3fc0 <_sk_callback_hsw+0x1d3>
DB 197,60,194,202,2 ; vcmpleps %ymm2,%ymm8,%ymm9
DB 197,84,89,210 ; vmulps %ymm2,%ymm5,%ymm10
DB 196,65,84,92,218 ; vsubps %ymm10,%ymm5,%ymm11
DB 196,67,45,74,203,144 ; vblendvps %ymm9,%ymm11,%ymm10,%ymm9
DB 197,52,88,210 ; vaddps %ymm2,%ymm9,%ymm10
- DB 196,98,125,24,13,234,48,0,0 ; vbroadcastss 0x30ea(%rip),%ymm9 # 3fc8 <_sk_callback_hsw+0x1d7>
+ DB 196,98,125,24,13,234,48,0,0 ; vbroadcastss 0x30ea(%rip),%ymm9 # 3fc4 <_sk_callback_hsw+0x1d7>
DB 196,66,109,170,202 ; vfmsub213ps %ymm10,%ymm2,%ymm9
- DB 196,98,125,24,29,224,48,0,0 ; vbroadcastss 0x30e0(%rip),%ymm11 # 3fcc <_sk_callback_hsw+0x1db>
+ DB 196,98,125,24,29,224,48,0,0 ; vbroadcastss 0x30e0(%rip),%ymm11 # 3fc8 <_sk_callback_hsw+0x1db>
DB 196,65,92,88,219 ; vaddps %ymm11,%ymm4,%ymm11
DB 196,67,125,8,227,1 ; vroundps $0x1,%ymm11,%ymm12
DB 196,65,36,92,252 ; vsubps %ymm12,%ymm11,%ymm15
DB 196,65,44,92,217 ; vsubps %ymm9,%ymm10,%ymm11
- DB 196,98,125,24,45,202,48,0,0 ; vbroadcastss 0x30ca(%rip),%ymm13 # 3fd4 <_sk_callback_hsw+0x1e3>
+ DB 196,98,125,24,45,202,48,0,0 ; vbroadcastss 0x30ca(%rip),%ymm13 # 3fd0 <_sk_callback_hsw+0x1e3>
DB 196,193,4,89,197 ; vmulps %ymm13,%ymm15,%ymm0
- DB 196,98,125,24,53,192,48,0,0 ; vbroadcastss 0x30c0(%rip),%ymm14 # 3fd8 <_sk_callback_hsw+0x1e7>
+ DB 196,98,125,24,53,192,48,0,0 ; vbroadcastss 0x30c0(%rip),%ymm14 # 3fd4 <_sk_callback_hsw+0x1e7>
DB 197,12,92,224 ; vsubps %ymm0,%ymm14,%ymm12
DB 196,66,37,168,225 ; vfmadd213ps %ymm9,%ymm11,%ymm12
- DB 196,226,125,24,29,166,48,0,0 ; vbroadcastss 0x30a6(%rip),%ymm3 # 3fd0 <_sk_callback_hsw+0x1df>
+ DB 196,226,125,24,29,166,48,0,0 ; vbroadcastss 0x30a6(%rip),%ymm3 # 3fcc <_sk_callback_hsw+0x1df>
DB 196,193,100,194,255,2 ; vcmpleps %ymm15,%ymm3,%ymm7
DB 196,195,29,74,249,112 ; vblendvps %ymm7,%ymm9,%ymm12,%ymm7
DB 196,65,60,194,231,2 ; vcmpleps %ymm15,%ymm8,%ymm12
DB 196,227,45,74,255,192 ; vblendvps %ymm12,%ymm7,%ymm10,%ymm7
- DB 196,98,125,24,37,145,48,0,0 ; vbroadcastss 0x3091(%rip),%ymm12 # 3fdc <_sk_callback_hsw+0x1eb>
+ DB 196,98,125,24,37,145,48,0,0 ; vbroadcastss 0x3091(%rip),%ymm12 # 3fd8 <_sk_callback_hsw+0x1eb>
DB 196,65,28,194,255,2 ; vcmpleps %ymm15,%ymm12,%ymm15
DB 196,194,37,168,193 ; vfmadd213ps %ymm9,%ymm11,%ymm0
DB 196,99,125,74,255,240 ; vblendvps %ymm15,%ymm7,%ymm0,%ymm15
@@ -1006,7 +1005,7 @@ _sk_hsl_to_rgb_hsw LABEL PROC
DB 197,156,194,192,2 ; vcmpleps %ymm0,%ymm12,%ymm0
DB 196,194,37,168,249 ; vfmadd213ps %ymm9,%ymm11,%ymm7
DB 196,227,69,74,201,0 ; vblendvps %ymm0,%ymm1,%ymm7,%ymm1
- DB 196,226,125,24,5,61,48,0,0 ; vbroadcastss 0x303d(%rip),%ymm0 # 3fe0 <_sk_callback_hsw+0x1ef>
+ DB 196,226,125,24,5,61,48,0,0 ; vbroadcastss 0x303d(%rip),%ymm0 # 3fdc <_sk_callback_hsw+0x1ef>
DB 197,220,88,192 ; vaddps %ymm0,%ymm4,%ymm0
DB 196,227,125,8,224,1 ; vroundps $0x1,%ymm0,%ymm4
DB 197,252,92,196 ; vsubps %ymm4,%ymm0,%ymm0
@@ -1052,11 +1051,11 @@ _sk_scale_u8_hsw LABEL PROC
DB 72,139,0 ; mov (%rax),%rax
DB 72,1,248 ; add %rdi,%rax
DB 77,133,192 ; test %r8,%r8
- DB 117,51 ; jne 1089 <_sk_scale_u8_hsw+0x43>
+ DB 117,51 ; jne 1085 <_sk_scale_u8_hsw+0x43>
DB 197,122,126,0 ; vmovq (%rax),%xmm8
DB 196,66,125,49,192 ; vpmovzxbd %xmm8,%ymm8
DB 196,65,124,91,192 ; vcvtdq2ps %ymm8,%ymm8
- DB 196,98,125,24,13,119,47,0,0 ; vbroadcastss 0x2f77(%rip),%ymm9 # 3fe4 <_sk_callback_hsw+0x1f3>
+ DB 196,98,125,24,13,119,47,0,0 ; vbroadcastss 0x2f77(%rip),%ymm9 # 3fe0 <_sk_callback_hsw+0x1f3>
DB 196,65,60,89,193 ; vmulps %ymm9,%ymm8,%ymm8
DB 197,188,89,192 ; vmulps %ymm0,%ymm8,%ymm0
DB 197,188,89,201 ; vmulps %ymm1,%ymm8,%ymm1
@@ -1074,9 +1073,9 @@ _sk_scale_u8_hsw LABEL PROC
DB 77,9,217 ; or %r11,%r9
DB 72,131,193,8 ; add $0x8,%rcx
DB 73,255,202 ; dec %r10
- DB 117,234 ; jne 1091 <_sk_scale_u8_hsw+0x4b>
+ DB 117,234 ; jne 108d <_sk_scale_u8_hsw+0x4b>
DB 196,65,249,110,193 ; vmovq %r9,%xmm8
- DB 235,172 ; jmp 105a <_sk_scale_u8_hsw+0x14>
+ DB 235,172 ; jmp 1056 <_sk_scale_u8_hsw+0x14>
PUBLIC _sk_lerp_1_float_hsw
_sk_lerp_1_float_hsw LABEL PROC
@@ -1100,11 +1099,11 @@ _sk_lerp_u8_hsw LABEL PROC
DB 72,139,0 ; mov (%rax),%rax
DB 72,1,248 ; add %rdi,%rax
DB 77,133,192 ; test %r8,%r8
- DB 117,71 ; jne 1134 <_sk_lerp_u8_hsw+0x57>
+ DB 117,71 ; jne 1130 <_sk_lerp_u8_hsw+0x57>
DB 197,122,126,0 ; vmovq (%rax),%xmm8
DB 196,66,125,49,192 ; vpmovzxbd %xmm8,%ymm8
DB 196,65,124,91,192 ; vcvtdq2ps %ymm8,%ymm8
- DB 196,98,125,24,13,228,46,0,0 ; vbroadcastss 0x2ee4(%rip),%ymm9 # 3fe8 <_sk_callback_hsw+0x1f7>
+ DB 196,98,125,24,13,228,46,0,0 ; vbroadcastss 0x2ee4(%rip),%ymm9 # 3fe4 <_sk_callback_hsw+0x1f7>
DB 196,65,60,89,193 ; vmulps %ymm9,%ymm8,%ymm8
DB 197,252,92,196 ; vsubps %ymm4,%ymm0,%ymm0
DB 196,226,61,168,196 ; vfmadd213ps %ymm4,%ymm8,%ymm0
@@ -1126,32 +1125,32 @@ _sk_lerp_u8_hsw LABEL PROC
DB 77,9,217 ; or %r11,%r9
DB 72,131,193,8 ; add $0x8,%rcx
DB 73,255,202 ; dec %r10
- DB 117,234 ; jne 113c <_sk_lerp_u8_hsw+0x5f>
+ DB 117,234 ; jne 1138 <_sk_lerp_u8_hsw+0x5f>
DB 196,65,249,110,193 ; vmovq %r9,%xmm8
- DB 235,152 ; jmp 10f1 <_sk_lerp_u8_hsw+0x14>
+ DB 235,152 ; jmp 10ed <_sk_lerp_u8_hsw+0x14>
PUBLIC _sk_lerp_565_hsw
_sk_lerp_565_hsw LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 76,139,16 ; mov (%rax),%r10
DB 72,133,201 ; test %rcx,%rcx
- DB 15,133,149,0,0,0 ; jne 11fc <_sk_lerp_565_hsw+0xa3>
+ DB 15,133,149,0,0,0 ; jne 11f8 <_sk_lerp_565_hsw+0xa3>
DB 196,193,122,111,28,122 ; vmovdqu (%r10,%rdi,2),%xmm3
DB 196,226,125,51,219 ; vpmovzxwd %xmm3,%ymm3
- DB 196,98,125,88,5,113,46,0,0 ; vpbroadcastd 0x2e71(%rip),%ymm8 # 3fec <_sk_callback_hsw+0x1fb>
+ DB 196,98,125,88,5,113,46,0,0 ; vpbroadcastd 0x2e71(%rip),%ymm8 # 3fe8 <_sk_callback_hsw+0x1fb>
DB 196,65,101,219,192 ; vpand %ymm8,%ymm3,%ymm8
DB 196,65,124,91,192 ; vcvtdq2ps %ymm8,%ymm8
- DB 196,98,125,24,13,98,46,0,0 ; vbroadcastss 0x2e62(%rip),%ymm9 # 3ff0 <_sk_callback_hsw+0x1ff>
+ DB 196,98,125,24,13,98,46,0,0 ; vbroadcastss 0x2e62(%rip),%ymm9 # 3fec <_sk_callback_hsw+0x1ff>
DB 196,65,60,89,193 ; vmulps %ymm9,%ymm8,%ymm8
- DB 196,98,125,88,13,88,46,0,0 ; vpbroadcastd 0x2e58(%rip),%ymm9 # 3ff4 <_sk_callback_hsw+0x203>
+ DB 196,98,125,88,13,88,46,0,0 ; vpbroadcastd 0x2e58(%rip),%ymm9 # 3ff0 <_sk_callback_hsw+0x203>
DB 196,65,101,219,201 ; vpand %ymm9,%ymm3,%ymm9
DB 196,65,124,91,201 ; vcvtdq2ps %ymm9,%ymm9
- DB 196,98,125,24,21,73,46,0,0 ; vbroadcastss 0x2e49(%rip),%ymm10 # 3ff8 <_sk_callback_hsw+0x207>
+ DB 196,98,125,24,21,73,46,0,0 ; vbroadcastss 0x2e49(%rip),%ymm10 # 3ff4 <_sk_callback_hsw+0x207>
DB 196,65,52,89,202 ; vmulps %ymm10,%ymm9,%ymm9
- DB 196,98,125,88,21,63,46,0,0 ; vpbroadcastd 0x2e3f(%rip),%ymm10 # 3ffc <_sk_callback_hsw+0x20b>
+ DB 196,98,125,88,21,63,46,0,0 ; vpbroadcastd 0x2e3f(%rip),%ymm10 # 3ff8 <_sk_callback_hsw+0x20b>
DB 196,193,101,219,218 ; vpand %ymm10,%ymm3,%ymm3
DB 197,252,91,219 ; vcvtdq2ps %ymm3,%ymm3
- DB 196,98,125,24,21,49,46,0,0 ; vbroadcastss 0x2e31(%rip),%ymm10 # 4000 <_sk_callback_hsw+0x20f>
+ DB 196,98,125,24,21,49,46,0,0 ; vbroadcastss 0x2e31(%rip),%ymm10 # 3ffc <_sk_callback_hsw+0x20f>
DB 196,193,100,89,218 ; vmulps %ymm10,%ymm3,%ymm3
DB 197,252,92,196 ; vsubps %ymm4,%ymm0,%ymm0
DB 196,226,61,168,196 ; vfmadd213ps %ymm4,%ymm8,%ymm0
@@ -1160,16 +1159,16 @@ _sk_lerp_565_hsw LABEL PROC
DB 197,236,92,214 ; vsubps %ymm6,%ymm2,%ymm2
DB 196,226,101,168,214 ; vfmadd213ps %ymm6,%ymm3,%ymm2
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,29,10,46,0,0 ; vbroadcastss 0x2e0a(%rip),%ymm3 # 4004 <_sk_callback_hsw+0x213>
+ DB 196,226,125,24,29,10,46,0,0 ; vbroadcastss 0x2e0a(%rip),%ymm3 # 4000 <_sk_callback_hsw+0x213>
DB 255,224 ; jmpq *%rax
DB 65,137,200 ; mov %ecx,%r8d
DB 65,128,224,7 ; and $0x7,%r8b
DB 197,225,239,219 ; vpxor %xmm3,%xmm3,%xmm3
DB 65,254,200 ; dec %r8b
DB 65,128,248,6 ; cmp $0x6,%r8b
- DB 15,135,89,255,255,255 ; ja 116d <_sk_lerp_565_hsw+0x14>
+ DB 15,135,89,255,255,255 ; ja 1169 <_sk_lerp_565_hsw+0x14>
DB 69,15,182,192 ; movzbl %r8b,%r8d
- DB 76,141,13,73,0,0,0 ; lea 0x49(%rip),%r9 # 1268 <_sk_lerp_565_hsw+0x10f>
+ DB 76,141,13,73,0,0,0 ; lea 0x49(%rip),%r9 # 1264 <_sk_lerp_565_hsw+0x10f>
DB 75,99,4,129 ; movslq (%r9,%r8,4),%rax
DB 76,1,200 ; add %r9,%rax
DB 255,224 ; jmpq *%rax
@@ -1181,7 +1180,7 @@ _sk_lerp_565_hsw LABEL PROC
DB 196,193,97,196,92,122,4,2 ; vpinsrw $0x2,0x4(%r10,%rdi,2),%xmm3,%xmm3
DB 196,193,97,196,92,122,2,1 ; vpinsrw $0x1,0x2(%r10,%rdi,2),%xmm3,%xmm3
DB 196,193,97,196,28,122,0 ; vpinsrw $0x0,(%r10,%rdi,2),%xmm3,%xmm3
- DB 233,5,255,255,255 ; jmpq 116d <_sk_lerp_565_hsw+0x14>
+ DB 233,5,255,255,255 ; jmpq 1169 <_sk_lerp_565_hsw+0x14>
DB 244 ; hlt
DB 255 ; (bad)
DB 255 ; (bad)
@@ -1213,23 +1212,23 @@ _sk_load_tables_hsw LABEL PROC
DB 76,141,12,189,0,0,0,0 ; lea 0x0(,%rdi,4),%r9
DB 76,3,8 ; add (%rax),%r9
DB 77,133,192 ; test %r8,%r8
- DB 117,105 ; jne 1302 <_sk_load_tables_hsw+0x7e>
+ DB 117,105 ; jne 12fe <_sk_load_tables_hsw+0x7e>
DB 196,193,126,111,25 ; vmovdqu (%r9),%ymm3
- DB 197,229,219,13,26,48,0,0 ; vpand 0x301a(%rip),%ymm3,%ymm1 # 42c0 <_sk_callback_hsw+0x4cf>
+ DB 197,229,219,13,30,48,0,0 ; vpand 0x301e(%rip),%ymm3,%ymm1 # 42c0 <_sk_callback_hsw+0x4d3>
DB 196,65,61,118,192 ; vpcmpeqd %ymm8,%ymm8,%ymm8
DB 72,139,72,8 ; mov 0x8(%rax),%rcx
DB 76,139,72,16 ; mov 0x10(%rax),%r9
DB 197,237,118,210 ; vpcmpeqd %ymm2,%ymm2,%ymm2
DB 196,226,109,146,4,137 ; vgatherdps %ymm2,(%rcx,%ymm1,4),%ymm0
- DB 196,226,101,0,21,26,48,0,0 ; vpshufb 0x301a(%rip),%ymm3,%ymm2 # 42e0 <_sk_callback_hsw+0x4ef>
+ DB 196,226,101,0,21,30,48,0,0 ; vpshufb 0x301e(%rip),%ymm3,%ymm2 # 42e0 <_sk_callback_hsw+0x4f3>
DB 196,65,53,118,201 ; vpcmpeqd %ymm9,%ymm9,%ymm9
DB 196,194,53,146,12,145 ; vgatherdps %ymm9,(%r9,%ymm2,4),%ymm1
DB 72,139,64,24 ; mov 0x18(%rax),%rax
- DB 196,98,101,0,13,34,48,0,0 ; vpshufb 0x3022(%rip),%ymm3,%ymm9 # 4300 <_sk_callback_hsw+0x50f>
+ DB 196,98,101,0,13,38,48,0,0 ; vpshufb 0x3026(%rip),%ymm3,%ymm9 # 4300 <_sk_callback_hsw+0x513>
DB 196,162,61,146,20,136 ; vgatherdps %ymm8,(%rax,%ymm9,4),%ymm2
DB 197,229,114,211,24 ; vpsrld $0x18,%ymm3,%ymm3
DB 197,252,91,219 ; vcvtdq2ps %ymm3,%ymm3
- DB 196,98,125,24,5,18,45,0,0 ; vbroadcastss 0x2d12(%rip),%ymm8 # 4008 <_sk_callback_hsw+0x217>
+ DB 196,98,125,24,5,18,45,0,0 ; vbroadcastss 0x2d12(%rip),%ymm8 # 4004 <_sk_callback_hsw+0x217>
DB 196,193,100,89,216 ; vmulps %ymm8,%ymm3,%ymm3
DB 72,173 ; lods %ds:(%rsi),%rax
DB 76,137,193 ; mov %r8,%rcx
@@ -1242,7 +1241,7 @@ _sk_load_tables_hsw LABEL PROC
DB 196,193,249,110,194 ; vmovq %r10,%xmm0
DB 196,226,125,33,192 ; vpmovsxbd %xmm0,%ymm0
DB 196,194,125,140,25 ; vpmaskmovd (%r9),%ymm0,%ymm3
- DB 233,115,255,255,255 ; jmpq 129e <_sk_load_tables_hsw+0x1a>
+ DB 233,115,255,255,255 ; jmpq 129a <_sk_load_tables_hsw+0x1a>
PUBLIC _sk_load_tables_u16_be_hsw
_sk_load_tables_u16_be_hsw LABEL PROC
@@ -1250,7 +1249,7 @@ _sk_load_tables_u16_be_hsw LABEL PROC
DB 76,139,0 ; mov (%rax),%r8
DB 76,141,12,189,0,0,0,0 ; lea 0x0(,%rdi,4),%r9
DB 72,133,201 ; test %rcx,%rcx
- DB 15,133,201,0,0,0 ; jne 140a <_sk_load_tables_u16_be_hsw+0xdf>
+ DB 15,133,201,0,0,0 ; jne 1406 <_sk_load_tables_u16_be_hsw+0xdf>
DB 196,1,121,16,4,72 ; vmovupd (%r8,%r9,2),%xmm8
DB 196,129,121,16,84,72,16 ; vmovupd 0x10(%r8,%r9,2),%xmm2
DB 196,129,121,16,92,72,32 ; vmovupd 0x20(%r8,%r9,2),%xmm3
@@ -1266,7 +1265,7 @@ _sk_load_tables_u16_be_hsw LABEL PROC
DB 197,185,108,200 ; vpunpcklqdq %xmm0,%xmm8,%xmm1
DB 197,185,109,208 ; vpunpckhqdq %xmm0,%xmm8,%xmm2
DB 197,49,108,195 ; vpunpcklqdq %xmm3,%xmm9,%xmm8
- DB 197,121,111,21,174,48,0,0 ; vmovdqa 0x30ae(%rip),%xmm10 # 4440 <_sk_callback_hsw+0x64f>
+ DB 197,121,111,21,178,48,0,0 ; vmovdqa 0x30b2(%rip),%xmm10 # 4440 <_sk_callback_hsw+0x653>
DB 196,193,113,219,194 ; vpand %xmm10,%xmm1,%xmm0
DB 196,226,125,51,200 ; vpmovzxwd %xmm0,%ymm1
DB 196,65,37,118,219 ; vpcmpeqd %ymm11,%ymm11,%ymm11
@@ -1288,36 +1287,36 @@ _sk_load_tables_u16_be_hsw LABEL PROC
DB 197,185,235,219 ; vpor %xmm3,%xmm8,%xmm3
DB 196,226,125,51,219 ; vpmovzxwd %xmm3,%ymm3
DB 197,252,91,219 ; vcvtdq2ps %ymm3,%ymm3
- DB 196,98,125,24,5,11,44,0,0 ; vbroadcastss 0x2c0b(%rip),%ymm8 # 400c <_sk_callback_hsw+0x21b>
+ DB 196,98,125,24,5,11,44,0,0 ; vbroadcastss 0x2c0b(%rip),%ymm8 # 4008 <_sk_callback_hsw+0x21b>
DB 196,193,100,89,216 ; vmulps %ymm8,%ymm3,%ymm3
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
DB 196,1,123,16,4,72 ; vmovsd (%r8,%r9,2),%xmm8
DB 196,65,49,239,201 ; vpxor %xmm9,%xmm9,%xmm9
DB 72,131,249,1 ; cmp $0x1,%rcx
- DB 116,85 ; je 1470 <_sk_load_tables_u16_be_hsw+0x145>
+ DB 116,85 ; je 146c <_sk_load_tables_u16_be_hsw+0x145>
DB 196,1,57,22,68,72,8 ; vmovhpd 0x8(%r8,%r9,2),%xmm8,%xmm8
DB 72,131,249,3 ; cmp $0x3,%rcx
- DB 114,72 ; jb 1470 <_sk_load_tables_u16_be_hsw+0x145>
+ DB 114,72 ; jb 146c <_sk_load_tables_u16_be_hsw+0x145>
DB 196,129,123,16,84,72,16 ; vmovsd 0x10(%r8,%r9,2),%xmm2
DB 72,131,249,3 ; cmp $0x3,%rcx
- DB 116,72 ; je 147d <_sk_load_tables_u16_be_hsw+0x152>
+ DB 116,72 ; je 1479 <_sk_load_tables_u16_be_hsw+0x152>
DB 196,129,105,22,84,72,24 ; vmovhpd 0x18(%r8,%r9,2),%xmm2,%xmm2
DB 72,131,249,5 ; cmp $0x5,%rcx
- DB 114,59 ; jb 147d <_sk_load_tables_u16_be_hsw+0x152>
+ DB 114,59 ; jb 1479 <_sk_load_tables_u16_be_hsw+0x152>
DB 196,129,123,16,92,72,32 ; vmovsd 0x20(%r8,%r9,2),%xmm3
DB 72,131,249,5 ; cmp $0x5,%rcx
- DB 15,132,9,255,255,255 ; je 135c <_sk_load_tables_u16_be_hsw+0x31>
+ DB 15,132,9,255,255,255 ; je 1358 <_sk_load_tables_u16_be_hsw+0x31>
DB 196,129,97,22,92,72,40 ; vmovhpd 0x28(%r8,%r9,2),%xmm3,%xmm3
DB 72,131,249,7 ; cmp $0x7,%rcx
- DB 15,130,248,254,255,255 ; jb 135c <_sk_load_tables_u16_be_hsw+0x31>
+ DB 15,130,248,254,255,255 ; jb 1358 <_sk_load_tables_u16_be_hsw+0x31>
DB 196,1,122,126,76,72,48 ; vmovq 0x30(%r8,%r9,2),%xmm9
- DB 233,236,254,255,255 ; jmpq 135c <_sk_load_tables_u16_be_hsw+0x31>
+ DB 233,236,254,255,255 ; jmpq 1358 <_sk_load_tables_u16_be_hsw+0x31>
DB 197,225,87,219 ; vxorpd %xmm3,%xmm3,%xmm3
DB 197,233,87,210 ; vxorpd %xmm2,%xmm2,%xmm2
- DB 233,223,254,255,255 ; jmpq 135c <_sk_load_tables_u16_be_hsw+0x31>
+ DB 233,223,254,255,255 ; jmpq 1358 <_sk_load_tables_u16_be_hsw+0x31>
DB 197,225,87,219 ; vxorpd %xmm3,%xmm3,%xmm3
- DB 233,214,254,255,255 ; jmpq 135c <_sk_load_tables_u16_be_hsw+0x31>
+ DB 233,214,254,255,255 ; jmpq 1358 <_sk_load_tables_u16_be_hsw+0x31>
PUBLIC _sk_load_tables_rgb_u16_be_hsw
_sk_load_tables_rgb_u16_be_hsw LABEL PROC
@@ -1325,7 +1324,7 @@ _sk_load_tables_rgb_u16_be_hsw LABEL PROC
DB 76,139,0 ; mov (%rax),%r8
DB 76,141,12,127 ; lea (%rdi,%rdi,2),%r9
DB 72,133,201 ; test %rcx,%rcx
- DB 15,133,193,0,0,0 ; jne 1559 <_sk_load_tables_rgb_u16_be_hsw+0xd3>
+ DB 15,133,193,0,0,0 ; jne 1555 <_sk_load_tables_rgb_u16_be_hsw+0xd3>
DB 196,129,122,111,4,72 ; vmovdqu (%r8,%r9,2),%xmm0
DB 196,129,122,111,84,72,12 ; vmovdqu 0xc(%r8,%r9,2),%xmm2
DB 196,129,122,111,76,72,24 ; vmovdqu 0x18(%r8,%r9,2),%xmm1
@@ -1346,7 +1345,7 @@ _sk_load_tables_rgb_u16_be_hsw LABEL PROC
DB 197,185,108,218 ; vpunpcklqdq %xmm2,%xmm8,%xmm3
DB 197,185,109,210 ; vpunpckhqdq %xmm2,%xmm8,%xmm2
DB 197,121,108,193 ; vpunpcklqdq %xmm1,%xmm0,%xmm8
- DB 197,121,111,13,78,47,0,0 ; vmovdqa 0x2f4e(%rip),%xmm9 # 4450 <_sk_callback_hsw+0x65f>
+ DB 197,121,111,13,82,47,0,0 ; vmovdqa 0x2f52(%rip),%xmm9 # 4450 <_sk_callback_hsw+0x663>
DB 196,193,97,219,193 ; vpand %xmm9,%xmm3,%xmm0
DB 196,226,125,51,200 ; vpmovzxwd %xmm0,%ymm1
DB 197,229,118,219 ; vpcmpeqd %ymm3,%ymm3,%ymm3
@@ -1363,41 +1362,41 @@ _sk_load_tables_rgb_u16_be_hsw LABEL PROC
DB 196,98,125,51,194 ; vpmovzxwd %xmm2,%ymm8
DB 196,162,101,146,20,128 ; vgatherdps %ymm3,(%rax,%ymm8,4),%ymm2
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,29,185,42,0,0 ; vbroadcastss 0x2ab9(%rip),%ymm3 # 4010 <_sk_callback_hsw+0x21f>
+ DB 196,226,125,24,29,185,42,0,0 ; vbroadcastss 0x2ab9(%rip),%ymm3 # 400c <_sk_callback_hsw+0x21f>
DB 255,224 ; jmpq *%rax
DB 196,129,121,110,4,72 ; vmovd (%r8,%r9,2),%xmm0
DB 196,129,121,196,68,72,4,2 ; vpinsrw $0x2,0x4(%r8,%r9,2),%xmm0,%xmm0
DB 72,131,249,1 ; cmp $0x1,%rcx
- DB 117,5 ; jne 1572 <_sk_load_tables_rgb_u16_be_hsw+0xec>
- DB 233,90,255,255,255 ; jmpq 14cc <_sk_load_tables_rgb_u16_be_hsw+0x46>
+ DB 117,5 ; jne 156e <_sk_load_tables_rgb_u16_be_hsw+0xec>
+ DB 233,90,255,255,255 ; jmpq 14c8 <_sk_load_tables_rgb_u16_be_hsw+0x46>
DB 196,129,121,110,76,72,6 ; vmovd 0x6(%r8,%r9,2),%xmm1
DB 196,1,113,196,68,72,10,2 ; vpinsrw $0x2,0xa(%r8,%r9,2),%xmm1,%xmm8
DB 72,131,249,3 ; cmp $0x3,%rcx
- DB 114,26 ; jb 15a1 <_sk_load_tables_rgb_u16_be_hsw+0x11b>
+ DB 114,26 ; jb 159d <_sk_load_tables_rgb_u16_be_hsw+0x11b>
DB 196,129,121,110,76,72,12 ; vmovd 0xc(%r8,%r9,2),%xmm1
DB 196,129,113,196,84,72,16,2 ; vpinsrw $0x2,0x10(%r8,%r9,2),%xmm1,%xmm2
DB 72,131,249,3 ; cmp $0x3,%rcx
- DB 117,10 ; jne 15a6 <_sk_load_tables_rgb_u16_be_hsw+0x120>
- DB 233,43,255,255,255 ; jmpq 14cc <_sk_load_tables_rgb_u16_be_hsw+0x46>
- DB 233,38,255,255,255 ; jmpq 14cc <_sk_load_tables_rgb_u16_be_hsw+0x46>
+ DB 117,10 ; jne 15a2 <_sk_load_tables_rgb_u16_be_hsw+0x120>
+ DB 233,43,255,255,255 ; jmpq 14c8 <_sk_load_tables_rgb_u16_be_hsw+0x46>
+ DB 233,38,255,255,255 ; jmpq 14c8 <_sk_load_tables_rgb_u16_be_hsw+0x46>
DB 196,129,121,110,76,72,18 ; vmovd 0x12(%r8,%r9,2),%xmm1
DB 196,1,113,196,76,72,22,2 ; vpinsrw $0x2,0x16(%r8,%r9,2),%xmm1,%xmm9
DB 72,131,249,5 ; cmp $0x5,%rcx
- DB 114,26 ; jb 15d5 <_sk_load_tables_rgb_u16_be_hsw+0x14f>
+ DB 114,26 ; jb 15d1 <_sk_load_tables_rgb_u16_be_hsw+0x14f>
DB 196,129,121,110,76,72,24 ; vmovd 0x18(%r8,%r9,2),%xmm1
DB 196,129,113,196,76,72,28,2 ; vpinsrw $0x2,0x1c(%r8,%r9,2),%xmm1,%xmm1
DB 72,131,249,5 ; cmp $0x5,%rcx
- DB 117,10 ; jne 15da <_sk_load_tables_rgb_u16_be_hsw+0x154>
- DB 233,247,254,255,255 ; jmpq 14cc <_sk_load_tables_rgb_u16_be_hsw+0x46>
- DB 233,242,254,255,255 ; jmpq 14cc <_sk_load_tables_rgb_u16_be_hsw+0x46>
+ DB 117,10 ; jne 15d6 <_sk_load_tables_rgb_u16_be_hsw+0x154>
+ DB 233,247,254,255,255 ; jmpq 14c8 <_sk_load_tables_rgb_u16_be_hsw+0x46>
+ DB 233,242,254,255,255 ; jmpq 14c8 <_sk_load_tables_rgb_u16_be_hsw+0x46>
DB 196,129,121,110,92,72,30 ; vmovd 0x1e(%r8,%r9,2),%xmm3
DB 196,1,97,196,92,72,34,2 ; vpinsrw $0x2,0x22(%r8,%r9,2),%xmm3,%xmm11
DB 72,131,249,7 ; cmp $0x7,%rcx
- DB 114,20 ; jb 1603 <_sk_load_tables_rgb_u16_be_hsw+0x17d>
+ DB 114,20 ; jb 15ff <_sk_load_tables_rgb_u16_be_hsw+0x17d>
DB 196,129,121,110,92,72,36 ; vmovd 0x24(%r8,%r9,2),%xmm3
DB 196,129,97,196,92,72,40,2 ; vpinsrw $0x2,0x28(%r8,%r9,2),%xmm3,%xmm3
- DB 233,201,254,255,255 ; jmpq 14cc <_sk_load_tables_rgb_u16_be_hsw+0x46>
- DB 233,196,254,255,255 ; jmpq 14cc <_sk_load_tables_rgb_u16_be_hsw+0x46>
+ DB 233,201,254,255,255 ; jmpq 14c8 <_sk_load_tables_rgb_u16_be_hsw+0x46>
+ DB 233,196,254,255,255 ; jmpq 14c8 <_sk_load_tables_rgb_u16_be_hsw+0x46>
PUBLIC _sk_byte_tables_hsw
_sk_byte_tables_hsw LABEL PROC
@@ -1408,7 +1407,7 @@ _sk_byte_tables_hsw LABEL PROC
DB 65,84 ; push %r12
DB 83 ; push %rbx
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,98,125,24,5,247,41,0,0 ; vbroadcastss 0x29f7(%rip),%ymm8 # 4014 <_sk_callback_hsw+0x223>
+ DB 196,98,125,24,5,247,41,0,0 ; vbroadcastss 0x29f7(%rip),%ymm8 # 4010 <_sk_callback_hsw+0x223>
DB 196,193,124,89,192 ; vmulps %ymm8,%ymm0,%ymm0
DB 197,253,91,192 ; vcvtps2dq %ymm0,%ymm0
DB 196,195,249,22,192,1 ; vpextrq $0x1,%xmm0,%r8
@@ -1445,7 +1444,7 @@ _sk_byte_tables_hsw LABEL PROC
DB 196,227,121,32,197,7 ; vpinsrb $0x7,%ebp,%xmm0,%xmm0
DB 196,226,125,49,192 ; vpmovzxbd %xmm0,%ymm0
DB 197,252,91,192 ; vcvtdq2ps %ymm0,%ymm0
- DB 196,98,125,24,13,72,41,0,0 ; vbroadcastss 0x2948(%rip),%ymm9 # 4018 <_sk_callback_hsw+0x227>
+ DB 196,98,125,24,13,72,41,0,0 ; vbroadcastss 0x2948(%rip),%ymm9 # 4014 <_sk_callback_hsw+0x227>
DB 196,193,124,89,193 ; vmulps %ymm9,%ymm0,%ymm0
DB 196,193,116,89,200 ; vmulps %ymm8,%ymm1,%ymm1
DB 197,253,91,201 ; vcvtps2dq %ymm1,%ymm1
@@ -1604,7 +1603,7 @@ _sk_byte_tables_rgb_hsw LABEL PROC
DB 196,227,121,32,197,7 ; vpinsrb $0x7,%ebp,%xmm0,%xmm0
DB 196,226,125,49,192 ; vpmovzxbd %xmm0,%ymm0
DB 197,252,91,192 ; vcvtdq2ps %ymm0,%ymm0
- DB 196,98,125,24,13,129,38,0,0 ; vbroadcastss 0x2681(%rip),%ymm9 # 401c <_sk_callback_hsw+0x22b>
+ DB 196,98,125,24,13,129,38,0,0 ; vbroadcastss 0x2681(%rip),%ymm9 # 4018 <_sk_callback_hsw+0x22b>
DB 196,193,124,89,193 ; vmulps %ymm9,%ymm0,%ymm0
DB 197,188,89,201 ; vmulps %ymm1,%ymm8,%ymm1
DB 197,253,91,201 ; vcvtps2dq %ymm1,%ymm1
@@ -1757,33 +1756,33 @@ _sk_parametric_r_hsw LABEL PROC
DB 196,66,125,168,211 ; vfmadd213ps %ymm11,%ymm0,%ymm10
DB 196,226,125,24,0 ; vbroadcastss (%rax),%ymm0
DB 196,65,124,91,218 ; vcvtdq2ps %ymm10,%ymm11
- DB 196,98,125,24,37,52,36,0,0 ; vbroadcastss 0x2434(%rip),%ymm12 # 4020 <_sk_callback_hsw+0x22f>
- DB 196,98,125,24,45,47,36,0,0 ; vbroadcastss 0x242f(%rip),%ymm13 # 4024 <_sk_callback_hsw+0x233>
+ DB 196,98,125,24,37,52,36,0,0 ; vbroadcastss 0x2434(%rip),%ymm12 # 401c <_sk_callback_hsw+0x22f>
+ DB 196,98,125,24,45,47,36,0,0 ; vbroadcastss 0x242f(%rip),%ymm13 # 4020 <_sk_callback_hsw+0x233>
DB 196,65,44,84,213 ; vandps %ymm13,%ymm10,%ymm10
- DB 196,98,125,24,45,37,36,0,0 ; vbroadcastss 0x2425(%rip),%ymm13 # 4028 <_sk_callback_hsw+0x237>
+ DB 196,98,125,24,45,37,36,0,0 ; vbroadcastss 0x2425(%rip),%ymm13 # 4024 <_sk_callback_hsw+0x237>
DB 196,65,44,86,213 ; vorps %ymm13,%ymm10,%ymm10
- DB 196,98,125,24,45,27,36,0,0 ; vbroadcastss 0x241b(%rip),%ymm13 # 402c <_sk_callback_hsw+0x23b>
+ DB 196,98,125,24,45,27,36,0,0 ; vbroadcastss 0x241b(%rip),%ymm13 # 4028 <_sk_callback_hsw+0x23b>
DB 196,66,37,184,236 ; vfmadd231ps %ymm12,%ymm11,%ymm13
- DB 196,98,125,24,29,17,36,0,0 ; vbroadcastss 0x2411(%rip),%ymm11 # 4030 <_sk_callback_hsw+0x23f>
+ DB 196,98,125,24,29,17,36,0,0 ; vbroadcastss 0x2411(%rip),%ymm11 # 402c <_sk_callback_hsw+0x23f>
DB 196,66,45,172,221 ; vfnmadd213ps %ymm13,%ymm10,%ymm11
- DB 196,98,125,24,37,7,36,0,0 ; vbroadcastss 0x2407(%rip),%ymm12 # 4034 <_sk_callback_hsw+0x243>
+ DB 196,98,125,24,37,7,36,0,0 ; vbroadcastss 0x2407(%rip),%ymm12 # 4030 <_sk_callback_hsw+0x243>
DB 196,65,44,88,212 ; vaddps %ymm12,%ymm10,%ymm10
- DB 196,98,125,24,37,253,35,0,0 ; vbroadcastss 0x23fd(%rip),%ymm12 # 4038 <_sk_callback_hsw+0x247>
+ DB 196,98,125,24,37,253,35,0,0 ; vbroadcastss 0x23fd(%rip),%ymm12 # 4034 <_sk_callback_hsw+0x247>
DB 196,65,28,94,210 ; vdivps %ymm10,%ymm12,%ymm10
DB 196,65,36,92,210 ; vsubps %ymm10,%ymm11,%ymm10
DB 196,193,124,89,194 ; vmulps %ymm10,%ymm0,%ymm0
DB 196,99,125,8,208,1 ; vroundps $0x1,%ymm0,%ymm10
DB 196,65,124,92,210 ; vsubps %ymm10,%ymm0,%ymm10
- DB 196,98,125,24,29,222,35,0,0 ; vbroadcastss 0x23de(%rip),%ymm11 # 403c <_sk_callback_hsw+0x24b>
+ DB 196,98,125,24,29,222,35,0,0 ; vbroadcastss 0x23de(%rip),%ymm11 # 4038 <_sk_callback_hsw+0x24b>
DB 196,193,124,88,195 ; vaddps %ymm11,%ymm0,%ymm0
- DB 196,98,125,24,29,212,35,0,0 ; vbroadcastss 0x23d4(%rip),%ymm11 # 4040 <_sk_callback_hsw+0x24f>
+ DB 196,98,125,24,29,212,35,0,0 ; vbroadcastss 0x23d4(%rip),%ymm11 # 403c <_sk_callback_hsw+0x24f>
DB 196,98,45,172,216 ; vfnmadd213ps %ymm0,%ymm10,%ymm11
- DB 196,226,125,24,5,202,35,0,0 ; vbroadcastss 0x23ca(%rip),%ymm0 # 4044 <_sk_callback_hsw+0x253>
+ DB 196,226,125,24,5,202,35,0,0 ; vbroadcastss 0x23ca(%rip),%ymm0 # 4040 <_sk_callback_hsw+0x253>
DB 196,193,124,92,194 ; vsubps %ymm10,%ymm0,%ymm0
- DB 196,98,125,24,21,192,35,0,0 ; vbroadcastss 0x23c0(%rip),%ymm10 # 4048 <_sk_callback_hsw+0x257>
+ DB 196,98,125,24,21,192,35,0,0 ; vbroadcastss 0x23c0(%rip),%ymm10 # 4044 <_sk_callback_hsw+0x257>
DB 197,172,94,192 ; vdivps %ymm0,%ymm10,%ymm0
DB 197,164,88,192 ; vaddps %ymm0,%ymm11,%ymm0
- DB 196,98,125,24,21,179,35,0,0 ; vbroadcastss 0x23b3(%rip),%ymm10 # 404c <_sk_callback_hsw+0x25b>
+ DB 196,98,125,24,21,179,35,0,0 ; vbroadcastss 0x23b3(%rip),%ymm10 # 4048 <_sk_callback_hsw+0x25b>
DB 196,193,124,89,194 ; vmulps %ymm10,%ymm0,%ymm0
DB 197,253,91,192 ; vcvtps2dq %ymm0,%ymm0
DB 196,98,125,24,80,20 ; vbroadcastss 0x14(%rax),%ymm10
@@ -1791,7 +1790,7 @@ _sk_parametric_r_hsw LABEL PROC
DB 196,195,125,74,193,128 ; vblendvps %ymm8,%ymm9,%ymm0,%ymm0
DB 196,65,60,87,192 ; vxorps %ymm8,%ymm8,%ymm8
DB 196,193,124,95,192 ; vmaxps %ymm8,%ymm0,%ymm0
- DB 196,98,125,24,5,138,35,0,0 ; vbroadcastss 0x238a(%rip),%ymm8 # 4050 <_sk_callback_hsw+0x25f>
+ DB 196,98,125,24,5,138,35,0,0 ; vbroadcastss 0x238a(%rip),%ymm8 # 404c <_sk_callback_hsw+0x25f>
DB 196,193,124,93,192 ; vminps %ymm8,%ymm0,%ymm0
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
@@ -1809,33 +1808,33 @@ _sk_parametric_g_hsw LABEL PROC
DB 196,66,117,168,211 ; vfmadd213ps %ymm11,%ymm1,%ymm10
DB 196,226,125,24,8 ; vbroadcastss (%rax),%ymm1
DB 196,65,124,91,218 ; vcvtdq2ps %ymm10,%ymm11
- DB 196,98,125,24,37,66,35,0,0 ; vbroadcastss 0x2342(%rip),%ymm12 # 4054 <_sk_callback_hsw+0x263>
- DB 196,98,125,24,45,61,35,0,0 ; vbroadcastss 0x233d(%rip),%ymm13 # 4058 <_sk_callback_hsw+0x267>
+ DB 196,98,125,24,37,66,35,0,0 ; vbroadcastss 0x2342(%rip),%ymm12 # 4050 <_sk_callback_hsw+0x263>
+ DB 196,98,125,24,45,61,35,0,0 ; vbroadcastss 0x233d(%rip),%ymm13 # 4054 <_sk_callback_hsw+0x267>
DB 196,65,44,84,213 ; vandps %ymm13,%ymm10,%ymm10
- DB 196,98,125,24,45,51,35,0,0 ; vbroadcastss 0x2333(%rip),%ymm13 # 405c <_sk_callback_hsw+0x26b>
+ DB 196,98,125,24,45,51,35,0,0 ; vbroadcastss 0x2333(%rip),%ymm13 # 4058 <_sk_callback_hsw+0x26b>
DB 196,65,44,86,213 ; vorps %ymm13,%ymm10,%ymm10
- DB 196,98,125,24,45,41,35,0,0 ; vbroadcastss 0x2329(%rip),%ymm13 # 4060 <_sk_callback_hsw+0x26f>
+ DB 196,98,125,24,45,41,35,0,0 ; vbroadcastss 0x2329(%rip),%ymm13 # 405c <_sk_callback_hsw+0x26f>
DB 196,66,37,184,236 ; vfmadd231ps %ymm12,%ymm11,%ymm13
- DB 196,98,125,24,29,31,35,0,0 ; vbroadcastss 0x231f(%rip),%ymm11 # 4064 <_sk_callback_hsw+0x273>
+ DB 196,98,125,24,29,31,35,0,0 ; vbroadcastss 0x231f(%rip),%ymm11 # 4060 <_sk_callback_hsw+0x273>
DB 196,66,45,172,221 ; vfnmadd213ps %ymm13,%ymm10,%ymm11
- DB 196,98,125,24,37,21,35,0,0 ; vbroadcastss 0x2315(%rip),%ymm12 # 4068 <_sk_callback_hsw+0x277>
+ DB 196,98,125,24,37,21,35,0,0 ; vbroadcastss 0x2315(%rip),%ymm12 # 4064 <_sk_callback_hsw+0x277>
DB 196,65,44,88,212 ; vaddps %ymm12,%ymm10,%ymm10
- DB 196,98,125,24,37,11,35,0,0 ; vbroadcastss 0x230b(%rip),%ymm12 # 406c <_sk_callback_hsw+0x27b>
+ DB 196,98,125,24,37,11,35,0,0 ; vbroadcastss 0x230b(%rip),%ymm12 # 4068 <_sk_callback_hsw+0x27b>
DB 196,65,28,94,210 ; vdivps %ymm10,%ymm12,%ymm10
DB 196,65,36,92,210 ; vsubps %ymm10,%ymm11,%ymm10
DB 196,193,116,89,202 ; vmulps %ymm10,%ymm1,%ymm1
DB 196,99,125,8,209,1 ; vroundps $0x1,%ymm1,%ymm10
DB 196,65,116,92,210 ; vsubps %ymm10,%ymm1,%ymm10
- DB 196,98,125,24,29,236,34,0,0 ; vbroadcastss 0x22ec(%rip),%ymm11 # 4070 <_sk_callback_hsw+0x27f>
+ DB 196,98,125,24,29,236,34,0,0 ; vbroadcastss 0x22ec(%rip),%ymm11 # 406c <_sk_callback_hsw+0x27f>
DB 196,193,116,88,203 ; vaddps %ymm11,%ymm1,%ymm1
- DB 196,98,125,24,29,226,34,0,0 ; vbroadcastss 0x22e2(%rip),%ymm11 # 4074 <_sk_callback_hsw+0x283>
+ DB 196,98,125,24,29,226,34,0,0 ; vbroadcastss 0x22e2(%rip),%ymm11 # 4070 <_sk_callback_hsw+0x283>
DB 196,98,45,172,217 ; vfnmadd213ps %ymm1,%ymm10,%ymm11
- DB 196,226,125,24,13,216,34,0,0 ; vbroadcastss 0x22d8(%rip),%ymm1 # 4078 <_sk_callback_hsw+0x287>
+ DB 196,226,125,24,13,216,34,0,0 ; vbroadcastss 0x22d8(%rip),%ymm1 # 4074 <_sk_callback_hsw+0x287>
DB 196,193,116,92,202 ; vsubps %ymm10,%ymm1,%ymm1
- DB 196,98,125,24,21,206,34,0,0 ; vbroadcastss 0x22ce(%rip),%ymm10 # 407c <_sk_callback_hsw+0x28b>
+ DB 196,98,125,24,21,206,34,0,0 ; vbroadcastss 0x22ce(%rip),%ymm10 # 4078 <_sk_callback_hsw+0x28b>
DB 197,172,94,201 ; vdivps %ymm1,%ymm10,%ymm1
DB 197,164,88,201 ; vaddps %ymm1,%ymm11,%ymm1
- DB 196,98,125,24,21,193,34,0,0 ; vbroadcastss 0x22c1(%rip),%ymm10 # 4080 <_sk_callback_hsw+0x28f>
+ DB 196,98,125,24,21,193,34,0,0 ; vbroadcastss 0x22c1(%rip),%ymm10 # 407c <_sk_callback_hsw+0x28f>
DB 196,193,116,89,202 ; vmulps %ymm10,%ymm1,%ymm1
DB 197,253,91,201 ; vcvtps2dq %ymm1,%ymm1
DB 196,98,125,24,80,20 ; vbroadcastss 0x14(%rax),%ymm10
@@ -1843,7 +1842,7 @@ _sk_parametric_g_hsw LABEL PROC
DB 196,195,117,74,201,128 ; vblendvps %ymm8,%ymm9,%ymm1,%ymm1
DB 196,65,60,87,192 ; vxorps %ymm8,%ymm8,%ymm8
DB 196,193,116,95,200 ; vmaxps %ymm8,%ymm1,%ymm1
- DB 196,98,125,24,5,152,34,0,0 ; vbroadcastss 0x2298(%rip),%ymm8 # 4084 <_sk_callback_hsw+0x293>
+ DB 196,98,125,24,5,152,34,0,0 ; vbroadcastss 0x2298(%rip),%ymm8 # 4080 <_sk_callback_hsw+0x293>
DB 196,193,116,93,200 ; vminps %ymm8,%ymm1,%ymm1
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
@@ -1861,33 +1860,33 @@ _sk_parametric_b_hsw LABEL PROC
DB 196,66,109,168,211 ; vfmadd213ps %ymm11,%ymm2,%ymm10
DB 196,226,125,24,16 ; vbroadcastss (%rax),%ymm2
DB 196,65,124,91,218 ; vcvtdq2ps %ymm10,%ymm11
- DB 196,98,125,24,37,80,34,0,0 ; vbroadcastss 0x2250(%rip),%ymm12 # 4088 <_sk_callback_hsw+0x297>
- DB 196,98,125,24,45,75,34,0,0 ; vbroadcastss 0x224b(%rip),%ymm13 # 408c <_sk_callback_hsw+0x29b>
+ DB 196,98,125,24,37,80,34,0,0 ; vbroadcastss 0x2250(%rip),%ymm12 # 4084 <_sk_callback_hsw+0x297>
+ DB 196,98,125,24,45,75,34,0,0 ; vbroadcastss 0x224b(%rip),%ymm13 # 4088 <_sk_callback_hsw+0x29b>
DB 196,65,44,84,213 ; vandps %ymm13,%ymm10,%ymm10
- DB 196,98,125,24,45,65,34,0,0 ; vbroadcastss 0x2241(%rip),%ymm13 # 4090 <_sk_callback_hsw+0x29f>
+ DB 196,98,125,24,45,65,34,0,0 ; vbroadcastss 0x2241(%rip),%ymm13 # 408c <_sk_callback_hsw+0x29f>
DB 196,65,44,86,213 ; vorps %ymm13,%ymm10,%ymm10
- DB 196,98,125,24,45,55,34,0,0 ; vbroadcastss 0x2237(%rip),%ymm13 # 4094 <_sk_callback_hsw+0x2a3>
+ DB 196,98,125,24,45,55,34,0,0 ; vbroadcastss 0x2237(%rip),%ymm13 # 4090 <_sk_callback_hsw+0x2a3>
DB 196,66,37,184,236 ; vfmadd231ps %ymm12,%ymm11,%ymm13
- DB 196,98,125,24,29,45,34,0,0 ; vbroadcastss 0x222d(%rip),%ymm11 # 4098 <_sk_callback_hsw+0x2a7>
+ DB 196,98,125,24,29,45,34,0,0 ; vbroadcastss 0x222d(%rip),%ymm11 # 4094 <_sk_callback_hsw+0x2a7>
DB 196,66,45,172,221 ; vfnmadd213ps %ymm13,%ymm10,%ymm11
- DB 196,98,125,24,37,35,34,0,0 ; vbroadcastss 0x2223(%rip),%ymm12 # 409c <_sk_callback_hsw+0x2ab>
+ DB 196,98,125,24,37,35,34,0,0 ; vbroadcastss 0x2223(%rip),%ymm12 # 4098 <_sk_callback_hsw+0x2ab>
DB 196,65,44,88,212 ; vaddps %ymm12,%ymm10,%ymm10
- DB 196,98,125,24,37,25,34,0,0 ; vbroadcastss 0x2219(%rip),%ymm12 # 40a0 <_sk_callback_hsw+0x2af>
+ DB 196,98,125,24,37,25,34,0,0 ; vbroadcastss 0x2219(%rip),%ymm12 # 409c <_sk_callback_hsw+0x2af>
DB 196,65,28,94,210 ; vdivps %ymm10,%ymm12,%ymm10
DB 196,65,36,92,210 ; vsubps %ymm10,%ymm11,%ymm10
DB 196,193,108,89,210 ; vmulps %ymm10,%ymm2,%ymm2
DB 196,99,125,8,210,1 ; vroundps $0x1,%ymm2,%ymm10
DB 196,65,108,92,210 ; vsubps %ymm10,%ymm2,%ymm10
- DB 196,98,125,24,29,250,33,0,0 ; vbroadcastss 0x21fa(%rip),%ymm11 # 40a4 <_sk_callback_hsw+0x2b3>
+ DB 196,98,125,24,29,250,33,0,0 ; vbroadcastss 0x21fa(%rip),%ymm11 # 40a0 <_sk_callback_hsw+0x2b3>
DB 196,193,108,88,211 ; vaddps %ymm11,%ymm2,%ymm2
- DB 196,98,125,24,29,240,33,0,0 ; vbroadcastss 0x21f0(%rip),%ymm11 # 40a8 <_sk_callback_hsw+0x2b7>
+ DB 196,98,125,24,29,240,33,0,0 ; vbroadcastss 0x21f0(%rip),%ymm11 # 40a4 <_sk_callback_hsw+0x2b7>
DB 196,98,45,172,218 ; vfnmadd213ps %ymm2,%ymm10,%ymm11
- DB 196,226,125,24,21,230,33,0,0 ; vbroadcastss 0x21e6(%rip),%ymm2 # 40ac <_sk_callback_hsw+0x2bb>
+ DB 196,226,125,24,21,230,33,0,0 ; vbroadcastss 0x21e6(%rip),%ymm2 # 40a8 <_sk_callback_hsw+0x2bb>
DB 196,193,108,92,210 ; vsubps %ymm10,%ymm2,%ymm2
- DB 196,98,125,24,21,220,33,0,0 ; vbroadcastss 0x21dc(%rip),%ymm10 # 40b0 <_sk_callback_hsw+0x2bf>
+ DB 196,98,125,24,21,220,33,0,0 ; vbroadcastss 0x21dc(%rip),%ymm10 # 40ac <_sk_callback_hsw+0x2bf>
DB 197,172,94,210 ; vdivps %ymm2,%ymm10,%ymm2
DB 197,164,88,210 ; vaddps %ymm2,%ymm11,%ymm2
- DB 196,98,125,24,21,207,33,0,0 ; vbroadcastss 0x21cf(%rip),%ymm10 # 40b4 <_sk_callback_hsw+0x2c3>
+ DB 196,98,125,24,21,207,33,0,0 ; vbroadcastss 0x21cf(%rip),%ymm10 # 40b0 <_sk_callback_hsw+0x2c3>
DB 196,193,108,89,210 ; vmulps %ymm10,%ymm2,%ymm2
DB 197,253,91,210 ; vcvtps2dq %ymm2,%ymm2
DB 196,98,125,24,80,20 ; vbroadcastss 0x14(%rax),%ymm10
@@ -1895,7 +1894,7 @@ _sk_parametric_b_hsw LABEL PROC
DB 196,195,109,74,209,128 ; vblendvps %ymm8,%ymm9,%ymm2,%ymm2
DB 196,65,60,87,192 ; vxorps %ymm8,%ymm8,%ymm8
DB 196,193,108,95,208 ; vmaxps %ymm8,%ymm2,%ymm2
- DB 196,98,125,24,5,166,33,0,0 ; vbroadcastss 0x21a6(%rip),%ymm8 # 40b8 <_sk_callback_hsw+0x2c7>
+ DB 196,98,125,24,5,166,33,0,0 ; vbroadcastss 0x21a6(%rip),%ymm8 # 40b4 <_sk_callback_hsw+0x2c7>
DB 196,193,108,93,208 ; vminps %ymm8,%ymm2,%ymm2
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
@@ -1913,33 +1912,33 @@ _sk_parametric_a_hsw LABEL PROC
DB 196,66,101,168,211 ; vfmadd213ps %ymm11,%ymm3,%ymm10
DB 196,226,125,24,24 ; vbroadcastss (%rax),%ymm3
DB 196,65,124,91,218 ; vcvtdq2ps %ymm10,%ymm11
- DB 196,98,125,24,37,94,33,0,0 ; vbroadcastss 0x215e(%rip),%ymm12 # 40bc <_sk_callback_hsw+0x2cb>
- DB 196,98,125,24,45,89,33,0,0 ; vbroadcastss 0x2159(%rip),%ymm13 # 40c0 <_sk_callback_hsw+0x2cf>
+ DB 196,98,125,24,37,94,33,0,0 ; vbroadcastss 0x215e(%rip),%ymm12 # 40b8 <_sk_callback_hsw+0x2cb>
+ DB 196,98,125,24,45,89,33,0,0 ; vbroadcastss 0x2159(%rip),%ymm13 # 40bc <_sk_callback_hsw+0x2cf>
DB 196,65,44,84,213 ; vandps %ymm13,%ymm10,%ymm10
- DB 196,98,125,24,45,79,33,0,0 ; vbroadcastss 0x214f(%rip),%ymm13 # 40c4 <_sk_callback_hsw+0x2d3>
+ DB 196,98,125,24,45,79,33,0,0 ; vbroadcastss 0x214f(%rip),%ymm13 # 40c0 <_sk_callback_hsw+0x2d3>
DB 196,65,44,86,213 ; vorps %ymm13,%ymm10,%ymm10
- DB 196,98,125,24,45,69,33,0,0 ; vbroadcastss 0x2145(%rip),%ymm13 # 40c8 <_sk_callback_hsw+0x2d7>
+ DB 196,98,125,24,45,69,33,0,0 ; vbroadcastss 0x2145(%rip),%ymm13 # 40c4 <_sk_callback_hsw+0x2d7>
DB 196,66,37,184,236 ; vfmadd231ps %ymm12,%ymm11,%ymm13
- DB 196,98,125,24,29,59,33,0,0 ; vbroadcastss 0x213b(%rip),%ymm11 # 40cc <_sk_callback_hsw+0x2db>
+ DB 196,98,125,24,29,59,33,0,0 ; vbroadcastss 0x213b(%rip),%ymm11 # 40c8 <_sk_callback_hsw+0x2db>
DB 196,66,45,172,221 ; vfnmadd213ps %ymm13,%ymm10,%ymm11
- DB 196,98,125,24,37,49,33,0,0 ; vbroadcastss 0x2131(%rip),%ymm12 # 40d0 <_sk_callback_hsw+0x2df>
+ DB 196,98,125,24,37,49,33,0,0 ; vbroadcastss 0x2131(%rip),%ymm12 # 40cc <_sk_callback_hsw+0x2df>
DB 196,65,44,88,212 ; vaddps %ymm12,%ymm10,%ymm10
- DB 196,98,125,24,37,39,33,0,0 ; vbroadcastss 0x2127(%rip),%ymm12 # 40d4 <_sk_callback_hsw+0x2e3>
+ DB 196,98,125,24,37,39,33,0,0 ; vbroadcastss 0x2127(%rip),%ymm12 # 40d0 <_sk_callback_hsw+0x2e3>
DB 196,65,28,94,210 ; vdivps %ymm10,%ymm12,%ymm10
DB 196,65,36,92,210 ; vsubps %ymm10,%ymm11,%ymm10
DB 196,193,100,89,218 ; vmulps %ymm10,%ymm3,%ymm3
DB 196,99,125,8,211,1 ; vroundps $0x1,%ymm3,%ymm10
DB 196,65,100,92,210 ; vsubps %ymm10,%ymm3,%ymm10
- DB 196,98,125,24,29,8,33,0,0 ; vbroadcastss 0x2108(%rip),%ymm11 # 40d8 <_sk_callback_hsw+0x2e7>
+ DB 196,98,125,24,29,8,33,0,0 ; vbroadcastss 0x2108(%rip),%ymm11 # 40d4 <_sk_callback_hsw+0x2e7>
DB 196,193,100,88,219 ; vaddps %ymm11,%ymm3,%ymm3
- DB 196,98,125,24,29,254,32,0,0 ; vbroadcastss 0x20fe(%rip),%ymm11 # 40dc <_sk_callback_hsw+0x2eb>
+ DB 196,98,125,24,29,254,32,0,0 ; vbroadcastss 0x20fe(%rip),%ymm11 # 40d8 <_sk_callback_hsw+0x2eb>
DB 196,98,45,172,219 ; vfnmadd213ps %ymm3,%ymm10,%ymm11
- DB 196,226,125,24,29,244,32,0,0 ; vbroadcastss 0x20f4(%rip),%ymm3 # 40e0 <_sk_callback_hsw+0x2ef>
+ DB 196,226,125,24,29,244,32,0,0 ; vbroadcastss 0x20f4(%rip),%ymm3 # 40dc <_sk_callback_hsw+0x2ef>
DB 196,193,100,92,218 ; vsubps %ymm10,%ymm3,%ymm3
- DB 196,98,125,24,21,234,32,0,0 ; vbroadcastss 0x20ea(%rip),%ymm10 # 40e4 <_sk_callback_hsw+0x2f3>
+ DB 196,98,125,24,21,234,32,0,0 ; vbroadcastss 0x20ea(%rip),%ymm10 # 40e0 <_sk_callback_hsw+0x2f3>
DB 197,172,94,219 ; vdivps %ymm3,%ymm10,%ymm3
DB 197,164,88,219 ; vaddps %ymm3,%ymm11,%ymm3
- DB 196,98,125,24,21,221,32,0,0 ; vbroadcastss 0x20dd(%rip),%ymm10 # 40e8 <_sk_callback_hsw+0x2f7>
+ DB 196,98,125,24,21,221,32,0,0 ; vbroadcastss 0x20dd(%rip),%ymm10 # 40e4 <_sk_callback_hsw+0x2f7>
DB 196,193,100,89,218 ; vmulps %ymm10,%ymm3,%ymm3
DB 197,253,91,219 ; vcvtps2dq %ymm3,%ymm3
DB 196,98,125,24,80,20 ; vbroadcastss 0x14(%rax),%ymm10
@@ -1947,33 +1946,33 @@ _sk_parametric_a_hsw LABEL PROC
DB 196,195,101,74,217,128 ; vblendvps %ymm8,%ymm9,%ymm3,%ymm3
DB 196,65,60,87,192 ; vxorps %ymm8,%ymm8,%ymm8
DB 196,193,100,95,216 ; vmaxps %ymm8,%ymm3,%ymm3
- DB 196,98,125,24,5,180,32,0,0 ; vbroadcastss 0x20b4(%rip),%ymm8 # 40ec <_sk_callback_hsw+0x2fb>
+ DB 196,98,125,24,5,180,32,0,0 ; vbroadcastss 0x20b4(%rip),%ymm8 # 40e8 <_sk_callback_hsw+0x2fb>
DB 196,193,100,93,216 ; vminps %ymm8,%ymm3,%ymm3
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
PUBLIC _sk_lab_to_xyz_hsw
_sk_lab_to_xyz_hsw LABEL PROC
- DB 196,98,125,24,5,166,32,0,0 ; vbroadcastss 0x20a6(%rip),%ymm8 # 40f0 <_sk_callback_hsw+0x2ff>
- DB 196,98,125,24,13,161,32,0,0 ; vbroadcastss 0x20a1(%rip),%ymm9 # 40f4 <_sk_callback_hsw+0x303>
- DB 196,98,125,24,21,156,32,0,0 ; vbroadcastss 0x209c(%rip),%ymm10 # 40f8 <_sk_callback_hsw+0x307>
+ DB 196,98,125,24,5,166,32,0,0 ; vbroadcastss 0x20a6(%rip),%ymm8 # 40ec <_sk_callback_hsw+0x2ff>
+ DB 196,98,125,24,13,161,32,0,0 ; vbroadcastss 0x20a1(%rip),%ymm9 # 40f0 <_sk_callback_hsw+0x303>
+ DB 196,98,125,24,21,156,32,0,0 ; vbroadcastss 0x209c(%rip),%ymm10 # 40f4 <_sk_callback_hsw+0x307>
DB 196,194,53,168,202 ; vfmadd213ps %ymm10,%ymm9,%ymm1
DB 196,194,53,168,210 ; vfmadd213ps %ymm10,%ymm9,%ymm2
- DB 196,98,125,24,13,141,32,0,0 ; vbroadcastss 0x208d(%rip),%ymm9 # 40fc <_sk_callback_hsw+0x30b>
+ DB 196,98,125,24,13,141,32,0,0 ; vbroadcastss 0x208d(%rip),%ymm9 # 40f8 <_sk_callback_hsw+0x30b>
DB 196,66,125,184,200 ; vfmadd231ps %ymm8,%ymm0,%ymm9
- DB 196,226,125,24,5,131,32,0,0 ; vbroadcastss 0x2083(%rip),%ymm0 # 4100 <_sk_callback_hsw+0x30f>
+ DB 196,226,125,24,5,131,32,0,0 ; vbroadcastss 0x2083(%rip),%ymm0 # 40fc <_sk_callback_hsw+0x30f>
DB 197,180,89,192 ; vmulps %ymm0,%ymm9,%ymm0
- DB 196,98,125,24,5,122,32,0,0 ; vbroadcastss 0x207a(%rip),%ymm8 # 4104 <_sk_callback_hsw+0x313>
+ DB 196,98,125,24,5,122,32,0,0 ; vbroadcastss 0x207a(%rip),%ymm8 # 4100 <_sk_callback_hsw+0x313>
DB 196,98,117,168,192 ; vfmadd213ps %ymm0,%ymm1,%ymm8
- DB 196,98,125,24,13,112,32,0,0 ; vbroadcastss 0x2070(%rip),%ymm9 # 4108 <_sk_callback_hsw+0x317>
+ DB 196,98,125,24,13,112,32,0,0 ; vbroadcastss 0x2070(%rip),%ymm9 # 4104 <_sk_callback_hsw+0x317>
DB 196,98,109,172,200 ; vfnmadd213ps %ymm0,%ymm2,%ymm9
DB 196,193,60,89,200 ; vmulps %ymm8,%ymm8,%ymm1
DB 197,188,89,201 ; vmulps %ymm1,%ymm8,%ymm1
- DB 196,226,125,24,21,93,32,0,0 ; vbroadcastss 0x205d(%rip),%ymm2 # 410c <_sk_callback_hsw+0x31b>
+ DB 196,226,125,24,21,93,32,0,0 ; vbroadcastss 0x205d(%rip),%ymm2 # 4108 <_sk_callback_hsw+0x31b>
DB 197,108,194,209,1 ; vcmpltps %ymm1,%ymm2,%ymm10
- DB 196,98,125,24,29,83,32,0,0 ; vbroadcastss 0x2053(%rip),%ymm11 # 4110 <_sk_callback_hsw+0x31f>
+ DB 196,98,125,24,29,83,32,0,0 ; vbroadcastss 0x2053(%rip),%ymm11 # 410c <_sk_callback_hsw+0x31f>
DB 196,65,60,88,195 ; vaddps %ymm11,%ymm8,%ymm8
- DB 196,98,125,24,37,73,32,0,0 ; vbroadcastss 0x2049(%rip),%ymm12 # 4114 <_sk_callback_hsw+0x323>
+ DB 196,98,125,24,37,73,32,0,0 ; vbroadcastss 0x2049(%rip),%ymm12 # 4110 <_sk_callback_hsw+0x323>
DB 196,65,60,89,196 ; vmulps %ymm12,%ymm8,%ymm8
DB 196,99,61,74,193,160 ; vblendvps %ymm10,%ymm1,%ymm8,%ymm8
DB 197,252,89,200 ; vmulps %ymm0,%ymm0,%ymm1
@@ -1988,9 +1987,9 @@ _sk_lab_to_xyz_hsw LABEL PROC
DB 196,65,52,88,203 ; vaddps %ymm11,%ymm9,%ymm9
DB 196,65,52,89,204 ; vmulps %ymm12,%ymm9,%ymm9
DB 196,227,53,74,208,32 ; vblendvps %ymm2,%ymm0,%ymm9,%ymm2
- DB 196,226,125,24,5,254,31,0,0 ; vbroadcastss 0x1ffe(%rip),%ymm0 # 4118 <_sk_callback_hsw+0x327>
+ DB 196,226,125,24,5,254,31,0,0 ; vbroadcastss 0x1ffe(%rip),%ymm0 # 4114 <_sk_callback_hsw+0x327>
DB 197,188,89,192 ; vmulps %ymm0,%ymm8,%ymm0
- DB 196,98,125,24,5,245,31,0,0 ; vbroadcastss 0x1ff5(%rip),%ymm8 # 411c <_sk_callback_hsw+0x32b>
+ DB 196,98,125,24,5,245,31,0,0 ; vbroadcastss 0x1ff5(%rip),%ymm8 # 4118 <_sk_callback_hsw+0x32b>
DB 196,193,108,89,208 ; vmulps %ymm8,%ymm2,%ymm2
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
@@ -2002,11 +2001,11 @@ _sk_load_a8_hsw LABEL PROC
DB 72,139,0 ; mov (%rax),%rax
DB 72,1,248 ; add %rdi,%rax
DB 77,133,192 ; test %r8,%r8
- DB 117,45 ; jne 216d <_sk_load_a8_hsw+0x3d>
+ DB 117,45 ; jne 2169 <_sk_load_a8_hsw+0x3d>
DB 197,250,126,0 ; vmovq (%rax),%xmm0
DB 196,226,125,49,192 ; vpmovzxbd %xmm0,%ymm0
DB 197,252,91,192 ; vcvtdq2ps %ymm0,%ymm0
- DB 196,226,125,24,13,202,31,0,0 ; vbroadcastss 0x1fca(%rip),%ymm1 # 4120 <_sk_callback_hsw+0x32f>
+ DB 196,226,125,24,13,202,31,0,0 ; vbroadcastss 0x1fca(%rip),%ymm1 # 411c <_sk_callback_hsw+0x32f>
DB 197,252,89,217 ; vmulps %ymm1,%ymm0,%ymm3
DB 72,173 ; lods %ds:(%rsi),%rax
DB 197,252,87,192 ; vxorps %ymm0,%ymm0,%ymm0
@@ -2023,9 +2022,9 @@ _sk_load_a8_hsw LABEL PROC
DB 77,9,217 ; or %r11,%r9
DB 72,131,193,8 ; add $0x8,%rcx
DB 73,255,202 ; dec %r10
- DB 117,234 ; jne 2175 <_sk_load_a8_hsw+0x45>
+ DB 117,234 ; jne 2171 <_sk_load_a8_hsw+0x45>
DB 196,193,249,110,193 ; vmovq %r9,%xmm0
- DB 235,178 ; jmp 2144 <_sk_load_a8_hsw+0x14>
+ DB 235,178 ; jmp 2140 <_sk_load_a8_hsw+0x14>
PUBLIC _sk_gather_a8_hsw
_sk_gather_a8_hsw LABEL PROC
@@ -2069,7 +2068,7 @@ _sk_gather_a8_hsw LABEL PROC
DB 196,227,121,32,192,7 ; vpinsrb $0x7,%eax,%xmm0,%xmm0
DB 196,226,125,49,192 ; vpmovzxbd %xmm0,%ymm0
DB 197,252,91,192 ; vcvtdq2ps %ymm0,%ymm0
- DB 196,226,125,24,13,213,30,0,0 ; vbroadcastss 0x1ed5(%rip),%ymm1 # 4124 <_sk_callback_hsw+0x333>
+ DB 196,226,125,24,13,213,30,0,0 ; vbroadcastss 0x1ed5(%rip),%ymm1 # 4120 <_sk_callback_hsw+0x333>
DB 197,252,89,217 ; vmulps %ymm1,%ymm0,%ymm3
DB 72,173 ; lods %ds:(%rsi),%rax
DB 197,252,87,192 ; vxorps %ymm0,%ymm0,%ymm0
@@ -2085,14 +2084,14 @@ PUBLIC _sk_store_a8_hsw
_sk_store_a8_hsw LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 76,139,16 ; mov (%rax),%r10
- DB 196,98,125,24,5,176,30,0,0 ; vbroadcastss 0x1eb0(%rip),%ymm8 # 4128 <_sk_callback_hsw+0x337>
+ DB 196,98,125,24,5,176,30,0,0 ; vbroadcastss 0x1eb0(%rip),%ymm8 # 4124 <_sk_callback_hsw+0x337>
DB 196,65,100,89,192 ; vmulps %ymm8,%ymm3,%ymm8
DB 196,65,125,91,192 ; vcvtps2dq %ymm8,%ymm8
DB 196,67,125,25,193,1 ; vextractf128 $0x1,%ymm8,%xmm9
DB 196,66,57,43,193 ; vpackusdw %xmm9,%xmm8,%xmm8
DB 196,65,57,103,192 ; vpackuswb %xmm8,%xmm8,%xmm8
DB 72,133,201 ; test %rcx,%rcx
- DB 117,10 ; jne 22a1 <_sk_store_a8_hsw+0x37>
+ DB 117,10 ; jne 229d <_sk_store_a8_hsw+0x37>
DB 196,65,123,17,4,58 ; vmovsd %xmm8,(%r10,%rdi,1)
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
@@ -2100,10 +2099,10 @@ _sk_store_a8_hsw LABEL PROC
DB 65,128,224,7 ; and $0x7,%r8b
DB 65,254,200 ; dec %r8b
DB 65,128,248,6 ; cmp $0x6,%r8b
- DB 119,236 ; ja 229d <_sk_store_a8_hsw+0x33>
+ DB 119,236 ; ja 2299 <_sk_store_a8_hsw+0x33>
DB 196,66,121,48,192 ; vpmovzxbw %xmm8,%xmm8
DB 69,15,182,192 ; movzbl %r8b,%r8d
- DB 76,141,13,67,0,0,0 ; lea 0x43(%rip),%r9 # 2304 <_sk_store_a8_hsw+0x9a>
+ DB 76,141,13,67,0,0,0 ; lea 0x43(%rip),%r9 # 2300 <_sk_store_a8_hsw+0x9a>
DB 75,99,4,129 ; movslq (%r9,%r8,4),%rax
DB 76,1,200 ; add %r9,%rax
DB 255,224 ; jmpq *%rax
@@ -2114,7 +2113,7 @@ _sk_store_a8_hsw LABEL PROC
DB 196,67,121,20,68,58,2,4 ; vpextrb $0x4,%xmm8,0x2(%r10,%rdi,1)
DB 196,67,121,20,68,58,1,2 ; vpextrb $0x2,%xmm8,0x1(%r10,%rdi,1)
DB 196,67,121,20,4,58,0 ; vpextrb $0x0,%xmm8,(%r10,%rdi,1)
- DB 235,154 ; jmp 229d <_sk_store_a8_hsw+0x33>
+ DB 235,154 ; jmp 2299 <_sk_store_a8_hsw+0x33>
DB 144 ; nop
DB 246,255 ; idiv %bh
DB 255 ; (bad)
@@ -2146,14 +2145,14 @@ _sk_load_g8_hsw LABEL PROC
DB 72,139,0 ; mov (%rax),%rax
DB 72,1,248 ; add %rdi,%rax
DB 77,133,192 ; test %r8,%r8
- DB 117,50 ; jne 2362 <_sk_load_g8_hsw+0x42>
+ DB 117,50 ; jne 235e <_sk_load_g8_hsw+0x42>
DB 197,250,126,0 ; vmovq (%rax),%xmm0
DB 196,226,125,49,192 ; vpmovzxbd %xmm0,%ymm0
DB 197,252,91,192 ; vcvtdq2ps %ymm0,%ymm0
- DB 196,226,125,24,13,230,29,0,0 ; vbroadcastss 0x1de6(%rip),%ymm1 # 412c <_sk_callback_hsw+0x33b>
+ DB 196,226,125,24,13,230,29,0,0 ; vbroadcastss 0x1de6(%rip),%ymm1 # 4128 <_sk_callback_hsw+0x33b>
DB 197,252,89,193 ; vmulps %ymm1,%ymm0,%ymm0
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,29,219,29,0,0 ; vbroadcastss 0x1ddb(%rip),%ymm3 # 4130 <_sk_callback_hsw+0x33f>
+ DB 196,226,125,24,29,219,29,0,0 ; vbroadcastss 0x1ddb(%rip),%ymm3 # 412c <_sk_callback_hsw+0x33f>
DB 76,137,193 ; mov %r8,%rcx
DB 197,252,40,200 ; vmovaps %ymm0,%ymm1
DB 197,252,40,208 ; vmovaps %ymm0,%ymm2
@@ -2167,9 +2166,9 @@ _sk_load_g8_hsw LABEL PROC
DB 77,9,217 ; or %r11,%r9
DB 72,131,193,8 ; add $0x8,%rcx
DB 73,255,202 ; dec %r10
- DB 117,234 ; jne 236a <_sk_load_g8_hsw+0x4a>
+ DB 117,234 ; jne 2366 <_sk_load_g8_hsw+0x4a>
DB 196,193,249,110,193 ; vmovq %r9,%xmm0
- DB 235,173 ; jmp 2334 <_sk_load_g8_hsw+0x14>
+ DB 235,173 ; jmp 2330 <_sk_load_g8_hsw+0x14>
PUBLIC _sk_gather_g8_hsw
_sk_gather_g8_hsw LABEL PROC
@@ -2213,10 +2212,10 @@ _sk_gather_g8_hsw LABEL PROC
DB 196,227,121,32,192,7 ; vpinsrb $0x7,%eax,%xmm0,%xmm0
DB 196,226,125,49,192 ; vpmovzxbd %xmm0,%ymm0
DB 197,252,91,192 ; vcvtdq2ps %ymm0,%ymm0
- DB 196,226,125,24,13,240,28,0,0 ; vbroadcastss 0x1cf0(%rip),%ymm1 # 4134 <_sk_callback_hsw+0x343>
+ DB 196,226,125,24,13,240,28,0,0 ; vbroadcastss 0x1cf0(%rip),%ymm1 # 4130 <_sk_callback_hsw+0x343>
DB 197,252,89,193 ; vmulps %ymm1,%ymm0,%ymm0
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,29,229,28,0,0 ; vbroadcastss 0x1ce5(%rip),%ymm3 # 4138 <_sk_callback_hsw+0x347>
+ DB 196,226,125,24,29,229,28,0,0 ; vbroadcastss 0x1ce5(%rip),%ymm3 # 4134 <_sk_callback_hsw+0x347>
DB 197,252,40,200 ; vmovaps %ymm0,%ymm1
DB 197,252,40,208 ; vmovaps %ymm0,%ymm2
DB 91 ; pop %rbx
@@ -2230,9 +2229,9 @@ _sk_gather_i8_hsw LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 73,137,192 ; mov %rax,%r8
DB 77,133,192 ; test %r8,%r8
- DB 116,5 ; je 2473 <_sk_gather_i8_hsw+0xf>
+ DB 116,5 ; je 246f <_sk_gather_i8_hsw+0xf>
DB 76,137,192 ; mov %r8,%rax
- DB 235,2 ; jmp 2475 <_sk_gather_i8_hsw+0x11>
+ DB 235,2 ; jmp 2471 <_sk_gather_i8_hsw+0x11>
DB 72,173 ; lods %ds:(%rsi),%rax
DB 65,87 ; push %r15
DB 65,86 ; push %r14
@@ -2270,14 +2269,14 @@ _sk_gather_i8_hsw LABEL PROC
DB 73,139,64,8 ; mov 0x8(%r8),%rax
DB 197,245,118,201 ; vpcmpeqd %ymm1,%ymm1,%ymm1
DB 196,226,117,144,28,128 ; vpgatherdd %ymm1,(%rax,%ymm0,4),%ymm3
- DB 197,229,219,5,253,29,0,0 ; vpand 0x1dfd(%rip),%ymm3,%ymm0 # 4320 <_sk_callback_hsw+0x52f>
+ DB 197,229,219,5,1,30,0,0 ; vpand 0x1e01(%rip),%ymm3,%ymm0 # 4320 <_sk_callback_hsw+0x533>
DB 197,252,91,192 ; vcvtdq2ps %ymm0,%ymm0
- DB 196,98,125,24,5,12,28,0,0 ; vbroadcastss 0x1c0c(%rip),%ymm8 # 413c <_sk_callback_hsw+0x34b>
+ DB 196,98,125,24,5,12,28,0,0 ; vbroadcastss 0x1c0c(%rip),%ymm8 # 4138 <_sk_callback_hsw+0x34b>
DB 196,193,124,89,192 ; vmulps %ymm8,%ymm0,%ymm0
- DB 196,226,101,0,13,2,30,0,0 ; vpshufb 0x1e02(%rip),%ymm3,%ymm1 # 4340 <_sk_callback_hsw+0x54f>
+ DB 196,226,101,0,13,6,30,0,0 ; vpshufb 0x1e06(%rip),%ymm3,%ymm1 # 4340 <_sk_callback_hsw+0x553>
DB 197,252,91,201 ; vcvtdq2ps %ymm1,%ymm1
DB 196,193,116,89,200 ; vmulps %ymm8,%ymm1,%ymm1
- DB 196,226,101,0,21,16,30,0,0 ; vpshufb 0x1e10(%rip),%ymm3,%ymm2 # 4360 <_sk_callback_hsw+0x56f>
+ DB 196,226,101,0,21,20,30,0,0 ; vpshufb 0x1e14(%rip),%ymm3,%ymm2 # 4360 <_sk_callback_hsw+0x573>
DB 197,252,91,210 ; vcvtdq2ps %ymm2,%ymm2
DB 196,193,108,89,208 ; vmulps %ymm8,%ymm2,%ymm2
DB 197,229,114,211,24 ; vpsrld $0x18,%ymm3,%ymm3
@@ -2296,35 +2295,35 @@ _sk_load_565_hsw LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 76,139,16 ; mov (%rax),%r10
DB 72,133,201 ; test %rcx,%rcx
- DB 117,114 ; jne 25f0 <_sk_load_565_hsw+0x7c>
+ DB 117,114 ; jne 25ec <_sk_load_565_hsw+0x7c>
DB 196,193,122,111,4,122 ; vmovdqu (%r10,%rdi,2),%xmm0
DB 196,226,125,51,208 ; vpmovzxwd %xmm0,%ymm2
- DB 196,226,125,88,5,174,27,0,0 ; vpbroadcastd 0x1bae(%rip),%ymm0 # 4140 <_sk_callback_hsw+0x34f>
+ DB 196,226,125,88,5,174,27,0,0 ; vpbroadcastd 0x1bae(%rip),%ymm0 # 413c <_sk_callback_hsw+0x34f>
DB 197,237,219,192 ; vpand %ymm0,%ymm2,%ymm0
DB 197,252,91,192 ; vcvtdq2ps %ymm0,%ymm0
- DB 196,226,125,24,13,161,27,0,0 ; vbroadcastss 0x1ba1(%rip),%ymm1 # 4144 <_sk_callback_hsw+0x353>
+ DB 196,226,125,24,13,161,27,0,0 ; vbroadcastss 0x1ba1(%rip),%ymm1 # 4140 <_sk_callback_hsw+0x353>
DB 197,252,89,193 ; vmulps %ymm1,%ymm0,%ymm0
- DB 196,226,125,88,13,152,27,0,0 ; vpbroadcastd 0x1b98(%rip),%ymm1 # 4148 <_sk_callback_hsw+0x357>
+ DB 196,226,125,88,13,152,27,0,0 ; vpbroadcastd 0x1b98(%rip),%ymm1 # 4144 <_sk_callback_hsw+0x357>
DB 197,237,219,201 ; vpand %ymm1,%ymm2,%ymm1
DB 197,252,91,201 ; vcvtdq2ps %ymm1,%ymm1
- DB 196,226,125,24,29,139,27,0,0 ; vbroadcastss 0x1b8b(%rip),%ymm3 # 414c <_sk_callback_hsw+0x35b>
+ DB 196,226,125,24,29,139,27,0,0 ; vbroadcastss 0x1b8b(%rip),%ymm3 # 4148 <_sk_callback_hsw+0x35b>
DB 197,244,89,203 ; vmulps %ymm3,%ymm1,%ymm1
- DB 196,226,125,88,29,130,27,0,0 ; vpbroadcastd 0x1b82(%rip),%ymm3 # 4150 <_sk_callback_hsw+0x35f>
+ DB 196,226,125,88,29,130,27,0,0 ; vpbroadcastd 0x1b82(%rip),%ymm3 # 414c <_sk_callback_hsw+0x35f>
DB 197,237,219,211 ; vpand %ymm3,%ymm2,%ymm2
DB 197,252,91,210 ; vcvtdq2ps %ymm2,%ymm2
- DB 196,226,125,24,29,117,27,0,0 ; vbroadcastss 0x1b75(%rip),%ymm3 # 4154 <_sk_callback_hsw+0x363>
+ DB 196,226,125,24,29,117,27,0,0 ; vbroadcastss 0x1b75(%rip),%ymm3 # 4150 <_sk_callback_hsw+0x363>
DB 197,236,89,211 ; vmulps %ymm3,%ymm2,%ymm2
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,29,106,27,0,0 ; vbroadcastss 0x1b6a(%rip),%ymm3 # 4158 <_sk_callback_hsw+0x367>
+ DB 196,226,125,24,29,106,27,0,0 ; vbroadcastss 0x1b6a(%rip),%ymm3 # 4154 <_sk_callback_hsw+0x367>
DB 255,224 ; jmpq *%rax
DB 65,137,200 ; mov %ecx,%r8d
DB 65,128,224,7 ; and $0x7,%r8b
DB 197,249,239,192 ; vpxor %xmm0,%xmm0,%xmm0
DB 65,254,200 ; dec %r8b
DB 65,128,248,6 ; cmp $0x6,%r8b
- DB 119,128 ; ja 2584 <_sk_load_565_hsw+0x10>
+ DB 119,128 ; ja 2580 <_sk_load_565_hsw+0x10>
DB 69,15,182,192 ; movzbl %r8b,%r8d
- DB 76,141,13,73,0,0,0 ; lea 0x49(%rip),%r9 # 2658 <_sk_load_565_hsw+0xe4>
+ DB 76,141,13,73,0,0,0 ; lea 0x49(%rip),%r9 # 2654 <_sk_load_565_hsw+0xe4>
DB 75,99,4,129 ; movslq (%r9,%r8,4),%rax
DB 76,1,200 ; add %r9,%rax
DB 255,224 ; jmpq *%rax
@@ -2336,7 +2335,7 @@ _sk_load_565_hsw LABEL PROC
DB 196,193,121,196,68,122,4,2 ; vpinsrw $0x2,0x4(%r10,%rdi,2),%xmm0,%xmm0
DB 196,193,121,196,68,122,2,1 ; vpinsrw $0x1,0x2(%r10,%rdi,2),%xmm0,%xmm0
DB 196,193,121,196,4,122,0 ; vpinsrw $0x0,(%r10,%rdi,2),%xmm0,%xmm0
- DB 233,44,255,255,255 ; jmpq 2584 <_sk_load_565_hsw+0x10>
+ DB 233,44,255,255,255 ; jmpq 2580 <_sk_load_565_hsw+0x10>
DB 244 ; hlt
DB 255 ; (bad)
DB 255 ; (bad)
@@ -2404,23 +2403,23 @@ _sk_gather_565_hsw LABEL PROC
DB 65,15,183,4,88 ; movzwl (%r8,%rbx,2),%eax
DB 197,249,196,192,7 ; vpinsrw $0x7,%eax,%xmm0,%xmm0
DB 196,226,125,51,208 ; vpmovzxwd %xmm0,%ymm2
- DB 196,226,125,88,5,45,26,0,0 ; vpbroadcastd 0x1a2d(%rip),%ymm0 # 415c <_sk_callback_hsw+0x36b>
+ DB 196,226,125,88,5,45,26,0,0 ; vpbroadcastd 0x1a2d(%rip),%ymm0 # 4158 <_sk_callback_hsw+0x36b>
DB 197,237,219,192 ; vpand %ymm0,%ymm2,%ymm0
DB 197,252,91,192 ; vcvtdq2ps %ymm0,%ymm0
- DB 196,226,125,24,13,32,26,0,0 ; vbroadcastss 0x1a20(%rip),%ymm1 # 4160 <_sk_callback_hsw+0x36f>
+ DB 196,226,125,24,13,32,26,0,0 ; vbroadcastss 0x1a20(%rip),%ymm1 # 415c <_sk_callback_hsw+0x36f>
DB 197,252,89,193 ; vmulps %ymm1,%ymm0,%ymm0
- DB 196,226,125,88,13,23,26,0,0 ; vpbroadcastd 0x1a17(%rip),%ymm1 # 4164 <_sk_callback_hsw+0x373>
+ DB 196,226,125,88,13,23,26,0,0 ; vpbroadcastd 0x1a17(%rip),%ymm1 # 4160 <_sk_callback_hsw+0x373>
DB 197,237,219,201 ; vpand %ymm1,%ymm2,%ymm1
DB 197,252,91,201 ; vcvtdq2ps %ymm1,%ymm1
- DB 196,226,125,24,29,10,26,0,0 ; vbroadcastss 0x1a0a(%rip),%ymm3 # 4168 <_sk_callback_hsw+0x377>
+ DB 196,226,125,24,29,10,26,0,0 ; vbroadcastss 0x1a0a(%rip),%ymm3 # 4164 <_sk_callback_hsw+0x377>
DB 197,244,89,203 ; vmulps %ymm3,%ymm1,%ymm1
- DB 196,226,125,88,29,1,26,0,0 ; vpbroadcastd 0x1a01(%rip),%ymm3 # 416c <_sk_callback_hsw+0x37b>
+ DB 196,226,125,88,29,1,26,0,0 ; vpbroadcastd 0x1a01(%rip),%ymm3 # 4168 <_sk_callback_hsw+0x37b>
DB 197,237,219,211 ; vpand %ymm3,%ymm2,%ymm2
DB 197,252,91,210 ; vcvtdq2ps %ymm2,%ymm2
- DB 196,226,125,24,29,244,25,0,0 ; vbroadcastss 0x19f4(%rip),%ymm3 # 4170 <_sk_callback_hsw+0x37f>
+ DB 196,226,125,24,29,244,25,0,0 ; vbroadcastss 0x19f4(%rip),%ymm3 # 416c <_sk_callback_hsw+0x37f>
DB 197,236,89,211 ; vmulps %ymm3,%ymm2,%ymm2
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,29,233,25,0,0 ; vbroadcastss 0x19e9(%rip),%ymm3 # 4174 <_sk_callback_hsw+0x383>
+ DB 196,226,125,24,29,233,25,0,0 ; vbroadcastss 0x19e9(%rip),%ymm3 # 4170 <_sk_callback_hsw+0x383>
DB 91 ; pop %rbx
DB 65,92 ; pop %r12
DB 65,94 ; pop %r14
@@ -2431,11 +2430,11 @@ PUBLIC _sk_store_565_hsw
_sk_store_565_hsw LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 76,139,16 ; mov (%rax),%r10
- DB 196,98,125,24,5,214,25,0,0 ; vbroadcastss 0x19d6(%rip),%ymm8 # 4178 <_sk_callback_hsw+0x387>
+ DB 196,98,125,24,5,214,25,0,0 ; vbroadcastss 0x19d6(%rip),%ymm8 # 4174 <_sk_callback_hsw+0x387>
DB 196,65,124,89,200 ; vmulps %ymm8,%ymm0,%ymm9
DB 196,65,125,91,201 ; vcvtps2dq %ymm9,%ymm9
DB 196,193,53,114,241,11 ; vpslld $0xb,%ymm9,%ymm9
- DB 196,98,125,24,21,193,25,0,0 ; vbroadcastss 0x19c1(%rip),%ymm10 # 417c <_sk_callback_hsw+0x38b>
+ DB 196,98,125,24,21,193,25,0,0 ; vbroadcastss 0x19c1(%rip),%ymm10 # 4178 <_sk_callback_hsw+0x38b>
DB 196,65,116,89,210 ; vmulps %ymm10,%ymm1,%ymm10
DB 196,65,125,91,210 ; vcvtps2dq %ymm10,%ymm10
DB 196,193,45,114,242,5 ; vpslld $0x5,%ymm10,%ymm10
@@ -2446,7 +2445,7 @@ _sk_store_565_hsw LABEL PROC
DB 196,67,125,57,193,1 ; vextracti128 $0x1,%ymm8,%xmm9
DB 196,66,57,43,193 ; vpackusdw %xmm9,%xmm8,%xmm8
DB 72,133,201 ; test %rcx,%rcx
- DB 117,10 ; jne 27f9 <_sk_store_565_hsw+0x65>
+ DB 117,10 ; jne 27f5 <_sk_store_565_hsw+0x65>
DB 196,65,122,127,4,122 ; vmovdqu %xmm8,(%r10,%rdi,2)
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
@@ -2454,9 +2453,9 @@ _sk_store_565_hsw LABEL PROC
DB 65,128,224,7 ; and $0x7,%r8b
DB 65,254,200 ; dec %r8b
DB 65,128,248,6 ; cmp $0x6,%r8b
- DB 119,236 ; ja 27f5 <_sk_store_565_hsw+0x61>
+ DB 119,236 ; ja 27f1 <_sk_store_565_hsw+0x61>
DB 69,15,182,192 ; movzbl %r8b,%r8d
- DB 76,141,13,68,0,0,0 ; lea 0x44(%rip),%r9 # 2858 <_sk_store_565_hsw+0xc4>
+ DB 76,141,13,68,0,0,0 ; lea 0x44(%rip),%r9 # 2854 <_sk_store_565_hsw+0xc4>
DB 75,99,4,129 ; movslq (%r9,%r8,4),%rax
DB 76,1,200 ; add %r9,%rax
DB 255,224 ; jmpq *%rax
@@ -2467,7 +2466,7 @@ _sk_store_565_hsw LABEL PROC
DB 196,67,121,21,68,122,4,2 ; vpextrw $0x2,%xmm8,0x4(%r10,%rdi,2)
DB 196,67,121,21,68,122,2,1 ; vpextrw $0x1,%xmm8,0x2(%r10,%rdi,2)
DB 196,67,121,21,4,122,0 ; vpextrw $0x0,%xmm8,(%r10,%rdi,2)
- DB 235,159 ; jmp 27f5 <_sk_store_565_hsw+0x61>
+ DB 235,159 ; jmp 27f1 <_sk_store_565_hsw+0x61>
DB 102,144 ; xchg %ax,%ax
DB 245 ; cmc
DB 255 ; (bad)
@@ -2498,28 +2497,28 @@ _sk_load_4444_hsw LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 76,139,16 ; mov (%rax),%r10
DB 72,133,201 ; test %rcx,%rcx
- DB 15,133,138,0,0,0 ; jne 290c <_sk_load_4444_hsw+0x98>
+ DB 15,133,138,0,0,0 ; jne 2908 <_sk_load_4444_hsw+0x98>
DB 196,193,122,111,4,122 ; vmovdqu (%r10,%rdi,2),%xmm0
DB 196,226,125,51,216 ; vpmovzxwd %xmm0,%ymm3
- DB 196,226,125,88,5,234,24,0,0 ; vpbroadcastd 0x18ea(%rip),%ymm0 # 4180 <_sk_callback_hsw+0x38f>
+ DB 196,226,125,88,5,234,24,0,0 ; vpbroadcastd 0x18ea(%rip),%ymm0 # 417c <_sk_callback_hsw+0x38f>
DB 197,229,219,192 ; vpand %ymm0,%ymm3,%ymm0
DB 197,252,91,192 ; vcvtdq2ps %ymm0,%ymm0
- DB 196,226,125,24,13,221,24,0,0 ; vbroadcastss 0x18dd(%rip),%ymm1 # 4184 <_sk_callback_hsw+0x393>
+ DB 196,226,125,24,13,221,24,0,0 ; vbroadcastss 0x18dd(%rip),%ymm1 # 4180 <_sk_callback_hsw+0x393>
DB 197,252,89,193 ; vmulps %ymm1,%ymm0,%ymm0
- DB 196,226,125,88,13,212,24,0,0 ; vpbroadcastd 0x18d4(%rip),%ymm1 # 4188 <_sk_callback_hsw+0x397>
+ DB 196,226,125,88,13,212,24,0,0 ; vpbroadcastd 0x18d4(%rip),%ymm1 # 4184 <_sk_callback_hsw+0x397>
DB 197,229,219,201 ; vpand %ymm1,%ymm3,%ymm1
DB 197,252,91,201 ; vcvtdq2ps %ymm1,%ymm1
- DB 196,226,125,24,21,199,24,0,0 ; vbroadcastss 0x18c7(%rip),%ymm2 # 418c <_sk_callback_hsw+0x39b>
+ DB 196,226,125,24,21,199,24,0,0 ; vbroadcastss 0x18c7(%rip),%ymm2 # 4188 <_sk_callback_hsw+0x39b>
DB 197,244,89,202 ; vmulps %ymm2,%ymm1,%ymm1
- DB 196,226,125,88,21,190,24,0,0 ; vpbroadcastd 0x18be(%rip),%ymm2 # 4190 <_sk_callback_hsw+0x39f>
+ DB 196,226,125,88,21,190,24,0,0 ; vpbroadcastd 0x18be(%rip),%ymm2 # 418c <_sk_callback_hsw+0x39f>
DB 197,229,219,210 ; vpand %ymm2,%ymm3,%ymm2
DB 197,252,91,210 ; vcvtdq2ps %ymm2,%ymm2
- DB 196,98,125,24,5,177,24,0,0 ; vbroadcastss 0x18b1(%rip),%ymm8 # 4194 <_sk_callback_hsw+0x3a3>
+ DB 196,98,125,24,5,177,24,0,0 ; vbroadcastss 0x18b1(%rip),%ymm8 # 4190 <_sk_callback_hsw+0x3a3>
DB 196,193,108,89,208 ; vmulps %ymm8,%ymm2,%ymm2
- DB 196,98,125,88,5,167,24,0,0 ; vpbroadcastd 0x18a7(%rip),%ymm8 # 4198 <_sk_callback_hsw+0x3a7>
+ DB 196,98,125,88,5,167,24,0,0 ; vpbroadcastd 0x18a7(%rip),%ymm8 # 4194 <_sk_callback_hsw+0x3a7>
DB 196,193,101,219,216 ; vpand %ymm8,%ymm3,%ymm3
DB 197,252,91,219 ; vcvtdq2ps %ymm3,%ymm3
- DB 196,98,125,24,5,153,24,0,0 ; vbroadcastss 0x1899(%rip),%ymm8 # 419c <_sk_callback_hsw+0x3ab>
+ DB 196,98,125,24,5,153,24,0,0 ; vbroadcastss 0x1899(%rip),%ymm8 # 4198 <_sk_callback_hsw+0x3ab>
DB 196,193,100,89,216 ; vmulps %ymm8,%ymm3,%ymm3
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
@@ -2528,9 +2527,9 @@ _sk_load_4444_hsw LABEL PROC
DB 197,249,239,192 ; vpxor %xmm0,%xmm0,%xmm0
DB 65,254,200 ; dec %r8b
DB 65,128,248,6 ; cmp $0x6,%r8b
- DB 15,135,100,255,255,255 ; ja 2888 <_sk_load_4444_hsw+0x14>
+ DB 15,135,100,255,255,255 ; ja 2884 <_sk_load_4444_hsw+0x14>
DB 69,15,182,192 ; movzbl %r8b,%r8d
- DB 76,141,13,73,0,0,0 ; lea 0x49(%rip),%r9 # 2978 <_sk_load_4444_hsw+0x104>
+ DB 76,141,13,73,0,0,0 ; lea 0x49(%rip),%r9 # 2974 <_sk_load_4444_hsw+0x104>
DB 75,99,4,129 ; movslq (%r9,%r8,4),%rax
DB 76,1,200 ; add %r9,%rax
DB 255,224 ; jmpq *%rax
@@ -2542,7 +2541,7 @@ _sk_load_4444_hsw LABEL PROC
DB 196,193,121,196,68,122,4,2 ; vpinsrw $0x2,0x4(%r10,%rdi,2),%xmm0,%xmm0
DB 196,193,121,196,68,122,2,1 ; vpinsrw $0x1,0x2(%r10,%rdi,2),%xmm0,%xmm0
DB 196,193,121,196,4,122,0 ; vpinsrw $0x0,(%r10,%rdi,2),%xmm0,%xmm0
- DB 233,16,255,255,255 ; jmpq 2888 <_sk_load_4444_hsw+0x14>
+ DB 233,16,255,255,255 ; jmpq 2884 <_sk_load_4444_hsw+0x14>
DB 244 ; hlt
DB 255 ; (bad)
DB 255 ; (bad)
@@ -2610,25 +2609,25 @@ _sk_gather_4444_hsw LABEL PROC
DB 65,15,183,4,88 ; movzwl (%r8,%rbx,2),%eax
DB 197,249,196,192,7 ; vpinsrw $0x7,%eax,%xmm0,%xmm0
DB 196,226,125,51,216 ; vpmovzxwd %xmm0,%ymm3
- DB 196,226,125,88,5,81,23,0,0 ; vpbroadcastd 0x1751(%rip),%ymm0 # 41a0 <_sk_callback_hsw+0x3af>
+ DB 196,226,125,88,5,81,23,0,0 ; vpbroadcastd 0x1751(%rip),%ymm0 # 419c <_sk_callback_hsw+0x3af>
DB 197,229,219,192 ; vpand %ymm0,%ymm3,%ymm0
DB 197,252,91,192 ; vcvtdq2ps %ymm0,%ymm0
- DB 196,226,125,24,13,68,23,0,0 ; vbroadcastss 0x1744(%rip),%ymm1 # 41a4 <_sk_callback_hsw+0x3b3>
+ DB 196,226,125,24,13,68,23,0,0 ; vbroadcastss 0x1744(%rip),%ymm1 # 41a0 <_sk_callback_hsw+0x3b3>
DB 197,252,89,193 ; vmulps %ymm1,%ymm0,%ymm0
- DB 196,226,125,88,13,59,23,0,0 ; vpbroadcastd 0x173b(%rip),%ymm1 # 41a8 <_sk_callback_hsw+0x3b7>
+ DB 196,226,125,88,13,59,23,0,0 ; vpbroadcastd 0x173b(%rip),%ymm1 # 41a4 <_sk_callback_hsw+0x3b7>
DB 197,229,219,201 ; vpand %ymm1,%ymm3,%ymm1
DB 197,252,91,201 ; vcvtdq2ps %ymm1,%ymm1
- DB 196,226,125,24,21,46,23,0,0 ; vbroadcastss 0x172e(%rip),%ymm2 # 41ac <_sk_callback_hsw+0x3bb>
+ DB 196,226,125,24,21,46,23,0,0 ; vbroadcastss 0x172e(%rip),%ymm2 # 41a8 <_sk_callback_hsw+0x3bb>
DB 197,244,89,202 ; vmulps %ymm2,%ymm1,%ymm1
- DB 196,226,125,88,21,37,23,0,0 ; vpbroadcastd 0x1725(%rip),%ymm2 # 41b0 <_sk_callback_hsw+0x3bf>
+ DB 196,226,125,88,21,37,23,0,0 ; vpbroadcastd 0x1725(%rip),%ymm2 # 41ac <_sk_callback_hsw+0x3bf>
DB 197,229,219,210 ; vpand %ymm2,%ymm3,%ymm2
DB 197,252,91,210 ; vcvtdq2ps %ymm2,%ymm2
- DB 196,98,125,24,5,24,23,0,0 ; vbroadcastss 0x1718(%rip),%ymm8 # 41b4 <_sk_callback_hsw+0x3c3>
+ DB 196,98,125,24,5,24,23,0,0 ; vbroadcastss 0x1718(%rip),%ymm8 # 41b0 <_sk_callback_hsw+0x3c3>
DB 196,193,108,89,208 ; vmulps %ymm8,%ymm2,%ymm2
- DB 196,98,125,88,5,14,23,0,0 ; vpbroadcastd 0x170e(%rip),%ymm8 # 41b8 <_sk_callback_hsw+0x3c7>
+ DB 196,98,125,88,5,14,23,0,0 ; vpbroadcastd 0x170e(%rip),%ymm8 # 41b4 <_sk_callback_hsw+0x3c7>
DB 196,193,101,219,216 ; vpand %ymm8,%ymm3,%ymm3
DB 197,252,91,219 ; vcvtdq2ps %ymm3,%ymm3
- DB 196,98,125,24,5,0,23,0,0 ; vbroadcastss 0x1700(%rip),%ymm8 # 41bc <_sk_callback_hsw+0x3cb>
+ DB 196,98,125,24,5,0,23,0,0 ; vbroadcastss 0x1700(%rip),%ymm8 # 41b8 <_sk_callback_hsw+0x3cb>
DB 196,193,100,89,216 ; vmulps %ymm8,%ymm3,%ymm3
DB 72,173 ; lods %ds:(%rsi),%rax
DB 91 ; pop %rbx
@@ -2641,7 +2640,7 @@ PUBLIC _sk_store_4444_hsw
_sk_store_4444_hsw LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 76,139,16 ; mov (%rax),%r10
- DB 196,98,125,24,5,230,22,0,0 ; vbroadcastss 0x16e6(%rip),%ymm8 # 41c0 <_sk_callback_hsw+0x3cf>
+ DB 196,98,125,24,5,230,22,0,0 ; vbroadcastss 0x16e6(%rip),%ymm8 # 41bc <_sk_callback_hsw+0x3cf>
DB 196,65,124,89,200 ; vmulps %ymm8,%ymm0,%ymm9
DB 196,65,125,91,201 ; vcvtps2dq %ymm9,%ymm9
DB 196,193,53,114,241,12 ; vpslld $0xc,%ymm9,%ymm9
@@ -2659,7 +2658,7 @@ _sk_store_4444_hsw LABEL PROC
DB 196,67,125,57,193,1 ; vextracti128 $0x1,%ymm8,%xmm9
DB 196,66,57,43,193 ; vpackusdw %xmm9,%xmm8,%xmm8
DB 72,133,201 ; test %rcx,%rcx
- DB 117,10 ; jne 2b3d <_sk_store_4444_hsw+0x71>
+ DB 117,10 ; jne 2b39 <_sk_store_4444_hsw+0x71>
DB 196,65,122,127,4,122 ; vmovdqu %xmm8,(%r10,%rdi,2)
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
@@ -2667,9 +2666,9 @@ _sk_store_4444_hsw LABEL PROC
DB 65,128,224,7 ; and $0x7,%r8b
DB 65,254,200 ; dec %r8b
DB 65,128,248,6 ; cmp $0x6,%r8b
- DB 119,236 ; ja 2b39 <_sk_store_4444_hsw+0x6d>
+ DB 119,236 ; ja 2b35 <_sk_store_4444_hsw+0x6d>
DB 69,15,182,192 ; movzbl %r8b,%r8d
- DB 76,141,13,68,0,0,0 ; lea 0x44(%rip),%r9 # 2b9c <_sk_store_4444_hsw+0xd0>
+ DB 76,141,13,68,0,0,0 ; lea 0x44(%rip),%r9 # 2b98 <_sk_store_4444_hsw+0xd0>
DB 75,99,4,129 ; movslq (%r9,%r8,4),%rax
DB 76,1,200 ; add %r9,%rax
DB 255,224 ; jmpq *%rax
@@ -2680,7 +2679,7 @@ _sk_store_4444_hsw LABEL PROC
DB 196,67,121,21,68,122,4,2 ; vpextrw $0x2,%xmm8,0x4(%r10,%rdi,2)
DB 196,67,121,21,68,122,2,1 ; vpextrw $0x1,%xmm8,0x2(%r10,%rdi,2)
DB 196,67,121,21,4,122,0 ; vpextrw $0x0,%xmm8,(%r10,%rdi,2)
- DB 235,159 ; jmp 2b39 <_sk_store_4444_hsw+0x6d>
+ DB 235,159 ; jmp 2b35 <_sk_store_4444_hsw+0x6d>
DB 102,144 ; xchg %ax,%ax
DB 245 ; cmc
DB 255 ; (bad)
@@ -2713,16 +2712,16 @@ _sk_load_8888_hsw LABEL PROC
DB 76,141,12,189,0,0,0,0 ; lea 0x0(,%rdi,4),%r9
DB 76,3,8 ; add (%rax),%r9
DB 77,133,192 ; test %r8,%r8
- DB 117,88 ; jne 2c25 <_sk_load_8888_hsw+0x6d>
+ DB 117,88 ; jne 2c21 <_sk_load_8888_hsw+0x6d>
DB 196,193,126,111,25 ; vmovdqu (%r9),%ymm3
- DB 197,229,219,5,166,23,0,0 ; vpand 0x17a6(%rip),%ymm3,%ymm0 # 4380 <_sk_callback_hsw+0x58f>
+ DB 197,229,219,5,170,23,0,0 ; vpand 0x17aa(%rip),%ymm3,%ymm0 # 4380 <_sk_callback_hsw+0x593>
DB 197,252,91,192 ; vcvtdq2ps %ymm0,%ymm0
- DB 196,98,125,24,5,221,21,0,0 ; vbroadcastss 0x15dd(%rip),%ymm8 # 41c4 <_sk_callback_hsw+0x3d3>
+ DB 196,98,125,24,5,221,21,0,0 ; vbroadcastss 0x15dd(%rip),%ymm8 # 41c0 <_sk_callback_hsw+0x3d3>
DB 196,193,124,89,192 ; vmulps %ymm8,%ymm0,%ymm0
- DB 196,226,101,0,13,171,23,0,0 ; vpshufb 0x17ab(%rip),%ymm3,%ymm1 # 43a0 <_sk_callback_hsw+0x5af>
+ DB 196,226,101,0,13,175,23,0,0 ; vpshufb 0x17af(%rip),%ymm3,%ymm1 # 43a0 <_sk_callback_hsw+0x5b3>
DB 197,252,91,201 ; vcvtdq2ps %ymm1,%ymm1
DB 196,193,116,89,200 ; vmulps %ymm8,%ymm1,%ymm1
- DB 196,226,101,0,21,185,23,0,0 ; vpshufb 0x17b9(%rip),%ymm3,%ymm2 # 43c0 <_sk_callback_hsw+0x5cf>
+ DB 196,226,101,0,21,189,23,0,0 ; vpshufb 0x17bd(%rip),%ymm3,%ymm2 # 43c0 <_sk_callback_hsw+0x5d3>
DB 197,252,91,210 ; vcvtdq2ps %ymm2,%ymm2
DB 196,193,108,89,208 ; vmulps %ymm8,%ymm2,%ymm2
DB 197,229,114,211,24 ; vpsrld $0x18,%ymm3,%ymm3
@@ -2739,7 +2738,7 @@ _sk_load_8888_hsw LABEL PROC
DB 196,225,249,110,192 ; vmovq %rax,%xmm0
DB 196,226,125,33,192 ; vpmovsxbd %xmm0,%ymm0
DB 196,194,125,140,25 ; vpmaskmovd (%r9),%ymm0,%ymm3
- DB 235,135 ; jmp 2bd2 <_sk_load_8888_hsw+0x1a>
+ DB 235,135 ; jmp 2bce <_sk_load_8888_hsw+0x1a>
PUBLIC _sk_gather_8888_hsw
_sk_gather_8888_hsw LABEL PROC
@@ -2752,14 +2751,14 @@ _sk_gather_8888_hsw LABEL PROC
DB 197,245,254,192 ; vpaddd %ymm0,%ymm1,%ymm0
DB 197,245,118,201 ; vpcmpeqd %ymm1,%ymm1,%ymm1
DB 196,194,117,144,28,128 ; vpgatherdd %ymm1,(%r8,%ymm0,4),%ymm3
- DB 197,229,219,5,103,23,0,0 ; vpand 0x1767(%rip),%ymm3,%ymm0 # 43e0 <_sk_callback_hsw+0x5ef>
+ DB 197,229,219,5,107,23,0,0 ; vpand 0x176b(%rip),%ymm3,%ymm0 # 43e0 <_sk_callback_hsw+0x5f3>
DB 197,252,91,192 ; vcvtdq2ps %ymm0,%ymm0
- DB 196,98,125,24,5,66,21,0,0 ; vbroadcastss 0x1542(%rip),%ymm8 # 41c8 <_sk_callback_hsw+0x3d7>
+ DB 196,98,125,24,5,66,21,0,0 ; vbroadcastss 0x1542(%rip),%ymm8 # 41c4 <_sk_callback_hsw+0x3d7>
DB 196,193,124,89,192 ; vmulps %ymm8,%ymm0,%ymm0
- DB 196,226,101,0,13,108,23,0,0 ; vpshufb 0x176c(%rip),%ymm3,%ymm1 # 4400 <_sk_callback_hsw+0x60f>
+ DB 196,226,101,0,13,112,23,0,0 ; vpshufb 0x1770(%rip),%ymm3,%ymm1 # 4400 <_sk_callback_hsw+0x613>
DB 197,252,91,201 ; vcvtdq2ps %ymm1,%ymm1
DB 196,193,116,89,200 ; vmulps %ymm8,%ymm1,%ymm1
- DB 196,226,101,0,21,122,23,0,0 ; vpshufb 0x177a(%rip),%ymm3,%ymm2 # 4420 <_sk_callback_hsw+0x62f>
+ DB 196,226,101,0,21,126,23,0,0 ; vpshufb 0x177e(%rip),%ymm3,%ymm2 # 4420 <_sk_callback_hsw+0x633>
DB 197,252,91,210 ; vcvtdq2ps %ymm2,%ymm2
DB 196,193,108,89,208 ; vmulps %ymm8,%ymm2,%ymm2
DB 197,229,114,211,24 ; vpsrld $0x18,%ymm3,%ymm3
@@ -2774,7 +2773,7 @@ _sk_store_8888_hsw LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 76,141,12,189,0,0,0,0 ; lea 0x0(,%rdi,4),%r9
DB 76,3,8 ; add (%rax),%r9
- DB 196,98,125,24,5,242,20,0,0 ; vbroadcastss 0x14f2(%rip),%ymm8 # 41cc <_sk_callback_hsw+0x3db>
+ DB 196,98,125,24,5,242,20,0,0 ; vbroadcastss 0x14f2(%rip),%ymm8 # 41c8 <_sk_callback_hsw+0x3db>
DB 196,65,124,89,200 ; vmulps %ymm8,%ymm0,%ymm9
DB 196,65,125,91,201 ; vcvtps2dq %ymm9,%ymm9
DB 196,65,116,89,208 ; vmulps %ymm8,%ymm1,%ymm10
@@ -2790,7 +2789,7 @@ _sk_store_8888_hsw LABEL PROC
DB 196,65,45,235,192 ; vpor %ymm8,%ymm10,%ymm8
DB 196,65,53,235,192 ; vpor %ymm8,%ymm9,%ymm8
DB 77,133,192 ; test %r8,%r8
- DB 117,12 ; jne 2d34 <_sk_store_8888_hsw+0x73>
+ DB 117,12 ; jne 2d30 <_sk_store_8888_hsw+0x73>
DB 196,65,126,127,1 ; vmovdqu %ymm8,(%r9)
DB 72,173 ; lods %ds:(%rsi),%rax
DB 76,137,193 ; mov %r8,%rcx
@@ -2803,14 +2802,14 @@ _sk_store_8888_hsw LABEL PROC
DB 196,97,249,110,200 ; vmovq %rax,%xmm9
DB 196,66,125,33,201 ; vpmovsxbd %xmm9,%ymm9
DB 196,66,53,142,1 ; vpmaskmovd %ymm8,%ymm9,(%r9)
- DB 235,211 ; jmp 2d2d <_sk_store_8888_hsw+0x6c>
+ DB 235,211 ; jmp 2d29 <_sk_store_8888_hsw+0x6c>
PUBLIC _sk_load_f16_hsw
_sk_load_f16_hsw LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 72,139,0 ; mov (%rax),%rax
DB 72,133,201 ; test %rcx,%rcx
- DB 117,97 ; jne 2dc5 <_sk_load_f16_hsw+0x6b>
+ DB 117,97 ; jne 2dc1 <_sk_load_f16_hsw+0x6b>
DB 197,121,16,4,248 ; vmovupd (%rax,%rdi,8),%xmm8
DB 197,249,16,84,248,16 ; vmovupd 0x10(%rax,%rdi,8),%xmm2
DB 197,249,16,92,248,32 ; vmovupd 0x20(%rax,%rdi,8),%xmm3
@@ -2836,29 +2835,29 @@ _sk_load_f16_hsw LABEL PROC
DB 197,123,16,4,248 ; vmovsd (%rax,%rdi,8),%xmm8
DB 196,65,49,239,201 ; vpxor %xmm9,%xmm9,%xmm9
DB 72,131,249,1 ; cmp $0x1,%rcx
- DB 116,79 ; je 2e24 <_sk_load_f16_hsw+0xca>
+ DB 116,79 ; je 2e20 <_sk_load_f16_hsw+0xca>
DB 197,57,22,68,248,8 ; vmovhpd 0x8(%rax,%rdi,8),%xmm8,%xmm8
DB 72,131,249,3 ; cmp $0x3,%rcx
- DB 114,67 ; jb 2e24 <_sk_load_f16_hsw+0xca>
+ DB 114,67 ; jb 2e20 <_sk_load_f16_hsw+0xca>
DB 197,251,16,84,248,16 ; vmovsd 0x10(%rax,%rdi,8),%xmm2
DB 72,131,249,3 ; cmp $0x3,%rcx
- DB 116,68 ; je 2e31 <_sk_load_f16_hsw+0xd7>
+ DB 116,68 ; je 2e2d <_sk_load_f16_hsw+0xd7>
DB 197,233,22,84,248,24 ; vmovhpd 0x18(%rax,%rdi,8),%xmm2,%xmm2
DB 72,131,249,5 ; cmp $0x5,%rcx
- DB 114,56 ; jb 2e31 <_sk_load_f16_hsw+0xd7>
+ DB 114,56 ; jb 2e2d <_sk_load_f16_hsw+0xd7>
DB 197,251,16,92,248,32 ; vmovsd 0x20(%rax,%rdi,8),%xmm3
DB 72,131,249,5 ; cmp $0x5,%rcx
- DB 15,132,114,255,255,255 ; je 2d7b <_sk_load_f16_hsw+0x21>
+ DB 15,132,114,255,255,255 ; je 2d77 <_sk_load_f16_hsw+0x21>
DB 197,225,22,92,248,40 ; vmovhpd 0x28(%rax,%rdi,8),%xmm3,%xmm3
DB 72,131,249,7 ; cmp $0x7,%rcx
- DB 15,130,98,255,255,255 ; jb 2d7b <_sk_load_f16_hsw+0x21>
+ DB 15,130,98,255,255,255 ; jb 2d77 <_sk_load_f16_hsw+0x21>
DB 197,122,126,76,248,48 ; vmovq 0x30(%rax,%rdi,8),%xmm9
- DB 233,87,255,255,255 ; jmpq 2d7b <_sk_load_f16_hsw+0x21>
+ DB 233,87,255,255,255 ; jmpq 2d77 <_sk_load_f16_hsw+0x21>
DB 197,225,87,219 ; vxorpd %xmm3,%xmm3,%xmm3
DB 197,233,87,210 ; vxorpd %xmm2,%xmm2,%xmm2
- DB 233,74,255,255,255 ; jmpq 2d7b <_sk_load_f16_hsw+0x21>
+ DB 233,74,255,255,255 ; jmpq 2d77 <_sk_load_f16_hsw+0x21>
DB 197,225,87,219 ; vxorpd %xmm3,%xmm3,%xmm3
- DB 233,65,255,255,255 ; jmpq 2d7b <_sk_load_f16_hsw+0x21>
+ DB 233,65,255,255,255 ; jmpq 2d77 <_sk_load_f16_hsw+0x21>
PUBLIC _sk_gather_f16_hsw
_sk_gather_f16_hsw LABEL PROC
@@ -2912,7 +2911,7 @@ _sk_store_f16_hsw LABEL PROC
DB 196,65,57,98,205 ; vpunpckldq %xmm13,%xmm8,%xmm9
DB 196,65,57,106,197 ; vpunpckhdq %xmm13,%xmm8,%xmm8
DB 72,133,201 ; test %rcx,%rcx
- DB 117,27 ; jne 2f29 <_sk_store_f16_hsw+0x65>
+ DB 117,27 ; jne 2f25 <_sk_store_f16_hsw+0x65>
DB 197,120,17,28,248 ; vmovups %xmm11,(%rax,%rdi,8)
DB 197,120,17,84,248,16 ; vmovups %xmm10,0x10(%rax,%rdi,8)
DB 197,120,17,76,248,32 ; vmovups %xmm9,0x20(%rax,%rdi,8)
@@ -2921,22 +2920,22 @@ _sk_store_f16_hsw LABEL PROC
DB 255,224 ; jmpq *%rax
DB 197,121,214,28,248 ; vmovq %xmm11,(%rax,%rdi,8)
DB 72,131,249,1 ; cmp $0x1,%rcx
- DB 116,241 ; je 2f25 <_sk_store_f16_hsw+0x61>
+ DB 116,241 ; je 2f21 <_sk_store_f16_hsw+0x61>
DB 197,121,23,92,248,8 ; vmovhpd %xmm11,0x8(%rax,%rdi,8)
DB 72,131,249,3 ; cmp $0x3,%rcx
- DB 114,229 ; jb 2f25 <_sk_store_f16_hsw+0x61>
+ DB 114,229 ; jb 2f21 <_sk_store_f16_hsw+0x61>
DB 197,121,214,84,248,16 ; vmovq %xmm10,0x10(%rax,%rdi,8)
- DB 116,221 ; je 2f25 <_sk_store_f16_hsw+0x61>
+ DB 116,221 ; je 2f21 <_sk_store_f16_hsw+0x61>
DB 197,121,23,84,248,24 ; vmovhpd %xmm10,0x18(%rax,%rdi,8)
DB 72,131,249,5 ; cmp $0x5,%rcx
- DB 114,209 ; jb 2f25 <_sk_store_f16_hsw+0x61>
+ DB 114,209 ; jb 2f21 <_sk_store_f16_hsw+0x61>
DB 197,121,214,76,248,32 ; vmovq %xmm9,0x20(%rax,%rdi,8)
- DB 116,201 ; je 2f25 <_sk_store_f16_hsw+0x61>
+ DB 116,201 ; je 2f21 <_sk_store_f16_hsw+0x61>
DB 197,121,23,76,248,40 ; vmovhpd %xmm9,0x28(%rax,%rdi,8)
DB 72,131,249,7 ; cmp $0x7,%rcx
- DB 114,189 ; jb 2f25 <_sk_store_f16_hsw+0x61>
+ DB 114,189 ; jb 2f21 <_sk_store_f16_hsw+0x61>
DB 197,121,214,68,248,48 ; vmovq %xmm8,0x30(%rax,%rdi,8)
- DB 235,181 ; jmp 2f25 <_sk_store_f16_hsw+0x61>
+ DB 235,181 ; jmp 2f21 <_sk_store_f16_hsw+0x61>
PUBLIC _sk_load_u16_be_hsw
_sk_load_u16_be_hsw LABEL PROC
@@ -2944,7 +2943,7 @@ _sk_load_u16_be_hsw LABEL PROC
DB 76,139,0 ; mov (%rax),%r8
DB 72,141,4,189,0,0,0,0 ; lea 0x0(,%rdi,4),%rax
DB 72,133,201 ; test %rcx,%rcx
- DB 15,133,204,0,0,0 ; jne 3052 <_sk_load_u16_be_hsw+0xe2>
+ DB 15,133,204,0,0,0 ; jne 304e <_sk_load_u16_be_hsw+0xe2>
DB 196,65,121,16,4,64 ; vmovupd (%r8,%rax,2),%xmm8
DB 196,193,121,16,84,64,16 ; vmovupd 0x10(%r8,%rax,2),%xmm2
DB 196,193,121,16,92,64,32 ; vmovupd 0x20(%r8,%rax,2),%xmm3
@@ -2963,7 +2962,7 @@ _sk_load_u16_be_hsw LABEL PROC
DB 197,241,235,192 ; vpor %xmm0,%xmm1,%xmm0
DB 196,226,125,51,192 ; vpmovzxwd %xmm0,%ymm0
DB 197,252,91,192 ; vcvtdq2ps %ymm0,%ymm0
- DB 196,98,125,24,21,233,17,0,0 ; vbroadcastss 0x11e9(%rip),%ymm10 # 41d0 <_sk_callback_hsw+0x3df>
+ DB 196,98,125,24,21,233,17,0,0 ; vbroadcastss 0x11e9(%rip),%ymm10 # 41cc <_sk_callback_hsw+0x3df>
DB 196,193,124,89,194 ; vmulps %ymm10,%ymm0,%ymm0
DB 197,185,109,202 ; vpunpckhqdq %xmm2,%xmm8,%xmm1
DB 197,233,113,241,8 ; vpsllw $0x8,%xmm1,%xmm2
@@ -2991,29 +2990,29 @@ _sk_load_u16_be_hsw LABEL PROC
DB 196,65,123,16,4,64 ; vmovsd (%r8,%rax,2),%xmm8
DB 196,65,49,239,201 ; vpxor %xmm9,%xmm9,%xmm9
DB 72,131,249,1 ; cmp $0x1,%rcx
- DB 116,85 ; je 30b8 <_sk_load_u16_be_hsw+0x148>
+ DB 116,85 ; je 30b4 <_sk_load_u16_be_hsw+0x148>
DB 196,65,57,22,68,64,8 ; vmovhpd 0x8(%r8,%rax,2),%xmm8,%xmm8
DB 72,131,249,3 ; cmp $0x3,%rcx
- DB 114,72 ; jb 30b8 <_sk_load_u16_be_hsw+0x148>
+ DB 114,72 ; jb 30b4 <_sk_load_u16_be_hsw+0x148>
DB 196,193,123,16,84,64,16 ; vmovsd 0x10(%r8,%rax,2),%xmm2
DB 72,131,249,3 ; cmp $0x3,%rcx
- DB 116,72 ; je 30c5 <_sk_load_u16_be_hsw+0x155>
+ DB 116,72 ; je 30c1 <_sk_load_u16_be_hsw+0x155>
DB 196,193,105,22,84,64,24 ; vmovhpd 0x18(%r8,%rax,2),%xmm2,%xmm2
DB 72,131,249,5 ; cmp $0x5,%rcx
- DB 114,59 ; jb 30c5 <_sk_load_u16_be_hsw+0x155>
+ DB 114,59 ; jb 30c1 <_sk_load_u16_be_hsw+0x155>
DB 196,193,123,16,92,64,32 ; vmovsd 0x20(%r8,%rax,2),%xmm3
DB 72,131,249,5 ; cmp $0x5,%rcx
- DB 15,132,6,255,255,255 ; je 2fa1 <_sk_load_u16_be_hsw+0x31>
+ DB 15,132,6,255,255,255 ; je 2f9d <_sk_load_u16_be_hsw+0x31>
DB 196,193,97,22,92,64,40 ; vmovhpd 0x28(%r8,%rax,2),%xmm3,%xmm3
DB 72,131,249,7 ; cmp $0x7,%rcx
- DB 15,130,245,254,255,255 ; jb 2fa1 <_sk_load_u16_be_hsw+0x31>
+ DB 15,130,245,254,255,255 ; jb 2f9d <_sk_load_u16_be_hsw+0x31>
DB 196,65,122,126,76,64,48 ; vmovq 0x30(%r8,%rax,2),%xmm9
- DB 233,233,254,255,255 ; jmpq 2fa1 <_sk_load_u16_be_hsw+0x31>
+ DB 233,233,254,255,255 ; jmpq 2f9d <_sk_load_u16_be_hsw+0x31>
DB 197,225,87,219 ; vxorpd %xmm3,%xmm3,%xmm3
DB 197,233,87,210 ; vxorpd %xmm2,%xmm2,%xmm2
- DB 233,220,254,255,255 ; jmpq 2fa1 <_sk_load_u16_be_hsw+0x31>
+ DB 233,220,254,255,255 ; jmpq 2f9d <_sk_load_u16_be_hsw+0x31>
DB 197,225,87,219 ; vxorpd %xmm3,%xmm3,%xmm3
- DB 233,211,254,255,255 ; jmpq 2fa1 <_sk_load_u16_be_hsw+0x31>
+ DB 233,211,254,255,255 ; jmpq 2f9d <_sk_load_u16_be_hsw+0x31>
PUBLIC _sk_load_rgb_u16_be_hsw
_sk_load_rgb_u16_be_hsw LABEL PROC
@@ -3021,7 +3020,7 @@ _sk_load_rgb_u16_be_hsw LABEL PROC
DB 76,139,0 ; mov (%rax),%r8
DB 72,141,4,127 ; lea (%rdi,%rdi,2),%rax
DB 72,133,201 ; test %rcx,%rcx
- DB 15,133,204,0,0,0 ; jne 31ac <_sk_load_rgb_u16_be_hsw+0xde>
+ DB 15,133,204,0,0,0 ; jne 31a8 <_sk_load_rgb_u16_be_hsw+0xde>
DB 196,193,122,111,4,64 ; vmovdqu (%r8,%rax,2),%xmm0
DB 196,193,122,111,84,64,12 ; vmovdqu 0xc(%r8,%rax,2),%xmm2
DB 196,193,122,111,76,64,24 ; vmovdqu 0x18(%r8,%rax,2),%xmm1
@@ -3045,7 +3044,7 @@ _sk_load_rgb_u16_be_hsw LABEL PROC
DB 197,241,235,192 ; vpor %xmm0,%xmm1,%xmm0
DB 196,226,125,51,192 ; vpmovzxwd %xmm0,%ymm0
DB 197,252,91,192 ; vcvtdq2ps %ymm0,%ymm0
- DB 196,98,125,24,21,122,16,0,0 ; vbroadcastss 0x107a(%rip),%ymm10 # 41d4 <_sk_callback_hsw+0x3e3>
+ DB 196,98,125,24,21,122,16,0,0 ; vbroadcastss 0x107a(%rip),%ymm10 # 41d0 <_sk_callback_hsw+0x3e3>
DB 196,193,124,89,194 ; vmulps %ymm10,%ymm0,%ymm0
DB 197,185,109,202 ; vpunpckhqdq %xmm2,%xmm8,%xmm1
DB 197,233,113,241,8 ; vpsllw $0x8,%xmm1,%xmm2
@@ -3062,48 +3061,48 @@ _sk_load_rgb_u16_be_hsw LABEL PROC
DB 197,252,91,210 ; vcvtdq2ps %ymm2,%ymm2
DB 196,193,108,89,210 ; vmulps %ymm10,%ymm2,%ymm2
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,29,46,16,0,0 ; vbroadcastss 0x102e(%rip),%ymm3 # 41d8 <_sk_callback_hsw+0x3e7>
+ DB 196,226,125,24,29,46,16,0,0 ; vbroadcastss 0x102e(%rip),%ymm3 # 41d4 <_sk_callback_hsw+0x3e7>
DB 255,224 ; jmpq *%rax
DB 196,193,121,110,4,64 ; vmovd (%r8,%rax,2),%xmm0
DB 196,193,121,196,68,64,4,2 ; vpinsrw $0x2,0x4(%r8,%rax,2),%xmm0,%xmm0
DB 72,131,249,1 ; cmp $0x1,%rcx
- DB 117,5 ; jne 31c5 <_sk_load_rgb_u16_be_hsw+0xf7>
- DB 233,79,255,255,255 ; jmpq 3114 <_sk_load_rgb_u16_be_hsw+0x46>
+ DB 117,5 ; jne 31c1 <_sk_load_rgb_u16_be_hsw+0xf7>
+ DB 233,79,255,255,255 ; jmpq 3110 <_sk_load_rgb_u16_be_hsw+0x46>
DB 196,193,121,110,76,64,6 ; vmovd 0x6(%r8,%rax,2),%xmm1
DB 196,65,113,196,68,64,10,2 ; vpinsrw $0x2,0xa(%r8,%rax,2),%xmm1,%xmm8
DB 72,131,249,3 ; cmp $0x3,%rcx
- DB 114,26 ; jb 31f4 <_sk_load_rgb_u16_be_hsw+0x126>
+ DB 114,26 ; jb 31f0 <_sk_load_rgb_u16_be_hsw+0x126>
DB 196,193,121,110,76,64,12 ; vmovd 0xc(%r8,%rax,2),%xmm1
DB 196,193,113,196,84,64,16,2 ; vpinsrw $0x2,0x10(%r8,%rax,2),%xmm1,%xmm2
DB 72,131,249,3 ; cmp $0x3,%rcx
- DB 117,10 ; jne 31f9 <_sk_load_rgb_u16_be_hsw+0x12b>
- DB 233,32,255,255,255 ; jmpq 3114 <_sk_load_rgb_u16_be_hsw+0x46>
- DB 233,27,255,255,255 ; jmpq 3114 <_sk_load_rgb_u16_be_hsw+0x46>
+ DB 117,10 ; jne 31f5 <_sk_load_rgb_u16_be_hsw+0x12b>
+ DB 233,32,255,255,255 ; jmpq 3110 <_sk_load_rgb_u16_be_hsw+0x46>
+ DB 233,27,255,255,255 ; jmpq 3110 <_sk_load_rgb_u16_be_hsw+0x46>
DB 196,193,121,110,76,64,18 ; vmovd 0x12(%r8,%rax,2),%xmm1
DB 196,65,113,196,76,64,22,2 ; vpinsrw $0x2,0x16(%r8,%rax,2),%xmm1,%xmm9
DB 72,131,249,5 ; cmp $0x5,%rcx
- DB 114,26 ; jb 3228 <_sk_load_rgb_u16_be_hsw+0x15a>
+ DB 114,26 ; jb 3224 <_sk_load_rgb_u16_be_hsw+0x15a>
DB 196,193,121,110,76,64,24 ; vmovd 0x18(%r8,%rax,2),%xmm1
DB 196,193,113,196,76,64,28,2 ; vpinsrw $0x2,0x1c(%r8,%rax,2),%xmm1,%xmm1
DB 72,131,249,5 ; cmp $0x5,%rcx
- DB 117,10 ; jne 322d <_sk_load_rgb_u16_be_hsw+0x15f>
- DB 233,236,254,255,255 ; jmpq 3114 <_sk_load_rgb_u16_be_hsw+0x46>
- DB 233,231,254,255,255 ; jmpq 3114 <_sk_load_rgb_u16_be_hsw+0x46>
+ DB 117,10 ; jne 3229 <_sk_load_rgb_u16_be_hsw+0x15f>
+ DB 233,236,254,255,255 ; jmpq 3110 <_sk_load_rgb_u16_be_hsw+0x46>
+ DB 233,231,254,255,255 ; jmpq 3110 <_sk_load_rgb_u16_be_hsw+0x46>
DB 196,193,121,110,92,64,30 ; vmovd 0x1e(%r8,%rax,2),%xmm3
DB 196,65,97,196,92,64,34,2 ; vpinsrw $0x2,0x22(%r8,%rax,2),%xmm3,%xmm11
DB 72,131,249,7 ; cmp $0x7,%rcx
- DB 114,20 ; jb 3256 <_sk_load_rgb_u16_be_hsw+0x188>
+ DB 114,20 ; jb 3252 <_sk_load_rgb_u16_be_hsw+0x188>
DB 196,193,121,110,92,64,36 ; vmovd 0x24(%r8,%rax,2),%xmm3
DB 196,193,97,196,92,64,40,2 ; vpinsrw $0x2,0x28(%r8,%rax,2),%xmm3,%xmm3
- DB 233,190,254,255,255 ; jmpq 3114 <_sk_load_rgb_u16_be_hsw+0x46>
- DB 233,185,254,255,255 ; jmpq 3114 <_sk_load_rgb_u16_be_hsw+0x46>
+ DB 233,190,254,255,255 ; jmpq 3110 <_sk_load_rgb_u16_be_hsw+0x46>
+ DB 233,185,254,255,255 ; jmpq 3110 <_sk_load_rgb_u16_be_hsw+0x46>
PUBLIC _sk_store_u16_be_hsw
_sk_store_u16_be_hsw LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 76,139,0 ; mov (%rax),%r8
DB 72,141,4,189,0,0,0,0 ; lea 0x0(,%rdi,4),%rax
- DB 196,98,125,24,5,107,15,0,0 ; vbroadcastss 0xf6b(%rip),%ymm8 # 41dc <_sk_callback_hsw+0x3eb>
+ DB 196,98,125,24,5,107,15,0,0 ; vbroadcastss 0xf6b(%rip),%ymm8 # 41d8 <_sk_callback_hsw+0x3eb>
DB 196,65,124,89,200 ; vmulps %ymm8,%ymm0,%ymm9
DB 196,65,125,91,201 ; vcvtps2dq %ymm9,%ymm9
DB 196,67,125,25,202,1 ; vextractf128 $0x1,%ymm9,%xmm10
@@ -3141,7 +3140,7 @@ _sk_store_u16_be_hsw LABEL PROC
DB 196,65,17,98,200 ; vpunpckldq %xmm8,%xmm13,%xmm9
DB 196,65,17,106,192 ; vpunpckhdq %xmm8,%xmm13,%xmm8
DB 72,133,201 ; test %rcx,%rcx
- DB 117,31 ; jne 3355 <_sk_store_u16_be_hsw+0xfa>
+ DB 117,31 ; jne 3351 <_sk_store_u16_be_hsw+0xfa>
DB 196,65,120,17,28,64 ; vmovups %xmm11,(%r8,%rax,2)
DB 196,65,120,17,84,64,16 ; vmovups %xmm10,0x10(%r8,%rax,2)
DB 196,65,120,17,76,64,32 ; vmovups %xmm9,0x20(%r8,%rax,2)
@@ -3150,31 +3149,31 @@ _sk_store_u16_be_hsw LABEL PROC
DB 255,224 ; jmpq *%rax
DB 196,65,121,214,28,64 ; vmovq %xmm11,(%r8,%rax,2)
DB 72,131,249,1 ; cmp $0x1,%rcx
- DB 116,240 ; je 3351 <_sk_store_u16_be_hsw+0xf6>
+ DB 116,240 ; je 334d <_sk_store_u16_be_hsw+0xf6>
DB 196,65,121,23,92,64,8 ; vmovhpd %xmm11,0x8(%r8,%rax,2)
DB 72,131,249,3 ; cmp $0x3,%rcx
- DB 114,227 ; jb 3351 <_sk_store_u16_be_hsw+0xf6>
+ DB 114,227 ; jb 334d <_sk_store_u16_be_hsw+0xf6>
DB 196,65,121,214,84,64,16 ; vmovq %xmm10,0x10(%r8,%rax,2)
- DB 116,218 ; je 3351 <_sk_store_u16_be_hsw+0xf6>
+ DB 116,218 ; je 334d <_sk_store_u16_be_hsw+0xf6>
DB 196,65,121,23,84,64,24 ; vmovhpd %xmm10,0x18(%r8,%rax,2)
DB 72,131,249,5 ; cmp $0x5,%rcx
- DB 114,205 ; jb 3351 <_sk_store_u16_be_hsw+0xf6>
+ DB 114,205 ; jb 334d <_sk_store_u16_be_hsw+0xf6>
DB 196,65,121,214,76,64,32 ; vmovq %xmm9,0x20(%r8,%rax,2)
- DB 116,196 ; je 3351 <_sk_store_u16_be_hsw+0xf6>
+ DB 116,196 ; je 334d <_sk_store_u16_be_hsw+0xf6>
DB 196,65,121,23,76,64,40 ; vmovhpd %xmm9,0x28(%r8,%rax,2)
DB 72,131,249,7 ; cmp $0x7,%rcx
- DB 114,183 ; jb 3351 <_sk_store_u16_be_hsw+0xf6>
+ DB 114,183 ; jb 334d <_sk_store_u16_be_hsw+0xf6>
DB 196,65,121,214,68,64,48 ; vmovq %xmm8,0x30(%r8,%rax,2)
- DB 235,174 ; jmp 3351 <_sk_store_u16_be_hsw+0xf6>
+ DB 235,174 ; jmp 334d <_sk_store_u16_be_hsw+0xf6>
PUBLIC _sk_load_f32_hsw
_sk_load_f32_hsw LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 72,131,249,7 ; cmp $0x7,%rcx
- DB 119,110 ; ja 3419 <_sk_load_f32_hsw+0x76>
+ DB 119,110 ; ja 3415 <_sk_load_f32_hsw+0x76>
DB 76,139,0 ; mov (%rax),%r8
DB 76,141,12,189,0,0,0,0 ; lea 0x0(,%rdi,4),%r9
- DB 76,141,21,135,0,0,0 ; lea 0x87(%rip),%r10 # 3444 <_sk_load_f32_hsw+0xa1>
+ DB 76,141,21,135,0,0,0 ; lea 0x87(%rip),%r10 # 3440 <_sk_load_f32_hsw+0xa1>
DB 73,99,4,138 ; movslq (%r10,%rcx,4),%rax
DB 76,1,208 ; add %r10,%rax
DB 255,224 ; jmpq *%rax
@@ -3233,7 +3232,7 @@ _sk_store_f32_hsw LABEL PROC
DB 196,65,37,20,196 ; vunpcklpd %ymm12,%ymm11,%ymm8
DB 196,65,37,21,220 ; vunpckhpd %ymm12,%ymm11,%ymm11
DB 72,133,201 ; test %rcx,%rcx
- DB 117,55 ; jne 34d1 <_sk_store_f32_hsw+0x6d>
+ DB 117,55 ; jne 34cd <_sk_store_f32_hsw+0x6d>
DB 196,67,45,24,225,1 ; vinsertf128 $0x1,%xmm9,%ymm10,%ymm12
DB 196,67,61,24,235,1 ; vinsertf128 $0x1,%xmm11,%ymm8,%ymm13
DB 196,67,45,6,201,49 ; vperm2f128 $0x31,%ymm9,%ymm10,%ymm9
@@ -3246,22 +3245,22 @@ _sk_store_f32_hsw LABEL PROC
DB 255,224 ; jmpq *%rax
DB 196,65,121,17,20,128 ; vmovupd %xmm10,(%r8,%rax,4)
DB 72,131,249,1 ; cmp $0x1,%rcx
- DB 116,240 ; je 34cd <_sk_store_f32_hsw+0x69>
+ DB 116,240 ; je 34c9 <_sk_store_f32_hsw+0x69>
DB 196,65,121,17,76,128,16 ; vmovupd %xmm9,0x10(%r8,%rax,4)
DB 72,131,249,3 ; cmp $0x3,%rcx
- DB 114,227 ; jb 34cd <_sk_store_f32_hsw+0x69>
+ DB 114,227 ; jb 34c9 <_sk_store_f32_hsw+0x69>
DB 196,65,121,17,68,128,32 ; vmovupd %xmm8,0x20(%r8,%rax,4)
- DB 116,218 ; je 34cd <_sk_store_f32_hsw+0x69>
+ DB 116,218 ; je 34c9 <_sk_store_f32_hsw+0x69>
DB 196,65,121,17,92,128,48 ; vmovupd %xmm11,0x30(%r8,%rax,4)
DB 72,131,249,5 ; cmp $0x5,%rcx
- DB 114,205 ; jb 34cd <_sk_store_f32_hsw+0x69>
+ DB 114,205 ; jb 34c9 <_sk_store_f32_hsw+0x69>
DB 196,67,125,25,84,128,64,1 ; vextractf128 $0x1,%ymm10,0x40(%r8,%rax,4)
- DB 116,195 ; je 34cd <_sk_store_f32_hsw+0x69>
+ DB 116,195 ; je 34c9 <_sk_store_f32_hsw+0x69>
DB 196,67,125,25,76,128,80,1 ; vextractf128 $0x1,%ymm9,0x50(%r8,%rax,4)
DB 72,131,249,7 ; cmp $0x7,%rcx
- DB 114,181 ; jb 34cd <_sk_store_f32_hsw+0x69>
+ DB 114,181 ; jb 34c9 <_sk_store_f32_hsw+0x69>
DB 196,67,125,25,68,128,96,1 ; vextractf128 $0x1,%ymm8,0x60(%r8,%rax,4)
- DB 235,171 ; jmp 34cd <_sk_store_f32_hsw+0x69>
+ DB 235,171 ; jmp 34c9 <_sk_store_f32_hsw+0x69>
PUBLIC _sk_clamp_x_hsw
_sk_clamp_x_hsw LABEL PROC
@@ -3357,11 +3356,11 @@ _sk_mirror_y_hsw LABEL PROC
PUBLIC _sk_luminance_to_alpha_hsw
_sk_luminance_to_alpha_hsw LABEL PROC
- DB 196,226,125,24,29,133,11,0,0 ; vbroadcastss 0xb85(%rip),%ymm3 # 41e0 <_sk_callback_hsw+0x3ef>
- DB 196,98,125,24,5,128,11,0,0 ; vbroadcastss 0xb80(%rip),%ymm8 # 41e4 <_sk_callback_hsw+0x3f3>
+ DB 196,226,125,24,29,133,11,0,0 ; vbroadcastss 0xb85(%rip),%ymm3 # 41dc <_sk_callback_hsw+0x3ef>
+ DB 196,98,125,24,5,128,11,0,0 ; vbroadcastss 0xb80(%rip),%ymm8 # 41e0 <_sk_callback_hsw+0x3f3>
DB 196,193,116,89,200 ; vmulps %ymm8,%ymm1,%ymm1
DB 196,226,125,184,203 ; vfmadd231ps %ymm3,%ymm0,%ymm1
- DB 196,226,125,24,29,113,11,0,0 ; vbroadcastss 0xb71(%rip),%ymm3 # 41e8 <_sk_callback_hsw+0x3f7>
+ DB 196,226,125,24,29,113,11,0,0 ; vbroadcastss 0xb71(%rip),%ymm3 # 41e4 <_sk_callback_hsw+0x3f7>
DB 196,226,109,168,217 ; vfmadd213ps %ymm1,%ymm2,%ymm3
DB 72,173 ; lods %ds:(%rsi),%rax
DB 197,252,87,192 ; vxorps %ymm0,%ymm0,%ymm0
@@ -3496,7 +3495,7 @@ _sk_linear_gradient_hsw LABEL PROC
DB 196,98,125,24,72,28 ; vbroadcastss 0x1c(%rax),%ymm9
DB 76,139,0 ; mov (%rax),%r8
DB 77,133,192 ; test %r8,%r8
- DB 15,132,143,0,0,0 ; je 394f <_sk_linear_gradient_hsw+0xb5>
+ DB 15,132,143,0,0,0 ; je 394b <_sk_linear_gradient_hsw+0xb5>
DB 72,139,64,8 ; mov 0x8(%rax),%rax
DB 72,131,192,32 ; add $0x20,%rax
DB 196,65,28,87,228 ; vxorps %ymm12,%ymm12,%ymm12
@@ -3523,8 +3522,8 @@ _sk_linear_gradient_hsw LABEL PROC
DB 196,67,13,74,201,208 ; vblendvps %ymm13,%ymm9,%ymm14,%ymm9
DB 72,131,192,36 ; add $0x24,%rax
DB 73,255,200 ; dec %r8
- DB 117,140 ; jne 38d9 <_sk_linear_gradient_hsw+0x3f>
- DB 235,17 ; jmp 3960 <_sk_linear_gradient_hsw+0xc6>
+ DB 117,140 ; jne 38d5 <_sk_linear_gradient_hsw+0x3f>
+ DB 235,17 ; jmp 395c <_sk_linear_gradient_hsw+0xc6>
DB 197,244,87,201 ; vxorps %ymm1,%ymm1,%ymm1
DB 197,236,87,210 ; vxorps %ymm2,%ymm2,%ymm2
DB 197,228,87,219 ; vxorps %ymm3,%ymm3,%ymm3
@@ -3567,24 +3566,24 @@ _sk_xy_to_polar_unit_hsw LABEL PROC
DB 196,65,52,95,226 ; vmaxps %ymm10,%ymm9,%ymm12
DB 196,65,36,94,220 ; vdivps %ymm12,%ymm11,%ymm11
DB 196,65,36,89,227 ; vmulps %ymm11,%ymm11,%ymm12
- DB 196,98,125,24,45,241,7,0,0 ; vbroadcastss 0x7f1(%rip),%ymm13 # 41ec <_sk_callback_hsw+0x3fb>
- DB 196,98,125,24,53,236,7,0,0 ; vbroadcastss 0x7ec(%rip),%ymm14 # 41f0 <_sk_callback_hsw+0x3ff>
+ DB 196,98,125,24,45,241,7,0,0 ; vbroadcastss 0x7f1(%rip),%ymm13 # 41e8 <_sk_callback_hsw+0x3fb>
+ DB 196,98,125,24,53,236,7,0,0 ; vbroadcastss 0x7ec(%rip),%ymm14 # 41ec <_sk_callback_hsw+0x3ff>
DB 196,66,29,184,245 ; vfmadd231ps %ymm13,%ymm12,%ymm14
- DB 196,98,125,24,45,226,7,0,0 ; vbroadcastss 0x7e2(%rip),%ymm13 # 41f4 <_sk_callback_hsw+0x403>
+ DB 196,98,125,24,45,226,7,0,0 ; vbroadcastss 0x7e2(%rip),%ymm13 # 41f0 <_sk_callback_hsw+0x403>
DB 196,66,29,184,238 ; vfmadd231ps %ymm14,%ymm12,%ymm13
- DB 196,98,125,24,53,216,7,0,0 ; vbroadcastss 0x7d8(%rip),%ymm14 # 41f8 <_sk_callback_hsw+0x407>
+ DB 196,98,125,24,53,216,7,0,0 ; vbroadcastss 0x7d8(%rip),%ymm14 # 41f4 <_sk_callback_hsw+0x407>
DB 196,66,29,184,245 ; vfmadd231ps %ymm13,%ymm12,%ymm14
DB 196,65,36,89,222 ; vmulps %ymm14,%ymm11,%ymm11
DB 196,65,52,194,202,1 ; vcmpltps %ymm10,%ymm9,%ymm9
- DB 196,98,125,24,21,195,7,0,0 ; vbroadcastss 0x7c3(%rip),%ymm10 # 41fc <_sk_callback_hsw+0x40b>
+ DB 196,98,125,24,21,195,7,0,0 ; vbroadcastss 0x7c3(%rip),%ymm10 # 41f8 <_sk_callback_hsw+0x40b>
DB 196,65,44,92,211 ; vsubps %ymm11,%ymm10,%ymm10
DB 196,67,37,74,202,144 ; vblendvps %ymm9,%ymm10,%ymm11,%ymm9
DB 196,193,124,194,192,1 ; vcmpltps %ymm8,%ymm0,%ymm0
- DB 196,98,125,24,21,173,7,0,0 ; vbroadcastss 0x7ad(%rip),%ymm10 # 4200 <_sk_callback_hsw+0x40f>
+ DB 196,98,125,24,21,173,7,0,0 ; vbroadcastss 0x7ad(%rip),%ymm10 # 41fc <_sk_callback_hsw+0x40f>
DB 196,65,44,92,209 ; vsubps %ymm9,%ymm10,%ymm10
DB 196,195,53,74,194,0 ; vblendvps %ymm0,%ymm10,%ymm9,%ymm0
DB 196,65,116,194,200,1 ; vcmpltps %ymm8,%ymm1,%ymm9
- DB 196,98,125,24,21,151,7,0,0 ; vbroadcastss 0x797(%rip),%ymm10 # 4204 <_sk_callback_hsw+0x413>
+ DB 196,98,125,24,21,151,7,0,0 ; vbroadcastss 0x797(%rip),%ymm10 # 4200 <_sk_callback_hsw+0x413>
DB 197,44,92,208 ; vsubps %ymm0,%ymm10,%ymm10
DB 196,195,125,74,194,144 ; vblendvps %ymm9,%ymm10,%ymm0,%ymm0
DB 196,65,124,194,200,3 ; vcmpunordps %ymm8,%ymm0,%ymm9
@@ -3595,7 +3594,7 @@ _sk_xy_to_polar_unit_hsw LABEL PROC
PUBLIC _sk_save_xy_hsw
_sk_save_xy_hsw LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,98,125,24,5,118,7,0,0 ; vbroadcastss 0x776(%rip),%ymm8 # 4208 <_sk_callback_hsw+0x417>
+ DB 196,98,125,24,5,118,7,0,0 ; vbroadcastss 0x776(%rip),%ymm8 # 4204 <_sk_callback_hsw+0x417>
DB 196,65,124,88,200 ; vaddps %ymm8,%ymm0,%ymm9
DB 196,67,125,8,209,1 ; vroundps $0x1,%ymm9,%ymm10
DB 196,65,52,92,202 ; vsubps %ymm10,%ymm9,%ymm9
@@ -3625,9 +3624,9 @@ _sk_accumulate_hsw LABEL PROC
PUBLIC _sk_bilinear_nx_hsw
_sk_bilinear_nx_hsw LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,5,10,7,0,0 ; vbroadcastss 0x70a(%rip),%ymm0 # 420c <_sk_callback_hsw+0x41b>
+ DB 196,226,125,24,5,10,7,0,0 ; vbroadcastss 0x70a(%rip),%ymm0 # 4208 <_sk_callback_hsw+0x41b>
DB 197,252,88,0 ; vaddps (%rax),%ymm0,%ymm0
- DB 196,98,125,24,5,1,7,0,0 ; vbroadcastss 0x701(%rip),%ymm8 # 4210 <_sk_callback_hsw+0x41f>
+ DB 196,98,125,24,5,1,7,0,0 ; vbroadcastss 0x701(%rip),%ymm8 # 420c <_sk_callback_hsw+0x41f>
DB 197,60,92,64,64 ; vsubps 0x40(%rax),%ymm8,%ymm8
DB 197,124,17,128,128,0,0,0 ; vmovups %ymm8,0x80(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
@@ -3636,7 +3635,7 @@ _sk_bilinear_nx_hsw LABEL PROC
PUBLIC _sk_bilinear_px_hsw
_sk_bilinear_px_hsw LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,5,233,6,0,0 ; vbroadcastss 0x6e9(%rip),%ymm0 # 4214 <_sk_callback_hsw+0x423>
+ DB 196,226,125,24,5,233,6,0,0 ; vbroadcastss 0x6e9(%rip),%ymm0 # 4210 <_sk_callback_hsw+0x423>
DB 197,252,88,0 ; vaddps (%rax),%ymm0,%ymm0
DB 197,124,16,64,64 ; vmovups 0x40(%rax),%ymm8
DB 197,124,17,128,128,0,0,0 ; vmovups %ymm8,0x80(%rax)
@@ -3646,9 +3645,9 @@ _sk_bilinear_px_hsw LABEL PROC
PUBLIC _sk_bilinear_ny_hsw
_sk_bilinear_ny_hsw LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,13,205,6,0,0 ; vbroadcastss 0x6cd(%rip),%ymm1 # 4218 <_sk_callback_hsw+0x427>
+ DB 196,226,125,24,13,205,6,0,0 ; vbroadcastss 0x6cd(%rip),%ymm1 # 4214 <_sk_callback_hsw+0x427>
DB 197,244,88,72,32 ; vaddps 0x20(%rax),%ymm1,%ymm1
- DB 196,98,125,24,5,195,6,0,0 ; vbroadcastss 0x6c3(%rip),%ymm8 # 421c <_sk_callback_hsw+0x42b>
+ DB 196,98,125,24,5,195,6,0,0 ; vbroadcastss 0x6c3(%rip),%ymm8 # 4218 <_sk_callback_hsw+0x42b>
DB 197,60,92,64,96 ; vsubps 0x60(%rax),%ymm8,%ymm8
DB 197,124,17,128,160,0,0,0 ; vmovups %ymm8,0xa0(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
@@ -3657,7 +3656,7 @@ _sk_bilinear_ny_hsw LABEL PROC
PUBLIC _sk_bilinear_py_hsw
_sk_bilinear_py_hsw LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,13,171,6,0,0 ; vbroadcastss 0x6ab(%rip),%ymm1 # 4220 <_sk_callback_hsw+0x42f>
+ DB 196,226,125,24,13,171,6,0,0 ; vbroadcastss 0x6ab(%rip),%ymm1 # 421c <_sk_callback_hsw+0x42f>
DB 197,244,88,72,32 ; vaddps 0x20(%rax),%ymm1,%ymm1
DB 197,124,16,64,96 ; vmovups 0x60(%rax),%ymm8
DB 197,124,17,128,160,0,0,0 ; vmovups %ymm8,0xa0(%rax)
@@ -3667,13 +3666,13 @@ _sk_bilinear_py_hsw LABEL PROC
PUBLIC _sk_bicubic_n3x_hsw
_sk_bicubic_n3x_hsw LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,5,142,6,0,0 ; vbroadcastss 0x68e(%rip),%ymm0 # 4224 <_sk_callback_hsw+0x433>
+ DB 196,226,125,24,5,142,6,0,0 ; vbroadcastss 0x68e(%rip),%ymm0 # 4220 <_sk_callback_hsw+0x433>
DB 197,252,88,0 ; vaddps (%rax),%ymm0,%ymm0
- DB 196,98,125,24,5,133,6,0,0 ; vbroadcastss 0x685(%rip),%ymm8 # 4228 <_sk_callback_hsw+0x437>
+ DB 196,98,125,24,5,133,6,0,0 ; vbroadcastss 0x685(%rip),%ymm8 # 4224 <_sk_callback_hsw+0x437>
DB 197,60,92,64,64 ; vsubps 0x40(%rax),%ymm8,%ymm8
DB 196,65,60,89,200 ; vmulps %ymm8,%ymm8,%ymm9
- DB 196,98,125,24,21,118,6,0,0 ; vbroadcastss 0x676(%rip),%ymm10 # 422c <_sk_callback_hsw+0x43b>
- DB 196,98,125,24,29,113,6,0,0 ; vbroadcastss 0x671(%rip),%ymm11 # 4230 <_sk_callback_hsw+0x43f>
+ DB 196,98,125,24,21,118,6,0,0 ; vbroadcastss 0x676(%rip),%ymm10 # 4228 <_sk_callback_hsw+0x43b>
+ DB 196,98,125,24,29,113,6,0,0 ; vbroadcastss 0x671(%rip),%ymm11 # 422c <_sk_callback_hsw+0x43f>
DB 196,66,61,168,218 ; vfmadd213ps %ymm10,%ymm8,%ymm11
DB 196,65,36,89,193 ; vmulps %ymm9,%ymm11,%ymm8
DB 197,124,17,128,128,0,0,0 ; vmovups %ymm8,0x80(%rax)
@@ -3683,16 +3682,16 @@ _sk_bicubic_n3x_hsw LABEL PROC
PUBLIC _sk_bicubic_n1x_hsw
_sk_bicubic_n1x_hsw LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,5,84,6,0,0 ; vbroadcastss 0x654(%rip),%ymm0 # 4234 <_sk_callback_hsw+0x443>
+ DB 196,226,125,24,5,84,6,0,0 ; vbroadcastss 0x654(%rip),%ymm0 # 4230 <_sk_callback_hsw+0x443>
DB 197,252,88,0 ; vaddps (%rax),%ymm0,%ymm0
- DB 196,98,125,24,5,75,6,0,0 ; vbroadcastss 0x64b(%rip),%ymm8 # 4238 <_sk_callback_hsw+0x447>
+ DB 196,98,125,24,5,75,6,0,0 ; vbroadcastss 0x64b(%rip),%ymm8 # 4234 <_sk_callback_hsw+0x447>
DB 197,60,92,64,64 ; vsubps 0x40(%rax),%ymm8,%ymm8
- DB 196,98,125,24,13,65,6,0,0 ; vbroadcastss 0x641(%rip),%ymm9 # 423c <_sk_callback_hsw+0x44b>
- DB 196,98,125,24,21,60,6,0,0 ; vbroadcastss 0x63c(%rip),%ymm10 # 4240 <_sk_callback_hsw+0x44f>
+ DB 196,98,125,24,13,65,6,0,0 ; vbroadcastss 0x641(%rip),%ymm9 # 4238 <_sk_callback_hsw+0x44b>
+ DB 196,98,125,24,21,60,6,0,0 ; vbroadcastss 0x63c(%rip),%ymm10 # 423c <_sk_callback_hsw+0x44f>
DB 196,66,61,168,209 ; vfmadd213ps %ymm9,%ymm8,%ymm10
- DB 196,98,125,24,13,50,6,0,0 ; vbroadcastss 0x632(%rip),%ymm9 # 4244 <_sk_callback_hsw+0x453>
+ DB 196,98,125,24,13,50,6,0,0 ; vbroadcastss 0x632(%rip),%ymm9 # 4240 <_sk_callback_hsw+0x453>
DB 196,66,61,184,202 ; vfmadd231ps %ymm10,%ymm8,%ymm9
- DB 196,98,125,24,21,40,6,0,0 ; vbroadcastss 0x628(%rip),%ymm10 # 4248 <_sk_callback_hsw+0x457>
+ DB 196,98,125,24,21,40,6,0,0 ; vbroadcastss 0x628(%rip),%ymm10 # 4244 <_sk_callback_hsw+0x457>
DB 196,66,61,184,209 ; vfmadd231ps %ymm9,%ymm8,%ymm10
DB 197,124,17,144,128,0,0,0 ; vmovups %ymm10,0x80(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
@@ -3701,14 +3700,14 @@ _sk_bicubic_n1x_hsw LABEL PROC
PUBLIC _sk_bicubic_p1x_hsw
_sk_bicubic_p1x_hsw LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,98,125,24,5,16,6,0,0 ; vbroadcastss 0x610(%rip),%ymm8 # 424c <_sk_callback_hsw+0x45b>
+ DB 196,98,125,24,5,16,6,0,0 ; vbroadcastss 0x610(%rip),%ymm8 # 4248 <_sk_callback_hsw+0x45b>
DB 197,188,88,0 ; vaddps (%rax),%ymm8,%ymm0
DB 197,124,16,72,64 ; vmovups 0x40(%rax),%ymm9
- DB 196,98,125,24,21,2,6,0,0 ; vbroadcastss 0x602(%rip),%ymm10 # 4250 <_sk_callback_hsw+0x45f>
- DB 196,98,125,24,29,253,5,0,0 ; vbroadcastss 0x5fd(%rip),%ymm11 # 4254 <_sk_callback_hsw+0x463>
+ DB 196,98,125,24,21,2,6,0,0 ; vbroadcastss 0x602(%rip),%ymm10 # 424c <_sk_callback_hsw+0x45f>
+ DB 196,98,125,24,29,253,5,0,0 ; vbroadcastss 0x5fd(%rip),%ymm11 # 4250 <_sk_callback_hsw+0x463>
DB 196,66,53,168,218 ; vfmadd213ps %ymm10,%ymm9,%ymm11
DB 196,66,53,168,216 ; vfmadd213ps %ymm8,%ymm9,%ymm11
- DB 196,98,125,24,5,238,5,0,0 ; vbroadcastss 0x5ee(%rip),%ymm8 # 4258 <_sk_callback_hsw+0x467>
+ DB 196,98,125,24,5,238,5,0,0 ; vbroadcastss 0x5ee(%rip),%ymm8 # 4254 <_sk_callback_hsw+0x467>
DB 196,66,53,184,195 ; vfmadd231ps %ymm11,%ymm9,%ymm8
DB 197,124,17,128,128,0,0,0 ; vmovups %ymm8,0x80(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
@@ -3717,12 +3716,12 @@ _sk_bicubic_p1x_hsw LABEL PROC
PUBLIC _sk_bicubic_p3x_hsw
_sk_bicubic_p3x_hsw LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,5,214,5,0,0 ; vbroadcastss 0x5d6(%rip),%ymm0 # 425c <_sk_callback_hsw+0x46b>
+ DB 196,226,125,24,5,214,5,0,0 ; vbroadcastss 0x5d6(%rip),%ymm0 # 4258 <_sk_callback_hsw+0x46b>
DB 197,252,88,0 ; vaddps (%rax),%ymm0,%ymm0
DB 197,124,16,64,64 ; vmovups 0x40(%rax),%ymm8
DB 196,65,60,89,200 ; vmulps %ymm8,%ymm8,%ymm9
- DB 196,98,125,24,21,195,5,0,0 ; vbroadcastss 0x5c3(%rip),%ymm10 # 4260 <_sk_callback_hsw+0x46f>
- DB 196,98,125,24,29,190,5,0,0 ; vbroadcastss 0x5be(%rip),%ymm11 # 4264 <_sk_callback_hsw+0x473>
+ DB 196,98,125,24,21,195,5,0,0 ; vbroadcastss 0x5c3(%rip),%ymm10 # 425c <_sk_callback_hsw+0x46f>
+ DB 196,98,125,24,29,190,5,0,0 ; vbroadcastss 0x5be(%rip),%ymm11 # 4260 <_sk_callback_hsw+0x473>
DB 196,66,61,168,218 ; vfmadd213ps %ymm10,%ymm8,%ymm11
DB 196,65,52,89,195 ; vmulps %ymm11,%ymm9,%ymm8
DB 197,124,17,128,128,0,0,0 ; vmovups %ymm8,0x80(%rax)
@@ -3732,13 +3731,13 @@ _sk_bicubic_p3x_hsw LABEL PROC
PUBLIC _sk_bicubic_n3y_hsw
_sk_bicubic_n3y_hsw LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,13,161,5,0,0 ; vbroadcastss 0x5a1(%rip),%ymm1 # 4268 <_sk_callback_hsw+0x477>
+ DB 196,226,125,24,13,161,5,0,0 ; vbroadcastss 0x5a1(%rip),%ymm1 # 4264 <_sk_callback_hsw+0x477>
DB 197,244,88,72,32 ; vaddps 0x20(%rax),%ymm1,%ymm1
- DB 196,98,125,24,5,151,5,0,0 ; vbroadcastss 0x597(%rip),%ymm8 # 426c <_sk_callback_hsw+0x47b>
+ DB 196,98,125,24,5,151,5,0,0 ; vbroadcastss 0x597(%rip),%ymm8 # 4268 <_sk_callback_hsw+0x47b>
DB 197,60,92,64,96 ; vsubps 0x60(%rax),%ymm8,%ymm8
DB 196,65,60,89,200 ; vmulps %ymm8,%ymm8,%ymm9
- DB 196,98,125,24,21,136,5,0,0 ; vbroadcastss 0x588(%rip),%ymm10 # 4270 <_sk_callback_hsw+0x47f>
- DB 196,98,125,24,29,131,5,0,0 ; vbroadcastss 0x583(%rip),%ymm11 # 4274 <_sk_callback_hsw+0x483>
+ DB 196,98,125,24,21,136,5,0,0 ; vbroadcastss 0x588(%rip),%ymm10 # 426c <_sk_callback_hsw+0x47f>
+ DB 196,98,125,24,29,131,5,0,0 ; vbroadcastss 0x583(%rip),%ymm11 # 4270 <_sk_callback_hsw+0x483>
DB 196,66,61,168,218 ; vfmadd213ps %ymm10,%ymm8,%ymm11
DB 196,65,36,89,193 ; vmulps %ymm9,%ymm11,%ymm8
DB 197,124,17,128,160,0,0,0 ; vmovups %ymm8,0xa0(%rax)
@@ -3748,16 +3747,16 @@ _sk_bicubic_n3y_hsw LABEL PROC
PUBLIC _sk_bicubic_n1y_hsw
_sk_bicubic_n1y_hsw LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,13,102,5,0,0 ; vbroadcastss 0x566(%rip),%ymm1 # 4278 <_sk_callback_hsw+0x487>
+ DB 196,226,125,24,13,102,5,0,0 ; vbroadcastss 0x566(%rip),%ymm1 # 4274 <_sk_callback_hsw+0x487>
DB 197,244,88,72,32 ; vaddps 0x20(%rax),%ymm1,%ymm1
- DB 196,98,125,24,5,92,5,0,0 ; vbroadcastss 0x55c(%rip),%ymm8 # 427c <_sk_callback_hsw+0x48b>
+ DB 196,98,125,24,5,92,5,0,0 ; vbroadcastss 0x55c(%rip),%ymm8 # 4278 <_sk_callback_hsw+0x48b>
DB 197,60,92,64,96 ; vsubps 0x60(%rax),%ymm8,%ymm8
- DB 196,98,125,24,13,82,5,0,0 ; vbroadcastss 0x552(%rip),%ymm9 # 4280 <_sk_callback_hsw+0x48f>
- DB 196,98,125,24,21,77,5,0,0 ; vbroadcastss 0x54d(%rip),%ymm10 # 4284 <_sk_callback_hsw+0x493>
+ DB 196,98,125,24,13,82,5,0,0 ; vbroadcastss 0x552(%rip),%ymm9 # 427c <_sk_callback_hsw+0x48f>
+ DB 196,98,125,24,21,77,5,0,0 ; vbroadcastss 0x54d(%rip),%ymm10 # 4280 <_sk_callback_hsw+0x493>
DB 196,66,61,168,209 ; vfmadd213ps %ymm9,%ymm8,%ymm10
- DB 196,98,125,24,13,67,5,0,0 ; vbroadcastss 0x543(%rip),%ymm9 # 4288 <_sk_callback_hsw+0x497>
+ DB 196,98,125,24,13,67,5,0,0 ; vbroadcastss 0x543(%rip),%ymm9 # 4284 <_sk_callback_hsw+0x497>
DB 196,66,61,184,202 ; vfmadd231ps %ymm10,%ymm8,%ymm9
- DB 196,98,125,24,21,57,5,0,0 ; vbroadcastss 0x539(%rip),%ymm10 # 428c <_sk_callback_hsw+0x49b>
+ DB 196,98,125,24,21,57,5,0,0 ; vbroadcastss 0x539(%rip),%ymm10 # 4288 <_sk_callback_hsw+0x49b>
DB 196,66,61,184,209 ; vfmadd231ps %ymm9,%ymm8,%ymm10
DB 197,124,17,144,160,0,0,0 ; vmovups %ymm10,0xa0(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
@@ -3766,14 +3765,14 @@ _sk_bicubic_n1y_hsw LABEL PROC
PUBLIC _sk_bicubic_p1y_hsw
_sk_bicubic_p1y_hsw LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,98,125,24,5,33,5,0,0 ; vbroadcastss 0x521(%rip),%ymm8 # 4290 <_sk_callback_hsw+0x49f>
+ DB 196,98,125,24,5,33,5,0,0 ; vbroadcastss 0x521(%rip),%ymm8 # 428c <_sk_callback_hsw+0x49f>
DB 197,188,88,72,32 ; vaddps 0x20(%rax),%ymm8,%ymm1
DB 197,124,16,72,96 ; vmovups 0x60(%rax),%ymm9
- DB 196,98,125,24,21,18,5,0,0 ; vbroadcastss 0x512(%rip),%ymm10 # 4294 <_sk_callback_hsw+0x4a3>
- DB 196,98,125,24,29,13,5,0,0 ; vbroadcastss 0x50d(%rip),%ymm11 # 4298 <_sk_callback_hsw+0x4a7>
+ DB 196,98,125,24,21,18,5,0,0 ; vbroadcastss 0x512(%rip),%ymm10 # 4290 <_sk_callback_hsw+0x4a3>
+ DB 196,98,125,24,29,13,5,0,0 ; vbroadcastss 0x50d(%rip),%ymm11 # 4294 <_sk_callback_hsw+0x4a7>
DB 196,66,53,168,218 ; vfmadd213ps %ymm10,%ymm9,%ymm11
DB 196,66,53,168,216 ; vfmadd213ps %ymm8,%ymm9,%ymm11
- DB 196,98,125,24,5,254,4,0,0 ; vbroadcastss 0x4fe(%rip),%ymm8 # 429c <_sk_callback_hsw+0x4ab>
+ DB 196,98,125,24,5,254,4,0,0 ; vbroadcastss 0x4fe(%rip),%ymm8 # 4298 <_sk_callback_hsw+0x4ab>
DB 196,66,53,184,195 ; vfmadd231ps %ymm11,%ymm9,%ymm8
DB 197,124,17,128,160,0,0,0 ; vmovups %ymm8,0xa0(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
@@ -3782,12 +3781,12 @@ _sk_bicubic_p1y_hsw LABEL PROC
PUBLIC _sk_bicubic_p3y_hsw
_sk_bicubic_p3y_hsw LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,13,230,4,0,0 ; vbroadcastss 0x4e6(%rip),%ymm1 # 42a0 <_sk_callback_hsw+0x4af>
+ DB 196,226,125,24,13,230,4,0,0 ; vbroadcastss 0x4e6(%rip),%ymm1 # 429c <_sk_callback_hsw+0x4af>
DB 197,244,88,72,32 ; vaddps 0x20(%rax),%ymm1,%ymm1
DB 197,124,16,64,96 ; vmovups 0x60(%rax),%ymm8
DB 196,65,60,89,200 ; vmulps %ymm8,%ymm8,%ymm9
- DB 196,98,125,24,21,210,4,0,0 ; vbroadcastss 0x4d2(%rip),%ymm10 # 42a4 <_sk_callback_hsw+0x4b3>
- DB 196,98,125,24,29,205,4,0,0 ; vbroadcastss 0x4cd(%rip),%ymm11 # 42a8 <_sk_callback_hsw+0x4b7>
+ DB 196,98,125,24,21,210,4,0,0 ; vbroadcastss 0x4d2(%rip),%ymm10 # 42a0 <_sk_callback_hsw+0x4b3>
+ DB 196,98,125,24,29,205,4,0,0 ; vbroadcastss 0x4cd(%rip),%ymm11 # 42a4 <_sk_callback_hsw+0x4b7>
DB 196,66,61,168,218 ; vfmadd213ps %ymm10,%ymm8,%ymm11
DB 196,65,52,89,195 ; vmulps %ymm11,%ymm9,%ymm8
DB 197,124,17,128,160,0,0,0 ; vmovups %ymm8,0xa0(%rax)
@@ -3870,11 +3869,10 @@ ALIGN 4
DB 0,0 ; add %al,(%rax)
DB 2,0 ; add (%rax),%al
DB 0,0 ; add %al,(%rax)
- DB 33,8 ; and %ecx,(%rax)
- DB 130 ; (bad)
- DB 60,0 ; cmp $0x0,%al
DB 0,0 ; add %al,(%rax)
- DB 191,0,0,128,63 ; mov $0x3f800000,%edi
+ DB 128,60,0,0 ; cmpb $0x0,(%rax,%rax,1)
+ DB 252 ; cld
+ DB 190,0,0,128,63 ; mov $0x3f800000,%esi
DB 0,0 ; add %al,(%rax)
DB 128,63,0 ; cmpb $0x0,(%rdi)
DB 0,128,63,0,0,128 ; add %al,-0x7fffffc1(%rax)
@@ -3946,7 +3944,7 @@ ALIGN 4
DB 190,129,128,128,59 ; mov $0x3b808081,%esi
DB 129,128,128,59,0,248,0,0,8,33 ; addl $0x21080000,-0x7ffc480(%rax)
DB 132,55 ; test %dh,(%rdi)
- DB 224,7 ; loopne 3ffd <.literal4+0xf1>
+ DB 224,7 ; loopne 3ff9 <.literal4+0xf1>
DB 0,0 ; add %al,(%rax)
DB 33,8 ; and %ecx,(%rax)
DB 2,58 ; add (%rdx),%bh
@@ -3960,10 +3958,10 @@ ALIGN 4
DB 129,128,128,59,129,128,128,59,0,0 ; addl $0x3b80,-0x7f7ec480(%rax)
DB 0,52,255 ; add %dh,(%rdi,%rdi,8)
DB 255 ; (bad)
- DB 127,0 ; jg 4028 <.literal4+0x11c>
+ DB 127,0 ; jg 4024 <.literal4+0x11c>
DB 0,0 ; add %al,(%rax)
DB 0,63 ; add %bh,(%rdi)
- DB 119,115 ; ja 40a1 <.literal4+0x195>
+ DB 119,115 ; ja 409d <.literal4+0x195>
DB 248 ; clc
DB 194,117,191 ; retq $0xbf75
DB 191,63,249,68,180 ; mov $0xb444f93f,%edi
@@ -3977,10 +3975,10 @@ ALIGN 4
DB 0,128,63,0,0,0 ; add %al,0x3f(%rax)
DB 52,255 ; xor $0xff,%al
DB 255 ; (bad)
- DB 127,0 ; jg 405c <.literal4+0x150>
+ DB 127,0 ; jg 4058 <.literal4+0x150>
DB 0,0 ; add %al,(%rax)
DB 0,63 ; add %bh,(%rdi)
- DB 119,115 ; ja 40d5 <.literal4+0x1c9>
+ DB 119,115 ; ja 40d1 <.literal4+0x1c9>
DB 248 ; clc
DB 194,117,191 ; retq $0xbf75
DB 191,63,249,68,180 ; mov $0xb444f93f,%edi
@@ -3994,10 +3992,10 @@ ALIGN 4
DB 0,128,63,0,0,0 ; add %al,0x3f(%rax)
DB 52,255 ; xor $0xff,%al
DB 255 ; (bad)
- DB 127,0 ; jg 4090 <.literal4+0x184>
+ DB 127,0 ; jg 408c <.literal4+0x184>
DB 0,0 ; add %al,(%rax)
DB 0,63 ; add %bh,(%rdi)
- DB 119,115 ; ja 4109 <.literal4+0x1fd>
+ DB 119,115 ; ja 4105 <.literal4+0x1fd>
DB 248 ; clc
DB 194,117,191 ; retq $0xbf75
DB 191,63,249,68,180 ; mov $0xb444f93f,%edi
@@ -4011,10 +4009,10 @@ ALIGN 4
DB 0,128,63,0,0,0 ; add %al,0x3f(%rax)
DB 52,255 ; xor $0xff,%al
DB 255 ; (bad)
- DB 127,0 ; jg 40c4 <.literal4+0x1b8>
+ DB 127,0 ; jg 40c0 <.literal4+0x1b8>
DB 0,0 ; add %al,(%rax)
DB 0,63 ; add %bh,(%rdi)
- DB 119,115 ; ja 413d <.literal4+0x231>
+ DB 119,115 ; ja 4139 <.literal4+0x231>
DB 248 ; clc
DB 194,117,191 ; retq $0xbf75
DB 191,63,249,68,180 ; mov $0xb444f93f,%edi
@@ -4027,7 +4025,7 @@ ALIGN 4
DB 0,75,0 ; add %cl,0x0(%rbx)
DB 0,128,63,0,0,200 ; add %al,-0x37ffffc1(%rax)
DB 66,0,0 ; rex.X add %al,(%rax)
- DB 127,67 ; jg 413b <.literal4+0x22f>
+ DB 127,67 ; jg 4137 <.literal4+0x22f>
DB 0,0 ; add %al,(%rax)
DB 0,195 ; add %al,%bl
DB 0,0 ; add %al,(%rax)
@@ -4039,10 +4037,10 @@ ALIGN 4
DB 190,80,128,3,62 ; mov $0x3e038050,%esi
DB 31 ; (bad)
DB 215 ; xlat %ds:(%rbx)
- DB 118,63 ; jbe 415b <.literal4+0x24f>
+ DB 118,63 ; jbe 4157 <.literal4+0x24f>
DB 246,64,83,63 ; testb $0x3f,0x53(%rax)
DB 129,128,128,59,129,128,128,59,0,0 ; addl $0x3b80,-0x7f7ec480(%rax)
- DB 127,67 ; jg 416f <.literal4+0x263>
+ DB 127,67 ; jg 416b <.literal4+0x263>
DB 129,128,128,59,0,0,128,63,129,128 ; addl $0x80813f80,0x3b80(%rax)
DB 128,59,0 ; cmpb $0x0,(%rbx)
DB 0,128,63,129,128,128 ; add %al,-0x7f7f7ec1(%rax)
@@ -4051,7 +4049,7 @@ ALIGN 4
DB 0,0 ; add %al,(%rax)
DB 8,33 ; or %ah,(%rcx)
DB 132,55 ; test %dh,(%rdi)
- DB 224,7 ; loopne 4151 <.literal4+0x245>
+ DB 224,7 ; loopne 414d <.literal4+0x245>
DB 0,0 ; add %al,(%rax)
DB 33,8 ; and %ecx,(%rax)
DB 2,58 ; add (%rdx),%bh
@@ -4063,7 +4061,7 @@ ALIGN 4
DB 0,0 ; add %al,(%rax)
DB 8,33 ; or %ah,(%rcx)
DB 132,55 ; test %dh,(%rdi)
- DB 224,7 ; loopne 416d <.literal4+0x261>
+ DB 224,7 ; loopne 4169 <.literal4+0x261>
DB 0,0 ; add %al,(%rax)
DB 33,8 ; and %ecx,(%rax)
DB 2,58 ; add (%rdx),%bh
@@ -4074,7 +4072,7 @@ ALIGN 4
DB 0,0 ; add %al,(%rax)
DB 248 ; clc
DB 65,0,0 ; add %al,(%r8)
- DB 124,66 ; jl 41c2 <.literal4+0x2b6>
+ DB 124,66 ; jl 41be <.literal4+0x2b6>
DB 0,240 ; add %dh,%al
DB 0,0 ; add %al,(%rax)
DB 137,136,136,55,0,15 ; mov %ecx,0xf003788(%rax)
@@ -4092,9 +4090,9 @@ ALIGN 4
DB 137,136,136,59,15,0 ; mov %ecx,0xf3b88(%rax)
DB 0,0 ; add %al,(%rax)
DB 137,136,136,61,0,0 ; mov %ecx,0x3d88(%rax)
- DB 112,65 ; jo 4205 <.literal4+0x2f9>
+ DB 112,65 ; jo 4201 <.literal4+0x2f9>
DB 129,128,128,59,129,128,128,59,0,0 ; addl $0x3b80,-0x7f7ec480(%rax)
- DB 127,67 ; jg 4213 <.literal4+0x307>
+ DB 127,67 ; jg 420f <.literal4+0x307>
DB 128,0,128 ; addb $0x80,(%rax)
DB 55 ; (bad)
DB 128,0,128 ; addb $0x80,(%rax)
@@ -4102,7 +4100,7 @@ ALIGN 4
DB 0,0 ; add %al,(%rax)
DB 128,63,0 ; cmpb $0x0,(%rdi)
DB 255 ; (bad)
- DB 127,71 ; jg 4227 <.literal4+0x31b>
+ DB 127,71 ; jg 4223 <.literal4+0x31b>
DB 208 ; (bad)
DB 179,89 ; mov $0x59,%bl
DB 62,89 ; ds pop %rcx
@@ -4199,16 +4197,16 @@ ALIGN 32
DB 0,0 ; add %al,(%rax)
DB 1,255 ; add %edi,%edi
DB 255 ; (bad)
- DB 255,5,255,255,255,9 ; incl 0x9ffffff(%rip) # a0042e8 <_sk_callback_hsw+0xa0004f7>
+ DB 255,5,255,255,255,9 ; incl 0x9ffffff(%rip) # a0042e8 <_sk_callback_hsw+0xa0004fb>
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,13,255,255,255,17 ; decl 0x11ffffff(%rip) # 120042f0 <_sk_callback_hsw+0x120004ff>
+ DB 255,13,255,255,255,17 ; decl 0x11ffffff(%rip) # 120042f0 <_sk_callback_hsw+0x12000503>
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,21,255,255,255,25 ; callq *0x19ffffff(%rip) # 1a0042f8 <_sk_callback_hsw+0x1a000507>
+ DB 255,21,255,255,255,25 ; callq *0x19ffffff(%rip) # 1a0042f8 <_sk_callback_hsw+0x1a00050b>
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,29,255,255,255,2 ; lcall *0x2ffffff(%rip) # 3004300 <_sk_callback_hsw+0x300050f>
+ DB 255,29,255,255,255,2 ; lcall *0x2ffffff(%rip) # 3004300 <_sk_callback_hsw+0x3000513>
DB 255 ; (bad)
DB 255 ; (bad)
DB 255,6 ; incl (%rsi)
@@ -4251,16 +4249,16 @@ ALIGN 32
DB 0,0 ; add %al,(%rax)
DB 1,255 ; add %edi,%edi
DB 255 ; (bad)
- DB 255,5,255,255,255,9 ; incl 0x9ffffff(%rip) # a004348 <_sk_callback_hsw+0xa000557>
+ DB 255,5,255,255,255,9 ; incl 0x9ffffff(%rip) # a004348 <_sk_callback_hsw+0xa00055b>
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,13,255,255,255,17 ; decl 0x11ffffff(%rip) # 12004350 <_sk_callback_hsw+0x1200055f>
+ DB 255,13,255,255,255,17 ; decl 0x11ffffff(%rip) # 12004350 <_sk_callback_hsw+0x12000563>
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,21,255,255,255,25 ; callq *0x19ffffff(%rip) # 1a004358 <_sk_callback_hsw+0x1a000567>
+ DB 255,21,255,255,255,25 ; callq *0x19ffffff(%rip) # 1a004358 <_sk_callback_hsw+0x1a00056b>
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,29,255,255,255,2 ; lcall *0x2ffffff(%rip) # 3004360 <_sk_callback_hsw+0x300056f>
+ DB 255,29,255,255,255,2 ; lcall *0x2ffffff(%rip) # 3004360 <_sk_callback_hsw+0x3000573>
DB 255 ; (bad)
DB 255 ; (bad)
DB 255,6 ; incl (%rsi)
@@ -4303,16 +4301,16 @@ ALIGN 32
DB 0,0 ; add %al,(%rax)
DB 1,255 ; add %edi,%edi
DB 255 ; (bad)
- DB 255,5,255,255,255,9 ; incl 0x9ffffff(%rip) # a0043a8 <_sk_callback_hsw+0xa0005b7>
+ DB 255,5,255,255,255,9 ; incl 0x9ffffff(%rip) # a0043a8 <_sk_callback_hsw+0xa0005bb>
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,13,255,255,255,17 ; decl 0x11ffffff(%rip) # 120043b0 <_sk_callback_hsw+0x120005bf>
+ DB 255,13,255,255,255,17 ; decl 0x11ffffff(%rip) # 120043b0 <_sk_callback_hsw+0x120005c3>
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,21,255,255,255,25 ; callq *0x19ffffff(%rip) # 1a0043b8 <_sk_callback_hsw+0x1a0005c7>
+ DB 255,21,255,255,255,25 ; callq *0x19ffffff(%rip) # 1a0043b8 <_sk_callback_hsw+0x1a0005cb>
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,29,255,255,255,2 ; lcall *0x2ffffff(%rip) # 30043c0 <_sk_callback_hsw+0x30005cf>
+ DB 255,29,255,255,255,2 ; lcall *0x2ffffff(%rip) # 30043c0 <_sk_callback_hsw+0x30005d3>
DB 255 ; (bad)
DB 255 ; (bad)
DB 255,6 ; incl (%rsi)
@@ -4355,16 +4353,16 @@ ALIGN 32
DB 0,0 ; add %al,(%rax)
DB 1,255 ; add %edi,%edi
DB 255 ; (bad)
- DB 255,5,255,255,255,9 ; incl 0x9ffffff(%rip) # a004408 <_sk_callback_hsw+0xa000617>
+ DB 255,5,255,255,255,9 ; incl 0x9ffffff(%rip) # a004408 <_sk_callback_hsw+0xa00061b>
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,13,255,255,255,17 ; decl 0x11ffffff(%rip) # 12004410 <_sk_callback_hsw+0x1200061f>
+ DB 255,13,255,255,255,17 ; decl 0x11ffffff(%rip) # 12004410 <_sk_callback_hsw+0x12000623>
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,21,255,255,255,25 ; callq *0x19ffffff(%rip) # 1a004418 <_sk_callback_hsw+0x1a000627>
+ DB 255,21,255,255,255,25 ; callq *0x19ffffff(%rip) # 1a004418 <_sk_callback_hsw+0x1a00062b>
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,29,255,255,255,2 ; lcall *0x2ffffff(%rip) # 3004420 <_sk_callback_hsw+0x300062f>
+ DB 255,29,255,255,255,2 ; lcall *0x2ffffff(%rip) # 3004420 <_sk_callback_hsw+0x3000633>
DB 255 ; (bad)
DB 255 ; (bad)
DB 255,6 ; incl (%rsi)
@@ -4506,14 +4504,14 @@ _sk_seed_shader_avx LABEL PROC
DB 197,249,112,192,0 ; vpshufd $0x0,%xmm0,%xmm0
DB 196,227,125,24,192,1 ; vinsertf128 $0x1,%xmm0,%ymm0,%ymm0
DB 197,252,91,192 ; vcvtdq2ps %ymm0,%ymm0
- DB 196,226,125,24,13,244,84,0,0 ; vbroadcastss 0x54f4(%rip),%ymm1 # 5654 <_sk_callback_avx+0x119>
+ DB 196,226,125,24,13,240,84,0,0 ; vbroadcastss 0x54f0(%rip),%ymm1 # 5650 <_sk_callback_avx+0x119>
DB 197,252,88,193 ; vaddps %ymm1,%ymm0,%ymm0
DB 197,252,88,2 ; vaddps (%rdx),%ymm0,%ymm0
DB 196,226,125,24,16 ; vbroadcastss (%rax),%ymm2
DB 197,252,91,210 ; vcvtdq2ps %ymm2,%ymm2
DB 197,236,88,201 ; vaddps %ymm1,%ymm2,%ymm1
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,21,216,84,0,0 ; vbroadcastss 0x54d8(%rip),%ymm2 # 5658 <_sk_callback_avx+0x11d>
+ DB 196,226,125,24,21,212,84,0,0 ; vbroadcastss 0x54d4(%rip),%ymm2 # 5654 <_sk_callback_avx+0x11d>
DB 197,228,87,219 ; vxorps %ymm3,%ymm3,%ymm3
DB 197,220,87,228 ; vxorps %ymm4,%ymm4,%ymm4
DB 197,212,87,237 ; vxorps %ymm5,%ymm5,%ymm5
@@ -4533,7 +4531,7 @@ _sk_dither_avx LABEL PROC
DB 76,139,0 ; mov (%rax),%r8
DB 196,66,125,24,8 ; vbroadcastss (%r8),%ymm9
DB 196,65,60,87,209 ; vxorps %ymm9,%ymm8,%ymm10
- DB 196,98,125,24,29,144,84,0,0 ; vbroadcastss 0x5490(%rip),%ymm11 # 565c <_sk_callback_avx+0x121>
+ DB 196,98,125,24,29,140,84,0,0 ; vbroadcastss 0x548c(%rip),%ymm11 # 5658 <_sk_callback_avx+0x121>
DB 196,65,44,84,203 ; vandps %ymm11,%ymm10,%ymm9
DB 196,193,25,114,241,5 ; vpslld $0x5,%xmm9,%xmm12
DB 196,67,125,25,201,1 ; vextractf128 $0x1,%ymm9,%xmm9
@@ -4544,8 +4542,8 @@ _sk_dither_avx LABEL PROC
DB 196,67,125,25,219,1 ; vextractf128 $0x1,%ymm11,%xmm11
DB 196,193,33,114,243,4 ; vpslld $0x4,%xmm11,%xmm11
DB 196,67,29,24,219,1 ; vinsertf128 $0x1,%xmm11,%ymm12,%ymm11
- DB 196,98,125,24,37,81,84,0,0 ; vbroadcastss 0x5451(%rip),%ymm12 # 5660 <_sk_callback_avx+0x125>
- DB 196,98,125,24,45,76,84,0,0 ; vbroadcastss 0x544c(%rip),%ymm13 # 5664 <_sk_callback_avx+0x129>
+ DB 196,98,125,24,37,77,84,0,0 ; vbroadcastss 0x544d(%rip),%ymm12 # 565c <_sk_callback_avx+0x125>
+ DB 196,98,125,24,45,72,84,0,0 ; vbroadcastss 0x5448(%rip),%ymm13 # 5660 <_sk_callback_avx+0x129>
DB 196,65,44,84,245 ; vandps %ymm13,%ymm10,%ymm14
DB 196,193,1,114,246,2 ; vpslld $0x2,%xmm14,%xmm15
DB 196,67,125,25,246,1 ; vextractf128 $0x1,%ymm14,%xmm14
@@ -4572,13 +4570,12 @@ _sk_dither_avx LABEL PROC
DB 196,65,60,86,193 ; vorps %ymm9,%ymm8,%ymm8
DB 196,65,60,86,194 ; vorps %ymm10,%ymm8,%ymm8
DB 196,65,124,91,192 ; vcvtdq2ps %ymm8,%ymm8
- DB 196,98,125,24,13,183,83,0,0 ; vbroadcastss 0x53b7(%rip),%ymm9 # 5668 <_sk_callback_avx+0x12d>
+ DB 196,98,125,24,13,179,83,0,0 ; vbroadcastss 0x53b3(%rip),%ymm9 # 5664 <_sk_callback_avx+0x12d>
DB 196,65,60,89,193 ; vmulps %ymm9,%ymm8,%ymm8
- DB 196,98,125,24,13,173,83,0,0 ; vbroadcastss 0x53ad(%rip),%ymm9 # 566c <_sk_callback_avx+0x131>
+ DB 196,98,125,24,13,169,83,0,0 ; vbroadcastss 0x53a9(%rip),%ymm9 # 5668 <_sk_callback_avx+0x131>
DB 196,65,60,88,193 ; vaddps %ymm9,%ymm8,%ymm8
DB 196,98,125,24,72,8 ; vbroadcastss 0x8(%rax),%ymm9
DB 196,65,52,89,192 ; vmulps %ymm8,%ymm9,%ymm8
- DB 197,60,89,195 ; vmulps %ymm3,%ymm8,%ymm8
DB 197,188,88,192 ; vaddps %ymm0,%ymm8,%ymm0
DB 197,188,88,201 ; vaddps %ymm1,%ymm8,%ymm1
DB 197,188,88,210 ; vaddps %ymm2,%ymm8,%ymm2
@@ -4607,7 +4604,7 @@ _sk_clear_avx LABEL PROC
PUBLIC _sk_srcatop_avx
_sk_srcatop_avx LABEL PROC
DB 197,252,89,199 ; vmulps %ymm7,%ymm0,%ymm0
- DB 196,98,125,24,5,79,83,0,0 ; vbroadcastss 0x534f(%rip),%ymm8 # 5670 <_sk_callback_avx+0x135>
+ DB 196,98,125,24,5,79,83,0,0 ; vbroadcastss 0x534f(%rip),%ymm8 # 566c <_sk_callback_avx+0x135>
DB 197,60,92,195 ; vsubps %ymm3,%ymm8,%ymm8
DB 197,60,89,204 ; vmulps %ymm4,%ymm8,%ymm9
DB 197,180,88,192 ; vaddps %ymm0,%ymm9,%ymm0
@@ -4626,7 +4623,7 @@ _sk_srcatop_avx LABEL PROC
PUBLIC _sk_dstatop_avx
_sk_dstatop_avx LABEL PROC
DB 197,100,89,196 ; vmulps %ymm4,%ymm3,%ymm8
- DB 196,98,125,24,13,17,83,0,0 ; vbroadcastss 0x5311(%rip),%ymm9 # 5674 <_sk_callback_avx+0x139>
+ DB 196,98,125,24,13,17,83,0,0 ; vbroadcastss 0x5311(%rip),%ymm9 # 5670 <_sk_callback_avx+0x139>
DB 197,52,92,207 ; vsubps %ymm7,%ymm9,%ymm9
DB 197,180,89,192 ; vmulps %ymm0,%ymm9,%ymm0
DB 197,188,88,192 ; vaddps %ymm0,%ymm8,%ymm0
@@ -4662,7 +4659,7 @@ _sk_dstin_avx LABEL PROC
PUBLIC _sk_srcout_avx
_sk_srcout_avx LABEL PROC
- DB 196,98,125,24,5,176,82,0,0 ; vbroadcastss 0x52b0(%rip),%ymm8 # 5678 <_sk_callback_avx+0x13d>
+ DB 196,98,125,24,5,176,82,0,0 ; vbroadcastss 0x52b0(%rip),%ymm8 # 5674 <_sk_callback_avx+0x13d>
DB 197,60,92,199 ; vsubps %ymm7,%ymm8,%ymm8
DB 197,188,89,192 ; vmulps %ymm0,%ymm8,%ymm0
DB 197,188,89,201 ; vmulps %ymm1,%ymm8,%ymm1
@@ -4673,7 +4670,7 @@ _sk_srcout_avx LABEL PROC
PUBLIC _sk_dstout_avx
_sk_dstout_avx LABEL PROC
- DB 196,226,125,24,5,147,82,0,0 ; vbroadcastss 0x5293(%rip),%ymm0 # 567c <_sk_callback_avx+0x141>
+ DB 196,226,125,24,5,147,82,0,0 ; vbroadcastss 0x5293(%rip),%ymm0 # 5678 <_sk_callback_avx+0x141>
DB 197,252,92,219 ; vsubps %ymm3,%ymm0,%ymm3
DB 197,228,89,196 ; vmulps %ymm4,%ymm3,%ymm0
DB 197,228,89,205 ; vmulps %ymm5,%ymm3,%ymm1
@@ -4684,7 +4681,7 @@ _sk_dstout_avx LABEL PROC
PUBLIC _sk_srcover_avx
_sk_srcover_avx LABEL PROC
- DB 196,98,125,24,5,118,82,0,0 ; vbroadcastss 0x5276(%rip),%ymm8 # 5680 <_sk_callback_avx+0x145>
+ DB 196,98,125,24,5,118,82,0,0 ; vbroadcastss 0x5276(%rip),%ymm8 # 567c <_sk_callback_avx+0x145>
DB 197,60,92,195 ; vsubps %ymm3,%ymm8,%ymm8
DB 197,60,89,204 ; vmulps %ymm4,%ymm8,%ymm9
DB 197,180,88,192 ; vaddps %ymm0,%ymm9,%ymm0
@@ -4699,7 +4696,7 @@ _sk_srcover_avx LABEL PROC
PUBLIC _sk_dstover_avx
_sk_dstover_avx LABEL PROC
- DB 196,98,125,24,5,73,82,0,0 ; vbroadcastss 0x5249(%rip),%ymm8 # 5684 <_sk_callback_avx+0x149>
+ DB 196,98,125,24,5,73,82,0,0 ; vbroadcastss 0x5249(%rip),%ymm8 # 5680 <_sk_callback_avx+0x149>
DB 197,60,92,199 ; vsubps %ymm7,%ymm8,%ymm8
DB 197,188,89,192 ; vmulps %ymm0,%ymm8,%ymm0
DB 197,252,88,196 ; vaddps %ymm4,%ymm0,%ymm0
@@ -4723,7 +4720,7 @@ _sk_modulate_avx LABEL PROC
PUBLIC _sk_multiply_avx
_sk_multiply_avx LABEL PROC
- DB 196,98,125,24,5,8,82,0,0 ; vbroadcastss 0x5208(%rip),%ymm8 # 5688 <_sk_callback_avx+0x14d>
+ DB 196,98,125,24,5,8,82,0,0 ; vbroadcastss 0x5208(%rip),%ymm8 # 5684 <_sk_callback_avx+0x14d>
DB 197,60,92,207 ; vsubps %ymm7,%ymm8,%ymm9
DB 197,52,89,208 ; vmulps %ymm0,%ymm9,%ymm10
DB 197,60,92,195 ; vsubps %ymm3,%ymm8,%ymm8
@@ -4777,7 +4774,7 @@ _sk_screen_avx LABEL PROC
PUBLIC _sk_xor__avx
_sk_xor__avx LABEL PROC
- DB 196,98,125,24,5,87,81,0,0 ; vbroadcastss 0x5157(%rip),%ymm8 # 568c <_sk_callback_avx+0x151>
+ DB 196,98,125,24,5,87,81,0,0 ; vbroadcastss 0x5157(%rip),%ymm8 # 5688 <_sk_callback_avx+0x151>
DB 197,60,92,207 ; vsubps %ymm7,%ymm8,%ymm9
DB 197,180,89,192 ; vmulps %ymm0,%ymm9,%ymm0
DB 197,60,92,195 ; vsubps %ymm3,%ymm8,%ymm8
@@ -4812,7 +4809,7 @@ _sk_darken_avx LABEL PROC
DB 197,100,89,206 ; vmulps %ymm6,%ymm3,%ymm9
DB 196,193,108,95,209 ; vmaxps %ymm9,%ymm2,%ymm2
DB 197,188,92,210 ; vsubps %ymm2,%ymm8,%ymm2
- DB 196,98,125,24,5,215,80,0,0 ; vbroadcastss 0x50d7(%rip),%ymm8 # 5690 <_sk_callback_avx+0x155>
+ DB 196,98,125,24,5,215,80,0,0 ; vbroadcastss 0x50d7(%rip),%ymm8 # 568c <_sk_callback_avx+0x155>
DB 197,60,92,195 ; vsubps %ymm3,%ymm8,%ymm8
DB 197,60,89,199 ; vmulps %ymm7,%ymm8,%ymm8
DB 197,188,88,219 ; vaddps %ymm3,%ymm8,%ymm3
@@ -4836,7 +4833,7 @@ _sk_lighten_avx LABEL PROC
DB 197,100,89,206 ; vmulps %ymm6,%ymm3,%ymm9
DB 196,193,108,93,209 ; vminps %ymm9,%ymm2,%ymm2
DB 197,188,92,210 ; vsubps %ymm2,%ymm8,%ymm2
- DB 196,98,125,24,5,131,80,0,0 ; vbroadcastss 0x5083(%rip),%ymm8 # 5694 <_sk_callback_avx+0x159>
+ DB 196,98,125,24,5,131,80,0,0 ; vbroadcastss 0x5083(%rip),%ymm8 # 5690 <_sk_callback_avx+0x159>
DB 197,60,92,195 ; vsubps %ymm3,%ymm8,%ymm8
DB 197,60,89,199 ; vmulps %ymm7,%ymm8,%ymm8
DB 197,188,88,219 ; vaddps %ymm3,%ymm8,%ymm3
@@ -4863,7 +4860,7 @@ _sk_difference_avx LABEL PROC
DB 196,193,108,93,209 ; vminps %ymm9,%ymm2,%ymm2
DB 197,236,88,210 ; vaddps %ymm2,%ymm2,%ymm2
DB 197,188,92,210 ; vsubps %ymm2,%ymm8,%ymm2
- DB 196,98,125,24,5,35,80,0,0 ; vbroadcastss 0x5023(%rip),%ymm8 # 5698 <_sk_callback_avx+0x15d>
+ DB 196,98,125,24,5,35,80,0,0 ; vbroadcastss 0x5023(%rip),%ymm8 # 5694 <_sk_callback_avx+0x15d>
DB 197,60,92,195 ; vsubps %ymm3,%ymm8,%ymm8
DB 197,60,89,199 ; vmulps %ymm7,%ymm8,%ymm8
DB 197,188,88,219 ; vaddps %ymm3,%ymm8,%ymm3
@@ -4884,7 +4881,7 @@ _sk_exclusion_avx LABEL PROC
DB 197,236,89,214 ; vmulps %ymm6,%ymm2,%ymm2
DB 197,236,88,210 ; vaddps %ymm2,%ymm2,%ymm2
DB 197,188,92,210 ; vsubps %ymm2,%ymm8,%ymm2
- DB 196,98,125,24,5,222,79,0,0 ; vbroadcastss 0x4fde(%rip),%ymm8 # 569c <_sk_callback_avx+0x161>
+ DB 196,98,125,24,5,222,79,0,0 ; vbroadcastss 0x4fde(%rip),%ymm8 # 5698 <_sk_callback_avx+0x161>
DB 197,60,92,195 ; vsubps %ymm3,%ymm8,%ymm8
DB 197,60,89,199 ; vmulps %ymm7,%ymm8,%ymm8
DB 197,188,88,219 ; vaddps %ymm3,%ymm8,%ymm3
@@ -4893,7 +4890,7 @@ _sk_exclusion_avx LABEL PROC
PUBLIC _sk_colorburn_avx
_sk_colorburn_avx LABEL PROC
- DB 196,98,125,24,5,201,79,0,0 ; vbroadcastss 0x4fc9(%rip),%ymm8 # 56a0 <_sk_callback_avx+0x165>
+ DB 196,98,125,24,5,201,79,0,0 ; vbroadcastss 0x4fc9(%rip),%ymm8 # 569c <_sk_callback_avx+0x165>
DB 197,60,92,207 ; vsubps %ymm7,%ymm8,%ymm9
DB 197,52,89,216 ; vmulps %ymm0,%ymm9,%ymm11
DB 196,65,44,87,210 ; vxorps %ymm10,%ymm10,%ymm10
@@ -4953,7 +4950,7 @@ _sk_colorburn_avx LABEL PROC
PUBLIC _sk_colordodge_avx
_sk_colordodge_avx LABEL PROC
DB 196,65,60,87,192 ; vxorps %ymm8,%ymm8,%ymm8
- DB 196,98,125,24,13,197,78,0,0 ; vbroadcastss 0x4ec5(%rip),%ymm9 # 56a4 <_sk_callback_avx+0x169>
+ DB 196,98,125,24,13,197,78,0,0 ; vbroadcastss 0x4ec5(%rip),%ymm9 # 56a0 <_sk_callback_avx+0x169>
DB 197,52,92,215 ; vsubps %ymm7,%ymm9,%ymm10
DB 197,44,89,216 ; vmulps %ymm0,%ymm10,%ymm11
DB 197,52,92,203 ; vsubps %ymm3,%ymm9,%ymm9
@@ -5008,7 +5005,7 @@ _sk_colordodge_avx LABEL PROC
PUBLIC _sk_hardlight_avx
_sk_hardlight_avx LABEL PROC
- DB 196,98,125,24,5,215,77,0,0 ; vbroadcastss 0x4dd7(%rip),%ymm8 # 56a8 <_sk_callback_avx+0x16d>
+ DB 196,98,125,24,5,215,77,0,0 ; vbroadcastss 0x4dd7(%rip),%ymm8 # 56a4 <_sk_callback_avx+0x16d>
DB 197,60,92,215 ; vsubps %ymm7,%ymm8,%ymm10
DB 197,44,89,200 ; vmulps %ymm0,%ymm10,%ymm9
DB 197,60,92,195 ; vsubps %ymm3,%ymm8,%ymm8
@@ -5061,7 +5058,7 @@ _sk_hardlight_avx LABEL PROC
PUBLIC _sk_overlay_avx
_sk_overlay_avx LABEL PROC
- DB 196,98,125,24,5,0,77,0,0 ; vbroadcastss 0x4d00(%rip),%ymm8 # 56ac <_sk_callback_avx+0x171>
+ DB 196,98,125,24,5,0,77,0,0 ; vbroadcastss 0x4d00(%rip),%ymm8 # 56a8 <_sk_callback_avx+0x171>
DB 197,60,92,215 ; vsubps %ymm7,%ymm8,%ymm10
DB 197,44,89,200 ; vmulps %ymm0,%ymm10,%ymm9
DB 197,60,92,195 ; vsubps %ymm3,%ymm8,%ymm8
@@ -5126,10 +5123,10 @@ _sk_softlight_avx LABEL PROC
DB 196,65,60,88,192 ; vaddps %ymm8,%ymm8,%ymm8
DB 196,65,60,89,216 ; vmulps %ymm8,%ymm8,%ymm11
DB 196,65,60,88,195 ; vaddps %ymm11,%ymm8,%ymm8
- DB 196,98,125,24,29,243,75,0,0 ; vbroadcastss 0x4bf3(%rip),%ymm11 # 56b4 <_sk_callback_avx+0x179>
+ DB 196,98,125,24,29,243,75,0,0 ; vbroadcastss 0x4bf3(%rip),%ymm11 # 56b0 <_sk_callback_avx+0x179>
DB 196,65,28,88,235 ; vaddps %ymm11,%ymm12,%ymm13
DB 196,65,20,89,192 ; vmulps %ymm8,%ymm13,%ymm8
- DB 196,98,125,24,45,228,75,0,0 ; vbroadcastss 0x4be4(%rip),%ymm13 # 56b8 <_sk_callback_avx+0x17d>
+ DB 196,98,125,24,45,228,75,0,0 ; vbroadcastss 0x4be4(%rip),%ymm13 # 56b4 <_sk_callback_avx+0x17d>
DB 196,65,28,89,245 ; vmulps %ymm13,%ymm12,%ymm14
DB 196,65,12,88,192 ; vaddps %ymm8,%ymm14,%ymm8
DB 196,65,124,82,244 ; vrsqrtps %ymm12,%ymm14
@@ -5140,7 +5137,7 @@ _sk_softlight_avx LABEL PROC
DB 197,4,194,255,2 ; vcmpleps %ymm7,%ymm15,%ymm15
DB 196,67,13,74,240,240 ; vblendvps %ymm15,%ymm8,%ymm14,%ymm14
DB 197,116,88,249 ; vaddps %ymm1,%ymm1,%ymm15
- DB 196,98,125,24,5,162,75,0,0 ; vbroadcastss 0x4ba2(%rip),%ymm8 # 56b0 <_sk_callback_avx+0x175>
+ DB 196,98,125,24,5,162,75,0,0 ; vbroadcastss 0x4ba2(%rip),%ymm8 # 56ac <_sk_callback_avx+0x175>
DB 196,65,60,92,228 ; vsubps %ymm12,%ymm8,%ymm12
DB 197,132,92,195 ; vsubps %ymm3,%ymm15,%ymm0
DB 196,65,124,89,228 ; vmulps %ymm12,%ymm0,%ymm12
@@ -5244,7 +5241,7 @@ _sk_clamp_0_avx LABEL PROC
PUBLIC _sk_clamp_1_avx
_sk_clamp_1_avx LABEL PROC
- DB 196,98,125,24,5,240,73,0,0 ; vbroadcastss 0x49f0(%rip),%ymm8 # 56bc <_sk_callback_avx+0x181>
+ DB 196,98,125,24,5,240,73,0,0 ; vbroadcastss 0x49f0(%rip),%ymm8 # 56b8 <_sk_callback_avx+0x181>
DB 196,193,124,93,192 ; vminps %ymm8,%ymm0,%ymm0
DB 196,193,116,93,200 ; vminps %ymm8,%ymm1,%ymm1
DB 196,193,108,93,208 ; vminps %ymm8,%ymm2,%ymm2
@@ -5254,7 +5251,7 @@ _sk_clamp_1_avx LABEL PROC
PUBLIC _sk_clamp_a_avx
_sk_clamp_a_avx LABEL PROC
- DB 196,98,125,24,5,211,73,0,0 ; vbroadcastss 0x49d3(%rip),%ymm8 # 56c0 <_sk_callback_avx+0x185>
+ DB 196,98,125,24,5,211,73,0,0 ; vbroadcastss 0x49d3(%rip),%ymm8 # 56bc <_sk_callback_avx+0x185>
DB 196,193,100,93,216 ; vminps %ymm8,%ymm3,%ymm3
DB 197,252,93,195 ; vminps %ymm3,%ymm0,%ymm0
DB 197,244,93,203 ; vminps %ymm3,%ymm1,%ymm1
@@ -5326,7 +5323,7 @@ PUBLIC _sk_unpremul_avx
_sk_unpremul_avx LABEL PROC
DB 196,65,60,87,192 ; vxorps %ymm8,%ymm8,%ymm8
DB 196,65,100,194,200,0 ; vcmpeqps %ymm8,%ymm3,%ymm9
- DB 196,98,125,24,21,27,73,0,0 ; vbroadcastss 0x491b(%rip),%ymm10 # 56c4 <_sk_callback_avx+0x189>
+ DB 196,98,125,24,21,27,73,0,0 ; vbroadcastss 0x491b(%rip),%ymm10 # 56c0 <_sk_callback_avx+0x189>
DB 197,44,94,211 ; vdivps %ymm3,%ymm10,%ymm10
DB 196,67,45,74,192,144 ; vblendvps %ymm9,%ymm8,%ymm10,%ymm8
DB 197,188,89,192 ; vmulps %ymm0,%ymm8,%ymm0
@@ -5337,17 +5334,17 @@ _sk_unpremul_avx LABEL PROC
PUBLIC _sk_from_srgb_avx
_sk_from_srgb_avx LABEL PROC
- DB 196,98,125,24,5,252,72,0,0 ; vbroadcastss 0x48fc(%rip),%ymm8 # 56c8 <_sk_callback_avx+0x18d>
+ DB 196,98,125,24,5,252,72,0,0 ; vbroadcastss 0x48fc(%rip),%ymm8 # 56c4 <_sk_callback_avx+0x18d>
DB 196,65,124,89,200 ; vmulps %ymm8,%ymm0,%ymm9
DB 197,124,89,208 ; vmulps %ymm0,%ymm0,%ymm10
- DB 196,98,125,24,29,238,72,0,0 ; vbroadcastss 0x48ee(%rip),%ymm11 # 56cc <_sk_callback_avx+0x191>
+ DB 196,98,125,24,29,238,72,0,0 ; vbroadcastss 0x48ee(%rip),%ymm11 # 56c8 <_sk_callback_avx+0x191>
DB 196,65,124,89,227 ; vmulps %ymm11,%ymm0,%ymm12
- DB 196,98,125,24,45,228,72,0,0 ; vbroadcastss 0x48e4(%rip),%ymm13 # 56d0 <_sk_callback_avx+0x195>
+ DB 196,98,125,24,45,228,72,0,0 ; vbroadcastss 0x48e4(%rip),%ymm13 # 56cc <_sk_callback_avx+0x195>
DB 196,65,28,88,229 ; vaddps %ymm13,%ymm12,%ymm12
DB 196,65,44,89,212 ; vmulps %ymm12,%ymm10,%ymm10
- DB 196,98,125,24,37,213,72,0,0 ; vbroadcastss 0x48d5(%rip),%ymm12 # 56d4 <_sk_callback_avx+0x199>
+ DB 196,98,125,24,37,213,72,0,0 ; vbroadcastss 0x48d5(%rip),%ymm12 # 56d0 <_sk_callback_avx+0x199>
DB 196,65,44,88,212 ; vaddps %ymm12,%ymm10,%ymm10
- DB 196,98,125,24,53,203,72,0,0 ; vbroadcastss 0x48cb(%rip),%ymm14 # 56d8 <_sk_callback_avx+0x19d>
+ DB 196,98,125,24,53,203,72,0,0 ; vbroadcastss 0x48cb(%rip),%ymm14 # 56d4 <_sk_callback_avx+0x19d>
DB 196,193,124,194,198,1 ; vcmpltps %ymm14,%ymm0,%ymm0
DB 196,195,45,74,193,0 ; vblendvps %ymm0,%ymm9,%ymm10,%ymm0
DB 196,65,116,89,200 ; vmulps %ymm8,%ymm1,%ymm9
@@ -5374,18 +5371,18 @@ _sk_to_srgb_avx LABEL PROC
DB 197,124,82,192 ; vrsqrtps %ymm0,%ymm8
DB 196,65,124,83,200 ; vrcpps %ymm8,%ymm9
DB 196,65,124,82,208 ; vrsqrtps %ymm8,%ymm10
- DB 196,98,125,24,5,86,72,0,0 ; vbroadcastss 0x4856(%rip),%ymm8 # 56dc <_sk_callback_avx+0x1a1>
+ DB 196,98,125,24,5,86,72,0,0 ; vbroadcastss 0x4856(%rip),%ymm8 # 56d8 <_sk_callback_avx+0x1a1>
DB 196,65,124,89,216 ; vmulps %ymm8,%ymm0,%ymm11
- DB 196,98,125,24,37,76,72,0,0 ; vbroadcastss 0x484c(%rip),%ymm12 # 56e0 <_sk_callback_avx+0x1a5>
+ DB 196,98,125,24,37,76,72,0,0 ; vbroadcastss 0x484c(%rip),%ymm12 # 56dc <_sk_callback_avx+0x1a5>
DB 196,65,52,89,204 ; vmulps %ymm12,%ymm9,%ymm9
- DB 196,98,125,24,45,66,72,0,0 ; vbroadcastss 0x4842(%rip),%ymm13 # 56e4 <_sk_callback_avx+0x1a9>
+ DB 196,98,125,24,45,66,72,0,0 ; vbroadcastss 0x4842(%rip),%ymm13 # 56e0 <_sk_callback_avx+0x1a9>
DB 196,65,52,88,205 ; vaddps %ymm13,%ymm9,%ymm9
- DB 196,98,125,24,53,56,72,0,0 ; vbroadcastss 0x4838(%rip),%ymm14 # 56e8 <_sk_callback_avx+0x1ad>
+ DB 196,98,125,24,53,56,72,0,0 ; vbroadcastss 0x4838(%rip),%ymm14 # 56e4 <_sk_callback_avx+0x1ad>
DB 196,65,44,89,214 ; vmulps %ymm14,%ymm10,%ymm10
DB 196,65,44,88,201 ; vaddps %ymm9,%ymm10,%ymm9
- DB 196,98,125,24,21,41,72,0,0 ; vbroadcastss 0x4829(%rip),%ymm10 # 56ec <_sk_callback_avx+0x1b1>
+ DB 196,98,125,24,21,41,72,0,0 ; vbroadcastss 0x4829(%rip),%ymm10 # 56e8 <_sk_callback_avx+0x1b1>
DB 196,65,44,93,201 ; vminps %ymm9,%ymm10,%ymm9
- DB 196,98,125,24,61,31,72,0,0 ; vbroadcastss 0x481f(%rip),%ymm15 # 56f0 <_sk_callback_avx+0x1b5>
+ DB 196,98,125,24,61,31,72,0,0 ; vbroadcastss 0x481f(%rip),%ymm15 # 56ec <_sk_callback_avx+0x1b5>
DB 196,193,124,194,199,1 ; vcmpltps %ymm15,%ymm0,%ymm0
DB 196,195,53,74,195,0 ; vblendvps %ymm0,%ymm11,%ymm9,%ymm0
DB 197,124,82,201 ; vrsqrtps %ymm1,%ymm9
@@ -5420,7 +5417,7 @@ _sk_rgb_to_hsl_avx LABEL PROC
DB 197,124,93,201 ; vminps %ymm1,%ymm0,%ymm9
DB 197,52,93,202 ; vminps %ymm2,%ymm9,%ymm9
DB 196,65,60,92,209 ; vsubps %ymm9,%ymm8,%ymm10
- DB 196,98,125,24,29,133,71,0,0 ; vbroadcastss 0x4785(%rip),%ymm11 # 56f4 <_sk_callback_avx+0x1b9>
+ DB 196,98,125,24,29,133,71,0,0 ; vbroadcastss 0x4785(%rip),%ymm11 # 56f0 <_sk_callback_avx+0x1b9>
DB 196,65,36,94,218 ; vdivps %ymm10,%ymm11,%ymm11
DB 197,116,92,226 ; vsubps %ymm2,%ymm1,%ymm12
DB 196,65,28,89,227 ; vmulps %ymm11,%ymm12,%ymm12
@@ -5430,19 +5427,19 @@ _sk_rgb_to_hsl_avx LABEL PROC
DB 196,193,108,89,211 ; vmulps %ymm11,%ymm2,%ymm2
DB 197,252,92,201 ; vsubps %ymm1,%ymm0,%ymm1
DB 196,193,116,89,203 ; vmulps %ymm11,%ymm1,%ymm1
- DB 196,98,125,24,29,94,71,0,0 ; vbroadcastss 0x475e(%rip),%ymm11 # 5700 <_sk_callback_avx+0x1c5>
+ DB 196,98,125,24,29,94,71,0,0 ; vbroadcastss 0x475e(%rip),%ymm11 # 56fc <_sk_callback_avx+0x1c5>
DB 196,193,116,88,203 ; vaddps %ymm11,%ymm1,%ymm1
- DB 196,98,125,24,29,76,71,0,0 ; vbroadcastss 0x474c(%rip),%ymm11 # 56fc <_sk_callback_avx+0x1c1>
+ DB 196,98,125,24,29,76,71,0,0 ; vbroadcastss 0x474c(%rip),%ymm11 # 56f8 <_sk_callback_avx+0x1c1>
DB 196,193,108,88,211 ; vaddps %ymm11,%ymm2,%ymm2
DB 196,227,117,74,202,224 ; vblendvps %ymm14,%ymm2,%ymm1,%ymm1
- DB 196,226,125,24,21,52,71,0,0 ; vbroadcastss 0x4734(%rip),%ymm2 # 56f8 <_sk_callback_avx+0x1bd>
+ DB 196,226,125,24,21,52,71,0,0 ; vbroadcastss 0x4734(%rip),%ymm2 # 56f4 <_sk_callback_avx+0x1bd>
DB 196,65,12,87,246 ; vxorps %ymm14,%ymm14,%ymm14
DB 196,227,13,74,210,208 ; vblendvps %ymm13,%ymm2,%ymm14,%ymm2
DB 197,188,194,192,0 ; vcmpeqps %ymm0,%ymm8,%ymm0
DB 196,193,108,88,212 ; vaddps %ymm12,%ymm2,%ymm2
DB 196,227,117,74,194,0 ; vblendvps %ymm0,%ymm2,%ymm1,%ymm0
DB 196,193,60,88,201 ; vaddps %ymm9,%ymm8,%ymm1
- DB 196,98,125,24,37,27,71,0,0 ; vbroadcastss 0x471b(%rip),%ymm12 # 5708 <_sk_callback_avx+0x1cd>
+ DB 196,98,125,24,37,27,71,0,0 ; vbroadcastss 0x471b(%rip),%ymm12 # 5704 <_sk_callback_avx+0x1cd>
DB 196,193,116,89,212 ; vmulps %ymm12,%ymm1,%ymm2
DB 197,28,194,226,1 ; vcmpltps %ymm2,%ymm12,%ymm12
DB 196,65,36,92,216 ; vsubps %ymm8,%ymm11,%ymm11
@@ -5452,7 +5449,7 @@ _sk_rgb_to_hsl_avx LABEL PROC
DB 197,172,94,201 ; vdivps %ymm1,%ymm10,%ymm1
DB 196,195,125,74,198,128 ; vblendvps %ymm8,%ymm14,%ymm0,%ymm0
DB 196,195,117,74,206,128 ; vblendvps %ymm8,%ymm14,%ymm1,%ymm1
- DB 196,98,125,24,5,222,70,0,0 ; vbroadcastss 0x46de(%rip),%ymm8 # 5704 <_sk_callback_avx+0x1c9>
+ DB 196,98,125,24,5,222,70,0,0 ; vbroadcastss 0x46de(%rip),%ymm8 # 5700 <_sk_callback_avx+0x1c9>
DB 196,193,124,89,192 ; vmulps %ymm8,%ymm0,%ymm0
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
@@ -5467,7 +5464,7 @@ _sk_hsl_to_rgb_avx LABEL PROC
DB 197,252,17,28,36 ; vmovups %ymm3,(%rsp)
DB 197,252,40,225 ; vmovaps %ymm1,%ymm4
DB 197,252,40,216 ; vmovaps %ymm0,%ymm3
- DB 196,98,125,24,5,165,70,0,0 ; vbroadcastss 0x46a5(%rip),%ymm8 # 570c <_sk_callback_avx+0x1d1>
+ DB 196,98,125,24,5,165,70,0,0 ; vbroadcastss 0x46a5(%rip),%ymm8 # 5708 <_sk_callback_avx+0x1d1>
DB 197,60,194,202,2 ; vcmpleps %ymm2,%ymm8,%ymm9
DB 197,92,89,210 ; vmulps %ymm2,%ymm4,%ymm10
DB 196,65,92,92,218 ; vsubps %ymm10,%ymm4,%ymm11
@@ -5475,23 +5472,23 @@ _sk_hsl_to_rgb_avx LABEL PROC
DB 197,52,88,210 ; vaddps %ymm2,%ymm9,%ymm10
DB 197,108,88,202 ; vaddps %ymm2,%ymm2,%ymm9
DB 196,65,52,92,202 ; vsubps %ymm10,%ymm9,%ymm9
- DB 196,98,125,24,29,127,70,0,0 ; vbroadcastss 0x467f(%rip),%ymm11 # 5710 <_sk_callback_avx+0x1d5>
+ DB 196,98,125,24,29,127,70,0,0 ; vbroadcastss 0x467f(%rip),%ymm11 # 570c <_sk_callback_avx+0x1d5>
DB 196,65,100,88,219 ; vaddps %ymm11,%ymm3,%ymm11
DB 196,67,125,8,227,1 ; vroundps $0x1,%ymm11,%ymm12
DB 196,65,36,92,252 ; vsubps %ymm12,%ymm11,%ymm15
DB 196,65,44,92,217 ; vsubps %ymm9,%ymm10,%ymm11
- DB 196,98,125,24,37,105,70,0,0 ; vbroadcastss 0x4669(%rip),%ymm12 # 5718 <_sk_callback_avx+0x1dd>
+ DB 196,98,125,24,37,105,70,0,0 ; vbroadcastss 0x4669(%rip),%ymm12 # 5714 <_sk_callback_avx+0x1dd>
DB 196,193,4,89,196 ; vmulps %ymm12,%ymm15,%ymm0
- DB 196,98,125,24,45,95,70,0,0 ; vbroadcastss 0x465f(%rip),%ymm13 # 571c <_sk_callback_avx+0x1e1>
+ DB 196,98,125,24,45,95,70,0,0 ; vbroadcastss 0x465f(%rip),%ymm13 # 5718 <_sk_callback_avx+0x1e1>
DB 197,20,92,240 ; vsubps %ymm0,%ymm13,%ymm14
DB 196,65,36,89,246 ; vmulps %ymm14,%ymm11,%ymm14
DB 196,65,52,88,246 ; vaddps %ymm14,%ymm9,%ymm14
- DB 196,226,125,24,13,64,70,0,0 ; vbroadcastss 0x4640(%rip),%ymm1 # 5714 <_sk_callback_avx+0x1d9>
+ DB 196,226,125,24,13,64,70,0,0 ; vbroadcastss 0x4640(%rip),%ymm1 # 5710 <_sk_callback_avx+0x1d9>
DB 196,193,116,194,255,2 ; vcmpleps %ymm15,%ymm1,%ymm7
DB 196,195,13,74,249,112 ; vblendvps %ymm7,%ymm9,%ymm14,%ymm7
DB 196,65,60,194,247,2 ; vcmpleps %ymm15,%ymm8,%ymm14
DB 196,227,45,74,255,224 ; vblendvps %ymm14,%ymm7,%ymm10,%ymm7
- DB 196,98,125,24,53,43,70,0,0 ; vbroadcastss 0x462b(%rip),%ymm14 # 5720 <_sk_callback_avx+0x1e5>
+ DB 196,98,125,24,53,43,70,0,0 ; vbroadcastss 0x462b(%rip),%ymm14 # 571c <_sk_callback_avx+0x1e5>
DB 196,65,12,194,255,2 ; vcmpleps %ymm15,%ymm14,%ymm15
DB 196,193,124,89,195 ; vmulps %ymm11,%ymm0,%ymm0
DB 197,180,88,192 ; vaddps %ymm0,%ymm9,%ymm0
@@ -5510,7 +5507,7 @@ _sk_hsl_to_rgb_avx LABEL PROC
DB 197,164,89,247 ; vmulps %ymm7,%ymm11,%ymm6
DB 197,180,88,246 ; vaddps %ymm6,%ymm9,%ymm6
DB 196,227,77,74,237,0 ; vblendvps %ymm0,%ymm5,%ymm6,%ymm5
- DB 196,226,125,24,5,205,69,0,0 ; vbroadcastss 0x45cd(%rip),%ymm0 # 5724 <_sk_callback_avx+0x1e9>
+ DB 196,226,125,24,5,205,69,0,0 ; vbroadcastss 0x45cd(%rip),%ymm0 # 5720 <_sk_callback_avx+0x1e9>
DB 197,228,88,192 ; vaddps %ymm0,%ymm3,%ymm0
DB 196,227,125,8,216,1 ; vroundps $0x1,%ymm0,%ymm3
DB 197,252,92,195 ; vsubps %ymm3,%ymm0,%ymm0
@@ -5558,14 +5555,14 @@ _sk_scale_u8_avx LABEL PROC
DB 72,139,0 ; mov (%rax),%rax
DB 72,1,248 ; add %rdi,%rax
DB 77,133,192 ; test %r8,%r8
- DB 117,68 ; jne 1254 <_sk_scale_u8_avx+0x54>
+ DB 117,68 ; jne 1250 <_sk_scale_u8_avx+0x54>
DB 197,122,126,0 ; vmovq (%rax),%xmm8
DB 196,66,121,49,200 ; vpmovzxbd %xmm8,%xmm9
DB 196,67,121,4,192,229 ; vpermilps $0xe5,%xmm8,%xmm8
DB 196,66,121,49,192 ; vpmovzxbd %xmm8,%xmm8
DB 196,67,53,24,192,1 ; vinsertf128 $0x1,%xmm8,%ymm9,%ymm8
DB 196,65,124,91,192 ; vcvtdq2ps %ymm8,%ymm8
- DB 196,98,125,24,13,240,68,0,0 ; vbroadcastss 0x44f0(%rip),%ymm9 # 5728 <_sk_callback_avx+0x1ed>
+ DB 196,98,125,24,13,240,68,0,0 ; vbroadcastss 0x44f0(%rip),%ymm9 # 5724 <_sk_callback_avx+0x1ed>
DB 196,65,60,89,193 ; vmulps %ymm9,%ymm8,%ymm8
DB 197,188,89,192 ; vmulps %ymm0,%ymm8,%ymm0
DB 197,188,89,201 ; vmulps %ymm1,%ymm8,%ymm1
@@ -5583,9 +5580,9 @@ _sk_scale_u8_avx LABEL PROC
DB 77,9,217 ; or %r11,%r9
DB 72,131,193,8 ; add $0x8,%rcx
DB 73,255,202 ; dec %r10
- DB 117,234 ; jne 125c <_sk_scale_u8_avx+0x5c>
+ DB 117,234 ; jne 1258 <_sk_scale_u8_avx+0x5c>
DB 196,65,249,110,193 ; vmovq %r9,%xmm8
- DB 235,155 ; jmp 1214 <_sk_scale_u8_avx+0x14>
+ DB 235,155 ; jmp 1210 <_sk_scale_u8_avx+0x14>
PUBLIC _sk_lerp_1_float_avx
_sk_lerp_1_float_avx LABEL PROC
@@ -5613,14 +5610,14 @@ _sk_lerp_u8_avx LABEL PROC
DB 72,139,0 ; mov (%rax),%rax
DB 72,1,248 ; add %rdi,%rax
DB 77,133,192 ; test %r8,%r8
- DB 117,104 ; jne 1330 <_sk_lerp_u8_avx+0x78>
+ DB 117,104 ; jne 132c <_sk_lerp_u8_avx+0x78>
DB 197,122,126,0 ; vmovq (%rax),%xmm8
DB 196,66,121,49,200 ; vpmovzxbd %xmm8,%xmm9
DB 196,67,121,4,192,229 ; vpermilps $0xe5,%xmm8,%xmm8
DB 196,66,121,49,192 ; vpmovzxbd %xmm8,%xmm8
DB 196,67,53,24,192,1 ; vinsertf128 $0x1,%xmm8,%ymm9,%ymm8
DB 196,65,124,91,192 ; vcvtdq2ps %ymm8,%ymm8
- DB 196,98,125,24,13,60,68,0,0 ; vbroadcastss 0x443c(%rip),%ymm9 # 572c <_sk_callback_avx+0x1f1>
+ DB 196,98,125,24,13,60,68,0,0 ; vbroadcastss 0x443c(%rip),%ymm9 # 5728 <_sk_callback_avx+0x1f1>
DB 196,65,60,89,193 ; vmulps %ymm9,%ymm8,%ymm8
DB 197,252,92,196 ; vsubps %ymm4,%ymm0,%ymm0
DB 196,193,124,89,192 ; vmulps %ymm8,%ymm0,%ymm0
@@ -5646,35 +5643,35 @@ _sk_lerp_u8_avx LABEL PROC
DB 77,9,217 ; or %r11,%r9
DB 72,131,193,8 ; add $0x8,%rcx
DB 73,255,202 ; dec %r10
- DB 117,234 ; jne 1338 <_sk_lerp_u8_avx+0x80>
+ DB 117,234 ; jne 1334 <_sk_lerp_u8_avx+0x80>
DB 196,65,249,110,193 ; vmovq %r9,%xmm8
- DB 233,116,255,255,255 ; jmpq 12cc <_sk_lerp_u8_avx+0x14>
+ DB 233,116,255,255,255 ; jmpq 12c8 <_sk_lerp_u8_avx+0x14>
PUBLIC _sk_lerp_565_avx
_sk_lerp_565_avx LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 76,139,16 ; mov (%rax),%r10
DB 72,133,201 ; test %rcx,%rcx
- DB 15,133,174,0,0,0 ; jne 1414 <_sk_lerp_565_avx+0xbc>
+ DB 15,133,174,0,0,0 ; jne 1410 <_sk_lerp_565_avx+0xbc>
DB 196,65,122,111,4,122 ; vmovdqu (%r10,%rdi,2),%xmm8
DB 197,225,239,219 ; vpxor %xmm3,%xmm3,%xmm3
DB 197,185,105,219 ; vpunpckhwd %xmm3,%xmm8,%xmm3
DB 196,66,121,51,192 ; vpmovzxwd %xmm8,%xmm8
DB 196,227,61,24,219,1 ; vinsertf128 $0x1,%xmm3,%ymm8,%ymm3
- DB 196,98,125,24,5,168,67,0,0 ; vbroadcastss 0x43a8(%rip),%ymm8 # 5730 <_sk_callback_avx+0x1f5>
+ DB 196,98,125,24,5,168,67,0,0 ; vbroadcastss 0x43a8(%rip),%ymm8 # 572c <_sk_callback_avx+0x1f5>
DB 196,65,100,84,192 ; vandps %ymm8,%ymm3,%ymm8
DB 196,65,124,91,192 ; vcvtdq2ps %ymm8,%ymm8
- DB 196,98,125,24,13,153,67,0,0 ; vbroadcastss 0x4399(%rip),%ymm9 # 5734 <_sk_callback_avx+0x1f9>
+ DB 196,98,125,24,13,153,67,0,0 ; vbroadcastss 0x4399(%rip),%ymm9 # 5730 <_sk_callback_avx+0x1f9>
DB 196,65,60,89,193 ; vmulps %ymm9,%ymm8,%ymm8
- DB 196,98,125,24,13,143,67,0,0 ; vbroadcastss 0x438f(%rip),%ymm9 # 5738 <_sk_callback_avx+0x1fd>
+ DB 196,98,125,24,13,143,67,0,0 ; vbroadcastss 0x438f(%rip),%ymm9 # 5734 <_sk_callback_avx+0x1fd>
DB 196,65,100,84,201 ; vandps %ymm9,%ymm3,%ymm9
DB 196,65,124,91,201 ; vcvtdq2ps %ymm9,%ymm9
- DB 196,98,125,24,21,128,67,0,0 ; vbroadcastss 0x4380(%rip),%ymm10 # 573c <_sk_callback_avx+0x201>
+ DB 196,98,125,24,21,128,67,0,0 ; vbroadcastss 0x4380(%rip),%ymm10 # 5738 <_sk_callback_avx+0x201>
DB 196,65,52,89,202 ; vmulps %ymm10,%ymm9,%ymm9
- DB 196,98,125,24,21,118,67,0,0 ; vbroadcastss 0x4376(%rip),%ymm10 # 5740 <_sk_callback_avx+0x205>
+ DB 196,98,125,24,21,118,67,0,0 ; vbroadcastss 0x4376(%rip),%ymm10 # 573c <_sk_callback_avx+0x205>
DB 196,193,100,84,218 ; vandps %ymm10,%ymm3,%ymm3
DB 197,252,91,219 ; vcvtdq2ps %ymm3,%ymm3
- DB 196,98,125,24,21,104,67,0,0 ; vbroadcastss 0x4368(%rip),%ymm10 # 5744 <_sk_callback_avx+0x209>
+ DB 196,98,125,24,21,104,67,0,0 ; vbroadcastss 0x4368(%rip),%ymm10 # 5740 <_sk_callback_avx+0x209>
DB 196,193,100,89,218 ; vmulps %ymm10,%ymm3,%ymm3
DB 197,252,92,196 ; vsubps %ymm4,%ymm0,%ymm0
DB 196,193,124,89,192 ; vmulps %ymm8,%ymm0,%ymm0
@@ -5686,16 +5683,16 @@ _sk_lerp_565_avx LABEL PROC
DB 197,236,89,211 ; vmulps %ymm3,%ymm2,%ymm2
DB 197,236,88,214 ; vaddps %ymm6,%ymm2,%ymm2
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,29,54,67,0,0 ; vbroadcastss 0x4336(%rip),%ymm3 # 5748 <_sk_callback_avx+0x20d>
+ DB 196,226,125,24,29,54,67,0,0 ; vbroadcastss 0x4336(%rip),%ymm3 # 5744 <_sk_callback_avx+0x20d>
DB 255,224 ; jmpq *%rax
DB 65,137,200 ; mov %ecx,%r8d
DB 65,128,224,7 ; and $0x7,%r8b
DB 196,65,57,239,192 ; vpxor %xmm8,%xmm8,%xmm8
DB 65,254,200 ; dec %r8b
DB 65,128,248,6 ; cmp $0x6,%r8b
- DB 15,135,63,255,255,255 ; ja 136c <_sk_lerp_565_avx+0x14>
+ DB 15,135,63,255,255,255 ; ja 1368 <_sk_lerp_565_avx+0x14>
DB 69,15,182,192 ; movzbl %r8b,%r8d
- DB 76,141,13,76,0,0,0 ; lea 0x4c(%rip),%r9 # 1484 <_sk_lerp_565_avx+0x12c>
+ DB 76,141,13,76,0,0,0 ; lea 0x4c(%rip),%r9 # 1480 <_sk_lerp_565_avx+0x12c>
DB 75,99,4,129 ; movslq (%r9,%r8,4),%rax
DB 76,1,200 ; add %r9,%rax
DB 255,224 ; jmpq *%rax
@@ -5707,13 +5704,13 @@ _sk_lerp_565_avx LABEL PROC
DB 196,65,57,196,68,122,4,2 ; vpinsrw $0x2,0x4(%r10,%rdi,2),%xmm8,%xmm8
DB 196,65,57,196,68,122,2,1 ; vpinsrw $0x1,0x2(%r10,%rdi,2),%xmm8,%xmm8
DB 196,65,57,196,4,122,0 ; vpinsrw $0x0,(%r10,%rdi,2),%xmm8,%xmm8
- DB 233,235,254,255,255 ; jmpq 136c <_sk_lerp_565_avx+0x14>
+ DB 233,235,254,255,255 ; jmpq 1368 <_sk_lerp_565_avx+0x14>
DB 15,31,0 ; nopl (%rax)
DB 241 ; icebp
DB 255 ; (bad)
DB 255 ; (bad)
DB 255 ; (bad)
- DB 233,255,255,255,225 ; jmpq ffffffffe200148c <_sk_callback_avx+0xffffffffe1ffbf51>
+ DB 233,255,255,255,225 ; jmpq ffffffffe2001488 <_sk_callback_avx+0xffffffffe1ffbf51>
DB 255 ; (bad)
DB 255 ; (bad)
DB 255 ; (bad)
@@ -5736,7 +5733,7 @@ _sk_load_tables_avx LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 76,139,0 ; mov (%rax),%r8
DB 72,133,201 ; test %rcx,%rcx
- DB 15,133,26,2,0,0 ; jne 16c8 <_sk_load_tables_avx+0x228>
+ DB 15,133,26,2,0,0 ; jne 16c4 <_sk_load_tables_avx+0x228>
DB 196,65,124,16,4,184 ; vmovups (%r8,%rdi,4),%ymm8
DB 85 ; push %rbp
DB 65,87 ; push %r15
@@ -5744,7 +5741,7 @@ _sk_load_tables_avx LABEL PROC
DB 65,85 ; push %r13
DB 65,84 ; push %r12
DB 83 ; push %rbx
- DB 197,124,40,13,90,69,0,0 ; vmovaps 0x455a(%rip),%ymm9 # 5a20 <_sk_callback_avx+0x4e5>
+ DB 197,124,40,13,94,69,0,0 ; vmovaps 0x455e(%rip),%ymm9 # 5a20 <_sk_callback_avx+0x4e9>
DB 196,193,60,84,193 ; vandps %ymm9,%ymm8,%ymm0
DB 196,193,249,126,193 ; vmovq %xmm0,%r9
DB 69,137,203 ; mov %r9d,%r11d
@@ -5836,7 +5833,7 @@ _sk_load_tables_avx LABEL PROC
DB 196,193,97,114,210,24 ; vpsrld $0x18,%xmm10,%xmm3
DB 196,227,61,24,219,1 ; vinsertf128 $0x1,%xmm3,%ymm8,%ymm3
DB 197,252,91,219 ; vcvtdq2ps %ymm3,%ymm3
- DB 196,98,125,24,5,151,64,0,0 ; vbroadcastss 0x4097(%rip),%ymm8 # 574c <_sk_callback_avx+0x211>
+ DB 196,98,125,24,5,151,64,0,0 ; vbroadcastss 0x4097(%rip),%ymm8 # 5748 <_sk_callback_avx+0x211>
DB 196,193,100,89,216 ; vmulps %ymm8,%ymm3,%ymm3
DB 72,173 ; lods %ds:(%rsi),%rax
DB 91 ; pop %rbx
@@ -5851,9 +5848,9 @@ _sk_load_tables_avx LABEL PROC
DB 196,65,60,87,192 ; vxorps %ymm8,%ymm8,%ymm8
DB 65,254,201 ; dec %r9b
DB 65,128,249,6 ; cmp $0x6,%r9b
- DB 15,135,211,253,255,255 ; ja 14b4 <_sk_load_tables_avx+0x14>
+ DB 15,135,211,253,255,255 ; ja 14b0 <_sk_load_tables_avx+0x14>
DB 69,15,182,201 ; movzbl %r9b,%r9d
- DB 76,141,21,140,0,0,0 ; lea 0x8c(%rip),%r10 # 1778 <_sk_load_tables_avx+0x2d8>
+ DB 76,141,21,140,0,0,0 ; lea 0x8c(%rip),%r10 # 1774 <_sk_load_tables_avx+0x2d8>
DB 79,99,12,138 ; movslq (%r10,%r9,4),%r9
DB 77,1,209 ; add %r10,%r9
DB 65,255,225 ; jmpq *%r9
@@ -5876,7 +5873,7 @@ _sk_load_tables_avx LABEL PROC
DB 196,99,61,12,192,15 ; vblendps $0xf,%ymm0,%ymm8,%ymm8
DB 196,195,57,34,4,184,0 ; vpinsrd $0x0,(%r8,%rdi,4),%xmm8,%xmm0
DB 196,99,61,12,192,15 ; vblendps $0xf,%ymm0,%ymm8,%ymm8
- DB 233,62,253,255,255 ; jmpq 14b4 <_sk_load_tables_avx+0x14>
+ DB 233,62,253,255,255 ; jmpq 14b0 <_sk_load_tables_avx+0x14>
DB 102,144 ; xchg %ax,%ax
DB 236 ; in (%dx),%al
DB 255 ; (bad)
@@ -5894,7 +5891,7 @@ _sk_load_tables_avx LABEL PROC
DB 255 ; (bad)
DB 255 ; (bad)
DB 255 ; (bad)
- DB 126,255 ; jle 1791 <_sk_load_tables_avx+0x2f1>
+ DB 126,255 ; jle 178d <_sk_load_tables_avx+0x2f1>
DB 255 ; (bad)
DB 255 ; .byte 0xff
@@ -5904,7 +5901,7 @@ _sk_load_tables_u16_be_avx LABEL PROC
DB 76,139,0 ; mov (%rax),%r8
DB 76,141,12,189,0,0,0,0 ; lea 0x0(,%rdi,4),%r9
DB 72,133,201 ; test %rcx,%rcx
- DB 15,133,113,2,0,0 ; jne 1a1b <_sk_load_tables_u16_be_avx+0x287>
+ DB 15,133,113,2,0,0 ; jne 1a17 <_sk_load_tables_u16_be_avx+0x287>
DB 196,1,121,16,4,72 ; vmovupd (%r8,%r9,2),%xmm8
DB 196,129,121,16,84,72,16 ; vmovupd 0x10(%r8,%r9,2),%xmm2
DB 196,129,121,16,92,72,32 ; vmovupd 0x20(%r8,%r9,2),%xmm3
@@ -5926,7 +5923,7 @@ _sk_load_tables_u16_be_avx LABEL PROC
DB 197,177,108,208 ; vpunpcklqdq %xmm0,%xmm9,%xmm2
DB 197,177,109,200 ; vpunpckhqdq %xmm0,%xmm9,%xmm1
DB 196,65,57,108,212 ; vpunpcklqdq %xmm12,%xmm8,%xmm10
- DB 197,121,111,29,154,66,0,0 ; vmovdqa 0x429a(%rip),%xmm11 # 5aa0 <_sk_callback_avx+0x565>
+ DB 197,121,111,29,158,66,0,0 ; vmovdqa 0x429e(%rip),%xmm11 # 5aa0 <_sk_callback_avx+0x569>
DB 196,193,105,219,195 ; vpand %xmm11,%xmm2,%xmm0
DB 196,65,49,239,201 ; vpxor %xmm9,%xmm9,%xmm9
DB 196,193,121,105,209 ; vpunpckhwd %xmm9,%xmm0,%xmm2
@@ -6025,7 +6022,7 @@ _sk_load_tables_u16_be_avx LABEL PROC
DB 196,226,121,51,219 ; vpmovzxwd %xmm3,%xmm3
DB 196,195,101,24,216,1 ; vinsertf128 $0x1,%xmm8,%ymm3,%ymm3
DB 197,252,91,219 ; vcvtdq2ps %ymm3,%ymm3
- DB 196,98,125,24,5,72,61,0,0 ; vbroadcastss 0x3d48(%rip),%ymm8 # 5750 <_sk_callback_avx+0x215>
+ DB 196,98,125,24,5,72,61,0,0 ; vbroadcastss 0x3d48(%rip),%ymm8 # 574c <_sk_callback_avx+0x215>
DB 196,193,100,89,216 ; vmulps %ymm8,%ymm3,%ymm3
DB 72,173 ; lods %ds:(%rsi),%rax
DB 91 ; pop %rbx
@@ -6038,29 +6035,29 @@ _sk_load_tables_u16_be_avx LABEL PROC
DB 196,1,123,16,4,72 ; vmovsd (%r8,%r9,2),%xmm8
DB 196,65,49,239,201 ; vpxor %xmm9,%xmm9,%xmm9
DB 72,131,249,1 ; cmp $0x1,%rcx
- DB 116,85 ; je 1a81 <_sk_load_tables_u16_be_avx+0x2ed>
+ DB 116,85 ; je 1a7d <_sk_load_tables_u16_be_avx+0x2ed>
DB 196,1,57,22,68,72,8 ; vmovhpd 0x8(%r8,%r9,2),%xmm8,%xmm8
DB 72,131,249,3 ; cmp $0x3,%rcx
- DB 114,72 ; jb 1a81 <_sk_load_tables_u16_be_avx+0x2ed>
+ DB 114,72 ; jb 1a7d <_sk_load_tables_u16_be_avx+0x2ed>
DB 196,129,123,16,84,72,16 ; vmovsd 0x10(%r8,%r9,2),%xmm2
DB 72,131,249,3 ; cmp $0x3,%rcx
- DB 116,72 ; je 1a8e <_sk_load_tables_u16_be_avx+0x2fa>
+ DB 116,72 ; je 1a8a <_sk_load_tables_u16_be_avx+0x2fa>
DB 196,129,105,22,84,72,24 ; vmovhpd 0x18(%r8,%r9,2),%xmm2,%xmm2
DB 72,131,249,5 ; cmp $0x5,%rcx
- DB 114,59 ; jb 1a8e <_sk_load_tables_u16_be_avx+0x2fa>
+ DB 114,59 ; jb 1a8a <_sk_load_tables_u16_be_avx+0x2fa>
DB 196,129,123,16,92,72,32 ; vmovsd 0x20(%r8,%r9,2),%xmm3
DB 72,131,249,5 ; cmp $0x5,%rcx
- DB 15,132,97,253,255,255 ; je 17c5 <_sk_load_tables_u16_be_avx+0x31>
+ DB 15,132,97,253,255,255 ; je 17c1 <_sk_load_tables_u16_be_avx+0x31>
DB 196,129,97,22,92,72,40 ; vmovhpd 0x28(%r8,%r9,2),%xmm3,%xmm3
DB 72,131,249,7 ; cmp $0x7,%rcx
- DB 15,130,80,253,255,255 ; jb 17c5 <_sk_load_tables_u16_be_avx+0x31>
+ DB 15,130,80,253,255,255 ; jb 17c1 <_sk_load_tables_u16_be_avx+0x31>
DB 196,1,122,126,76,72,48 ; vmovq 0x30(%r8,%r9,2),%xmm9
- DB 233,68,253,255,255 ; jmpq 17c5 <_sk_load_tables_u16_be_avx+0x31>
+ DB 233,68,253,255,255 ; jmpq 17c1 <_sk_load_tables_u16_be_avx+0x31>
DB 197,225,87,219 ; vxorpd %xmm3,%xmm3,%xmm3
DB 197,233,87,210 ; vxorpd %xmm2,%xmm2,%xmm2
- DB 233,55,253,255,255 ; jmpq 17c5 <_sk_load_tables_u16_be_avx+0x31>
+ DB 233,55,253,255,255 ; jmpq 17c1 <_sk_load_tables_u16_be_avx+0x31>
DB 197,225,87,219 ; vxorpd %xmm3,%xmm3,%xmm3
- DB 233,46,253,255,255 ; jmpq 17c5 <_sk_load_tables_u16_be_avx+0x31>
+ DB 233,46,253,255,255 ; jmpq 17c1 <_sk_load_tables_u16_be_avx+0x31>
PUBLIC _sk_load_tables_rgb_u16_be_avx
_sk_load_tables_rgb_u16_be_avx LABEL PROC
@@ -6068,7 +6065,7 @@ _sk_load_tables_rgb_u16_be_avx LABEL PROC
DB 76,139,0 ; mov (%rax),%r8
DB 76,141,12,127 ; lea (%rdi,%rdi,2),%r9
DB 72,133,201 ; test %rcx,%rcx
- DB 15,133,93,2,0,0 ; jne 1d06 <_sk_load_tables_rgb_u16_be_avx+0x26f>
+ DB 15,133,93,2,0,0 ; jne 1d02 <_sk_load_tables_rgb_u16_be_avx+0x26f>
DB 196,129,122,111,4,72 ; vmovdqu (%r8,%r9,2),%xmm0
DB 196,129,122,111,84,72,12 ; vmovdqu 0xc(%r8,%r9,2),%xmm2
DB 196,129,122,111,76,72,24 ; vmovdqu 0x18(%r8,%r9,2),%xmm1
@@ -6095,7 +6092,7 @@ _sk_load_tables_rgb_u16_be_avx LABEL PROC
DB 197,185,108,202 ; vpunpcklqdq %xmm2,%xmm8,%xmm1
DB 197,185,109,210 ; vpunpckhqdq %xmm2,%xmm8,%xmm2
DB 197,121,108,195 ; vpunpcklqdq %xmm3,%xmm0,%xmm8
- DB 197,121,111,13,147,63,0,0 ; vmovdqa 0x3f93(%rip),%xmm9 # 5ab0 <_sk_callback_avx+0x575>
+ DB 197,121,111,13,151,63,0,0 ; vmovdqa 0x3f97(%rip),%xmm9 # 5ab0 <_sk_callback_avx+0x579>
DB 196,193,113,219,193 ; vpand %xmm9,%xmm1,%xmm0
DB 196,65,41,239,210 ; vpxor %xmm10,%xmm10,%xmm10
DB 196,193,121,105,202 ; vpunpckhwd %xmm10,%xmm0,%xmm1
@@ -6187,7 +6184,7 @@ _sk_load_tables_rgb_u16_be_avx LABEL PROC
DB 196,227,105,33,211,48 ; vinsertps $0x30,%xmm3,%xmm2,%xmm2
DB 196,195,109,24,208,1 ; vinsertf128 $0x1,%xmm8,%ymm2,%ymm2
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,29,90,58,0,0 ; vbroadcastss 0x3a5a(%rip),%ymm3 # 5754 <_sk_callback_avx+0x219>
+ DB 196,226,125,24,29,90,58,0,0 ; vbroadcastss 0x3a5a(%rip),%ymm3 # 5750 <_sk_callback_avx+0x219>
DB 91 ; pop %rbx
DB 65,92 ; pop %r12
DB 65,93 ; pop %r13
@@ -6198,36 +6195,36 @@ _sk_load_tables_rgb_u16_be_avx LABEL PROC
DB 196,129,121,110,4,72 ; vmovd (%r8,%r9,2),%xmm0
DB 196,129,121,196,68,72,4,2 ; vpinsrw $0x2,0x4(%r8,%r9,2),%xmm0,%xmm0
DB 72,131,249,1 ; cmp $0x1,%rcx
- DB 117,5 ; jne 1d1f <_sk_load_tables_rgb_u16_be_avx+0x288>
- DB 233,190,253,255,255 ; jmpq 1add <_sk_load_tables_rgb_u16_be_avx+0x46>
+ DB 117,5 ; jne 1d1b <_sk_load_tables_rgb_u16_be_avx+0x288>
+ DB 233,190,253,255,255 ; jmpq 1ad9 <_sk_load_tables_rgb_u16_be_avx+0x46>
DB 196,129,121,110,76,72,6 ; vmovd 0x6(%r8,%r9,2),%xmm1
DB 196,1,113,196,68,72,10,2 ; vpinsrw $0x2,0xa(%r8,%r9,2),%xmm1,%xmm8
DB 72,131,249,3 ; cmp $0x3,%rcx
- DB 114,26 ; jb 1d4e <_sk_load_tables_rgb_u16_be_avx+0x2b7>
+ DB 114,26 ; jb 1d4a <_sk_load_tables_rgb_u16_be_avx+0x2b7>
DB 196,129,121,110,76,72,12 ; vmovd 0xc(%r8,%r9,2),%xmm1
DB 196,129,113,196,84,72,16,2 ; vpinsrw $0x2,0x10(%r8,%r9,2),%xmm1,%xmm2
DB 72,131,249,3 ; cmp $0x3,%rcx
- DB 117,10 ; jne 1d53 <_sk_load_tables_rgb_u16_be_avx+0x2bc>
- DB 233,143,253,255,255 ; jmpq 1add <_sk_load_tables_rgb_u16_be_avx+0x46>
- DB 233,138,253,255,255 ; jmpq 1add <_sk_load_tables_rgb_u16_be_avx+0x46>
+ DB 117,10 ; jne 1d4f <_sk_load_tables_rgb_u16_be_avx+0x2bc>
+ DB 233,143,253,255,255 ; jmpq 1ad9 <_sk_load_tables_rgb_u16_be_avx+0x46>
+ DB 233,138,253,255,255 ; jmpq 1ad9 <_sk_load_tables_rgb_u16_be_avx+0x46>
DB 196,129,121,110,76,72,18 ; vmovd 0x12(%r8,%r9,2),%xmm1
DB 196,1,113,196,76,72,22,2 ; vpinsrw $0x2,0x16(%r8,%r9,2),%xmm1,%xmm9
DB 72,131,249,5 ; cmp $0x5,%rcx
- DB 114,26 ; jb 1d82 <_sk_load_tables_rgb_u16_be_avx+0x2eb>
+ DB 114,26 ; jb 1d7e <_sk_load_tables_rgb_u16_be_avx+0x2eb>
DB 196,129,121,110,76,72,24 ; vmovd 0x18(%r8,%r9,2),%xmm1
DB 196,129,113,196,76,72,28,2 ; vpinsrw $0x2,0x1c(%r8,%r9,2),%xmm1,%xmm1
DB 72,131,249,5 ; cmp $0x5,%rcx
- DB 117,10 ; jne 1d87 <_sk_load_tables_rgb_u16_be_avx+0x2f0>
- DB 233,91,253,255,255 ; jmpq 1add <_sk_load_tables_rgb_u16_be_avx+0x46>
- DB 233,86,253,255,255 ; jmpq 1add <_sk_load_tables_rgb_u16_be_avx+0x46>
+ DB 117,10 ; jne 1d83 <_sk_load_tables_rgb_u16_be_avx+0x2f0>
+ DB 233,91,253,255,255 ; jmpq 1ad9 <_sk_load_tables_rgb_u16_be_avx+0x46>
+ DB 233,86,253,255,255 ; jmpq 1ad9 <_sk_load_tables_rgb_u16_be_avx+0x46>
DB 196,129,121,110,92,72,30 ; vmovd 0x1e(%r8,%r9,2),%xmm3
DB 196,1,97,196,92,72,34,2 ; vpinsrw $0x2,0x22(%r8,%r9,2),%xmm3,%xmm11
DB 72,131,249,7 ; cmp $0x7,%rcx
- DB 114,20 ; jb 1db0 <_sk_load_tables_rgb_u16_be_avx+0x319>
+ DB 114,20 ; jb 1dac <_sk_load_tables_rgb_u16_be_avx+0x319>
DB 196,129,121,110,92,72,36 ; vmovd 0x24(%r8,%r9,2),%xmm3
DB 196,129,97,196,92,72,40,2 ; vpinsrw $0x2,0x28(%r8,%r9,2),%xmm3,%xmm3
- DB 233,45,253,255,255 ; jmpq 1add <_sk_load_tables_rgb_u16_be_avx+0x46>
- DB 233,40,253,255,255 ; jmpq 1add <_sk_load_tables_rgb_u16_be_avx+0x46>
+ DB 233,45,253,255,255 ; jmpq 1ad9 <_sk_load_tables_rgb_u16_be_avx+0x46>
+ DB 233,40,253,255,255 ; jmpq 1ad9 <_sk_load_tables_rgb_u16_be_avx+0x46>
PUBLIC _sk_byte_tables_avx
_sk_byte_tables_avx LABEL PROC
@@ -6238,7 +6235,7 @@ _sk_byte_tables_avx LABEL PROC
DB 65,84 ; push %r12
DB 83 ; push %rbx
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,98,125,24,5,142,57,0,0 ; vbroadcastss 0x398e(%rip),%ymm8 # 5758 <_sk_callback_avx+0x21d>
+ DB 196,98,125,24,5,142,57,0,0 ; vbroadcastss 0x398e(%rip),%ymm8 # 5754 <_sk_callback_avx+0x21d>
DB 196,193,124,89,192 ; vmulps %ymm8,%ymm0,%ymm0
DB 197,253,91,192 ; vcvtps2dq %ymm0,%ymm0
DB 196,195,249,22,192,1 ; vpextrq $0x1,%xmm0,%r8
@@ -6275,7 +6272,7 @@ _sk_byte_tables_avx LABEL PROC
DB 196,226,121,49,192 ; vpmovzxbd %xmm0,%xmm0
DB 196,227,53,24,192,1 ; vinsertf128 $0x1,%xmm0,%ymm9,%ymm0
DB 197,252,91,192 ; vcvtdq2ps %ymm0,%ymm0
- DB 196,98,125,24,13,220,56,0,0 ; vbroadcastss 0x38dc(%rip),%ymm9 # 575c <_sk_callback_avx+0x221>
+ DB 196,98,125,24,13,220,56,0,0 ; vbroadcastss 0x38dc(%rip),%ymm9 # 5758 <_sk_callback_avx+0x221>
DB 196,193,124,89,193 ; vmulps %ymm9,%ymm0,%ymm0
DB 196,193,116,89,200 ; vmulps %ymm8,%ymm1,%ymm1
DB 197,253,91,201 ; vcvtps2dq %ymm1,%ymm1
@@ -6435,7 +6432,7 @@ _sk_byte_tables_rgb_avx LABEL PROC
DB 196,226,121,49,192 ; vpmovzxbd %xmm0,%xmm0
DB 196,227,53,24,192,1 ; vinsertf128 $0x1,%xmm0,%ymm9,%ymm0
DB 197,252,91,192 ; vcvtdq2ps %ymm0,%ymm0
- DB 196,98,125,24,13,2,54,0,0 ; vbroadcastss 0x3602(%rip),%ymm9 # 5760 <_sk_callback_avx+0x225>
+ DB 196,98,125,24,13,2,54,0,0 ; vbroadcastss 0x3602(%rip),%ymm9 # 575c <_sk_callback_avx+0x225>
DB 196,193,124,89,193 ; vmulps %ymm9,%ymm0,%ymm0
DB 197,188,89,201 ; vmulps %ymm1,%ymm8,%ymm1
DB 197,253,91,201 ; vcvtps2dq %ymm1,%ymm1
@@ -6722,36 +6719,36 @@ _sk_parametric_r_avx LABEL PROC
DB 196,193,124,88,195 ; vaddps %ymm11,%ymm0,%ymm0
DB 196,98,125,24,16 ; vbroadcastss (%rax),%ymm10
DB 197,124,91,216 ; vcvtdq2ps %ymm0,%ymm11
- DB 196,98,125,24,37,96,49,0,0 ; vbroadcastss 0x3160(%rip),%ymm12 # 5764 <_sk_callback_avx+0x229>
+ DB 196,98,125,24,37,96,49,0,0 ; vbroadcastss 0x3160(%rip),%ymm12 # 5760 <_sk_callback_avx+0x229>
DB 196,65,36,89,220 ; vmulps %ymm12,%ymm11,%ymm11
- DB 196,98,125,24,37,86,49,0,0 ; vbroadcastss 0x3156(%rip),%ymm12 # 5768 <_sk_callback_avx+0x22d>
+ DB 196,98,125,24,37,86,49,0,0 ; vbroadcastss 0x3156(%rip),%ymm12 # 5764 <_sk_callback_avx+0x22d>
DB 196,193,124,84,196 ; vandps %ymm12,%ymm0,%ymm0
- DB 196,98,125,24,37,76,49,0,0 ; vbroadcastss 0x314c(%rip),%ymm12 # 576c <_sk_callback_avx+0x231>
+ DB 196,98,125,24,37,76,49,0,0 ; vbroadcastss 0x314c(%rip),%ymm12 # 5768 <_sk_callback_avx+0x231>
DB 196,193,124,86,196 ; vorps %ymm12,%ymm0,%ymm0
- DB 196,98,125,24,37,66,49,0,0 ; vbroadcastss 0x3142(%rip),%ymm12 # 5770 <_sk_callback_avx+0x235>
+ DB 196,98,125,24,37,66,49,0,0 ; vbroadcastss 0x3142(%rip),%ymm12 # 576c <_sk_callback_avx+0x235>
DB 196,65,36,88,220 ; vaddps %ymm12,%ymm11,%ymm11
- DB 196,98,125,24,37,56,49,0,0 ; vbroadcastss 0x3138(%rip),%ymm12 # 5774 <_sk_callback_avx+0x239>
+ DB 196,98,125,24,37,56,49,0,0 ; vbroadcastss 0x3138(%rip),%ymm12 # 5770 <_sk_callback_avx+0x239>
DB 196,65,124,89,228 ; vmulps %ymm12,%ymm0,%ymm12
DB 196,65,36,92,220 ; vsubps %ymm12,%ymm11,%ymm11
- DB 196,98,125,24,37,41,49,0,0 ; vbroadcastss 0x3129(%rip),%ymm12 # 5778 <_sk_callback_avx+0x23d>
+ DB 196,98,125,24,37,41,49,0,0 ; vbroadcastss 0x3129(%rip),%ymm12 # 5774 <_sk_callback_avx+0x23d>
DB 196,193,124,88,196 ; vaddps %ymm12,%ymm0,%ymm0
- DB 196,98,125,24,37,31,49,0,0 ; vbroadcastss 0x311f(%rip),%ymm12 # 577c <_sk_callback_avx+0x241>
+ DB 196,98,125,24,37,31,49,0,0 ; vbroadcastss 0x311f(%rip),%ymm12 # 5778 <_sk_callback_avx+0x241>
DB 197,156,94,192 ; vdivps %ymm0,%ymm12,%ymm0
DB 197,164,92,192 ; vsubps %ymm0,%ymm11,%ymm0
DB 197,172,89,192 ; vmulps %ymm0,%ymm10,%ymm0
DB 196,99,125,8,208,1 ; vroundps $0x1,%ymm0,%ymm10
DB 196,65,124,92,210 ; vsubps %ymm10,%ymm0,%ymm10
- DB 196,98,125,24,29,3,49,0,0 ; vbroadcastss 0x3103(%rip),%ymm11 # 5780 <_sk_callback_avx+0x245>
+ DB 196,98,125,24,29,3,49,0,0 ; vbroadcastss 0x3103(%rip),%ymm11 # 577c <_sk_callback_avx+0x245>
DB 196,193,124,88,195 ; vaddps %ymm11,%ymm0,%ymm0
- DB 196,98,125,24,29,249,48,0,0 ; vbroadcastss 0x30f9(%rip),%ymm11 # 5784 <_sk_callback_avx+0x249>
+ DB 196,98,125,24,29,249,48,0,0 ; vbroadcastss 0x30f9(%rip),%ymm11 # 5780 <_sk_callback_avx+0x249>
DB 196,65,44,89,219 ; vmulps %ymm11,%ymm10,%ymm11
DB 196,193,124,92,195 ; vsubps %ymm11,%ymm0,%ymm0
- DB 196,98,125,24,29,234,48,0,0 ; vbroadcastss 0x30ea(%rip),%ymm11 # 5788 <_sk_callback_avx+0x24d>
+ DB 196,98,125,24,29,234,48,0,0 ; vbroadcastss 0x30ea(%rip),%ymm11 # 5784 <_sk_callback_avx+0x24d>
DB 196,65,36,92,210 ; vsubps %ymm10,%ymm11,%ymm10
- DB 196,98,125,24,29,224,48,0,0 ; vbroadcastss 0x30e0(%rip),%ymm11 # 578c <_sk_callback_avx+0x251>
+ DB 196,98,125,24,29,224,48,0,0 ; vbroadcastss 0x30e0(%rip),%ymm11 # 5788 <_sk_callback_avx+0x251>
DB 196,65,36,94,210 ; vdivps %ymm10,%ymm11,%ymm10
DB 196,193,124,88,194 ; vaddps %ymm10,%ymm0,%ymm0
- DB 196,98,125,24,21,209,48,0,0 ; vbroadcastss 0x30d1(%rip),%ymm10 # 5790 <_sk_callback_avx+0x255>
+ DB 196,98,125,24,21,209,48,0,0 ; vbroadcastss 0x30d1(%rip),%ymm10 # 578c <_sk_callback_avx+0x255>
DB 196,193,124,89,194 ; vmulps %ymm10,%ymm0,%ymm0
DB 197,253,91,192 ; vcvtps2dq %ymm0,%ymm0
DB 196,98,125,24,80,20 ; vbroadcastss 0x14(%rax),%ymm10
@@ -6759,7 +6756,7 @@ _sk_parametric_r_avx LABEL PROC
DB 196,195,125,74,193,128 ; vblendvps %ymm8,%ymm9,%ymm0,%ymm0
DB 196,65,60,87,192 ; vxorps %ymm8,%ymm8,%ymm8
DB 196,193,124,95,192 ; vmaxps %ymm8,%ymm0,%ymm0
- DB 196,98,125,24,5,168,48,0,0 ; vbroadcastss 0x30a8(%rip),%ymm8 # 5794 <_sk_callback_avx+0x259>
+ DB 196,98,125,24,5,168,48,0,0 ; vbroadcastss 0x30a8(%rip),%ymm8 # 5790 <_sk_callback_avx+0x259>
DB 196,193,124,93,192 ; vminps %ymm8,%ymm0,%ymm0
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
@@ -6779,36 +6776,36 @@ _sk_parametric_g_avx LABEL PROC
DB 196,193,116,88,203 ; vaddps %ymm11,%ymm1,%ymm1
DB 196,98,125,24,16 ; vbroadcastss (%rax),%ymm10
DB 197,124,91,217 ; vcvtdq2ps %ymm1,%ymm11
- DB 196,98,125,24,37,89,48,0,0 ; vbroadcastss 0x3059(%rip),%ymm12 # 5798 <_sk_callback_avx+0x25d>
+ DB 196,98,125,24,37,89,48,0,0 ; vbroadcastss 0x3059(%rip),%ymm12 # 5794 <_sk_callback_avx+0x25d>
DB 196,65,36,89,220 ; vmulps %ymm12,%ymm11,%ymm11
- DB 196,98,125,24,37,79,48,0,0 ; vbroadcastss 0x304f(%rip),%ymm12 # 579c <_sk_callback_avx+0x261>
+ DB 196,98,125,24,37,79,48,0,0 ; vbroadcastss 0x304f(%rip),%ymm12 # 5798 <_sk_callback_avx+0x261>
DB 196,193,116,84,204 ; vandps %ymm12,%ymm1,%ymm1
- DB 196,98,125,24,37,69,48,0,0 ; vbroadcastss 0x3045(%rip),%ymm12 # 57a0 <_sk_callback_avx+0x265>
+ DB 196,98,125,24,37,69,48,0,0 ; vbroadcastss 0x3045(%rip),%ymm12 # 579c <_sk_callback_avx+0x265>
DB 196,193,116,86,204 ; vorps %ymm12,%ymm1,%ymm1
- DB 196,98,125,24,37,59,48,0,0 ; vbroadcastss 0x303b(%rip),%ymm12 # 57a4 <_sk_callback_avx+0x269>
+ DB 196,98,125,24,37,59,48,0,0 ; vbroadcastss 0x303b(%rip),%ymm12 # 57a0 <_sk_callback_avx+0x269>
DB 196,65,36,88,220 ; vaddps %ymm12,%ymm11,%ymm11
- DB 196,98,125,24,37,49,48,0,0 ; vbroadcastss 0x3031(%rip),%ymm12 # 57a8 <_sk_callback_avx+0x26d>
+ DB 196,98,125,24,37,49,48,0,0 ; vbroadcastss 0x3031(%rip),%ymm12 # 57a4 <_sk_callback_avx+0x26d>
DB 196,65,116,89,228 ; vmulps %ymm12,%ymm1,%ymm12
DB 196,65,36,92,220 ; vsubps %ymm12,%ymm11,%ymm11
- DB 196,98,125,24,37,34,48,0,0 ; vbroadcastss 0x3022(%rip),%ymm12 # 57ac <_sk_callback_avx+0x271>
+ DB 196,98,125,24,37,34,48,0,0 ; vbroadcastss 0x3022(%rip),%ymm12 # 57a8 <_sk_callback_avx+0x271>
DB 196,193,116,88,204 ; vaddps %ymm12,%ymm1,%ymm1
- DB 196,98,125,24,37,24,48,0,0 ; vbroadcastss 0x3018(%rip),%ymm12 # 57b0 <_sk_callback_avx+0x275>
+ DB 196,98,125,24,37,24,48,0,0 ; vbroadcastss 0x3018(%rip),%ymm12 # 57ac <_sk_callback_avx+0x275>
DB 197,156,94,201 ; vdivps %ymm1,%ymm12,%ymm1
DB 197,164,92,201 ; vsubps %ymm1,%ymm11,%ymm1
DB 197,172,89,201 ; vmulps %ymm1,%ymm10,%ymm1
DB 196,99,125,8,209,1 ; vroundps $0x1,%ymm1,%ymm10
DB 196,65,116,92,210 ; vsubps %ymm10,%ymm1,%ymm10
- DB 196,98,125,24,29,252,47,0,0 ; vbroadcastss 0x2ffc(%rip),%ymm11 # 57b4 <_sk_callback_avx+0x279>
+ DB 196,98,125,24,29,252,47,0,0 ; vbroadcastss 0x2ffc(%rip),%ymm11 # 57b0 <_sk_callback_avx+0x279>
DB 196,193,116,88,203 ; vaddps %ymm11,%ymm1,%ymm1
- DB 196,98,125,24,29,242,47,0,0 ; vbroadcastss 0x2ff2(%rip),%ymm11 # 57b8 <_sk_callback_avx+0x27d>
+ DB 196,98,125,24,29,242,47,0,0 ; vbroadcastss 0x2ff2(%rip),%ymm11 # 57b4 <_sk_callback_avx+0x27d>
DB 196,65,44,89,219 ; vmulps %ymm11,%ymm10,%ymm11
DB 196,193,116,92,203 ; vsubps %ymm11,%ymm1,%ymm1
- DB 196,98,125,24,29,227,47,0,0 ; vbroadcastss 0x2fe3(%rip),%ymm11 # 57bc <_sk_callback_avx+0x281>
+ DB 196,98,125,24,29,227,47,0,0 ; vbroadcastss 0x2fe3(%rip),%ymm11 # 57b8 <_sk_callback_avx+0x281>
DB 196,65,36,92,210 ; vsubps %ymm10,%ymm11,%ymm10
- DB 196,98,125,24,29,217,47,0,0 ; vbroadcastss 0x2fd9(%rip),%ymm11 # 57c0 <_sk_callback_avx+0x285>
+ DB 196,98,125,24,29,217,47,0,0 ; vbroadcastss 0x2fd9(%rip),%ymm11 # 57bc <_sk_callback_avx+0x285>
DB 196,65,36,94,210 ; vdivps %ymm10,%ymm11,%ymm10
DB 196,193,116,88,202 ; vaddps %ymm10,%ymm1,%ymm1
- DB 196,98,125,24,21,202,47,0,0 ; vbroadcastss 0x2fca(%rip),%ymm10 # 57c4 <_sk_callback_avx+0x289>
+ DB 196,98,125,24,21,202,47,0,0 ; vbroadcastss 0x2fca(%rip),%ymm10 # 57c0 <_sk_callback_avx+0x289>
DB 196,193,116,89,202 ; vmulps %ymm10,%ymm1,%ymm1
DB 197,253,91,201 ; vcvtps2dq %ymm1,%ymm1
DB 196,98,125,24,80,20 ; vbroadcastss 0x14(%rax),%ymm10
@@ -6816,7 +6813,7 @@ _sk_parametric_g_avx LABEL PROC
DB 196,195,117,74,201,128 ; vblendvps %ymm8,%ymm9,%ymm1,%ymm1
DB 196,65,60,87,192 ; vxorps %ymm8,%ymm8,%ymm8
DB 196,193,116,95,200 ; vmaxps %ymm8,%ymm1,%ymm1
- DB 196,98,125,24,5,161,47,0,0 ; vbroadcastss 0x2fa1(%rip),%ymm8 # 57c8 <_sk_callback_avx+0x28d>
+ DB 196,98,125,24,5,161,47,0,0 ; vbroadcastss 0x2fa1(%rip),%ymm8 # 57c4 <_sk_callback_avx+0x28d>
DB 196,193,116,93,200 ; vminps %ymm8,%ymm1,%ymm1
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
@@ -6836,36 +6833,36 @@ _sk_parametric_b_avx LABEL PROC
DB 196,193,108,88,211 ; vaddps %ymm11,%ymm2,%ymm2
DB 196,98,125,24,16 ; vbroadcastss (%rax),%ymm10
DB 197,124,91,218 ; vcvtdq2ps %ymm2,%ymm11
- DB 196,98,125,24,37,82,47,0,0 ; vbroadcastss 0x2f52(%rip),%ymm12 # 57cc <_sk_callback_avx+0x291>
+ DB 196,98,125,24,37,82,47,0,0 ; vbroadcastss 0x2f52(%rip),%ymm12 # 57c8 <_sk_callback_avx+0x291>
DB 196,65,36,89,220 ; vmulps %ymm12,%ymm11,%ymm11
- DB 196,98,125,24,37,72,47,0,0 ; vbroadcastss 0x2f48(%rip),%ymm12 # 57d0 <_sk_callback_avx+0x295>
+ DB 196,98,125,24,37,72,47,0,0 ; vbroadcastss 0x2f48(%rip),%ymm12 # 57cc <_sk_callback_avx+0x295>
DB 196,193,108,84,212 ; vandps %ymm12,%ymm2,%ymm2
- DB 196,98,125,24,37,62,47,0,0 ; vbroadcastss 0x2f3e(%rip),%ymm12 # 57d4 <_sk_callback_avx+0x299>
+ DB 196,98,125,24,37,62,47,0,0 ; vbroadcastss 0x2f3e(%rip),%ymm12 # 57d0 <_sk_callback_avx+0x299>
DB 196,193,108,86,212 ; vorps %ymm12,%ymm2,%ymm2
- DB 196,98,125,24,37,52,47,0,0 ; vbroadcastss 0x2f34(%rip),%ymm12 # 57d8 <_sk_callback_avx+0x29d>
+ DB 196,98,125,24,37,52,47,0,0 ; vbroadcastss 0x2f34(%rip),%ymm12 # 57d4 <_sk_callback_avx+0x29d>
DB 196,65,36,88,220 ; vaddps %ymm12,%ymm11,%ymm11
- DB 196,98,125,24,37,42,47,0,0 ; vbroadcastss 0x2f2a(%rip),%ymm12 # 57dc <_sk_callback_avx+0x2a1>
+ DB 196,98,125,24,37,42,47,0,0 ; vbroadcastss 0x2f2a(%rip),%ymm12 # 57d8 <_sk_callback_avx+0x2a1>
DB 196,65,108,89,228 ; vmulps %ymm12,%ymm2,%ymm12
DB 196,65,36,92,220 ; vsubps %ymm12,%ymm11,%ymm11
- DB 196,98,125,24,37,27,47,0,0 ; vbroadcastss 0x2f1b(%rip),%ymm12 # 57e0 <_sk_callback_avx+0x2a5>
+ DB 196,98,125,24,37,27,47,0,0 ; vbroadcastss 0x2f1b(%rip),%ymm12 # 57dc <_sk_callback_avx+0x2a5>
DB 196,193,108,88,212 ; vaddps %ymm12,%ymm2,%ymm2
- DB 196,98,125,24,37,17,47,0,0 ; vbroadcastss 0x2f11(%rip),%ymm12 # 57e4 <_sk_callback_avx+0x2a9>
+ DB 196,98,125,24,37,17,47,0,0 ; vbroadcastss 0x2f11(%rip),%ymm12 # 57e0 <_sk_callback_avx+0x2a9>
DB 197,156,94,210 ; vdivps %ymm2,%ymm12,%ymm2
DB 197,164,92,210 ; vsubps %ymm2,%ymm11,%ymm2
DB 197,172,89,210 ; vmulps %ymm2,%ymm10,%ymm2
DB 196,99,125,8,210,1 ; vroundps $0x1,%ymm2,%ymm10
DB 196,65,108,92,210 ; vsubps %ymm10,%ymm2,%ymm10
- DB 196,98,125,24,29,245,46,0,0 ; vbroadcastss 0x2ef5(%rip),%ymm11 # 57e8 <_sk_callback_avx+0x2ad>
+ DB 196,98,125,24,29,245,46,0,0 ; vbroadcastss 0x2ef5(%rip),%ymm11 # 57e4 <_sk_callback_avx+0x2ad>
DB 196,193,108,88,211 ; vaddps %ymm11,%ymm2,%ymm2
- DB 196,98,125,24,29,235,46,0,0 ; vbroadcastss 0x2eeb(%rip),%ymm11 # 57ec <_sk_callback_avx+0x2b1>
+ DB 196,98,125,24,29,235,46,0,0 ; vbroadcastss 0x2eeb(%rip),%ymm11 # 57e8 <_sk_callback_avx+0x2b1>
DB 196,65,44,89,219 ; vmulps %ymm11,%ymm10,%ymm11
DB 196,193,108,92,211 ; vsubps %ymm11,%ymm2,%ymm2
- DB 196,98,125,24,29,220,46,0,0 ; vbroadcastss 0x2edc(%rip),%ymm11 # 57f0 <_sk_callback_avx+0x2b5>
+ DB 196,98,125,24,29,220,46,0,0 ; vbroadcastss 0x2edc(%rip),%ymm11 # 57ec <_sk_callback_avx+0x2b5>
DB 196,65,36,92,210 ; vsubps %ymm10,%ymm11,%ymm10
- DB 196,98,125,24,29,210,46,0,0 ; vbroadcastss 0x2ed2(%rip),%ymm11 # 57f4 <_sk_callback_avx+0x2b9>
+ DB 196,98,125,24,29,210,46,0,0 ; vbroadcastss 0x2ed2(%rip),%ymm11 # 57f0 <_sk_callback_avx+0x2b9>
DB 196,65,36,94,210 ; vdivps %ymm10,%ymm11,%ymm10
DB 196,193,108,88,210 ; vaddps %ymm10,%ymm2,%ymm2
- DB 196,98,125,24,21,195,46,0,0 ; vbroadcastss 0x2ec3(%rip),%ymm10 # 57f8 <_sk_callback_avx+0x2bd>
+ DB 196,98,125,24,21,195,46,0,0 ; vbroadcastss 0x2ec3(%rip),%ymm10 # 57f4 <_sk_callback_avx+0x2bd>
DB 196,193,108,89,210 ; vmulps %ymm10,%ymm2,%ymm2
DB 197,253,91,210 ; vcvtps2dq %ymm2,%ymm2
DB 196,98,125,24,80,20 ; vbroadcastss 0x14(%rax),%ymm10
@@ -6873,7 +6870,7 @@ _sk_parametric_b_avx LABEL PROC
DB 196,195,109,74,209,128 ; vblendvps %ymm8,%ymm9,%ymm2,%ymm2
DB 196,65,60,87,192 ; vxorps %ymm8,%ymm8,%ymm8
DB 196,193,108,95,208 ; vmaxps %ymm8,%ymm2,%ymm2
- DB 196,98,125,24,5,154,46,0,0 ; vbroadcastss 0x2e9a(%rip),%ymm8 # 57fc <_sk_callback_avx+0x2c1>
+ DB 196,98,125,24,5,154,46,0,0 ; vbroadcastss 0x2e9a(%rip),%ymm8 # 57f8 <_sk_callback_avx+0x2c1>
DB 196,193,108,93,208 ; vminps %ymm8,%ymm2,%ymm2
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
@@ -6893,36 +6890,36 @@ _sk_parametric_a_avx LABEL PROC
DB 196,193,100,88,219 ; vaddps %ymm11,%ymm3,%ymm3
DB 196,98,125,24,16 ; vbroadcastss (%rax),%ymm10
DB 197,124,91,219 ; vcvtdq2ps %ymm3,%ymm11
- DB 196,98,125,24,37,75,46,0,0 ; vbroadcastss 0x2e4b(%rip),%ymm12 # 5800 <_sk_callback_avx+0x2c5>
+ DB 196,98,125,24,37,75,46,0,0 ; vbroadcastss 0x2e4b(%rip),%ymm12 # 57fc <_sk_callback_avx+0x2c5>
DB 196,65,36,89,220 ; vmulps %ymm12,%ymm11,%ymm11
- DB 196,98,125,24,37,65,46,0,0 ; vbroadcastss 0x2e41(%rip),%ymm12 # 5804 <_sk_callback_avx+0x2c9>
+ DB 196,98,125,24,37,65,46,0,0 ; vbroadcastss 0x2e41(%rip),%ymm12 # 5800 <_sk_callback_avx+0x2c9>
DB 196,193,100,84,220 ; vandps %ymm12,%ymm3,%ymm3
- DB 196,98,125,24,37,55,46,0,0 ; vbroadcastss 0x2e37(%rip),%ymm12 # 5808 <_sk_callback_avx+0x2cd>
+ DB 196,98,125,24,37,55,46,0,0 ; vbroadcastss 0x2e37(%rip),%ymm12 # 5804 <_sk_callback_avx+0x2cd>
DB 196,193,100,86,220 ; vorps %ymm12,%ymm3,%ymm3
- DB 196,98,125,24,37,45,46,0,0 ; vbroadcastss 0x2e2d(%rip),%ymm12 # 580c <_sk_callback_avx+0x2d1>
+ DB 196,98,125,24,37,45,46,0,0 ; vbroadcastss 0x2e2d(%rip),%ymm12 # 5808 <_sk_callback_avx+0x2d1>
DB 196,65,36,88,220 ; vaddps %ymm12,%ymm11,%ymm11
- DB 196,98,125,24,37,35,46,0,0 ; vbroadcastss 0x2e23(%rip),%ymm12 # 5810 <_sk_callback_avx+0x2d5>
+ DB 196,98,125,24,37,35,46,0,0 ; vbroadcastss 0x2e23(%rip),%ymm12 # 580c <_sk_callback_avx+0x2d5>
DB 196,65,100,89,228 ; vmulps %ymm12,%ymm3,%ymm12
DB 196,65,36,92,220 ; vsubps %ymm12,%ymm11,%ymm11
- DB 196,98,125,24,37,20,46,0,0 ; vbroadcastss 0x2e14(%rip),%ymm12 # 5814 <_sk_callback_avx+0x2d9>
+ DB 196,98,125,24,37,20,46,0,0 ; vbroadcastss 0x2e14(%rip),%ymm12 # 5810 <_sk_callback_avx+0x2d9>
DB 196,193,100,88,220 ; vaddps %ymm12,%ymm3,%ymm3
- DB 196,98,125,24,37,10,46,0,0 ; vbroadcastss 0x2e0a(%rip),%ymm12 # 5818 <_sk_callback_avx+0x2dd>
+ DB 196,98,125,24,37,10,46,0,0 ; vbroadcastss 0x2e0a(%rip),%ymm12 # 5814 <_sk_callback_avx+0x2dd>
DB 197,156,94,219 ; vdivps %ymm3,%ymm12,%ymm3
DB 197,164,92,219 ; vsubps %ymm3,%ymm11,%ymm3
DB 197,172,89,219 ; vmulps %ymm3,%ymm10,%ymm3
DB 196,99,125,8,211,1 ; vroundps $0x1,%ymm3,%ymm10
DB 196,65,100,92,210 ; vsubps %ymm10,%ymm3,%ymm10
- DB 196,98,125,24,29,238,45,0,0 ; vbroadcastss 0x2dee(%rip),%ymm11 # 581c <_sk_callback_avx+0x2e1>
+ DB 196,98,125,24,29,238,45,0,0 ; vbroadcastss 0x2dee(%rip),%ymm11 # 5818 <_sk_callback_avx+0x2e1>
DB 196,193,100,88,219 ; vaddps %ymm11,%ymm3,%ymm3
- DB 196,98,125,24,29,228,45,0,0 ; vbroadcastss 0x2de4(%rip),%ymm11 # 5820 <_sk_callback_avx+0x2e5>
+ DB 196,98,125,24,29,228,45,0,0 ; vbroadcastss 0x2de4(%rip),%ymm11 # 581c <_sk_callback_avx+0x2e5>
DB 196,65,44,89,219 ; vmulps %ymm11,%ymm10,%ymm11
DB 196,193,100,92,219 ; vsubps %ymm11,%ymm3,%ymm3
- DB 196,98,125,24,29,213,45,0,0 ; vbroadcastss 0x2dd5(%rip),%ymm11 # 5824 <_sk_callback_avx+0x2e9>
+ DB 196,98,125,24,29,213,45,0,0 ; vbroadcastss 0x2dd5(%rip),%ymm11 # 5820 <_sk_callback_avx+0x2e9>
DB 196,65,36,92,210 ; vsubps %ymm10,%ymm11,%ymm10
- DB 196,98,125,24,29,203,45,0,0 ; vbroadcastss 0x2dcb(%rip),%ymm11 # 5828 <_sk_callback_avx+0x2ed>
+ DB 196,98,125,24,29,203,45,0,0 ; vbroadcastss 0x2dcb(%rip),%ymm11 # 5824 <_sk_callback_avx+0x2ed>
DB 196,65,36,94,210 ; vdivps %ymm10,%ymm11,%ymm10
DB 196,193,100,88,218 ; vaddps %ymm10,%ymm3,%ymm3
- DB 196,98,125,24,21,188,45,0,0 ; vbroadcastss 0x2dbc(%rip),%ymm10 # 582c <_sk_callback_avx+0x2f1>
+ DB 196,98,125,24,21,188,45,0,0 ; vbroadcastss 0x2dbc(%rip),%ymm10 # 5828 <_sk_callback_avx+0x2f1>
DB 196,193,100,89,218 ; vmulps %ymm10,%ymm3,%ymm3
DB 197,253,91,219 ; vcvtps2dq %ymm3,%ymm3
DB 196,98,125,24,80,20 ; vbroadcastss 0x14(%rax),%ymm10
@@ -6930,38 +6927,38 @@ _sk_parametric_a_avx LABEL PROC
DB 196,195,101,74,217,128 ; vblendvps %ymm8,%ymm9,%ymm3,%ymm3
DB 196,65,60,87,192 ; vxorps %ymm8,%ymm8,%ymm8
DB 196,193,100,95,216 ; vmaxps %ymm8,%ymm3,%ymm3
- DB 196,98,125,24,5,147,45,0,0 ; vbroadcastss 0x2d93(%rip),%ymm8 # 5830 <_sk_callback_avx+0x2f5>
+ DB 196,98,125,24,5,147,45,0,0 ; vbroadcastss 0x2d93(%rip),%ymm8 # 582c <_sk_callback_avx+0x2f5>
DB 196,193,100,93,216 ; vminps %ymm8,%ymm3,%ymm3
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
PUBLIC _sk_lab_to_xyz_avx
_sk_lab_to_xyz_avx LABEL PROC
- DB 196,98,125,24,5,133,45,0,0 ; vbroadcastss 0x2d85(%rip),%ymm8 # 5834 <_sk_callback_avx+0x2f9>
+ DB 196,98,125,24,5,133,45,0,0 ; vbroadcastss 0x2d85(%rip),%ymm8 # 5830 <_sk_callback_avx+0x2f9>
DB 196,193,124,89,192 ; vmulps %ymm8,%ymm0,%ymm0
- DB 196,98,125,24,5,123,45,0,0 ; vbroadcastss 0x2d7b(%rip),%ymm8 # 5838 <_sk_callback_avx+0x2fd>
+ DB 196,98,125,24,5,123,45,0,0 ; vbroadcastss 0x2d7b(%rip),%ymm8 # 5834 <_sk_callback_avx+0x2fd>
DB 196,193,116,89,200 ; vmulps %ymm8,%ymm1,%ymm1
- DB 196,98,125,24,13,113,45,0,0 ; vbroadcastss 0x2d71(%rip),%ymm9 # 583c <_sk_callback_avx+0x301>
+ DB 196,98,125,24,13,113,45,0,0 ; vbroadcastss 0x2d71(%rip),%ymm9 # 5838 <_sk_callback_avx+0x301>
DB 196,193,116,88,201 ; vaddps %ymm9,%ymm1,%ymm1
DB 196,193,108,89,208 ; vmulps %ymm8,%ymm2,%ymm2
DB 196,193,108,88,209 ; vaddps %ymm9,%ymm2,%ymm2
- DB 196,98,125,24,5,93,45,0,0 ; vbroadcastss 0x2d5d(%rip),%ymm8 # 5840 <_sk_callback_avx+0x305>
+ DB 196,98,125,24,5,93,45,0,0 ; vbroadcastss 0x2d5d(%rip),%ymm8 # 583c <_sk_callback_avx+0x305>
DB 196,193,124,88,192 ; vaddps %ymm8,%ymm0,%ymm0
- DB 196,98,125,24,5,83,45,0,0 ; vbroadcastss 0x2d53(%rip),%ymm8 # 5844 <_sk_callback_avx+0x309>
+ DB 196,98,125,24,5,83,45,0,0 ; vbroadcastss 0x2d53(%rip),%ymm8 # 5840 <_sk_callback_avx+0x309>
DB 196,193,124,89,192 ; vmulps %ymm8,%ymm0,%ymm0
- DB 196,98,125,24,5,73,45,0,0 ; vbroadcastss 0x2d49(%rip),%ymm8 # 5848 <_sk_callback_avx+0x30d>
+ DB 196,98,125,24,5,73,45,0,0 ; vbroadcastss 0x2d49(%rip),%ymm8 # 5844 <_sk_callback_avx+0x30d>
DB 196,193,116,89,200 ; vmulps %ymm8,%ymm1,%ymm1
DB 197,252,88,201 ; vaddps %ymm1,%ymm0,%ymm1
- DB 196,98,125,24,5,59,45,0,0 ; vbroadcastss 0x2d3b(%rip),%ymm8 # 584c <_sk_callback_avx+0x311>
+ DB 196,98,125,24,5,59,45,0,0 ; vbroadcastss 0x2d3b(%rip),%ymm8 # 5848 <_sk_callback_avx+0x311>
DB 196,193,108,89,208 ; vmulps %ymm8,%ymm2,%ymm2
DB 197,252,92,210 ; vsubps %ymm2,%ymm0,%ymm2
DB 197,116,89,193 ; vmulps %ymm1,%ymm1,%ymm8
DB 196,65,116,89,192 ; vmulps %ymm8,%ymm1,%ymm8
- DB 196,98,125,24,13,36,45,0,0 ; vbroadcastss 0x2d24(%rip),%ymm9 # 5850 <_sk_callback_avx+0x315>
+ DB 196,98,125,24,13,36,45,0,0 ; vbroadcastss 0x2d24(%rip),%ymm9 # 584c <_sk_callback_avx+0x315>
DB 196,65,52,194,208,1 ; vcmpltps %ymm8,%ymm9,%ymm10
- DB 196,98,125,24,29,25,45,0,0 ; vbroadcastss 0x2d19(%rip),%ymm11 # 5854 <_sk_callback_avx+0x319>
+ DB 196,98,125,24,29,25,45,0,0 ; vbroadcastss 0x2d19(%rip),%ymm11 # 5850 <_sk_callback_avx+0x319>
DB 196,193,116,88,203 ; vaddps %ymm11,%ymm1,%ymm1
- DB 196,98,125,24,37,15,45,0,0 ; vbroadcastss 0x2d0f(%rip),%ymm12 # 5858 <_sk_callback_avx+0x31d>
+ DB 196,98,125,24,37,15,45,0,0 ; vbroadcastss 0x2d0f(%rip),%ymm12 # 5854 <_sk_callback_avx+0x31d>
DB 196,193,116,89,204 ; vmulps %ymm12,%ymm1,%ymm1
DB 196,67,117,74,192,160 ; vblendvps %ymm10,%ymm8,%ymm1,%ymm8
DB 197,252,89,200 ; vmulps %ymm0,%ymm0,%ymm1
@@ -6976,9 +6973,9 @@ _sk_lab_to_xyz_avx LABEL PROC
DB 196,193,108,88,211 ; vaddps %ymm11,%ymm2,%ymm2
DB 196,193,108,89,212 ; vmulps %ymm12,%ymm2,%ymm2
DB 196,227,109,74,208,144 ; vblendvps %ymm9,%ymm0,%ymm2,%ymm2
- DB 196,226,125,24,5,197,44,0,0 ; vbroadcastss 0x2cc5(%rip),%ymm0 # 585c <_sk_callback_avx+0x321>
+ DB 196,226,125,24,5,197,44,0,0 ; vbroadcastss 0x2cc5(%rip),%ymm0 # 5858 <_sk_callback_avx+0x321>
DB 197,188,89,192 ; vmulps %ymm0,%ymm8,%ymm0
- DB 196,98,125,24,5,188,44,0,0 ; vbroadcastss 0x2cbc(%rip),%ymm8 # 5860 <_sk_callback_avx+0x325>
+ DB 196,98,125,24,5,188,44,0,0 ; vbroadcastss 0x2cbc(%rip),%ymm8 # 585c <_sk_callback_avx+0x325>
DB 196,193,108,89,208 ; vmulps %ymm8,%ymm2,%ymm2
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
@@ -6990,14 +6987,14 @@ _sk_load_a8_avx LABEL PROC
DB 72,139,0 ; mov (%rax),%rax
DB 72,1,248 ; add %rdi,%rax
DB 77,133,192 ; test %r8,%r8
- DB 117,62 ; jne 2bfb <_sk_load_a8_avx+0x4e>
+ DB 117,62 ; jne 2bf7 <_sk_load_a8_avx+0x4e>
DB 197,250,126,0 ; vmovq (%rax),%xmm0
DB 196,226,121,49,200 ; vpmovzxbd %xmm0,%xmm1
DB 196,227,121,4,192,229 ; vpermilps $0xe5,%xmm0,%xmm0
DB 196,226,121,49,192 ; vpmovzxbd %xmm0,%xmm0
DB 196,227,117,24,192,1 ; vinsertf128 $0x1,%xmm0,%ymm1,%ymm0
DB 197,252,91,192 ; vcvtdq2ps %ymm0,%ymm0
- DB 196,226,125,24,13,128,44,0,0 ; vbroadcastss 0x2c80(%rip),%ymm1 # 5864 <_sk_callback_avx+0x329>
+ DB 196,226,125,24,13,128,44,0,0 ; vbroadcastss 0x2c80(%rip),%ymm1 # 5860 <_sk_callback_avx+0x329>
DB 197,252,89,217 ; vmulps %ymm1,%ymm0,%ymm3
DB 72,173 ; lods %ds:(%rsi),%rax
DB 197,252,87,192 ; vxorps %ymm0,%ymm0,%ymm0
@@ -7014,9 +7011,9 @@ _sk_load_a8_avx LABEL PROC
DB 77,9,217 ; or %r11,%r9
DB 72,131,193,8 ; add $0x8,%rcx
DB 73,255,202 ; dec %r10
- DB 117,234 ; jne 2c03 <_sk_load_a8_avx+0x56>
+ DB 117,234 ; jne 2bff <_sk_load_a8_avx+0x56>
DB 196,193,249,110,193 ; vmovq %r9,%xmm0
- DB 235,161 ; jmp 2bc1 <_sk_load_a8_avx+0x14>
+ DB 235,161 ; jmp 2bbd <_sk_load_a8_avx+0x14>
PUBLIC _sk_gather_a8_avx
_sk_gather_a8_avx LABEL PROC
@@ -7064,7 +7061,7 @@ _sk_gather_a8_avx LABEL PROC
DB 196,226,121,49,201 ; vpmovzxbd %xmm1,%xmm1
DB 196,227,125,24,193,1 ; vinsertf128 $0x1,%xmm1,%ymm0,%ymm0
DB 197,252,91,192 ; vcvtdq2ps %ymm0,%ymm0
- DB 196,226,125,24,13,117,43,0,0 ; vbroadcastss 0x2b75(%rip),%ymm1 # 5868 <_sk_callback_avx+0x32d>
+ DB 196,226,125,24,13,117,43,0,0 ; vbroadcastss 0x2b75(%rip),%ymm1 # 5864 <_sk_callback_avx+0x32d>
DB 197,252,89,217 ; vmulps %ymm1,%ymm0,%ymm3
DB 72,173 ; lods %ds:(%rsi),%rax
DB 197,252,87,192 ; vxorps %ymm0,%ymm0,%ymm0
@@ -7080,14 +7077,14 @@ PUBLIC _sk_store_a8_avx
_sk_store_a8_avx LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 76,139,16 ; mov (%rax),%r10
- DB 196,98,125,24,5,80,43,0,0 ; vbroadcastss 0x2b50(%rip),%ymm8 # 586c <_sk_callback_avx+0x331>
+ DB 196,98,125,24,5,80,43,0,0 ; vbroadcastss 0x2b50(%rip),%ymm8 # 5868 <_sk_callback_avx+0x331>
DB 196,65,100,89,192 ; vmulps %ymm8,%ymm3,%ymm8
DB 196,65,125,91,192 ; vcvtps2dq %ymm8,%ymm8
DB 196,67,125,25,193,1 ; vextractf128 $0x1,%ymm8,%xmm9
DB 196,66,57,43,193 ; vpackusdw %xmm9,%xmm8,%xmm8
DB 196,65,57,103,192 ; vpackuswb %xmm8,%xmm8,%xmm8
DB 72,133,201 ; test %rcx,%rcx
- DB 117,10 ; jne 2d45 <_sk_store_a8_avx+0x37>
+ DB 117,10 ; jne 2d41 <_sk_store_a8_avx+0x37>
DB 196,65,123,17,4,58 ; vmovsd %xmm8,(%r10,%rdi,1)
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
@@ -7095,10 +7092,10 @@ _sk_store_a8_avx LABEL PROC
DB 65,128,224,7 ; and $0x7,%r8b
DB 65,254,200 ; dec %r8b
DB 65,128,248,6 ; cmp $0x6,%r8b
- DB 119,236 ; ja 2d41 <_sk_store_a8_avx+0x33>
+ DB 119,236 ; ja 2d3d <_sk_store_a8_avx+0x33>
DB 196,66,121,48,192 ; vpmovzxbw %xmm8,%xmm8
DB 69,15,182,192 ; movzbl %r8b,%r8d
- DB 76,141,13,67,0,0,0 ; lea 0x43(%rip),%r9 # 2da8 <_sk_store_a8_avx+0x9a>
+ DB 76,141,13,67,0,0,0 ; lea 0x43(%rip),%r9 # 2da4 <_sk_store_a8_avx+0x9a>
DB 75,99,4,129 ; movslq (%r9,%r8,4),%rax
DB 76,1,200 ; add %r9,%rax
DB 255,224 ; jmpq *%rax
@@ -7109,7 +7106,7 @@ _sk_store_a8_avx LABEL PROC
DB 196,67,121,20,68,58,2,4 ; vpextrb $0x4,%xmm8,0x2(%r10,%rdi,1)
DB 196,67,121,20,68,58,1,2 ; vpextrb $0x2,%xmm8,0x1(%r10,%rdi,1)
DB 196,67,121,20,4,58,0 ; vpextrb $0x0,%xmm8,(%r10,%rdi,1)
- DB 235,154 ; jmp 2d41 <_sk_store_a8_avx+0x33>
+ DB 235,154 ; jmp 2d3d <_sk_store_a8_avx+0x33>
DB 144 ; nop
DB 246,255 ; idiv %bh
DB 255 ; (bad)
@@ -7141,17 +7138,17 @@ _sk_load_g8_avx LABEL PROC
DB 72,139,0 ; mov (%rax),%rax
DB 72,1,248 ; add %rdi,%rax
DB 77,133,192 ; test %r8,%r8
- DB 117,67 ; jne 2e17 <_sk_load_g8_avx+0x53>
+ DB 117,67 ; jne 2e13 <_sk_load_g8_avx+0x53>
DB 197,250,126,0 ; vmovq (%rax),%xmm0
DB 196,226,121,49,200 ; vpmovzxbd %xmm0,%xmm1
DB 196,227,121,4,192,229 ; vpermilps $0xe5,%xmm0,%xmm0
DB 196,226,121,49,192 ; vpmovzxbd %xmm0,%xmm0
DB 196,227,117,24,192,1 ; vinsertf128 $0x1,%xmm0,%ymm1,%ymm0
DB 197,252,91,192 ; vcvtdq2ps %ymm0,%ymm0
- DB 196,226,125,24,13,117,42,0,0 ; vbroadcastss 0x2a75(%rip),%ymm1 # 5870 <_sk_callback_avx+0x335>
+ DB 196,226,125,24,13,117,42,0,0 ; vbroadcastss 0x2a75(%rip),%ymm1 # 586c <_sk_callback_avx+0x335>
DB 197,252,89,193 ; vmulps %ymm1,%ymm0,%ymm0
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,29,106,42,0,0 ; vbroadcastss 0x2a6a(%rip),%ymm3 # 5874 <_sk_callback_avx+0x339>
+ DB 196,226,125,24,29,106,42,0,0 ; vbroadcastss 0x2a6a(%rip),%ymm3 # 5870 <_sk_callback_avx+0x339>
DB 76,137,193 ; mov %r8,%rcx
DB 197,252,40,200 ; vmovaps %ymm0,%ymm1
DB 197,252,40,208 ; vmovaps %ymm0,%ymm2
@@ -7165,9 +7162,9 @@ _sk_load_g8_avx LABEL PROC
DB 77,9,217 ; or %r11,%r9
DB 72,131,193,8 ; add $0x8,%rcx
DB 73,255,202 ; dec %r10
- DB 117,234 ; jne 2e1f <_sk_load_g8_avx+0x5b>
+ DB 117,234 ; jne 2e1b <_sk_load_g8_avx+0x5b>
DB 196,193,249,110,193 ; vmovq %r9,%xmm0
- DB 235,156 ; jmp 2dd8 <_sk_load_g8_avx+0x14>
+ DB 235,156 ; jmp 2dd4 <_sk_load_g8_avx+0x14>
PUBLIC _sk_gather_g8_avx
_sk_gather_g8_avx LABEL PROC
@@ -7215,10 +7212,10 @@ _sk_gather_g8_avx LABEL PROC
DB 196,226,121,49,201 ; vpmovzxbd %xmm1,%xmm1
DB 196,227,125,24,193,1 ; vinsertf128 $0x1,%xmm1,%ymm0,%ymm0
DB 197,252,91,192 ; vcvtdq2ps %ymm0,%ymm0
- DB 196,226,125,24,13,105,41,0,0 ; vbroadcastss 0x2969(%rip),%ymm1 # 5878 <_sk_callback_avx+0x33d>
+ DB 196,226,125,24,13,105,41,0,0 ; vbroadcastss 0x2969(%rip),%ymm1 # 5874 <_sk_callback_avx+0x33d>
DB 197,252,89,193 ; vmulps %ymm1,%ymm0,%ymm0
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,29,94,41,0,0 ; vbroadcastss 0x295e(%rip),%ymm3 # 587c <_sk_callback_avx+0x341>
+ DB 196,226,125,24,29,94,41,0,0 ; vbroadcastss 0x295e(%rip),%ymm3 # 5878 <_sk_callback_avx+0x341>
DB 197,252,40,200 ; vmovaps %ymm0,%ymm1
DB 197,252,40,208 ; vmovaps %ymm0,%ymm2
DB 91 ; pop %rbx
@@ -7232,9 +7229,9 @@ _sk_gather_i8_avx LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 73,137,192 ; mov %rax,%r8
DB 77,133,192 ; test %r8,%r8
- DB 116,5 ; je 2f3e <_sk_gather_i8_avx+0xf>
+ DB 116,5 ; je 2f3a <_sk_gather_i8_avx+0xf>
DB 76,137,192 ; mov %r8,%rax
- DB 235,2 ; jmp 2f40 <_sk_gather_i8_avx+0x11>
+ DB 235,2 ; jmp 2f3c <_sk_gather_i8_avx+0x11>
DB 72,173 ; lods %ds:(%rsi),%rax
DB 65,87 ; push %r15
DB 65,86 ; push %r14
@@ -7296,10 +7293,10 @@ _sk_gather_i8_avx LABEL PROC
DB 196,163,121,34,4,163,2 ; vpinsrd $0x2,(%rbx,%r12,4),%xmm0,%xmm0
DB 196,163,121,34,28,19,3 ; vpinsrd $0x3,(%rbx,%r10,1),%xmm0,%xmm3
DB 196,227,61,24,195,1 ; vinsertf128 $0x1,%xmm3,%ymm8,%ymm0
- DB 197,124,40,21,214,41,0,0 ; vmovaps 0x29d6(%rip),%ymm10 # 5a40 <_sk_callback_avx+0x505>
+ DB 197,124,40,21,218,41,0,0 ; vmovaps 0x29da(%rip),%ymm10 # 5a40 <_sk_callback_avx+0x509>
DB 196,193,124,84,194 ; vandps %ymm10,%ymm0,%ymm0
DB 197,252,91,192 ; vcvtdq2ps %ymm0,%ymm0
- DB 196,98,125,24,13,4,40,0,0 ; vbroadcastss 0x2804(%rip),%ymm9 # 5880 <_sk_callback_avx+0x345>
+ DB 196,98,125,24,13,4,40,0,0 ; vbroadcastss 0x2804(%rip),%ymm9 # 587c <_sk_callback_avx+0x345>
DB 196,193,124,89,193 ; vmulps %ymm9,%ymm0,%ymm0
DB 196,193,113,114,208,8 ; vpsrld $0x8,%xmm8,%xmm1
DB 197,233,114,211,8 ; vpsrld $0x8,%xmm3,%xmm2
@@ -7331,38 +7328,38 @@ _sk_load_565_avx LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 76,139,16 ; mov (%rax),%r10
DB 72,133,201 ; test %rcx,%rcx
- DB 15,133,128,0,0,0 ; jne 3174 <_sk_load_565_avx+0x8e>
+ DB 15,133,128,0,0,0 ; jne 3170 <_sk_load_565_avx+0x8e>
DB 196,193,122,111,4,122 ; vmovdqu (%r10,%rdi,2),%xmm0
DB 197,241,239,201 ; vpxor %xmm1,%xmm1,%xmm1
DB 197,249,105,201 ; vpunpckhwd %xmm1,%xmm0,%xmm1
DB 196,226,121,51,192 ; vpmovzxwd %xmm0,%xmm0
DB 196,227,125,24,209,1 ; vinsertf128 $0x1,%xmm1,%ymm0,%ymm2
- DB 196,226,125,24,5,110,39,0,0 ; vbroadcastss 0x276e(%rip),%ymm0 # 5884 <_sk_callback_avx+0x349>
+ DB 196,226,125,24,5,110,39,0,0 ; vbroadcastss 0x276e(%rip),%ymm0 # 5880 <_sk_callback_avx+0x349>
DB 197,236,84,192 ; vandps %ymm0,%ymm2,%ymm0
DB 197,252,91,192 ; vcvtdq2ps %ymm0,%ymm0
- DB 196,226,125,24,13,97,39,0,0 ; vbroadcastss 0x2761(%rip),%ymm1 # 5888 <_sk_callback_avx+0x34d>
+ DB 196,226,125,24,13,97,39,0,0 ; vbroadcastss 0x2761(%rip),%ymm1 # 5884 <_sk_callback_avx+0x34d>
DB 197,252,89,193 ; vmulps %ymm1,%ymm0,%ymm0
- DB 196,226,125,24,13,88,39,0,0 ; vbroadcastss 0x2758(%rip),%ymm1 # 588c <_sk_callback_avx+0x351>
+ DB 196,226,125,24,13,88,39,0,0 ; vbroadcastss 0x2758(%rip),%ymm1 # 5888 <_sk_callback_avx+0x351>
DB 197,236,84,201 ; vandps %ymm1,%ymm2,%ymm1
DB 197,252,91,201 ; vcvtdq2ps %ymm1,%ymm1
- DB 196,226,125,24,29,75,39,0,0 ; vbroadcastss 0x274b(%rip),%ymm3 # 5890 <_sk_callback_avx+0x355>
+ DB 196,226,125,24,29,75,39,0,0 ; vbroadcastss 0x274b(%rip),%ymm3 # 588c <_sk_callback_avx+0x355>
DB 197,244,89,203 ; vmulps %ymm3,%ymm1,%ymm1
- DB 196,226,125,24,29,66,39,0,0 ; vbroadcastss 0x2742(%rip),%ymm3 # 5894 <_sk_callback_avx+0x359>
+ DB 196,226,125,24,29,66,39,0,0 ; vbroadcastss 0x2742(%rip),%ymm3 # 5890 <_sk_callback_avx+0x359>
DB 197,236,84,211 ; vandps %ymm3,%ymm2,%ymm2
DB 197,252,91,210 ; vcvtdq2ps %ymm2,%ymm2
- DB 196,226,125,24,29,53,39,0,0 ; vbroadcastss 0x2735(%rip),%ymm3 # 5898 <_sk_callback_avx+0x35d>
+ DB 196,226,125,24,29,53,39,0,0 ; vbroadcastss 0x2735(%rip),%ymm3 # 5894 <_sk_callback_avx+0x35d>
DB 197,236,89,211 ; vmulps %ymm3,%ymm2,%ymm2
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,29,42,39,0,0 ; vbroadcastss 0x272a(%rip),%ymm3 # 589c <_sk_callback_avx+0x361>
+ DB 196,226,125,24,29,42,39,0,0 ; vbroadcastss 0x272a(%rip),%ymm3 # 5898 <_sk_callback_avx+0x361>
DB 255,224 ; jmpq *%rax
DB 65,137,200 ; mov %ecx,%r8d
DB 65,128,224,7 ; and $0x7,%r8b
DB 197,249,239,192 ; vpxor %xmm0,%xmm0,%xmm0
DB 65,254,200 ; dec %r8b
DB 65,128,248,6 ; cmp $0x6,%r8b
- DB 15,135,110,255,255,255 ; ja 30fa <_sk_load_565_avx+0x14>
+ DB 15,135,110,255,255,255 ; ja 30f6 <_sk_load_565_avx+0x14>
DB 69,15,182,192 ; movzbl %r8b,%r8d
- DB 76,141,13,73,0,0,0 ; lea 0x49(%rip),%r9 # 31e0 <_sk_load_565_avx+0xfa>
+ DB 76,141,13,73,0,0,0 ; lea 0x49(%rip),%r9 # 31dc <_sk_load_565_avx+0xfa>
DB 75,99,4,129 ; movslq (%r9,%r8,4),%rax
DB 76,1,200 ; add %r9,%rax
DB 255,224 ; jmpq *%rax
@@ -7374,7 +7371,7 @@ _sk_load_565_avx LABEL PROC
DB 196,193,121,196,68,122,4,2 ; vpinsrw $0x2,0x4(%r10,%rdi,2),%xmm0,%xmm0
DB 196,193,121,196,68,122,2,1 ; vpinsrw $0x1,0x2(%r10,%rdi,2),%xmm0,%xmm0
DB 196,193,121,196,4,122,0 ; vpinsrw $0x0,(%r10,%rdi,2),%xmm0,%xmm0
- DB 233,26,255,255,255 ; jmpq 30fa <_sk_load_565_avx+0x14>
+ DB 233,26,255,255,255 ; jmpq 30f6 <_sk_load_565_avx+0x14>
DB 244 ; hlt
DB 255 ; (bad)
DB 255 ; (bad)
@@ -7450,23 +7447,23 @@ _sk_gather_565_avx LABEL PROC
DB 197,249,105,201 ; vpunpckhwd %xmm1,%xmm0,%xmm1
DB 196,226,121,51,192 ; vpmovzxwd %xmm0,%xmm0
DB 196,227,125,24,209,1 ; vinsertf128 $0x1,%xmm1,%ymm0,%ymm2
- DB 196,226,125,24,5,202,37,0,0 ; vbroadcastss 0x25ca(%rip),%ymm0 # 58a0 <_sk_callback_avx+0x365>
+ DB 196,226,125,24,5,202,37,0,0 ; vbroadcastss 0x25ca(%rip),%ymm0 # 589c <_sk_callback_avx+0x365>
DB 197,236,84,192 ; vandps %ymm0,%ymm2,%ymm0
DB 197,252,91,192 ; vcvtdq2ps %ymm0,%ymm0
- DB 196,226,125,24,13,189,37,0,0 ; vbroadcastss 0x25bd(%rip),%ymm1 # 58a4 <_sk_callback_avx+0x369>
+ DB 196,226,125,24,13,189,37,0,0 ; vbroadcastss 0x25bd(%rip),%ymm1 # 58a0 <_sk_callback_avx+0x369>
DB 197,252,89,193 ; vmulps %ymm1,%ymm0,%ymm0
- DB 196,226,125,24,13,180,37,0,0 ; vbroadcastss 0x25b4(%rip),%ymm1 # 58a8 <_sk_callback_avx+0x36d>
+ DB 196,226,125,24,13,180,37,0,0 ; vbroadcastss 0x25b4(%rip),%ymm1 # 58a4 <_sk_callback_avx+0x36d>
DB 197,236,84,201 ; vandps %ymm1,%ymm2,%ymm1
DB 197,252,91,201 ; vcvtdq2ps %ymm1,%ymm1
- DB 196,226,125,24,29,167,37,0,0 ; vbroadcastss 0x25a7(%rip),%ymm3 # 58ac <_sk_callback_avx+0x371>
+ DB 196,226,125,24,29,167,37,0,0 ; vbroadcastss 0x25a7(%rip),%ymm3 # 58a8 <_sk_callback_avx+0x371>
DB 197,244,89,203 ; vmulps %ymm3,%ymm1,%ymm1
- DB 196,226,125,24,29,158,37,0,0 ; vbroadcastss 0x259e(%rip),%ymm3 # 58b0 <_sk_callback_avx+0x375>
+ DB 196,226,125,24,29,158,37,0,0 ; vbroadcastss 0x259e(%rip),%ymm3 # 58ac <_sk_callback_avx+0x375>
DB 197,236,84,211 ; vandps %ymm3,%ymm2,%ymm2
DB 197,252,91,210 ; vcvtdq2ps %ymm2,%ymm2
- DB 196,226,125,24,29,145,37,0,0 ; vbroadcastss 0x2591(%rip),%ymm3 # 58b4 <_sk_callback_avx+0x379>
+ DB 196,226,125,24,29,145,37,0,0 ; vbroadcastss 0x2591(%rip),%ymm3 # 58b0 <_sk_callback_avx+0x379>
DB 197,236,89,211 ; vmulps %ymm3,%ymm2,%ymm2
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,29,134,37,0,0 ; vbroadcastss 0x2586(%rip),%ymm3 # 58b8 <_sk_callback_avx+0x37d>
+ DB 196,226,125,24,29,134,37,0,0 ; vbroadcastss 0x2586(%rip),%ymm3 # 58b4 <_sk_callback_avx+0x37d>
DB 91 ; pop %rbx
DB 65,92 ; pop %r12
DB 65,94 ; pop %r14
@@ -7478,14 +7475,14 @@ PUBLIC _sk_store_565_avx
_sk_store_565_avx LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 76,139,16 ; mov (%rax),%r10
- DB 196,98,125,24,5,114,37,0,0 ; vbroadcastss 0x2572(%rip),%ymm8 # 58bc <_sk_callback_avx+0x381>
+ DB 196,98,125,24,5,114,37,0,0 ; vbroadcastss 0x2572(%rip),%ymm8 # 58b8 <_sk_callback_avx+0x381>
DB 196,65,124,89,200 ; vmulps %ymm8,%ymm0,%ymm9
DB 196,65,125,91,201 ; vcvtps2dq %ymm9,%ymm9
DB 196,193,41,114,241,11 ; vpslld $0xb,%xmm9,%xmm10
DB 196,67,125,25,201,1 ; vextractf128 $0x1,%ymm9,%xmm9
DB 196,193,49,114,241,11 ; vpslld $0xb,%xmm9,%xmm9
DB 196,67,45,24,201,1 ; vinsertf128 $0x1,%xmm9,%ymm10,%ymm9
- DB 196,98,125,24,21,75,37,0,0 ; vbroadcastss 0x254b(%rip),%ymm10 # 58c0 <_sk_callback_avx+0x385>
+ DB 196,98,125,24,21,75,37,0,0 ; vbroadcastss 0x254b(%rip),%ymm10 # 58bc <_sk_callback_avx+0x385>
DB 196,65,116,89,210 ; vmulps %ymm10,%ymm1,%ymm10
DB 196,65,125,91,210 ; vcvtps2dq %ymm10,%ymm10
DB 196,193,33,114,242,5 ; vpslld $0x5,%xmm10,%xmm11
@@ -7499,7 +7496,7 @@ _sk_store_565_avx LABEL PROC
DB 196,67,125,25,193,1 ; vextractf128 $0x1,%ymm8,%xmm9
DB 196,66,57,43,193 ; vpackusdw %xmm9,%xmm8,%xmm8
DB 72,133,201 ; test %rcx,%rcx
- DB 117,10 ; jne 33c5 <_sk_store_565_avx+0x89>
+ DB 117,10 ; jne 33c1 <_sk_store_565_avx+0x89>
DB 196,65,122,127,4,122 ; vmovdqu %xmm8,(%r10,%rdi,2)
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
@@ -7507,9 +7504,9 @@ _sk_store_565_avx LABEL PROC
DB 65,128,224,7 ; and $0x7,%r8b
DB 65,254,200 ; dec %r8b
DB 65,128,248,6 ; cmp $0x6,%r8b
- DB 119,236 ; ja 33c1 <_sk_store_565_avx+0x85>
+ DB 119,236 ; ja 33bd <_sk_store_565_avx+0x85>
DB 69,15,182,192 ; movzbl %r8b,%r8d
- DB 76,141,13,68,0,0,0 ; lea 0x44(%rip),%r9 # 3424 <_sk_store_565_avx+0xe8>
+ DB 76,141,13,68,0,0,0 ; lea 0x44(%rip),%r9 # 3420 <_sk_store_565_avx+0xe8>
DB 75,99,4,129 ; movslq (%r9,%r8,4),%rax
DB 76,1,200 ; add %r9,%rax
DB 255,224 ; jmpq *%rax
@@ -7520,7 +7517,7 @@ _sk_store_565_avx LABEL PROC
DB 196,67,121,21,68,122,4,2 ; vpextrw $0x2,%xmm8,0x4(%r10,%rdi,2)
DB 196,67,121,21,68,122,2,1 ; vpextrw $0x1,%xmm8,0x2(%r10,%rdi,2)
DB 196,67,121,21,4,122,0 ; vpextrw $0x0,%xmm8,(%r10,%rdi,2)
- DB 235,159 ; jmp 33c1 <_sk_store_565_avx+0x85>
+ DB 235,159 ; jmp 33bd <_sk_store_565_avx+0x85>
DB 102,144 ; xchg %ax,%ax
DB 245 ; cmc
DB 255 ; (bad)
@@ -7551,31 +7548,31 @@ _sk_load_4444_avx LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 76,139,16 ; mov (%rax),%r10
DB 72,133,201 ; test %rcx,%rcx
- DB 15,133,152,0,0,0 ; jne 34e6 <_sk_load_4444_avx+0xa6>
+ DB 15,133,152,0,0,0 ; jne 34e2 <_sk_load_4444_avx+0xa6>
DB 196,193,122,111,4,122 ; vmovdqu (%r10,%rdi,2),%xmm0
DB 197,241,239,201 ; vpxor %xmm1,%xmm1,%xmm1
DB 197,249,105,201 ; vpunpckhwd %xmm1,%xmm0,%xmm1
DB 196,226,121,51,192 ; vpmovzxwd %xmm0,%xmm0
DB 196,227,125,24,217,1 ; vinsertf128 $0x1,%xmm1,%ymm0,%ymm3
- DB 196,226,125,24,5,84,36,0,0 ; vbroadcastss 0x2454(%rip),%ymm0 # 58c4 <_sk_callback_avx+0x389>
+ DB 196,226,125,24,5,84,36,0,0 ; vbroadcastss 0x2454(%rip),%ymm0 # 58c0 <_sk_callback_avx+0x389>
DB 197,228,84,192 ; vandps %ymm0,%ymm3,%ymm0
DB 197,252,91,192 ; vcvtdq2ps %ymm0,%ymm0
- DB 196,226,125,24,13,71,36,0,0 ; vbroadcastss 0x2447(%rip),%ymm1 # 58c8 <_sk_callback_avx+0x38d>
+ DB 196,226,125,24,13,71,36,0,0 ; vbroadcastss 0x2447(%rip),%ymm1 # 58c4 <_sk_callback_avx+0x38d>
DB 197,252,89,193 ; vmulps %ymm1,%ymm0,%ymm0
- DB 196,226,125,24,13,62,36,0,0 ; vbroadcastss 0x243e(%rip),%ymm1 # 58cc <_sk_callback_avx+0x391>
+ DB 196,226,125,24,13,62,36,0,0 ; vbroadcastss 0x243e(%rip),%ymm1 # 58c8 <_sk_callback_avx+0x391>
DB 197,228,84,201 ; vandps %ymm1,%ymm3,%ymm1
DB 197,252,91,201 ; vcvtdq2ps %ymm1,%ymm1
- DB 196,226,125,24,21,49,36,0,0 ; vbroadcastss 0x2431(%rip),%ymm2 # 58d0 <_sk_callback_avx+0x395>
+ DB 196,226,125,24,21,49,36,0,0 ; vbroadcastss 0x2431(%rip),%ymm2 # 58cc <_sk_callback_avx+0x395>
DB 197,244,89,202 ; vmulps %ymm2,%ymm1,%ymm1
- DB 196,226,125,24,21,40,36,0,0 ; vbroadcastss 0x2428(%rip),%ymm2 # 58d4 <_sk_callback_avx+0x399>
+ DB 196,226,125,24,21,40,36,0,0 ; vbroadcastss 0x2428(%rip),%ymm2 # 58d0 <_sk_callback_avx+0x399>
DB 197,228,84,210 ; vandps %ymm2,%ymm3,%ymm2
DB 197,252,91,210 ; vcvtdq2ps %ymm2,%ymm2
- DB 196,98,125,24,5,27,36,0,0 ; vbroadcastss 0x241b(%rip),%ymm8 # 58d8 <_sk_callback_avx+0x39d>
+ DB 196,98,125,24,5,27,36,0,0 ; vbroadcastss 0x241b(%rip),%ymm8 # 58d4 <_sk_callback_avx+0x39d>
DB 196,193,108,89,208 ; vmulps %ymm8,%ymm2,%ymm2
- DB 196,98,125,24,5,17,36,0,0 ; vbroadcastss 0x2411(%rip),%ymm8 # 58dc <_sk_callback_avx+0x3a1>
+ DB 196,98,125,24,5,17,36,0,0 ; vbroadcastss 0x2411(%rip),%ymm8 # 58d8 <_sk_callback_avx+0x3a1>
DB 196,193,100,84,216 ; vandps %ymm8,%ymm3,%ymm3
DB 197,252,91,219 ; vcvtdq2ps %ymm3,%ymm3
- DB 196,98,125,24,5,3,36,0,0 ; vbroadcastss 0x2403(%rip),%ymm8 # 58e0 <_sk_callback_avx+0x3a5>
+ DB 196,98,125,24,5,3,36,0,0 ; vbroadcastss 0x2403(%rip),%ymm8 # 58dc <_sk_callback_avx+0x3a5>
DB 196,193,100,89,216 ; vmulps %ymm8,%ymm3,%ymm3
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
@@ -7584,9 +7581,9 @@ _sk_load_4444_avx LABEL PROC
DB 197,249,239,192 ; vpxor %xmm0,%xmm0,%xmm0
DB 65,254,200 ; dec %r8b
DB 65,128,248,6 ; cmp $0x6,%r8b
- DB 15,135,86,255,255,255 ; ja 3454 <_sk_load_4444_avx+0x14>
+ DB 15,135,86,255,255,255 ; ja 3450 <_sk_load_4444_avx+0x14>
DB 69,15,182,192 ; movzbl %r8b,%r8d
- DB 76,141,13,75,0,0,0 ; lea 0x4b(%rip),%r9 # 3554 <_sk_load_4444_avx+0x114>
+ DB 76,141,13,75,0,0,0 ; lea 0x4b(%rip),%r9 # 3550 <_sk_load_4444_avx+0x114>
DB 75,99,4,129 ; movslq (%r9,%r8,4),%rax
DB 76,1,200 ; add %r9,%rax
DB 255,224 ; jmpq *%rax
@@ -7598,7 +7595,7 @@ _sk_load_4444_avx LABEL PROC
DB 196,193,121,196,68,122,4,2 ; vpinsrw $0x2,0x4(%r10,%rdi,2),%xmm0,%xmm0
DB 196,193,121,196,68,122,2,1 ; vpinsrw $0x1,0x2(%r10,%rdi,2),%xmm0,%xmm0
DB 196,193,121,196,4,122,0 ; vpinsrw $0x0,(%r10,%rdi,2),%xmm0,%xmm0
- DB 233,2,255,255,255 ; jmpq 3454 <_sk_load_4444_avx+0x14>
+ DB 233,2,255,255,255 ; jmpq 3450 <_sk_load_4444_avx+0x14>
DB 102,144 ; xchg %ax,%ax
DB 242,255 ; repnz (bad)
DB 255 ; (bad)
@@ -7675,25 +7672,25 @@ _sk_gather_4444_avx LABEL PROC
DB 197,249,105,201 ; vpunpckhwd %xmm1,%xmm0,%xmm1
DB 196,226,121,51,192 ; vpmovzxwd %xmm0,%xmm0
DB 196,227,125,24,217,1 ; vinsertf128 $0x1,%xmm1,%ymm0,%ymm3
- DB 196,226,125,24,5,154,34,0,0 ; vbroadcastss 0x229a(%rip),%ymm0 # 58e4 <_sk_callback_avx+0x3a9>
+ DB 196,226,125,24,5,154,34,0,0 ; vbroadcastss 0x229a(%rip),%ymm0 # 58e0 <_sk_callback_avx+0x3a9>
DB 197,228,84,192 ; vandps %ymm0,%ymm3,%ymm0
DB 197,252,91,192 ; vcvtdq2ps %ymm0,%ymm0
- DB 196,226,125,24,13,141,34,0,0 ; vbroadcastss 0x228d(%rip),%ymm1 # 58e8 <_sk_callback_avx+0x3ad>
+ DB 196,226,125,24,13,141,34,0,0 ; vbroadcastss 0x228d(%rip),%ymm1 # 58e4 <_sk_callback_avx+0x3ad>
DB 197,252,89,193 ; vmulps %ymm1,%ymm0,%ymm0
- DB 196,226,125,24,13,132,34,0,0 ; vbroadcastss 0x2284(%rip),%ymm1 # 58ec <_sk_callback_avx+0x3b1>
+ DB 196,226,125,24,13,132,34,0,0 ; vbroadcastss 0x2284(%rip),%ymm1 # 58e8 <_sk_callback_avx+0x3b1>
DB 197,228,84,201 ; vandps %ymm1,%ymm3,%ymm1
DB 197,252,91,201 ; vcvtdq2ps %ymm1,%ymm1
- DB 196,226,125,24,21,119,34,0,0 ; vbroadcastss 0x2277(%rip),%ymm2 # 58f0 <_sk_callback_avx+0x3b5>
+ DB 196,226,125,24,21,119,34,0,0 ; vbroadcastss 0x2277(%rip),%ymm2 # 58ec <_sk_callback_avx+0x3b5>
DB 197,244,89,202 ; vmulps %ymm2,%ymm1,%ymm1
- DB 196,226,125,24,21,110,34,0,0 ; vbroadcastss 0x226e(%rip),%ymm2 # 58f4 <_sk_callback_avx+0x3b9>
+ DB 196,226,125,24,21,110,34,0,0 ; vbroadcastss 0x226e(%rip),%ymm2 # 58f0 <_sk_callback_avx+0x3b9>
DB 197,228,84,210 ; vandps %ymm2,%ymm3,%ymm2
DB 197,252,91,210 ; vcvtdq2ps %ymm2,%ymm2
- DB 196,98,125,24,5,97,34,0,0 ; vbroadcastss 0x2261(%rip),%ymm8 # 58f8 <_sk_callback_avx+0x3bd>
+ DB 196,98,125,24,5,97,34,0,0 ; vbroadcastss 0x2261(%rip),%ymm8 # 58f4 <_sk_callback_avx+0x3bd>
DB 196,193,108,89,208 ; vmulps %ymm8,%ymm2,%ymm2
- DB 196,98,125,24,5,87,34,0,0 ; vbroadcastss 0x2257(%rip),%ymm8 # 58fc <_sk_callback_avx+0x3c1>
+ DB 196,98,125,24,5,87,34,0,0 ; vbroadcastss 0x2257(%rip),%ymm8 # 58f8 <_sk_callback_avx+0x3c1>
DB 196,193,100,84,216 ; vandps %ymm8,%ymm3,%ymm3
DB 197,252,91,219 ; vcvtdq2ps %ymm3,%ymm3
- DB 196,98,125,24,5,73,34,0,0 ; vbroadcastss 0x2249(%rip),%ymm8 # 5900 <_sk_callback_avx+0x3c5>
+ DB 196,98,125,24,5,73,34,0,0 ; vbroadcastss 0x2249(%rip),%ymm8 # 58fc <_sk_callback_avx+0x3c5>
DB 196,193,100,89,216 ; vmulps %ymm8,%ymm3,%ymm3
DB 72,173 ; lods %ds:(%rsi),%rax
DB 91 ; pop %rbx
@@ -7707,7 +7704,7 @@ PUBLIC _sk_store_4444_avx
_sk_store_4444_avx LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 76,139,16 ; mov (%rax),%r10
- DB 196,98,125,24,5,46,34,0,0 ; vbroadcastss 0x222e(%rip),%ymm8 # 5904 <_sk_callback_avx+0x3c9>
+ DB 196,98,125,24,5,46,34,0,0 ; vbroadcastss 0x222e(%rip),%ymm8 # 5900 <_sk_callback_avx+0x3c9>
DB 196,65,124,89,200 ; vmulps %ymm8,%ymm0,%ymm9
DB 196,65,125,91,201 ; vcvtps2dq %ymm9,%ymm9
DB 196,193,41,114,241,12 ; vpslld $0xc,%xmm9,%xmm10
@@ -7734,7 +7731,7 @@ _sk_store_4444_avx LABEL PROC
DB 196,67,125,25,193,1 ; vextractf128 $0x1,%ymm8,%xmm9
DB 196,66,57,43,193 ; vpackusdw %xmm9,%xmm8,%xmm8
DB 72,133,201 ; test %rcx,%rcx
- DB 117,10 ; jne 376f <_sk_store_4444_avx+0xa7>
+ DB 117,10 ; jne 376b <_sk_store_4444_avx+0xa7>
DB 196,65,122,127,4,122 ; vmovdqu %xmm8,(%r10,%rdi,2)
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
@@ -7742,9 +7739,9 @@ _sk_store_4444_avx LABEL PROC
DB 65,128,224,7 ; and $0x7,%r8b
DB 65,254,200 ; dec %r8b
DB 65,128,248,6 ; cmp $0x6,%r8b
- DB 119,236 ; ja 376b <_sk_store_4444_avx+0xa3>
+ DB 119,236 ; ja 3767 <_sk_store_4444_avx+0xa3>
DB 69,15,182,192 ; movzbl %r8b,%r8d
- DB 76,141,13,66,0,0,0 ; lea 0x42(%rip),%r9 # 37cc <_sk_store_4444_avx+0x104>
+ DB 76,141,13,66,0,0,0 ; lea 0x42(%rip),%r9 # 37c8 <_sk_store_4444_avx+0x104>
DB 75,99,4,129 ; movslq (%r9,%r8,4),%rax
DB 76,1,200 ; add %r9,%rax
DB 255,224 ; jmpq *%rax
@@ -7755,7 +7752,7 @@ _sk_store_4444_avx LABEL PROC
DB 196,67,121,21,68,122,4,2 ; vpextrw $0x2,%xmm8,0x4(%r10,%rdi,2)
DB 196,67,121,21,68,122,2,1 ; vpextrw $0x1,%xmm8,0x2(%r10,%rdi,2)
DB 196,67,121,21,4,122,0 ; vpextrw $0x0,%xmm8,(%r10,%rdi,2)
- DB 235,159 ; jmp 376b <_sk_store_4444_avx+0xa3>
+ DB 235,159 ; jmp 3767 <_sk_store_4444_avx+0xa3>
DB 247,255 ; idiv %edi
DB 255 ; (bad)
DB 255 ; (bad)
@@ -7784,12 +7781,12 @@ _sk_load_8888_avx LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 76,139,16 ; mov (%rax),%r10
DB 72,133,201 ; test %rcx,%rcx
- DB 15,133,135,0,0,0 ; jne 387d <_sk_load_8888_avx+0x95>
+ DB 15,133,135,0,0,0 ; jne 3879 <_sk_load_8888_avx+0x95>
DB 196,65,124,16,12,186 ; vmovups (%r10,%rdi,4),%ymm9
- DB 197,124,40,21,92,34,0,0 ; vmovaps 0x225c(%rip),%ymm10 # 5a60 <_sk_callback_avx+0x525>
+ DB 197,124,40,21,96,34,0,0 ; vmovaps 0x2260(%rip),%ymm10 # 5a60 <_sk_callback_avx+0x529>
DB 196,193,52,84,194 ; vandps %ymm10,%ymm9,%ymm0
DB 197,252,91,192 ; vcvtdq2ps %ymm0,%ymm0
- DB 196,98,125,24,5,242,32,0,0 ; vbroadcastss 0x20f2(%rip),%ymm8 # 5908 <_sk_callback_avx+0x3cd>
+ DB 196,98,125,24,5,242,32,0,0 ; vbroadcastss 0x20f2(%rip),%ymm8 # 5904 <_sk_callback_avx+0x3cd>
DB 196,193,124,89,192 ; vmulps %ymm8,%ymm0,%ymm0
DB 196,193,113,114,209,8 ; vpsrld $0x8,%xmm9,%xmm1
DB 196,99,125,25,203,1 ; vextractf128 $0x1,%ymm9,%xmm3
@@ -7816,9 +7813,9 @@ _sk_load_8888_avx LABEL PROC
DB 196,65,52,87,201 ; vxorps %ymm9,%ymm9,%ymm9
DB 65,254,200 ; dec %r8b
DB 65,128,248,6 ; cmp $0x6,%r8b
- DB 15,135,102,255,255,255 ; ja 37fc <_sk_load_8888_avx+0x14>
+ DB 15,135,102,255,255,255 ; ja 37f8 <_sk_load_8888_avx+0x14>
DB 69,15,182,192 ; movzbl %r8b,%r8d
- DB 76,141,13,139,0,0,0 ; lea 0x8b(%rip),%r9 # 392c <_sk_load_8888_avx+0x144>
+ DB 76,141,13,139,0,0,0 ; lea 0x8b(%rip),%r9 # 3928 <_sk_load_8888_avx+0x144>
DB 75,99,4,129 ; movslq (%r9,%r8,4),%rax
DB 76,1,200 ; add %r9,%rax
DB 255,224 ; jmpq *%rax
@@ -7841,7 +7838,7 @@ _sk_load_8888_avx LABEL PROC
DB 196,99,53,12,200,15 ; vblendps $0xf,%ymm0,%ymm9,%ymm9
DB 196,195,49,34,4,186,0 ; vpinsrd $0x0,(%r10,%rdi,4),%xmm9,%xmm0
DB 196,99,53,12,200,15 ; vblendps $0xf,%ymm0,%ymm9,%ymm9
- DB 233,210,254,255,255 ; jmpq 37fc <_sk_load_8888_avx+0x14>
+ DB 233,210,254,255,255 ; jmpq 37f8 <_sk_load_8888_avx+0x14>
DB 102,144 ; xchg %ax,%ax
DB 236 ; in (%dx),%al
DB 255 ; (bad)
@@ -7859,7 +7856,7 @@ _sk_load_8888_avx LABEL PROC
DB 255 ; (bad)
DB 255 ; (bad)
DB 255 ; (bad)
- DB 126,255 ; jle 3945 <_sk_load_8888_avx+0x15d>
+ DB 126,255 ; jle 3941 <_sk_load_8888_avx+0x15d>
DB 255 ; (bad)
DB 255 ; .byte 0xff
@@ -7902,10 +7899,10 @@ _sk_gather_8888_avx LABEL PROC
DB 196,131,121,34,4,152,2 ; vpinsrd $0x2,(%r8,%r11,4),%xmm0,%xmm0
DB 196,131,121,34,28,144,3 ; vpinsrd $0x3,(%r8,%r10,4),%xmm0,%xmm3
DB 196,227,61,24,195,1 ; vinsertf128 $0x1,%xmm3,%ymm8,%ymm0
- DB 197,124,40,21,134,32,0,0 ; vmovaps 0x2086(%rip),%ymm10 # 5a80 <_sk_callback_avx+0x545>
+ DB 197,124,40,21,138,32,0,0 ; vmovaps 0x208a(%rip),%ymm10 # 5a80 <_sk_callback_avx+0x549>
DB 196,193,124,84,194 ; vandps %ymm10,%ymm0,%ymm0
DB 197,252,91,192 ; vcvtdq2ps %ymm0,%ymm0
- DB 196,98,125,24,13,0,31,0,0 ; vbroadcastss 0x1f00(%rip),%ymm9 # 590c <_sk_callback_avx+0x3d1>
+ DB 196,98,125,24,13,0,31,0,0 ; vbroadcastss 0x1f00(%rip),%ymm9 # 5908 <_sk_callback_avx+0x3d1>
DB 196,193,124,89,193 ; vmulps %ymm9,%ymm0,%ymm0
DB 196,193,113,114,208,8 ; vpsrld $0x8,%xmm8,%xmm1
DB 197,233,114,211,8 ; vpsrld $0x8,%xmm3,%xmm2
@@ -7935,7 +7932,7 @@ PUBLIC _sk_store_8888_avx
_sk_store_8888_avx LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 76,139,16 ; mov (%rax),%r10
- DB 196,98,125,24,5,142,30,0,0 ; vbroadcastss 0x1e8e(%rip),%ymm8 # 5910 <_sk_callback_avx+0x3d5>
+ DB 196,98,125,24,5,142,30,0,0 ; vbroadcastss 0x1e8e(%rip),%ymm8 # 590c <_sk_callback_avx+0x3d5>
DB 196,65,124,89,200 ; vmulps %ymm8,%ymm0,%ymm9
DB 196,65,125,91,201 ; vcvtps2dq %ymm9,%ymm9
DB 196,65,116,89,208 ; vmulps %ymm8,%ymm1,%ymm10
@@ -7960,7 +7957,7 @@ _sk_store_8888_avx LABEL PROC
DB 196,65,45,86,192 ; vorpd %ymm8,%ymm10,%ymm8
DB 196,65,53,86,192 ; vorpd %ymm8,%ymm9,%ymm8
DB 72,133,201 ; test %rcx,%rcx
- DB 117,10 ; jne 3b10 <_sk_store_8888_avx+0x9c>
+ DB 117,10 ; jne 3b0c <_sk_store_8888_avx+0x9c>
DB 196,65,124,17,4,186 ; vmovups %ymm8,(%r10,%rdi,4)
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
@@ -7968,9 +7965,9 @@ _sk_store_8888_avx LABEL PROC
DB 65,128,224,7 ; and $0x7,%r8b
DB 65,254,200 ; dec %r8b
DB 65,128,248,6 ; cmp $0x6,%r8b
- DB 119,236 ; ja 3b0c <_sk_store_8888_avx+0x98>
+ DB 119,236 ; ja 3b08 <_sk_store_8888_avx+0x98>
DB 69,15,182,192 ; movzbl %r8b,%r8d
- DB 76,141,13,85,0,0,0 ; lea 0x55(%rip),%r9 # 3b80 <_sk_store_8888_avx+0x10c>
+ DB 76,141,13,85,0,0,0 ; lea 0x55(%rip),%r9 # 3b7c <_sk_store_8888_avx+0x10c>
DB 75,99,4,129 ; movslq (%r9,%r8,4),%rax
DB 76,1,200 ; add %r9,%rax
DB 255,224 ; jmpq *%rax
@@ -7984,7 +7981,7 @@ _sk_store_8888_avx LABEL PROC
DB 196,67,121,22,68,186,8,2 ; vpextrd $0x2,%xmm8,0x8(%r10,%rdi,4)
DB 196,67,121,22,68,186,4,1 ; vpextrd $0x1,%xmm8,0x4(%r10,%rdi,4)
DB 196,65,121,126,4,186 ; vmovd %xmm8,(%r10,%rdi,4)
- DB 235,143 ; jmp 3b0c <_sk_store_8888_avx+0x98>
+ DB 235,143 ; jmp 3b08 <_sk_store_8888_avx+0x98>
DB 15,31,0 ; nopl (%rax)
DB 245 ; cmc
DB 255 ; (bad)
@@ -8020,7 +8017,7 @@ _sk_load_f16_avx LABEL PROC
DB 197,252,17,116,36,64 ; vmovups %ymm6,0x40(%rsp)
DB 197,252,17,108,36,32 ; vmovups %ymm5,0x20(%rsp)
DB 197,254,127,36,36 ; vmovdqu %ymm4,(%rsp)
- DB 15,133,143,2,0,0 ; jne 3e57 <_sk_load_f16_avx+0x2bb>
+ DB 15,133,143,2,0,0 ; jne 3e53 <_sk_load_f16_avx+0x2bb>
DB 197,121,16,4,248 ; vmovupd (%rax,%rdi,8),%xmm8
DB 197,249,16,84,248,16 ; vmovupd 0x10(%rax,%rdi,8),%xmm2
DB 197,249,16,76,248,32 ; vmovupd 0x20(%rax,%rdi,8),%xmm1
@@ -8038,13 +8035,13 @@ _sk_load_f16_avx LABEL PROC
DB 197,249,105,201 ; vpunpckhwd %xmm1,%xmm0,%xmm1
DB 196,226,121,51,192 ; vpmovzxwd %xmm0,%xmm0
DB 196,227,125,24,193,1 ; vinsertf128 $0x1,%xmm1,%ymm0,%ymm0
- DB 196,98,125,24,37,243,28,0,0 ; vbroadcastss 0x1cf3(%rip),%ymm12 # 5914 <_sk_callback_avx+0x3d9>
+ DB 196,98,125,24,37,243,28,0,0 ; vbroadcastss 0x1cf3(%rip),%ymm12 # 5910 <_sk_callback_avx+0x3d9>
DB 196,193,124,84,204 ; vandps %ymm12,%ymm0,%ymm1
DB 197,252,87,193 ; vxorps %ymm1,%ymm0,%ymm0
DB 196,195,125,25,198,1 ; vextractf128 $0x1,%ymm0,%xmm14
- DB 196,98,121,24,29,223,28,0,0 ; vbroadcastss 0x1cdf(%rip),%xmm11 # 5918 <_sk_callback_avx+0x3dd>
+ DB 196,98,121,24,29,223,28,0,0 ; vbroadcastss 0x1cdf(%rip),%xmm11 # 5914 <_sk_callback_avx+0x3dd>
DB 196,193,8,87,219 ; vxorps %xmm11,%xmm14,%xmm3
- DB 196,98,121,24,45,213,28,0,0 ; vbroadcastss 0x1cd5(%rip),%xmm13 # 591c <_sk_callback_avx+0x3e1>
+ DB 196,98,121,24,45,213,28,0,0 ; vbroadcastss 0x1cd5(%rip),%xmm13 # 5918 <_sk_callback_avx+0x3e1>
DB 197,145,102,219 ; vpcmpgtd %xmm3,%xmm13,%xmm3
DB 196,65,120,87,211 ; vxorps %xmm11,%xmm0,%xmm10
DB 196,65,17,102,210 ; vpcmpgtd %xmm10,%xmm13,%xmm10
@@ -8058,7 +8055,7 @@ _sk_load_f16_avx LABEL PROC
DB 196,227,125,24,195,1 ; vinsertf128 $0x1,%xmm3,%ymm0,%ymm0
DB 197,252,86,193 ; vorps %ymm1,%ymm0,%ymm0
DB 196,227,125,25,193,1 ; vextractf128 $0x1,%ymm0,%xmm1
- DB 196,226,121,24,29,139,28,0,0 ; vbroadcastss 0x1c8b(%rip),%xmm3 # 5920 <_sk_callback_avx+0x3e5>
+ DB 196,226,121,24,29,139,28,0,0 ; vbroadcastss 0x1c8b(%rip),%xmm3 # 591c <_sk_callback_avx+0x3e5>
DB 197,241,254,203 ; vpaddd %xmm3,%xmm1,%xmm1
DB 197,249,254,195 ; vpaddd %xmm3,%xmm0,%xmm0
DB 196,227,125,24,193,1 ; vinsertf128 $0x1,%xmm1,%ymm0,%ymm0
@@ -8151,29 +8148,29 @@ _sk_load_f16_avx LABEL PROC
DB 197,123,16,4,248 ; vmovsd (%rax,%rdi,8),%xmm8
DB 196,65,49,239,201 ; vpxor %xmm9,%xmm9,%xmm9
DB 72,131,249,1 ; cmp $0x1,%rcx
- DB 116,79 ; je 3eb6 <_sk_load_f16_avx+0x31a>
+ DB 116,79 ; je 3eb2 <_sk_load_f16_avx+0x31a>
DB 197,57,22,68,248,8 ; vmovhpd 0x8(%rax,%rdi,8),%xmm8,%xmm8
DB 72,131,249,3 ; cmp $0x3,%rcx
- DB 114,67 ; jb 3eb6 <_sk_load_f16_avx+0x31a>
+ DB 114,67 ; jb 3eb2 <_sk_load_f16_avx+0x31a>
DB 197,251,16,84,248,16 ; vmovsd 0x10(%rax,%rdi,8),%xmm2
DB 72,131,249,3 ; cmp $0x3,%rcx
- DB 116,68 ; je 3ec3 <_sk_load_f16_avx+0x327>
+ DB 116,68 ; je 3ebf <_sk_load_f16_avx+0x327>
DB 197,233,22,84,248,24 ; vmovhpd 0x18(%rax,%rdi,8),%xmm2,%xmm2
DB 72,131,249,5 ; cmp $0x5,%rcx
- DB 114,56 ; jb 3ec3 <_sk_load_f16_avx+0x327>
+ DB 114,56 ; jb 3ebf <_sk_load_f16_avx+0x327>
DB 197,251,16,76,248,32 ; vmovsd 0x20(%rax,%rdi,8),%xmm1
DB 72,131,249,5 ; cmp $0x5,%rcx
- DB 15,132,68,253,255,255 ; je 3bdf <_sk_load_f16_avx+0x43>
+ DB 15,132,68,253,255,255 ; je 3bdb <_sk_load_f16_avx+0x43>
DB 197,241,22,76,248,40 ; vmovhpd 0x28(%rax,%rdi,8),%xmm1,%xmm1
DB 72,131,249,7 ; cmp $0x7,%rcx
- DB 15,130,52,253,255,255 ; jb 3bdf <_sk_load_f16_avx+0x43>
+ DB 15,130,52,253,255,255 ; jb 3bdb <_sk_load_f16_avx+0x43>
DB 197,122,126,76,248,48 ; vmovq 0x30(%rax,%rdi,8),%xmm9
- DB 233,41,253,255,255 ; jmpq 3bdf <_sk_load_f16_avx+0x43>
+ DB 233,41,253,255,255 ; jmpq 3bdb <_sk_load_f16_avx+0x43>
DB 197,241,87,201 ; vxorpd %xmm1,%xmm1,%xmm1
DB 197,233,87,210 ; vxorpd %xmm2,%xmm2,%xmm2
- DB 233,28,253,255,255 ; jmpq 3bdf <_sk_load_f16_avx+0x43>
+ DB 233,28,253,255,255 ; jmpq 3bdb <_sk_load_f16_avx+0x43>
DB 197,241,87,201 ; vxorpd %xmm1,%xmm1,%xmm1
- DB 233,19,253,255,255 ; jmpq 3bdf <_sk_load_f16_avx+0x43>
+ DB 233,19,253,255,255 ; jmpq 3bdb <_sk_load_f16_avx+0x43>
PUBLIC _sk_gather_f16_avx
_sk_gather_f16_avx LABEL PROC
@@ -8235,13 +8232,13 @@ _sk_gather_f16_avx LABEL PROC
DB 197,249,105,210 ; vpunpckhwd %xmm2,%xmm0,%xmm2
DB 196,226,121,51,192 ; vpmovzxwd %xmm0,%xmm0
DB 196,227,125,24,194,1 ; vinsertf128 $0x1,%xmm2,%ymm0,%ymm0
- DB 196,98,125,24,37,75,25,0,0 ; vbroadcastss 0x194b(%rip),%ymm12 # 5924 <_sk_callback_avx+0x3e9>
+ DB 196,98,125,24,37,75,25,0,0 ; vbroadcastss 0x194b(%rip),%ymm12 # 5920 <_sk_callback_avx+0x3e9>
DB 196,193,124,84,212 ; vandps %ymm12,%ymm0,%ymm2
DB 197,252,87,194 ; vxorps %ymm2,%ymm0,%ymm0
DB 196,195,125,25,198,1 ; vextractf128 $0x1,%ymm0,%xmm14
- DB 196,98,121,24,29,55,25,0,0 ; vbroadcastss 0x1937(%rip),%xmm11 # 5928 <_sk_callback_avx+0x3ed>
+ DB 196,98,121,24,29,55,25,0,0 ; vbroadcastss 0x1937(%rip),%xmm11 # 5924 <_sk_callback_avx+0x3ed>
DB 196,193,8,87,219 ; vxorps %xmm11,%xmm14,%xmm3
- DB 196,98,121,24,45,45,25,0,0 ; vbroadcastss 0x192d(%rip),%xmm13 # 592c <_sk_callback_avx+0x3f1>
+ DB 196,98,121,24,45,45,25,0,0 ; vbroadcastss 0x192d(%rip),%xmm13 # 5928 <_sk_callback_avx+0x3f1>
DB 197,145,102,219 ; vpcmpgtd %xmm3,%xmm13,%xmm3
DB 196,65,120,87,211 ; vxorps %xmm11,%xmm0,%xmm10
DB 196,65,17,102,210 ; vpcmpgtd %xmm10,%xmm13,%xmm10
@@ -8255,7 +8252,7 @@ _sk_gather_f16_avx LABEL PROC
DB 196,227,125,24,195,1 ; vinsertf128 $0x1,%xmm3,%ymm0,%ymm0
DB 197,252,86,194 ; vorps %ymm2,%ymm0,%ymm0
DB 196,227,125,25,194,1 ; vextractf128 $0x1,%ymm0,%xmm2
- DB 196,226,121,24,29,227,24,0,0 ; vbroadcastss 0x18e3(%rip),%xmm3 # 5930 <_sk_callback_avx+0x3f5>
+ DB 196,226,121,24,29,227,24,0,0 ; vbroadcastss 0x18e3(%rip),%xmm3 # 592c <_sk_callback_avx+0x3f5>
DB 197,233,254,211 ; vpaddd %xmm3,%xmm2,%xmm2
DB 197,249,254,195 ; vpaddd %xmm3,%xmm0,%xmm0
DB 196,227,125,24,194,1 ; vinsertf128 $0x1,%xmm2,%ymm0,%ymm0
@@ -8357,12 +8354,12 @@ _sk_store_f16_avx LABEL PROC
DB 197,252,17,180,36,128,0,0,0 ; vmovups %ymm6,0x80(%rsp)
DB 197,252,17,108,36,96 ; vmovups %ymm5,0x60(%rsp)
DB 197,252,17,100,36,64 ; vmovups %ymm4,0x40(%rsp)
- DB 196,98,125,24,13,240,22,0,0 ; vbroadcastss 0x16f0(%rip),%ymm9 # 5934 <_sk_callback_avx+0x3f9>
+ DB 196,98,125,24,13,240,22,0,0 ; vbroadcastss 0x16f0(%rip),%ymm9 # 5930 <_sk_callback_avx+0x3f9>
DB 196,65,124,84,209 ; vandps %ymm9,%ymm0,%ymm10
DB 197,252,17,4,36 ; vmovups %ymm0,(%rsp)
DB 196,65,124,87,218 ; vxorps %ymm10,%ymm0,%ymm11
DB 196,67,125,25,220,1 ; vextractf128 $0x1,%ymm11,%xmm12
- DB 196,98,121,24,5,214,22,0,0 ; vbroadcastss 0x16d6(%rip),%xmm8 # 5938 <_sk_callback_avx+0x3fd>
+ DB 196,98,121,24,5,214,22,0,0 ; vbroadcastss 0x16d6(%rip),%xmm8 # 5934 <_sk_callback_avx+0x3fd>
DB 196,65,57,102,236 ; vpcmpgtd %xmm12,%xmm8,%xmm13
DB 196,65,57,102,243 ; vpcmpgtd %xmm11,%xmm8,%xmm14
DB 196,67,13,24,237,1 ; vinsertf128 $0x1,%xmm13,%ymm14,%ymm13
@@ -8372,7 +8369,7 @@ _sk_store_f16_avx LABEL PROC
DB 196,67,13,24,242,1 ; vinsertf128 $0x1,%xmm10,%ymm14,%ymm14
DB 196,193,33,114,211,13 ; vpsrld $0xd,%xmm11,%xmm11
DB 196,193,25,114,212,13 ; vpsrld $0xd,%xmm12,%xmm12
- DB 196,98,125,24,21,157,22,0,0 ; vbroadcastss 0x169d(%rip),%ymm10 # 593c <_sk_callback_avx+0x401>
+ DB 196,98,125,24,21,157,22,0,0 ; vbroadcastss 0x169d(%rip),%ymm10 # 5938 <_sk_callback_avx+0x401>
DB 196,65,12,86,242 ; vorps %ymm10,%ymm14,%ymm14
DB 196,67,125,25,247,1 ; vextractf128 $0x1,%ymm14,%xmm15
DB 196,65,1,254,228 ; vpaddd %xmm12,%xmm15,%xmm12
@@ -8454,7 +8451,7 @@ _sk_store_f16_avx LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 72,139,0 ; mov (%rax),%rax
DB 72,133,201 ; test %rcx,%rcx
- DB 117,75 ; jne 4486 <_sk_store_f16_avx+0x270>
+ DB 117,75 ; jne 4482 <_sk_store_f16_avx+0x270>
DB 197,120,17,28,248 ; vmovups %xmm11,(%rax,%rdi,8)
DB 197,120,17,84,248,16 ; vmovups %xmm10,0x10(%rax,%rdi,8)
DB 197,120,17,76,248,32 ; vmovups %xmm9,0x20(%rax,%rdi,8)
@@ -8470,22 +8467,22 @@ _sk_store_f16_avx LABEL PROC
DB 255,224 ; jmpq *%rax
DB 197,121,214,28,248 ; vmovq %xmm11,(%rax,%rdi,8)
DB 72,131,249,1 ; cmp $0x1,%rcx
- DB 116,193 ; je 4452 <_sk_store_f16_avx+0x23c>
+ DB 116,193 ; je 444e <_sk_store_f16_avx+0x23c>
DB 197,121,23,92,248,8 ; vmovhpd %xmm11,0x8(%rax,%rdi,8)
DB 72,131,249,3 ; cmp $0x3,%rcx
- DB 114,181 ; jb 4452 <_sk_store_f16_avx+0x23c>
+ DB 114,181 ; jb 444e <_sk_store_f16_avx+0x23c>
DB 197,121,214,84,248,16 ; vmovq %xmm10,0x10(%rax,%rdi,8)
- DB 116,173 ; je 4452 <_sk_store_f16_avx+0x23c>
+ DB 116,173 ; je 444e <_sk_store_f16_avx+0x23c>
DB 197,121,23,84,248,24 ; vmovhpd %xmm10,0x18(%rax,%rdi,8)
DB 72,131,249,5 ; cmp $0x5,%rcx
- DB 114,161 ; jb 4452 <_sk_store_f16_avx+0x23c>
+ DB 114,161 ; jb 444e <_sk_store_f16_avx+0x23c>
DB 197,121,214,76,248,32 ; vmovq %xmm9,0x20(%rax,%rdi,8)
- DB 116,153 ; je 4452 <_sk_store_f16_avx+0x23c>
+ DB 116,153 ; je 444e <_sk_store_f16_avx+0x23c>
DB 197,121,23,76,248,40 ; vmovhpd %xmm9,0x28(%rax,%rdi,8)
DB 72,131,249,7 ; cmp $0x7,%rcx
- DB 114,141 ; jb 4452 <_sk_store_f16_avx+0x23c>
+ DB 114,141 ; jb 444e <_sk_store_f16_avx+0x23c>
DB 197,121,214,68,248,48 ; vmovq %xmm8,0x30(%rax,%rdi,8)
- DB 235,133 ; jmp 4452 <_sk_store_f16_avx+0x23c>
+ DB 235,133 ; jmp 444e <_sk_store_f16_avx+0x23c>
PUBLIC _sk_load_u16_be_avx
_sk_load_u16_be_avx LABEL PROC
@@ -8493,7 +8490,7 @@ _sk_load_u16_be_avx LABEL PROC
DB 76,139,0 ; mov (%rax),%r8
DB 72,141,4,189,0,0,0,0 ; lea 0x0(,%rdi,4),%rax
DB 72,133,201 ; test %rcx,%rcx
- DB 15,133,253,0,0,0 ; jne 45e0 <_sk_load_u16_be_avx+0x113>
+ DB 15,133,253,0,0,0 ; jne 45dc <_sk_load_u16_be_avx+0x113>
DB 196,65,121,16,4,64 ; vmovupd (%r8,%rax,2),%xmm8
DB 196,193,121,16,84,64,16 ; vmovupd 0x10(%r8,%rax,2),%xmm2
DB 196,193,121,16,92,64,32 ; vmovupd 0x20(%r8,%rax,2),%xmm3
@@ -8515,7 +8512,7 @@ _sk_load_u16_be_avx LABEL PROC
DB 196,226,121,51,192 ; vpmovzxwd %xmm0,%xmm0
DB 196,227,125,24,193,1 ; vinsertf128 $0x1,%xmm1,%ymm0,%ymm0
DB 197,252,91,192 ; vcvtdq2ps %ymm0,%ymm0
- DB 196,98,125,24,29,236,19,0,0 ; vbroadcastss 0x13ec(%rip),%ymm11 # 5940 <_sk_callback_avx+0x405>
+ DB 196,98,125,24,29,236,19,0,0 ; vbroadcastss 0x13ec(%rip),%ymm11 # 593c <_sk_callback_avx+0x405>
DB 196,193,124,89,195 ; vmulps %ymm11,%ymm0,%ymm0
DB 197,177,109,202 ; vpunpckhqdq %xmm2,%xmm9,%xmm1
DB 197,233,113,241,8 ; vpsllw $0x8,%xmm1,%xmm2
@@ -8549,29 +8546,29 @@ _sk_load_u16_be_avx LABEL PROC
DB 196,65,123,16,4,64 ; vmovsd (%r8,%rax,2),%xmm8
DB 196,65,49,239,201 ; vpxor %xmm9,%xmm9,%xmm9
DB 72,131,249,1 ; cmp $0x1,%rcx
- DB 116,85 ; je 4646 <_sk_load_u16_be_avx+0x179>
+ DB 116,85 ; je 4642 <_sk_load_u16_be_avx+0x179>
DB 196,65,57,22,68,64,8 ; vmovhpd 0x8(%r8,%rax,2),%xmm8,%xmm8
DB 72,131,249,3 ; cmp $0x3,%rcx
- DB 114,72 ; jb 4646 <_sk_load_u16_be_avx+0x179>
+ DB 114,72 ; jb 4642 <_sk_load_u16_be_avx+0x179>
DB 196,193,123,16,84,64,16 ; vmovsd 0x10(%r8,%rax,2),%xmm2
DB 72,131,249,3 ; cmp $0x3,%rcx
- DB 116,72 ; je 4653 <_sk_load_u16_be_avx+0x186>
+ DB 116,72 ; je 464f <_sk_load_u16_be_avx+0x186>
DB 196,193,105,22,84,64,24 ; vmovhpd 0x18(%r8,%rax,2),%xmm2,%xmm2
DB 72,131,249,5 ; cmp $0x5,%rcx
- DB 114,59 ; jb 4653 <_sk_load_u16_be_avx+0x186>
+ DB 114,59 ; jb 464f <_sk_load_u16_be_avx+0x186>
DB 196,193,123,16,92,64,32 ; vmovsd 0x20(%r8,%rax,2),%xmm3
DB 72,131,249,5 ; cmp $0x5,%rcx
- DB 15,132,213,254,255,255 ; je 44fe <_sk_load_u16_be_avx+0x31>
+ DB 15,132,213,254,255,255 ; je 44fa <_sk_load_u16_be_avx+0x31>
DB 196,193,97,22,92,64,40 ; vmovhpd 0x28(%r8,%rax,2),%xmm3,%xmm3
DB 72,131,249,7 ; cmp $0x7,%rcx
- DB 15,130,196,254,255,255 ; jb 44fe <_sk_load_u16_be_avx+0x31>
+ DB 15,130,196,254,255,255 ; jb 44fa <_sk_load_u16_be_avx+0x31>
DB 196,65,122,126,76,64,48 ; vmovq 0x30(%r8,%rax,2),%xmm9
- DB 233,184,254,255,255 ; jmpq 44fe <_sk_load_u16_be_avx+0x31>
+ DB 233,184,254,255,255 ; jmpq 44fa <_sk_load_u16_be_avx+0x31>
DB 197,225,87,219 ; vxorpd %xmm3,%xmm3,%xmm3
DB 197,233,87,210 ; vxorpd %xmm2,%xmm2,%xmm2
- DB 233,171,254,255,255 ; jmpq 44fe <_sk_load_u16_be_avx+0x31>
+ DB 233,171,254,255,255 ; jmpq 44fa <_sk_load_u16_be_avx+0x31>
DB 197,225,87,219 ; vxorpd %xmm3,%xmm3,%xmm3
- DB 233,162,254,255,255 ; jmpq 44fe <_sk_load_u16_be_avx+0x31>
+ DB 233,162,254,255,255 ; jmpq 44fa <_sk_load_u16_be_avx+0x31>
PUBLIC _sk_load_rgb_u16_be_avx
_sk_load_rgb_u16_be_avx LABEL PROC
@@ -8579,7 +8576,7 @@ _sk_load_rgb_u16_be_avx LABEL PROC
DB 76,139,0 ; mov (%rax),%r8
DB 72,141,4,127 ; lea (%rdi,%rdi,2),%rax
DB 72,133,201 ; test %rcx,%rcx
- DB 15,133,243,0,0,0 ; jne 4761 <_sk_load_rgb_u16_be_avx+0x105>
+ DB 15,133,243,0,0,0 ; jne 475d <_sk_load_rgb_u16_be_avx+0x105>
DB 196,193,122,111,4,64 ; vmovdqu (%r8,%rax,2),%xmm0
DB 196,193,122,111,84,64,12 ; vmovdqu 0xc(%r8,%rax,2),%xmm2
DB 196,193,122,111,76,64,24 ; vmovdqu 0x18(%r8,%rax,2),%xmm1
@@ -8606,7 +8603,7 @@ _sk_load_rgb_u16_be_avx LABEL PROC
DB 196,226,121,51,192 ; vpmovzxwd %xmm0,%xmm0
DB 196,227,125,24,193,1 ; vinsertf128 $0x1,%xmm1,%ymm0,%ymm0
DB 197,252,91,192 ; vcvtdq2ps %ymm0,%ymm0
- DB 196,98,125,24,29,76,18,0,0 ; vbroadcastss 0x124c(%rip),%ymm11 # 5944 <_sk_callback_avx+0x409>
+ DB 196,98,125,24,29,76,18,0,0 ; vbroadcastss 0x124c(%rip),%ymm11 # 5940 <_sk_callback_avx+0x409>
DB 196,193,124,89,195 ; vmulps %ymm11,%ymm0,%ymm0
DB 197,185,109,202 ; vpunpckhqdq %xmm2,%xmm8,%xmm1
DB 197,233,113,241,8 ; vpsllw $0x8,%xmm1,%xmm2
@@ -8627,48 +8624,48 @@ _sk_load_rgb_u16_be_avx LABEL PROC
DB 197,252,91,210 ; vcvtdq2ps %ymm2,%ymm2
DB 196,193,108,89,211 ; vmulps %ymm11,%ymm2,%ymm2
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,29,233,17,0,0 ; vbroadcastss 0x11e9(%rip),%ymm3 # 5948 <_sk_callback_avx+0x40d>
+ DB 196,226,125,24,29,233,17,0,0 ; vbroadcastss 0x11e9(%rip),%ymm3 # 5944 <_sk_callback_avx+0x40d>
DB 255,224 ; jmpq *%rax
DB 196,193,121,110,4,64 ; vmovd (%r8,%rax,2),%xmm0
DB 196,193,121,196,68,64,4,2 ; vpinsrw $0x2,0x4(%r8,%rax,2),%xmm0,%xmm0
DB 72,131,249,1 ; cmp $0x1,%rcx
- DB 117,5 ; jne 477a <_sk_load_rgb_u16_be_avx+0x11e>
- DB 233,40,255,255,255 ; jmpq 46a2 <_sk_load_rgb_u16_be_avx+0x46>
+ DB 117,5 ; jne 4776 <_sk_load_rgb_u16_be_avx+0x11e>
+ DB 233,40,255,255,255 ; jmpq 469e <_sk_load_rgb_u16_be_avx+0x46>
DB 196,193,121,110,76,64,6 ; vmovd 0x6(%r8,%rax,2),%xmm1
DB 196,65,113,196,68,64,10,2 ; vpinsrw $0x2,0xa(%r8,%rax,2),%xmm1,%xmm8
DB 72,131,249,3 ; cmp $0x3,%rcx
- DB 114,26 ; jb 47a9 <_sk_load_rgb_u16_be_avx+0x14d>
+ DB 114,26 ; jb 47a5 <_sk_load_rgb_u16_be_avx+0x14d>
DB 196,193,121,110,76,64,12 ; vmovd 0xc(%r8,%rax,2),%xmm1
DB 196,193,113,196,84,64,16,2 ; vpinsrw $0x2,0x10(%r8,%rax,2),%xmm1,%xmm2
DB 72,131,249,3 ; cmp $0x3,%rcx
- DB 117,10 ; jne 47ae <_sk_load_rgb_u16_be_avx+0x152>
- DB 233,249,254,255,255 ; jmpq 46a2 <_sk_load_rgb_u16_be_avx+0x46>
- DB 233,244,254,255,255 ; jmpq 46a2 <_sk_load_rgb_u16_be_avx+0x46>
+ DB 117,10 ; jne 47aa <_sk_load_rgb_u16_be_avx+0x152>
+ DB 233,249,254,255,255 ; jmpq 469e <_sk_load_rgb_u16_be_avx+0x46>
+ DB 233,244,254,255,255 ; jmpq 469e <_sk_load_rgb_u16_be_avx+0x46>
DB 196,193,121,110,76,64,18 ; vmovd 0x12(%r8,%rax,2),%xmm1
DB 196,65,113,196,76,64,22,2 ; vpinsrw $0x2,0x16(%r8,%rax,2),%xmm1,%xmm9
DB 72,131,249,5 ; cmp $0x5,%rcx
- DB 114,26 ; jb 47dd <_sk_load_rgb_u16_be_avx+0x181>
+ DB 114,26 ; jb 47d9 <_sk_load_rgb_u16_be_avx+0x181>
DB 196,193,121,110,76,64,24 ; vmovd 0x18(%r8,%rax,2),%xmm1
DB 196,193,113,196,76,64,28,2 ; vpinsrw $0x2,0x1c(%r8,%rax,2),%xmm1,%xmm1
DB 72,131,249,5 ; cmp $0x5,%rcx
- DB 117,10 ; jne 47e2 <_sk_load_rgb_u16_be_avx+0x186>
- DB 233,197,254,255,255 ; jmpq 46a2 <_sk_load_rgb_u16_be_avx+0x46>
- DB 233,192,254,255,255 ; jmpq 46a2 <_sk_load_rgb_u16_be_avx+0x46>
+ DB 117,10 ; jne 47de <_sk_load_rgb_u16_be_avx+0x186>
+ DB 233,197,254,255,255 ; jmpq 469e <_sk_load_rgb_u16_be_avx+0x46>
+ DB 233,192,254,255,255 ; jmpq 469e <_sk_load_rgb_u16_be_avx+0x46>
DB 196,193,121,110,92,64,30 ; vmovd 0x1e(%r8,%rax,2),%xmm3
DB 196,65,97,196,92,64,34,2 ; vpinsrw $0x2,0x22(%r8,%rax,2),%xmm3,%xmm11
DB 72,131,249,7 ; cmp $0x7,%rcx
- DB 114,20 ; jb 480b <_sk_load_rgb_u16_be_avx+0x1af>
+ DB 114,20 ; jb 4807 <_sk_load_rgb_u16_be_avx+0x1af>
DB 196,193,121,110,92,64,36 ; vmovd 0x24(%r8,%rax,2),%xmm3
DB 196,193,97,196,92,64,40,2 ; vpinsrw $0x2,0x28(%r8,%rax,2),%xmm3,%xmm3
- DB 233,151,254,255,255 ; jmpq 46a2 <_sk_load_rgb_u16_be_avx+0x46>
- DB 233,146,254,255,255 ; jmpq 46a2 <_sk_load_rgb_u16_be_avx+0x46>
+ DB 233,151,254,255,255 ; jmpq 469e <_sk_load_rgb_u16_be_avx+0x46>
+ DB 233,146,254,255,255 ; jmpq 469e <_sk_load_rgb_u16_be_avx+0x46>
PUBLIC _sk_store_u16_be_avx
_sk_store_u16_be_avx LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 76,139,0 ; mov (%rax),%r8
DB 72,141,4,189,0,0,0,0 ; lea 0x0(,%rdi,4),%rax
- DB 196,98,125,24,5,38,17,0,0 ; vbroadcastss 0x1126(%rip),%ymm8 # 594c <_sk_callback_avx+0x411>
+ DB 196,98,125,24,5,38,17,0,0 ; vbroadcastss 0x1126(%rip),%ymm8 # 5948 <_sk_callback_avx+0x411>
DB 196,65,124,89,200 ; vmulps %ymm8,%ymm0,%ymm9
DB 196,65,125,91,201 ; vcvtps2dq %ymm9,%ymm9
DB 196,67,125,25,202,1 ; vextractf128 $0x1,%ymm9,%xmm10
@@ -8706,7 +8703,7 @@ _sk_store_u16_be_avx LABEL PROC
DB 196,65,17,98,200 ; vpunpckldq %xmm8,%xmm13,%xmm9
DB 196,65,17,106,192 ; vpunpckhdq %xmm8,%xmm13,%xmm8
DB 72,133,201 ; test %rcx,%rcx
- DB 117,31 ; jne 490a <_sk_store_u16_be_avx+0xfa>
+ DB 117,31 ; jne 4906 <_sk_store_u16_be_avx+0xfa>
DB 196,65,120,17,28,64 ; vmovups %xmm11,(%r8,%rax,2)
DB 196,65,120,17,84,64,16 ; vmovups %xmm10,0x10(%r8,%rax,2)
DB 196,65,120,17,76,64,32 ; vmovups %xmm9,0x20(%r8,%rax,2)
@@ -8715,31 +8712,31 @@ _sk_store_u16_be_avx LABEL PROC
DB 255,224 ; jmpq *%rax
DB 196,65,121,214,28,64 ; vmovq %xmm11,(%r8,%rax,2)
DB 72,131,249,1 ; cmp $0x1,%rcx
- DB 116,240 ; je 4906 <_sk_store_u16_be_avx+0xf6>
+ DB 116,240 ; je 4902 <_sk_store_u16_be_avx+0xf6>
DB 196,65,121,23,92,64,8 ; vmovhpd %xmm11,0x8(%r8,%rax,2)
DB 72,131,249,3 ; cmp $0x3,%rcx
- DB 114,227 ; jb 4906 <_sk_store_u16_be_avx+0xf6>
+ DB 114,227 ; jb 4902 <_sk_store_u16_be_avx+0xf6>
DB 196,65,121,214,84,64,16 ; vmovq %xmm10,0x10(%r8,%rax,2)
- DB 116,218 ; je 4906 <_sk_store_u16_be_avx+0xf6>
+ DB 116,218 ; je 4902 <_sk_store_u16_be_avx+0xf6>
DB 196,65,121,23,84,64,24 ; vmovhpd %xmm10,0x18(%r8,%rax,2)
DB 72,131,249,5 ; cmp $0x5,%rcx
- DB 114,205 ; jb 4906 <_sk_store_u16_be_avx+0xf6>
+ DB 114,205 ; jb 4902 <_sk_store_u16_be_avx+0xf6>
DB 196,65,121,214,76,64,32 ; vmovq %xmm9,0x20(%r8,%rax,2)
- DB 116,196 ; je 4906 <_sk_store_u16_be_avx+0xf6>
+ DB 116,196 ; je 4902 <_sk_store_u16_be_avx+0xf6>
DB 196,65,121,23,76,64,40 ; vmovhpd %xmm9,0x28(%r8,%rax,2)
DB 72,131,249,7 ; cmp $0x7,%rcx
- DB 114,183 ; jb 4906 <_sk_store_u16_be_avx+0xf6>
+ DB 114,183 ; jb 4902 <_sk_store_u16_be_avx+0xf6>
DB 196,65,121,214,68,64,48 ; vmovq %xmm8,0x30(%r8,%rax,2)
- DB 235,174 ; jmp 4906 <_sk_store_u16_be_avx+0xf6>
+ DB 235,174 ; jmp 4902 <_sk_store_u16_be_avx+0xf6>
PUBLIC _sk_load_f32_avx
_sk_load_f32_avx LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 72,131,249,7 ; cmp $0x7,%rcx
- DB 119,110 ; ja 49ce <_sk_load_f32_avx+0x76>
+ DB 119,110 ; ja 49ca <_sk_load_f32_avx+0x76>
DB 76,139,0 ; mov (%rax),%r8
DB 76,141,12,189,0,0,0,0 ; lea 0x0(,%rdi,4),%r9
- DB 76,141,21,134,0,0,0 ; lea 0x86(%rip),%r10 # 49f8 <_sk_load_f32_avx+0xa0>
+ DB 76,141,21,134,0,0,0 ; lea 0x86(%rip),%r10 # 49f4 <_sk_load_f32_avx+0xa0>
DB 73,99,4,138 ; movslq (%r10,%rcx,4),%rax
DB 76,1,208 ; add %r10,%rax
DB 255,224 ; jmpq *%rax
@@ -8796,7 +8793,7 @@ _sk_store_f32_avx LABEL PROC
DB 196,65,37,20,196 ; vunpcklpd %ymm12,%ymm11,%ymm8
DB 196,65,37,21,220 ; vunpckhpd %ymm12,%ymm11,%ymm11
DB 72,133,201 ; test %rcx,%rcx
- DB 117,55 ; jne 4a85 <_sk_store_f32_avx+0x6d>
+ DB 117,55 ; jne 4a81 <_sk_store_f32_avx+0x6d>
DB 196,67,45,24,225,1 ; vinsertf128 $0x1,%xmm9,%ymm10,%ymm12
DB 196,67,61,24,235,1 ; vinsertf128 $0x1,%xmm11,%ymm8,%ymm13
DB 196,67,45,6,201,49 ; vperm2f128 $0x31,%ymm9,%ymm10,%ymm9
@@ -8809,22 +8806,22 @@ _sk_store_f32_avx LABEL PROC
DB 255,224 ; jmpq *%rax
DB 196,65,121,17,20,128 ; vmovupd %xmm10,(%r8,%rax,4)
DB 72,131,249,1 ; cmp $0x1,%rcx
- DB 116,240 ; je 4a81 <_sk_store_f32_avx+0x69>
+ DB 116,240 ; je 4a7d <_sk_store_f32_avx+0x69>
DB 196,65,121,17,76,128,16 ; vmovupd %xmm9,0x10(%r8,%rax,4)
DB 72,131,249,3 ; cmp $0x3,%rcx
- DB 114,227 ; jb 4a81 <_sk_store_f32_avx+0x69>
+ DB 114,227 ; jb 4a7d <_sk_store_f32_avx+0x69>
DB 196,65,121,17,68,128,32 ; vmovupd %xmm8,0x20(%r8,%rax,4)
- DB 116,218 ; je 4a81 <_sk_store_f32_avx+0x69>
+ DB 116,218 ; je 4a7d <_sk_store_f32_avx+0x69>
DB 196,65,121,17,92,128,48 ; vmovupd %xmm11,0x30(%r8,%rax,4)
DB 72,131,249,5 ; cmp $0x5,%rcx
- DB 114,205 ; jb 4a81 <_sk_store_f32_avx+0x69>
+ DB 114,205 ; jb 4a7d <_sk_store_f32_avx+0x69>
DB 196,67,125,25,84,128,64,1 ; vextractf128 $0x1,%ymm10,0x40(%r8,%rax,4)
- DB 116,195 ; je 4a81 <_sk_store_f32_avx+0x69>
+ DB 116,195 ; je 4a7d <_sk_store_f32_avx+0x69>
DB 196,67,125,25,76,128,80,1 ; vextractf128 $0x1,%ymm9,0x50(%r8,%rax,4)
DB 72,131,249,7 ; cmp $0x7,%rcx
- DB 114,181 ; jb 4a81 <_sk_store_f32_avx+0x69>
+ DB 114,181 ; jb 4a7d <_sk_store_f32_avx+0x69>
DB 196,67,125,25,68,128,96,1 ; vextractf128 $0x1,%ymm8,0x60(%r8,%rax,4)
- DB 235,171 ; jmp 4a81 <_sk_store_f32_avx+0x69>
+ DB 235,171 ; jmp 4a7d <_sk_store_f32_avx+0x69>
PUBLIC _sk_clamp_x_avx
_sk_clamp_x_avx LABEL PROC
@@ -8946,12 +8943,12 @@ _sk_mirror_y_avx LABEL PROC
PUBLIC _sk_luminance_to_alpha_avx
_sk_luminance_to_alpha_avx LABEL PROC
- DB 196,226,125,24,29,175,12,0,0 ; vbroadcastss 0xcaf(%rip),%ymm3 # 5950 <_sk_callback_avx+0x415>
+ DB 196,226,125,24,29,175,12,0,0 ; vbroadcastss 0xcaf(%rip),%ymm3 # 594c <_sk_callback_avx+0x415>
DB 197,252,89,195 ; vmulps %ymm3,%ymm0,%ymm0
- DB 196,226,125,24,29,166,12,0,0 ; vbroadcastss 0xca6(%rip),%ymm3 # 5954 <_sk_callback_avx+0x419>
+ DB 196,226,125,24,29,166,12,0,0 ; vbroadcastss 0xca6(%rip),%ymm3 # 5950 <_sk_callback_avx+0x419>
DB 197,244,89,203 ; vmulps %ymm3,%ymm1,%ymm1
DB 197,252,88,193 ; vaddps %ymm1,%ymm0,%ymm0
- DB 196,226,125,24,13,153,12,0,0 ; vbroadcastss 0xc99(%rip),%ymm1 # 5958 <_sk_callback_avx+0x41d>
+ DB 196,226,125,24,13,153,12,0,0 ; vbroadcastss 0xc99(%rip),%ymm1 # 5954 <_sk_callback_avx+0x41d>
DB 197,236,89,201 ; vmulps %ymm1,%ymm2,%ymm1
DB 197,252,88,217 ; vaddps %ymm1,%ymm0,%ymm3
DB 72,173 ; lods %ds:(%rsi),%rax
@@ -9119,7 +9116,7 @@ _sk_linear_gradient_avx LABEL PROC
DB 196,226,125,24,88,28 ; vbroadcastss 0x1c(%rax),%ymm3
DB 76,139,0 ; mov (%rax),%r8
DB 77,133,192 ; test %r8,%r8
- DB 15,132,146,0,0,0 ; je 5015 <_sk_linear_gradient_avx+0xb8>
+ DB 15,132,146,0,0,0 ; je 5011 <_sk_linear_gradient_avx+0xb8>
DB 72,139,64,8 ; mov 0x8(%rax),%rax
DB 72,131,192,32 ; add $0x20,%rax
DB 196,65,28,87,228 ; vxorps %ymm12,%ymm12,%ymm12
@@ -9146,8 +9143,8 @@ _sk_linear_gradient_avx LABEL PROC
DB 196,227,13,74,219,208 ; vblendvps %ymm13,%ymm3,%ymm14,%ymm3
DB 72,131,192,36 ; add $0x24,%rax
DB 73,255,200 ; dec %r8
- DB 117,140 ; jne 4f9f <_sk_linear_gradient_avx+0x42>
- DB 235,20 ; jmp 5029 <_sk_linear_gradient_avx+0xcc>
+ DB 117,140 ; jne 4f9b <_sk_linear_gradient_avx+0x42>
+ DB 235,20 ; jmp 5025 <_sk_linear_gradient_avx+0xcc>
DB 196,65,36,87,219 ; vxorps %ymm11,%ymm11,%ymm11
DB 196,65,44,87,210 ; vxorps %ymm10,%ymm10,%ymm10
DB 196,65,52,87,201 ; vxorps %ymm9,%ymm9,%ymm9
@@ -9198,27 +9195,27 @@ _sk_xy_to_polar_unit_avx LABEL PROC
DB 196,65,52,95,226 ; vmaxps %ymm10,%ymm9,%ymm12
DB 196,65,36,94,220 ; vdivps %ymm12,%ymm11,%ymm11
DB 196,65,36,89,227 ; vmulps %ymm11,%ymm11,%ymm12
- DB 196,98,125,24,45,126,8,0,0 ; vbroadcastss 0x87e(%rip),%ymm13 # 595c <_sk_callback_avx+0x421>
+ DB 196,98,125,24,45,126,8,0,0 ; vbroadcastss 0x87e(%rip),%ymm13 # 5958 <_sk_callback_avx+0x421>
DB 196,65,28,89,237 ; vmulps %ymm13,%ymm12,%ymm13
- DB 196,98,125,24,53,116,8,0,0 ; vbroadcastss 0x874(%rip),%ymm14 # 5960 <_sk_callback_avx+0x425>
+ DB 196,98,125,24,53,116,8,0,0 ; vbroadcastss 0x874(%rip),%ymm14 # 595c <_sk_callback_avx+0x425>
DB 196,65,20,88,238 ; vaddps %ymm14,%ymm13,%ymm13
DB 196,65,28,89,237 ; vmulps %ymm13,%ymm12,%ymm13
- DB 196,98,125,24,53,101,8,0,0 ; vbroadcastss 0x865(%rip),%ymm14 # 5964 <_sk_callback_avx+0x429>
+ DB 196,98,125,24,53,101,8,0,0 ; vbroadcastss 0x865(%rip),%ymm14 # 5960 <_sk_callback_avx+0x429>
DB 196,65,20,88,238 ; vaddps %ymm14,%ymm13,%ymm13
DB 196,65,28,89,229 ; vmulps %ymm13,%ymm12,%ymm12
- DB 196,98,125,24,45,86,8,0,0 ; vbroadcastss 0x856(%rip),%ymm13 # 5968 <_sk_callback_avx+0x42d>
+ DB 196,98,125,24,45,86,8,0,0 ; vbroadcastss 0x856(%rip),%ymm13 # 5964 <_sk_callback_avx+0x42d>
DB 196,65,28,88,229 ; vaddps %ymm13,%ymm12,%ymm12
DB 196,65,36,89,220 ; vmulps %ymm12,%ymm11,%ymm11
DB 196,65,52,194,202,1 ; vcmpltps %ymm10,%ymm9,%ymm9
- DB 196,98,125,24,21,65,8,0,0 ; vbroadcastss 0x841(%rip),%ymm10 # 596c <_sk_callback_avx+0x431>
+ DB 196,98,125,24,21,65,8,0,0 ; vbroadcastss 0x841(%rip),%ymm10 # 5968 <_sk_callback_avx+0x431>
DB 196,65,44,92,211 ; vsubps %ymm11,%ymm10,%ymm10
DB 196,67,37,74,202,144 ; vblendvps %ymm9,%ymm10,%ymm11,%ymm9
DB 196,193,124,194,192,1 ; vcmpltps %ymm8,%ymm0,%ymm0
- DB 196,98,125,24,21,43,8,0,0 ; vbroadcastss 0x82b(%rip),%ymm10 # 5970 <_sk_callback_avx+0x435>
+ DB 196,98,125,24,21,43,8,0,0 ; vbroadcastss 0x82b(%rip),%ymm10 # 596c <_sk_callback_avx+0x435>
DB 196,65,44,92,209 ; vsubps %ymm9,%ymm10,%ymm10
DB 196,195,53,74,194,0 ; vblendvps %ymm0,%ymm10,%ymm9,%ymm0
DB 196,65,116,194,200,1 ; vcmpltps %ymm8,%ymm1,%ymm9
- DB 196,98,125,24,21,21,8,0,0 ; vbroadcastss 0x815(%rip),%ymm10 # 5974 <_sk_callback_avx+0x439>
+ DB 196,98,125,24,21,21,8,0,0 ; vbroadcastss 0x815(%rip),%ymm10 # 5970 <_sk_callback_avx+0x439>
DB 197,44,92,208 ; vsubps %ymm0,%ymm10,%ymm10
DB 196,195,125,74,194,144 ; vblendvps %ymm9,%ymm10,%ymm0,%ymm0
DB 196,65,124,194,200,3 ; vcmpunordps %ymm8,%ymm0,%ymm9
@@ -9229,7 +9226,7 @@ _sk_xy_to_polar_unit_avx LABEL PROC
PUBLIC _sk_save_xy_avx
_sk_save_xy_avx LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,98,125,24,5,244,7,0,0 ; vbroadcastss 0x7f4(%rip),%ymm8 # 5978 <_sk_callback_avx+0x43d>
+ DB 196,98,125,24,5,244,7,0,0 ; vbroadcastss 0x7f4(%rip),%ymm8 # 5974 <_sk_callback_avx+0x43d>
DB 196,65,124,88,200 ; vaddps %ymm8,%ymm0,%ymm9
DB 196,67,125,8,209,1 ; vroundps $0x1,%ymm9,%ymm10
DB 196,65,52,92,202 ; vsubps %ymm10,%ymm9,%ymm9
@@ -9262,9 +9259,9 @@ _sk_accumulate_avx LABEL PROC
PUBLIC _sk_bilinear_nx_avx
_sk_bilinear_nx_avx LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,5,128,7,0,0 ; vbroadcastss 0x780(%rip),%ymm0 # 597c <_sk_callback_avx+0x441>
+ DB 196,226,125,24,5,128,7,0,0 ; vbroadcastss 0x780(%rip),%ymm0 # 5978 <_sk_callback_avx+0x441>
DB 197,252,88,0 ; vaddps (%rax),%ymm0,%ymm0
- DB 196,98,125,24,5,119,7,0,0 ; vbroadcastss 0x777(%rip),%ymm8 # 5980 <_sk_callback_avx+0x445>
+ DB 196,98,125,24,5,119,7,0,0 ; vbroadcastss 0x777(%rip),%ymm8 # 597c <_sk_callback_avx+0x445>
DB 197,60,92,64,64 ; vsubps 0x40(%rax),%ymm8,%ymm8
DB 197,124,17,128,128,0,0,0 ; vmovups %ymm8,0x80(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
@@ -9273,7 +9270,7 @@ _sk_bilinear_nx_avx LABEL PROC
PUBLIC _sk_bilinear_px_avx
_sk_bilinear_px_avx LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,5,95,7,0,0 ; vbroadcastss 0x75f(%rip),%ymm0 # 5984 <_sk_callback_avx+0x449>
+ DB 196,226,125,24,5,95,7,0,0 ; vbroadcastss 0x75f(%rip),%ymm0 # 5980 <_sk_callback_avx+0x449>
DB 197,252,88,0 ; vaddps (%rax),%ymm0,%ymm0
DB 197,124,16,64,64 ; vmovups 0x40(%rax),%ymm8
DB 197,124,17,128,128,0,0,0 ; vmovups %ymm8,0x80(%rax)
@@ -9283,9 +9280,9 @@ _sk_bilinear_px_avx LABEL PROC
PUBLIC _sk_bilinear_ny_avx
_sk_bilinear_ny_avx LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,13,67,7,0,0 ; vbroadcastss 0x743(%rip),%ymm1 # 5988 <_sk_callback_avx+0x44d>
+ DB 196,226,125,24,13,67,7,0,0 ; vbroadcastss 0x743(%rip),%ymm1 # 5984 <_sk_callback_avx+0x44d>
DB 197,244,88,72,32 ; vaddps 0x20(%rax),%ymm1,%ymm1
- DB 196,98,125,24,5,57,7,0,0 ; vbroadcastss 0x739(%rip),%ymm8 # 598c <_sk_callback_avx+0x451>
+ DB 196,98,125,24,5,57,7,0,0 ; vbroadcastss 0x739(%rip),%ymm8 # 5988 <_sk_callback_avx+0x451>
DB 197,60,92,64,96 ; vsubps 0x60(%rax),%ymm8,%ymm8
DB 197,124,17,128,160,0,0,0 ; vmovups %ymm8,0xa0(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
@@ -9294,7 +9291,7 @@ _sk_bilinear_ny_avx LABEL PROC
PUBLIC _sk_bilinear_py_avx
_sk_bilinear_py_avx LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,13,33,7,0,0 ; vbroadcastss 0x721(%rip),%ymm1 # 5990 <_sk_callback_avx+0x455>
+ DB 196,226,125,24,13,33,7,0,0 ; vbroadcastss 0x721(%rip),%ymm1 # 598c <_sk_callback_avx+0x455>
DB 197,244,88,72,32 ; vaddps 0x20(%rax),%ymm1,%ymm1
DB 197,124,16,64,96 ; vmovups 0x60(%rax),%ymm8
DB 197,124,17,128,160,0,0,0 ; vmovups %ymm8,0xa0(%rax)
@@ -9304,14 +9301,14 @@ _sk_bilinear_py_avx LABEL PROC
PUBLIC _sk_bicubic_n3x_avx
_sk_bicubic_n3x_avx LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,5,4,7,0,0 ; vbroadcastss 0x704(%rip),%ymm0 # 5994 <_sk_callback_avx+0x459>
+ DB 196,226,125,24,5,4,7,0,0 ; vbroadcastss 0x704(%rip),%ymm0 # 5990 <_sk_callback_avx+0x459>
DB 197,252,88,0 ; vaddps (%rax),%ymm0,%ymm0
- DB 196,98,125,24,5,251,6,0,0 ; vbroadcastss 0x6fb(%rip),%ymm8 # 5998 <_sk_callback_avx+0x45d>
+ DB 196,98,125,24,5,251,6,0,0 ; vbroadcastss 0x6fb(%rip),%ymm8 # 5994 <_sk_callback_avx+0x45d>
DB 197,60,92,64,64 ; vsubps 0x40(%rax),%ymm8,%ymm8
DB 196,65,60,89,200 ; vmulps %ymm8,%ymm8,%ymm9
- DB 196,98,125,24,21,236,6,0,0 ; vbroadcastss 0x6ec(%rip),%ymm10 # 599c <_sk_callback_avx+0x461>
+ DB 196,98,125,24,21,236,6,0,0 ; vbroadcastss 0x6ec(%rip),%ymm10 # 5998 <_sk_callback_avx+0x461>
DB 196,65,60,89,194 ; vmulps %ymm10,%ymm8,%ymm8
- DB 196,98,125,24,21,226,6,0,0 ; vbroadcastss 0x6e2(%rip),%ymm10 # 59a0 <_sk_callback_avx+0x465>
+ DB 196,98,125,24,21,226,6,0,0 ; vbroadcastss 0x6e2(%rip),%ymm10 # 599c <_sk_callback_avx+0x465>
DB 196,65,60,88,194 ; vaddps %ymm10,%ymm8,%ymm8
DB 196,65,52,89,192 ; vmulps %ymm8,%ymm9,%ymm8
DB 197,124,17,128,128,0,0,0 ; vmovups %ymm8,0x80(%rax)
@@ -9321,19 +9318,19 @@ _sk_bicubic_n3x_avx LABEL PROC
PUBLIC _sk_bicubic_n1x_avx
_sk_bicubic_n1x_avx LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,5,197,6,0,0 ; vbroadcastss 0x6c5(%rip),%ymm0 # 59a4 <_sk_callback_avx+0x469>
+ DB 196,226,125,24,5,197,6,0,0 ; vbroadcastss 0x6c5(%rip),%ymm0 # 59a0 <_sk_callback_avx+0x469>
DB 197,252,88,0 ; vaddps (%rax),%ymm0,%ymm0
- DB 196,98,125,24,5,188,6,0,0 ; vbroadcastss 0x6bc(%rip),%ymm8 # 59a8 <_sk_callback_avx+0x46d>
+ DB 196,98,125,24,5,188,6,0,0 ; vbroadcastss 0x6bc(%rip),%ymm8 # 59a4 <_sk_callback_avx+0x46d>
DB 197,60,92,64,64 ; vsubps 0x40(%rax),%ymm8,%ymm8
- DB 196,98,125,24,13,178,6,0,0 ; vbroadcastss 0x6b2(%rip),%ymm9 # 59ac <_sk_callback_avx+0x471>
+ DB 196,98,125,24,13,178,6,0,0 ; vbroadcastss 0x6b2(%rip),%ymm9 # 59a8 <_sk_callback_avx+0x471>
DB 196,65,60,89,201 ; vmulps %ymm9,%ymm8,%ymm9
- DB 196,98,125,24,21,168,6,0,0 ; vbroadcastss 0x6a8(%rip),%ymm10 # 59b0 <_sk_callback_avx+0x475>
+ DB 196,98,125,24,21,168,6,0,0 ; vbroadcastss 0x6a8(%rip),%ymm10 # 59ac <_sk_callback_avx+0x475>
DB 196,65,52,88,202 ; vaddps %ymm10,%ymm9,%ymm9
DB 196,65,60,89,201 ; vmulps %ymm9,%ymm8,%ymm9
- DB 196,98,125,24,21,153,6,0,0 ; vbroadcastss 0x699(%rip),%ymm10 # 59b4 <_sk_callback_avx+0x479>
+ DB 196,98,125,24,21,153,6,0,0 ; vbroadcastss 0x699(%rip),%ymm10 # 59b0 <_sk_callback_avx+0x479>
DB 196,65,52,88,202 ; vaddps %ymm10,%ymm9,%ymm9
DB 196,65,60,89,193 ; vmulps %ymm9,%ymm8,%ymm8
- DB 196,98,125,24,13,138,6,0,0 ; vbroadcastss 0x68a(%rip),%ymm9 # 59b8 <_sk_callback_avx+0x47d>
+ DB 196,98,125,24,13,138,6,0,0 ; vbroadcastss 0x68a(%rip),%ymm9 # 59b4 <_sk_callback_avx+0x47d>
DB 196,65,60,88,193 ; vaddps %ymm9,%ymm8,%ymm8
DB 197,124,17,128,128,0,0,0 ; vmovups %ymm8,0x80(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
@@ -9342,17 +9339,17 @@ _sk_bicubic_n1x_avx LABEL PROC
PUBLIC _sk_bicubic_p1x_avx
_sk_bicubic_p1x_avx LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,98,125,24,5,114,6,0,0 ; vbroadcastss 0x672(%rip),%ymm8 # 59bc <_sk_callback_avx+0x481>
+ DB 196,98,125,24,5,114,6,0,0 ; vbroadcastss 0x672(%rip),%ymm8 # 59b8 <_sk_callback_avx+0x481>
DB 197,188,88,0 ; vaddps (%rax),%ymm8,%ymm0
DB 197,124,16,72,64 ; vmovups 0x40(%rax),%ymm9
- DB 196,98,125,24,21,100,6,0,0 ; vbroadcastss 0x664(%rip),%ymm10 # 59c0 <_sk_callback_avx+0x485>
+ DB 196,98,125,24,21,100,6,0,0 ; vbroadcastss 0x664(%rip),%ymm10 # 59bc <_sk_callback_avx+0x485>
DB 196,65,52,89,210 ; vmulps %ymm10,%ymm9,%ymm10
- DB 196,98,125,24,29,90,6,0,0 ; vbroadcastss 0x65a(%rip),%ymm11 # 59c4 <_sk_callback_avx+0x489>
+ DB 196,98,125,24,29,90,6,0,0 ; vbroadcastss 0x65a(%rip),%ymm11 # 59c0 <_sk_callback_avx+0x489>
DB 196,65,44,88,211 ; vaddps %ymm11,%ymm10,%ymm10
DB 196,65,52,89,210 ; vmulps %ymm10,%ymm9,%ymm10
DB 196,65,44,88,192 ; vaddps %ymm8,%ymm10,%ymm8
DB 196,65,52,89,192 ; vmulps %ymm8,%ymm9,%ymm8
- DB 196,98,125,24,13,65,6,0,0 ; vbroadcastss 0x641(%rip),%ymm9 # 59c8 <_sk_callback_avx+0x48d>
+ DB 196,98,125,24,13,65,6,0,0 ; vbroadcastss 0x641(%rip),%ymm9 # 59c4 <_sk_callback_avx+0x48d>
DB 196,65,60,88,193 ; vaddps %ymm9,%ymm8,%ymm8
DB 197,124,17,128,128,0,0,0 ; vmovups %ymm8,0x80(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
@@ -9361,13 +9358,13 @@ _sk_bicubic_p1x_avx LABEL PROC
PUBLIC _sk_bicubic_p3x_avx
_sk_bicubic_p3x_avx LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,5,41,6,0,0 ; vbroadcastss 0x629(%rip),%ymm0 # 59cc <_sk_callback_avx+0x491>
+ DB 196,226,125,24,5,41,6,0,0 ; vbroadcastss 0x629(%rip),%ymm0 # 59c8 <_sk_callback_avx+0x491>
DB 197,252,88,0 ; vaddps (%rax),%ymm0,%ymm0
DB 197,124,16,64,64 ; vmovups 0x40(%rax),%ymm8
DB 196,65,60,89,200 ; vmulps %ymm8,%ymm8,%ymm9
- DB 196,98,125,24,21,22,6,0,0 ; vbroadcastss 0x616(%rip),%ymm10 # 59d0 <_sk_callback_avx+0x495>
+ DB 196,98,125,24,21,22,6,0,0 ; vbroadcastss 0x616(%rip),%ymm10 # 59cc <_sk_callback_avx+0x495>
DB 196,65,60,89,194 ; vmulps %ymm10,%ymm8,%ymm8
- DB 196,98,125,24,21,12,6,0,0 ; vbroadcastss 0x60c(%rip),%ymm10 # 59d4 <_sk_callback_avx+0x499>
+ DB 196,98,125,24,21,12,6,0,0 ; vbroadcastss 0x60c(%rip),%ymm10 # 59d0 <_sk_callback_avx+0x499>
DB 196,65,60,88,194 ; vaddps %ymm10,%ymm8,%ymm8
DB 196,65,52,89,192 ; vmulps %ymm8,%ymm9,%ymm8
DB 197,124,17,128,128,0,0,0 ; vmovups %ymm8,0x80(%rax)
@@ -9377,14 +9374,14 @@ _sk_bicubic_p3x_avx LABEL PROC
PUBLIC _sk_bicubic_n3y_avx
_sk_bicubic_n3y_avx LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,13,239,5,0,0 ; vbroadcastss 0x5ef(%rip),%ymm1 # 59d8 <_sk_callback_avx+0x49d>
+ DB 196,226,125,24,13,239,5,0,0 ; vbroadcastss 0x5ef(%rip),%ymm1 # 59d4 <_sk_callback_avx+0x49d>
DB 197,244,88,72,32 ; vaddps 0x20(%rax),%ymm1,%ymm1
- DB 196,98,125,24,5,229,5,0,0 ; vbroadcastss 0x5e5(%rip),%ymm8 # 59dc <_sk_callback_avx+0x4a1>
+ DB 196,98,125,24,5,229,5,0,0 ; vbroadcastss 0x5e5(%rip),%ymm8 # 59d8 <_sk_callback_avx+0x4a1>
DB 197,60,92,64,96 ; vsubps 0x60(%rax),%ymm8,%ymm8
DB 196,65,60,89,200 ; vmulps %ymm8,%ymm8,%ymm9
- DB 196,98,125,24,21,214,5,0,0 ; vbroadcastss 0x5d6(%rip),%ymm10 # 59e0 <_sk_callback_avx+0x4a5>
+ DB 196,98,125,24,21,214,5,0,0 ; vbroadcastss 0x5d6(%rip),%ymm10 # 59dc <_sk_callback_avx+0x4a5>
DB 196,65,60,89,194 ; vmulps %ymm10,%ymm8,%ymm8
- DB 196,98,125,24,21,204,5,0,0 ; vbroadcastss 0x5cc(%rip),%ymm10 # 59e4 <_sk_callback_avx+0x4a9>
+ DB 196,98,125,24,21,204,5,0,0 ; vbroadcastss 0x5cc(%rip),%ymm10 # 59e0 <_sk_callback_avx+0x4a9>
DB 196,65,60,88,194 ; vaddps %ymm10,%ymm8,%ymm8
DB 196,65,52,89,192 ; vmulps %ymm8,%ymm9,%ymm8
DB 197,124,17,128,160,0,0,0 ; vmovups %ymm8,0xa0(%rax)
@@ -9394,19 +9391,19 @@ _sk_bicubic_n3y_avx LABEL PROC
PUBLIC _sk_bicubic_n1y_avx
_sk_bicubic_n1y_avx LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,13,175,5,0,0 ; vbroadcastss 0x5af(%rip),%ymm1 # 59e8 <_sk_callback_avx+0x4ad>
+ DB 196,226,125,24,13,175,5,0,0 ; vbroadcastss 0x5af(%rip),%ymm1 # 59e4 <_sk_callback_avx+0x4ad>
DB 197,244,88,72,32 ; vaddps 0x20(%rax),%ymm1,%ymm1
- DB 196,98,125,24,5,165,5,0,0 ; vbroadcastss 0x5a5(%rip),%ymm8 # 59ec <_sk_callback_avx+0x4b1>
+ DB 196,98,125,24,5,165,5,0,0 ; vbroadcastss 0x5a5(%rip),%ymm8 # 59e8 <_sk_callback_avx+0x4b1>
DB 197,60,92,64,96 ; vsubps 0x60(%rax),%ymm8,%ymm8
- DB 196,98,125,24,13,155,5,0,0 ; vbroadcastss 0x59b(%rip),%ymm9 # 59f0 <_sk_callback_avx+0x4b5>
+ DB 196,98,125,24,13,155,5,0,0 ; vbroadcastss 0x59b(%rip),%ymm9 # 59ec <_sk_callback_avx+0x4b5>
DB 196,65,60,89,201 ; vmulps %ymm9,%ymm8,%ymm9
- DB 196,98,125,24,21,145,5,0,0 ; vbroadcastss 0x591(%rip),%ymm10 # 59f4 <_sk_callback_avx+0x4b9>
+ DB 196,98,125,24,21,145,5,0,0 ; vbroadcastss 0x591(%rip),%ymm10 # 59f0 <_sk_callback_avx+0x4b9>
DB 196,65,52,88,202 ; vaddps %ymm10,%ymm9,%ymm9
DB 196,65,60,89,201 ; vmulps %ymm9,%ymm8,%ymm9
- DB 196,98,125,24,21,130,5,0,0 ; vbroadcastss 0x582(%rip),%ymm10 # 59f8 <_sk_callback_avx+0x4bd>
+ DB 196,98,125,24,21,130,5,0,0 ; vbroadcastss 0x582(%rip),%ymm10 # 59f4 <_sk_callback_avx+0x4bd>
DB 196,65,52,88,202 ; vaddps %ymm10,%ymm9,%ymm9
DB 196,65,60,89,193 ; vmulps %ymm9,%ymm8,%ymm8
- DB 196,98,125,24,13,115,5,0,0 ; vbroadcastss 0x573(%rip),%ymm9 # 59fc <_sk_callback_avx+0x4c1>
+ DB 196,98,125,24,13,115,5,0,0 ; vbroadcastss 0x573(%rip),%ymm9 # 59f8 <_sk_callback_avx+0x4c1>
DB 196,65,60,88,193 ; vaddps %ymm9,%ymm8,%ymm8
DB 197,124,17,128,160,0,0,0 ; vmovups %ymm8,0xa0(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
@@ -9415,17 +9412,17 @@ _sk_bicubic_n1y_avx LABEL PROC
PUBLIC _sk_bicubic_p1y_avx
_sk_bicubic_p1y_avx LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,98,125,24,5,91,5,0,0 ; vbroadcastss 0x55b(%rip),%ymm8 # 5a00 <_sk_callback_avx+0x4c5>
+ DB 196,98,125,24,5,91,5,0,0 ; vbroadcastss 0x55b(%rip),%ymm8 # 59fc <_sk_callback_avx+0x4c5>
DB 197,188,88,72,32 ; vaddps 0x20(%rax),%ymm8,%ymm1
DB 197,124,16,72,96 ; vmovups 0x60(%rax),%ymm9
- DB 196,98,125,24,21,76,5,0,0 ; vbroadcastss 0x54c(%rip),%ymm10 # 5a04 <_sk_callback_avx+0x4c9>
+ DB 196,98,125,24,21,76,5,0,0 ; vbroadcastss 0x54c(%rip),%ymm10 # 5a00 <_sk_callback_avx+0x4c9>
DB 196,65,52,89,210 ; vmulps %ymm10,%ymm9,%ymm10
- DB 196,98,125,24,29,66,5,0,0 ; vbroadcastss 0x542(%rip),%ymm11 # 5a08 <_sk_callback_avx+0x4cd>
+ DB 196,98,125,24,29,66,5,0,0 ; vbroadcastss 0x542(%rip),%ymm11 # 5a04 <_sk_callback_avx+0x4cd>
DB 196,65,44,88,211 ; vaddps %ymm11,%ymm10,%ymm10
DB 196,65,52,89,210 ; vmulps %ymm10,%ymm9,%ymm10
DB 196,65,44,88,192 ; vaddps %ymm8,%ymm10,%ymm8
DB 196,65,52,89,192 ; vmulps %ymm8,%ymm9,%ymm8
- DB 196,98,125,24,13,41,5,0,0 ; vbroadcastss 0x529(%rip),%ymm9 # 5a0c <_sk_callback_avx+0x4d1>
+ DB 196,98,125,24,13,41,5,0,0 ; vbroadcastss 0x529(%rip),%ymm9 # 5a08 <_sk_callback_avx+0x4d1>
DB 196,65,60,88,193 ; vaddps %ymm9,%ymm8,%ymm8
DB 197,124,17,128,160,0,0,0 ; vmovups %ymm8,0xa0(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
@@ -9434,13 +9431,13 @@ _sk_bicubic_p1y_avx LABEL PROC
PUBLIC _sk_bicubic_p3y_avx
_sk_bicubic_p3y_avx LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,13,17,5,0,0 ; vbroadcastss 0x511(%rip),%ymm1 # 5a10 <_sk_callback_avx+0x4d5>
+ DB 196,226,125,24,13,17,5,0,0 ; vbroadcastss 0x511(%rip),%ymm1 # 5a0c <_sk_callback_avx+0x4d5>
DB 197,244,88,72,32 ; vaddps 0x20(%rax),%ymm1,%ymm1
DB 197,124,16,64,96 ; vmovups 0x60(%rax),%ymm8
DB 196,65,60,89,200 ; vmulps %ymm8,%ymm8,%ymm9
- DB 196,98,125,24,21,253,4,0,0 ; vbroadcastss 0x4fd(%rip),%ymm10 # 5a14 <_sk_callback_avx+0x4d9>
+ DB 196,98,125,24,21,253,4,0,0 ; vbroadcastss 0x4fd(%rip),%ymm10 # 5a10 <_sk_callback_avx+0x4d9>
DB 196,65,60,89,194 ; vmulps %ymm10,%ymm8,%ymm8
- DB 196,98,125,24,21,243,4,0,0 ; vbroadcastss 0x4f3(%rip),%ymm10 # 5a18 <_sk_callback_avx+0x4dd>
+ DB 196,98,125,24,21,243,4,0,0 ; vbroadcastss 0x4f3(%rip),%ymm10 # 5a14 <_sk_callback_avx+0x4dd>
DB 196,65,60,88,194 ; vaddps %ymm10,%ymm8,%ymm8
DB 196,65,52,89,192 ; vmulps %ymm8,%ymm9,%ymm8
DB 197,124,17,128,160,0,0,0 ; vmovups %ymm8,0xa0(%rax)
@@ -9523,11 +9520,10 @@ ALIGN 4
DB 0,0 ; add %al,(%rax)
DB 2,0 ; add (%rax),%al
DB 0,0 ; add %al,(%rax)
- DB 33,8 ; and %ecx,(%rax)
- DB 130 ; (bad)
- DB 60,0 ; cmp $0x0,%al
DB 0,0 ; add %al,(%rax)
- DB 191,0,0,128,63 ; mov $0x3f800000,%edi
+ DB 128,60,0,0 ; cmpb $0x0,(%rax,%rax,1)
+ DB 252 ; cld
+ DB 190,0,0,128,63 ; mov $0x3f800000,%esi
DB 0,0 ; add %al,(%rax)
DB 128,63,0 ; cmpb $0x0,(%rdi)
DB 0,128,63,0,0,128 ; add %al,-0x7fffffc1(%rax)
@@ -9599,7 +9595,7 @@ ALIGN 4
DB 190,129,128,128,59 ; mov $0x3b808081,%esi
DB 129,128,128,59,0,248,0,0,8,33 ; addl $0x21080000,-0x7ffc480(%rax)
DB 132,55 ; test %dh,(%rdi)
- DB 224,7 ; loopne 5741 <.literal4+0xed>
+ DB 224,7 ; loopne 573d <.literal4+0xed>
DB 0,0 ; add %al,(%rax)
DB 33,8 ; and %ecx,(%rax)
DB 2,58 ; add (%rdx),%bh
@@ -9613,10 +9609,10 @@ ALIGN 4
DB 129,128,128,59,129,128,128,59,0,0 ; addl $0x3b80,-0x7f7ec480(%rax)
DB 0,52,255 ; add %dh,(%rdi,%rdi,8)
DB 255 ; (bad)
- DB 127,0 ; jg 576c <.literal4+0x118>
+ DB 127,0 ; jg 5768 <.literal4+0x118>
DB 0,0 ; add %al,(%rax)
DB 0,63 ; add %bh,(%rdi)
- DB 119,115 ; ja 57e5 <.literal4+0x191>
+ DB 119,115 ; ja 57e1 <.literal4+0x191>
DB 248 ; clc
DB 194,117,191 ; retq $0xbf75
DB 191,63,249,68,180 ; mov $0xb444f93f,%edi
@@ -9630,10 +9626,10 @@ ALIGN 4
DB 0,128,63,0,0,0 ; add %al,0x3f(%rax)
DB 52,255 ; xor $0xff,%al
DB 255 ; (bad)
- DB 127,0 ; jg 57a0 <.literal4+0x14c>
+ DB 127,0 ; jg 579c <.literal4+0x14c>
DB 0,0 ; add %al,(%rax)
DB 0,63 ; add %bh,(%rdi)
- DB 119,115 ; ja 5819 <.literal4+0x1c5>
+ DB 119,115 ; ja 5815 <.literal4+0x1c5>
DB 248 ; clc
DB 194,117,191 ; retq $0xbf75
DB 191,63,249,68,180 ; mov $0xb444f93f,%edi
@@ -9647,10 +9643,10 @@ ALIGN 4
DB 0,128,63,0,0,0 ; add %al,0x3f(%rax)
DB 52,255 ; xor $0xff,%al
DB 255 ; (bad)
- DB 127,0 ; jg 57d4 <.literal4+0x180>
+ DB 127,0 ; jg 57d0 <.literal4+0x180>
DB 0,0 ; add %al,(%rax)
DB 0,63 ; add %bh,(%rdi)
- DB 119,115 ; ja 584d <.literal4+0x1f9>
+ DB 119,115 ; ja 5849 <.literal4+0x1f9>
DB 248 ; clc
DB 194,117,191 ; retq $0xbf75
DB 191,63,249,68,180 ; mov $0xb444f93f,%edi
@@ -9664,10 +9660,10 @@ ALIGN 4
DB 0,128,63,0,0,0 ; add %al,0x3f(%rax)
DB 52,255 ; xor $0xff,%al
DB 255 ; (bad)
- DB 127,0 ; jg 5808 <.literal4+0x1b4>
+ DB 127,0 ; jg 5804 <.literal4+0x1b4>
DB 0,0 ; add %al,(%rax)
DB 0,63 ; add %bh,(%rdi)
- DB 119,115 ; ja 5881 <.literal4+0x22d>
+ DB 119,115 ; ja 587d <.literal4+0x22d>
DB 248 ; clc
DB 194,117,191 ; retq $0xbf75
DB 191,63,249,68,180 ; mov $0xb444f93f,%edi
@@ -9680,7 +9676,7 @@ ALIGN 4
DB 0,75,0 ; add %cl,0x0(%rbx)
DB 0,128,63,0,0,200 ; add %al,-0x37ffffc1(%rax)
DB 66,0,0 ; rex.X add %al,(%rax)
- DB 127,67 ; jg 587f <.literal4+0x22b>
+ DB 127,67 ; jg 587b <.literal4+0x22b>
DB 0,0 ; add %al,(%rax)
DB 0,195 ; add %al,%bl
DB 0,0 ; add %al,(%rax)
@@ -9692,10 +9688,10 @@ ALIGN 4
DB 190,80,128,3,62 ; mov $0x3e038050,%esi
DB 31 ; (bad)
DB 215 ; xlat %ds:(%rbx)
- DB 118,63 ; jbe 589f <.literal4+0x24b>
+ DB 118,63 ; jbe 589b <.literal4+0x24b>
DB 246,64,83,63 ; testb $0x3f,0x53(%rax)
DB 129,128,128,59,129,128,128,59,0,0 ; addl $0x3b80,-0x7f7ec480(%rax)
- DB 127,67 ; jg 58b3 <.literal4+0x25f>
+ DB 127,67 ; jg 58af <.literal4+0x25f>
DB 129,128,128,59,0,0,128,63,129,128 ; addl $0x80813f80,0x3b80(%rax)
DB 128,59,0 ; cmpb $0x0,(%rbx)
DB 0,128,63,129,128,128 ; add %al,-0x7f7f7ec1(%rax)
@@ -9704,7 +9700,7 @@ ALIGN 4
DB 0,0 ; add %al,(%rax)
DB 8,33 ; or %ah,(%rcx)
DB 132,55 ; test %dh,(%rdi)
- DB 224,7 ; loopne 5895 <.literal4+0x241>
+ DB 224,7 ; loopne 5891 <.literal4+0x241>
DB 0,0 ; add %al,(%rax)
DB 33,8 ; and %ecx,(%rax)
DB 2,58 ; add (%rdx),%bh
@@ -9716,7 +9712,7 @@ ALIGN 4
DB 0,0 ; add %al,(%rax)
DB 8,33 ; or %ah,(%rcx)
DB 132,55 ; test %dh,(%rdi)
- DB 224,7 ; loopne 58b1 <.literal4+0x25d>
+ DB 224,7 ; loopne 58ad <.literal4+0x25d>
DB 0,0 ; add %al,(%rax)
DB 33,8 ; and %ecx,(%rax)
DB 2,58 ; add (%rdx),%bh
@@ -9727,7 +9723,7 @@ ALIGN 4
DB 0,0 ; add %al,(%rax)
DB 248 ; clc
DB 65,0,0 ; add %al,(%r8)
- DB 124,66 ; jl 5906 <.literal4+0x2b2>
+ DB 124,66 ; jl 5902 <.literal4+0x2b2>
DB 0,240 ; add %dh,%al
DB 0,0 ; add %al,(%rax)
DB 137,136,136,55,0,15 ; mov %ecx,0xf003788(%rax)
@@ -9745,9 +9741,9 @@ ALIGN 4
DB 137,136,136,59,15,0 ; mov %ecx,0xf3b88(%rax)
DB 0,0 ; add %al,(%rax)
DB 137,136,136,61,0,0 ; mov %ecx,0x3d88(%rax)
- DB 112,65 ; jo 5949 <.literal4+0x2f5>
+ DB 112,65 ; jo 5945 <.literal4+0x2f5>
DB 129,128,128,59,129,128,128,59,0,0 ; addl $0x3b80,-0x7f7ec480(%rax)
- DB 127,67 ; jg 5957 <.literal4+0x303>
+ DB 127,67 ; jg 5953 <.literal4+0x303>
DB 0,128,0,0,0,0 ; add %al,0x0(%rax)
DB 0,128,0,4,0,128 ; add %al,-0x7ffffc00(%rax)
DB 0,0 ; add %al,(%rax)
@@ -9763,7 +9759,7 @@ ALIGN 4
DB 0,128,55,0,0,128 ; add %al,-0x7fffffc9(%rax)
DB 63 ; (bad)
DB 0,255 ; add %bh,%bh
- DB 127,71 ; jg 5997 <.literal4+0x343>
+ DB 127,71 ; jg 5993 <.literal4+0x343>
DB 208 ; (bad)
DB 179,89 ; mov $0x59,%bl
DB 62,89 ; ds pop %rcx
@@ -10011,7 +10007,7 @@ _sk_seed_shader_sse41 LABEL PROC
DB 102,15,110,199 ; movd %edi,%xmm0
DB 102,15,112,192,0 ; pshufd $0x0,%xmm0,%xmm0
DB 15,91,200 ; cvtdq2ps %xmm0,%xmm1
- DB 15,40,21,49,58,0,0 ; movaps 0x3a31(%rip),%xmm2 # 3b40 <_sk_callback_sse41+0xab>
+ DB 15,40,21,49,58,0,0 ; movaps 0x3a31(%rip),%xmm2 # 3b40 <_sk_callback_sse41+0xaf>
DB 15,88,202 ; addps %xmm2,%xmm1
DB 15,16,2 ; movups (%rdx),%xmm0
DB 15,88,193 ; addps %xmm1,%xmm0
@@ -10020,7 +10016,7 @@ _sk_seed_shader_sse41 LABEL PROC
DB 15,91,201 ; cvtdq2ps %xmm1,%xmm1
DB 15,88,202 ; addps %xmm2,%xmm1
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 15,40,21,32,58,0,0 ; movaps 0x3a20(%rip),%xmm2 # 3b50 <_sk_callback_sse41+0xbb>
+ DB 15,40,21,32,58,0,0 ; movaps 0x3a20(%rip),%xmm2 # 3b50 <_sk_callback_sse41+0xbf>
DB 15,87,219 ; xorps %xmm3,%xmm3
DB 15,87,228 ; xorps %xmm4,%xmm4
DB 15,87,237 ; xorps %xmm5,%xmm5
@@ -10041,14 +10037,14 @@ _sk_dither_sse41 LABEL PROC
DB 102,68,15,110,1 ; movd (%rcx),%xmm8
DB 102,69,15,112,192,0 ; pshufd $0x0,%xmm8,%xmm8
DB 102,69,15,239,193 ; pxor %xmm9,%xmm8
- DB 102,68,15,111,21,229,57,0,0 ; movdqa 0x39e5(%rip),%xmm10 # 3b60 <_sk_callback_sse41+0xcb>
+ DB 102,68,15,111,21,229,57,0,0 ; movdqa 0x39e5(%rip),%xmm10 # 3b60 <_sk_callback_sse41+0xcf>
DB 102,69,15,111,216 ; movdqa %xmm8,%xmm11
DB 102,69,15,219,218 ; pand %xmm10,%xmm11
DB 102,65,15,114,243,5 ; pslld $0x5,%xmm11
DB 102,69,15,219,209 ; pand %xmm9,%xmm10
DB 102,65,15,114,242,4 ; pslld $0x4,%xmm10
- DB 102,68,15,111,37,209,57,0,0 ; movdqa 0x39d1(%rip),%xmm12 # 3b70 <_sk_callback_sse41+0xdb>
- DB 102,68,15,111,45,216,57,0,0 ; movdqa 0x39d8(%rip),%xmm13 # 3b80 <_sk_callback_sse41+0xeb>
+ DB 102,68,15,111,37,209,57,0,0 ; movdqa 0x39d1(%rip),%xmm12 # 3b70 <_sk_callback_sse41+0xdf>
+ DB 102,68,15,111,45,216,57,0,0 ; movdqa 0x39d8(%rip),%xmm13 # 3b80 <_sk_callback_sse41+0xef>
DB 102,69,15,111,240 ; movdqa %xmm8,%xmm14
DB 102,69,15,219,245 ; pand %xmm13,%xmm14
DB 102,65,15,114,246,2 ; pslld $0x2,%xmm14
@@ -10064,12 +10060,11 @@ _sk_dither_sse41 LABEL PROC
DB 102,69,15,235,245 ; por %xmm13,%xmm14
DB 102,69,15,235,240 ; por %xmm8,%xmm14
DB 69,15,91,198 ; cvtdq2ps %xmm14,%xmm8
- DB 68,15,89,5,147,57,0,0 ; mulps 0x3993(%rip),%xmm8 # 3b90 <_sk_callback_sse41+0xfb>
- DB 68,15,88,5,155,57,0,0 ; addps 0x399b(%rip),%xmm8 # 3ba0 <_sk_callback_sse41+0x10b>
+ DB 68,15,89,5,147,57,0,0 ; mulps 0x3993(%rip),%xmm8 # 3b90 <_sk_callback_sse41+0xff>
+ DB 68,15,88,5,155,57,0,0 ; addps 0x399b(%rip),%xmm8 # 3ba0 <_sk_callback_sse41+0x10f>
DB 243,68,15,16,72,8 ; movss 0x8(%rax),%xmm9
DB 69,15,198,201,0 ; shufps $0x0,%xmm9,%xmm9
DB 69,15,89,200 ; mulps %xmm8,%xmm9
- DB 68,15,89,203 ; mulps %xmm3,%xmm9
DB 65,15,88,193 ; addps %xmm9,%xmm0
DB 65,15,88,201 ; addps %xmm9,%xmm1
DB 65,15,88,209 ; addps %xmm9,%xmm2
@@ -10102,7 +10097,7 @@ _sk_clear_sse41 LABEL PROC
PUBLIC _sk_srcatop_sse41
_sk_srcatop_sse41 LABEL PROC
DB 15,89,199 ; mulps %xmm7,%xmm0
- DB 68,15,40,5,68,57,0,0 ; movaps 0x3944(%rip),%xmm8 # 3bb0 <_sk_callback_sse41+0x11b>
+ DB 68,15,40,5,72,57,0,0 ; movaps 0x3948(%rip),%xmm8 # 3bb0 <_sk_callback_sse41+0x11f>
DB 68,15,92,195 ; subps %xmm3,%xmm8
DB 69,15,40,200 ; movaps %xmm8,%xmm9
DB 68,15,89,204 ; mulps %xmm4,%xmm9
@@ -10125,7 +10120,7 @@ PUBLIC _sk_dstatop_sse41
_sk_dstatop_sse41 LABEL PROC
DB 68,15,40,195 ; movaps %xmm3,%xmm8
DB 68,15,89,196 ; mulps %xmm4,%xmm8
- DB 68,15,40,13,7,57,0,0 ; movaps 0x3907(%rip),%xmm9 # 3bc0 <_sk_callback_sse41+0x12b>
+ DB 68,15,40,13,11,57,0,0 ; movaps 0x390b(%rip),%xmm9 # 3bc0 <_sk_callback_sse41+0x12f>
DB 68,15,92,207 ; subps %xmm7,%xmm9
DB 65,15,89,193 ; mulps %xmm9,%xmm0
DB 65,15,88,192 ; addps %xmm8,%xmm0
@@ -10166,7 +10161,7 @@ _sk_dstin_sse41 LABEL PROC
PUBLIC _sk_srcout_sse41
_sk_srcout_sse41 LABEL PROC
- DB 68,15,40,5,171,56,0,0 ; movaps 0x38ab(%rip),%xmm8 # 3bd0 <_sk_callback_sse41+0x13b>
+ DB 68,15,40,5,175,56,0,0 ; movaps 0x38af(%rip),%xmm8 # 3bd0 <_sk_callback_sse41+0x13f>
DB 68,15,92,199 ; subps %xmm7,%xmm8
DB 65,15,89,192 ; mulps %xmm8,%xmm0
DB 65,15,89,200 ; mulps %xmm8,%xmm1
@@ -10177,7 +10172,7 @@ _sk_srcout_sse41 LABEL PROC
PUBLIC _sk_dstout_sse41
_sk_dstout_sse41 LABEL PROC
- DB 68,15,40,5,155,56,0,0 ; movaps 0x389b(%rip),%xmm8 # 3be0 <_sk_callback_sse41+0x14b>
+ DB 68,15,40,5,159,56,0,0 ; movaps 0x389f(%rip),%xmm8 # 3be0 <_sk_callback_sse41+0x14f>
DB 68,15,92,195 ; subps %xmm3,%xmm8
DB 65,15,40,192 ; movaps %xmm8,%xmm0
DB 15,89,196 ; mulps %xmm4,%xmm0
@@ -10192,7 +10187,7 @@ _sk_dstout_sse41 LABEL PROC
PUBLIC _sk_srcover_sse41
_sk_srcover_sse41 LABEL PROC
- DB 68,15,40,5,126,56,0,0 ; movaps 0x387e(%rip),%xmm8 # 3bf0 <_sk_callback_sse41+0x15b>
+ DB 68,15,40,5,130,56,0,0 ; movaps 0x3882(%rip),%xmm8 # 3bf0 <_sk_callback_sse41+0x15f>
DB 68,15,92,195 ; subps %xmm3,%xmm8
DB 69,15,40,200 ; movaps %xmm8,%xmm9
DB 68,15,89,204 ; mulps %xmm4,%xmm9
@@ -10210,7 +10205,7 @@ _sk_srcover_sse41 LABEL PROC
PUBLIC _sk_dstover_sse41
_sk_dstover_sse41 LABEL PROC
- DB 68,15,40,5,82,56,0,0 ; movaps 0x3852(%rip),%xmm8 # 3c00 <_sk_callback_sse41+0x16b>
+ DB 68,15,40,5,86,56,0,0 ; movaps 0x3856(%rip),%xmm8 # 3c00 <_sk_callback_sse41+0x16f>
DB 68,15,92,199 ; subps %xmm7,%xmm8
DB 65,15,89,192 ; mulps %xmm8,%xmm0
DB 15,88,196 ; addps %xmm4,%xmm0
@@ -10234,7 +10229,7 @@ _sk_modulate_sse41 LABEL PROC
PUBLIC _sk_multiply_sse41
_sk_multiply_sse41 LABEL PROC
- DB 68,15,40,5,38,56,0,0 ; movaps 0x3826(%rip),%xmm8 # 3c10 <_sk_callback_sse41+0x17b>
+ DB 68,15,40,5,42,56,0,0 ; movaps 0x382a(%rip),%xmm8 # 3c10 <_sk_callback_sse41+0x17f>
DB 69,15,40,200 ; movaps %xmm8,%xmm9
DB 68,15,92,207 ; subps %xmm7,%xmm9
DB 69,15,40,209 ; movaps %xmm9,%xmm10
@@ -10304,7 +10299,7 @@ _sk_screen_sse41 LABEL PROC
PUBLIC _sk_xor__sse41
_sk_xor__sse41 LABEL PROC
DB 68,15,40,195 ; movaps %xmm3,%xmm8
- DB 15,40,29,87,55,0,0 ; movaps 0x3757(%rip),%xmm3 # 3c20 <_sk_callback_sse41+0x18b>
+ DB 15,40,29,91,55,0,0 ; movaps 0x375b(%rip),%xmm3 # 3c20 <_sk_callback_sse41+0x18f>
DB 68,15,40,203 ; movaps %xmm3,%xmm9
DB 68,15,92,207 ; subps %xmm7,%xmm9
DB 65,15,89,193 ; mulps %xmm9,%xmm0
@@ -10350,7 +10345,7 @@ _sk_darken_sse41 LABEL PROC
DB 68,15,89,206 ; mulps %xmm6,%xmm9
DB 65,15,95,209 ; maxps %xmm9,%xmm2
DB 68,15,92,194 ; subps %xmm2,%xmm8
- DB 15,40,21,194,54,0,0 ; movaps 0x36c2(%rip),%xmm2 # 3c30 <_sk_callback_sse41+0x19b>
+ DB 15,40,21,198,54,0,0 ; movaps 0x36c6(%rip),%xmm2 # 3c30 <_sk_callback_sse41+0x19f>
DB 15,92,211 ; subps %xmm3,%xmm2
DB 15,89,215 ; mulps %xmm7,%xmm2
DB 15,88,218 ; addps %xmm2,%xmm3
@@ -10382,7 +10377,7 @@ _sk_lighten_sse41 LABEL PROC
DB 68,15,89,206 ; mulps %xmm6,%xmm9
DB 65,15,93,209 ; minps %xmm9,%xmm2
DB 68,15,92,194 ; subps %xmm2,%xmm8
- DB 15,40,21,103,54,0,0 ; movaps 0x3667(%rip),%xmm2 # 3c40 <_sk_callback_sse41+0x1ab>
+ DB 15,40,21,107,54,0,0 ; movaps 0x366b(%rip),%xmm2 # 3c40 <_sk_callback_sse41+0x1af>
DB 15,92,211 ; subps %xmm3,%xmm2
DB 15,89,215 ; mulps %xmm7,%xmm2
DB 15,88,218 ; addps %xmm2,%xmm3
@@ -10417,7 +10412,7 @@ _sk_difference_sse41 LABEL PROC
DB 65,15,93,209 ; minps %xmm9,%xmm2
DB 15,88,210 ; addps %xmm2,%xmm2
DB 68,15,92,194 ; subps %xmm2,%xmm8
- DB 15,40,21,1,54,0,0 ; movaps 0x3601(%rip),%xmm2 # 3c50 <_sk_callback_sse41+0x1bb>
+ DB 15,40,21,5,54,0,0 ; movaps 0x3605(%rip),%xmm2 # 3c50 <_sk_callback_sse41+0x1bf>
DB 15,92,211 ; subps %xmm3,%xmm2
DB 15,89,215 ; mulps %xmm7,%xmm2
DB 15,88,218 ; addps %xmm2,%xmm3
@@ -10442,7 +10437,7 @@ _sk_exclusion_sse41 LABEL PROC
DB 15,89,214 ; mulps %xmm6,%xmm2
DB 15,88,210 ; addps %xmm2,%xmm2
DB 68,15,92,202 ; subps %xmm2,%xmm9
- DB 15,40,13,194,53,0,0 ; movaps 0x35c2(%rip),%xmm1 # 3c60 <_sk_callback_sse41+0x1cb>
+ DB 15,40,13,198,53,0,0 ; movaps 0x35c6(%rip),%xmm1 # 3c60 <_sk_callback_sse41+0x1cf>
DB 15,92,203 ; subps %xmm3,%xmm1
DB 15,89,207 ; mulps %xmm7,%xmm1
DB 15,88,217 ; addps %xmm1,%xmm3
@@ -10454,7 +10449,7 @@ _sk_exclusion_sse41 LABEL PROC
PUBLIC _sk_colorburn_sse41
_sk_colorburn_sse41 LABEL PROC
DB 68,15,40,192 ; movaps %xmm0,%xmm8
- DB 68,15,40,21,177,53,0,0 ; movaps 0x35b1(%rip),%xmm10 # 3c70 <_sk_callback_sse41+0x1db>
+ DB 68,15,40,21,181,53,0,0 ; movaps 0x35b5(%rip),%xmm10 # 3c70 <_sk_callback_sse41+0x1df>
DB 69,15,40,218 ; movaps %xmm10,%xmm11
DB 68,15,92,223 ; subps %xmm7,%xmm11
DB 69,15,40,203 ; movaps %xmm11,%xmm9
@@ -10534,7 +10529,7 @@ _sk_colorburn_sse41 LABEL PROC
PUBLIC _sk_colordodge_sse41
_sk_colordodge_sse41 LABEL PROC
DB 68,15,40,192 ; movaps %xmm0,%xmm8
- DB 68,15,40,21,143,52,0,0 ; movaps 0x348f(%rip),%xmm10 # 3c80 <_sk_callback_sse41+0x1eb>
+ DB 68,15,40,21,147,52,0,0 ; movaps 0x3493(%rip),%xmm10 # 3c80 <_sk_callback_sse41+0x1ef>
DB 69,15,40,218 ; movaps %xmm10,%xmm11
DB 68,15,92,223 ; subps %xmm7,%xmm11
DB 69,15,40,227 ; movaps %xmm11,%xmm12
@@ -10615,7 +10610,7 @@ _sk_hardlight_sse41 LABEL PROC
DB 15,40,244 ; movaps %xmm4,%xmm6
DB 15,40,227 ; movaps %xmm3,%xmm4
DB 68,15,40,200 ; movaps %xmm0,%xmm9
- DB 68,15,40,21,101,51,0,0 ; movaps 0x3365(%rip),%xmm10 # 3c90 <_sk_callback_sse41+0x1fb>
+ DB 68,15,40,21,105,51,0,0 ; movaps 0x3369(%rip),%xmm10 # 3c90 <_sk_callback_sse41+0x1ff>
DB 65,15,40,234 ; movaps %xmm10,%xmm5
DB 15,92,239 ; subps %xmm7,%xmm5
DB 15,40,197 ; movaps %xmm5,%xmm0
@@ -10697,7 +10692,7 @@ PUBLIC _sk_overlay_sse41
_sk_overlay_sse41 LABEL PROC
DB 68,15,40,201 ; movaps %xmm1,%xmm9
DB 68,15,40,240 ; movaps %xmm0,%xmm14
- DB 68,15,40,21,71,50,0,0 ; movaps 0x3247(%rip),%xmm10 # 3ca0 <_sk_callback_sse41+0x20b>
+ DB 68,15,40,21,75,50,0,0 ; movaps 0x324b(%rip),%xmm10 # 3ca0 <_sk_callback_sse41+0x20f>
DB 69,15,40,218 ; movaps %xmm10,%xmm11
DB 68,15,92,223 ; subps %xmm7,%xmm11
DB 65,15,40,195 ; movaps %xmm11,%xmm0
@@ -10781,7 +10776,7 @@ _sk_softlight_sse41 LABEL PROC
DB 15,40,198 ; movaps %xmm6,%xmm0
DB 15,94,199 ; divps %xmm7,%xmm0
DB 65,15,84,193 ; andps %xmm9,%xmm0
- DB 15,40,13,26,49,0,0 ; movaps 0x311a(%rip),%xmm1 # 3cb0 <_sk_callback_sse41+0x21b>
+ DB 15,40,13,30,49,0,0 ; movaps 0x311e(%rip),%xmm1 # 3cb0 <_sk_callback_sse41+0x21f>
DB 68,15,40,209 ; movaps %xmm1,%xmm10
DB 68,15,92,208 ; subps %xmm0,%xmm10
DB 68,15,40,240 ; movaps %xmm0,%xmm14
@@ -10794,10 +10789,10 @@ _sk_softlight_sse41 LABEL PROC
DB 15,40,208 ; movaps %xmm0,%xmm2
DB 15,89,210 ; mulps %xmm2,%xmm2
DB 15,88,208 ; addps %xmm0,%xmm2
- DB 68,15,40,45,248,48,0,0 ; movaps 0x30f8(%rip),%xmm13 # 3cc0 <_sk_callback_sse41+0x22b>
+ DB 68,15,40,45,252,48,0,0 ; movaps 0x30fc(%rip),%xmm13 # 3cc0 <_sk_callback_sse41+0x22f>
DB 69,15,88,245 ; addps %xmm13,%xmm14
DB 68,15,89,242 ; mulps %xmm2,%xmm14
- DB 68,15,40,37,248,48,0,0 ; movaps 0x30f8(%rip),%xmm12 # 3cd0 <_sk_callback_sse41+0x23b>
+ DB 68,15,40,37,252,48,0,0 ; movaps 0x30fc(%rip),%xmm12 # 3cd0 <_sk_callback_sse41+0x23f>
DB 69,15,89,252 ; mulps %xmm12,%xmm15
DB 69,15,88,254 ; addps %xmm14,%xmm15
DB 15,40,198 ; movaps %xmm6,%xmm0
@@ -10942,7 +10937,7 @@ _sk_clamp_0_sse41 LABEL PROC
PUBLIC _sk_clamp_1_sse41
_sk_clamp_1_sse41 LABEL PROC
- DB 68,15,40,5,8,47,0,0 ; movaps 0x2f08(%rip),%xmm8 # 3ce0 <_sk_callback_sse41+0x24b>
+ DB 68,15,40,5,12,47,0,0 ; movaps 0x2f0c(%rip),%xmm8 # 3ce0 <_sk_callback_sse41+0x24f>
DB 65,15,93,192 ; minps %xmm8,%xmm0
DB 65,15,93,200 ; minps %xmm8,%xmm1
DB 65,15,93,208 ; minps %xmm8,%xmm2
@@ -10952,7 +10947,7 @@ _sk_clamp_1_sse41 LABEL PROC
PUBLIC _sk_clamp_a_sse41
_sk_clamp_a_sse41 LABEL PROC
- DB 15,93,29,253,46,0,0 ; minps 0x2efd(%rip),%xmm3 # 3cf0 <_sk_callback_sse41+0x25b>
+ DB 15,93,29,1,47,0,0 ; minps 0x2f01(%rip),%xmm3 # 3cf0 <_sk_callback_sse41+0x25f>
DB 15,93,195 ; minps %xmm3,%xmm0
DB 15,93,203 ; minps %xmm3,%xmm1
DB 15,93,211 ; minps %xmm3,%xmm2
@@ -11025,7 +11020,7 @@ _sk_premul_sse41 LABEL PROC
PUBLIC _sk_unpremul_sse41
_sk_unpremul_sse41 LABEL PROC
DB 69,15,87,192 ; xorps %xmm8,%xmm8
- DB 68,15,40,13,104,46,0,0 ; movaps 0x2e68(%rip),%xmm9 # 3d00 <_sk_callback_sse41+0x26b>
+ DB 68,15,40,13,108,46,0,0 ; movaps 0x2e6c(%rip),%xmm9 # 3d00 <_sk_callback_sse41+0x26f>
DB 68,15,94,203 ; divps %xmm3,%xmm9
DB 68,15,194,195,4 ; cmpneqps %xmm3,%xmm8
DB 69,15,84,193 ; andps %xmm9,%xmm8
@@ -11037,20 +11032,20 @@ _sk_unpremul_sse41 LABEL PROC
PUBLIC _sk_from_srgb_sse41
_sk_from_srgb_sse41 LABEL PROC
- DB 68,15,40,29,83,46,0,0 ; movaps 0x2e53(%rip),%xmm11 # 3d10 <_sk_callback_sse41+0x27b>
+ DB 68,15,40,29,87,46,0,0 ; movaps 0x2e57(%rip),%xmm11 # 3d10 <_sk_callback_sse41+0x27f>
DB 68,15,40,200 ; movaps %xmm0,%xmm9
DB 69,15,89,203 ; mulps %xmm11,%xmm9
DB 68,15,40,208 ; movaps %xmm0,%xmm10
DB 69,15,89,210 ; mulps %xmm10,%xmm10
- DB 68,15,40,37,75,46,0,0 ; movaps 0x2e4b(%rip),%xmm12 # 3d20 <_sk_callback_sse41+0x28b>
+ DB 68,15,40,37,79,46,0,0 ; movaps 0x2e4f(%rip),%xmm12 # 3d20 <_sk_callback_sse41+0x28f>
DB 68,15,40,192 ; movaps %xmm0,%xmm8
DB 69,15,89,196 ; mulps %xmm12,%xmm8
- DB 68,15,40,45,75,46,0,0 ; movaps 0x2e4b(%rip),%xmm13 # 3d30 <_sk_callback_sse41+0x29b>
+ DB 68,15,40,45,79,46,0,0 ; movaps 0x2e4f(%rip),%xmm13 # 3d30 <_sk_callback_sse41+0x29f>
DB 69,15,88,197 ; addps %xmm13,%xmm8
DB 69,15,89,194 ; mulps %xmm10,%xmm8
- DB 68,15,40,53,75,46,0,0 ; movaps 0x2e4b(%rip),%xmm14 # 3d40 <_sk_callback_sse41+0x2ab>
+ DB 68,15,40,53,79,46,0,0 ; movaps 0x2e4f(%rip),%xmm14 # 3d40 <_sk_callback_sse41+0x2af>
DB 69,15,88,198 ; addps %xmm14,%xmm8
- DB 68,15,40,61,79,46,0,0 ; movaps 0x2e4f(%rip),%xmm15 # 3d50 <_sk_callback_sse41+0x2bb>
+ DB 68,15,40,61,83,46,0,0 ; movaps 0x2e53(%rip),%xmm15 # 3d50 <_sk_callback_sse41+0x2bf>
DB 65,15,194,199,1 ; cmpltps %xmm15,%xmm0
DB 102,69,15,56,20,193 ; blendvps %xmm0,%xmm9,%xmm8
DB 68,15,40,209 ; movaps %xmm1,%xmm10
@@ -11094,20 +11089,20 @@ _sk_to_srgb_sse41 LABEL PROC
DB 68,15,82,192 ; rsqrtps %xmm0,%xmm8
DB 69,15,83,200 ; rcpps %xmm8,%xmm9
DB 69,15,82,208 ; rsqrtps %xmm8,%xmm10
- DB 68,15,40,29,188,45,0,0 ; movaps 0x2dbc(%rip),%xmm11 # 3d60 <_sk_callback_sse41+0x2cb>
+ DB 68,15,40,29,192,45,0,0 ; movaps 0x2dc0(%rip),%xmm11 # 3d60 <_sk_callback_sse41+0x2cf>
DB 15,40,200 ; movaps %xmm0,%xmm1
DB 65,15,89,203 ; mulps %xmm11,%xmm1
- DB 68,15,40,37,189,45,0,0 ; movaps 0x2dbd(%rip),%xmm12 # 3d70 <_sk_callback_sse41+0x2db>
+ DB 68,15,40,37,193,45,0,0 ; movaps 0x2dc1(%rip),%xmm12 # 3d70 <_sk_callback_sse41+0x2df>
DB 69,15,89,204 ; mulps %xmm12,%xmm9
- DB 68,15,40,45,193,45,0,0 ; movaps 0x2dc1(%rip),%xmm13 # 3d80 <_sk_callback_sse41+0x2eb>
+ DB 68,15,40,45,197,45,0,0 ; movaps 0x2dc5(%rip),%xmm13 # 3d80 <_sk_callback_sse41+0x2ef>
DB 69,15,88,205 ; addps %xmm13,%xmm9
- DB 68,15,40,53,197,45,0,0 ; movaps 0x2dc5(%rip),%xmm14 # 3d90 <_sk_callback_sse41+0x2fb>
+ DB 68,15,40,53,201,45,0,0 ; movaps 0x2dc9(%rip),%xmm14 # 3d90 <_sk_callback_sse41+0x2ff>
DB 69,15,89,214 ; mulps %xmm14,%xmm10
DB 69,15,88,209 ; addps %xmm9,%xmm10
- DB 68,15,40,5,197,45,0,0 ; movaps 0x2dc5(%rip),%xmm8 # 3da0 <_sk_callback_sse41+0x30b>
+ DB 68,15,40,5,201,45,0,0 ; movaps 0x2dc9(%rip),%xmm8 # 3da0 <_sk_callback_sse41+0x30f>
DB 69,15,40,200 ; movaps %xmm8,%xmm9
DB 69,15,93,202 ; minps %xmm10,%xmm9
- DB 68,15,40,61,197,45,0,0 ; movaps 0x2dc5(%rip),%xmm15 # 3db0 <_sk_callback_sse41+0x31b>
+ DB 68,15,40,61,201,45,0,0 ; movaps 0x2dc9(%rip),%xmm15 # 3db0 <_sk_callback_sse41+0x31f>
DB 65,15,194,199,1 ; cmpltps %xmm15,%xmm0
DB 102,68,15,56,20,201 ; blendvps %xmm0,%xmm1,%xmm9
DB 15,82,194 ; rsqrtps %xmm2,%xmm0
@@ -11160,7 +11155,7 @@ _sk_rgb_to_hsl_sse41 LABEL PROC
DB 68,15,93,226 ; minps %xmm2,%xmm12
DB 65,15,40,203 ; movaps %xmm11,%xmm1
DB 65,15,92,204 ; subps %xmm12,%xmm1
- DB 68,15,40,53,19,45,0,0 ; movaps 0x2d13(%rip),%xmm14 # 3dc0 <_sk_callback_sse41+0x32b>
+ DB 68,15,40,53,23,45,0,0 ; movaps 0x2d17(%rip),%xmm14 # 3dc0 <_sk_callback_sse41+0x32f>
DB 68,15,94,241 ; divps %xmm1,%xmm14
DB 69,15,40,211 ; movaps %xmm11,%xmm10
DB 69,15,194,208,0 ; cmpeqps %xmm8,%xmm10
@@ -11169,27 +11164,27 @@ _sk_rgb_to_hsl_sse41 LABEL PROC
DB 65,15,89,198 ; mulps %xmm14,%xmm0
DB 69,15,40,249 ; movaps %xmm9,%xmm15
DB 68,15,194,250,1 ; cmpltps %xmm2,%xmm15
- DB 68,15,84,61,250,44,0,0 ; andps 0x2cfa(%rip),%xmm15 # 3dd0 <_sk_callback_sse41+0x33b>
+ DB 68,15,84,61,254,44,0,0 ; andps 0x2cfe(%rip),%xmm15 # 3dd0 <_sk_callback_sse41+0x33f>
DB 68,15,88,248 ; addps %xmm0,%xmm15
DB 65,15,40,195 ; movaps %xmm11,%xmm0
DB 65,15,194,193,0 ; cmpeqps %xmm9,%xmm0
DB 65,15,92,208 ; subps %xmm8,%xmm2
DB 65,15,89,214 ; mulps %xmm14,%xmm2
- DB 68,15,40,45,237,44,0,0 ; movaps 0x2ced(%rip),%xmm13 # 3de0 <_sk_callback_sse41+0x34b>
+ DB 68,15,40,45,241,44,0,0 ; movaps 0x2cf1(%rip),%xmm13 # 3de0 <_sk_callback_sse41+0x34f>
DB 65,15,88,213 ; addps %xmm13,%xmm2
DB 69,15,92,193 ; subps %xmm9,%xmm8
DB 69,15,89,198 ; mulps %xmm14,%xmm8
- DB 68,15,88,5,233,44,0,0 ; addps 0x2ce9(%rip),%xmm8 # 3df0 <_sk_callback_sse41+0x35b>
+ DB 68,15,88,5,237,44,0,0 ; addps 0x2ced(%rip),%xmm8 # 3df0 <_sk_callback_sse41+0x35f>
DB 102,68,15,56,20,194 ; blendvps %xmm0,%xmm2,%xmm8
DB 65,15,40,194 ; movaps %xmm10,%xmm0
DB 102,69,15,56,20,199 ; blendvps %xmm0,%xmm15,%xmm8
- DB 68,15,89,5,225,44,0,0 ; mulps 0x2ce1(%rip),%xmm8 # 3e00 <_sk_callback_sse41+0x36b>
+ DB 68,15,89,5,229,44,0,0 ; mulps 0x2ce5(%rip),%xmm8 # 3e00 <_sk_callback_sse41+0x36f>
DB 69,15,40,203 ; movaps %xmm11,%xmm9
DB 69,15,194,204,4 ; cmpneqps %xmm12,%xmm9
DB 69,15,84,193 ; andps %xmm9,%xmm8
DB 69,15,92,235 ; subps %xmm11,%xmm13
DB 69,15,88,220 ; addps %xmm12,%xmm11
- DB 15,40,5,213,44,0,0 ; movaps 0x2cd5(%rip),%xmm0 # 3e10 <_sk_callback_sse41+0x37b>
+ DB 15,40,5,217,44,0,0 ; movaps 0x2cd9(%rip),%xmm0 # 3e10 <_sk_callback_sse41+0x37f>
DB 65,15,40,211 ; movaps %xmm11,%xmm2
DB 15,89,208 ; mulps %xmm0,%xmm2
DB 15,194,194,1 ; cmpltps %xmm2,%xmm0
@@ -11210,7 +11205,7 @@ _sk_hsl_to_rgb_sse41 LABEL PROC
DB 15,41,100,36,32 ; movaps %xmm4,0x20(%rsp)
DB 15,41,92,36,16 ; movaps %xmm3,0x10(%rsp)
DB 68,15,40,208 ; movaps %xmm0,%xmm10
- DB 68,15,40,13,151,44,0,0 ; movaps 0x2c97(%rip),%xmm9 # 3e20 <_sk_callback_sse41+0x38b>
+ DB 68,15,40,13,155,44,0,0 ; movaps 0x2c9b(%rip),%xmm9 # 3e20 <_sk_callback_sse41+0x38f>
DB 65,15,40,193 ; movaps %xmm9,%xmm0
DB 15,194,194,2 ; cmpleps %xmm2,%xmm0
DB 15,40,217 ; movaps %xmm1,%xmm3
@@ -11223,19 +11218,19 @@ _sk_hsl_to_rgb_sse41 LABEL PROC
DB 15,41,20,36 ; movaps %xmm2,(%rsp)
DB 69,15,88,192 ; addps %xmm8,%xmm8
DB 68,15,92,197 ; subps %xmm5,%xmm8
- DB 68,15,40,53,115,44,0,0 ; movaps 0x2c73(%rip),%xmm14 # 3e30 <_sk_callback_sse41+0x39b>
+ DB 68,15,40,53,119,44,0,0 ; movaps 0x2c77(%rip),%xmm14 # 3e30 <_sk_callback_sse41+0x39f>
DB 69,15,88,242 ; addps %xmm10,%xmm14
DB 102,65,15,58,8,198,1 ; roundps $0x1,%xmm14,%xmm0
DB 68,15,92,240 ; subps %xmm0,%xmm14
- DB 68,15,40,29,108,44,0,0 ; movaps 0x2c6c(%rip),%xmm11 # 3e40 <_sk_callback_sse41+0x3ab>
+ DB 68,15,40,29,112,44,0,0 ; movaps 0x2c70(%rip),%xmm11 # 3e40 <_sk_callback_sse41+0x3af>
DB 65,15,40,195 ; movaps %xmm11,%xmm0
DB 65,15,194,198,2 ; cmpleps %xmm14,%xmm0
DB 15,40,245 ; movaps %xmm5,%xmm6
DB 65,15,92,240 ; subps %xmm8,%xmm6
- DB 15,40,61,101,44,0,0 ; movaps 0x2c65(%rip),%xmm7 # 3e50 <_sk_callback_sse41+0x3bb>
+ DB 15,40,61,105,44,0,0 ; movaps 0x2c69(%rip),%xmm7 # 3e50 <_sk_callback_sse41+0x3bf>
DB 69,15,40,238 ; movaps %xmm14,%xmm13
DB 68,15,89,239 ; mulps %xmm7,%xmm13
- DB 15,40,29,102,44,0,0 ; movaps 0x2c66(%rip),%xmm3 # 3e60 <_sk_callback_sse41+0x3cb>
+ DB 15,40,29,106,44,0,0 ; movaps 0x2c6a(%rip),%xmm3 # 3e60 <_sk_callback_sse41+0x3cf>
DB 68,15,40,227 ; movaps %xmm3,%xmm12
DB 69,15,92,229 ; subps %xmm13,%xmm12
DB 68,15,89,230 ; mulps %xmm6,%xmm12
@@ -11245,7 +11240,7 @@ _sk_hsl_to_rgb_sse41 LABEL PROC
DB 65,15,194,198,2 ; cmpleps %xmm14,%xmm0
DB 68,15,40,253 ; movaps %xmm5,%xmm15
DB 102,69,15,56,20,252 ; blendvps %xmm0,%xmm12,%xmm15
- DB 68,15,40,37,69,44,0,0 ; movaps 0x2c45(%rip),%xmm12 # 3e70 <_sk_callback_sse41+0x3db>
+ DB 68,15,40,37,73,44,0,0 ; movaps 0x2c49(%rip),%xmm12 # 3e70 <_sk_callback_sse41+0x3df>
DB 65,15,40,196 ; movaps %xmm12,%xmm0
DB 65,15,194,198,2 ; cmpleps %xmm14,%xmm0
DB 68,15,89,238 ; mulps %xmm6,%xmm13
@@ -11279,7 +11274,7 @@ _sk_hsl_to_rgb_sse41 LABEL PROC
DB 65,15,40,198 ; movaps %xmm14,%xmm0
DB 15,40,20,36 ; movaps (%rsp),%xmm2
DB 102,15,56,20,202 ; blendvps %xmm0,%xmm2,%xmm1
- DB 68,15,88,21,190,43,0,0 ; addps 0x2bbe(%rip),%xmm10 # 3e80 <_sk_callback_sse41+0x3eb>
+ DB 68,15,88,21,194,43,0,0 ; addps 0x2bc2(%rip),%xmm10 # 3e80 <_sk_callback_sse41+0x3ef>
DB 102,65,15,58,8,194,1 ; roundps $0x1,%xmm10,%xmm0
DB 68,15,92,208 ; subps %xmm0,%xmm10
DB 69,15,194,218,2 ; cmpleps %xmm10,%xmm11
@@ -11328,7 +11323,7 @@ _sk_scale_u8_sse41 LABEL PROC
DB 72,139,0 ; mov (%rax),%rax
DB 102,68,15,56,49,4,56 ; pmovzxbd (%rax,%rdi,1),%xmm8
DB 69,15,91,192 ; cvtdq2ps %xmm8,%xmm8
- DB 68,15,89,5,23,43,0,0 ; mulps 0x2b17(%rip),%xmm8 # 3e90 <_sk_callback_sse41+0x3fb>
+ DB 68,15,89,5,27,43,0,0 ; mulps 0x2b1b(%rip),%xmm8 # 3e90 <_sk_callback_sse41+0x3ff>
DB 65,15,89,192 ; mulps %xmm8,%xmm0
DB 65,15,89,200 ; mulps %xmm8,%xmm1
DB 65,15,89,208 ; mulps %xmm8,%xmm2
@@ -11362,7 +11357,7 @@ _sk_lerp_u8_sse41 LABEL PROC
DB 72,139,0 ; mov (%rax),%rax
DB 102,68,15,56,49,4,56 ; pmovzxbd (%rax,%rdi,1),%xmm8
DB 69,15,91,192 ; cvtdq2ps %xmm8,%xmm8
- DB 68,15,89,5,195,42,0,0 ; mulps 0x2ac3(%rip),%xmm8 # 3ea0 <_sk_callback_sse41+0x40b>
+ DB 68,15,89,5,199,42,0,0 ; mulps 0x2ac7(%rip),%xmm8 # 3ea0 <_sk_callback_sse41+0x40f>
DB 15,92,196 ; subps %xmm4,%xmm0
DB 65,15,89,192 ; mulps %xmm8,%xmm0
DB 15,88,196 ; addps %xmm4,%xmm0
@@ -11383,17 +11378,17 @@ _sk_lerp_565_sse41 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 72,139,0 ; mov (%rax),%rax
DB 102,68,15,56,51,4,120 ; pmovzxwd (%rax,%rdi,2),%xmm8
- DB 102,15,111,29,147,42,0,0 ; movdqa 0x2a93(%rip),%xmm3 # 3eb0 <_sk_callback_sse41+0x41b>
+ DB 102,15,111,29,151,42,0,0 ; movdqa 0x2a97(%rip),%xmm3 # 3eb0 <_sk_callback_sse41+0x41f>
DB 102,65,15,219,216 ; pand %xmm8,%xmm3
DB 68,15,91,203 ; cvtdq2ps %xmm3,%xmm9
- DB 68,15,89,13,146,42,0,0 ; mulps 0x2a92(%rip),%xmm9 # 3ec0 <_sk_callback_sse41+0x42b>
- DB 102,15,111,29,154,42,0,0 ; movdqa 0x2a9a(%rip),%xmm3 # 3ed0 <_sk_callback_sse41+0x43b>
+ DB 68,15,89,13,150,42,0,0 ; mulps 0x2a96(%rip),%xmm9 # 3ec0 <_sk_callback_sse41+0x42f>
+ DB 102,15,111,29,158,42,0,0 ; movdqa 0x2a9e(%rip),%xmm3 # 3ed0 <_sk_callback_sse41+0x43f>
DB 102,65,15,219,216 ; pand %xmm8,%xmm3
DB 15,91,219 ; cvtdq2ps %xmm3,%xmm3
- DB 15,89,29,155,42,0,0 ; mulps 0x2a9b(%rip),%xmm3 # 3ee0 <_sk_callback_sse41+0x44b>
- DB 102,68,15,219,5,162,42,0,0 ; pand 0x2aa2(%rip),%xmm8 # 3ef0 <_sk_callback_sse41+0x45b>
+ DB 15,89,29,159,42,0,0 ; mulps 0x2a9f(%rip),%xmm3 # 3ee0 <_sk_callback_sse41+0x44f>
+ DB 102,68,15,219,5,166,42,0,0 ; pand 0x2aa6(%rip),%xmm8 # 3ef0 <_sk_callback_sse41+0x45f>
DB 69,15,91,192 ; cvtdq2ps %xmm8,%xmm8
- DB 68,15,89,5,166,42,0,0 ; mulps 0x2aa6(%rip),%xmm8 # 3f00 <_sk_callback_sse41+0x46b>
+ DB 68,15,89,5,170,42,0,0 ; mulps 0x2aaa(%rip),%xmm8 # 3f00 <_sk_callback_sse41+0x46f>
DB 15,92,196 ; subps %xmm4,%xmm0
DB 65,15,89,193 ; mulps %xmm9,%xmm0
DB 15,88,196 ; addps %xmm4,%xmm0
@@ -11404,7 +11399,7 @@ _sk_lerp_565_sse41 LABEL PROC
DB 65,15,89,208 ; mulps %xmm8,%xmm2
DB 15,88,214 ; addps %xmm6,%xmm2
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 15,40,29,144,42,0,0 ; movaps 0x2a90(%rip),%xmm3 # 3f10 <_sk_callback_sse41+0x47b>
+ DB 15,40,29,148,42,0,0 ; movaps 0x2a94(%rip),%xmm3 # 3f10 <_sk_callback_sse41+0x47f>
DB 255,224 ; jmpq *%rax
PUBLIC _sk_load_tables_sse41
@@ -11413,7 +11408,7 @@ _sk_load_tables_sse41 LABEL PROC
DB 76,139,0 ; mov (%rax),%r8
DB 76,139,72,8 ; mov 0x8(%rax),%r9
DB 243,69,15,111,4,184 ; movdqu (%r8,%rdi,4),%xmm8
- DB 102,15,111,5,135,42,0,0 ; movdqa 0x2a87(%rip),%xmm0 # 3f20 <_sk_callback_sse41+0x48b>
+ DB 102,15,111,5,139,42,0,0 ; movdqa 0x2a8b(%rip),%xmm0 # 3f20 <_sk_callback_sse41+0x48f>
DB 102,65,15,219,192 ; pand %xmm8,%xmm0
DB 102,73,15,58,22,192,1 ; pextrq $0x1,%xmm0,%r8
DB 102,72,15,126,193 ; movq %xmm0,%rcx
@@ -11428,7 +11423,7 @@ _sk_load_tables_sse41 LABEL PROC
DB 102,15,58,33,193,48 ; insertps $0x30,%xmm1,%xmm0
DB 76,139,64,16 ; mov 0x10(%rax),%r8
DB 102,65,15,111,200 ; movdqa %xmm8,%xmm1
- DB 102,15,56,0,13,66,42,0,0 ; pshufb 0x2a42(%rip),%xmm1 # 3f30 <_sk_callback_sse41+0x49b>
+ DB 102,15,56,0,13,70,42,0,0 ; pshufb 0x2a46(%rip),%xmm1 # 3f30 <_sk_callback_sse41+0x49f>
DB 102,73,15,58,22,201,1 ; pextrq $0x1,%xmm1,%r9
DB 102,72,15,126,201 ; movq %xmm1,%rcx
DB 68,15,182,209 ; movzbl %cl,%r10d
@@ -11443,7 +11438,7 @@ _sk_load_tables_sse41 LABEL PROC
DB 102,15,58,33,202,48 ; insertps $0x30,%xmm2,%xmm1
DB 76,139,64,24 ; mov 0x18(%rax),%r8
DB 102,65,15,111,208 ; movdqa %xmm8,%xmm2
- DB 102,15,56,0,21,254,41,0,0 ; pshufb 0x29fe(%rip),%xmm2 # 3f40 <_sk_callback_sse41+0x4ab>
+ DB 102,15,56,0,21,2,42,0,0 ; pshufb 0x2a02(%rip),%xmm2 # 3f40 <_sk_callback_sse41+0x4af>
DB 102,72,15,58,22,209,1 ; pextrq $0x1,%xmm2,%rcx
DB 102,72,15,126,208 ; movq %xmm2,%rax
DB 68,15,182,200 ; movzbl %al,%r9d
@@ -11458,7 +11453,7 @@ _sk_load_tables_sse41 LABEL PROC
DB 102,15,58,33,211,48 ; insertps $0x30,%xmm3,%xmm2
DB 102,65,15,114,208,24 ; psrld $0x18,%xmm8
DB 65,15,91,216 ; cvtdq2ps %xmm8,%xmm3
- DB 15,89,29,187,41,0,0 ; mulps 0x29bb(%rip),%xmm3 # 3f50 <_sk_callback_sse41+0x4bb>
+ DB 15,89,29,191,41,0,0 ; mulps 0x29bf(%rip),%xmm3 # 3f50 <_sk_callback_sse41+0x4bf>
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
@@ -11475,7 +11470,7 @@ _sk_load_tables_u16_be_sse41 LABEL PROC
DB 102,65,15,111,201 ; movdqa %xmm9,%xmm1
DB 102,15,97,200 ; punpcklwd %xmm0,%xmm1
DB 102,68,15,105,200 ; punpckhwd %xmm0,%xmm9
- DB 102,68,15,111,5,142,41,0,0 ; movdqa 0x298e(%rip),%xmm8 # 3f60 <_sk_callback_sse41+0x4cb>
+ DB 102,68,15,111,5,146,41,0,0 ; movdqa 0x2992(%rip),%xmm8 # 3f60 <_sk_callback_sse41+0x4cf>
DB 102,15,111,193 ; movdqa %xmm1,%xmm0
DB 102,65,15,219,192 ; pand %xmm8,%xmm0
DB 102,15,56,51,192 ; pmovzxwd %xmm0,%xmm0
@@ -11492,7 +11487,7 @@ _sk_load_tables_u16_be_sse41 LABEL PROC
DB 243,67,15,16,20,8 ; movss (%r8,%r9,1),%xmm2
DB 102,15,58,33,194,48 ; insertps $0x30,%xmm2,%xmm0
DB 76,139,64,16 ; mov 0x10(%rax),%r8
- DB 102,15,56,0,13,65,41,0,0 ; pshufb 0x2941(%rip),%xmm1 # 3f70 <_sk_callback_sse41+0x4db>
+ DB 102,15,56,0,13,69,41,0,0 ; pshufb 0x2945(%rip),%xmm1 # 3f70 <_sk_callback_sse41+0x4df>
DB 102,15,56,51,201 ; pmovzxwd %xmm1,%xmm1
DB 102,73,15,58,22,201,1 ; pextrq $0x1,%xmm1,%r9
DB 102,72,15,126,201 ; movq %xmm1,%rcx
@@ -11528,7 +11523,7 @@ _sk_load_tables_u16_be_sse41 LABEL PROC
DB 102,65,15,235,216 ; por %xmm8,%xmm3
DB 102,15,56,51,219 ; pmovzxwd %xmm3,%xmm3
DB 15,91,219 ; cvtdq2ps %xmm3,%xmm3
- DB 15,89,29,143,40,0,0 ; mulps 0x288f(%rip),%xmm3 # 3f80 <_sk_callback_sse41+0x4eb>
+ DB 15,89,29,147,40,0,0 ; mulps 0x2893(%rip),%xmm3 # 3f80 <_sk_callback_sse41+0x4ef>
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
@@ -11548,7 +11543,7 @@ _sk_load_tables_rgb_u16_be_sse41 LABEL PROC
DB 102,68,15,97,200 ; punpcklwd %xmm0,%xmm9
DB 102,15,111,202 ; movdqa %xmm2,%xmm1
DB 102,65,15,97,201 ; punpcklwd %xmm9,%xmm1
- DB 102,68,15,111,5,81,40,0,0 ; movdqa 0x2851(%rip),%xmm8 # 3f90 <_sk_callback_sse41+0x4fb>
+ DB 102,68,15,111,5,85,40,0,0 ; movdqa 0x2855(%rip),%xmm8 # 3f90 <_sk_callback_sse41+0x4ff>
DB 102,15,111,193 ; movdqa %xmm1,%xmm0
DB 102,65,15,219,192 ; pand %xmm8,%xmm0
DB 102,15,56,51,192 ; pmovzxwd %xmm0,%xmm0
@@ -11565,7 +11560,7 @@ _sk_load_tables_rgb_u16_be_sse41 LABEL PROC
DB 243,67,15,16,28,8 ; movss (%r8,%r9,1),%xmm3
DB 102,15,58,33,195,48 ; insertps $0x30,%xmm3,%xmm0
DB 76,139,64,16 ; mov 0x10(%rax),%r8
- DB 102,15,56,0,13,4,40,0,0 ; pshufb 0x2804(%rip),%xmm1 # 3fa0 <_sk_callback_sse41+0x50b>
+ DB 102,15,56,0,13,8,40,0,0 ; pshufb 0x2808(%rip),%xmm1 # 3fa0 <_sk_callback_sse41+0x50f>
DB 102,15,56,51,201 ; pmovzxwd %xmm1,%xmm1
DB 102,73,15,58,22,201,1 ; pextrq $0x1,%xmm1,%r9
DB 102,72,15,126,201 ; movq %xmm1,%rcx
@@ -11596,7 +11591,7 @@ _sk_load_tables_rgb_u16_be_sse41 LABEL PROC
DB 243,65,15,16,28,8 ; movss (%r8,%rcx,1),%xmm3
DB 102,15,58,33,211,48 ; insertps $0x30,%xmm3,%xmm2
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 15,40,29,111,39,0,0 ; movaps 0x276f(%rip),%xmm3 # 3fb0 <_sk_callback_sse41+0x51b>
+ DB 15,40,29,115,39,0,0 ; movaps 0x2773(%rip),%xmm3 # 3fb0 <_sk_callback_sse41+0x51f>
DB 255,224 ; jmpq *%rax
PUBLIC _sk_byte_tables_sse41
@@ -11604,7 +11599,7 @@ _sk_byte_tables_sse41 LABEL PROC
DB 65,86 ; push %r14
DB 83 ; push %rbx
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 68,15,40,5,112,39,0,0 ; movaps 0x2770(%rip),%xmm8 # 3fc0 <_sk_callback_sse41+0x52b>
+ DB 68,15,40,5,116,39,0,0 ; movaps 0x2774(%rip),%xmm8 # 3fc0 <_sk_callback_sse41+0x52f>
DB 65,15,89,192 ; mulps %xmm8,%xmm0
DB 102,15,91,192 ; cvtps2dq %xmm0,%xmm0
DB 102,72,15,58,22,193,1 ; pextrq $0x1,%xmm0,%rcx
@@ -11623,7 +11618,7 @@ _sk_byte_tables_sse41 LABEL PROC
DB 102,15,58,32,193,3 ; pinsrb $0x3,%ecx,%xmm0
DB 102,15,56,49,192 ; pmovzxbd %xmm0,%xmm0
DB 15,91,192 ; cvtdq2ps %xmm0,%xmm0
- DB 68,15,40,13,33,39,0,0 ; movaps 0x2721(%rip),%xmm9 # 3fd0 <_sk_callback_sse41+0x53b>
+ DB 68,15,40,13,37,39,0,0 ; movaps 0x2725(%rip),%xmm9 # 3fd0 <_sk_callback_sse41+0x53f>
DB 65,15,89,193 ; mulps %xmm9,%xmm0
DB 65,15,89,200 ; mulps %xmm8,%xmm1
DB 102,15,91,201 ; cvtps2dq %xmm1,%xmm1
@@ -11712,7 +11707,7 @@ _sk_byte_tables_rgb_sse41 LABEL PROC
DB 102,15,58,32,193,3 ; pinsrb $0x3,%ecx,%xmm0
DB 102,15,56,49,192 ; pmovzxbd %xmm0,%xmm0
DB 15,91,192 ; cvtdq2ps %xmm0,%xmm0
- DB 68,15,40,13,169,37,0,0 ; movaps 0x25a9(%rip),%xmm9 # 3fe0 <_sk_callback_sse41+0x54b>
+ DB 68,15,40,13,173,37,0,0 ; movaps 0x25ad(%rip),%xmm9 # 3fe0 <_sk_callback_sse41+0x54f>
DB 65,15,89,193 ; mulps %xmm9,%xmm0
DB 65,15,89,200 ; mulps %xmm8,%xmm1
DB 102,15,91,201 ; cvtps2dq %xmm1,%xmm1
@@ -11879,31 +11874,31 @@ _sk_parametric_r_sse41 LABEL PROC
DB 69,15,88,208 ; addps %xmm8,%xmm10
DB 69,15,198,219,0 ; shufps $0x0,%xmm11,%xmm11
DB 69,15,91,194 ; cvtdq2ps %xmm10,%xmm8
- DB 68,15,89,5,0,35,0,0 ; mulps 0x2300(%rip),%xmm8 # 3ff0 <_sk_callback_sse41+0x55b>
- DB 68,15,84,21,8,35,0,0 ; andps 0x2308(%rip),%xmm10 # 4000 <_sk_callback_sse41+0x56b>
- DB 68,15,86,21,16,35,0,0 ; orps 0x2310(%rip),%xmm10 # 4010 <_sk_callback_sse41+0x57b>
- DB 68,15,88,5,24,35,0,0 ; addps 0x2318(%rip),%xmm8 # 4020 <_sk_callback_sse41+0x58b>
- DB 68,15,40,37,32,35,0,0 ; movaps 0x2320(%rip),%xmm12 # 4030 <_sk_callback_sse41+0x59b>
+ DB 68,15,89,5,4,35,0,0 ; mulps 0x2304(%rip),%xmm8 # 3ff0 <_sk_callback_sse41+0x55f>
+ DB 68,15,84,21,12,35,0,0 ; andps 0x230c(%rip),%xmm10 # 4000 <_sk_callback_sse41+0x56f>
+ DB 68,15,86,21,20,35,0,0 ; orps 0x2314(%rip),%xmm10 # 4010 <_sk_callback_sse41+0x57f>
+ DB 68,15,88,5,28,35,0,0 ; addps 0x231c(%rip),%xmm8 # 4020 <_sk_callback_sse41+0x58f>
+ DB 68,15,40,37,36,35,0,0 ; movaps 0x2324(%rip),%xmm12 # 4030 <_sk_callback_sse41+0x59f>
DB 69,15,89,226 ; mulps %xmm10,%xmm12
DB 69,15,92,196 ; subps %xmm12,%xmm8
- DB 68,15,88,21,32,35,0,0 ; addps 0x2320(%rip),%xmm10 # 4040 <_sk_callback_sse41+0x5ab>
- DB 68,15,40,37,40,35,0,0 ; movaps 0x2328(%rip),%xmm12 # 4050 <_sk_callback_sse41+0x5bb>
+ DB 68,15,88,21,36,35,0,0 ; addps 0x2324(%rip),%xmm10 # 4040 <_sk_callback_sse41+0x5af>
+ DB 68,15,40,37,44,35,0,0 ; movaps 0x232c(%rip),%xmm12 # 4050 <_sk_callback_sse41+0x5bf>
DB 69,15,94,226 ; divps %xmm10,%xmm12
DB 69,15,92,196 ; subps %xmm12,%xmm8
DB 69,15,89,195 ; mulps %xmm11,%xmm8
DB 102,69,15,58,8,208,1 ; roundps $0x1,%xmm8,%xmm10
DB 69,15,40,216 ; movaps %xmm8,%xmm11
DB 69,15,92,218 ; subps %xmm10,%xmm11
- DB 68,15,88,5,21,35,0,0 ; addps 0x2315(%rip),%xmm8 # 4060 <_sk_callback_sse41+0x5cb>
- DB 68,15,40,21,29,35,0,0 ; movaps 0x231d(%rip),%xmm10 # 4070 <_sk_callback_sse41+0x5db>
+ DB 68,15,88,5,25,35,0,0 ; addps 0x2319(%rip),%xmm8 # 4060 <_sk_callback_sse41+0x5cf>
+ DB 68,15,40,21,33,35,0,0 ; movaps 0x2321(%rip),%xmm10 # 4070 <_sk_callback_sse41+0x5df>
DB 69,15,89,211 ; mulps %xmm11,%xmm10
DB 69,15,92,194 ; subps %xmm10,%xmm8
- DB 68,15,40,21,29,35,0,0 ; movaps 0x231d(%rip),%xmm10 # 4080 <_sk_callback_sse41+0x5eb>
+ DB 68,15,40,21,33,35,0,0 ; movaps 0x2321(%rip),%xmm10 # 4080 <_sk_callback_sse41+0x5ef>
DB 69,15,92,211 ; subps %xmm11,%xmm10
- DB 68,15,40,29,33,35,0,0 ; movaps 0x2321(%rip),%xmm11 # 4090 <_sk_callback_sse41+0x5fb>
+ DB 68,15,40,29,37,35,0,0 ; movaps 0x2325(%rip),%xmm11 # 4090 <_sk_callback_sse41+0x5ff>
DB 69,15,94,218 ; divps %xmm10,%xmm11
DB 69,15,88,216 ; addps %xmm8,%xmm11
- DB 68,15,89,29,33,35,0,0 ; mulps 0x2321(%rip),%xmm11 # 40a0 <_sk_callback_sse41+0x60b>
+ DB 68,15,89,29,37,35,0,0 ; mulps 0x2325(%rip),%xmm11 # 40a0 <_sk_callback_sse41+0x60f>
DB 102,69,15,91,211 ; cvtps2dq %xmm11,%xmm10
DB 243,68,15,16,64,20 ; movss 0x14(%rax),%xmm8
DB 69,15,198,192,0 ; shufps $0x0,%xmm8,%xmm8
@@ -11911,7 +11906,7 @@ _sk_parametric_r_sse41 LABEL PROC
DB 102,69,15,56,20,193 ; blendvps %xmm0,%xmm9,%xmm8
DB 15,87,192 ; xorps %xmm0,%xmm0
DB 68,15,95,192 ; maxps %xmm0,%xmm8
- DB 68,15,93,5,8,35,0,0 ; minps 0x2308(%rip),%xmm8 # 40b0 <_sk_callback_sse41+0x61b>
+ DB 68,15,93,5,12,35,0,0 ; minps 0x230c(%rip),%xmm8 # 40b0 <_sk_callback_sse41+0x61f>
DB 72,173 ; lods %ds:(%rsi),%rax
DB 65,15,40,192 ; movaps %xmm8,%xmm0
DB 255,224 ; jmpq *%rax
@@ -11939,31 +11934,31 @@ _sk_parametric_g_sse41 LABEL PROC
DB 68,15,88,217 ; addps %xmm1,%xmm11
DB 69,15,198,210,0 ; shufps $0x0,%xmm10,%xmm10
DB 69,15,91,227 ; cvtdq2ps %xmm11,%xmm12
- DB 68,15,89,37,169,34,0,0 ; mulps 0x22a9(%rip),%xmm12 # 40c0 <_sk_callback_sse41+0x62b>
- DB 68,15,84,29,177,34,0,0 ; andps 0x22b1(%rip),%xmm11 # 40d0 <_sk_callback_sse41+0x63b>
- DB 68,15,86,29,185,34,0,0 ; orps 0x22b9(%rip),%xmm11 # 40e0 <_sk_callback_sse41+0x64b>
- DB 68,15,88,37,193,34,0,0 ; addps 0x22c1(%rip),%xmm12 # 40f0 <_sk_callback_sse41+0x65b>
- DB 15,40,13,202,34,0,0 ; movaps 0x22ca(%rip),%xmm1 # 4100 <_sk_callback_sse41+0x66b>
+ DB 68,15,89,37,173,34,0,0 ; mulps 0x22ad(%rip),%xmm12 # 40c0 <_sk_callback_sse41+0x62f>
+ DB 68,15,84,29,181,34,0,0 ; andps 0x22b5(%rip),%xmm11 # 40d0 <_sk_callback_sse41+0x63f>
+ DB 68,15,86,29,189,34,0,0 ; orps 0x22bd(%rip),%xmm11 # 40e0 <_sk_callback_sse41+0x64f>
+ DB 68,15,88,37,197,34,0,0 ; addps 0x22c5(%rip),%xmm12 # 40f0 <_sk_callback_sse41+0x65f>
+ DB 15,40,13,206,34,0,0 ; movaps 0x22ce(%rip),%xmm1 # 4100 <_sk_callback_sse41+0x66f>
DB 65,15,89,203 ; mulps %xmm11,%xmm1
DB 68,15,92,225 ; subps %xmm1,%xmm12
- DB 68,15,88,29,202,34,0,0 ; addps 0x22ca(%rip),%xmm11 # 4110 <_sk_callback_sse41+0x67b>
- DB 15,40,13,211,34,0,0 ; movaps 0x22d3(%rip),%xmm1 # 4120 <_sk_callback_sse41+0x68b>
+ DB 68,15,88,29,206,34,0,0 ; addps 0x22ce(%rip),%xmm11 # 4110 <_sk_callback_sse41+0x67f>
+ DB 15,40,13,215,34,0,0 ; movaps 0x22d7(%rip),%xmm1 # 4120 <_sk_callback_sse41+0x68f>
DB 65,15,94,203 ; divps %xmm11,%xmm1
DB 68,15,92,225 ; subps %xmm1,%xmm12
DB 69,15,89,226 ; mulps %xmm10,%xmm12
DB 102,69,15,58,8,212,1 ; roundps $0x1,%xmm12,%xmm10
DB 69,15,40,220 ; movaps %xmm12,%xmm11
DB 69,15,92,218 ; subps %xmm10,%xmm11
- DB 68,15,88,37,192,34,0,0 ; addps 0x22c0(%rip),%xmm12 # 4130 <_sk_callback_sse41+0x69b>
- DB 15,40,13,201,34,0,0 ; movaps 0x22c9(%rip),%xmm1 # 4140 <_sk_callback_sse41+0x6ab>
+ DB 68,15,88,37,196,34,0,0 ; addps 0x22c4(%rip),%xmm12 # 4130 <_sk_callback_sse41+0x69f>
+ DB 15,40,13,205,34,0,0 ; movaps 0x22cd(%rip),%xmm1 # 4140 <_sk_callback_sse41+0x6af>
DB 65,15,89,203 ; mulps %xmm11,%xmm1
DB 68,15,92,225 ; subps %xmm1,%xmm12
- DB 68,15,40,21,201,34,0,0 ; movaps 0x22c9(%rip),%xmm10 # 4150 <_sk_callback_sse41+0x6bb>
+ DB 68,15,40,21,205,34,0,0 ; movaps 0x22cd(%rip),%xmm10 # 4150 <_sk_callback_sse41+0x6bf>
DB 69,15,92,211 ; subps %xmm11,%xmm10
- DB 15,40,13,206,34,0,0 ; movaps 0x22ce(%rip),%xmm1 # 4160 <_sk_callback_sse41+0x6cb>
+ DB 15,40,13,210,34,0,0 ; movaps 0x22d2(%rip),%xmm1 # 4160 <_sk_callback_sse41+0x6cf>
DB 65,15,94,202 ; divps %xmm10,%xmm1
DB 65,15,88,204 ; addps %xmm12,%xmm1
- DB 15,89,13,207,34,0,0 ; mulps 0x22cf(%rip),%xmm1 # 4170 <_sk_callback_sse41+0x6db>
+ DB 15,89,13,211,34,0,0 ; mulps 0x22d3(%rip),%xmm1 # 4170 <_sk_callback_sse41+0x6df>
DB 102,68,15,91,209 ; cvtps2dq %xmm1,%xmm10
DB 243,15,16,72,20 ; movss 0x14(%rax),%xmm1
DB 15,198,201,0 ; shufps $0x0,%xmm1,%xmm1
@@ -11971,7 +11966,7 @@ _sk_parametric_g_sse41 LABEL PROC
DB 102,65,15,56,20,201 ; blendvps %xmm0,%xmm9,%xmm1
DB 15,87,192 ; xorps %xmm0,%xmm0
DB 15,95,200 ; maxps %xmm0,%xmm1
- DB 15,93,13,186,34,0,0 ; minps 0x22ba(%rip),%xmm1 # 4180 <_sk_callback_sse41+0x6eb>
+ DB 15,93,13,190,34,0,0 ; minps 0x22be(%rip),%xmm1 # 4180 <_sk_callback_sse41+0x6ef>
DB 72,173 ; lods %ds:(%rsi),%rax
DB 65,15,40,192 ; movaps %xmm8,%xmm0
DB 255,224 ; jmpq *%rax
@@ -11999,31 +11994,31 @@ _sk_parametric_b_sse41 LABEL PROC
DB 68,15,88,218 ; addps %xmm2,%xmm11
DB 69,15,198,210,0 ; shufps $0x0,%xmm10,%xmm10
DB 69,15,91,227 ; cvtdq2ps %xmm11,%xmm12
- DB 68,15,89,37,91,34,0,0 ; mulps 0x225b(%rip),%xmm12 # 4190 <_sk_callback_sse41+0x6fb>
- DB 68,15,84,29,99,34,0,0 ; andps 0x2263(%rip),%xmm11 # 41a0 <_sk_callback_sse41+0x70b>
- DB 68,15,86,29,107,34,0,0 ; orps 0x226b(%rip),%xmm11 # 41b0 <_sk_callback_sse41+0x71b>
- DB 68,15,88,37,115,34,0,0 ; addps 0x2273(%rip),%xmm12 # 41c0 <_sk_callback_sse41+0x72b>
- DB 15,40,21,124,34,0,0 ; movaps 0x227c(%rip),%xmm2 # 41d0 <_sk_callback_sse41+0x73b>
+ DB 68,15,89,37,95,34,0,0 ; mulps 0x225f(%rip),%xmm12 # 4190 <_sk_callback_sse41+0x6ff>
+ DB 68,15,84,29,103,34,0,0 ; andps 0x2267(%rip),%xmm11 # 41a0 <_sk_callback_sse41+0x70f>
+ DB 68,15,86,29,111,34,0,0 ; orps 0x226f(%rip),%xmm11 # 41b0 <_sk_callback_sse41+0x71f>
+ DB 68,15,88,37,119,34,0,0 ; addps 0x2277(%rip),%xmm12 # 41c0 <_sk_callback_sse41+0x72f>
+ DB 15,40,21,128,34,0,0 ; movaps 0x2280(%rip),%xmm2 # 41d0 <_sk_callback_sse41+0x73f>
DB 65,15,89,211 ; mulps %xmm11,%xmm2
DB 68,15,92,226 ; subps %xmm2,%xmm12
- DB 68,15,88,29,124,34,0,0 ; addps 0x227c(%rip),%xmm11 # 41e0 <_sk_callback_sse41+0x74b>
- DB 15,40,21,133,34,0,0 ; movaps 0x2285(%rip),%xmm2 # 41f0 <_sk_callback_sse41+0x75b>
+ DB 68,15,88,29,128,34,0,0 ; addps 0x2280(%rip),%xmm11 # 41e0 <_sk_callback_sse41+0x74f>
+ DB 15,40,21,137,34,0,0 ; movaps 0x2289(%rip),%xmm2 # 41f0 <_sk_callback_sse41+0x75f>
DB 65,15,94,211 ; divps %xmm11,%xmm2
DB 68,15,92,226 ; subps %xmm2,%xmm12
DB 69,15,89,226 ; mulps %xmm10,%xmm12
DB 102,69,15,58,8,212,1 ; roundps $0x1,%xmm12,%xmm10
DB 69,15,40,220 ; movaps %xmm12,%xmm11
DB 69,15,92,218 ; subps %xmm10,%xmm11
- DB 68,15,88,37,114,34,0,0 ; addps 0x2272(%rip),%xmm12 # 4200 <_sk_callback_sse41+0x76b>
- DB 15,40,21,123,34,0,0 ; movaps 0x227b(%rip),%xmm2 # 4210 <_sk_callback_sse41+0x77b>
+ DB 68,15,88,37,118,34,0,0 ; addps 0x2276(%rip),%xmm12 # 4200 <_sk_callback_sse41+0x76f>
+ DB 15,40,21,127,34,0,0 ; movaps 0x227f(%rip),%xmm2 # 4210 <_sk_callback_sse41+0x77f>
DB 65,15,89,211 ; mulps %xmm11,%xmm2
DB 68,15,92,226 ; subps %xmm2,%xmm12
- DB 68,15,40,21,123,34,0,0 ; movaps 0x227b(%rip),%xmm10 # 4220 <_sk_callback_sse41+0x78b>
+ DB 68,15,40,21,127,34,0,0 ; movaps 0x227f(%rip),%xmm10 # 4220 <_sk_callback_sse41+0x78f>
DB 69,15,92,211 ; subps %xmm11,%xmm10
- DB 15,40,21,128,34,0,0 ; movaps 0x2280(%rip),%xmm2 # 4230 <_sk_callback_sse41+0x79b>
+ DB 15,40,21,132,34,0,0 ; movaps 0x2284(%rip),%xmm2 # 4230 <_sk_callback_sse41+0x79f>
DB 65,15,94,210 ; divps %xmm10,%xmm2
DB 65,15,88,212 ; addps %xmm12,%xmm2
- DB 15,89,21,129,34,0,0 ; mulps 0x2281(%rip),%xmm2 # 4240 <_sk_callback_sse41+0x7ab>
+ DB 15,89,21,133,34,0,0 ; mulps 0x2285(%rip),%xmm2 # 4240 <_sk_callback_sse41+0x7af>
DB 102,68,15,91,210 ; cvtps2dq %xmm2,%xmm10
DB 243,15,16,80,20 ; movss 0x14(%rax),%xmm2
DB 15,198,210,0 ; shufps $0x0,%xmm2,%xmm2
@@ -12031,7 +12026,7 @@ _sk_parametric_b_sse41 LABEL PROC
DB 102,65,15,56,20,209 ; blendvps %xmm0,%xmm9,%xmm2
DB 15,87,192 ; xorps %xmm0,%xmm0
DB 15,95,208 ; maxps %xmm0,%xmm2
- DB 15,93,21,108,34,0,0 ; minps 0x226c(%rip),%xmm2 # 4250 <_sk_callback_sse41+0x7bb>
+ DB 15,93,21,112,34,0,0 ; minps 0x2270(%rip),%xmm2 # 4250 <_sk_callback_sse41+0x7bf>
DB 72,173 ; lods %ds:(%rsi),%rax
DB 65,15,40,192 ; movaps %xmm8,%xmm0
DB 255,224 ; jmpq *%rax
@@ -12059,31 +12054,31 @@ _sk_parametric_a_sse41 LABEL PROC
DB 68,15,88,219 ; addps %xmm3,%xmm11
DB 69,15,198,210,0 ; shufps $0x0,%xmm10,%xmm10
DB 69,15,91,227 ; cvtdq2ps %xmm11,%xmm12
- DB 68,15,89,37,13,34,0,0 ; mulps 0x220d(%rip),%xmm12 # 4260 <_sk_callback_sse41+0x7cb>
- DB 68,15,84,29,21,34,0,0 ; andps 0x2215(%rip),%xmm11 # 4270 <_sk_callback_sse41+0x7db>
- DB 68,15,86,29,29,34,0,0 ; orps 0x221d(%rip),%xmm11 # 4280 <_sk_callback_sse41+0x7eb>
- DB 68,15,88,37,37,34,0,0 ; addps 0x2225(%rip),%xmm12 # 4290 <_sk_callback_sse41+0x7fb>
- DB 15,40,29,46,34,0,0 ; movaps 0x222e(%rip),%xmm3 # 42a0 <_sk_callback_sse41+0x80b>
+ DB 68,15,89,37,17,34,0,0 ; mulps 0x2211(%rip),%xmm12 # 4260 <_sk_callback_sse41+0x7cf>
+ DB 68,15,84,29,25,34,0,0 ; andps 0x2219(%rip),%xmm11 # 4270 <_sk_callback_sse41+0x7df>
+ DB 68,15,86,29,33,34,0,0 ; orps 0x2221(%rip),%xmm11 # 4280 <_sk_callback_sse41+0x7ef>
+ DB 68,15,88,37,41,34,0,0 ; addps 0x2229(%rip),%xmm12 # 4290 <_sk_callback_sse41+0x7ff>
+ DB 15,40,29,50,34,0,0 ; movaps 0x2232(%rip),%xmm3 # 42a0 <_sk_callback_sse41+0x80f>
DB 65,15,89,219 ; mulps %xmm11,%xmm3
DB 68,15,92,227 ; subps %xmm3,%xmm12
- DB 68,15,88,29,46,34,0,0 ; addps 0x222e(%rip),%xmm11 # 42b0 <_sk_callback_sse41+0x81b>
- DB 15,40,29,55,34,0,0 ; movaps 0x2237(%rip),%xmm3 # 42c0 <_sk_callback_sse41+0x82b>
+ DB 68,15,88,29,50,34,0,0 ; addps 0x2232(%rip),%xmm11 # 42b0 <_sk_callback_sse41+0x81f>
+ DB 15,40,29,59,34,0,0 ; movaps 0x223b(%rip),%xmm3 # 42c0 <_sk_callback_sse41+0x82f>
DB 65,15,94,219 ; divps %xmm11,%xmm3
DB 68,15,92,227 ; subps %xmm3,%xmm12
DB 69,15,89,226 ; mulps %xmm10,%xmm12
DB 102,69,15,58,8,212,1 ; roundps $0x1,%xmm12,%xmm10
DB 69,15,40,220 ; movaps %xmm12,%xmm11
DB 69,15,92,218 ; subps %xmm10,%xmm11
- DB 68,15,88,37,36,34,0,0 ; addps 0x2224(%rip),%xmm12 # 42d0 <_sk_callback_sse41+0x83b>
- DB 15,40,29,45,34,0,0 ; movaps 0x222d(%rip),%xmm3 # 42e0 <_sk_callback_sse41+0x84b>
+ DB 68,15,88,37,40,34,0,0 ; addps 0x2228(%rip),%xmm12 # 42d0 <_sk_callback_sse41+0x83f>
+ DB 15,40,29,49,34,0,0 ; movaps 0x2231(%rip),%xmm3 # 42e0 <_sk_callback_sse41+0x84f>
DB 65,15,89,219 ; mulps %xmm11,%xmm3
DB 68,15,92,227 ; subps %xmm3,%xmm12
- DB 68,15,40,21,45,34,0,0 ; movaps 0x222d(%rip),%xmm10 # 42f0 <_sk_callback_sse41+0x85b>
+ DB 68,15,40,21,49,34,0,0 ; movaps 0x2231(%rip),%xmm10 # 42f0 <_sk_callback_sse41+0x85f>
DB 69,15,92,211 ; subps %xmm11,%xmm10
- DB 15,40,29,50,34,0,0 ; movaps 0x2232(%rip),%xmm3 # 4300 <_sk_callback_sse41+0x86b>
+ DB 15,40,29,54,34,0,0 ; movaps 0x2236(%rip),%xmm3 # 4300 <_sk_callback_sse41+0x86f>
DB 65,15,94,218 ; divps %xmm10,%xmm3
DB 65,15,88,220 ; addps %xmm12,%xmm3
- DB 15,89,29,51,34,0,0 ; mulps 0x2233(%rip),%xmm3 # 4310 <_sk_callback_sse41+0x87b>
+ DB 15,89,29,55,34,0,0 ; mulps 0x2237(%rip),%xmm3 # 4310 <_sk_callback_sse41+0x87f>
DB 102,68,15,91,211 ; cvtps2dq %xmm3,%xmm10
DB 243,15,16,88,20 ; movss 0x14(%rax),%xmm3
DB 15,198,219,0 ; shufps $0x0,%xmm3,%xmm3
@@ -12091,7 +12086,7 @@ _sk_parametric_a_sse41 LABEL PROC
DB 102,65,15,56,20,217 ; blendvps %xmm0,%xmm9,%xmm3
DB 15,87,192 ; xorps %xmm0,%xmm0
DB 15,95,216 ; maxps %xmm0,%xmm3
- DB 15,93,29,30,34,0,0 ; minps 0x221e(%rip),%xmm3 # 4320 <_sk_callback_sse41+0x88b>
+ DB 15,93,29,34,34,0,0 ; minps 0x2222(%rip),%xmm3 # 4320 <_sk_callback_sse41+0x88f>
DB 72,173 ; lods %ds:(%rsi),%rax
DB 65,15,40,192 ; movaps %xmm8,%xmm0
DB 255,224 ; jmpq *%rax
@@ -12099,29 +12094,29 @@ _sk_parametric_a_sse41 LABEL PROC
PUBLIC _sk_lab_to_xyz_sse41
_sk_lab_to_xyz_sse41 LABEL PROC
DB 68,15,40,192 ; movaps %xmm0,%xmm8
- DB 68,15,89,5,26,34,0,0 ; mulps 0x221a(%rip),%xmm8 # 4330 <_sk_callback_sse41+0x89b>
- DB 68,15,40,13,34,34,0,0 ; movaps 0x2222(%rip),%xmm9 # 4340 <_sk_callback_sse41+0x8ab>
+ DB 68,15,89,5,30,34,0,0 ; mulps 0x221e(%rip),%xmm8 # 4330 <_sk_callback_sse41+0x89f>
+ DB 68,15,40,13,38,34,0,0 ; movaps 0x2226(%rip),%xmm9 # 4340 <_sk_callback_sse41+0x8af>
DB 65,15,89,201 ; mulps %xmm9,%xmm1
- DB 15,40,5,39,34,0,0 ; movaps 0x2227(%rip),%xmm0 # 4350 <_sk_callback_sse41+0x8bb>
+ DB 15,40,5,43,34,0,0 ; movaps 0x222b(%rip),%xmm0 # 4350 <_sk_callback_sse41+0x8bf>
DB 15,88,200 ; addps %xmm0,%xmm1
DB 65,15,89,209 ; mulps %xmm9,%xmm2
DB 15,88,208 ; addps %xmm0,%xmm2
- DB 68,15,88,5,37,34,0,0 ; addps 0x2225(%rip),%xmm8 # 4360 <_sk_callback_sse41+0x8cb>
- DB 68,15,89,5,45,34,0,0 ; mulps 0x222d(%rip),%xmm8 # 4370 <_sk_callback_sse41+0x8db>
- DB 15,89,13,54,34,0,0 ; mulps 0x2236(%rip),%xmm1 # 4380 <_sk_callback_sse41+0x8eb>
+ DB 68,15,88,5,41,34,0,0 ; addps 0x2229(%rip),%xmm8 # 4360 <_sk_callback_sse41+0x8cf>
+ DB 68,15,89,5,49,34,0,0 ; mulps 0x2231(%rip),%xmm8 # 4370 <_sk_callback_sse41+0x8df>
+ DB 15,89,13,58,34,0,0 ; mulps 0x223a(%rip),%xmm1 # 4380 <_sk_callback_sse41+0x8ef>
DB 65,15,88,200 ; addps %xmm8,%xmm1
- DB 15,89,21,59,34,0,0 ; mulps 0x223b(%rip),%xmm2 # 4390 <_sk_callback_sse41+0x8fb>
+ DB 15,89,21,63,34,0,0 ; mulps 0x223f(%rip),%xmm2 # 4390 <_sk_callback_sse41+0x8ff>
DB 69,15,40,208 ; movaps %xmm8,%xmm10
DB 68,15,92,210 ; subps %xmm2,%xmm10
DB 68,15,40,217 ; movaps %xmm1,%xmm11
DB 69,15,89,219 ; mulps %xmm11,%xmm11
DB 68,15,89,217 ; mulps %xmm1,%xmm11
- DB 68,15,40,13,47,34,0,0 ; movaps 0x222f(%rip),%xmm9 # 43a0 <_sk_callback_sse41+0x90b>
+ DB 68,15,40,13,51,34,0,0 ; movaps 0x2233(%rip),%xmm9 # 43a0 <_sk_callback_sse41+0x90f>
DB 65,15,40,193 ; movaps %xmm9,%xmm0
DB 65,15,194,195,1 ; cmpltps %xmm11,%xmm0
- DB 15,40,21,47,34,0,0 ; movaps 0x222f(%rip),%xmm2 # 43b0 <_sk_callback_sse41+0x91b>
+ DB 15,40,21,51,34,0,0 ; movaps 0x2233(%rip),%xmm2 # 43b0 <_sk_callback_sse41+0x91f>
DB 15,88,202 ; addps %xmm2,%xmm1
- DB 68,15,40,37,52,34,0,0 ; movaps 0x2234(%rip),%xmm12 # 43c0 <_sk_callback_sse41+0x92b>
+ DB 68,15,40,37,56,34,0,0 ; movaps 0x2238(%rip),%xmm12 # 43c0 <_sk_callback_sse41+0x92f>
DB 65,15,89,204 ; mulps %xmm12,%xmm1
DB 102,65,15,56,20,203 ; blendvps %xmm0,%xmm11,%xmm1
DB 69,15,40,216 ; movaps %xmm8,%xmm11
@@ -12140,8 +12135,8 @@ _sk_lab_to_xyz_sse41 LABEL PROC
DB 65,15,89,212 ; mulps %xmm12,%xmm2
DB 65,15,40,193 ; movaps %xmm9,%xmm0
DB 102,65,15,56,20,211 ; blendvps %xmm0,%xmm11,%xmm2
- DB 15,89,13,237,33,0,0 ; mulps 0x21ed(%rip),%xmm1 # 43d0 <_sk_callback_sse41+0x93b>
- DB 15,89,21,246,33,0,0 ; mulps 0x21f6(%rip),%xmm2 # 43e0 <_sk_callback_sse41+0x94b>
+ DB 15,89,13,241,33,0,0 ; mulps 0x21f1(%rip),%xmm1 # 43d0 <_sk_callback_sse41+0x93f>
+ DB 15,89,21,250,33,0,0 ; mulps 0x21fa(%rip),%xmm2 # 43e0 <_sk_callback_sse41+0x94f>
DB 72,173 ; lods %ds:(%rsi),%rax
DB 15,40,193 ; movaps %xmm1,%xmm0
DB 65,15,40,200 ; movaps %xmm8,%xmm1
@@ -12153,7 +12148,7 @@ _sk_load_a8_sse41 LABEL PROC
DB 72,139,0 ; mov (%rax),%rax
DB 102,15,56,49,4,56 ; pmovzxbd (%rax,%rdi,1),%xmm0
DB 15,91,216 ; cvtdq2ps %xmm0,%xmm3
- DB 15,89,29,230,33,0,0 ; mulps 0x21e6(%rip),%xmm3 # 43f0 <_sk_callback_sse41+0x95b>
+ DB 15,89,29,234,33,0,0 ; mulps 0x21ea(%rip),%xmm3 # 43f0 <_sk_callback_sse41+0x95f>
DB 72,173 ; lods %ds:(%rsi),%rax
DB 15,87,192 ; xorps %xmm0,%xmm0
DB 15,87,201 ; xorps %xmm1,%xmm1
@@ -12184,7 +12179,7 @@ _sk_gather_a8_sse41 LABEL PROC
DB 102,15,58,32,192,3 ; pinsrb $0x3,%eax,%xmm0
DB 102,15,56,49,192 ; pmovzxbd %xmm0,%xmm0
DB 15,91,216 ; cvtdq2ps %xmm0,%xmm3
- DB 15,89,29,122,33,0,0 ; mulps 0x217a(%rip),%xmm3 # 4400 <_sk_callback_sse41+0x96b>
+ DB 15,89,29,126,33,0,0 ; mulps 0x217e(%rip),%xmm3 # 4400 <_sk_callback_sse41+0x96f>
DB 72,173 ; lods %ds:(%rsi),%rax
DB 15,87,192 ; xorps %xmm0,%xmm0
DB 102,15,239,201 ; pxor %xmm1,%xmm1
@@ -12195,7 +12190,7 @@ PUBLIC _sk_store_a8_sse41
_sk_store_a8_sse41 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 72,139,0 ; mov (%rax),%rax
- DB 68,15,40,5,110,33,0,0 ; movaps 0x216e(%rip),%xmm8 # 4410 <_sk_callback_sse41+0x97b>
+ DB 68,15,40,5,114,33,0,0 ; movaps 0x2172(%rip),%xmm8 # 4410 <_sk_callback_sse41+0x97f>
DB 68,15,89,195 ; mulps %xmm3,%xmm8
DB 102,69,15,91,192 ; cvtps2dq %xmm8,%xmm8
DB 102,69,15,56,43,192 ; packusdw %xmm8,%xmm8
@@ -12210,9 +12205,9 @@ _sk_load_g8_sse41 LABEL PROC
DB 72,139,0 ; mov (%rax),%rax
DB 102,15,56,49,4,56 ; pmovzxbd (%rax,%rdi,1),%xmm0
DB 15,91,192 ; cvtdq2ps %xmm0,%xmm0
- DB 15,89,5,75,33,0,0 ; mulps 0x214b(%rip),%xmm0 # 4420 <_sk_callback_sse41+0x98b>
+ DB 15,89,5,79,33,0,0 ; mulps 0x214f(%rip),%xmm0 # 4420 <_sk_callback_sse41+0x98f>
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 15,40,29,82,33,0,0 ; movaps 0x2152(%rip),%xmm3 # 4430 <_sk_callback_sse41+0x99b>
+ DB 15,40,29,86,33,0,0 ; movaps 0x2156(%rip),%xmm3 # 4430 <_sk_callback_sse41+0x99f>
DB 15,40,200 ; movaps %xmm0,%xmm1
DB 15,40,208 ; movaps %xmm0,%xmm2
DB 255,224 ; jmpq *%rax
@@ -12241,9 +12236,9 @@ _sk_gather_g8_sse41 LABEL PROC
DB 102,15,58,32,192,3 ; pinsrb $0x3,%eax,%xmm0
DB 102,15,56,49,192 ; pmovzxbd %xmm0,%xmm0
DB 15,91,192 ; cvtdq2ps %xmm0,%xmm0
- DB 15,89,5,235,32,0,0 ; mulps 0x20eb(%rip),%xmm0 # 4440 <_sk_callback_sse41+0x9ab>
+ DB 15,89,5,239,32,0,0 ; mulps 0x20ef(%rip),%xmm0 # 4440 <_sk_callback_sse41+0x9af>
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 15,40,29,242,32,0,0 ; movaps 0x20f2(%rip),%xmm3 # 4450 <_sk_callback_sse41+0x9bb>
+ DB 15,40,29,246,32,0,0 ; movaps 0x20f6(%rip),%xmm3 # 4450 <_sk_callback_sse41+0x9bf>
DB 15,40,200 ; movaps %xmm0,%xmm1
DB 15,40,208 ; movaps %xmm0,%xmm2
DB 255,224 ; jmpq *%rax
@@ -12253,9 +12248,9 @@ _sk_gather_i8_sse41 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 73,137,192 ; mov %rax,%r8
DB 77,133,192 ; test %r8,%r8
- DB 116,5 ; je 2375 <_sk_gather_i8_sse41+0xf>
+ DB 116,5 ; je 2371 <_sk_gather_i8_sse41+0xf>
DB 76,137,192 ; mov %r8,%rax
- DB 235,2 ; jmp 2377 <_sk_gather_i8_sse41+0x11>
+ DB 235,2 ; jmp 2373 <_sk_gather_i8_sse41+0x11>
DB 72,173 ; lods %ds:(%rsi),%rax
DB 76,139,16 ; mov (%rax),%r10
DB 243,15,91,201 ; cvttps2dq %xmm1,%xmm1
@@ -12286,17 +12281,17 @@ _sk_gather_i8_sse41 LABEL PROC
DB 102,15,58,34,28,8,1 ; pinsrd $0x1,(%rax,%rcx,1),%xmm3
DB 102,66,15,58,34,28,144,2 ; pinsrd $0x2,(%rax,%r10,4),%xmm3
DB 102,66,15,58,34,28,8,3 ; pinsrd $0x3,(%rax,%r9,1),%xmm3
- DB 102,15,111,5,73,32,0,0 ; movdqa 0x2049(%rip),%xmm0 # 4460 <_sk_callback_sse41+0x9cb>
+ DB 102,15,111,5,77,32,0,0 ; movdqa 0x204d(%rip),%xmm0 # 4460 <_sk_callback_sse41+0x9cf>
DB 102,15,219,195 ; pand %xmm3,%xmm0
DB 15,91,192 ; cvtdq2ps %xmm0,%xmm0
- DB 68,15,40,5,74,32,0,0 ; movaps 0x204a(%rip),%xmm8 # 4470 <_sk_callback_sse41+0x9db>
+ DB 68,15,40,5,78,32,0,0 ; movaps 0x204e(%rip),%xmm8 # 4470 <_sk_callback_sse41+0x9df>
DB 65,15,89,192 ; mulps %xmm8,%xmm0
DB 102,15,111,203 ; movdqa %xmm3,%xmm1
- DB 102,15,56,0,13,73,32,0,0 ; pshufb 0x2049(%rip),%xmm1 # 4480 <_sk_callback_sse41+0x9eb>
+ DB 102,15,56,0,13,77,32,0,0 ; pshufb 0x204d(%rip),%xmm1 # 4480 <_sk_callback_sse41+0x9ef>
DB 15,91,201 ; cvtdq2ps %xmm1,%xmm1
DB 65,15,89,200 ; mulps %xmm8,%xmm1
DB 102,15,111,211 ; movdqa %xmm3,%xmm2
- DB 102,15,56,0,21,69,32,0,0 ; pshufb 0x2045(%rip),%xmm2 # 4490 <_sk_callback_sse41+0x9fb>
+ DB 102,15,56,0,21,73,32,0,0 ; pshufb 0x2049(%rip),%xmm2 # 4490 <_sk_callback_sse41+0x9ff>
DB 15,91,210 ; cvtdq2ps %xmm2,%xmm2
DB 65,15,89,208 ; mulps %xmm8,%xmm2
DB 102,15,114,211,24 ; psrld $0x18,%xmm3
@@ -12310,19 +12305,19 @@ _sk_load_565_sse41 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 72,139,0 ; mov (%rax),%rax
DB 102,15,56,51,20,120 ; pmovzxwd (%rax,%rdi,2),%xmm2
- DB 102,15,111,5,43,32,0,0 ; movdqa 0x202b(%rip),%xmm0 # 44a0 <_sk_callback_sse41+0xa0b>
+ DB 102,15,111,5,47,32,0,0 ; movdqa 0x202f(%rip),%xmm0 # 44a0 <_sk_callback_sse41+0xa0f>
DB 102,15,219,194 ; pand %xmm2,%xmm0
DB 15,91,192 ; cvtdq2ps %xmm0,%xmm0
- DB 15,89,5,45,32,0,0 ; mulps 0x202d(%rip),%xmm0 # 44b0 <_sk_callback_sse41+0xa1b>
- DB 102,15,111,13,53,32,0,0 ; movdqa 0x2035(%rip),%xmm1 # 44c0 <_sk_callback_sse41+0xa2b>
+ DB 15,89,5,49,32,0,0 ; mulps 0x2031(%rip),%xmm0 # 44b0 <_sk_callback_sse41+0xa1f>
+ DB 102,15,111,13,57,32,0,0 ; movdqa 0x2039(%rip),%xmm1 # 44c0 <_sk_callback_sse41+0xa2f>
DB 102,15,219,202 ; pand %xmm2,%xmm1
DB 15,91,201 ; cvtdq2ps %xmm1,%xmm1
- DB 15,89,13,55,32,0,0 ; mulps 0x2037(%rip),%xmm1 # 44d0 <_sk_callback_sse41+0xa3b>
- DB 102,15,219,21,63,32,0,0 ; pand 0x203f(%rip),%xmm2 # 44e0 <_sk_callback_sse41+0xa4b>
+ DB 15,89,13,59,32,0,0 ; mulps 0x203b(%rip),%xmm1 # 44d0 <_sk_callback_sse41+0xa3f>
+ DB 102,15,219,21,67,32,0,0 ; pand 0x2043(%rip),%xmm2 # 44e0 <_sk_callback_sse41+0xa4f>
DB 15,91,210 ; cvtdq2ps %xmm2,%xmm2
- DB 15,89,21,69,32,0,0 ; mulps 0x2045(%rip),%xmm2 # 44f0 <_sk_callback_sse41+0xa5b>
+ DB 15,89,21,73,32,0,0 ; mulps 0x2049(%rip),%xmm2 # 44f0 <_sk_callback_sse41+0xa5f>
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 15,40,29,76,32,0,0 ; movaps 0x204c(%rip),%xmm3 # 4500 <_sk_callback_sse41+0xa6b>
+ DB 15,40,29,80,32,0,0 ; movaps 0x2050(%rip),%xmm3 # 4500 <_sk_callback_sse41+0xa6f>
DB 255,224 ; jmpq *%rax
PUBLIC _sk_gather_565_sse41
@@ -12348,31 +12343,31 @@ _sk_gather_565_sse41 LABEL PROC
DB 65,15,183,4,65 ; movzwl (%r9,%rax,2),%eax
DB 102,15,196,192,3 ; pinsrw $0x3,%eax,%xmm0
DB 102,15,56,51,208 ; pmovzxwd %xmm0,%xmm2
- DB 102,15,111,5,241,31,0,0 ; movdqa 0x1ff1(%rip),%xmm0 # 4510 <_sk_callback_sse41+0xa7b>
+ DB 102,15,111,5,245,31,0,0 ; movdqa 0x1ff5(%rip),%xmm0 # 4510 <_sk_callback_sse41+0xa7f>
DB 102,15,219,194 ; pand %xmm2,%xmm0
DB 15,91,192 ; cvtdq2ps %xmm0,%xmm0
- DB 15,89,5,243,31,0,0 ; mulps 0x1ff3(%rip),%xmm0 # 4520 <_sk_callback_sse41+0xa8b>
- DB 102,15,111,13,251,31,0,0 ; movdqa 0x1ffb(%rip),%xmm1 # 4530 <_sk_callback_sse41+0xa9b>
+ DB 15,89,5,247,31,0,0 ; mulps 0x1ff7(%rip),%xmm0 # 4520 <_sk_callback_sse41+0xa8f>
+ DB 102,15,111,13,255,31,0,0 ; movdqa 0x1fff(%rip),%xmm1 # 4530 <_sk_callback_sse41+0xa9f>
DB 102,15,219,202 ; pand %xmm2,%xmm1
DB 15,91,201 ; cvtdq2ps %xmm1,%xmm1
- DB 15,89,13,253,31,0,0 ; mulps 0x1ffd(%rip),%xmm1 # 4540 <_sk_callback_sse41+0xaab>
- DB 102,15,219,21,5,32,0,0 ; pand 0x2005(%rip),%xmm2 # 4550 <_sk_callback_sse41+0xabb>
+ DB 15,89,13,1,32,0,0 ; mulps 0x2001(%rip),%xmm1 # 4540 <_sk_callback_sse41+0xaaf>
+ DB 102,15,219,21,9,32,0,0 ; pand 0x2009(%rip),%xmm2 # 4550 <_sk_callback_sse41+0xabf>
DB 15,91,210 ; cvtdq2ps %xmm2,%xmm2
- DB 15,89,21,11,32,0,0 ; mulps 0x200b(%rip),%xmm2 # 4560 <_sk_callback_sse41+0xacb>
+ DB 15,89,21,15,32,0,0 ; mulps 0x200f(%rip),%xmm2 # 4560 <_sk_callback_sse41+0xacf>
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 15,40,29,18,32,0,0 ; movaps 0x2012(%rip),%xmm3 # 4570 <_sk_callback_sse41+0xadb>
+ DB 15,40,29,22,32,0,0 ; movaps 0x2016(%rip),%xmm3 # 4570 <_sk_callback_sse41+0xadf>
DB 255,224 ; jmpq *%rax
PUBLIC _sk_store_565_sse41
_sk_store_565_sse41 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 72,139,0 ; mov (%rax),%rax
- DB 68,15,40,5,19,32,0,0 ; movaps 0x2013(%rip),%xmm8 # 4580 <_sk_callback_sse41+0xaeb>
+ DB 68,15,40,5,23,32,0,0 ; movaps 0x2017(%rip),%xmm8 # 4580 <_sk_callback_sse41+0xaef>
DB 68,15,40,200 ; movaps %xmm0,%xmm9
DB 69,15,89,200 ; mulps %xmm8,%xmm9
DB 102,69,15,91,201 ; cvtps2dq %xmm9,%xmm9
DB 102,65,15,114,241,11 ; pslld $0xb,%xmm9
- DB 68,15,40,21,8,32,0,0 ; movaps 0x2008(%rip),%xmm10 # 4590 <_sk_callback_sse41+0xafb>
+ DB 68,15,40,21,12,32,0,0 ; movaps 0x200c(%rip),%xmm10 # 4590 <_sk_callback_sse41+0xaff>
DB 68,15,89,209 ; mulps %xmm1,%xmm10
DB 102,69,15,91,210 ; cvtps2dq %xmm10,%xmm10
DB 102,65,15,114,242,5 ; pslld $0x5,%xmm10
@@ -12390,21 +12385,21 @@ _sk_load_4444_sse41 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 72,139,0 ; mov (%rax),%rax
DB 102,15,56,51,28,120 ; pmovzxwd (%rax,%rdi,2),%xmm3
- DB 102,15,111,5,211,31,0,0 ; movdqa 0x1fd3(%rip),%xmm0 # 45a0 <_sk_callback_sse41+0xb0b>
+ DB 102,15,111,5,215,31,0,0 ; movdqa 0x1fd7(%rip),%xmm0 # 45a0 <_sk_callback_sse41+0xb0f>
DB 102,15,219,195 ; pand %xmm3,%xmm0
DB 15,91,192 ; cvtdq2ps %xmm0,%xmm0
- DB 15,89,5,213,31,0,0 ; mulps 0x1fd5(%rip),%xmm0 # 45b0 <_sk_callback_sse41+0xb1b>
- DB 102,15,111,13,221,31,0,0 ; movdqa 0x1fdd(%rip),%xmm1 # 45c0 <_sk_callback_sse41+0xb2b>
+ DB 15,89,5,217,31,0,0 ; mulps 0x1fd9(%rip),%xmm0 # 45b0 <_sk_callback_sse41+0xb1f>
+ DB 102,15,111,13,225,31,0,0 ; movdqa 0x1fe1(%rip),%xmm1 # 45c0 <_sk_callback_sse41+0xb2f>
DB 102,15,219,203 ; pand %xmm3,%xmm1
DB 15,91,201 ; cvtdq2ps %xmm1,%xmm1
- DB 15,89,13,223,31,0,0 ; mulps 0x1fdf(%rip),%xmm1 # 45d0 <_sk_callback_sse41+0xb3b>
- DB 102,15,111,21,231,31,0,0 ; movdqa 0x1fe7(%rip),%xmm2 # 45e0 <_sk_callback_sse41+0xb4b>
+ DB 15,89,13,227,31,0,0 ; mulps 0x1fe3(%rip),%xmm1 # 45d0 <_sk_callback_sse41+0xb3f>
+ DB 102,15,111,21,235,31,0,0 ; movdqa 0x1feb(%rip),%xmm2 # 45e0 <_sk_callback_sse41+0xb4f>
DB 102,15,219,211 ; pand %xmm3,%xmm2
DB 15,91,210 ; cvtdq2ps %xmm2,%xmm2
- DB 15,89,21,233,31,0,0 ; mulps 0x1fe9(%rip),%xmm2 # 45f0 <_sk_callback_sse41+0xb5b>
- DB 102,15,219,29,241,31,0,0 ; pand 0x1ff1(%rip),%xmm3 # 4600 <_sk_callback_sse41+0xb6b>
+ DB 15,89,21,237,31,0,0 ; mulps 0x1fed(%rip),%xmm2 # 45f0 <_sk_callback_sse41+0xb5f>
+ DB 102,15,219,29,245,31,0,0 ; pand 0x1ff5(%rip),%xmm3 # 4600 <_sk_callback_sse41+0xb6f>
DB 15,91,219 ; cvtdq2ps %xmm3,%xmm3
- DB 15,89,29,247,31,0,0 ; mulps 0x1ff7(%rip),%xmm3 # 4610 <_sk_callback_sse41+0xb7b>
+ DB 15,89,29,251,31,0,0 ; mulps 0x1ffb(%rip),%xmm3 # 4610 <_sk_callback_sse41+0xb7f>
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
@@ -12431,21 +12426,21 @@ _sk_gather_4444_sse41 LABEL PROC
DB 65,15,183,4,65 ; movzwl (%r9,%rax,2),%eax
DB 102,15,196,192,3 ; pinsrw $0x3,%eax,%xmm0
DB 102,15,56,51,216 ; pmovzxwd %xmm0,%xmm3
- DB 102,15,111,5,154,31,0,0 ; movdqa 0x1f9a(%rip),%xmm0 # 4620 <_sk_callback_sse41+0xb8b>
+ DB 102,15,111,5,158,31,0,0 ; movdqa 0x1f9e(%rip),%xmm0 # 4620 <_sk_callback_sse41+0xb8f>
DB 102,15,219,195 ; pand %xmm3,%xmm0
DB 15,91,192 ; cvtdq2ps %xmm0,%xmm0
- DB 15,89,5,156,31,0,0 ; mulps 0x1f9c(%rip),%xmm0 # 4630 <_sk_callback_sse41+0xb9b>
- DB 102,15,111,13,164,31,0,0 ; movdqa 0x1fa4(%rip),%xmm1 # 4640 <_sk_callback_sse41+0xbab>
+ DB 15,89,5,160,31,0,0 ; mulps 0x1fa0(%rip),%xmm0 # 4630 <_sk_callback_sse41+0xb9f>
+ DB 102,15,111,13,168,31,0,0 ; movdqa 0x1fa8(%rip),%xmm1 # 4640 <_sk_callback_sse41+0xbaf>
DB 102,15,219,203 ; pand %xmm3,%xmm1
DB 15,91,201 ; cvtdq2ps %xmm1,%xmm1
- DB 15,89,13,166,31,0,0 ; mulps 0x1fa6(%rip),%xmm1 # 4650 <_sk_callback_sse41+0xbbb>
- DB 102,15,111,21,174,31,0,0 ; movdqa 0x1fae(%rip),%xmm2 # 4660 <_sk_callback_sse41+0xbcb>
+ DB 15,89,13,170,31,0,0 ; mulps 0x1faa(%rip),%xmm1 # 4650 <_sk_callback_sse41+0xbbf>
+ DB 102,15,111,21,178,31,0,0 ; movdqa 0x1fb2(%rip),%xmm2 # 4660 <_sk_callback_sse41+0xbcf>
DB 102,15,219,211 ; pand %xmm3,%xmm2
DB 15,91,210 ; cvtdq2ps %xmm2,%xmm2
- DB 15,89,21,176,31,0,0 ; mulps 0x1fb0(%rip),%xmm2 # 4670 <_sk_callback_sse41+0xbdb>
- DB 102,15,219,29,184,31,0,0 ; pand 0x1fb8(%rip),%xmm3 # 4680 <_sk_callback_sse41+0xbeb>
+ DB 15,89,21,180,31,0,0 ; mulps 0x1fb4(%rip),%xmm2 # 4670 <_sk_callback_sse41+0xbdf>
+ DB 102,15,219,29,188,31,0,0 ; pand 0x1fbc(%rip),%xmm3 # 4680 <_sk_callback_sse41+0xbef>
DB 15,91,219 ; cvtdq2ps %xmm3,%xmm3
- DB 15,89,29,190,31,0,0 ; mulps 0x1fbe(%rip),%xmm3 # 4690 <_sk_callback_sse41+0xbfb>
+ DB 15,89,29,194,31,0,0 ; mulps 0x1fc2(%rip),%xmm3 # 4690 <_sk_callback_sse41+0xbff>
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
@@ -12453,7 +12448,7 @@ PUBLIC _sk_store_4444_sse41
_sk_store_4444_sse41 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 72,139,0 ; mov (%rax),%rax
- DB 68,15,40,5,189,31,0,0 ; movaps 0x1fbd(%rip),%xmm8 # 46a0 <_sk_callback_sse41+0xc0b>
+ DB 68,15,40,5,193,31,0,0 ; movaps 0x1fc1(%rip),%xmm8 # 46a0 <_sk_callback_sse41+0xc0f>
DB 68,15,40,200 ; movaps %xmm0,%xmm9
DB 69,15,89,200 ; mulps %xmm8,%xmm9
DB 102,69,15,91,201 ; cvtps2dq %xmm9,%xmm9
@@ -12481,17 +12476,17 @@ _sk_load_8888_sse41 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 72,139,0 ; mov (%rax),%rax
DB 15,16,28,184 ; movups (%rax,%rdi,4),%xmm3
- DB 15,40,5,92,31,0,0 ; movaps 0x1f5c(%rip),%xmm0 # 46b0 <_sk_callback_sse41+0xc1b>
+ DB 15,40,5,96,31,0,0 ; movaps 0x1f60(%rip),%xmm0 # 46b0 <_sk_callback_sse41+0xc1f>
DB 15,84,195 ; andps %xmm3,%xmm0
DB 15,91,192 ; cvtdq2ps %xmm0,%xmm0
- DB 68,15,40,5,94,31,0,0 ; movaps 0x1f5e(%rip),%xmm8 # 46c0 <_sk_callback_sse41+0xc2b>
+ DB 68,15,40,5,98,31,0,0 ; movaps 0x1f62(%rip),%xmm8 # 46c0 <_sk_callback_sse41+0xc2f>
DB 65,15,89,192 ; mulps %xmm8,%xmm0
DB 15,40,203 ; movaps %xmm3,%xmm1
- DB 102,15,56,0,13,94,31,0,0 ; pshufb 0x1f5e(%rip),%xmm1 # 46d0 <_sk_callback_sse41+0xc3b>
+ DB 102,15,56,0,13,98,31,0,0 ; pshufb 0x1f62(%rip),%xmm1 # 46d0 <_sk_callback_sse41+0xc3f>
DB 15,91,201 ; cvtdq2ps %xmm1,%xmm1
DB 65,15,89,200 ; mulps %xmm8,%xmm1
DB 15,40,211 ; movaps %xmm3,%xmm2
- DB 102,15,56,0,21,91,31,0,0 ; pshufb 0x1f5b(%rip),%xmm2 # 46e0 <_sk_callback_sse41+0xc4b>
+ DB 102,15,56,0,21,95,31,0,0 ; pshufb 0x1f5f(%rip),%xmm2 # 46e0 <_sk_callback_sse41+0xc4f>
DB 15,91,210 ; cvtdq2ps %xmm2,%xmm2
DB 65,15,89,208 ; mulps %xmm8,%xmm2
DB 102,15,114,211,24 ; psrld $0x18,%xmm3
@@ -12520,17 +12515,17 @@ _sk_gather_8888_sse41 LABEL PROC
DB 102,65,15,58,34,28,129,1 ; pinsrd $0x1,(%r9,%rax,4),%xmm3
DB 102,67,15,58,34,28,145,2 ; pinsrd $0x2,(%r9,%r10,4),%xmm3
DB 102,65,15,58,34,28,137,3 ; pinsrd $0x3,(%r9,%rcx,4),%xmm3
- DB 102,15,111,5,244,30,0,0 ; movdqa 0x1ef4(%rip),%xmm0 # 46f0 <_sk_callback_sse41+0xc5b>
+ DB 102,15,111,5,248,30,0,0 ; movdqa 0x1ef8(%rip),%xmm0 # 46f0 <_sk_callback_sse41+0xc5f>
DB 102,15,219,195 ; pand %xmm3,%xmm0
DB 15,91,192 ; cvtdq2ps %xmm0,%xmm0
- DB 68,15,40,5,245,30,0,0 ; movaps 0x1ef5(%rip),%xmm8 # 4700 <_sk_callback_sse41+0xc6b>
+ DB 68,15,40,5,249,30,0,0 ; movaps 0x1ef9(%rip),%xmm8 # 4700 <_sk_callback_sse41+0xc6f>
DB 65,15,89,192 ; mulps %xmm8,%xmm0
DB 102,15,111,203 ; movdqa %xmm3,%xmm1
- DB 102,15,56,0,13,244,30,0,0 ; pshufb 0x1ef4(%rip),%xmm1 # 4710 <_sk_callback_sse41+0xc7b>
+ DB 102,15,56,0,13,248,30,0,0 ; pshufb 0x1ef8(%rip),%xmm1 # 4710 <_sk_callback_sse41+0xc7f>
DB 15,91,201 ; cvtdq2ps %xmm1,%xmm1
DB 65,15,89,200 ; mulps %xmm8,%xmm1
DB 102,15,111,211 ; movdqa %xmm3,%xmm2
- DB 102,15,56,0,21,240,30,0,0 ; pshufb 0x1ef0(%rip),%xmm2 # 4720 <_sk_callback_sse41+0xc8b>
+ DB 102,15,56,0,21,244,30,0,0 ; pshufb 0x1ef4(%rip),%xmm2 # 4720 <_sk_callback_sse41+0xc8f>
DB 15,91,210 ; cvtdq2ps %xmm2,%xmm2
DB 65,15,89,208 ; mulps %xmm8,%xmm2
DB 102,15,114,211,24 ; psrld $0x18,%xmm3
@@ -12543,7 +12538,7 @@ PUBLIC _sk_store_8888_sse41
_sk_store_8888_sse41 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 72,139,0 ; mov (%rax),%rax
- DB 68,15,40,5,220,30,0,0 ; movaps 0x1edc(%rip),%xmm8 # 4730 <_sk_callback_sse41+0xc9b>
+ DB 68,15,40,5,224,30,0,0 ; movaps 0x1ee0(%rip),%xmm8 # 4730 <_sk_callback_sse41+0xc9f>
DB 68,15,40,200 ; movaps %xmm0,%xmm9
DB 69,15,89,200 ; mulps %xmm8,%xmm9
DB 102,69,15,91,201 ; cvtps2dq %xmm9,%xmm9
@@ -12578,18 +12573,18 @@ _sk_load_f16_sse41 LABEL PROC
DB 102,68,15,97,216 ; punpcklwd %xmm0,%xmm11
DB 102,68,15,105,200 ; punpckhwd %xmm0,%xmm9
DB 102,65,15,56,51,203 ; pmovzxwd %xmm11,%xmm1
- DB 102,68,15,111,5,85,30,0,0 ; movdqa 0x1e55(%rip),%xmm8 # 4740 <_sk_callback_sse41+0xcab>
+ DB 102,68,15,111,5,89,30,0,0 ; movdqa 0x1e59(%rip),%xmm8 # 4740 <_sk_callback_sse41+0xcaf>
DB 102,15,111,209 ; movdqa %xmm1,%xmm2
DB 102,65,15,219,208 ; pand %xmm8,%xmm2
DB 102,15,239,202 ; pxor %xmm2,%xmm1
- DB 102,15,111,29,80,30,0,0 ; movdqa 0x1e50(%rip),%xmm3 # 4750 <_sk_callback_sse41+0xcbb>
+ DB 102,15,111,29,84,30,0,0 ; movdqa 0x1e54(%rip),%xmm3 # 4750 <_sk_callback_sse41+0xcbf>
DB 102,15,114,242,16 ; pslld $0x10,%xmm2
DB 102,15,111,193 ; movdqa %xmm1,%xmm0
DB 102,15,56,63,195 ; pmaxud %xmm3,%xmm0
DB 102,15,118,193 ; pcmpeqd %xmm1,%xmm0
DB 102,15,114,241,13 ; pslld $0xd,%xmm1
DB 102,15,235,202 ; por %xmm2,%xmm1
- DB 102,68,15,111,21,60,30,0,0 ; movdqa 0x1e3c(%rip),%xmm10 # 4760 <_sk_callback_sse41+0xccb>
+ DB 102,68,15,111,21,64,30,0,0 ; movdqa 0x1e40(%rip),%xmm10 # 4760 <_sk_callback_sse41+0xccf>
DB 102,65,15,254,202 ; paddd %xmm10,%xmm1
DB 102,15,219,193 ; pand %xmm1,%xmm0
DB 102,65,15,115,219,8 ; psrldq $0x8,%xmm11
@@ -12660,18 +12655,18 @@ _sk_gather_f16_sse41 LABEL PROC
DB 102,68,15,97,218 ; punpcklwd %xmm2,%xmm11
DB 102,68,15,105,202 ; punpckhwd %xmm2,%xmm9
DB 102,65,15,56,51,203 ; pmovzxwd %xmm11,%xmm1
- DB 102,68,15,111,5,250,28,0,0 ; movdqa 0x1cfa(%rip),%xmm8 # 4770 <_sk_callback_sse41+0xcdb>
+ DB 102,68,15,111,5,254,28,0,0 ; movdqa 0x1cfe(%rip),%xmm8 # 4770 <_sk_callback_sse41+0xcdf>
DB 102,15,111,209 ; movdqa %xmm1,%xmm2
DB 102,65,15,219,208 ; pand %xmm8,%xmm2
DB 102,15,239,202 ; pxor %xmm2,%xmm1
- DB 102,15,111,29,245,28,0,0 ; movdqa 0x1cf5(%rip),%xmm3 # 4780 <_sk_callback_sse41+0xceb>
+ DB 102,15,111,29,249,28,0,0 ; movdqa 0x1cf9(%rip),%xmm3 # 4780 <_sk_callback_sse41+0xcef>
DB 102,15,114,242,16 ; pslld $0x10,%xmm2
DB 102,15,111,193 ; movdqa %xmm1,%xmm0
DB 102,15,56,63,195 ; pmaxud %xmm3,%xmm0
DB 102,15,118,193 ; pcmpeqd %xmm1,%xmm0
DB 102,15,114,241,13 ; pslld $0xd,%xmm1
DB 102,15,235,202 ; por %xmm2,%xmm1
- DB 102,68,15,111,21,225,28,0,0 ; movdqa 0x1ce1(%rip),%xmm10 # 4790 <_sk_callback_sse41+0xcfb>
+ DB 102,68,15,111,21,229,28,0,0 ; movdqa 0x1ce5(%rip),%xmm10 # 4790 <_sk_callback_sse41+0xcff>
DB 102,65,15,254,202 ; paddd %xmm10,%xmm1
DB 102,15,219,193 ; pand %xmm1,%xmm0
DB 102,65,15,115,219,8 ; psrldq $0x8,%xmm11
@@ -12717,17 +12712,17 @@ PUBLIC _sk_store_f16_sse41
_sk_store_f16_sse41 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 72,139,0 ; mov (%rax),%rax
- DB 102,68,15,111,21,23,28,0,0 ; movdqa 0x1c17(%rip),%xmm10 # 47a0 <_sk_callback_sse41+0xd0b>
+ DB 102,68,15,111,21,27,28,0,0 ; movdqa 0x1c1b(%rip),%xmm10 # 47a0 <_sk_callback_sse41+0xd0f>
DB 102,68,15,111,224 ; movdqa %xmm0,%xmm12
DB 102,68,15,111,232 ; movdqa %xmm0,%xmm13
DB 102,69,15,219,234 ; pand %xmm10,%xmm13
DB 102,69,15,239,229 ; pxor %xmm13,%xmm12
- DB 102,68,15,111,13,10,28,0,0 ; movdqa 0x1c0a(%rip),%xmm9 # 47b0 <_sk_callback_sse41+0xd1b>
+ DB 102,68,15,111,13,14,28,0,0 ; movdqa 0x1c0e(%rip),%xmm9 # 47b0 <_sk_callback_sse41+0xd1f>
DB 102,65,15,114,213,16 ; psrld $0x10,%xmm13
DB 102,69,15,111,193 ; movdqa %xmm9,%xmm8
DB 102,69,15,102,196 ; pcmpgtd %xmm12,%xmm8
DB 102,65,15,114,212,13 ; psrld $0xd,%xmm12
- DB 102,68,15,111,29,251,27,0,0 ; movdqa 0x1bfb(%rip),%xmm11 # 47c0 <_sk_callback_sse41+0xd2b>
+ DB 102,68,15,111,29,255,27,0,0 ; movdqa 0x1bff(%rip),%xmm11 # 47c0 <_sk_callback_sse41+0xd2f>
DB 102,69,15,235,235 ; por %xmm11,%xmm13
DB 102,69,15,254,236 ; paddd %xmm12,%xmm13
DB 102,69,15,223,197 ; pandn %xmm13,%xmm8
@@ -12795,7 +12790,7 @@ _sk_load_u16_be_sse41 LABEL PROC
DB 102,15,235,200 ; por %xmm0,%xmm1
DB 102,15,56,51,193 ; pmovzxwd %xmm1,%xmm0
DB 15,91,192 ; cvtdq2ps %xmm0,%xmm0
- DB 68,15,40,5,202,26,0,0 ; movaps 0x1aca(%rip),%xmm8 # 47d0 <_sk_callback_sse41+0xd3b>
+ DB 68,15,40,5,206,26,0,0 ; movaps 0x1ace(%rip),%xmm8 # 47d0 <_sk_callback_sse41+0xd3f>
DB 65,15,89,192 ; mulps %xmm8,%xmm0
DB 102,15,111,203 ; movdqa %xmm3,%xmm1
DB 102,15,113,241,8 ; psllw $0x8,%xmm1
@@ -12845,7 +12840,7 @@ _sk_load_rgb_u16_be_sse41 LABEL PROC
DB 102,15,235,193 ; por %xmm1,%xmm0
DB 102,15,56,51,192 ; pmovzxwd %xmm0,%xmm0
DB 15,91,192 ; cvtdq2ps %xmm0,%xmm0
- DB 68,15,40,5,11,26,0,0 ; movaps 0x1a0b(%rip),%xmm8 # 47e0 <_sk_callback_sse41+0xd4b>
+ DB 68,15,40,5,15,26,0,0 ; movaps 0x1a0f(%rip),%xmm8 # 47e0 <_sk_callback_sse41+0xd4f>
DB 65,15,89,192 ; mulps %xmm8,%xmm0
DB 102,15,111,203 ; movdqa %xmm3,%xmm1
DB 102,15,113,241,8 ; psllw $0x8,%xmm1
@@ -12862,14 +12857,14 @@ _sk_load_rgb_u16_be_sse41 LABEL PROC
DB 15,91,210 ; cvtdq2ps %xmm2,%xmm2
DB 65,15,89,208 ; mulps %xmm8,%xmm2
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 15,40,29,210,25,0,0 ; movaps 0x19d2(%rip),%xmm3 # 47f0 <_sk_callback_sse41+0xd5b>
+ DB 15,40,29,214,25,0,0 ; movaps 0x19d6(%rip),%xmm3 # 47f0 <_sk_callback_sse41+0xd5f>
DB 255,224 ; jmpq *%rax
PUBLIC _sk_store_u16_be_sse41
_sk_store_u16_be_sse41 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 72,139,0 ; mov (%rax),%rax
- DB 68,15,40,13,211,25,0,0 ; movaps 0x19d3(%rip),%xmm9 # 4800 <_sk_callback_sse41+0xd6b>
+ DB 68,15,40,13,215,25,0,0 ; movaps 0x19d7(%rip),%xmm9 # 4800 <_sk_callback_sse41+0xd6f>
DB 68,15,40,192 ; movaps %xmm0,%xmm8
DB 69,15,89,193 ; mulps %xmm9,%xmm8
DB 102,69,15,91,192 ; cvtps2dq %xmm8,%xmm8
@@ -13074,10 +13069,10 @@ _sk_mirror_y_sse41 LABEL PROC
PUBLIC _sk_luminance_to_alpha_sse41
_sk_luminance_to_alpha_sse41 LABEL PROC
DB 15,40,218 ; movaps %xmm2,%xmm3
- DB 15,89,5,241,22,0,0 ; mulps 0x16f1(%rip),%xmm0 # 4810 <_sk_callback_sse41+0xd7b>
- DB 15,89,13,250,22,0,0 ; mulps 0x16fa(%rip),%xmm1 # 4820 <_sk_callback_sse41+0xd8b>
+ DB 15,89,5,245,22,0,0 ; mulps 0x16f5(%rip),%xmm0 # 4810 <_sk_callback_sse41+0xd7f>
+ DB 15,89,13,254,22,0,0 ; mulps 0x16fe(%rip),%xmm1 # 4820 <_sk_callback_sse41+0xd8f>
DB 15,88,200 ; addps %xmm0,%xmm1
- DB 15,89,29,0,23,0,0 ; mulps 0x1700(%rip),%xmm3 # 4830 <_sk_callback_sse41+0xd9b>
+ DB 15,89,29,4,23,0,0 ; mulps 0x1704(%rip),%xmm3 # 4830 <_sk_callback_sse41+0xd9f>
DB 15,88,217 ; addps %xmm1,%xmm3
DB 72,173 ; lods %ds:(%rsi),%rax
DB 15,87,192 ; xorps %xmm0,%xmm0
@@ -13300,7 +13295,7 @@ _sk_linear_gradient_sse41 LABEL PROC
DB 69,15,198,237,0 ; shufps $0x0,%xmm13,%xmm13
DB 72,139,8 ; mov (%rax),%rcx
DB 72,133,201 ; test %rcx,%rcx
- DB 15,132,4,1,0,0 ; je 35d8 <_sk_linear_gradient_sse41+0x13e>
+ DB 15,132,4,1,0,0 ; je 35d4 <_sk_linear_gradient_sse41+0x13e>
DB 72,131,236,88 ; sub $0x58,%rsp
DB 15,41,36,36 ; movaps %xmm4,(%rsp)
DB 15,41,108,36,16 ; movaps %xmm5,0x10(%rsp)
@@ -13351,13 +13346,13 @@ _sk_linear_gradient_sse41 LABEL PROC
DB 15,40,196 ; movaps %xmm4,%xmm0
DB 72,131,192,36 ; add $0x24,%rax
DB 72,255,201 ; dec %rcx
- DB 15,133,65,255,255,255 ; jne 3500 <_sk_linear_gradient_sse41+0x66>
+ DB 15,133,65,255,255,255 ; jne 34fc <_sk_linear_gradient_sse41+0x66>
DB 15,40,124,36,48 ; movaps 0x30(%rsp),%xmm7
DB 15,40,116,36,32 ; movaps 0x20(%rsp),%xmm6
DB 15,40,108,36,16 ; movaps 0x10(%rsp),%xmm5
DB 15,40,36,36 ; movaps (%rsp),%xmm4
DB 72,131,196,88 ; add $0x58,%rsp
- DB 235,13 ; jmp 35e5 <_sk_linear_gradient_sse41+0x14b>
+ DB 235,13 ; jmp 35e1 <_sk_linear_gradient_sse41+0x14b>
DB 15,87,201 ; xorps %xmm1,%xmm1
DB 15,87,210 ; xorps %xmm2,%xmm2
DB 15,87,219 ; xorps %xmm3,%xmm3
@@ -13422,26 +13417,26 @@ _sk_xy_to_polar_unit_sse41 LABEL PROC
DB 69,15,94,226 ; divps %xmm10,%xmm12
DB 69,15,40,236 ; movaps %xmm12,%xmm13
DB 69,15,89,237 ; mulps %xmm13,%xmm13
- DB 68,15,40,21,131,17,0,0 ; movaps 0x1183(%rip),%xmm10 # 4840 <_sk_callback_sse41+0xdab>
+ DB 68,15,40,21,135,17,0,0 ; movaps 0x1187(%rip),%xmm10 # 4840 <_sk_callback_sse41+0xdaf>
DB 69,15,89,213 ; mulps %xmm13,%xmm10
- DB 68,15,88,21,135,17,0,0 ; addps 0x1187(%rip),%xmm10 # 4850 <_sk_callback_sse41+0xdbb>
+ DB 68,15,88,21,139,17,0,0 ; addps 0x118b(%rip),%xmm10 # 4850 <_sk_callback_sse41+0xdbf>
DB 69,15,89,213 ; mulps %xmm13,%xmm10
- DB 68,15,88,21,139,17,0,0 ; addps 0x118b(%rip),%xmm10 # 4860 <_sk_callback_sse41+0xdcb>
+ DB 68,15,88,21,143,17,0,0 ; addps 0x118f(%rip),%xmm10 # 4860 <_sk_callback_sse41+0xdcf>
DB 69,15,89,213 ; mulps %xmm13,%xmm10
- DB 68,15,88,21,143,17,0,0 ; addps 0x118f(%rip),%xmm10 # 4870 <_sk_callback_sse41+0xddb>
+ DB 68,15,88,21,147,17,0,0 ; addps 0x1193(%rip),%xmm10 # 4870 <_sk_callback_sse41+0xddf>
DB 69,15,89,212 ; mulps %xmm12,%xmm10
DB 65,15,194,195,1 ; cmpltps %xmm11,%xmm0
- DB 68,15,40,29,142,17,0,0 ; movaps 0x118e(%rip),%xmm11 # 4880 <_sk_callback_sse41+0xdeb>
+ DB 68,15,40,29,146,17,0,0 ; movaps 0x1192(%rip),%xmm11 # 4880 <_sk_callback_sse41+0xdef>
DB 69,15,92,218 ; subps %xmm10,%xmm11
DB 102,69,15,56,20,211 ; blendvps %xmm0,%xmm11,%xmm10
DB 69,15,194,200,1 ; cmpltps %xmm8,%xmm9
- DB 68,15,40,29,135,17,0,0 ; movaps 0x1187(%rip),%xmm11 # 4890 <_sk_callback_sse41+0xdfb>
+ DB 68,15,40,29,139,17,0,0 ; movaps 0x118b(%rip),%xmm11 # 4890 <_sk_callback_sse41+0xdff>
DB 69,15,92,218 ; subps %xmm10,%xmm11
DB 65,15,40,193 ; movaps %xmm9,%xmm0
DB 102,69,15,56,20,211 ; blendvps %xmm0,%xmm11,%xmm10
DB 15,40,193 ; movaps %xmm1,%xmm0
DB 65,15,194,192,1 ; cmpltps %xmm8,%xmm0
- DB 68,15,40,13,121,17,0,0 ; movaps 0x1179(%rip),%xmm9 # 48a0 <_sk_callback_sse41+0xe0b>
+ DB 68,15,40,13,125,17,0,0 ; movaps 0x117d(%rip),%xmm9 # 48a0 <_sk_callback_sse41+0xe0f>
DB 69,15,92,202 ; subps %xmm10,%xmm9
DB 102,69,15,56,20,209 ; blendvps %xmm0,%xmm9,%xmm10
DB 69,15,194,194,7 ; cmpordps %xmm10,%xmm8
@@ -13453,7 +13448,7 @@ _sk_xy_to_polar_unit_sse41 LABEL PROC
PUBLIC _sk_save_xy_sse41
_sk_save_xy_sse41 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 68,15,40,5,100,17,0,0 ; movaps 0x1164(%rip),%xmm8 # 48b0 <_sk_callback_sse41+0xe1b>
+ DB 68,15,40,5,104,17,0,0 ; movaps 0x1168(%rip),%xmm8 # 48b0 <_sk_callback_sse41+0xe1f>
DB 15,17,0 ; movups %xmm0,(%rax)
DB 68,15,40,200 ; movaps %xmm0,%xmm9
DB 69,15,88,200 ; addps %xmm8,%xmm9
@@ -13493,8 +13488,8 @@ _sk_bilinear_nx_sse41 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 15,16,0 ; movups (%rax),%xmm0
DB 68,15,16,64,64 ; movups 0x40(%rax),%xmm8
- DB 15,88,5,230,16,0,0 ; addps 0x10e6(%rip),%xmm0 # 48c0 <_sk_callback_sse41+0xe2b>
- DB 68,15,40,13,238,16,0,0 ; movaps 0x10ee(%rip),%xmm9 # 48d0 <_sk_callback_sse41+0xe3b>
+ DB 15,88,5,234,16,0,0 ; addps 0x10ea(%rip),%xmm0 # 48c0 <_sk_callback_sse41+0xe2f>
+ DB 68,15,40,13,242,16,0,0 ; movaps 0x10f2(%rip),%xmm9 # 48d0 <_sk_callback_sse41+0xe3f>
DB 69,15,92,200 ; subps %xmm8,%xmm9
DB 68,15,17,136,128,0,0,0 ; movups %xmm9,0x80(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
@@ -13505,7 +13500,7 @@ _sk_bilinear_px_sse41 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 15,16,0 ; movups (%rax),%xmm0
DB 68,15,16,64,64 ; movups 0x40(%rax),%xmm8
- DB 15,88,5,221,16,0,0 ; addps 0x10dd(%rip),%xmm0 # 48e0 <_sk_callback_sse41+0xe4b>
+ DB 15,88,5,225,16,0,0 ; addps 0x10e1(%rip),%xmm0 # 48e0 <_sk_callback_sse41+0xe4f>
DB 68,15,17,128,128,0,0,0 ; movups %xmm8,0x80(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
@@ -13515,8 +13510,8 @@ _sk_bilinear_ny_sse41 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 15,16,72,32 ; movups 0x20(%rax),%xmm1
DB 68,15,16,64,96 ; movups 0x60(%rax),%xmm8
- DB 15,88,13,207,16,0,0 ; addps 0x10cf(%rip),%xmm1 # 48f0 <_sk_callback_sse41+0xe5b>
- DB 68,15,40,13,215,16,0,0 ; movaps 0x10d7(%rip),%xmm9 # 4900 <_sk_callback_sse41+0xe6b>
+ DB 15,88,13,211,16,0,0 ; addps 0x10d3(%rip),%xmm1 # 48f0 <_sk_callback_sse41+0xe5f>
+ DB 68,15,40,13,219,16,0,0 ; movaps 0x10db(%rip),%xmm9 # 4900 <_sk_callback_sse41+0xe6f>
DB 69,15,92,200 ; subps %xmm8,%xmm9
DB 68,15,17,136,160,0,0,0 ; movups %xmm9,0xa0(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
@@ -13527,7 +13522,7 @@ _sk_bilinear_py_sse41 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 15,16,72,32 ; movups 0x20(%rax),%xmm1
DB 68,15,16,64,96 ; movups 0x60(%rax),%xmm8
- DB 15,88,13,197,16,0,0 ; addps 0x10c5(%rip),%xmm1 # 4910 <_sk_callback_sse41+0xe7b>
+ DB 15,88,13,201,16,0,0 ; addps 0x10c9(%rip),%xmm1 # 4910 <_sk_callback_sse41+0xe7f>
DB 68,15,17,128,160,0,0,0 ; movups %xmm8,0xa0(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
@@ -13537,13 +13532,13 @@ _sk_bicubic_n3x_sse41 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 15,16,0 ; movups (%rax),%xmm0
DB 68,15,16,64,64 ; movups 0x40(%rax),%xmm8
- DB 15,88,5,184,16,0,0 ; addps 0x10b8(%rip),%xmm0 # 4920 <_sk_callback_sse41+0xe8b>
- DB 68,15,40,13,192,16,0,0 ; movaps 0x10c0(%rip),%xmm9 # 4930 <_sk_callback_sse41+0xe9b>
+ DB 15,88,5,188,16,0,0 ; addps 0x10bc(%rip),%xmm0 # 4920 <_sk_callback_sse41+0xe8f>
+ DB 68,15,40,13,196,16,0,0 ; movaps 0x10c4(%rip),%xmm9 # 4930 <_sk_callback_sse41+0xe9f>
DB 69,15,92,200 ; subps %xmm8,%xmm9
DB 69,15,40,193 ; movaps %xmm9,%xmm8
DB 69,15,89,192 ; mulps %xmm8,%xmm8
- DB 68,15,89,13,188,16,0,0 ; mulps 0x10bc(%rip),%xmm9 # 4940 <_sk_callback_sse41+0xeab>
- DB 68,15,88,13,196,16,0,0 ; addps 0x10c4(%rip),%xmm9 # 4950 <_sk_callback_sse41+0xebb>
+ DB 68,15,89,13,192,16,0,0 ; mulps 0x10c0(%rip),%xmm9 # 4940 <_sk_callback_sse41+0xeaf>
+ DB 68,15,88,13,200,16,0,0 ; addps 0x10c8(%rip),%xmm9 # 4950 <_sk_callback_sse41+0xebf>
DB 69,15,89,200 ; mulps %xmm8,%xmm9
DB 68,15,17,136,128,0,0,0 ; movups %xmm9,0x80(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
@@ -13554,16 +13549,16 @@ _sk_bicubic_n1x_sse41 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 15,16,0 ; movups (%rax),%xmm0
DB 68,15,16,64,64 ; movups 0x40(%rax),%xmm8
- DB 15,88,5,179,16,0,0 ; addps 0x10b3(%rip),%xmm0 # 4960 <_sk_callback_sse41+0xecb>
- DB 68,15,40,13,187,16,0,0 ; movaps 0x10bb(%rip),%xmm9 # 4970 <_sk_callback_sse41+0xedb>
+ DB 15,88,5,183,16,0,0 ; addps 0x10b7(%rip),%xmm0 # 4960 <_sk_callback_sse41+0xecf>
+ DB 68,15,40,13,191,16,0,0 ; movaps 0x10bf(%rip),%xmm9 # 4970 <_sk_callback_sse41+0xedf>
DB 69,15,92,200 ; subps %xmm8,%xmm9
- DB 68,15,40,5,191,16,0,0 ; movaps 0x10bf(%rip),%xmm8 # 4980 <_sk_callback_sse41+0xeeb>
+ DB 68,15,40,5,195,16,0,0 ; movaps 0x10c3(%rip),%xmm8 # 4980 <_sk_callback_sse41+0xeef>
DB 69,15,89,193 ; mulps %xmm9,%xmm8
- DB 68,15,88,5,195,16,0,0 ; addps 0x10c3(%rip),%xmm8 # 4990 <_sk_callback_sse41+0xefb>
+ DB 68,15,88,5,199,16,0,0 ; addps 0x10c7(%rip),%xmm8 # 4990 <_sk_callback_sse41+0xeff>
DB 69,15,89,193 ; mulps %xmm9,%xmm8
- DB 68,15,88,5,199,16,0,0 ; addps 0x10c7(%rip),%xmm8 # 49a0 <_sk_callback_sse41+0xf0b>
+ DB 68,15,88,5,203,16,0,0 ; addps 0x10cb(%rip),%xmm8 # 49a0 <_sk_callback_sse41+0xf0f>
DB 69,15,89,193 ; mulps %xmm9,%xmm8
- DB 68,15,88,5,203,16,0,0 ; addps 0x10cb(%rip),%xmm8 # 49b0 <_sk_callback_sse41+0xf1b>
+ DB 68,15,88,5,207,16,0,0 ; addps 0x10cf(%rip),%xmm8 # 49b0 <_sk_callback_sse41+0xf1f>
DB 68,15,17,128,128,0,0,0 ; movups %xmm8,0x80(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
@@ -13571,17 +13566,17 @@ _sk_bicubic_n1x_sse41 LABEL PROC
PUBLIC _sk_bicubic_p1x_sse41
_sk_bicubic_p1x_sse41 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 68,15,40,5,197,16,0,0 ; movaps 0x10c5(%rip),%xmm8 # 49c0 <_sk_callback_sse41+0xf2b>
+ DB 68,15,40,5,201,16,0,0 ; movaps 0x10c9(%rip),%xmm8 # 49c0 <_sk_callback_sse41+0xf2f>
DB 15,16,0 ; movups (%rax),%xmm0
DB 68,15,16,72,64 ; movups 0x40(%rax),%xmm9
DB 65,15,88,192 ; addps %xmm8,%xmm0
- DB 68,15,40,21,193,16,0,0 ; movaps 0x10c1(%rip),%xmm10 # 49d0 <_sk_callback_sse41+0xf3b>
+ DB 68,15,40,21,197,16,0,0 ; movaps 0x10c5(%rip),%xmm10 # 49d0 <_sk_callback_sse41+0xf3f>
DB 69,15,89,209 ; mulps %xmm9,%xmm10
- DB 68,15,88,21,197,16,0,0 ; addps 0x10c5(%rip),%xmm10 # 49e0 <_sk_callback_sse41+0xf4b>
+ DB 68,15,88,21,201,16,0,0 ; addps 0x10c9(%rip),%xmm10 # 49e0 <_sk_callback_sse41+0xf4f>
DB 69,15,89,209 ; mulps %xmm9,%xmm10
DB 69,15,88,208 ; addps %xmm8,%xmm10
DB 69,15,89,209 ; mulps %xmm9,%xmm10
- DB 68,15,88,21,193,16,0,0 ; addps 0x10c1(%rip),%xmm10 # 49f0 <_sk_callback_sse41+0xf5b>
+ DB 68,15,88,21,197,16,0,0 ; addps 0x10c5(%rip),%xmm10 # 49f0 <_sk_callback_sse41+0xf5f>
DB 68,15,17,144,128,0,0,0 ; movups %xmm10,0x80(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
@@ -13591,11 +13586,11 @@ _sk_bicubic_p3x_sse41 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 15,16,0 ; movups (%rax),%xmm0
DB 68,15,16,64,64 ; movups 0x40(%rax),%xmm8
- DB 15,88,5,180,16,0,0 ; addps 0x10b4(%rip),%xmm0 # 4a00 <_sk_callback_sse41+0xf6b>
+ DB 15,88,5,184,16,0,0 ; addps 0x10b8(%rip),%xmm0 # 4a00 <_sk_callback_sse41+0xf6f>
DB 69,15,40,200 ; movaps %xmm8,%xmm9
DB 69,15,89,201 ; mulps %xmm9,%xmm9
- DB 68,15,89,5,180,16,0,0 ; mulps 0x10b4(%rip),%xmm8 # 4a10 <_sk_callback_sse41+0xf7b>
- DB 68,15,88,5,188,16,0,0 ; addps 0x10bc(%rip),%xmm8 # 4a20 <_sk_callback_sse41+0xf8b>
+ DB 68,15,89,5,184,16,0,0 ; mulps 0x10b8(%rip),%xmm8 # 4a10 <_sk_callback_sse41+0xf7f>
+ DB 68,15,88,5,192,16,0,0 ; addps 0x10c0(%rip),%xmm8 # 4a20 <_sk_callback_sse41+0xf8f>
DB 69,15,89,193 ; mulps %xmm9,%xmm8
DB 68,15,17,128,128,0,0,0 ; movups %xmm8,0x80(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
@@ -13606,13 +13601,13 @@ _sk_bicubic_n3y_sse41 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 15,16,72,32 ; movups 0x20(%rax),%xmm1
DB 68,15,16,64,96 ; movups 0x60(%rax),%xmm8
- DB 15,88,13,170,16,0,0 ; addps 0x10aa(%rip),%xmm1 # 4a30 <_sk_callback_sse41+0xf9b>
- DB 68,15,40,13,178,16,0,0 ; movaps 0x10b2(%rip),%xmm9 # 4a40 <_sk_callback_sse41+0xfab>
+ DB 15,88,13,174,16,0,0 ; addps 0x10ae(%rip),%xmm1 # 4a30 <_sk_callback_sse41+0xf9f>
+ DB 68,15,40,13,182,16,0,0 ; movaps 0x10b6(%rip),%xmm9 # 4a40 <_sk_callback_sse41+0xfaf>
DB 69,15,92,200 ; subps %xmm8,%xmm9
DB 69,15,40,193 ; movaps %xmm9,%xmm8
DB 69,15,89,192 ; mulps %xmm8,%xmm8
- DB 68,15,89,13,174,16,0,0 ; mulps 0x10ae(%rip),%xmm9 # 4a50 <_sk_callback_sse41+0xfbb>
- DB 68,15,88,13,182,16,0,0 ; addps 0x10b6(%rip),%xmm9 # 4a60 <_sk_callback_sse41+0xfcb>
+ DB 68,15,89,13,178,16,0,0 ; mulps 0x10b2(%rip),%xmm9 # 4a50 <_sk_callback_sse41+0xfbf>
+ DB 68,15,88,13,186,16,0,0 ; addps 0x10ba(%rip),%xmm9 # 4a60 <_sk_callback_sse41+0xfcf>
DB 69,15,89,200 ; mulps %xmm8,%xmm9
DB 68,15,17,136,160,0,0,0 ; movups %xmm9,0xa0(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
@@ -13623,16 +13618,16 @@ _sk_bicubic_n1y_sse41 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 15,16,72,32 ; movups 0x20(%rax),%xmm1
DB 68,15,16,64,96 ; movups 0x60(%rax),%xmm8
- DB 15,88,13,164,16,0,0 ; addps 0x10a4(%rip),%xmm1 # 4a70 <_sk_callback_sse41+0xfdb>
- DB 68,15,40,13,172,16,0,0 ; movaps 0x10ac(%rip),%xmm9 # 4a80 <_sk_callback_sse41+0xfeb>
+ DB 15,88,13,168,16,0,0 ; addps 0x10a8(%rip),%xmm1 # 4a70 <_sk_callback_sse41+0xfdf>
+ DB 68,15,40,13,176,16,0,0 ; movaps 0x10b0(%rip),%xmm9 # 4a80 <_sk_callback_sse41+0xfef>
DB 69,15,92,200 ; subps %xmm8,%xmm9
- DB 68,15,40,5,176,16,0,0 ; movaps 0x10b0(%rip),%xmm8 # 4a90 <_sk_callback_sse41+0xffb>
+ DB 68,15,40,5,180,16,0,0 ; movaps 0x10b4(%rip),%xmm8 # 4a90 <_sk_callback_sse41+0xfff>
DB 69,15,89,193 ; mulps %xmm9,%xmm8
- DB 68,15,88,5,180,16,0,0 ; addps 0x10b4(%rip),%xmm8 # 4aa0 <_sk_callback_sse41+0x100b>
+ DB 68,15,88,5,184,16,0,0 ; addps 0x10b8(%rip),%xmm8 # 4aa0 <_sk_callback_sse41+0x100f>
DB 69,15,89,193 ; mulps %xmm9,%xmm8
- DB 68,15,88,5,184,16,0,0 ; addps 0x10b8(%rip),%xmm8 # 4ab0 <_sk_callback_sse41+0x101b>
+ DB 68,15,88,5,188,16,0,0 ; addps 0x10bc(%rip),%xmm8 # 4ab0 <_sk_callback_sse41+0x101f>
DB 69,15,89,193 ; mulps %xmm9,%xmm8
- DB 68,15,88,5,188,16,0,0 ; addps 0x10bc(%rip),%xmm8 # 4ac0 <_sk_callback_sse41+0x102b>
+ DB 68,15,88,5,192,16,0,0 ; addps 0x10c0(%rip),%xmm8 # 4ac0 <_sk_callback_sse41+0x102f>
DB 68,15,17,128,160,0,0,0 ; movups %xmm8,0xa0(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
@@ -13640,17 +13635,17 @@ _sk_bicubic_n1y_sse41 LABEL PROC
PUBLIC _sk_bicubic_p1y_sse41
_sk_bicubic_p1y_sse41 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 68,15,40,5,182,16,0,0 ; movaps 0x10b6(%rip),%xmm8 # 4ad0 <_sk_callback_sse41+0x103b>
+ DB 68,15,40,5,186,16,0,0 ; movaps 0x10ba(%rip),%xmm8 # 4ad0 <_sk_callback_sse41+0x103f>
DB 15,16,72,32 ; movups 0x20(%rax),%xmm1
DB 68,15,16,72,96 ; movups 0x60(%rax),%xmm9
DB 65,15,88,200 ; addps %xmm8,%xmm1
- DB 68,15,40,21,177,16,0,0 ; movaps 0x10b1(%rip),%xmm10 # 4ae0 <_sk_callback_sse41+0x104b>
+ DB 68,15,40,21,181,16,0,0 ; movaps 0x10b5(%rip),%xmm10 # 4ae0 <_sk_callback_sse41+0x104f>
DB 69,15,89,209 ; mulps %xmm9,%xmm10
- DB 68,15,88,21,181,16,0,0 ; addps 0x10b5(%rip),%xmm10 # 4af0 <_sk_callback_sse41+0x105b>
+ DB 68,15,88,21,185,16,0,0 ; addps 0x10b9(%rip),%xmm10 # 4af0 <_sk_callback_sse41+0x105f>
DB 69,15,89,209 ; mulps %xmm9,%xmm10
DB 69,15,88,208 ; addps %xmm8,%xmm10
DB 69,15,89,209 ; mulps %xmm9,%xmm10
- DB 68,15,88,21,177,16,0,0 ; addps 0x10b1(%rip),%xmm10 # 4b00 <_sk_callback_sse41+0x106b>
+ DB 68,15,88,21,181,16,0,0 ; addps 0x10b5(%rip),%xmm10 # 4b00 <_sk_callback_sse41+0x106f>
DB 68,15,17,144,160,0,0,0 ; movups %xmm10,0xa0(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
@@ -13660,11 +13655,11 @@ _sk_bicubic_p3y_sse41 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 15,16,72,32 ; movups 0x20(%rax),%xmm1
DB 68,15,16,64,96 ; movups 0x60(%rax),%xmm8
- DB 15,88,13,163,16,0,0 ; addps 0x10a3(%rip),%xmm1 # 4b10 <_sk_callback_sse41+0x107b>
+ DB 15,88,13,167,16,0,0 ; addps 0x10a7(%rip),%xmm1 # 4b10 <_sk_callback_sse41+0x107f>
DB 69,15,40,200 ; movaps %xmm8,%xmm9
DB 69,15,89,201 ; mulps %xmm9,%xmm9
- DB 68,15,89,5,163,16,0,0 ; mulps 0x10a3(%rip),%xmm8 # 4b20 <_sk_callback_sse41+0x108b>
- DB 68,15,88,5,171,16,0,0 ; addps 0x10ab(%rip),%xmm8 # 4b30 <_sk_callback_sse41+0x109b>
+ DB 68,15,89,5,167,16,0,0 ; mulps 0x10a7(%rip),%xmm8 # 4b20 <_sk_callback_sse41+0x108f>
+ DB 68,15,88,5,175,16,0,0 ; addps 0x10af(%rip),%xmm8 # 4b30 <_sk_callback_sse41+0x109f>
DB 69,15,89,193 ; mulps %xmm9,%xmm8
DB 68,15,17,128,160,0,0,0 ; movups %xmm8,0xa0(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
@@ -13763,15 +13758,16 @@ ALIGN 16
DB 0,0 ; add %al,(%rax)
DB 2,0 ; add (%rax),%al
DB 0,0 ; add %al,(%rax)
- DB 33,8 ; and %ecx,(%rax)
- DB 130 ; (bad)
- DB 60,33 ; cmp $0x21,%al
- DB 8,130,60,33,8,130 ; or %al,-0x7df7dec4(%rdx)
- DB 60,33 ; cmp $0x21,%al
- DB 8,130,60,0,0,0 ; or %al,0x3c(%rdx)
- DB 191,0,0,0,191 ; mov $0xbf000000,%edi
DB 0,0 ; add %al,(%rax)
- DB 0,191,0,0,0,191 ; add %bh,-0x41000000(%rdi)
+ DB 128,60,0,0 ; cmpb $0x0,(%rax,%rax,1)
+ DB 128,60,0,0 ; cmpb $0x0,(%rax,%rax,1)
+ DB 128,60,0,0 ; cmpb $0x0,(%rax,%rax,1)
+ DB 128,60,0,0 ; cmpb $0x0,(%rax,%rax,1)
+ DB 252 ; cld
+ DB 190,0,0,252,190 ; mov $0xbefc0000,%esi
+ DB 0,0 ; add %al,(%rax)
+ DB 252 ; cld
+ DB 190,0,0,252,190 ; mov $0xbefc0000,%esi
DB 0,0 ; add %al,(%rax)
DB 128,63,0 ; cmpb $0x0,(%rdi)
DB 0,128,63,0,0,128 ; add %al,-0x7fffffc1(%rax)
@@ -14137,10 +14133,10 @@ ALIGN 16
DB 0,1 ; add %al,(%rcx)
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,5,255,255,255,9 ; incl 0x9ffffff(%rip) # a003f38 <_sk_callback_sse41+0xa0004a3>
+ DB 255,5,255,255,255,9 ; incl 0x9ffffff(%rip) # a003f38 <_sk_callback_sse41+0xa0004a7>
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,13,255,255,255,2 ; decl 0x2ffffff(%rip) # 3003f40 <_sk_callback_sse41+0x30004ab>
+ DB 255,13,255,255,255,2 ; decl 0x2ffffff(%rip) # 3003f40 <_sk_callback_sse41+0x30004af>
DB 255 ; (bad)
DB 255 ; (bad)
DB 255,6 ; incl (%rsi)
@@ -14255,7 +14251,7 @@ ALIGN 16
DB 249 ; stc
DB 68,180,62 ; rex.R mov $0x3e,%spl
DB 163,233,220,63,163,233,220,63,163 ; movabs %eax,0xa33fdce9a33fdce9
- DB 233,220,63,163,233 ; jmpq ffffffffe9a3803a <_sk_callback_sse41+0xffffffffe9a345a5>
+ DB 233,220,63,163,233 ; jmpq ffffffffe9a3803a <_sk_callback_sse41+0xffffffffe9a345a9>
DB 220,63 ; fdivrl (%rdi)
DB 81 ; push %rcx
DB 140,242 ; mov %?,%edx
@@ -14351,7 +14347,7 @@ ALIGN 16
DB 249 ; stc
DB 68,180,62 ; rex.R mov $0x3e,%spl
DB 163,233,220,63,163,233,220,63,163 ; movabs %eax,0xa33fdce9a33fdce9
- DB 233,220,63,163,233 ; jmpq ffffffffe9a3810a <_sk_callback_sse41+0xffffffffe9a34675>
+ DB 233,220,63,163,233 ; jmpq ffffffffe9a3810a <_sk_callback_sse41+0xffffffffe9a34679>
DB 220,63 ; fdivrl (%rdi)
DB 81 ; push %rcx
DB 140,242 ; mov %?,%edx
@@ -14447,7 +14443,7 @@ ALIGN 16
DB 249 ; stc
DB 68,180,62 ; rex.R mov $0x3e,%spl
DB 163,233,220,63,163,233,220,63,163 ; movabs %eax,0xa33fdce9a33fdce9
- DB 233,220,63,163,233 ; jmpq ffffffffe9a381da <_sk_callback_sse41+0xffffffffe9a34745>
+ DB 233,220,63,163,233 ; jmpq ffffffffe9a381da <_sk_callback_sse41+0xffffffffe9a34749>
DB 220,63 ; fdivrl (%rdi)
DB 81 ; push %rcx
DB 140,242 ; mov %?,%edx
@@ -14543,7 +14539,7 @@ ALIGN 16
DB 249 ; stc
DB 68,180,62 ; rex.R mov $0x3e,%spl
DB 163,233,220,63,163,233,220,63,163 ; movabs %eax,0xa33fdce9a33fdce9
- DB 233,220,63,163,233 ; jmpq ffffffffe9a382aa <_sk_callback_sse41+0xffffffffe9a34815>
+ DB 233,220,63,163,233 ; jmpq ffffffffe9a382aa <_sk_callback_sse41+0xffffffffe9a34819>
DB 220,63 ; fdivrl (%rdi)
DB 81 ; push %rcx
DB 140,242 ; mov %?,%edx
@@ -14701,7 +14697,7 @@ ALIGN 16
DB 5,255,255,255,9 ; add $0x9ffffff,%eax
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,13,255,255,255,2 ; decl 0x2ffffff(%rip) # 3004490 <_sk_callback_sse41+0x30009fb>
+ DB 255,13,255,255,255,2 ; decl 0x2ffffff(%rip) # 3004490 <_sk_callback_sse41+0x30009ff>
DB 255 ; (bad)
DB 255 ; (bad)
DB 255,6 ; incl (%rsi)
@@ -14943,7 +14939,7 @@ ALIGN 16
DB 5,255,255,255,9 ; add $0x9ffffff,%eax
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,13,255,255,255,2 ; decl 0x2ffffff(%rip) # 30046e0 <_sk_callback_sse41+0x3000c4b>
+ DB 255,13,255,255,255,2 ; decl 0x2ffffff(%rip) # 30046e0 <_sk_callback_sse41+0x3000c4f>
DB 255 ; (bad)
DB 255 ; (bad)
DB 255,6 ; incl (%rsi)
@@ -14970,7 +14966,7 @@ ALIGN 16
DB 5,255,255,255,9 ; add $0x9ffffff,%eax
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,13,255,255,255,2 ; decl 0x2ffffff(%rip) # 3004720 <_sk_callback_sse41+0x3000c8b>
+ DB 255,13,255,255,255,2 ; decl 0x2ffffff(%rip) # 3004720 <_sk_callback_sse41+0x3000c8f>
DB 255 ; (bad)
DB 255 ; (bad)
DB 255,6 ; incl (%rsi)
@@ -15245,7 +15241,7 @@ ALIGN 16
DB 0,0 ; add %al,(%rax)
DB 0,63 ; add %bh,(%rdi)
DB 57,142,99,61,57,142 ; cmp %ecx,-0x71c6c29d(%rsi)
- DB 99,61,57,142,99,61 ; movslq 0x3d638e39(%rip),%edi # 3d63d7f5 <_sk_callback_sse41+0x3d639d60>
+ DB 99,61,57,142,99,61 ; movslq 0x3d638e39(%rip),%edi # 3d63d7f5 <_sk_callback_sse41+0x3d639d64>
DB 57,142,99,61,0,0 ; cmp %ecx,0x3d63(%rsi)
DB 0,63 ; add %bh,(%rdi)
DB 0,0 ; add %al,(%rax)
@@ -15271,7 +15267,7 @@ ALIGN 16
DB 0,192 ; add %al,%al
DB 63 ; (bad)
DB 57,142,99,61,57,142 ; cmp %ecx,-0x71c6c29d(%rsi)
- DB 99,61,57,142,99,61 ; movslq 0x3d638e39(%rip),%edi # 3d63d835 <_sk_callback_sse41+0x3d639da0>
+ DB 99,61,57,142,99,61 ; movslq 0x3d638e39(%rip),%edi # 3d63d835 <_sk_callback_sse41+0x3d639da4>
DB 57,142,99,61,0,0 ; cmp %ecx,0x3d63(%rsi)
DB 192,63,0 ; sarb $0x0,(%rdi)
DB 0,192 ; add %al,%al
@@ -15355,7 +15351,7 @@ ALIGN 16
DB 0,0 ; add %al,(%rax)
DB 0,63 ; add %bh,(%rdi)
DB 57,142,99,61,57,142 ; cmp %ecx,-0x71c6c29d(%rsi)
- DB 99,61,57,142,99,61 ; movslq 0x3d638e39(%rip),%edi # 3d63d905 <_sk_callback_sse41+0x3d639e70>
+ DB 99,61,57,142,99,61 ; movslq 0x3d638e39(%rip),%edi # 3d63d905 <_sk_callback_sse41+0x3d639e74>
DB 57,142,99,61,0,0 ; cmp %ecx,0x3d63(%rsi)
DB 0,63 ; add %bh,(%rdi)
DB 0,0 ; add %al,(%rax)
@@ -15381,7 +15377,7 @@ ALIGN 16
DB 0,192 ; add %al,%al
DB 63 ; (bad)
DB 57,142,99,61,57,142 ; cmp %ecx,-0x71c6c29d(%rsi)
- DB 99,61,57,142,99,61 ; movslq 0x3d638e39(%rip),%edi # 3d63d945 <_sk_callback_sse41+0x3d639eb0>
+ DB 99,61,57,142,99,61 ; movslq 0x3d638e39(%rip),%edi # 3d63d945 <_sk_callback_sse41+0x3d639eb4>
DB 57,142,99,61,0,0 ; cmp %ecx,0x3d63(%rsi)
DB 192,63,0 ; sarb $0x0,(%rdi)
DB 0,192 ; add %al,%al
@@ -15392,11 +15388,11 @@ ALIGN 16
DB 63 ; (bad)
DB 114,28 ; jb 4b3e <.literal16+0xffe>
DB 199 ; (bad)
- DB 62,114,28 ; jb,pt 4b42 <_sk_callback_sse41+0x10ad>
+ DB 62,114,28 ; jb,pt 4b42 <_sk_callback_sse41+0x10b1>
DB 199 ; (bad)
- DB 62,114,28 ; jb,pt 4b46 <_sk_callback_sse41+0x10b1>
+ DB 62,114,28 ; jb,pt 4b46 <_sk_callback_sse41+0x10b5>
DB 199 ; (bad)
- DB 62,114,28 ; jb,pt 4b4a <_sk_callback_sse41+0x10b5>
+ DB 62,114,28 ; jb,pt 4b4a <_sk_callback_sse41+0x10b9>
DB 199 ; (bad)
DB 62,171 ; ds stos %eax,%es:(%rdi)
DB 170 ; stos %al,%es:(%rdi)
@@ -15487,7 +15483,7 @@ _sk_seed_shader_sse2 LABEL PROC
DB 102,15,110,199 ; movd %edi,%xmm0
DB 102,15,112,192,0 ; pshufd $0x0,%xmm0,%xmm0
DB 15,91,200 ; cvtdq2ps %xmm0,%xmm1
- DB 15,40,21,161,62,0,0 ; movaps 0x3ea1(%rip),%xmm2 # 3fb0 <_sk_callback_sse2+0xab>
+ DB 15,40,21,161,62,0,0 ; movaps 0x3ea1(%rip),%xmm2 # 3fb0 <_sk_callback_sse2+0xaf>
DB 15,88,202 ; addps %xmm2,%xmm1
DB 15,16,2 ; movups (%rdx),%xmm0
DB 15,88,193 ; addps %xmm1,%xmm0
@@ -15496,7 +15492,7 @@ _sk_seed_shader_sse2 LABEL PROC
DB 15,91,201 ; cvtdq2ps %xmm1,%xmm1
DB 15,88,202 ; addps %xmm2,%xmm1
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 15,40,21,144,62,0,0 ; movaps 0x3e90(%rip),%xmm2 # 3fc0 <_sk_callback_sse2+0xbb>
+ DB 15,40,21,144,62,0,0 ; movaps 0x3e90(%rip),%xmm2 # 3fc0 <_sk_callback_sse2+0xbf>
DB 15,87,219 ; xorps %xmm3,%xmm3
DB 15,87,228 ; xorps %xmm4,%xmm4
DB 15,87,237 ; xorps %xmm5,%xmm5
@@ -15517,14 +15513,14 @@ _sk_dither_sse2 LABEL PROC
DB 102,68,15,110,1 ; movd (%rcx),%xmm8
DB 102,69,15,112,192,0 ; pshufd $0x0,%xmm8,%xmm8
DB 102,69,15,239,193 ; pxor %xmm9,%xmm8
- DB 102,68,15,111,21,85,62,0,0 ; movdqa 0x3e55(%rip),%xmm10 # 3fd0 <_sk_callback_sse2+0xcb>
+ DB 102,68,15,111,21,85,62,0,0 ; movdqa 0x3e55(%rip),%xmm10 # 3fd0 <_sk_callback_sse2+0xcf>
DB 102,69,15,111,216 ; movdqa %xmm8,%xmm11
DB 102,69,15,219,218 ; pand %xmm10,%xmm11
DB 102,65,15,114,243,5 ; pslld $0x5,%xmm11
DB 102,69,15,219,209 ; pand %xmm9,%xmm10
DB 102,65,15,114,242,4 ; pslld $0x4,%xmm10
- DB 102,68,15,111,37,65,62,0,0 ; movdqa 0x3e41(%rip),%xmm12 # 3fe0 <_sk_callback_sse2+0xdb>
- DB 102,68,15,111,45,72,62,0,0 ; movdqa 0x3e48(%rip),%xmm13 # 3ff0 <_sk_callback_sse2+0xeb>
+ DB 102,68,15,111,37,65,62,0,0 ; movdqa 0x3e41(%rip),%xmm12 # 3fe0 <_sk_callback_sse2+0xdf>
+ DB 102,68,15,111,45,72,62,0,0 ; movdqa 0x3e48(%rip),%xmm13 # 3ff0 <_sk_callback_sse2+0xef>
DB 102,69,15,111,240 ; movdqa %xmm8,%xmm14
DB 102,69,15,219,245 ; pand %xmm13,%xmm14
DB 102,65,15,114,246,2 ; pslld $0x2,%xmm14
@@ -15540,12 +15536,11 @@ _sk_dither_sse2 LABEL PROC
DB 102,69,15,235,245 ; por %xmm13,%xmm14
DB 102,69,15,235,240 ; por %xmm8,%xmm14
DB 69,15,91,198 ; cvtdq2ps %xmm14,%xmm8
- DB 68,15,89,5,3,62,0,0 ; mulps 0x3e03(%rip),%xmm8 # 4000 <_sk_callback_sse2+0xfb>
- DB 68,15,88,5,11,62,0,0 ; addps 0x3e0b(%rip),%xmm8 # 4010 <_sk_callback_sse2+0x10b>
+ DB 68,15,89,5,3,62,0,0 ; mulps 0x3e03(%rip),%xmm8 # 4000 <_sk_callback_sse2+0xff>
+ DB 68,15,88,5,11,62,0,0 ; addps 0x3e0b(%rip),%xmm8 # 4010 <_sk_callback_sse2+0x10f>
DB 243,68,15,16,72,8 ; movss 0x8(%rax),%xmm9
DB 69,15,198,201,0 ; shufps $0x0,%xmm9,%xmm9
DB 69,15,89,200 ; mulps %xmm8,%xmm9
- DB 68,15,89,203 ; mulps %xmm3,%xmm9
DB 65,15,88,193 ; addps %xmm9,%xmm0
DB 65,15,88,201 ; addps %xmm9,%xmm1
DB 65,15,88,209 ; addps %xmm9,%xmm2
@@ -15578,7 +15573,7 @@ _sk_clear_sse2 LABEL PROC
PUBLIC _sk_srcatop_sse2
_sk_srcatop_sse2 LABEL PROC
DB 15,89,199 ; mulps %xmm7,%xmm0
- DB 68,15,40,5,180,61,0,0 ; movaps 0x3db4(%rip),%xmm8 # 4020 <_sk_callback_sse2+0x11b>
+ DB 68,15,40,5,184,61,0,0 ; movaps 0x3db8(%rip),%xmm8 # 4020 <_sk_callback_sse2+0x11f>
DB 68,15,92,195 ; subps %xmm3,%xmm8
DB 69,15,40,200 ; movaps %xmm8,%xmm9
DB 68,15,89,204 ; mulps %xmm4,%xmm9
@@ -15601,7 +15596,7 @@ PUBLIC _sk_dstatop_sse2
_sk_dstatop_sse2 LABEL PROC
DB 68,15,40,195 ; movaps %xmm3,%xmm8
DB 68,15,89,196 ; mulps %xmm4,%xmm8
- DB 68,15,40,13,119,61,0,0 ; movaps 0x3d77(%rip),%xmm9 # 4030 <_sk_callback_sse2+0x12b>
+ DB 68,15,40,13,123,61,0,0 ; movaps 0x3d7b(%rip),%xmm9 # 4030 <_sk_callback_sse2+0x12f>
DB 68,15,92,207 ; subps %xmm7,%xmm9
DB 65,15,89,193 ; mulps %xmm9,%xmm0
DB 65,15,88,192 ; addps %xmm8,%xmm0
@@ -15642,7 +15637,7 @@ _sk_dstin_sse2 LABEL PROC
PUBLIC _sk_srcout_sse2
_sk_srcout_sse2 LABEL PROC
- DB 68,15,40,5,27,61,0,0 ; movaps 0x3d1b(%rip),%xmm8 # 4040 <_sk_callback_sse2+0x13b>
+ DB 68,15,40,5,31,61,0,0 ; movaps 0x3d1f(%rip),%xmm8 # 4040 <_sk_callback_sse2+0x13f>
DB 68,15,92,199 ; subps %xmm7,%xmm8
DB 65,15,89,192 ; mulps %xmm8,%xmm0
DB 65,15,89,200 ; mulps %xmm8,%xmm1
@@ -15653,7 +15648,7 @@ _sk_srcout_sse2 LABEL PROC
PUBLIC _sk_dstout_sse2
_sk_dstout_sse2 LABEL PROC
- DB 68,15,40,5,11,61,0,0 ; movaps 0x3d0b(%rip),%xmm8 # 4050 <_sk_callback_sse2+0x14b>
+ DB 68,15,40,5,15,61,0,0 ; movaps 0x3d0f(%rip),%xmm8 # 4050 <_sk_callback_sse2+0x14f>
DB 68,15,92,195 ; subps %xmm3,%xmm8
DB 65,15,40,192 ; movaps %xmm8,%xmm0
DB 15,89,196 ; mulps %xmm4,%xmm0
@@ -15668,7 +15663,7 @@ _sk_dstout_sse2 LABEL PROC
PUBLIC _sk_srcover_sse2
_sk_srcover_sse2 LABEL PROC
- DB 68,15,40,5,238,60,0,0 ; movaps 0x3cee(%rip),%xmm8 # 4060 <_sk_callback_sse2+0x15b>
+ DB 68,15,40,5,242,60,0,0 ; movaps 0x3cf2(%rip),%xmm8 # 4060 <_sk_callback_sse2+0x15f>
DB 68,15,92,195 ; subps %xmm3,%xmm8
DB 69,15,40,200 ; movaps %xmm8,%xmm9
DB 68,15,89,204 ; mulps %xmm4,%xmm9
@@ -15686,7 +15681,7 @@ _sk_srcover_sse2 LABEL PROC
PUBLIC _sk_dstover_sse2
_sk_dstover_sse2 LABEL PROC
- DB 68,15,40,5,194,60,0,0 ; movaps 0x3cc2(%rip),%xmm8 # 4070 <_sk_callback_sse2+0x16b>
+ DB 68,15,40,5,198,60,0,0 ; movaps 0x3cc6(%rip),%xmm8 # 4070 <_sk_callback_sse2+0x16f>
DB 68,15,92,199 ; subps %xmm7,%xmm8
DB 65,15,89,192 ; mulps %xmm8,%xmm0
DB 15,88,196 ; addps %xmm4,%xmm0
@@ -15710,7 +15705,7 @@ _sk_modulate_sse2 LABEL PROC
PUBLIC _sk_multiply_sse2
_sk_multiply_sse2 LABEL PROC
- DB 68,15,40,5,150,60,0,0 ; movaps 0x3c96(%rip),%xmm8 # 4080 <_sk_callback_sse2+0x17b>
+ DB 68,15,40,5,154,60,0,0 ; movaps 0x3c9a(%rip),%xmm8 # 4080 <_sk_callback_sse2+0x17f>
DB 69,15,40,200 ; movaps %xmm8,%xmm9
DB 68,15,92,207 ; subps %xmm7,%xmm9
DB 69,15,40,209 ; movaps %xmm9,%xmm10
@@ -15780,7 +15775,7 @@ _sk_screen_sse2 LABEL PROC
PUBLIC _sk_xor__sse2
_sk_xor__sse2 LABEL PROC
DB 68,15,40,195 ; movaps %xmm3,%xmm8
- DB 15,40,29,199,59,0,0 ; movaps 0x3bc7(%rip),%xmm3 # 4090 <_sk_callback_sse2+0x18b>
+ DB 15,40,29,203,59,0,0 ; movaps 0x3bcb(%rip),%xmm3 # 4090 <_sk_callback_sse2+0x18f>
DB 68,15,40,203 ; movaps %xmm3,%xmm9
DB 68,15,92,207 ; subps %xmm7,%xmm9
DB 65,15,89,193 ; mulps %xmm9,%xmm0
@@ -15826,7 +15821,7 @@ _sk_darken_sse2 LABEL PROC
DB 68,15,89,206 ; mulps %xmm6,%xmm9
DB 65,15,95,209 ; maxps %xmm9,%xmm2
DB 68,15,92,194 ; subps %xmm2,%xmm8
- DB 15,40,21,50,59,0,0 ; movaps 0x3b32(%rip),%xmm2 # 40a0 <_sk_callback_sse2+0x19b>
+ DB 15,40,21,54,59,0,0 ; movaps 0x3b36(%rip),%xmm2 # 40a0 <_sk_callback_sse2+0x19f>
DB 15,92,211 ; subps %xmm3,%xmm2
DB 15,89,215 ; mulps %xmm7,%xmm2
DB 15,88,218 ; addps %xmm2,%xmm3
@@ -15858,7 +15853,7 @@ _sk_lighten_sse2 LABEL PROC
DB 68,15,89,206 ; mulps %xmm6,%xmm9
DB 65,15,93,209 ; minps %xmm9,%xmm2
DB 68,15,92,194 ; subps %xmm2,%xmm8
- DB 15,40,21,215,58,0,0 ; movaps 0x3ad7(%rip),%xmm2 # 40b0 <_sk_callback_sse2+0x1ab>
+ DB 15,40,21,219,58,0,0 ; movaps 0x3adb(%rip),%xmm2 # 40b0 <_sk_callback_sse2+0x1af>
DB 15,92,211 ; subps %xmm3,%xmm2
DB 15,89,215 ; mulps %xmm7,%xmm2
DB 15,88,218 ; addps %xmm2,%xmm3
@@ -15893,7 +15888,7 @@ _sk_difference_sse2 LABEL PROC
DB 65,15,93,209 ; minps %xmm9,%xmm2
DB 15,88,210 ; addps %xmm2,%xmm2
DB 68,15,92,194 ; subps %xmm2,%xmm8
- DB 15,40,21,113,58,0,0 ; movaps 0x3a71(%rip),%xmm2 # 40c0 <_sk_callback_sse2+0x1bb>
+ DB 15,40,21,117,58,0,0 ; movaps 0x3a75(%rip),%xmm2 # 40c0 <_sk_callback_sse2+0x1bf>
DB 15,92,211 ; subps %xmm3,%xmm2
DB 15,89,215 ; mulps %xmm7,%xmm2
DB 15,88,218 ; addps %xmm2,%xmm3
@@ -15918,7 +15913,7 @@ _sk_exclusion_sse2 LABEL PROC
DB 15,89,214 ; mulps %xmm6,%xmm2
DB 15,88,210 ; addps %xmm2,%xmm2
DB 68,15,92,202 ; subps %xmm2,%xmm9
- DB 15,40,13,50,58,0,0 ; movaps 0x3a32(%rip),%xmm1 # 40d0 <_sk_callback_sse2+0x1cb>
+ DB 15,40,13,54,58,0,0 ; movaps 0x3a36(%rip),%xmm1 # 40d0 <_sk_callback_sse2+0x1cf>
DB 15,92,203 ; subps %xmm3,%xmm1
DB 15,89,207 ; mulps %xmm7,%xmm1
DB 15,88,217 ; addps %xmm1,%xmm3
@@ -15930,7 +15925,7 @@ _sk_exclusion_sse2 LABEL PROC
PUBLIC _sk_colorburn_sse2
_sk_colorburn_sse2 LABEL PROC
DB 68,15,40,192 ; movaps %xmm0,%xmm8
- DB 68,15,40,21,33,58,0,0 ; movaps 0x3a21(%rip),%xmm10 # 40e0 <_sk_callback_sse2+0x1db>
+ DB 68,15,40,21,37,58,0,0 ; movaps 0x3a25(%rip),%xmm10 # 40e0 <_sk_callback_sse2+0x1df>
DB 69,15,40,202 ; movaps %xmm10,%xmm9
DB 68,15,92,207 ; subps %xmm7,%xmm9
DB 69,15,40,217 ; movaps %xmm9,%xmm11
@@ -16022,7 +16017,7 @@ _sk_colorburn_sse2 LABEL PROC
PUBLIC _sk_colordodge_sse2
_sk_colordodge_sse2 LABEL PROC
DB 68,15,40,200 ; movaps %xmm0,%xmm9
- DB 68,15,40,21,215,56,0,0 ; movaps 0x38d7(%rip),%xmm10 # 40f0 <_sk_callback_sse2+0x1eb>
+ DB 68,15,40,21,219,56,0,0 ; movaps 0x38db(%rip),%xmm10 # 40f0 <_sk_callback_sse2+0x1ef>
DB 69,15,40,218 ; movaps %xmm10,%xmm11
DB 68,15,92,223 ; subps %xmm7,%xmm11
DB 69,15,40,227 ; movaps %xmm11,%xmm12
@@ -16115,7 +16110,7 @@ _sk_hardlight_sse2 LABEL PROC
DB 15,41,52,36 ; movaps %xmm6,(%rsp)
DB 15,40,245 ; movaps %xmm5,%xmm6
DB 15,40,236 ; movaps %xmm4,%xmm5
- DB 68,15,40,29,137,55,0,0 ; movaps 0x3789(%rip),%xmm11 # 4100 <_sk_callback_sse2+0x1fb>
+ DB 68,15,40,29,141,55,0,0 ; movaps 0x378d(%rip),%xmm11 # 4100 <_sk_callback_sse2+0x1ff>
DB 69,15,40,211 ; movaps %xmm11,%xmm10
DB 68,15,92,215 ; subps %xmm7,%xmm10
DB 69,15,40,194 ; movaps %xmm10,%xmm8
@@ -16202,7 +16197,7 @@ PUBLIC _sk_overlay_sse2
_sk_overlay_sse2 LABEL PROC
DB 68,15,40,193 ; movaps %xmm1,%xmm8
DB 68,15,40,232 ; movaps %xmm0,%xmm13
- DB 68,15,40,13,84,54,0,0 ; movaps 0x3654(%rip),%xmm9 # 4110 <_sk_callback_sse2+0x20b>
+ DB 68,15,40,13,88,54,0,0 ; movaps 0x3658(%rip),%xmm9 # 4110 <_sk_callback_sse2+0x20f>
DB 69,15,40,209 ; movaps %xmm9,%xmm10
DB 68,15,92,215 ; subps %xmm7,%xmm10
DB 69,15,40,218 ; movaps %xmm10,%xmm11
@@ -16292,7 +16287,7 @@ _sk_softlight_sse2 LABEL PROC
DB 68,15,40,213 ; movaps %xmm5,%xmm10
DB 68,15,94,215 ; divps %xmm7,%xmm10
DB 69,15,84,212 ; andps %xmm12,%xmm10
- DB 68,15,40,13,14,53,0,0 ; movaps 0x350e(%rip),%xmm9 # 4120 <_sk_callback_sse2+0x21b>
+ DB 68,15,40,13,18,53,0,0 ; movaps 0x3512(%rip),%xmm9 # 4120 <_sk_callback_sse2+0x21f>
DB 69,15,40,249 ; movaps %xmm9,%xmm15
DB 69,15,92,250 ; subps %xmm10,%xmm15
DB 69,15,40,218 ; movaps %xmm10,%xmm11
@@ -16305,10 +16300,10 @@ _sk_softlight_sse2 LABEL PROC
DB 65,15,40,194 ; movaps %xmm10,%xmm0
DB 15,89,192 ; mulps %xmm0,%xmm0
DB 65,15,88,194 ; addps %xmm10,%xmm0
- DB 68,15,40,53,232,52,0,0 ; movaps 0x34e8(%rip),%xmm14 # 4130 <_sk_callback_sse2+0x22b>
+ DB 68,15,40,53,236,52,0,0 ; movaps 0x34ec(%rip),%xmm14 # 4130 <_sk_callback_sse2+0x22f>
DB 69,15,88,222 ; addps %xmm14,%xmm11
DB 68,15,89,216 ; mulps %xmm0,%xmm11
- DB 68,15,40,21,232,52,0,0 ; movaps 0x34e8(%rip),%xmm10 # 4140 <_sk_callback_sse2+0x23b>
+ DB 68,15,40,21,236,52,0,0 ; movaps 0x34ec(%rip),%xmm10 # 4140 <_sk_callback_sse2+0x23f>
DB 69,15,89,234 ; mulps %xmm10,%xmm13
DB 69,15,88,235 ; addps %xmm11,%xmm13
DB 15,88,228 ; addps %xmm4,%xmm4
@@ -16457,7 +16452,7 @@ _sk_clamp_0_sse2 LABEL PROC
PUBLIC _sk_clamp_1_sse2
_sk_clamp_1_sse2 LABEL PROC
- DB 68,15,40,5,244,50,0,0 ; movaps 0x32f4(%rip),%xmm8 # 4150 <_sk_callback_sse2+0x24b>
+ DB 68,15,40,5,248,50,0,0 ; movaps 0x32f8(%rip),%xmm8 # 4150 <_sk_callback_sse2+0x24f>
DB 65,15,93,192 ; minps %xmm8,%xmm0
DB 65,15,93,200 ; minps %xmm8,%xmm1
DB 65,15,93,208 ; minps %xmm8,%xmm2
@@ -16467,7 +16462,7 @@ _sk_clamp_1_sse2 LABEL PROC
PUBLIC _sk_clamp_a_sse2
_sk_clamp_a_sse2 LABEL PROC
- DB 15,93,29,233,50,0,0 ; minps 0x32e9(%rip),%xmm3 # 4160 <_sk_callback_sse2+0x25b>
+ DB 15,93,29,237,50,0,0 ; minps 0x32ed(%rip),%xmm3 # 4160 <_sk_callback_sse2+0x25f>
DB 15,93,195 ; minps %xmm3,%xmm0
DB 15,93,203 ; minps %xmm3,%xmm1
DB 15,93,211 ; minps %xmm3,%xmm2
@@ -16540,7 +16535,7 @@ _sk_premul_sse2 LABEL PROC
PUBLIC _sk_unpremul_sse2
_sk_unpremul_sse2 LABEL PROC
DB 69,15,87,192 ; xorps %xmm8,%xmm8
- DB 68,15,40,13,84,50,0,0 ; movaps 0x3254(%rip),%xmm9 # 4170 <_sk_callback_sse2+0x26b>
+ DB 68,15,40,13,88,50,0,0 ; movaps 0x3258(%rip),%xmm9 # 4170 <_sk_callback_sse2+0x26f>
DB 68,15,94,203 ; divps %xmm3,%xmm9
DB 68,15,194,195,4 ; cmpneqps %xmm3,%xmm8
DB 69,15,84,193 ; andps %xmm9,%xmm8
@@ -16552,20 +16547,20 @@ _sk_unpremul_sse2 LABEL PROC
PUBLIC _sk_from_srgb_sse2
_sk_from_srgb_sse2 LABEL PROC
- DB 68,15,40,5,63,50,0,0 ; movaps 0x323f(%rip),%xmm8 # 4180 <_sk_callback_sse2+0x27b>
+ DB 68,15,40,5,67,50,0,0 ; movaps 0x3243(%rip),%xmm8 # 4180 <_sk_callback_sse2+0x27f>
DB 68,15,40,232 ; movaps %xmm0,%xmm13
DB 69,15,89,232 ; mulps %xmm8,%xmm13
DB 68,15,40,216 ; movaps %xmm0,%xmm11
DB 69,15,89,219 ; mulps %xmm11,%xmm11
- DB 68,15,40,13,55,50,0,0 ; movaps 0x3237(%rip),%xmm9 # 4190 <_sk_callback_sse2+0x28b>
+ DB 68,15,40,13,59,50,0,0 ; movaps 0x323b(%rip),%xmm9 # 4190 <_sk_callback_sse2+0x28f>
DB 68,15,40,240 ; movaps %xmm0,%xmm14
DB 69,15,89,241 ; mulps %xmm9,%xmm14
- DB 68,15,40,21,55,50,0,0 ; movaps 0x3237(%rip),%xmm10 # 41a0 <_sk_callback_sse2+0x29b>
+ DB 68,15,40,21,59,50,0,0 ; movaps 0x323b(%rip),%xmm10 # 41a0 <_sk_callback_sse2+0x29f>
DB 69,15,88,242 ; addps %xmm10,%xmm14
DB 69,15,89,243 ; mulps %xmm11,%xmm14
- DB 68,15,40,29,55,50,0,0 ; movaps 0x3237(%rip),%xmm11 # 41b0 <_sk_callback_sse2+0x2ab>
+ DB 68,15,40,29,59,50,0,0 ; movaps 0x323b(%rip),%xmm11 # 41b0 <_sk_callback_sse2+0x2af>
DB 69,15,88,243 ; addps %xmm11,%xmm14
- DB 68,15,40,37,59,50,0,0 ; movaps 0x323b(%rip),%xmm12 # 41c0 <_sk_callback_sse2+0x2bb>
+ DB 68,15,40,37,63,50,0,0 ; movaps 0x323f(%rip),%xmm12 # 41c0 <_sk_callback_sse2+0x2bf>
DB 65,15,194,196,1 ; cmpltps %xmm12,%xmm0
DB 68,15,84,232 ; andps %xmm0,%xmm13
DB 65,15,85,198 ; andnps %xmm14,%xmm0
@@ -16602,20 +16597,20 @@ _sk_to_srgb_sse2 LABEL PROC
DB 68,15,82,192 ; rsqrtps %xmm0,%xmm8
DB 69,15,83,200 ; rcpps %xmm8,%xmm9
DB 69,15,82,232 ; rsqrtps %xmm8,%xmm13
- DB 68,15,40,5,192,49,0,0 ; movaps 0x31c0(%rip),%xmm8 # 41d0 <_sk_callback_sse2+0x2cb>
+ DB 68,15,40,5,196,49,0,0 ; movaps 0x31c4(%rip),%xmm8 # 41d0 <_sk_callback_sse2+0x2cf>
DB 68,15,40,240 ; movaps %xmm0,%xmm14
DB 69,15,89,240 ; mulps %xmm8,%xmm14
- DB 68,15,40,21,192,49,0,0 ; movaps 0x31c0(%rip),%xmm10 # 41e0 <_sk_callback_sse2+0x2db>
+ DB 68,15,40,21,196,49,0,0 ; movaps 0x31c4(%rip),%xmm10 # 41e0 <_sk_callback_sse2+0x2df>
DB 69,15,89,202 ; mulps %xmm10,%xmm9
- DB 68,15,40,29,196,49,0,0 ; movaps 0x31c4(%rip),%xmm11 # 41f0 <_sk_callback_sse2+0x2eb>
+ DB 68,15,40,29,200,49,0,0 ; movaps 0x31c8(%rip),%xmm11 # 41f0 <_sk_callback_sse2+0x2ef>
DB 69,15,88,203 ; addps %xmm11,%xmm9
- DB 68,15,40,37,200,49,0,0 ; movaps 0x31c8(%rip),%xmm12 # 4200 <_sk_callback_sse2+0x2fb>
+ DB 68,15,40,37,204,49,0,0 ; movaps 0x31cc(%rip),%xmm12 # 4200 <_sk_callback_sse2+0x2ff>
DB 69,15,89,236 ; mulps %xmm12,%xmm13
DB 69,15,88,233 ; addps %xmm9,%xmm13
- DB 68,15,40,13,200,49,0,0 ; movaps 0x31c8(%rip),%xmm9 # 4210 <_sk_callback_sse2+0x30b>
+ DB 68,15,40,13,204,49,0,0 ; movaps 0x31cc(%rip),%xmm9 # 4210 <_sk_callback_sse2+0x30f>
DB 69,15,40,249 ; movaps %xmm9,%xmm15
DB 69,15,93,253 ; minps %xmm13,%xmm15
- DB 68,15,40,45,200,49,0,0 ; movaps 0x31c8(%rip),%xmm13 # 4220 <_sk_callback_sse2+0x31b>
+ DB 68,15,40,45,204,49,0,0 ; movaps 0x31cc(%rip),%xmm13 # 4220 <_sk_callback_sse2+0x31f>
DB 65,15,194,197,1 ; cmpltps %xmm13,%xmm0
DB 68,15,84,240 ; andps %xmm0,%xmm14
DB 65,15,85,199 ; andnps %xmm15,%xmm0
@@ -16663,7 +16658,7 @@ _sk_rgb_to_hsl_sse2 LABEL PROC
DB 68,15,93,218 ; minps %xmm2,%xmm11
DB 65,15,40,202 ; movaps %xmm10,%xmm1
DB 65,15,92,203 ; subps %xmm11,%xmm1
- DB 68,15,40,45,33,49,0,0 ; movaps 0x3121(%rip),%xmm13 # 4230 <_sk_callback_sse2+0x32b>
+ DB 68,15,40,45,37,49,0,0 ; movaps 0x3125(%rip),%xmm13 # 4230 <_sk_callback_sse2+0x32f>
DB 68,15,94,233 ; divps %xmm1,%xmm13
DB 65,15,40,194 ; movaps %xmm10,%xmm0
DB 65,15,194,192,0 ; cmpeqps %xmm8,%xmm0
@@ -16672,30 +16667,30 @@ _sk_rgb_to_hsl_sse2 LABEL PROC
DB 69,15,89,229 ; mulps %xmm13,%xmm12
DB 69,15,40,241 ; movaps %xmm9,%xmm14
DB 68,15,194,242,1 ; cmpltps %xmm2,%xmm14
- DB 68,15,84,53,7,49,0,0 ; andps 0x3107(%rip),%xmm14 # 4240 <_sk_callback_sse2+0x33b>
+ DB 68,15,84,53,11,49,0,0 ; andps 0x310b(%rip),%xmm14 # 4240 <_sk_callback_sse2+0x33f>
DB 69,15,88,244 ; addps %xmm12,%xmm14
DB 69,15,40,250 ; movaps %xmm10,%xmm15
DB 69,15,194,249,0 ; cmpeqps %xmm9,%xmm15
DB 65,15,92,208 ; subps %xmm8,%xmm2
DB 65,15,89,213 ; mulps %xmm13,%xmm2
- DB 68,15,40,37,250,48,0,0 ; movaps 0x30fa(%rip),%xmm12 # 4250 <_sk_callback_sse2+0x34b>
+ DB 68,15,40,37,254,48,0,0 ; movaps 0x30fe(%rip),%xmm12 # 4250 <_sk_callback_sse2+0x34f>
DB 65,15,88,212 ; addps %xmm12,%xmm2
DB 69,15,92,193 ; subps %xmm9,%xmm8
DB 69,15,89,197 ; mulps %xmm13,%xmm8
- DB 68,15,88,5,246,48,0,0 ; addps 0x30f6(%rip),%xmm8 # 4260 <_sk_callback_sse2+0x35b>
+ DB 68,15,88,5,250,48,0,0 ; addps 0x30fa(%rip),%xmm8 # 4260 <_sk_callback_sse2+0x35f>
DB 65,15,84,215 ; andps %xmm15,%xmm2
DB 69,15,85,248 ; andnps %xmm8,%xmm15
DB 68,15,86,250 ; orps %xmm2,%xmm15
DB 68,15,84,240 ; andps %xmm0,%xmm14
DB 65,15,85,199 ; andnps %xmm15,%xmm0
DB 65,15,86,198 ; orps %xmm14,%xmm0
- DB 15,89,5,231,48,0,0 ; mulps 0x30e7(%rip),%xmm0 # 4270 <_sk_callback_sse2+0x36b>
+ DB 15,89,5,235,48,0,0 ; mulps 0x30eb(%rip),%xmm0 # 4270 <_sk_callback_sse2+0x36f>
DB 69,15,40,194 ; movaps %xmm10,%xmm8
DB 69,15,194,195,4 ; cmpneqps %xmm11,%xmm8
DB 65,15,84,192 ; andps %xmm8,%xmm0
DB 69,15,92,226 ; subps %xmm10,%xmm12
DB 69,15,88,211 ; addps %xmm11,%xmm10
- DB 68,15,40,13,218,48,0,0 ; movaps 0x30da(%rip),%xmm9 # 4280 <_sk_callback_sse2+0x37b>
+ DB 68,15,40,13,222,48,0,0 ; movaps 0x30de(%rip),%xmm9 # 4280 <_sk_callback_sse2+0x37f>
DB 65,15,40,210 ; movaps %xmm10,%xmm2
DB 65,15,89,209 ; mulps %xmm9,%xmm2
DB 68,15,194,202,1 ; cmpltps %xmm2,%xmm9
@@ -16718,7 +16713,7 @@ _sk_hsl_to_rgb_sse2 LABEL PROC
DB 15,41,92,36,32 ; movaps %xmm3,0x20(%rsp)
DB 68,15,40,218 ; movaps %xmm2,%xmm11
DB 15,40,240 ; movaps %xmm0,%xmm6
- DB 68,15,40,13,149,48,0,0 ; movaps 0x3095(%rip),%xmm9 # 4290 <_sk_callback_sse2+0x38b>
+ DB 68,15,40,13,153,48,0,0 ; movaps 0x3099(%rip),%xmm9 # 4290 <_sk_callback_sse2+0x38f>
DB 69,15,40,209 ; movaps %xmm9,%xmm10
DB 69,15,194,211,2 ; cmpleps %xmm11,%xmm10
DB 15,40,193 ; movaps %xmm1,%xmm0
@@ -16735,28 +16730,28 @@ _sk_hsl_to_rgb_sse2 LABEL PROC
DB 69,15,88,211 ; addps %xmm11,%xmm10
DB 69,15,88,219 ; addps %xmm11,%xmm11
DB 69,15,92,218 ; subps %xmm10,%xmm11
- DB 15,40,5,95,48,0,0 ; movaps 0x305f(%rip),%xmm0 # 42a0 <_sk_callback_sse2+0x39b>
+ DB 15,40,5,99,48,0,0 ; movaps 0x3063(%rip),%xmm0 # 42a0 <_sk_callback_sse2+0x39f>
DB 15,88,198 ; addps %xmm6,%xmm0
DB 243,15,91,200 ; cvttps2dq %xmm0,%xmm1
DB 15,91,201 ; cvtdq2ps %xmm1,%xmm1
DB 15,40,216 ; movaps %xmm0,%xmm3
DB 15,194,217,1 ; cmpltps %xmm1,%xmm3
- DB 15,84,29,87,48,0,0 ; andps 0x3057(%rip),%xmm3 # 42b0 <_sk_callback_sse2+0x3ab>
+ DB 15,84,29,91,48,0,0 ; andps 0x305b(%rip),%xmm3 # 42b0 <_sk_callback_sse2+0x3af>
DB 15,92,203 ; subps %xmm3,%xmm1
DB 15,92,193 ; subps %xmm1,%xmm0
- DB 68,15,40,45,89,48,0,0 ; movaps 0x3059(%rip),%xmm13 # 42c0 <_sk_callback_sse2+0x3bb>
+ DB 68,15,40,45,93,48,0,0 ; movaps 0x305d(%rip),%xmm13 # 42c0 <_sk_callback_sse2+0x3bf>
DB 69,15,40,197 ; movaps %xmm13,%xmm8
DB 68,15,194,192,2 ; cmpleps %xmm0,%xmm8
DB 69,15,40,242 ; movaps %xmm10,%xmm14
DB 69,15,92,243 ; subps %xmm11,%xmm14
DB 65,15,40,217 ; movaps %xmm9,%xmm3
DB 15,194,216,2 ; cmpleps %xmm0,%xmm3
- DB 15,40,21,105,48,0,0 ; movaps 0x3069(%rip),%xmm2 # 42f0 <_sk_callback_sse2+0x3eb>
+ DB 15,40,21,109,48,0,0 ; movaps 0x306d(%rip),%xmm2 # 42f0 <_sk_callback_sse2+0x3ef>
DB 68,15,40,250 ; movaps %xmm2,%xmm15
DB 68,15,194,248,2 ; cmpleps %xmm0,%xmm15
- DB 15,40,13,57,48,0,0 ; movaps 0x3039(%rip),%xmm1 # 42d0 <_sk_callback_sse2+0x3cb>
+ DB 15,40,13,61,48,0,0 ; movaps 0x303d(%rip),%xmm1 # 42d0 <_sk_callback_sse2+0x3cf>
DB 15,89,193 ; mulps %xmm1,%xmm0
- DB 15,40,45,63,48,0,0 ; movaps 0x303f(%rip),%xmm5 # 42e0 <_sk_callback_sse2+0x3db>
+ DB 15,40,45,67,48,0,0 ; movaps 0x3043(%rip),%xmm5 # 42e0 <_sk_callback_sse2+0x3df>
DB 15,40,229 ; movaps %xmm5,%xmm4
DB 15,92,224 ; subps %xmm0,%xmm4
DB 65,15,89,230 ; mulps %xmm14,%xmm4
@@ -16779,7 +16774,7 @@ _sk_hsl_to_rgb_sse2 LABEL PROC
DB 15,91,192 ; cvtdq2ps %xmm0,%xmm0
DB 15,40,222 ; movaps %xmm6,%xmm3
DB 15,194,216,1 ; cmpltps %xmm0,%xmm3
- DB 15,84,29,180,47,0,0 ; andps 0x2fb4(%rip),%xmm3 # 42b0 <_sk_callback_sse2+0x3ab>
+ DB 15,84,29,184,47,0,0 ; andps 0x2fb8(%rip),%xmm3 # 42b0 <_sk_callback_sse2+0x3af>
DB 15,92,195 ; subps %xmm3,%xmm0
DB 68,15,40,230 ; movaps %xmm6,%xmm12
DB 68,15,92,224 ; subps %xmm0,%xmm12
@@ -16809,12 +16804,12 @@ _sk_hsl_to_rgb_sse2 LABEL PROC
DB 15,40,60,36 ; movaps (%rsp),%xmm7
DB 15,40,231 ; movaps %xmm7,%xmm4
DB 15,85,227 ; andnps %xmm3,%xmm4
- DB 15,88,53,141,47,0,0 ; addps 0x2f8d(%rip),%xmm6 # 4300 <_sk_callback_sse2+0x3fb>
+ DB 15,88,53,145,47,0,0 ; addps 0x2f91(%rip),%xmm6 # 4300 <_sk_callback_sse2+0x3ff>
DB 243,15,91,198 ; cvttps2dq %xmm6,%xmm0
DB 15,91,192 ; cvtdq2ps %xmm0,%xmm0
DB 15,40,222 ; movaps %xmm6,%xmm3
DB 15,194,216,1 ; cmpltps %xmm0,%xmm3
- DB 15,84,29,40,47,0,0 ; andps 0x2f28(%rip),%xmm3 # 42b0 <_sk_callback_sse2+0x3ab>
+ DB 15,84,29,44,47,0,0 ; andps 0x2f2c(%rip),%xmm3 # 42b0 <_sk_callback_sse2+0x3af>
DB 15,92,195 ; subps %xmm3,%xmm0
DB 15,92,240 ; subps %xmm0,%xmm6
DB 15,89,206 ; mulps %xmm6,%xmm1
@@ -16875,7 +16870,7 @@ _sk_scale_u8_sse2 LABEL PROC
DB 102,69,15,96,193 ; punpcklbw %xmm9,%xmm8
DB 102,69,15,97,193 ; punpcklwd %xmm9,%xmm8
DB 69,15,91,192 ; cvtdq2ps %xmm8,%xmm8
- DB 68,15,89,5,178,46,0,0 ; mulps 0x2eb2(%rip),%xmm8 # 4310 <_sk_callback_sse2+0x40b>
+ DB 68,15,89,5,182,46,0,0 ; mulps 0x2eb6(%rip),%xmm8 # 4310 <_sk_callback_sse2+0x40f>
DB 65,15,89,192 ; mulps %xmm8,%xmm0
DB 65,15,89,200 ; mulps %xmm8,%xmm1
DB 65,15,89,208 ; mulps %xmm8,%xmm2
@@ -16912,7 +16907,7 @@ _sk_lerp_u8_sse2 LABEL PROC
DB 102,69,15,96,193 ; punpcklbw %xmm9,%xmm8
DB 102,69,15,97,193 ; punpcklwd %xmm9,%xmm8
DB 69,15,91,192 ; cvtdq2ps %xmm8,%xmm8
- DB 68,15,89,5,80,46,0,0 ; mulps 0x2e50(%rip),%xmm8 # 4320 <_sk_callback_sse2+0x41b>
+ DB 68,15,89,5,84,46,0,0 ; mulps 0x2e54(%rip),%xmm8 # 4320 <_sk_callback_sse2+0x41f>
DB 15,92,196 ; subps %xmm4,%xmm0
DB 65,15,89,192 ; mulps %xmm8,%xmm0
DB 15,88,196 ; addps %xmm4,%xmm0
@@ -16935,17 +16930,17 @@ _sk_lerp_565_sse2 LABEL PROC
DB 243,68,15,126,4,120 ; movq (%rax,%rdi,2),%xmm8
DB 102,15,239,219 ; pxor %xmm3,%xmm3
DB 102,68,15,97,195 ; punpcklwd %xmm3,%xmm8
- DB 102,15,111,29,24,46,0,0 ; movdqa 0x2e18(%rip),%xmm3 # 4330 <_sk_callback_sse2+0x42b>
+ DB 102,15,111,29,28,46,0,0 ; movdqa 0x2e1c(%rip),%xmm3 # 4330 <_sk_callback_sse2+0x42f>
DB 102,65,15,219,216 ; pand %xmm8,%xmm3
DB 68,15,91,203 ; cvtdq2ps %xmm3,%xmm9
- DB 68,15,89,13,23,46,0,0 ; mulps 0x2e17(%rip),%xmm9 # 4340 <_sk_callback_sse2+0x43b>
- DB 102,15,111,29,31,46,0,0 ; movdqa 0x2e1f(%rip),%xmm3 # 4350 <_sk_callback_sse2+0x44b>
+ DB 68,15,89,13,27,46,0,0 ; mulps 0x2e1b(%rip),%xmm9 # 4340 <_sk_callback_sse2+0x43f>
+ DB 102,15,111,29,35,46,0,0 ; movdqa 0x2e23(%rip),%xmm3 # 4350 <_sk_callback_sse2+0x44f>
DB 102,65,15,219,216 ; pand %xmm8,%xmm3
DB 15,91,219 ; cvtdq2ps %xmm3,%xmm3
- DB 15,89,29,32,46,0,0 ; mulps 0x2e20(%rip),%xmm3 # 4360 <_sk_callback_sse2+0x45b>
- DB 102,68,15,219,5,39,46,0,0 ; pand 0x2e27(%rip),%xmm8 # 4370 <_sk_callback_sse2+0x46b>
+ DB 15,89,29,36,46,0,0 ; mulps 0x2e24(%rip),%xmm3 # 4360 <_sk_callback_sse2+0x45f>
+ DB 102,68,15,219,5,43,46,0,0 ; pand 0x2e2b(%rip),%xmm8 # 4370 <_sk_callback_sse2+0x46f>
DB 69,15,91,192 ; cvtdq2ps %xmm8,%xmm8
- DB 68,15,89,5,43,46,0,0 ; mulps 0x2e2b(%rip),%xmm8 # 4380 <_sk_callback_sse2+0x47b>
+ DB 68,15,89,5,47,46,0,0 ; mulps 0x2e2f(%rip),%xmm8 # 4380 <_sk_callback_sse2+0x47f>
DB 15,92,196 ; subps %xmm4,%xmm0
DB 65,15,89,193 ; mulps %xmm9,%xmm0
DB 15,88,196 ; addps %xmm4,%xmm0
@@ -16956,7 +16951,7 @@ _sk_lerp_565_sse2 LABEL PROC
DB 65,15,89,208 ; mulps %xmm8,%xmm2
DB 15,88,214 ; addps %xmm6,%xmm2
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 15,40,29,21,46,0,0 ; movaps 0x2e15(%rip),%xmm3 # 4390 <_sk_callback_sse2+0x48b>
+ DB 15,40,29,25,46,0,0 ; movaps 0x2e19(%rip),%xmm3 # 4390 <_sk_callback_sse2+0x48f>
DB 255,224 ; jmpq *%rax
PUBLIC _sk_load_tables_sse2
@@ -16965,7 +16960,7 @@ _sk_load_tables_sse2 LABEL PROC
DB 76,139,0 ; mov (%rax),%r8
DB 76,139,72,8 ; mov 0x8(%rax),%r9
DB 243,69,15,111,12,184 ; movdqu (%r8,%rdi,4),%xmm9
- DB 102,68,15,111,5,11,46,0,0 ; movdqa 0x2e0b(%rip),%xmm8 # 43a0 <_sk_callback_sse2+0x49b>
+ DB 102,68,15,111,5,15,46,0,0 ; movdqa 0x2e0f(%rip),%xmm8 # 43a0 <_sk_callback_sse2+0x49f>
DB 102,65,15,111,193 ; movdqa %xmm9,%xmm0
DB 102,65,15,219,192 ; pand %xmm8,%xmm0
DB 102,15,112,200,78 ; pshufd $0x4e,%xmm0,%xmm1
@@ -17020,7 +17015,7 @@ _sk_load_tables_sse2 LABEL PROC
DB 65,15,20,208 ; unpcklps %xmm8,%xmm2
DB 102,65,15,114,209,24 ; psrld $0x18,%xmm9
DB 65,15,91,217 ; cvtdq2ps %xmm9,%xmm3
- DB 15,89,29,24,45,0,0 ; mulps 0x2d18(%rip),%xmm3 # 43b0 <_sk_callback_sse2+0x4ab>
+ DB 15,89,29,28,45,0,0 ; mulps 0x2d1c(%rip),%xmm3 # 43b0 <_sk_callback_sse2+0x4af>
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
@@ -17037,7 +17032,7 @@ _sk_load_tables_u16_be_sse2 LABEL PROC
DB 102,65,15,111,201 ; movdqa %xmm9,%xmm1
DB 102,15,97,200 ; punpcklwd %xmm0,%xmm1
DB 102,68,15,105,200 ; punpckhwd %xmm0,%xmm9
- DB 102,68,15,111,21,235,44,0,0 ; movdqa 0x2ceb(%rip),%xmm10 # 43c0 <_sk_callback_sse2+0x4bb>
+ DB 102,68,15,111,21,239,44,0,0 ; movdqa 0x2cef(%rip),%xmm10 # 43c0 <_sk_callback_sse2+0x4bf>
DB 102,15,111,193 ; movdqa %xmm1,%xmm0
DB 102,65,15,219,194 ; pand %xmm10,%xmm0
DB 102,69,15,239,192 ; pxor %xmm8,%xmm8
@@ -17098,7 +17093,7 @@ _sk_load_tables_u16_be_sse2 LABEL PROC
DB 102,65,15,235,217 ; por %xmm9,%xmm3
DB 102,65,15,97,216 ; punpcklwd %xmm8,%xmm3
DB 15,91,219 ; cvtdq2ps %xmm3,%xmm3
- DB 15,89,29,218,43,0,0 ; mulps 0x2bda(%rip),%xmm3 # 43d0 <_sk_callback_sse2+0x4cb>
+ DB 15,89,29,222,43,0,0 ; mulps 0x2bde(%rip),%xmm3 # 43d0 <_sk_callback_sse2+0x4cf>
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
@@ -17118,7 +17113,7 @@ _sk_load_tables_rgb_u16_be_sse2 LABEL PROC
DB 102,68,15,97,208 ; punpcklwd %xmm0,%xmm10
DB 102,65,15,111,195 ; movdqa %xmm11,%xmm0
DB 102,65,15,97,194 ; punpcklwd %xmm10,%xmm0
- DB 102,68,15,111,5,154,43,0,0 ; movdqa 0x2b9a(%rip),%xmm8 # 43e0 <_sk_callback_sse2+0x4db>
+ DB 102,68,15,111,5,158,43,0,0 ; movdqa 0x2b9e(%rip),%xmm8 # 43e0 <_sk_callback_sse2+0x4df>
DB 102,15,112,200,78 ; pshufd $0x4e,%xmm0,%xmm1
DB 102,65,15,219,192 ; pand %xmm8,%xmm0
DB 102,69,15,239,201 ; pxor %xmm9,%xmm9
@@ -17173,7 +17168,7 @@ _sk_load_tables_rgb_u16_be_sse2 LABEL PROC
DB 15,20,211 ; unpcklps %xmm3,%xmm2
DB 65,15,20,208 ; unpcklps %xmm8,%xmm2
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 15,40,29,169,42,0,0 ; movaps 0x2aa9(%rip),%xmm3 # 43f0 <_sk_callback_sse2+0x4eb>
+ DB 15,40,29,173,42,0,0 ; movaps 0x2aad(%rip),%xmm3 # 43f0 <_sk_callback_sse2+0x4ef>
DB 255,224 ; jmpq *%rax
PUBLIC _sk_byte_tables_sse2
@@ -17181,7 +17176,7 @@ _sk_byte_tables_sse2 LABEL PROC
DB 65,86 ; push %r14
DB 83 ; push %rbx
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 68,15,40,5,170,42,0,0 ; movaps 0x2aaa(%rip),%xmm8 # 4400 <_sk_callback_sse2+0x4fb>
+ DB 68,15,40,5,174,42,0,0 ; movaps 0x2aae(%rip),%xmm8 # 4400 <_sk_callback_sse2+0x4ff>
DB 65,15,89,192 ; mulps %xmm8,%xmm0
DB 102,15,91,192 ; cvtps2dq %xmm0,%xmm0
DB 102,72,15,126,193 ; movq %xmm0,%rcx
@@ -17208,7 +17203,7 @@ _sk_byte_tables_sse2 LABEL PROC
DB 102,65,15,96,193 ; punpcklbw %xmm9,%xmm0
DB 102,65,15,97,193 ; punpcklwd %xmm9,%xmm0
DB 15,91,192 ; cvtdq2ps %xmm0,%xmm0
- DB 68,15,40,21,71,42,0,0 ; movaps 0x2a47(%rip),%xmm10 # 4410 <_sk_callback_sse2+0x50b>
+ DB 68,15,40,21,75,42,0,0 ; movaps 0x2a4b(%rip),%xmm10 # 4410 <_sk_callback_sse2+0x50f>
DB 65,15,89,194 ; mulps %xmm10,%xmm0
DB 65,15,89,200 ; mulps %xmm8,%xmm1
DB 102,15,91,201 ; cvtps2dq %xmm1,%xmm1
@@ -17322,7 +17317,7 @@ _sk_byte_tables_rgb_sse2 LABEL PROC
DB 102,65,15,96,193 ; punpcklbw %xmm9,%xmm0
DB 102,65,15,97,193 ; punpcklwd %xmm9,%xmm0
DB 15,91,192 ; cvtdq2ps %xmm0,%xmm0
- DB 68,15,40,21,154,40,0,0 ; movaps 0x289a(%rip),%xmm10 # 4420 <_sk_callback_sse2+0x51b>
+ DB 68,15,40,21,158,40,0,0 ; movaps 0x289e(%rip),%xmm10 # 4420 <_sk_callback_sse2+0x51f>
DB 65,15,89,194 ; mulps %xmm10,%xmm0
DB 65,15,89,200 ; mulps %xmm8,%xmm1
DB 102,15,91,201 ; cvtps2dq %xmm1,%xmm1
@@ -17509,15 +17504,15 @@ _sk_parametric_r_sse2 LABEL PROC
DB 69,15,88,209 ; addps %xmm9,%xmm10
DB 69,15,198,219,0 ; shufps $0x0,%xmm11,%xmm11
DB 69,15,91,202 ; cvtdq2ps %xmm10,%xmm9
- DB 68,15,89,13,217,37,0,0 ; mulps 0x25d9(%rip),%xmm9 # 4430 <_sk_callback_sse2+0x52b>
- DB 68,15,84,21,225,37,0,0 ; andps 0x25e1(%rip),%xmm10 # 4440 <_sk_callback_sse2+0x53b>
- DB 68,15,86,21,233,37,0,0 ; orps 0x25e9(%rip),%xmm10 # 4450 <_sk_callback_sse2+0x54b>
- DB 68,15,88,13,241,37,0,0 ; addps 0x25f1(%rip),%xmm9 # 4460 <_sk_callback_sse2+0x55b>
- DB 68,15,40,37,249,37,0,0 ; movaps 0x25f9(%rip),%xmm12 # 4470 <_sk_callback_sse2+0x56b>
+ DB 68,15,89,13,221,37,0,0 ; mulps 0x25dd(%rip),%xmm9 # 4430 <_sk_callback_sse2+0x52f>
+ DB 68,15,84,21,229,37,0,0 ; andps 0x25e5(%rip),%xmm10 # 4440 <_sk_callback_sse2+0x53f>
+ DB 68,15,86,21,237,37,0,0 ; orps 0x25ed(%rip),%xmm10 # 4450 <_sk_callback_sse2+0x54f>
+ DB 68,15,88,13,245,37,0,0 ; addps 0x25f5(%rip),%xmm9 # 4460 <_sk_callback_sse2+0x55f>
+ DB 68,15,40,37,253,37,0,0 ; movaps 0x25fd(%rip),%xmm12 # 4470 <_sk_callback_sse2+0x56f>
DB 69,15,89,226 ; mulps %xmm10,%xmm12
DB 69,15,92,204 ; subps %xmm12,%xmm9
- DB 68,15,88,21,249,37,0,0 ; addps 0x25f9(%rip),%xmm10 # 4480 <_sk_callback_sse2+0x57b>
- DB 68,15,40,37,1,38,0,0 ; movaps 0x2601(%rip),%xmm12 # 4490 <_sk_callback_sse2+0x58b>
+ DB 68,15,88,21,253,37,0,0 ; addps 0x25fd(%rip),%xmm10 # 4480 <_sk_callback_sse2+0x57f>
+ DB 68,15,40,37,5,38,0,0 ; movaps 0x2605(%rip),%xmm12 # 4490 <_sk_callback_sse2+0x58f>
DB 69,15,94,226 ; divps %xmm10,%xmm12
DB 69,15,92,204 ; subps %xmm12,%xmm9
DB 69,15,89,203 ; mulps %xmm11,%xmm9
@@ -17525,22 +17520,22 @@ _sk_parametric_r_sse2 LABEL PROC
DB 69,15,91,226 ; cvtdq2ps %xmm10,%xmm12
DB 69,15,40,233 ; movaps %xmm9,%xmm13
DB 69,15,194,236,1 ; cmpltps %xmm12,%xmm13
- DB 68,15,40,21,235,37,0,0 ; movaps 0x25eb(%rip),%xmm10 # 44a0 <_sk_callback_sse2+0x59b>
+ DB 68,15,40,21,239,37,0,0 ; movaps 0x25ef(%rip),%xmm10 # 44a0 <_sk_callback_sse2+0x59f>
DB 69,15,84,234 ; andps %xmm10,%xmm13
DB 69,15,87,219 ; xorps %xmm11,%xmm11
DB 69,15,92,229 ; subps %xmm13,%xmm12
DB 69,15,40,233 ; movaps %xmm9,%xmm13
DB 69,15,92,236 ; subps %xmm12,%xmm13
- DB 68,15,88,13,223,37,0,0 ; addps 0x25df(%rip),%xmm9 # 44b0 <_sk_callback_sse2+0x5ab>
- DB 68,15,40,37,231,37,0,0 ; movaps 0x25e7(%rip),%xmm12 # 44c0 <_sk_callback_sse2+0x5bb>
+ DB 68,15,88,13,227,37,0,0 ; addps 0x25e3(%rip),%xmm9 # 44b0 <_sk_callback_sse2+0x5af>
+ DB 68,15,40,37,235,37,0,0 ; movaps 0x25eb(%rip),%xmm12 # 44c0 <_sk_callback_sse2+0x5bf>
DB 69,15,89,229 ; mulps %xmm13,%xmm12
DB 69,15,92,204 ; subps %xmm12,%xmm9
- DB 68,15,40,37,231,37,0,0 ; movaps 0x25e7(%rip),%xmm12 # 44d0 <_sk_callback_sse2+0x5cb>
+ DB 68,15,40,37,235,37,0,0 ; movaps 0x25eb(%rip),%xmm12 # 44d0 <_sk_callback_sse2+0x5cf>
DB 69,15,92,229 ; subps %xmm13,%xmm12
- DB 68,15,40,45,235,37,0,0 ; movaps 0x25eb(%rip),%xmm13 # 44e0 <_sk_callback_sse2+0x5db>
+ DB 68,15,40,45,239,37,0,0 ; movaps 0x25ef(%rip),%xmm13 # 44e0 <_sk_callback_sse2+0x5df>
DB 69,15,94,236 ; divps %xmm12,%xmm13
DB 69,15,88,233 ; addps %xmm9,%xmm13
- DB 68,15,89,45,235,37,0,0 ; mulps 0x25eb(%rip),%xmm13 # 44f0 <_sk_callback_sse2+0x5eb>
+ DB 68,15,89,45,239,37,0,0 ; mulps 0x25ef(%rip),%xmm13 # 44f0 <_sk_callback_sse2+0x5ef>
DB 102,69,15,91,205 ; cvtps2dq %xmm13,%xmm9
DB 243,68,15,16,96,20 ; movss 0x14(%rax),%xmm12
DB 69,15,198,228,0 ; shufps $0x0,%xmm12,%xmm12
@@ -17574,15 +17569,15 @@ _sk_parametric_g_sse2 LABEL PROC
DB 69,15,88,209 ; addps %xmm9,%xmm10
DB 69,15,198,219,0 ; shufps $0x0,%xmm11,%xmm11
DB 69,15,91,202 ; cvtdq2ps %xmm10,%xmm9
- DB 68,15,89,13,107,37,0,0 ; mulps 0x256b(%rip),%xmm9 # 4500 <_sk_callback_sse2+0x5fb>
- DB 68,15,84,21,115,37,0,0 ; andps 0x2573(%rip),%xmm10 # 4510 <_sk_callback_sse2+0x60b>
- DB 68,15,86,21,123,37,0,0 ; orps 0x257b(%rip),%xmm10 # 4520 <_sk_callback_sse2+0x61b>
- DB 68,15,88,13,131,37,0,0 ; addps 0x2583(%rip),%xmm9 # 4530 <_sk_callback_sse2+0x62b>
- DB 68,15,40,37,139,37,0,0 ; movaps 0x258b(%rip),%xmm12 # 4540 <_sk_callback_sse2+0x63b>
+ DB 68,15,89,13,111,37,0,0 ; mulps 0x256f(%rip),%xmm9 # 4500 <_sk_callback_sse2+0x5ff>
+ DB 68,15,84,21,119,37,0,0 ; andps 0x2577(%rip),%xmm10 # 4510 <_sk_callback_sse2+0x60f>
+ DB 68,15,86,21,127,37,0,0 ; orps 0x257f(%rip),%xmm10 # 4520 <_sk_callback_sse2+0x61f>
+ DB 68,15,88,13,135,37,0,0 ; addps 0x2587(%rip),%xmm9 # 4530 <_sk_callback_sse2+0x62f>
+ DB 68,15,40,37,143,37,0,0 ; movaps 0x258f(%rip),%xmm12 # 4540 <_sk_callback_sse2+0x63f>
DB 69,15,89,226 ; mulps %xmm10,%xmm12
DB 69,15,92,204 ; subps %xmm12,%xmm9
- DB 68,15,88,21,139,37,0,0 ; addps 0x258b(%rip),%xmm10 # 4550 <_sk_callback_sse2+0x64b>
- DB 68,15,40,37,147,37,0,0 ; movaps 0x2593(%rip),%xmm12 # 4560 <_sk_callback_sse2+0x65b>
+ DB 68,15,88,21,143,37,0,0 ; addps 0x258f(%rip),%xmm10 # 4550 <_sk_callback_sse2+0x64f>
+ DB 68,15,40,37,151,37,0,0 ; movaps 0x2597(%rip),%xmm12 # 4560 <_sk_callback_sse2+0x65f>
DB 69,15,94,226 ; divps %xmm10,%xmm12
DB 69,15,92,204 ; subps %xmm12,%xmm9
DB 69,15,89,203 ; mulps %xmm11,%xmm9
@@ -17590,22 +17585,22 @@ _sk_parametric_g_sse2 LABEL PROC
DB 69,15,91,226 ; cvtdq2ps %xmm10,%xmm12
DB 69,15,40,233 ; movaps %xmm9,%xmm13
DB 69,15,194,236,1 ; cmpltps %xmm12,%xmm13
- DB 68,15,40,21,125,37,0,0 ; movaps 0x257d(%rip),%xmm10 # 4570 <_sk_callback_sse2+0x66b>
+ DB 68,15,40,21,129,37,0,0 ; movaps 0x2581(%rip),%xmm10 # 4570 <_sk_callback_sse2+0x66f>
DB 69,15,84,234 ; andps %xmm10,%xmm13
DB 69,15,87,219 ; xorps %xmm11,%xmm11
DB 69,15,92,229 ; subps %xmm13,%xmm12
DB 69,15,40,233 ; movaps %xmm9,%xmm13
DB 69,15,92,236 ; subps %xmm12,%xmm13
- DB 68,15,88,13,113,37,0,0 ; addps 0x2571(%rip),%xmm9 # 4580 <_sk_callback_sse2+0x67b>
- DB 68,15,40,37,121,37,0,0 ; movaps 0x2579(%rip),%xmm12 # 4590 <_sk_callback_sse2+0x68b>
+ DB 68,15,88,13,117,37,0,0 ; addps 0x2575(%rip),%xmm9 # 4580 <_sk_callback_sse2+0x67f>
+ DB 68,15,40,37,125,37,0,0 ; movaps 0x257d(%rip),%xmm12 # 4590 <_sk_callback_sse2+0x68f>
DB 69,15,89,229 ; mulps %xmm13,%xmm12
DB 69,15,92,204 ; subps %xmm12,%xmm9
- DB 68,15,40,37,121,37,0,0 ; movaps 0x2579(%rip),%xmm12 # 45a0 <_sk_callback_sse2+0x69b>
+ DB 68,15,40,37,125,37,0,0 ; movaps 0x257d(%rip),%xmm12 # 45a0 <_sk_callback_sse2+0x69f>
DB 69,15,92,229 ; subps %xmm13,%xmm12
- DB 68,15,40,45,125,37,0,0 ; movaps 0x257d(%rip),%xmm13 # 45b0 <_sk_callback_sse2+0x6ab>
+ DB 68,15,40,45,129,37,0,0 ; movaps 0x2581(%rip),%xmm13 # 45b0 <_sk_callback_sse2+0x6af>
DB 69,15,94,236 ; divps %xmm12,%xmm13
DB 69,15,88,233 ; addps %xmm9,%xmm13
- DB 68,15,89,45,125,37,0,0 ; mulps 0x257d(%rip),%xmm13 # 45c0 <_sk_callback_sse2+0x6bb>
+ DB 68,15,89,45,129,37,0,0 ; mulps 0x2581(%rip),%xmm13 # 45c0 <_sk_callback_sse2+0x6bf>
DB 102,69,15,91,205 ; cvtps2dq %xmm13,%xmm9
DB 243,68,15,16,96,20 ; movss 0x14(%rax),%xmm12
DB 69,15,198,228,0 ; shufps $0x0,%xmm12,%xmm12
@@ -17639,15 +17634,15 @@ _sk_parametric_b_sse2 LABEL PROC
DB 69,15,88,209 ; addps %xmm9,%xmm10
DB 69,15,198,219,0 ; shufps $0x0,%xmm11,%xmm11
DB 69,15,91,202 ; cvtdq2ps %xmm10,%xmm9
- DB 68,15,89,13,253,36,0,0 ; mulps 0x24fd(%rip),%xmm9 # 45d0 <_sk_callback_sse2+0x6cb>
- DB 68,15,84,21,5,37,0,0 ; andps 0x2505(%rip),%xmm10 # 45e0 <_sk_callback_sse2+0x6db>
- DB 68,15,86,21,13,37,0,0 ; orps 0x250d(%rip),%xmm10 # 45f0 <_sk_callback_sse2+0x6eb>
- DB 68,15,88,13,21,37,0,0 ; addps 0x2515(%rip),%xmm9 # 4600 <_sk_callback_sse2+0x6fb>
- DB 68,15,40,37,29,37,0,0 ; movaps 0x251d(%rip),%xmm12 # 4610 <_sk_callback_sse2+0x70b>
+ DB 68,15,89,13,1,37,0,0 ; mulps 0x2501(%rip),%xmm9 # 45d0 <_sk_callback_sse2+0x6cf>
+ DB 68,15,84,21,9,37,0,0 ; andps 0x2509(%rip),%xmm10 # 45e0 <_sk_callback_sse2+0x6df>
+ DB 68,15,86,21,17,37,0,0 ; orps 0x2511(%rip),%xmm10 # 45f0 <_sk_callback_sse2+0x6ef>
+ DB 68,15,88,13,25,37,0,0 ; addps 0x2519(%rip),%xmm9 # 4600 <_sk_callback_sse2+0x6ff>
+ DB 68,15,40,37,33,37,0,0 ; movaps 0x2521(%rip),%xmm12 # 4610 <_sk_callback_sse2+0x70f>
DB 69,15,89,226 ; mulps %xmm10,%xmm12
DB 69,15,92,204 ; subps %xmm12,%xmm9
- DB 68,15,88,21,29,37,0,0 ; addps 0x251d(%rip),%xmm10 # 4620 <_sk_callback_sse2+0x71b>
- DB 68,15,40,37,37,37,0,0 ; movaps 0x2525(%rip),%xmm12 # 4630 <_sk_callback_sse2+0x72b>
+ DB 68,15,88,21,33,37,0,0 ; addps 0x2521(%rip),%xmm10 # 4620 <_sk_callback_sse2+0x71f>
+ DB 68,15,40,37,41,37,0,0 ; movaps 0x2529(%rip),%xmm12 # 4630 <_sk_callback_sse2+0x72f>
DB 69,15,94,226 ; divps %xmm10,%xmm12
DB 69,15,92,204 ; subps %xmm12,%xmm9
DB 69,15,89,203 ; mulps %xmm11,%xmm9
@@ -17655,22 +17650,22 @@ _sk_parametric_b_sse2 LABEL PROC
DB 69,15,91,226 ; cvtdq2ps %xmm10,%xmm12
DB 69,15,40,233 ; movaps %xmm9,%xmm13
DB 69,15,194,236,1 ; cmpltps %xmm12,%xmm13
- DB 68,15,40,21,15,37,0,0 ; movaps 0x250f(%rip),%xmm10 # 4640 <_sk_callback_sse2+0x73b>
+ DB 68,15,40,21,19,37,0,0 ; movaps 0x2513(%rip),%xmm10 # 4640 <_sk_callback_sse2+0x73f>
DB 69,15,84,234 ; andps %xmm10,%xmm13
DB 69,15,87,219 ; xorps %xmm11,%xmm11
DB 69,15,92,229 ; subps %xmm13,%xmm12
DB 69,15,40,233 ; movaps %xmm9,%xmm13
DB 69,15,92,236 ; subps %xmm12,%xmm13
- DB 68,15,88,13,3,37,0,0 ; addps 0x2503(%rip),%xmm9 # 4650 <_sk_callback_sse2+0x74b>
- DB 68,15,40,37,11,37,0,0 ; movaps 0x250b(%rip),%xmm12 # 4660 <_sk_callback_sse2+0x75b>
+ DB 68,15,88,13,7,37,0,0 ; addps 0x2507(%rip),%xmm9 # 4650 <_sk_callback_sse2+0x74f>
+ DB 68,15,40,37,15,37,0,0 ; movaps 0x250f(%rip),%xmm12 # 4660 <_sk_callback_sse2+0x75f>
DB 69,15,89,229 ; mulps %xmm13,%xmm12
DB 69,15,92,204 ; subps %xmm12,%xmm9
- DB 68,15,40,37,11,37,0,0 ; movaps 0x250b(%rip),%xmm12 # 4670 <_sk_callback_sse2+0x76b>
+ DB 68,15,40,37,15,37,0,0 ; movaps 0x250f(%rip),%xmm12 # 4670 <_sk_callback_sse2+0x76f>
DB 69,15,92,229 ; subps %xmm13,%xmm12
- DB 68,15,40,45,15,37,0,0 ; movaps 0x250f(%rip),%xmm13 # 4680 <_sk_callback_sse2+0x77b>
+ DB 68,15,40,45,19,37,0,0 ; movaps 0x2513(%rip),%xmm13 # 4680 <_sk_callback_sse2+0x77f>
DB 69,15,94,236 ; divps %xmm12,%xmm13
DB 69,15,88,233 ; addps %xmm9,%xmm13
- DB 68,15,89,45,15,37,0,0 ; mulps 0x250f(%rip),%xmm13 # 4690 <_sk_callback_sse2+0x78b>
+ DB 68,15,89,45,19,37,0,0 ; mulps 0x2513(%rip),%xmm13 # 4690 <_sk_callback_sse2+0x78f>
DB 102,69,15,91,205 ; cvtps2dq %xmm13,%xmm9
DB 243,68,15,16,96,20 ; movss 0x14(%rax),%xmm12
DB 69,15,198,228,0 ; shufps $0x0,%xmm12,%xmm12
@@ -17704,15 +17699,15 @@ _sk_parametric_a_sse2 LABEL PROC
DB 69,15,88,209 ; addps %xmm9,%xmm10
DB 69,15,198,219,0 ; shufps $0x0,%xmm11,%xmm11
DB 69,15,91,202 ; cvtdq2ps %xmm10,%xmm9
- DB 68,15,89,13,143,36,0,0 ; mulps 0x248f(%rip),%xmm9 # 46a0 <_sk_callback_sse2+0x79b>
- DB 68,15,84,21,151,36,0,0 ; andps 0x2497(%rip),%xmm10 # 46b0 <_sk_callback_sse2+0x7ab>
- DB 68,15,86,21,159,36,0,0 ; orps 0x249f(%rip),%xmm10 # 46c0 <_sk_callback_sse2+0x7bb>
- DB 68,15,88,13,167,36,0,0 ; addps 0x24a7(%rip),%xmm9 # 46d0 <_sk_callback_sse2+0x7cb>
- DB 68,15,40,37,175,36,0,0 ; movaps 0x24af(%rip),%xmm12 # 46e0 <_sk_callback_sse2+0x7db>
+ DB 68,15,89,13,147,36,0,0 ; mulps 0x2493(%rip),%xmm9 # 46a0 <_sk_callback_sse2+0x79f>
+ DB 68,15,84,21,155,36,0,0 ; andps 0x249b(%rip),%xmm10 # 46b0 <_sk_callback_sse2+0x7af>
+ DB 68,15,86,21,163,36,0,0 ; orps 0x24a3(%rip),%xmm10 # 46c0 <_sk_callback_sse2+0x7bf>
+ DB 68,15,88,13,171,36,0,0 ; addps 0x24ab(%rip),%xmm9 # 46d0 <_sk_callback_sse2+0x7cf>
+ DB 68,15,40,37,179,36,0,0 ; movaps 0x24b3(%rip),%xmm12 # 46e0 <_sk_callback_sse2+0x7df>
DB 69,15,89,226 ; mulps %xmm10,%xmm12
DB 69,15,92,204 ; subps %xmm12,%xmm9
- DB 68,15,88,21,175,36,0,0 ; addps 0x24af(%rip),%xmm10 # 46f0 <_sk_callback_sse2+0x7eb>
- DB 68,15,40,37,183,36,0,0 ; movaps 0x24b7(%rip),%xmm12 # 4700 <_sk_callback_sse2+0x7fb>
+ DB 68,15,88,21,179,36,0,0 ; addps 0x24b3(%rip),%xmm10 # 46f0 <_sk_callback_sse2+0x7ef>
+ DB 68,15,40,37,187,36,0,0 ; movaps 0x24bb(%rip),%xmm12 # 4700 <_sk_callback_sse2+0x7ff>
DB 69,15,94,226 ; divps %xmm10,%xmm12
DB 69,15,92,204 ; subps %xmm12,%xmm9
DB 69,15,89,203 ; mulps %xmm11,%xmm9
@@ -17720,22 +17715,22 @@ _sk_parametric_a_sse2 LABEL PROC
DB 69,15,91,226 ; cvtdq2ps %xmm10,%xmm12
DB 69,15,40,233 ; movaps %xmm9,%xmm13
DB 69,15,194,236,1 ; cmpltps %xmm12,%xmm13
- DB 68,15,40,21,161,36,0,0 ; movaps 0x24a1(%rip),%xmm10 # 4710 <_sk_callback_sse2+0x80b>
+ DB 68,15,40,21,165,36,0,0 ; movaps 0x24a5(%rip),%xmm10 # 4710 <_sk_callback_sse2+0x80f>
DB 69,15,84,234 ; andps %xmm10,%xmm13
DB 69,15,87,219 ; xorps %xmm11,%xmm11
DB 69,15,92,229 ; subps %xmm13,%xmm12
DB 69,15,40,233 ; movaps %xmm9,%xmm13
DB 69,15,92,236 ; subps %xmm12,%xmm13
- DB 68,15,88,13,149,36,0,0 ; addps 0x2495(%rip),%xmm9 # 4720 <_sk_callback_sse2+0x81b>
- DB 68,15,40,37,157,36,0,0 ; movaps 0x249d(%rip),%xmm12 # 4730 <_sk_callback_sse2+0x82b>
+ DB 68,15,88,13,153,36,0,0 ; addps 0x2499(%rip),%xmm9 # 4720 <_sk_callback_sse2+0x81f>
+ DB 68,15,40,37,161,36,0,0 ; movaps 0x24a1(%rip),%xmm12 # 4730 <_sk_callback_sse2+0x82f>
DB 69,15,89,229 ; mulps %xmm13,%xmm12
DB 69,15,92,204 ; subps %xmm12,%xmm9
- DB 68,15,40,37,157,36,0,0 ; movaps 0x249d(%rip),%xmm12 # 4740 <_sk_callback_sse2+0x83b>
+ DB 68,15,40,37,161,36,0,0 ; movaps 0x24a1(%rip),%xmm12 # 4740 <_sk_callback_sse2+0x83f>
DB 69,15,92,229 ; subps %xmm13,%xmm12
- DB 68,15,40,45,161,36,0,0 ; movaps 0x24a1(%rip),%xmm13 # 4750 <_sk_callback_sse2+0x84b>
+ DB 68,15,40,45,165,36,0,0 ; movaps 0x24a5(%rip),%xmm13 # 4750 <_sk_callback_sse2+0x84f>
DB 69,15,94,236 ; divps %xmm12,%xmm13
DB 69,15,88,233 ; addps %xmm9,%xmm13
- DB 68,15,89,45,161,36,0,0 ; mulps 0x24a1(%rip),%xmm13 # 4760 <_sk_callback_sse2+0x85b>
+ DB 68,15,89,45,165,36,0,0 ; mulps 0x24a5(%rip),%xmm13 # 4760 <_sk_callback_sse2+0x85f>
DB 102,69,15,91,205 ; cvtps2dq %xmm13,%xmm9
DB 243,68,15,16,96,20 ; movss 0x14(%rax),%xmm12
DB 69,15,198,228,0 ; shufps $0x0,%xmm12,%xmm12
@@ -17750,29 +17745,29 @@ _sk_parametric_a_sse2 LABEL PROC
PUBLIC _sk_lab_to_xyz_sse2
_sk_lab_to_xyz_sse2 LABEL PROC
- DB 15,89,5,126,36,0,0 ; mulps 0x247e(%rip),%xmm0 # 4770 <_sk_callback_sse2+0x86b>
- DB 68,15,40,5,134,36,0,0 ; movaps 0x2486(%rip),%xmm8 # 4780 <_sk_callback_sse2+0x87b>
+ DB 15,89,5,130,36,0,0 ; mulps 0x2482(%rip),%xmm0 # 4770 <_sk_callback_sse2+0x86f>
+ DB 68,15,40,5,138,36,0,0 ; movaps 0x248a(%rip),%xmm8 # 4780 <_sk_callback_sse2+0x87f>
DB 65,15,89,200 ; mulps %xmm8,%xmm1
- DB 68,15,40,13,138,36,0,0 ; movaps 0x248a(%rip),%xmm9 # 4790 <_sk_callback_sse2+0x88b>
+ DB 68,15,40,13,142,36,0,0 ; movaps 0x248e(%rip),%xmm9 # 4790 <_sk_callback_sse2+0x88f>
DB 65,15,88,201 ; addps %xmm9,%xmm1
DB 65,15,89,208 ; mulps %xmm8,%xmm2
DB 65,15,88,209 ; addps %xmm9,%xmm2
- DB 15,88,5,135,36,0,0 ; addps 0x2487(%rip),%xmm0 # 47a0 <_sk_callback_sse2+0x89b>
- DB 15,89,5,144,36,0,0 ; mulps 0x2490(%rip),%xmm0 # 47b0 <_sk_callback_sse2+0x8ab>
- DB 15,89,13,153,36,0,0 ; mulps 0x2499(%rip),%xmm1 # 47c0 <_sk_callback_sse2+0x8bb>
+ DB 15,88,5,139,36,0,0 ; addps 0x248b(%rip),%xmm0 # 47a0 <_sk_callback_sse2+0x89f>
+ DB 15,89,5,148,36,0,0 ; mulps 0x2494(%rip),%xmm0 # 47b0 <_sk_callback_sse2+0x8af>
+ DB 15,89,13,157,36,0,0 ; mulps 0x249d(%rip),%xmm1 # 47c0 <_sk_callback_sse2+0x8bf>
DB 15,88,200 ; addps %xmm0,%xmm1
- DB 15,89,21,159,36,0,0 ; mulps 0x249f(%rip),%xmm2 # 47d0 <_sk_callback_sse2+0x8cb>
+ DB 15,89,21,163,36,0,0 ; mulps 0x24a3(%rip),%xmm2 # 47d0 <_sk_callback_sse2+0x8cf>
DB 68,15,40,200 ; movaps %xmm0,%xmm9
DB 68,15,92,202 ; subps %xmm2,%xmm9
DB 68,15,40,225 ; movaps %xmm1,%xmm12
DB 69,15,89,228 ; mulps %xmm12,%xmm12
DB 68,15,89,225 ; mulps %xmm1,%xmm12
- DB 15,40,21,148,36,0,0 ; movaps 0x2494(%rip),%xmm2 # 47e0 <_sk_callback_sse2+0x8db>
+ DB 15,40,21,152,36,0,0 ; movaps 0x2498(%rip),%xmm2 # 47e0 <_sk_callback_sse2+0x8df>
DB 68,15,40,194 ; movaps %xmm2,%xmm8
DB 69,15,194,196,1 ; cmpltps %xmm12,%xmm8
- DB 68,15,40,21,147,36,0,0 ; movaps 0x2493(%rip),%xmm10 # 47f0 <_sk_callback_sse2+0x8eb>
+ DB 68,15,40,21,151,36,0,0 ; movaps 0x2497(%rip),%xmm10 # 47f0 <_sk_callback_sse2+0x8ef>
DB 65,15,88,202 ; addps %xmm10,%xmm1
- DB 68,15,40,29,151,36,0,0 ; movaps 0x2497(%rip),%xmm11 # 4800 <_sk_callback_sse2+0x8fb>
+ DB 68,15,40,29,155,36,0,0 ; movaps 0x249b(%rip),%xmm11 # 4800 <_sk_callback_sse2+0x8ff>
DB 65,15,89,203 ; mulps %xmm11,%xmm1
DB 69,15,84,224 ; andps %xmm8,%xmm12
DB 68,15,85,193 ; andnps %xmm1,%xmm8
@@ -17796,8 +17791,8 @@ _sk_lab_to_xyz_sse2 LABEL PROC
DB 15,84,194 ; andps %xmm2,%xmm0
DB 65,15,85,209 ; andnps %xmm9,%xmm2
DB 15,86,208 ; orps %xmm0,%xmm2
- DB 68,15,89,5,71,36,0,0 ; mulps 0x2447(%rip),%xmm8 # 4810 <_sk_callback_sse2+0x90b>
- DB 15,89,21,80,36,0,0 ; mulps 0x2450(%rip),%xmm2 # 4820 <_sk_callback_sse2+0x91b>
+ DB 68,15,89,5,75,36,0,0 ; mulps 0x244b(%rip),%xmm8 # 4810 <_sk_callback_sse2+0x90f>
+ DB 15,89,21,84,36,0,0 ; mulps 0x2454(%rip),%xmm2 # 4820 <_sk_callback_sse2+0x91f>
DB 72,173 ; lods %ds:(%rsi),%rax
DB 65,15,40,192 ; movaps %xmm8,%xmm0
DB 255,224 ; jmpq *%rax
@@ -17811,7 +17806,7 @@ _sk_load_a8_sse2 LABEL PROC
DB 102,15,96,193 ; punpcklbw %xmm1,%xmm0
DB 102,15,97,193 ; punpcklwd %xmm1,%xmm0
DB 15,91,216 ; cvtdq2ps %xmm0,%xmm3
- DB 15,89,29,56,36,0,0 ; mulps 0x2438(%rip),%xmm3 # 4830 <_sk_callback_sse2+0x92b>
+ DB 15,89,29,60,36,0,0 ; mulps 0x243c(%rip),%xmm3 # 4830 <_sk_callback_sse2+0x92f>
DB 72,173 ; lods %ds:(%rsi),%rax
DB 15,87,192 ; xorps %xmm0,%xmm0
DB 102,15,239,201 ; pxor %xmm1,%xmm1
@@ -17854,7 +17849,7 @@ _sk_gather_a8_sse2 LABEL PROC
DB 102,15,96,193 ; punpcklbw %xmm1,%xmm0
DB 102,15,97,193 ; punpcklwd %xmm1,%xmm0
DB 15,91,216 ; cvtdq2ps %xmm0,%xmm3
- DB 15,89,29,167,35,0,0 ; mulps 0x23a7(%rip),%xmm3 # 4840 <_sk_callback_sse2+0x93b>
+ DB 15,89,29,171,35,0,0 ; mulps 0x23ab(%rip),%xmm3 # 4840 <_sk_callback_sse2+0x93f>
DB 72,173 ; lods %ds:(%rsi),%rax
DB 15,87,192 ; xorps %xmm0,%xmm0
DB 102,15,239,201 ; pxor %xmm1,%xmm1
@@ -17865,7 +17860,7 @@ PUBLIC _sk_store_a8_sse2
_sk_store_a8_sse2 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 72,139,0 ; mov (%rax),%rax
- DB 68,15,40,5,155,35,0,0 ; movaps 0x239b(%rip),%xmm8 # 4850 <_sk_callback_sse2+0x94b>
+ DB 68,15,40,5,159,35,0,0 ; movaps 0x239f(%rip),%xmm8 # 4850 <_sk_callback_sse2+0x94f>
DB 68,15,89,195 ; mulps %xmm3,%xmm8
DB 102,69,15,91,192 ; cvtps2dq %xmm8,%xmm8
DB 102,65,15,114,240,16 ; pslld $0x10,%xmm8
@@ -17885,9 +17880,9 @@ _sk_load_g8_sse2 LABEL PROC
DB 102,15,96,193 ; punpcklbw %xmm1,%xmm0
DB 102,15,97,193 ; punpcklwd %xmm1,%xmm0
DB 15,91,192 ; cvtdq2ps %xmm0,%xmm0
- DB 15,89,5,98,35,0,0 ; mulps 0x2362(%rip),%xmm0 # 4860 <_sk_callback_sse2+0x95b>
+ DB 15,89,5,102,35,0,0 ; mulps 0x2366(%rip),%xmm0 # 4860 <_sk_callback_sse2+0x95f>
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 15,40,29,105,35,0,0 ; movaps 0x2369(%rip),%xmm3 # 4870 <_sk_callback_sse2+0x96b>
+ DB 15,40,29,109,35,0,0 ; movaps 0x236d(%rip),%xmm3 # 4870 <_sk_callback_sse2+0x96f>
DB 15,40,200 ; movaps %xmm0,%xmm1
DB 15,40,208 ; movaps %xmm0,%xmm2
DB 255,224 ; jmpq *%rax
@@ -17928,9 +17923,9 @@ _sk_gather_g8_sse2 LABEL PROC
DB 102,15,96,193 ; punpcklbw %xmm1,%xmm0
DB 102,15,97,193 ; punpcklwd %xmm1,%xmm0
DB 15,91,192 ; cvtdq2ps %xmm0,%xmm0
- DB 15,89,5,222,34,0,0 ; mulps 0x22de(%rip),%xmm0 # 4880 <_sk_callback_sse2+0x97b>
+ DB 15,89,5,226,34,0,0 ; mulps 0x22e2(%rip),%xmm0 # 4880 <_sk_callback_sse2+0x97f>
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 15,40,29,229,34,0,0 ; movaps 0x22e5(%rip),%xmm3 # 4890 <_sk_callback_sse2+0x98b>
+ DB 15,40,29,233,34,0,0 ; movaps 0x22e9(%rip),%xmm3 # 4890 <_sk_callback_sse2+0x98f>
DB 15,40,200 ; movaps %xmm0,%xmm1
DB 15,40,208 ; movaps %xmm0,%xmm2
DB 255,224 ; jmpq *%rax
@@ -17940,9 +17935,9 @@ _sk_gather_i8_sse2 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 73,137,192 ; mov %rax,%r8
DB 77,133,192 ; test %r8,%r8
- DB 116,5 ; je 25c2 <_sk_gather_i8_sse2+0xf>
+ DB 116,5 ; je 25be <_sk_gather_i8_sse2+0xf>
DB 76,137,192 ; mov %r8,%rax
- DB 235,2 ; jmp 25c4 <_sk_gather_i8_sse2+0x11>
+ DB 235,2 ; jmp 25c0 <_sk_gather_i8_sse2+0x11>
DB 72,173 ; lods %ds:(%rsi),%rax
DB 76,139,16 ; mov (%rax),%r10
DB 243,15,91,201 ; cvttps2dq %xmm1,%xmm1
@@ -17991,11 +17986,11 @@ _sk_gather_i8_sse2 LABEL PROC
DB 102,67,15,110,12,136 ; movd (%r8,%r9,4),%xmm1
DB 102,68,15,98,201 ; punpckldq %xmm1,%xmm9
DB 102,68,15,98,200 ; punpckldq %xmm0,%xmm9
- DB 102,15,111,21,4,34,0,0 ; movdqa 0x2204(%rip),%xmm2 # 48a0 <_sk_callback_sse2+0x99b>
+ DB 102,15,111,21,8,34,0,0 ; movdqa 0x2208(%rip),%xmm2 # 48a0 <_sk_callback_sse2+0x99f>
DB 102,65,15,111,193 ; movdqa %xmm9,%xmm0
DB 102,15,219,194 ; pand %xmm2,%xmm0
DB 15,91,192 ; cvtdq2ps %xmm0,%xmm0
- DB 68,15,40,5,0,34,0,0 ; movaps 0x2200(%rip),%xmm8 # 48b0 <_sk_callback_sse2+0x9ab>
+ DB 68,15,40,5,4,34,0,0 ; movaps 0x2204(%rip),%xmm8 # 48b0 <_sk_callback_sse2+0x9af>
DB 65,15,89,192 ; mulps %xmm8,%xmm0
DB 102,65,15,111,201 ; movdqa %xmm9,%xmm1
DB 102,15,114,209,8 ; psrld $0x8,%xmm1
@@ -18020,19 +18015,19 @@ _sk_load_565_sse2 LABEL PROC
DB 243,15,126,20,120 ; movq (%rax,%rdi,2),%xmm2
DB 102,15,239,192 ; pxor %xmm0,%xmm0
DB 102,15,97,208 ; punpcklwd %xmm0,%xmm2
- DB 102,15,111,5,182,33,0,0 ; movdqa 0x21b6(%rip),%xmm0 # 48c0 <_sk_callback_sse2+0x9bb>
+ DB 102,15,111,5,186,33,0,0 ; movdqa 0x21ba(%rip),%xmm0 # 48c0 <_sk_callback_sse2+0x9bf>
DB 102,15,219,194 ; pand %xmm2,%xmm0
DB 15,91,192 ; cvtdq2ps %xmm0,%xmm0
- DB 15,89,5,184,33,0,0 ; mulps 0x21b8(%rip),%xmm0 # 48d0 <_sk_callback_sse2+0x9cb>
- DB 102,15,111,13,192,33,0,0 ; movdqa 0x21c0(%rip),%xmm1 # 48e0 <_sk_callback_sse2+0x9db>
+ DB 15,89,5,188,33,0,0 ; mulps 0x21bc(%rip),%xmm0 # 48d0 <_sk_callback_sse2+0x9cf>
+ DB 102,15,111,13,196,33,0,0 ; movdqa 0x21c4(%rip),%xmm1 # 48e0 <_sk_callback_sse2+0x9df>
DB 102,15,219,202 ; pand %xmm2,%xmm1
DB 15,91,201 ; cvtdq2ps %xmm1,%xmm1
- DB 15,89,13,194,33,0,0 ; mulps 0x21c2(%rip),%xmm1 # 48f0 <_sk_callback_sse2+0x9eb>
- DB 102,15,219,21,202,33,0,0 ; pand 0x21ca(%rip),%xmm2 # 4900 <_sk_callback_sse2+0x9fb>
+ DB 15,89,13,198,33,0,0 ; mulps 0x21c6(%rip),%xmm1 # 48f0 <_sk_callback_sse2+0x9ef>
+ DB 102,15,219,21,206,33,0,0 ; pand 0x21ce(%rip),%xmm2 # 4900 <_sk_callback_sse2+0x9ff>
DB 15,91,210 ; cvtdq2ps %xmm2,%xmm2
- DB 15,89,21,208,33,0,0 ; mulps 0x21d0(%rip),%xmm2 # 4910 <_sk_callback_sse2+0xa0b>
+ DB 15,89,21,212,33,0,0 ; mulps 0x21d4(%rip),%xmm2 # 4910 <_sk_callback_sse2+0xa0f>
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 15,40,29,215,33,0,0 ; movaps 0x21d7(%rip),%xmm3 # 4920 <_sk_callback_sse2+0xa1b>
+ DB 15,40,29,219,33,0,0 ; movaps 0x21db(%rip),%xmm3 # 4920 <_sk_callback_sse2+0xa1f>
DB 255,224 ; jmpq *%rax
PUBLIC _sk_gather_565_sse2
@@ -18065,31 +18060,31 @@ _sk_gather_565_sse2 LABEL PROC
DB 102,15,196,208,3 ; pinsrw $0x3,%eax,%xmm2
DB 102,15,239,192 ; pxor %xmm0,%xmm0
DB 102,15,97,208 ; punpcklwd %xmm0,%xmm2
- DB 102,15,111,5,96,33,0,0 ; movdqa 0x2160(%rip),%xmm0 # 4930 <_sk_callback_sse2+0xa2b>
+ DB 102,15,111,5,100,33,0,0 ; movdqa 0x2164(%rip),%xmm0 # 4930 <_sk_callback_sse2+0xa2f>
DB 102,15,219,194 ; pand %xmm2,%xmm0
DB 15,91,192 ; cvtdq2ps %xmm0,%xmm0
- DB 15,89,5,98,33,0,0 ; mulps 0x2162(%rip),%xmm0 # 4940 <_sk_callback_sse2+0xa3b>
- DB 102,15,111,13,106,33,0,0 ; movdqa 0x216a(%rip),%xmm1 # 4950 <_sk_callback_sse2+0xa4b>
+ DB 15,89,5,102,33,0,0 ; mulps 0x2166(%rip),%xmm0 # 4940 <_sk_callback_sse2+0xa3f>
+ DB 102,15,111,13,110,33,0,0 ; movdqa 0x216e(%rip),%xmm1 # 4950 <_sk_callback_sse2+0xa4f>
DB 102,15,219,202 ; pand %xmm2,%xmm1
DB 15,91,201 ; cvtdq2ps %xmm1,%xmm1
- DB 15,89,13,108,33,0,0 ; mulps 0x216c(%rip),%xmm1 # 4960 <_sk_callback_sse2+0xa5b>
- DB 102,15,219,21,116,33,0,0 ; pand 0x2174(%rip),%xmm2 # 4970 <_sk_callback_sse2+0xa6b>
+ DB 15,89,13,112,33,0,0 ; mulps 0x2170(%rip),%xmm1 # 4960 <_sk_callback_sse2+0xa5f>
+ DB 102,15,219,21,120,33,0,0 ; pand 0x2178(%rip),%xmm2 # 4970 <_sk_callback_sse2+0xa6f>
DB 15,91,210 ; cvtdq2ps %xmm2,%xmm2
- DB 15,89,21,122,33,0,0 ; mulps 0x217a(%rip),%xmm2 # 4980 <_sk_callback_sse2+0xa7b>
+ DB 15,89,21,126,33,0,0 ; mulps 0x217e(%rip),%xmm2 # 4980 <_sk_callback_sse2+0xa7f>
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 15,40,29,129,33,0,0 ; movaps 0x2181(%rip),%xmm3 # 4990 <_sk_callback_sse2+0xa8b>
+ DB 15,40,29,133,33,0,0 ; movaps 0x2185(%rip),%xmm3 # 4990 <_sk_callback_sse2+0xa8f>
DB 255,224 ; jmpq *%rax
PUBLIC _sk_store_565_sse2
_sk_store_565_sse2 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 72,139,0 ; mov (%rax),%rax
- DB 68,15,40,5,130,33,0,0 ; movaps 0x2182(%rip),%xmm8 # 49a0 <_sk_callback_sse2+0xa9b>
+ DB 68,15,40,5,134,33,0,0 ; movaps 0x2186(%rip),%xmm8 # 49a0 <_sk_callback_sse2+0xa9f>
DB 68,15,40,200 ; movaps %xmm0,%xmm9
DB 69,15,89,200 ; mulps %xmm8,%xmm9
DB 102,69,15,91,201 ; cvtps2dq %xmm9,%xmm9
DB 102,65,15,114,241,11 ; pslld $0xb,%xmm9
- DB 68,15,40,21,119,33,0,0 ; movaps 0x2177(%rip),%xmm10 # 49b0 <_sk_callback_sse2+0xaab>
+ DB 68,15,40,21,123,33,0,0 ; movaps 0x217b(%rip),%xmm10 # 49b0 <_sk_callback_sse2+0xaaf>
DB 68,15,89,209 ; mulps %xmm1,%xmm10
DB 102,69,15,91,210 ; cvtps2dq %xmm10,%xmm10
DB 102,65,15,114,242,5 ; pslld $0x5,%xmm10
@@ -18111,21 +18106,21 @@ _sk_load_4444_sse2 LABEL PROC
DB 243,15,126,28,120 ; movq (%rax,%rdi,2),%xmm3
DB 102,15,239,192 ; pxor %xmm0,%xmm0
DB 102,15,97,216 ; punpcklwd %xmm0,%xmm3
- DB 102,15,111,5,48,33,0,0 ; movdqa 0x2130(%rip),%xmm0 # 49c0 <_sk_callback_sse2+0xabb>
+ DB 102,15,111,5,52,33,0,0 ; movdqa 0x2134(%rip),%xmm0 # 49c0 <_sk_callback_sse2+0xabf>
DB 102,15,219,195 ; pand %xmm3,%xmm0
DB 15,91,192 ; cvtdq2ps %xmm0,%xmm0
- DB 15,89,5,50,33,0,0 ; mulps 0x2132(%rip),%xmm0 # 49d0 <_sk_callback_sse2+0xacb>
- DB 102,15,111,13,58,33,0,0 ; movdqa 0x213a(%rip),%xmm1 # 49e0 <_sk_callback_sse2+0xadb>
+ DB 15,89,5,54,33,0,0 ; mulps 0x2136(%rip),%xmm0 # 49d0 <_sk_callback_sse2+0xacf>
+ DB 102,15,111,13,62,33,0,0 ; movdqa 0x213e(%rip),%xmm1 # 49e0 <_sk_callback_sse2+0xadf>
DB 102,15,219,203 ; pand %xmm3,%xmm1
DB 15,91,201 ; cvtdq2ps %xmm1,%xmm1
- DB 15,89,13,60,33,0,0 ; mulps 0x213c(%rip),%xmm1 # 49f0 <_sk_callback_sse2+0xaeb>
- DB 102,15,111,21,68,33,0,0 ; movdqa 0x2144(%rip),%xmm2 # 4a00 <_sk_callback_sse2+0xafb>
+ DB 15,89,13,64,33,0,0 ; mulps 0x2140(%rip),%xmm1 # 49f0 <_sk_callback_sse2+0xaef>
+ DB 102,15,111,21,72,33,0,0 ; movdqa 0x2148(%rip),%xmm2 # 4a00 <_sk_callback_sse2+0xaff>
DB 102,15,219,211 ; pand %xmm3,%xmm2
DB 15,91,210 ; cvtdq2ps %xmm2,%xmm2
- DB 15,89,21,70,33,0,0 ; mulps 0x2146(%rip),%xmm2 # 4a10 <_sk_callback_sse2+0xb0b>
- DB 102,15,219,29,78,33,0,0 ; pand 0x214e(%rip),%xmm3 # 4a20 <_sk_callback_sse2+0xb1b>
+ DB 15,89,21,74,33,0,0 ; mulps 0x214a(%rip),%xmm2 # 4a10 <_sk_callback_sse2+0xb0f>
+ DB 102,15,219,29,82,33,0,0 ; pand 0x2152(%rip),%xmm3 # 4a20 <_sk_callback_sse2+0xb1f>
DB 15,91,219 ; cvtdq2ps %xmm3,%xmm3
- DB 15,89,29,84,33,0,0 ; mulps 0x2154(%rip),%xmm3 # 4a30 <_sk_callback_sse2+0xb2b>
+ DB 15,89,29,88,33,0,0 ; mulps 0x2158(%rip),%xmm3 # 4a30 <_sk_callback_sse2+0xb2f>
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
@@ -18159,21 +18154,21 @@ _sk_gather_4444_sse2 LABEL PROC
DB 102,15,196,216,3 ; pinsrw $0x3,%eax,%xmm3
DB 102,15,239,192 ; pxor %xmm0,%xmm0
DB 102,15,97,216 ; punpcklwd %xmm0,%xmm3
- DB 102,15,111,5,219,32,0,0 ; movdqa 0x20db(%rip),%xmm0 # 4a40 <_sk_callback_sse2+0xb3b>
+ DB 102,15,111,5,223,32,0,0 ; movdqa 0x20df(%rip),%xmm0 # 4a40 <_sk_callback_sse2+0xb3f>
DB 102,15,219,195 ; pand %xmm3,%xmm0
DB 15,91,192 ; cvtdq2ps %xmm0,%xmm0
- DB 15,89,5,221,32,0,0 ; mulps 0x20dd(%rip),%xmm0 # 4a50 <_sk_callback_sse2+0xb4b>
- DB 102,15,111,13,229,32,0,0 ; movdqa 0x20e5(%rip),%xmm1 # 4a60 <_sk_callback_sse2+0xb5b>
+ DB 15,89,5,225,32,0,0 ; mulps 0x20e1(%rip),%xmm0 # 4a50 <_sk_callback_sse2+0xb4f>
+ DB 102,15,111,13,233,32,0,0 ; movdqa 0x20e9(%rip),%xmm1 # 4a60 <_sk_callback_sse2+0xb5f>
DB 102,15,219,203 ; pand %xmm3,%xmm1
DB 15,91,201 ; cvtdq2ps %xmm1,%xmm1
- DB 15,89,13,231,32,0,0 ; mulps 0x20e7(%rip),%xmm1 # 4a70 <_sk_callback_sse2+0xb6b>
- DB 102,15,111,21,239,32,0,0 ; movdqa 0x20ef(%rip),%xmm2 # 4a80 <_sk_callback_sse2+0xb7b>
+ DB 15,89,13,235,32,0,0 ; mulps 0x20eb(%rip),%xmm1 # 4a70 <_sk_callback_sse2+0xb6f>
+ DB 102,15,111,21,243,32,0,0 ; movdqa 0x20f3(%rip),%xmm2 # 4a80 <_sk_callback_sse2+0xb7f>
DB 102,15,219,211 ; pand %xmm3,%xmm2
DB 15,91,210 ; cvtdq2ps %xmm2,%xmm2
- DB 15,89,21,241,32,0,0 ; mulps 0x20f1(%rip),%xmm2 # 4a90 <_sk_callback_sse2+0xb8b>
- DB 102,15,219,29,249,32,0,0 ; pand 0x20f9(%rip),%xmm3 # 4aa0 <_sk_callback_sse2+0xb9b>
+ DB 15,89,21,245,32,0,0 ; mulps 0x20f5(%rip),%xmm2 # 4a90 <_sk_callback_sse2+0xb8f>
+ DB 102,15,219,29,253,32,0,0 ; pand 0x20fd(%rip),%xmm3 # 4aa0 <_sk_callback_sse2+0xb9f>
DB 15,91,219 ; cvtdq2ps %xmm3,%xmm3
- DB 15,89,29,255,32,0,0 ; mulps 0x20ff(%rip),%xmm3 # 4ab0 <_sk_callback_sse2+0xbab>
+ DB 15,89,29,3,33,0,0 ; mulps 0x2103(%rip),%xmm3 # 4ab0 <_sk_callback_sse2+0xbaf>
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
@@ -18181,7 +18176,7 @@ PUBLIC _sk_store_4444_sse2
_sk_store_4444_sse2 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 72,139,0 ; mov (%rax),%rax
- DB 68,15,40,5,254,32,0,0 ; movaps 0x20fe(%rip),%xmm8 # 4ac0 <_sk_callback_sse2+0xbbb>
+ DB 68,15,40,5,2,33,0,0 ; movaps 0x2102(%rip),%xmm8 # 4ac0 <_sk_callback_sse2+0xbbf>
DB 68,15,40,200 ; movaps %xmm0,%xmm9
DB 69,15,89,200 ; mulps %xmm8,%xmm9
DB 102,69,15,91,201 ; cvtps2dq %xmm9,%xmm9
@@ -18211,11 +18206,11 @@ _sk_load_8888_sse2 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 72,139,0 ; mov (%rax),%rax
DB 68,15,16,12,184 ; movups (%rax,%rdi,4),%xmm9
- DB 15,40,21,145,32,0,0 ; movaps 0x2091(%rip),%xmm2 # 4ad0 <_sk_callback_sse2+0xbcb>
+ DB 15,40,21,149,32,0,0 ; movaps 0x2095(%rip),%xmm2 # 4ad0 <_sk_callback_sse2+0xbcf>
DB 65,15,40,193 ; movaps %xmm9,%xmm0
DB 15,84,194 ; andps %xmm2,%xmm0
DB 15,91,192 ; cvtdq2ps %xmm0,%xmm0
- DB 68,15,40,5,143,32,0,0 ; movaps 0x208f(%rip),%xmm8 # 4ae0 <_sk_callback_sse2+0xbdb>
+ DB 68,15,40,5,147,32,0,0 ; movaps 0x2093(%rip),%xmm8 # 4ae0 <_sk_callback_sse2+0xbdf>
DB 65,15,89,192 ; mulps %xmm8,%xmm0
DB 65,15,40,201 ; movaps %xmm9,%xmm1
DB 102,15,114,209,8 ; psrld $0x8,%xmm1
@@ -18262,11 +18257,11 @@ _sk_gather_8888_sse2 LABEL PROC
DB 102,67,15,110,12,129 ; movd (%r9,%r8,4),%xmm1
DB 102,68,15,98,201 ; punpckldq %xmm1,%xmm9
DB 102,68,15,98,200 ; punpckldq %xmm0,%xmm9
- DB 102,15,111,21,224,31,0,0 ; movdqa 0x1fe0(%rip),%xmm2 # 4af0 <_sk_callback_sse2+0xbeb>
+ DB 102,15,111,21,228,31,0,0 ; movdqa 0x1fe4(%rip),%xmm2 # 4af0 <_sk_callback_sse2+0xbef>
DB 102,65,15,111,193 ; movdqa %xmm9,%xmm0
DB 102,15,219,194 ; pand %xmm2,%xmm0
DB 15,91,192 ; cvtdq2ps %xmm0,%xmm0
- DB 68,15,40,5,220,31,0,0 ; movaps 0x1fdc(%rip),%xmm8 # 4b00 <_sk_callback_sse2+0xbfb>
+ DB 68,15,40,5,224,31,0,0 ; movaps 0x1fe0(%rip),%xmm8 # 4b00 <_sk_callback_sse2+0xbff>
DB 65,15,89,192 ; mulps %xmm8,%xmm0
DB 102,65,15,111,201 ; movdqa %xmm9,%xmm1
DB 102,15,114,209,8 ; psrld $0x8,%xmm1
@@ -18288,7 +18283,7 @@ PUBLIC _sk_store_8888_sse2
_sk_store_8888_sse2 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 72,139,0 ; mov (%rax),%rax
- DB 68,15,40,5,159,31,0,0 ; movaps 0x1f9f(%rip),%xmm8 # 4b10 <_sk_callback_sse2+0xc0b>
+ DB 68,15,40,5,163,31,0,0 ; movaps 0x1fa3(%rip),%xmm8 # 4b10 <_sk_callback_sse2+0xc0f>
DB 68,15,40,200 ; movaps %xmm0,%xmm9
DB 69,15,89,200 ; mulps %xmm8,%xmm9
DB 102,69,15,91,201 ; cvtps2dq %xmm9,%xmm9
@@ -18325,7 +18320,7 @@ _sk_load_f16_sse2 LABEL PROC
DB 102,69,15,239,210 ; pxor %xmm10,%xmm10
DB 102,65,15,111,206 ; movdqa %xmm14,%xmm1
DB 102,65,15,97,202 ; punpcklwd %xmm10,%xmm1
- DB 102,68,15,111,13,15,31,0,0 ; movdqa 0x1f0f(%rip),%xmm9 # 4b20 <_sk_callback_sse2+0xc1b>
+ DB 102,68,15,111,13,19,31,0,0 ; movdqa 0x1f13(%rip),%xmm9 # 4b20 <_sk_callback_sse2+0xc1f>
DB 102,15,111,193 ; movdqa %xmm1,%xmm0
DB 102,65,15,219,193 ; pand %xmm9,%xmm0
DB 102,15,239,200 ; pxor %xmm0,%xmm1
@@ -18333,11 +18328,11 @@ _sk_load_f16_sse2 LABEL PROC
DB 102,68,15,111,233 ; movdqa %xmm1,%xmm13
DB 102,65,15,114,245,13 ; pslld $0xd,%xmm13
DB 102,68,15,235,232 ; por %xmm0,%xmm13
- DB 102,68,15,111,29,244,30,0,0 ; movdqa 0x1ef4(%rip),%xmm11 # 4b30 <_sk_callback_sse2+0xc2b>
+ DB 102,68,15,111,29,248,30,0,0 ; movdqa 0x1ef8(%rip),%xmm11 # 4b30 <_sk_callback_sse2+0xc2f>
DB 102,69,15,254,235 ; paddd %xmm11,%xmm13
- DB 102,68,15,111,37,246,30,0,0 ; movdqa 0x1ef6(%rip),%xmm12 # 4b40 <_sk_callback_sse2+0xc3b>
+ DB 102,68,15,111,37,250,30,0,0 ; movdqa 0x1efa(%rip),%xmm12 # 4b40 <_sk_callback_sse2+0xc3f>
DB 102,65,15,239,204 ; pxor %xmm12,%xmm1
- DB 102,15,111,29,249,30,0,0 ; movdqa 0x1ef9(%rip),%xmm3 # 4b50 <_sk_callback_sse2+0xc4b>
+ DB 102,15,111,29,253,30,0,0 ; movdqa 0x1efd(%rip),%xmm3 # 4b50 <_sk_callback_sse2+0xc4f>
DB 102,15,111,195 ; movdqa %xmm3,%xmm0
DB 102,15,102,193 ; pcmpgtd %xmm1,%xmm0
DB 102,65,15,223,197 ; pandn %xmm13,%xmm0
@@ -18421,7 +18416,7 @@ _sk_gather_f16_sse2 LABEL PROC
DB 102,69,15,239,210 ; pxor %xmm10,%xmm10
DB 102,65,15,111,206 ; movdqa %xmm14,%xmm1
DB 102,65,15,97,202 ; punpcklwd %xmm10,%xmm1
- DB 102,68,15,111,13,135,29,0,0 ; movdqa 0x1d87(%rip),%xmm9 # 4b60 <_sk_callback_sse2+0xc5b>
+ DB 102,68,15,111,13,139,29,0,0 ; movdqa 0x1d8b(%rip),%xmm9 # 4b60 <_sk_callback_sse2+0xc5f>
DB 102,15,111,193 ; movdqa %xmm1,%xmm0
DB 102,65,15,219,193 ; pand %xmm9,%xmm0
DB 102,15,239,200 ; pxor %xmm0,%xmm1
@@ -18429,11 +18424,11 @@ _sk_gather_f16_sse2 LABEL PROC
DB 102,68,15,111,233 ; movdqa %xmm1,%xmm13
DB 102,65,15,114,245,13 ; pslld $0xd,%xmm13
DB 102,68,15,235,232 ; por %xmm0,%xmm13
- DB 102,68,15,111,29,108,29,0,0 ; movdqa 0x1d6c(%rip),%xmm11 # 4b70 <_sk_callback_sse2+0xc6b>
+ DB 102,68,15,111,29,112,29,0,0 ; movdqa 0x1d70(%rip),%xmm11 # 4b70 <_sk_callback_sse2+0xc6f>
DB 102,69,15,254,235 ; paddd %xmm11,%xmm13
- DB 102,68,15,111,37,110,29,0,0 ; movdqa 0x1d6e(%rip),%xmm12 # 4b80 <_sk_callback_sse2+0xc7b>
+ DB 102,68,15,111,37,114,29,0,0 ; movdqa 0x1d72(%rip),%xmm12 # 4b80 <_sk_callback_sse2+0xc7f>
DB 102,65,15,239,204 ; pxor %xmm12,%xmm1
- DB 102,15,111,29,113,29,0,0 ; movdqa 0x1d71(%rip),%xmm3 # 4b90 <_sk_callback_sse2+0xc8b>
+ DB 102,15,111,29,117,29,0,0 ; movdqa 0x1d75(%rip),%xmm3 # 4b90 <_sk_callback_sse2+0xc8f>
DB 102,15,111,195 ; movdqa %xmm3,%xmm0
DB 102,15,102,193 ; pcmpgtd %xmm1,%xmm0
DB 102,65,15,223,197 ; pandn %xmm13,%xmm0
@@ -18484,17 +18479,17 @@ PUBLIC _sk_store_f16_sse2
_sk_store_f16_sse2 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 72,139,0 ; mov (%rax),%rax
- DB 102,68,15,111,21,153,28,0,0 ; movdqa 0x1c99(%rip),%xmm10 # 4ba0 <_sk_callback_sse2+0xc9b>
+ DB 102,68,15,111,21,157,28,0,0 ; movdqa 0x1c9d(%rip),%xmm10 # 4ba0 <_sk_callback_sse2+0xc9f>
DB 102,68,15,111,224 ; movdqa %xmm0,%xmm12
DB 102,68,15,111,232 ; movdqa %xmm0,%xmm13
DB 102,69,15,219,234 ; pand %xmm10,%xmm13
DB 102,69,15,239,229 ; pxor %xmm13,%xmm12
- DB 102,68,15,111,13,140,28,0,0 ; movdqa 0x1c8c(%rip),%xmm9 # 4bb0 <_sk_callback_sse2+0xcab>
+ DB 102,68,15,111,13,144,28,0,0 ; movdqa 0x1c90(%rip),%xmm9 # 4bb0 <_sk_callback_sse2+0xcaf>
DB 102,65,15,114,213,16 ; psrld $0x10,%xmm13
DB 102,69,15,111,193 ; movdqa %xmm9,%xmm8
DB 102,69,15,102,196 ; pcmpgtd %xmm12,%xmm8
DB 102,65,15,114,212,13 ; psrld $0xd,%xmm12
- DB 102,68,15,111,29,125,28,0,0 ; movdqa 0x1c7d(%rip),%xmm11 # 4bc0 <_sk_callback_sse2+0xcbb>
+ DB 102,68,15,111,29,129,28,0,0 ; movdqa 0x1c81(%rip),%xmm11 # 4bc0 <_sk_callback_sse2+0xcbf>
DB 102,69,15,235,235 ; por %xmm11,%xmm13
DB 102,69,15,254,236 ; paddd %xmm12,%xmm13
DB 102,65,15,114,245,16 ; pslld $0x10,%xmm13
@@ -18571,7 +18566,7 @@ _sk_load_u16_be_sse2 LABEL PROC
DB 102,69,15,239,201 ; pxor %xmm9,%xmm9
DB 102,65,15,97,201 ; punpcklwd %xmm9,%xmm1
DB 15,91,193 ; cvtdq2ps %xmm1,%xmm0
- DB 68,15,40,5,27,27,0,0 ; movaps 0x1b1b(%rip),%xmm8 # 4bd0 <_sk_callback_sse2+0xccb>
+ DB 68,15,40,5,31,27,0,0 ; movaps 0x1b1f(%rip),%xmm8 # 4bd0 <_sk_callback_sse2+0xccf>
DB 65,15,89,192 ; mulps %xmm8,%xmm0
DB 102,15,111,203 ; movdqa %xmm3,%xmm1
DB 102,15,113,241,8 ; psllw $0x8,%xmm1
@@ -18622,7 +18617,7 @@ _sk_load_rgb_u16_be_sse2 LABEL PROC
DB 102,69,15,239,192 ; pxor %xmm8,%xmm8
DB 102,65,15,97,192 ; punpcklwd %xmm8,%xmm0
DB 15,91,192 ; cvtdq2ps %xmm0,%xmm0
- DB 68,15,40,13,87,26,0,0 ; movaps 0x1a57(%rip),%xmm9 # 4be0 <_sk_callback_sse2+0xcdb>
+ DB 68,15,40,13,91,26,0,0 ; movaps 0x1a5b(%rip),%xmm9 # 4be0 <_sk_callback_sse2+0xcdf>
DB 65,15,89,193 ; mulps %xmm9,%xmm0
DB 102,15,111,203 ; movdqa %xmm3,%xmm1
DB 102,15,113,241,8 ; psllw $0x8,%xmm1
@@ -18639,14 +18634,14 @@ _sk_load_rgb_u16_be_sse2 LABEL PROC
DB 15,91,210 ; cvtdq2ps %xmm2,%xmm2
DB 65,15,89,209 ; mulps %xmm9,%xmm2
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 15,40,29,30,26,0,0 ; movaps 0x1a1e(%rip),%xmm3 # 4bf0 <_sk_callback_sse2+0xceb>
+ DB 15,40,29,34,26,0,0 ; movaps 0x1a22(%rip),%xmm3 # 4bf0 <_sk_callback_sse2+0xcef>
DB 255,224 ; jmpq *%rax
PUBLIC _sk_store_u16_be_sse2
_sk_store_u16_be_sse2 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 72,139,0 ; mov (%rax),%rax
- DB 68,15,40,13,31,26,0,0 ; movaps 0x1a1f(%rip),%xmm9 # 4c00 <_sk_callback_sse2+0xcfb>
+ DB 68,15,40,13,35,26,0,0 ; movaps 0x1a23(%rip),%xmm9 # 4c00 <_sk_callback_sse2+0xcff>
DB 68,15,40,192 ; movaps %xmm0,%xmm8
DB 69,15,89,193 ; mulps %xmm9,%xmm8
DB 102,69,15,91,192 ; cvtps2dq %xmm8,%xmm8
@@ -18786,7 +18781,7 @@ _sk_repeat_x_sse2 LABEL PROC
DB 243,69,15,91,209 ; cvttps2dq %xmm9,%xmm10
DB 69,15,91,210 ; cvtdq2ps %xmm10,%xmm10
DB 69,15,194,202,1 ; cmpltps %xmm10,%xmm9
- DB 68,15,84,13,9,24,0,0 ; andps 0x1809(%rip),%xmm9 # 4c10 <_sk_callback_sse2+0xd0b>
+ DB 68,15,84,13,13,24,0,0 ; andps 0x180d(%rip),%xmm9 # 4c10 <_sk_callback_sse2+0xd0f>
DB 69,15,92,209 ; subps %xmm9,%xmm10
DB 69,15,89,208 ; mulps %xmm8,%xmm10
DB 65,15,92,194 ; subps %xmm10,%xmm0
@@ -18806,7 +18801,7 @@ _sk_repeat_y_sse2 LABEL PROC
DB 243,69,15,91,209 ; cvttps2dq %xmm9,%xmm10
DB 69,15,91,210 ; cvtdq2ps %xmm10,%xmm10
DB 69,15,194,202,1 ; cmpltps %xmm10,%xmm9
- DB 68,15,84,13,209,23,0,0 ; andps 0x17d1(%rip),%xmm9 # 4c20 <_sk_callback_sse2+0xd1b>
+ DB 68,15,84,13,213,23,0,0 ; andps 0x17d5(%rip),%xmm9 # 4c20 <_sk_callback_sse2+0xd1f>
DB 69,15,92,209 ; subps %xmm9,%xmm10
DB 69,15,89,208 ; mulps %xmm8,%xmm10
DB 65,15,92,202 ; subps %xmm10,%xmm1
@@ -18830,7 +18825,7 @@ _sk_mirror_x_sse2 LABEL PROC
DB 243,69,15,91,218 ; cvttps2dq %xmm10,%xmm11
DB 69,15,91,219 ; cvtdq2ps %xmm11,%xmm11
DB 69,15,194,211,1 ; cmpltps %xmm11,%xmm10
- DB 68,15,84,21,135,23,0,0 ; andps 0x1787(%rip),%xmm10 # 4c30 <_sk_callback_sse2+0xd2b>
+ DB 68,15,84,21,139,23,0,0 ; andps 0x178b(%rip),%xmm10 # 4c30 <_sk_callback_sse2+0xd2f>
DB 69,15,87,228 ; xorps %xmm12,%xmm12
DB 69,15,92,218 ; subps %xmm10,%xmm11
DB 69,15,89,216 ; mulps %xmm8,%xmm11
@@ -18858,7 +18853,7 @@ _sk_mirror_y_sse2 LABEL PROC
DB 243,69,15,91,218 ; cvttps2dq %xmm10,%xmm11
DB 69,15,91,219 ; cvtdq2ps %xmm11,%xmm11
DB 69,15,194,211,1 ; cmpltps %xmm11,%xmm10
- DB 68,15,84,21,45,23,0,0 ; andps 0x172d(%rip),%xmm10 # 4c40 <_sk_callback_sse2+0xd3b>
+ DB 68,15,84,21,49,23,0,0 ; andps 0x1731(%rip),%xmm10 # 4c40 <_sk_callback_sse2+0xd3f>
DB 69,15,87,228 ; xorps %xmm12,%xmm12
DB 69,15,92,218 ; subps %xmm10,%xmm11
DB 69,15,89,216 ; mulps %xmm8,%xmm11
@@ -18875,10 +18870,10 @@ _sk_mirror_y_sse2 LABEL PROC
PUBLIC _sk_luminance_to_alpha_sse2
_sk_luminance_to_alpha_sse2 LABEL PROC
DB 15,40,218 ; movaps %xmm2,%xmm3
- DB 15,89,5,5,23,0,0 ; mulps 0x1705(%rip),%xmm0 # 4c50 <_sk_callback_sse2+0xd4b>
- DB 15,89,13,14,23,0,0 ; mulps 0x170e(%rip),%xmm1 # 4c60 <_sk_callback_sse2+0xd5b>
+ DB 15,89,5,9,23,0,0 ; mulps 0x1709(%rip),%xmm0 # 4c50 <_sk_callback_sse2+0xd4f>
+ DB 15,89,13,18,23,0,0 ; mulps 0x1712(%rip),%xmm1 # 4c60 <_sk_callback_sse2+0xd5f>
DB 15,88,200 ; addps %xmm0,%xmm1
- DB 15,89,29,20,23,0,0 ; mulps 0x1714(%rip),%xmm3 # 4c70 <_sk_callback_sse2+0xd6b>
+ DB 15,89,29,24,23,0,0 ; mulps 0x1718(%rip),%xmm3 # 4c70 <_sk_callback_sse2+0xd6f>
DB 15,88,217 ; addps %xmm1,%xmm3
DB 72,173 ; lods %ds:(%rsi),%rax
DB 15,87,192 ; xorps %xmm0,%xmm0
@@ -19101,7 +19096,7 @@ _sk_linear_gradient_sse2 LABEL PROC
DB 69,15,198,228,0 ; shufps $0x0,%xmm12,%xmm12
DB 72,139,8 ; mov (%rax),%rcx
DB 72,133,201 ; test %rcx,%rcx
- DB 15,132,15,1,0,0 ; je 3a0f <_sk_linear_gradient_sse2+0x149>
+ DB 15,132,15,1,0,0 ; je 3a0b <_sk_linear_gradient_sse2+0x149>
DB 72,139,64,8 ; mov 0x8(%rax),%rax
DB 72,131,192,32 ; add $0x20,%rax
DB 69,15,87,192 ; xorps %xmm8,%xmm8
@@ -19162,8 +19157,8 @@ _sk_linear_gradient_sse2 LABEL PROC
DB 69,15,86,231 ; orps %xmm15,%xmm12
DB 72,131,192,36 ; add $0x24,%rax
DB 72,255,201 ; dec %rcx
- DB 15,133,8,255,255,255 ; jne 3915 <_sk_linear_gradient_sse2+0x4f>
- DB 235,13 ; jmp 3a1c <_sk_linear_gradient_sse2+0x156>
+ DB 15,133,8,255,255,255 ; jne 3911 <_sk_linear_gradient_sse2+0x4f>
+ DB 235,13 ; jmp 3a18 <_sk_linear_gradient_sse2+0x156>
DB 15,87,201 ; xorps %xmm1,%xmm1
DB 15,87,210 ; xorps %xmm2,%xmm2
DB 15,87,219 ; xorps %xmm3,%xmm3
@@ -19228,29 +19223,29 @@ _sk_xy_to_polar_unit_sse2 LABEL PROC
DB 69,15,94,220 ; divps %xmm12,%xmm11
DB 69,15,40,227 ; movaps %xmm11,%xmm12
DB 69,15,89,228 ; mulps %xmm12,%xmm12
- DB 68,15,40,45,140,17,0,0 ; movaps 0x118c(%rip),%xmm13 # 4c80 <_sk_callback_sse2+0xd7b>
+ DB 68,15,40,45,144,17,0,0 ; movaps 0x1190(%rip),%xmm13 # 4c80 <_sk_callback_sse2+0xd7f>
DB 69,15,89,236 ; mulps %xmm12,%xmm13
- DB 68,15,88,45,144,17,0,0 ; addps 0x1190(%rip),%xmm13 # 4c90 <_sk_callback_sse2+0xd8b>
+ DB 68,15,88,45,148,17,0,0 ; addps 0x1194(%rip),%xmm13 # 4c90 <_sk_callback_sse2+0xd8f>
DB 69,15,89,236 ; mulps %xmm12,%xmm13
- DB 68,15,88,45,148,17,0,0 ; addps 0x1194(%rip),%xmm13 # 4ca0 <_sk_callback_sse2+0xd9b>
+ DB 68,15,88,45,152,17,0,0 ; addps 0x1198(%rip),%xmm13 # 4ca0 <_sk_callback_sse2+0xd9f>
DB 69,15,89,236 ; mulps %xmm12,%xmm13
- DB 68,15,88,45,152,17,0,0 ; addps 0x1198(%rip),%xmm13 # 4cb0 <_sk_callback_sse2+0xdab>
+ DB 68,15,88,45,156,17,0,0 ; addps 0x119c(%rip),%xmm13 # 4cb0 <_sk_callback_sse2+0xdaf>
DB 69,15,89,235 ; mulps %xmm11,%xmm13
DB 69,15,194,202,1 ; cmpltps %xmm10,%xmm9
- DB 68,15,40,21,151,17,0,0 ; movaps 0x1197(%rip),%xmm10 # 4cc0 <_sk_callback_sse2+0xdbb>
+ DB 68,15,40,21,155,17,0,0 ; movaps 0x119b(%rip),%xmm10 # 4cc0 <_sk_callback_sse2+0xdbf>
DB 69,15,92,213 ; subps %xmm13,%xmm10
DB 69,15,84,209 ; andps %xmm9,%xmm10
DB 69,15,85,205 ; andnps %xmm13,%xmm9
DB 69,15,86,202 ; orps %xmm10,%xmm9
DB 68,15,194,192,1 ; cmpltps %xmm0,%xmm8
- DB 68,15,40,21,138,17,0,0 ; movaps 0x118a(%rip),%xmm10 # 4cd0 <_sk_callback_sse2+0xdcb>
+ DB 68,15,40,21,142,17,0,0 ; movaps 0x118e(%rip),%xmm10 # 4cd0 <_sk_callback_sse2+0xdcf>
DB 69,15,92,209 ; subps %xmm9,%xmm10
DB 69,15,84,208 ; andps %xmm8,%xmm10
DB 69,15,85,193 ; andnps %xmm9,%xmm8
DB 69,15,86,194 ; orps %xmm10,%xmm8
DB 68,15,40,201 ; movaps %xmm1,%xmm9
DB 68,15,194,200,1 ; cmpltps %xmm0,%xmm9
- DB 68,15,40,21,121,17,0,0 ; movaps 0x1179(%rip),%xmm10 # 4ce0 <_sk_callback_sse2+0xddb>
+ DB 68,15,40,21,125,17,0,0 ; movaps 0x117d(%rip),%xmm10 # 4ce0 <_sk_callback_sse2+0xddf>
DB 69,15,92,208 ; subps %xmm8,%xmm10
DB 69,15,84,209 ; andps %xmm9,%xmm10
DB 69,15,85,200 ; andnps %xmm8,%xmm9
@@ -19263,7 +19258,7 @@ _sk_xy_to_polar_unit_sse2 LABEL PROC
PUBLIC _sk_save_xy_sse2
_sk_save_xy_sse2 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 68,15,40,5,98,17,0,0 ; movaps 0x1162(%rip),%xmm8 # 4cf0 <_sk_callback_sse2+0xdeb>
+ DB 68,15,40,5,102,17,0,0 ; movaps 0x1166(%rip),%xmm8 # 4cf0 <_sk_callback_sse2+0xdef>
DB 15,17,0 ; movups %xmm0,(%rax)
DB 68,15,40,200 ; movaps %xmm0,%xmm9
DB 69,15,88,200 ; addps %xmm8,%xmm9
@@ -19271,7 +19266,7 @@ _sk_save_xy_sse2 LABEL PROC
DB 69,15,91,210 ; cvtdq2ps %xmm10,%xmm10
DB 69,15,40,217 ; movaps %xmm9,%xmm11
DB 69,15,194,218,1 ; cmpltps %xmm10,%xmm11
- DB 68,15,40,37,77,17,0,0 ; movaps 0x114d(%rip),%xmm12 # 4d00 <_sk_callback_sse2+0xdfb>
+ DB 68,15,40,37,81,17,0,0 ; movaps 0x1151(%rip),%xmm12 # 4d00 <_sk_callback_sse2+0xdff>
DB 69,15,84,220 ; andps %xmm12,%xmm11
DB 69,15,92,211 ; subps %xmm11,%xmm10
DB 69,15,92,202 ; subps %xmm10,%xmm9
@@ -19314,8 +19309,8 @@ _sk_bilinear_nx_sse2 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 15,16,0 ; movups (%rax),%xmm0
DB 68,15,16,64,64 ; movups 0x40(%rax),%xmm8
- DB 15,88,5,198,16,0,0 ; addps 0x10c6(%rip),%xmm0 # 4d10 <_sk_callback_sse2+0xe0b>
- DB 68,15,40,13,206,16,0,0 ; movaps 0x10ce(%rip),%xmm9 # 4d20 <_sk_callback_sse2+0xe1b>
+ DB 15,88,5,202,16,0,0 ; addps 0x10ca(%rip),%xmm0 # 4d10 <_sk_callback_sse2+0xe0f>
+ DB 68,15,40,13,210,16,0,0 ; movaps 0x10d2(%rip),%xmm9 # 4d20 <_sk_callback_sse2+0xe1f>
DB 69,15,92,200 ; subps %xmm8,%xmm9
DB 68,15,17,136,128,0,0,0 ; movups %xmm9,0x80(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
@@ -19326,7 +19321,7 @@ _sk_bilinear_px_sse2 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 15,16,0 ; movups (%rax),%xmm0
DB 68,15,16,64,64 ; movups 0x40(%rax),%xmm8
- DB 15,88,5,189,16,0,0 ; addps 0x10bd(%rip),%xmm0 # 4d30 <_sk_callback_sse2+0xe2b>
+ DB 15,88,5,193,16,0,0 ; addps 0x10c1(%rip),%xmm0 # 4d30 <_sk_callback_sse2+0xe2f>
DB 68,15,17,128,128,0,0,0 ; movups %xmm8,0x80(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
@@ -19336,8 +19331,8 @@ _sk_bilinear_ny_sse2 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 15,16,72,32 ; movups 0x20(%rax),%xmm1
DB 68,15,16,64,96 ; movups 0x60(%rax),%xmm8
- DB 15,88,13,175,16,0,0 ; addps 0x10af(%rip),%xmm1 # 4d40 <_sk_callback_sse2+0xe3b>
- DB 68,15,40,13,183,16,0,0 ; movaps 0x10b7(%rip),%xmm9 # 4d50 <_sk_callback_sse2+0xe4b>
+ DB 15,88,13,179,16,0,0 ; addps 0x10b3(%rip),%xmm1 # 4d40 <_sk_callback_sse2+0xe3f>
+ DB 68,15,40,13,187,16,0,0 ; movaps 0x10bb(%rip),%xmm9 # 4d50 <_sk_callback_sse2+0xe4f>
DB 69,15,92,200 ; subps %xmm8,%xmm9
DB 68,15,17,136,160,0,0,0 ; movups %xmm9,0xa0(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
@@ -19348,7 +19343,7 @@ _sk_bilinear_py_sse2 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 15,16,72,32 ; movups 0x20(%rax),%xmm1
DB 68,15,16,64,96 ; movups 0x60(%rax),%xmm8
- DB 15,88,13,165,16,0,0 ; addps 0x10a5(%rip),%xmm1 # 4d60 <_sk_callback_sse2+0xe5b>
+ DB 15,88,13,169,16,0,0 ; addps 0x10a9(%rip),%xmm1 # 4d60 <_sk_callback_sse2+0xe5f>
DB 68,15,17,128,160,0,0,0 ; movups %xmm8,0xa0(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
@@ -19358,13 +19353,13 @@ _sk_bicubic_n3x_sse2 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 15,16,0 ; movups (%rax),%xmm0
DB 68,15,16,64,64 ; movups 0x40(%rax),%xmm8
- DB 15,88,5,152,16,0,0 ; addps 0x1098(%rip),%xmm0 # 4d70 <_sk_callback_sse2+0xe6b>
- DB 68,15,40,13,160,16,0,0 ; movaps 0x10a0(%rip),%xmm9 # 4d80 <_sk_callback_sse2+0xe7b>
+ DB 15,88,5,156,16,0,0 ; addps 0x109c(%rip),%xmm0 # 4d70 <_sk_callback_sse2+0xe6f>
+ DB 68,15,40,13,164,16,0,0 ; movaps 0x10a4(%rip),%xmm9 # 4d80 <_sk_callback_sse2+0xe7f>
DB 69,15,92,200 ; subps %xmm8,%xmm9
DB 69,15,40,193 ; movaps %xmm9,%xmm8
DB 69,15,89,192 ; mulps %xmm8,%xmm8
- DB 68,15,89,13,156,16,0,0 ; mulps 0x109c(%rip),%xmm9 # 4d90 <_sk_callback_sse2+0xe8b>
- DB 68,15,88,13,164,16,0,0 ; addps 0x10a4(%rip),%xmm9 # 4da0 <_sk_callback_sse2+0xe9b>
+ DB 68,15,89,13,160,16,0,0 ; mulps 0x10a0(%rip),%xmm9 # 4d90 <_sk_callback_sse2+0xe8f>
+ DB 68,15,88,13,168,16,0,0 ; addps 0x10a8(%rip),%xmm9 # 4da0 <_sk_callback_sse2+0xe9f>
DB 69,15,89,200 ; mulps %xmm8,%xmm9
DB 68,15,17,136,128,0,0,0 ; movups %xmm9,0x80(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
@@ -19375,16 +19370,16 @@ _sk_bicubic_n1x_sse2 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 15,16,0 ; movups (%rax),%xmm0
DB 68,15,16,64,64 ; movups 0x40(%rax),%xmm8
- DB 15,88,5,147,16,0,0 ; addps 0x1093(%rip),%xmm0 # 4db0 <_sk_callback_sse2+0xeab>
- DB 68,15,40,13,155,16,0,0 ; movaps 0x109b(%rip),%xmm9 # 4dc0 <_sk_callback_sse2+0xebb>
+ DB 15,88,5,151,16,0,0 ; addps 0x1097(%rip),%xmm0 # 4db0 <_sk_callback_sse2+0xeaf>
+ DB 68,15,40,13,159,16,0,0 ; movaps 0x109f(%rip),%xmm9 # 4dc0 <_sk_callback_sse2+0xebf>
DB 69,15,92,200 ; subps %xmm8,%xmm9
- DB 68,15,40,5,159,16,0,0 ; movaps 0x109f(%rip),%xmm8 # 4dd0 <_sk_callback_sse2+0xecb>
+ DB 68,15,40,5,163,16,0,0 ; movaps 0x10a3(%rip),%xmm8 # 4dd0 <_sk_callback_sse2+0xecf>
DB 69,15,89,193 ; mulps %xmm9,%xmm8
- DB 68,15,88,5,163,16,0,0 ; addps 0x10a3(%rip),%xmm8 # 4de0 <_sk_callback_sse2+0xedb>
+ DB 68,15,88,5,167,16,0,0 ; addps 0x10a7(%rip),%xmm8 # 4de0 <_sk_callback_sse2+0xedf>
DB 69,15,89,193 ; mulps %xmm9,%xmm8
- DB 68,15,88,5,167,16,0,0 ; addps 0x10a7(%rip),%xmm8 # 4df0 <_sk_callback_sse2+0xeeb>
+ DB 68,15,88,5,171,16,0,0 ; addps 0x10ab(%rip),%xmm8 # 4df0 <_sk_callback_sse2+0xeef>
DB 69,15,89,193 ; mulps %xmm9,%xmm8
- DB 68,15,88,5,171,16,0,0 ; addps 0x10ab(%rip),%xmm8 # 4e00 <_sk_callback_sse2+0xefb>
+ DB 68,15,88,5,175,16,0,0 ; addps 0x10af(%rip),%xmm8 # 4e00 <_sk_callback_sse2+0xeff>
DB 68,15,17,128,128,0,0,0 ; movups %xmm8,0x80(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
@@ -19392,17 +19387,17 @@ _sk_bicubic_n1x_sse2 LABEL PROC
PUBLIC _sk_bicubic_p1x_sse2
_sk_bicubic_p1x_sse2 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 68,15,40,5,165,16,0,0 ; movaps 0x10a5(%rip),%xmm8 # 4e10 <_sk_callback_sse2+0xf0b>
+ DB 68,15,40,5,169,16,0,0 ; movaps 0x10a9(%rip),%xmm8 # 4e10 <_sk_callback_sse2+0xf0f>
DB 15,16,0 ; movups (%rax),%xmm0
DB 68,15,16,72,64 ; movups 0x40(%rax),%xmm9
DB 65,15,88,192 ; addps %xmm8,%xmm0
- DB 68,15,40,21,161,16,0,0 ; movaps 0x10a1(%rip),%xmm10 # 4e20 <_sk_callback_sse2+0xf1b>
+ DB 68,15,40,21,165,16,0,0 ; movaps 0x10a5(%rip),%xmm10 # 4e20 <_sk_callback_sse2+0xf1f>
DB 69,15,89,209 ; mulps %xmm9,%xmm10
- DB 68,15,88,21,165,16,0,0 ; addps 0x10a5(%rip),%xmm10 # 4e30 <_sk_callback_sse2+0xf2b>
+ DB 68,15,88,21,169,16,0,0 ; addps 0x10a9(%rip),%xmm10 # 4e30 <_sk_callback_sse2+0xf2f>
DB 69,15,89,209 ; mulps %xmm9,%xmm10
DB 69,15,88,208 ; addps %xmm8,%xmm10
DB 69,15,89,209 ; mulps %xmm9,%xmm10
- DB 68,15,88,21,161,16,0,0 ; addps 0x10a1(%rip),%xmm10 # 4e40 <_sk_callback_sse2+0xf3b>
+ DB 68,15,88,21,165,16,0,0 ; addps 0x10a5(%rip),%xmm10 # 4e40 <_sk_callback_sse2+0xf3f>
DB 68,15,17,144,128,0,0,0 ; movups %xmm10,0x80(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
@@ -19412,11 +19407,11 @@ _sk_bicubic_p3x_sse2 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 15,16,0 ; movups (%rax),%xmm0
DB 68,15,16,64,64 ; movups 0x40(%rax),%xmm8
- DB 15,88,5,148,16,0,0 ; addps 0x1094(%rip),%xmm0 # 4e50 <_sk_callback_sse2+0xf4b>
+ DB 15,88,5,152,16,0,0 ; addps 0x1098(%rip),%xmm0 # 4e50 <_sk_callback_sse2+0xf4f>
DB 69,15,40,200 ; movaps %xmm8,%xmm9
DB 69,15,89,201 ; mulps %xmm9,%xmm9
- DB 68,15,89,5,148,16,0,0 ; mulps 0x1094(%rip),%xmm8 # 4e60 <_sk_callback_sse2+0xf5b>
- DB 68,15,88,5,156,16,0,0 ; addps 0x109c(%rip),%xmm8 # 4e70 <_sk_callback_sse2+0xf6b>
+ DB 68,15,89,5,152,16,0,0 ; mulps 0x1098(%rip),%xmm8 # 4e60 <_sk_callback_sse2+0xf5f>
+ DB 68,15,88,5,160,16,0,0 ; addps 0x10a0(%rip),%xmm8 # 4e70 <_sk_callback_sse2+0xf6f>
DB 69,15,89,193 ; mulps %xmm9,%xmm8
DB 68,15,17,128,128,0,0,0 ; movups %xmm8,0x80(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
@@ -19427,13 +19422,13 @@ _sk_bicubic_n3y_sse2 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 15,16,72,32 ; movups 0x20(%rax),%xmm1
DB 68,15,16,64,96 ; movups 0x60(%rax),%xmm8
- DB 15,88,13,138,16,0,0 ; addps 0x108a(%rip),%xmm1 # 4e80 <_sk_callback_sse2+0xf7b>
- DB 68,15,40,13,146,16,0,0 ; movaps 0x1092(%rip),%xmm9 # 4e90 <_sk_callback_sse2+0xf8b>
+ DB 15,88,13,142,16,0,0 ; addps 0x108e(%rip),%xmm1 # 4e80 <_sk_callback_sse2+0xf7f>
+ DB 68,15,40,13,150,16,0,0 ; movaps 0x1096(%rip),%xmm9 # 4e90 <_sk_callback_sse2+0xf8f>
DB 69,15,92,200 ; subps %xmm8,%xmm9
DB 69,15,40,193 ; movaps %xmm9,%xmm8
DB 69,15,89,192 ; mulps %xmm8,%xmm8
- DB 68,15,89,13,142,16,0,0 ; mulps 0x108e(%rip),%xmm9 # 4ea0 <_sk_callback_sse2+0xf9b>
- DB 68,15,88,13,150,16,0,0 ; addps 0x1096(%rip),%xmm9 # 4eb0 <_sk_callback_sse2+0xfab>
+ DB 68,15,89,13,146,16,0,0 ; mulps 0x1092(%rip),%xmm9 # 4ea0 <_sk_callback_sse2+0xf9f>
+ DB 68,15,88,13,154,16,0,0 ; addps 0x109a(%rip),%xmm9 # 4eb0 <_sk_callback_sse2+0xfaf>
DB 69,15,89,200 ; mulps %xmm8,%xmm9
DB 68,15,17,136,160,0,0,0 ; movups %xmm9,0xa0(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
@@ -19444,16 +19439,16 @@ _sk_bicubic_n1y_sse2 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 15,16,72,32 ; movups 0x20(%rax),%xmm1
DB 68,15,16,64,96 ; movups 0x60(%rax),%xmm8
- DB 15,88,13,132,16,0,0 ; addps 0x1084(%rip),%xmm1 # 4ec0 <_sk_callback_sse2+0xfbb>
- DB 68,15,40,13,140,16,0,0 ; movaps 0x108c(%rip),%xmm9 # 4ed0 <_sk_callback_sse2+0xfcb>
+ DB 15,88,13,136,16,0,0 ; addps 0x1088(%rip),%xmm1 # 4ec0 <_sk_callback_sse2+0xfbf>
+ DB 68,15,40,13,144,16,0,0 ; movaps 0x1090(%rip),%xmm9 # 4ed0 <_sk_callback_sse2+0xfcf>
DB 69,15,92,200 ; subps %xmm8,%xmm9
- DB 68,15,40,5,144,16,0,0 ; movaps 0x1090(%rip),%xmm8 # 4ee0 <_sk_callback_sse2+0xfdb>
+ DB 68,15,40,5,148,16,0,0 ; movaps 0x1094(%rip),%xmm8 # 4ee0 <_sk_callback_sse2+0xfdf>
DB 69,15,89,193 ; mulps %xmm9,%xmm8
- DB 68,15,88,5,148,16,0,0 ; addps 0x1094(%rip),%xmm8 # 4ef0 <_sk_callback_sse2+0xfeb>
+ DB 68,15,88,5,152,16,0,0 ; addps 0x1098(%rip),%xmm8 # 4ef0 <_sk_callback_sse2+0xfef>
DB 69,15,89,193 ; mulps %xmm9,%xmm8
- DB 68,15,88,5,152,16,0,0 ; addps 0x1098(%rip),%xmm8 # 4f00 <_sk_callback_sse2+0xffb>
+ DB 68,15,88,5,156,16,0,0 ; addps 0x109c(%rip),%xmm8 # 4f00 <_sk_callback_sse2+0xfff>
DB 69,15,89,193 ; mulps %xmm9,%xmm8
- DB 68,15,88,5,156,16,0,0 ; addps 0x109c(%rip),%xmm8 # 4f10 <_sk_callback_sse2+0x100b>
+ DB 68,15,88,5,160,16,0,0 ; addps 0x10a0(%rip),%xmm8 # 4f10 <_sk_callback_sse2+0x100f>
DB 68,15,17,128,160,0,0,0 ; movups %xmm8,0xa0(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
@@ -19461,17 +19456,17 @@ _sk_bicubic_n1y_sse2 LABEL PROC
PUBLIC _sk_bicubic_p1y_sse2
_sk_bicubic_p1y_sse2 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 68,15,40,5,150,16,0,0 ; movaps 0x1096(%rip),%xmm8 # 4f20 <_sk_callback_sse2+0x101b>
+ DB 68,15,40,5,154,16,0,0 ; movaps 0x109a(%rip),%xmm8 # 4f20 <_sk_callback_sse2+0x101f>
DB 15,16,72,32 ; movups 0x20(%rax),%xmm1
DB 68,15,16,72,96 ; movups 0x60(%rax),%xmm9
DB 65,15,88,200 ; addps %xmm8,%xmm1
- DB 68,15,40,21,145,16,0,0 ; movaps 0x1091(%rip),%xmm10 # 4f30 <_sk_callback_sse2+0x102b>
+ DB 68,15,40,21,149,16,0,0 ; movaps 0x1095(%rip),%xmm10 # 4f30 <_sk_callback_sse2+0x102f>
DB 69,15,89,209 ; mulps %xmm9,%xmm10
- DB 68,15,88,21,149,16,0,0 ; addps 0x1095(%rip),%xmm10 # 4f40 <_sk_callback_sse2+0x103b>
+ DB 68,15,88,21,153,16,0,0 ; addps 0x1099(%rip),%xmm10 # 4f40 <_sk_callback_sse2+0x103f>
DB 69,15,89,209 ; mulps %xmm9,%xmm10
DB 69,15,88,208 ; addps %xmm8,%xmm10
DB 69,15,89,209 ; mulps %xmm9,%xmm10
- DB 68,15,88,21,145,16,0,0 ; addps 0x1091(%rip),%xmm10 # 4f50 <_sk_callback_sse2+0x104b>
+ DB 68,15,88,21,149,16,0,0 ; addps 0x1095(%rip),%xmm10 # 4f50 <_sk_callback_sse2+0x104f>
DB 68,15,17,144,160,0,0,0 ; movups %xmm10,0xa0(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
@@ -19481,11 +19476,11 @@ _sk_bicubic_p3y_sse2 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 15,16,72,32 ; movups 0x20(%rax),%xmm1
DB 68,15,16,64,96 ; movups 0x60(%rax),%xmm8
- DB 15,88,13,131,16,0,0 ; addps 0x1083(%rip),%xmm1 # 4f60 <_sk_callback_sse2+0x105b>
+ DB 15,88,13,135,16,0,0 ; addps 0x1087(%rip),%xmm1 # 4f60 <_sk_callback_sse2+0x105f>
DB 69,15,40,200 ; movaps %xmm8,%xmm9
DB 69,15,89,201 ; mulps %xmm9,%xmm9
- DB 68,15,89,5,131,16,0,0 ; mulps 0x1083(%rip),%xmm8 # 4f70 <_sk_callback_sse2+0x106b>
- DB 68,15,88,5,139,16,0,0 ; addps 0x108b(%rip),%xmm8 # 4f80 <_sk_callback_sse2+0x107b>
+ DB 68,15,89,5,135,16,0,0 ; mulps 0x1087(%rip),%xmm8 # 4f70 <_sk_callback_sse2+0x106f>
+ DB 68,15,88,5,143,16,0,0 ; addps 0x108f(%rip),%xmm8 # 4f80 <_sk_callback_sse2+0x107f>
DB 69,15,89,193 ; mulps %xmm9,%xmm8
DB 68,15,17,128,160,0,0,0 ; movups %xmm8,0xa0(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
@@ -19584,15 +19579,16 @@ ALIGN 16
DB 0,0 ; add %al,(%rax)
DB 2,0 ; add (%rax),%al
DB 0,0 ; add %al,(%rax)
- DB 33,8 ; and %ecx,(%rax)
- DB 130 ; (bad)
- DB 60,33 ; cmp $0x21,%al
- DB 8,130,60,33,8,130 ; or %al,-0x7df7dec4(%rdx)
- DB 60,33 ; cmp $0x21,%al
- DB 8,130,60,0,0,0 ; or %al,0x3c(%rdx)
- DB 191,0,0,0,191 ; mov $0xbf000000,%edi
DB 0,0 ; add %al,(%rax)
- DB 0,191,0,0,0,191 ; add %bh,-0x41000000(%rdi)
+ DB 128,60,0,0 ; cmpb $0x0,(%rax,%rax,1)
+ DB 128,60,0,0 ; cmpb $0x0,(%rax,%rax,1)
+ DB 128,60,0,0 ; cmpb $0x0,(%rax,%rax,1)
+ DB 128,60,0,0 ; cmpb $0x0,(%rax,%rax,1)
+ DB 252 ; cld
+ DB 190,0,0,252,190 ; mov $0xbefc0000,%esi
+ DB 0,0 ; add %al,(%rax)
+ DB 252 ; cld
+ DB 190,0,0,252,190 ; mov $0xbefc0000,%esi
DB 0,0 ; add %al,(%rax)
DB 128,63,0 ; cmpb $0x0,(%rdi)
DB 0,128,63,0,0,128 ; add %al,-0x7fffffc1(%rax)
@@ -20052,7 +20048,7 @@ ALIGN 16
DB 249 ; stc
DB 68,180,62 ; rex.R mov $0x3e,%spl
DB 163,233,220,63,163,233,220,63,163 ; movabs %eax,0xa33fdce9a33fdce9
- DB 233,220,63,163,233 ; jmpq ffffffffe9a3847a <_sk_callback_sse2+0xffffffffe9a34575>
+ DB 233,220,63,163,233 ; jmpq ffffffffe9a3847a <_sk_callback_sse2+0xffffffffe9a34579>
DB 220,63 ; fdivrl (%rdi)
DB 0,0 ; add %al,(%rax)
DB 128,63,0 ; cmpb $0x0,(%rdi)
@@ -20147,7 +20143,7 @@ ALIGN 16
DB 249 ; stc
DB 68,180,62 ; rex.R mov $0x3e,%spl
DB 163,233,220,63,163,233,220,63,163 ; movabs %eax,0xa33fdce9a33fdce9
- DB 233,220,63,163,233 ; jmpq ffffffffe9a3854a <_sk_callback_sse2+0xffffffffe9a34645>
+ DB 233,220,63,163,233 ; jmpq ffffffffe9a3854a <_sk_callback_sse2+0xffffffffe9a34649>
DB 220,63 ; fdivrl (%rdi)
DB 0,0 ; add %al,(%rax)
DB 128,63,0 ; cmpb $0x0,(%rdi)
@@ -20242,7 +20238,7 @@ ALIGN 16
DB 249 ; stc
DB 68,180,62 ; rex.R mov $0x3e,%spl
DB 163,233,220,63,163,233,220,63,163 ; movabs %eax,0xa33fdce9a33fdce9
- DB 233,220,63,163,233 ; jmpq ffffffffe9a3861a <_sk_callback_sse2+0xffffffffe9a34715>
+ DB 233,220,63,163,233 ; jmpq ffffffffe9a3861a <_sk_callback_sse2+0xffffffffe9a34719>
DB 220,63 ; fdivrl (%rdi)
DB 0,0 ; add %al,(%rax)
DB 128,63,0 ; cmpb $0x0,(%rdi)
@@ -20337,7 +20333,7 @@ ALIGN 16
DB 249 ; stc
DB 68,180,62 ; rex.R mov $0x3e,%spl
DB 163,233,220,63,163,233,220,63,163 ; movabs %eax,0xa33fdce9a33fdce9
- DB 233,220,63,163,233 ; jmpq ffffffffe9a386ea <_sk_callback_sse2+0xffffffffe9a347e5>
+ DB 233,220,63,163,233 ; jmpq ffffffffe9a386ea <_sk_callback_sse2+0xffffffffe9a347e9>
DB 220,63 ; fdivrl (%rdi)
DB 0,0 ; add %al,(%rax)
DB 128,63,0 ; cmpb $0x0,(%rdi)
@@ -21012,7 +21008,7 @@ ALIGN 16
DB 0,0 ; add %al,(%rax)
DB 0,63 ; add %bh,(%rdi)
DB 57,142,99,61,57,142 ; cmp %ecx,-0x71c6c29d(%rsi)
- DB 99,61,57,142,99,61 ; movslq 0x3d638e39(%rip),%edi # 3d63dc45 <_sk_callback_sse2+0x3d639d40>
+ DB 99,61,57,142,99,61 ; movslq 0x3d638e39(%rip),%edi # 3d63dc45 <_sk_callback_sse2+0x3d639d44>
DB 57,142,99,61,0,0 ; cmp %ecx,0x3d63(%rsi)
DB 0,63 ; add %bh,(%rdi)
DB 0,0 ; add %al,(%rax)
@@ -21038,7 +21034,7 @@ ALIGN 16
DB 0,192 ; add %al,%al
DB 63 ; (bad)
DB 57,142,99,61,57,142 ; cmp %ecx,-0x71c6c29d(%rsi)
- DB 99,61,57,142,99,61 ; movslq 0x3d638e39(%rip),%edi # 3d63dc85 <_sk_callback_sse2+0x3d639d80>
+ DB 99,61,57,142,99,61 ; movslq 0x3d638e39(%rip),%edi # 3d63dc85 <_sk_callback_sse2+0x3d639d84>
DB 57,142,99,61,0,0 ; cmp %ecx,0x3d63(%rsi)
DB 192,63,0 ; sarb $0x0,(%rdi)
DB 0,192 ; add %al,%al
@@ -21122,7 +21118,7 @@ ALIGN 16
DB 0,0 ; add %al,(%rax)
DB 0,63 ; add %bh,(%rdi)
DB 57,142,99,61,57,142 ; cmp %ecx,-0x71c6c29d(%rsi)
- DB 99,61,57,142,99,61 ; movslq 0x3d638e39(%rip),%edi # 3d63dd55 <_sk_callback_sse2+0x3d639e50>
+ DB 99,61,57,142,99,61 ; movslq 0x3d638e39(%rip),%edi # 3d63dd55 <_sk_callback_sse2+0x3d639e54>
DB 57,142,99,61,0,0 ; cmp %ecx,0x3d63(%rsi)
DB 0,63 ; add %bh,(%rdi)
DB 0,0 ; add %al,(%rax)
@@ -21148,7 +21144,7 @@ ALIGN 16
DB 0,192 ; add %al,%al
DB 63 ; (bad)
DB 57,142,99,61,57,142 ; cmp %ecx,-0x71c6c29d(%rsi)
- DB 99,61,57,142,99,61 ; movslq 0x3d638e39(%rip),%edi # 3d63dd95 <_sk_callback_sse2+0x3d639e90>
+ DB 99,61,57,142,99,61 ; movslq 0x3d638e39(%rip),%edi # 3d63dd95 <_sk_callback_sse2+0x3d639e94>
DB 57,142,99,61,0,0 ; cmp %ecx,0x3d63(%rsi)
DB 192,63,0 ; sarb $0x0,(%rdi)
DB 0,192 ; add %al,%al
@@ -21159,11 +21155,11 @@ ALIGN 16
DB 63 ; (bad)
DB 114,28 ; jb 4f8e <.literal16+0xfde>
DB 199 ; (bad)
- DB 62,114,28 ; jb,pt 4f92 <_sk_callback_sse2+0x108d>
+ DB 62,114,28 ; jb,pt 4f92 <_sk_callback_sse2+0x1091>
DB 199 ; (bad)
- DB 62,114,28 ; jb,pt 4f96 <_sk_callback_sse2+0x1091>
+ DB 62,114,28 ; jb,pt 4f96 <_sk_callback_sse2+0x1095>
DB 199 ; (bad)
- DB 62,114,28 ; jb,pt 4f9a <_sk_callback_sse2+0x1095>
+ DB 62,114,28 ; jb,pt 4f9a <_sk_callback_sse2+0x1099>
DB 199 ; (bad)
DB 62,171 ; ds stos %eax,%es:(%rdi)
DB 170 ; stos %al,%es:(%rdi)
diff --git a/src/jumper/SkJumper_stages.cpp b/src/jumper/SkJumper_stages.cpp
index b93b5a01fd..e1c245358e 100644
--- a/src/jumper/SkJumper_stages.cpp
+++ b/src/jumper/SkJumper_stages.cpp
@@ -312,15 +312,14 @@ STAGE(dither) {
| (Y & 2) << 2 | (X & 2) << 1
| (Y & 4) >> 1 | (X & 4) >> 2;
- // Scale that dither to [0,1], then [-0.5,+0.5].
- // I chose to scale by 1/63.0f here to make this exactly [0,1].
- // I suspect the divide by 64 in the article was written with fast integer math in mind.
- F dither = cast(M) * (1/63.0f) - 0.5f;
-
- // Fold in an extra alpha to dither as if applied to the unpremul values of r,g,b.
- r += c->rate*dither*a;
- g += c->rate*dither*a;
- b += c->rate*dither*a;
+ // Scale that dither to [0,1), then (-0.5,+0.5), here using 63/128 = 0.4921875 as 0.5-epsilon.
+ // We want to make sure our dither is less than 0.5 in either direction to keep exact values
+ // like 0 and 1 unchanged after rounding.
+ F dither = cast(M) * (2/128.0f) - (63/128.0f);
+
+ r += c->rate*dither;
+ g += c->rate*dither;
+ b += c->rate*dither;
}
STAGE(constant_color) {