aboutsummaryrefslogtreecommitdiffhomepage
path: root/src
diff options
context:
space:
mode:
Diffstat (limited to 'src')
-rw-r--r--src/core/SkRasterPipeline.h113
-rw-r--r--src/jumper/SkJumper.cpp129
-rw-r--r--src/jumper/SkJumper_generated.S1576
-rw-r--r--src/jumper/SkJumper_generated_win.S1283
-rw-r--r--src/jumper/SkJumper_stages.cpp33
5 files changed, 1582 insertions, 1552 deletions
diff --git a/src/core/SkRasterPipeline.h b/src/core/SkRasterPipeline.h
index f826f391ee..60464b0d44 100644
--- a/src/core/SkRasterPipeline.h
+++ b/src/core/SkRasterPipeline.h
@@ -36,62 +36,63 @@ struct SkJumper_Engine;
* If you'd like to see how this works internally, you want to start digging around src/jumper.
*/
-#define SK_RASTER_PIPELINE_STAGES(M) \
- M(callback) \
- M(move_src_dst) M(move_dst_src) \
- M(clamp_0) M(clamp_1) M(clamp_a) M(clamp_a_dst) \
- M(unpremul) M(premul) M(premul_dst) \
- M(set_rgb) M(swap_rb) M(invert) \
- M(from_srgb) M(from_srgb_dst) M(to_srgb) \
- M(black_color) M(white_color) M(uniform_color) \
- M(seed_shader) M(dither) \
- M(load_a8) M(load_a8_dst) M(store_a8) M(gather_a8) \
- M(load_g8) M(load_g8_dst) M(gather_g8) \
- M(load_565) M(load_565_dst) M(store_565) M(gather_565) \
- M(load_4444) M(load_4444_dst) M(store_4444) M(gather_4444) \
- M(load_f16) M(load_f16_dst) M(store_f16) M(gather_f16) \
- M(load_f32) M(load_f32_dst) M(store_f32) \
- M(load_8888) M(load_8888_dst) M(store_8888) M(gather_8888) \
- M(load_bgra) M(load_bgra_dst) M(store_bgra) M(gather_bgra) \
- M(load_u16_be) M(load_rgb_u16_be) M(store_u16_be) \
- M(load_tables_u16_be) M(load_tables_rgb_u16_be) \
- M(load_tables) M(load_rgba) M(store_rgba) \
- M(scale_u8) M(scale_565) M(scale_1_float) \
- M( lerp_u8) M( lerp_565) M( lerp_1_float) \
- M(dstatop) M(dstin) M(dstout) M(dstover) \
- M(srcatop) M(srcin) M(srcout) M(srcover) \
- M(clear) M(modulate) M(multiply) M(plus_) M(screen) M(xor_) \
- M(colorburn) M(colordodge) M(darken) M(difference) \
- M(exclusion) M(hardlight) M(lighten) M(overlay) M(softlight) \
- M(hue) M(saturation) M(color) M(luminosity) \
- M(srcover_rgba_8888) M(srcover_bgra_8888) \
- M(luminance_to_alpha) \
- M(matrix_translate) M(matrix_scale_translate) \
- M(matrix_2x3) M(matrix_3x4) M(matrix_4x5) M(matrix_4x3) \
- M(matrix_perspective) \
- M(parametric_r) M(parametric_g) M(parametric_b) \
- M(parametric_a) M(gamma) \
- M(table_r) M(table_g) M(table_b) M(table_a) \
- M(lab_to_xyz) \
- M(mirror_x) M(repeat_x) \
- M(mirror_y) M(repeat_y) \
- M(clamp_x_1) M(mirror_x_1) M(repeat_x_1) \
- M(bilinear_nx) M(bilinear_px) M(bilinear_ny) M(bilinear_py) \
- M(bicubic_n3x) M(bicubic_n1x) M(bicubic_p1x) M(bicubic_p3x) \
- M(bicubic_n3y) M(bicubic_n1y) M(bicubic_p1y) M(bicubic_p3y) \
- M(save_xy) M(accumulate) \
- M(evenly_spaced_gradient) \
- M(gauss_a_to_rgba) M(gradient) \
- M(evenly_spaced_2_stop_gradient) \
- M(xy_to_unit_angle) \
- M(xy_to_radius) \
- M(xy_to_2pt_conical_quadratic_min) \
- M(xy_to_2pt_conical_quadratic_max) \
- M(xy_to_2pt_conical_linear) \
- M(mask_2pt_conical_degenerates) M(apply_vector_mask) \
- M(byte_tables) M(byte_tables_rgb) \
- M(rgb_to_hsl) M(hsl_to_rgb) \
- M(clut_3D) M(clut_4D)
+#define SK_RASTER_PIPELINE_STAGES(M) \
+ M(callback) \
+ M(move_src_dst) M(move_dst_src) \
+ M(clamp_0) M(clamp_1) M(clamp_a) M(clamp_a_dst) \
+ M(unpremul) M(premul) M(premul_dst) \
+ M(set_rgb) M(swap_rb) M(invert) \
+ M(from_srgb) M(from_srgb_dst) M(to_srgb) \
+ M(black_color) M(white_color) M(uniform_color) \
+ M(seed_shader) M(dither) \
+ M(load_a8) M(load_a8_dst) M(store_a8) M(gather_a8) \
+ M(load_g8) M(load_g8_dst) M(gather_g8) \
+ M(load_565) M(load_565_dst) M(store_565) M(gather_565) \
+ M(load_4444) M(load_4444_dst) M(store_4444) M(gather_4444) \
+ M(load_f16) M(load_f16_dst) M(store_f16) M(gather_f16) \
+ M(load_f32) M(load_f32_dst) M(store_f32) \
+ M(load_8888) M(load_8888_dst) M(store_8888) M(gather_8888) \
+ M(load_bgra) M(load_bgra_dst) M(store_bgra) M(gather_bgra) \
+ M(load_u16_be) M(load_rgb_u16_be) M(store_u16_be) \
+ M(load_tables_u16_be) M(load_tables_rgb_u16_be) M(load_tables) \
+ M(load_rgba) M(store_rgba) \
+ M(scale_u8) M(scale_565) M(scale_1_float) \
+ M( lerp_u8) M( lerp_565) M( lerp_1_float) \
+ M(dstatop) M(dstin) M(dstout) M(dstover) \
+ M(srcatop) M(srcin) M(srcout) M(srcover) \
+ M(clear) M(modulate) M(multiply) M(plus_) M(screen) M(xor_) \
+ M(colorburn) M(colordodge) M(darken) M(difference) \
+ M(exclusion) M(hardlight) M(lighten) M(overlay) M(softlight) \
+ M(hue) M(saturation) M(color) M(luminosity) \
+ M(srcover_rgba_8888) M(srcover_bgra_8888) \
+ M(luminance_to_alpha) \
+ M(matrix_translate) M(matrix_scale_translate) \
+ M(matrix_2x3) M(matrix_3x4) M(matrix_4x5) M(matrix_4x3) \
+ M(matrix_perspective) \
+ M(parametric_r) M(parametric_g) M(parametric_b) \
+ M(parametric_a) M(gamma) \
+ M(table_r) M(table_g) M(table_b) M(table_a) \
+ M(lab_to_xyz) \
+ M(mirror_x) M(repeat_x) \
+ M(mirror_y) M(repeat_y) \
+ M(clamp_x_1) M(mirror_x_1) M(repeat_x_1) \
+ M(bilinear_nx) M(bilinear_px) M(bilinear_ny) M(bilinear_py) \
+ M(bicubic_n3x) M(bicubic_n1x) M(bicubic_p1x) M(bicubic_p3x) \
+ M(bicubic_n3y) M(bicubic_n1y) M(bicubic_p1y) M(bicubic_p3y) \
+ M(save_xy) M(accumulate) \
+ M(evenly_spaced_gradient) \
+ M(gradient) \
+ M(evenly_spaced_2_stop_gradient) \
+ M(xy_to_unit_angle) \
+ M(xy_to_radius) \
+ M(xy_to_2pt_conical_quadratic_min) \
+ M(xy_to_2pt_conical_quadratic_max) \
+ M(xy_to_2pt_conical_linear) \
+ M(mask_2pt_conical_degenerates) M(apply_vector_mask) \
+ M(byte_tables) M(byte_tables_rgb) \
+ M(rgb_to_hsl) M(hsl_to_rgb) \
+ M(clut_3D) M(clut_4D) \
+ M(gauss_a_to_rgba)
class SkRasterPipeline {
public:
diff --git a/src/jumper/SkJumper.cpp b/src/jumper/SkJumper.cpp
index bd46723b2d..3faee519ee 100644
--- a/src/jumper/SkJumper.cpp
+++ b/src/jumper/SkJumper.cpp
@@ -148,13 +148,13 @@ extern "C" {
#if SK_JUMPER_USE_ASSEMBLY
#if defined(__x86_64__) || defined(_M_X64)
template <SkRasterPipeline::StockStage st>
- static constexpr StageFn* hsw_lowp() { return nullptr; }
+ static constexpr StageFn* hsw_lowp();
template <SkRasterPipeline::StockStage st>
- static constexpr StageFn* sse41_lowp() { return nullptr; }
+ static constexpr StageFn* sse41_lowp();
template <SkRasterPipeline::StockStage st>
- static constexpr StageFn* sse2_lowp() { return nullptr; }
+ static constexpr StageFn* sse2_lowp();
#define LOWP(st) \
template <> constexpr StageFn* hsw_lowp<SkRasterPipeline::st>() { \
@@ -166,72 +166,111 @@ extern "C" {
template <> constexpr StageFn* sse2_lowp<SkRasterPipeline::st>() { \
return ASM(st,sse2_lowp); \
}
+ #define NOPE(st) \
+ template <> constexpr StageFn* hsw_lowp<SkRasterPipeline::st>() { \
+ return nullptr; \
+ } \
+ template <> constexpr StageFn* sse41_lowp<SkRasterPipeline::st>() { \
+ return nullptr; \
+ } \
+ template <> constexpr StageFn* sse2_lowp<SkRasterPipeline::st>() { \
+ return nullptr; \
+ }
#elif defined(__i386__) || defined(_M_IX86)
template <SkRasterPipeline::StockStage st>
- static constexpr StageFn* sse2_lowp() { return nullptr; }
+ static constexpr StageFn* sse2_lowp();
#define LOWP(st) \
template <> constexpr StageFn* sse2_lowp<SkRasterPipeline::st>() { \
return ASM(st,sse2_lowp); \
}
+ #define NOPE(st) \
+ template <> constexpr StageFn* sse2_lowp<SkRasterPipeline::st>() { \
+ return nullptr; \
+ }
#elif defined(JUMPER_NEON_HAS_LOWP)
template <SkRasterPipeline::StockStage st>
- static constexpr StageFn* neon_lowp() { return nullptr; }
+ static constexpr StageFn* neon_lowp();
#define LOWP(st) \
template <> constexpr StageFn* neon_lowp<SkRasterPipeline::st>() { \
return sk_##st##_lowp; \
}
+ #define NOPE(st) \
+ template <> constexpr StageFn* neon_lowp<SkRasterPipeline::st>() { \
+ return nullptr; \
+ }
+
#else
#define LOWP(st)
+ #define NOPE(st)
#endif
+ #define TODO(st) NOPE(st) // stages that should be implemented in lowp, but aren't.
+
+ NOPE(callback)
+ LOWP(move_src_dst) LOWP(move_dst_src)
+ NOPE(clamp_0) NOPE(clamp_1) TODO(clamp_a) TODO(clamp_a_dst)
+ NOPE(unpremul) LOWP(premul) TODO(premul_dst)
+ LOWP(set_rgb) LOWP(swap_rb) LOWP(invert)
+ NOPE(from_srgb) NOPE(from_srgb_dst) NOPE(to_srgb)
LOWP(black_color) LOWP(white_color) LOWP(uniform_color)
- LOWP(set_rgb)
- LOWP(premul)
- LOWP(luminance_to_alpha)
- LOWP(load_8888) LOWP(load_8888_dst) LOWP(store_8888)
- LOWP(load_bgra) LOWP(load_bgra_dst) LOWP(store_bgra)
- LOWP(load_a8) LOWP(load_a8_dst) LOWP(store_a8)
- LOWP(load_g8) LOWP(load_g8_dst)
- LOWP(load_565) LOWP(load_565_dst) LOWP(store_565)
- LOWP(swap_rb)
+ LOWP(seed_shader) TODO(dither)
+ LOWP(load_a8) LOWP(load_a8_dst) LOWP(store_a8) LOWP(gather_a8)
+ LOWP(load_g8) LOWP(load_g8_dst) LOWP(gather_g8)
+ LOWP(load_565) LOWP(load_565_dst) LOWP(store_565) LOWP(gather_565)
+ TODO(load_4444) TODO(load_4444_dst) TODO(store_4444) TODO(gather_4444)
+ NOPE(load_f16) NOPE(load_f16_dst) NOPE(store_f16) NOPE(gather_f16)
+ NOPE(load_f32) NOPE(load_f32_dst) NOPE(store_f32)
+ LOWP(load_8888) LOWP(load_8888_dst) LOWP(store_8888) LOWP(gather_8888)
+ LOWP(load_bgra) LOWP(load_bgra_dst) LOWP(store_bgra) LOWP(gather_bgra)
+ TODO(load_u16_be) TODO(load_rgb_u16_be) TODO(store_u16_be)
+ NOPE(load_tables_u16_be) NOPE(load_tables_rgb_u16_be) NOPE(load_tables)
+ NOPE(load_rgba) NOPE(store_rgba)
+ LOWP(scale_u8) LOWP(scale_565) LOWP(scale_1_float)
+ LOWP( lerp_u8) LOWP( lerp_565) LOWP( lerp_1_float)
+ LOWP(dstatop) LOWP(dstin) LOWP(dstout) LOWP(dstover)
+ LOWP(srcatop) LOWP(srcin) LOWP(srcout) LOWP(srcover)
+ LOWP(clear) LOWP(modulate) LOWP(multiply) LOWP(plus_) LOWP(screen) LOWP(xor_)
+ NOPE(colorburn) NOPE(colordodge) LOWP(darken) LOWP(difference)
+ LOWP(exclusion) LOWP(hardlight) LOWP(lighten) LOWP(overlay) NOPE(softlight)
+ NOPE(hue) NOPE(saturation) NOPE(color) NOPE(luminosity)
LOWP(srcover_rgba_8888) LOWP(srcover_bgra_8888)
- LOWP(lerp_1_float)
- LOWP(lerp_u8)
- LOWP(lerp_565)
- LOWP(scale_1_float)
- LOWP(scale_u8)
- LOWP(scale_565)
- LOWP(move_src_dst)
- LOWP(move_dst_src)
- LOWP(clear)
- LOWP(srcatop)
- LOWP(dstatop)
- LOWP(srcin)
- LOWP(dstin)
- LOWP(srcout)
- LOWP(dstout)
- LOWP(srcover)
- LOWP(dstover)
- LOWP(modulate)
- LOWP(multiply)
- LOWP(screen)
- LOWP(xor_)
- LOWP(plus_)
- LOWP(darken)
- LOWP(lighten)
- LOWP(difference)
- LOWP(exclusion)
- LOWP(hardlight)
- LOWP(overlay)
- LOWP(seed_shader)
- LOWP(matrix_translate) LOWP(matrix_scale_translate) LOWP(matrix_2x3) LOWP(matrix_perspective)
- LOWP(gather_8888) LOWP(gather_bgra) LOWP(gather_565) LOWP(gather_a8) LOWP(gather_g8)
+ LOWP(luminance_to_alpha)
+ LOWP(matrix_translate) LOWP(matrix_scale_translate)
+ LOWP(matrix_2x3) NOPE(matrix_3x4) TODO(matrix_4x5) TODO(matrix_4x3)
+ LOWP(matrix_perspective)
+ NOPE(parametric_r) NOPE(parametric_g) NOPE(parametric_b)
+ NOPE(parametric_a) NOPE(gamma)
+ NOPE(table_r) NOPE(table_g) NOPE(table_b) NOPE(table_a)
+ NOPE(lab_to_xyz)
+ TODO(mirror_x) TODO(repeat_x)
+ TODO(mirror_y) TODO(repeat_y)
+ TODO(clamp_x_1) TODO(mirror_x_1) TODO(repeat_x_1)
+ TODO(bilinear_nx) TODO(bilinear_px) TODO(bilinear_ny) TODO(bilinear_py)
+ TODO(bicubic_n3x) TODO(bicubic_n1x) TODO(bicubic_p1x) TODO(bicubic_p3x)
+ TODO(bicubic_n3y) TODO(bicubic_n1y) TODO(bicubic_p1y) TODO(bicubic_p3y)
+ TODO(save_xy) TODO(accumulate)
+ TODO(evenly_spaced_gradient)
+ TODO(gradient)
+ TODO(evenly_spaced_2_stop_gradient)
+ TODO(xy_to_unit_angle)
+ TODO(xy_to_radius)
+ TODO(xy_to_2pt_conical_quadratic_min)
+ TODO(xy_to_2pt_conical_quadratic_max)
+ TODO(xy_to_2pt_conical_linear)
+ TODO(mask_2pt_conical_degenerates) TODO(apply_vector_mask)
+ TODO(byte_tables) TODO(byte_tables_rgb)
+ NOPE(rgb_to_hsl) NOPE(hsl_to_rgb)
+ NOPE(clut_3D) NOPE(clut_4D)
+ NOPE(gauss_a_to_rgba)
+
#undef LOWP
+ #undef TODO
+ #undef NOPE
#endif
// Engines comprise everything we need to run SkRasterPipelines.
diff --git a/src/jumper/SkJumper_generated.S b/src/jumper/SkJumper_generated.S
index b7b6710f4d..fa97122c0e 100644
--- a/src/jumper/SkJumper_generated.S
+++ b/src/jumper/SkJumper_generated.S
@@ -7027,52 +7027,6 @@ _sk_evenly_spaced_gradient_vfp4:
.long 0xe28dd004 // add sp, sp, #4
.long 0xe8bd4ff0 // pop {r4, r5, r6, r7, r8, r9, sl, fp, lr}
.long 0xe12fff12 // bx r2
- .long 0xe320f000 // nop {0}
-
-HIDDEN _sk_gauss_a_to_rgba_vfp4
-.globl _sk_gauss_a_to_rgba_vfp4
-FUNCTION(_sk_gauss_a_to_rgba_vfp4)
-_sk_gauss_a_to_rgba_vfp4:
- .long 0xe28f2048 // add r2, pc, #72
- .long 0xf4620acf // vld1.64 {d16-d17}, [r2]
- .long 0xe28f2050 // add r2, pc, #80
- .long 0xf4622acf // vld1.64 {d18-d19}, [r2]
- .long 0xe28f2058 // add r2, pc, #88
- .long 0xf2462c70 // vfma.f32 q9, q3, q8
- .long 0xf4620acf // vld1.64 {d16-d17}, [r2]
- .long 0xe28f205c // add r2, pc, #92
- .long 0xf2460c72 // vfma.f32 q8, q3, q9
- .long 0xf4622acf // vld1.64 {d18-d19}, [r2]
- .long 0xe28f2060 // add r2, pc, #96
- .long 0xf4220acf // vld1.64 {d0-d1}, [r2]
- .long 0xe4912004 // ldr r2, [r1], #4
- .long 0xf2462c70 // vfma.f32 q9, q3, q8
- .long 0xf2060c72 // vfma.f32 q0, q3, q9
- .long 0xf2202150 // vorr q1, q0, q0
- .long 0xf2204150 // vorr q2, q0, q0
- .long 0xf2206150 // vorr q3, q0, q0
- .long 0xe12fff12 // bx r2
- .long 0xe320f000 // nop {0}
- .long 0xc011102d // .word 0xc011102d
- .long 0xc011102d // .word 0xc011102d
- .long 0xc011102d // .word 0xc011102d
- .long 0xc011102d // .word 0xc011102d
- .long 0x40397812 // .word 0x40397812
- .long 0x40397812 // .word 0x40397812
- .long 0x40397812 // .word 0x40397812
- .long 0x40397812 // .word 0x40397812
- .long 0x3e5a9420 // .word 0x3e5a9420
- .long 0x3e5a9420 // .word 0x3e5a9420
- .long 0x3e5a9420 // .word 0x3e5a9420
- .long 0x3e5a9420 // .word 0x3e5a9420
- .long 0x3e1e9d04 // .word 0x3e1e9d04
- .long 0x3e1e9d04 // .word 0x3e1e9d04
- .long 0x3e1e9d04 // .word 0x3e1e9d04
- .long 0x3e1e9d04 // .word 0x3e1e9d04
- .long 0x39a11800 // .word 0x39a11800
- .long 0x39a11800 // .word 0x39a11800
- .long 0x39a11800 // .word 0x39a11800
- .long 0x39a11800 // .word 0x39a11800
HIDDEN _sk_gradient_vfp4
.globl _sk_gradient_vfp4
@@ -7087,7 +7041,7 @@ _sk_gradient_vfp4:
.long 0xf2c00050 // vmov.i32 q8, #0
.long 0xe5923000 // ldr r3, [r2]
.long 0xe3530002 // cmp r3, #2
- .long 0x3a00000a // bcc 649c <sk_gradient_vfp4+0x54>
+ .long 0x3a00000a // bcc 63f8 <sk_gradient_vfp4+0x54>
.long 0xe5927024 // ldr r7, [r2, #36]
.long 0xf2c04051 // vmov.i32 q10, #1
.long 0xf2c00050 // vmov.i32 q8, #0
@@ -7098,7 +7052,7 @@ _sk_gradient_vfp4:
.long 0xf3468ee8 // vcge.f32 q12, q11, q12
.long 0xf35481f2 // vbsl q12, q10, q9
.long 0xf26008e8 // vadd.i32 q8, q8, q12
- .long 0x1afffff9 // bne 6484 <sk_gradient_vfp4+0x3c>
+ .long 0x1afffff9 // bne 63e0 <sk_gradient_vfp4+0x3c>
.long 0xee314b90 // vmov.32 r4, d17[1]
.long 0xe5926010 // ldr r6, [r2, #16]
.long 0xee11cb90 // vmov.32 ip, d17[0]
@@ -7217,6 +7171,7 @@ _sk_evenly_spaced_2_stop_gradient_vfp4:
.long 0xf22001f0 // vorr q0, q8, q8
.long 0xe8bd4010 // pop {r4, lr}
.long 0xe12fff1c // bx ip
+ .long 0xe320f000 // nop {0}
HIDDEN _sk_xy_to_unit_angle_vfp4
.globl _sk_xy_to_unit_angle_vfp4
@@ -8242,7 +8197,7 @@ _sk_clut_3D_vfp4:
.long 0xe0835105 // add r5, r3, r5, lsl #2
.long 0xedd55a00 // vldr s11, [r5]
.long 0xee325b90 // vmov.32 r5, d18[1]
- .long 0xea000004 // b 74b0 <sk_clut_3D_vfp4+0x508>
+ .long 0xea000004 // b 7410 <sk_clut_3D_vfp4+0x508>
.long 0xe320f000 // nop {0}
.long 0x3f7ff972 // .word 0x3f7ff972
.long 0x3f7ff972 // .word 0x3f7ff972
@@ -8759,7 +8714,7 @@ _sk_clut_4D_vfp4:
.long 0xf2802051 // vmov.i32 q1, #1
.long 0xf22e29e0 // vmla.i32 q1, q15, q8
.long 0xedd20a00 // vldr s1, [r2]
- .long 0xea000004 // b 7cb0 <sk_clut_4D_vfp4+0x528>
+ .long 0xea000004 // b 7c10 <sk_clut_4D_vfp4+0x528>
.long 0xe320f000 // nop {0}
.long 0x3f7ff972 // .word 0x3f7ff972
.long 0x3f7ff972 // .word 0x3f7ff972
@@ -9483,6 +9438,51 @@ _sk_clut_4D_vfp4:
.long 0x3f800000 // .word 0x3f800000
.long 0x3f800000 // .word 0x3f800000
.long 0x3f800000 // .word 0x3f800000
+
+HIDDEN _sk_gauss_a_to_rgba_vfp4
+.globl _sk_gauss_a_to_rgba_vfp4
+FUNCTION(_sk_gauss_a_to_rgba_vfp4)
+_sk_gauss_a_to_rgba_vfp4:
+ .long 0xe28f2048 // add r2, pc, #72
+ .long 0xf4620acf // vld1.64 {d16-d17}, [r2]
+ .long 0xe28f2050 // add r2, pc, #80
+ .long 0xf4622acf // vld1.64 {d18-d19}, [r2]
+ .long 0xe28f2058 // add r2, pc, #88
+ .long 0xf2462c70 // vfma.f32 q9, q3, q8
+ .long 0xf4620acf // vld1.64 {d16-d17}, [r2]
+ .long 0xe28f205c // add r2, pc, #92
+ .long 0xf2460c72 // vfma.f32 q8, q3, q9
+ .long 0xf4622acf // vld1.64 {d18-d19}, [r2]
+ .long 0xe28f2060 // add r2, pc, #96
+ .long 0xf4220acf // vld1.64 {d0-d1}, [r2]
+ .long 0xe4912004 // ldr r2, [r1], #4
+ .long 0xf2462c70 // vfma.f32 q9, q3, q8
+ .long 0xf2060c72 // vfma.f32 q0, q3, q9
+ .long 0xf2202150 // vorr q1, q0, q0
+ .long 0xf2204150 // vorr q2, q0, q0
+ .long 0xf2206150 // vorr q3, q0, q0
+ .long 0xe12fff12 // bx r2
+ .long 0xe320f000 // nop {0}
+ .long 0xc011102d // .word 0xc011102d
+ .long 0xc011102d // .word 0xc011102d
+ .long 0xc011102d // .word 0xc011102d
+ .long 0xc011102d // .word 0xc011102d
+ .long 0x40397812 // .word 0x40397812
+ .long 0x40397812 // .word 0x40397812
+ .long 0x40397812 // .word 0x40397812
+ .long 0x40397812 // .word 0x40397812
+ .long 0x3e5a9420 // .word 0x3e5a9420
+ .long 0x3e5a9420 // .word 0x3e5a9420
+ .long 0x3e5a9420 // .word 0x3e5a9420
+ .long 0x3e5a9420 // .word 0x3e5a9420
+ .long 0x3e1e9d04 // .word 0x3e1e9d04
+ .long 0x3e1e9d04 // .word 0x3e1e9d04
+ .long 0x3e1e9d04 // .word 0x3e1e9d04
+ .long 0x3e1e9d04 // .word 0x3e1e9d04
+ .long 0x39a11800 // .word 0x39a11800
+ .long 0x39a11800 // .word 0x39a11800
+ .long 0x39a11800 // .word 0x39a11800
+ .long 0x39a11800 // .word 0x39a11800
#elif defined(__x86_64__)
BALIGN32
@@ -15465,21 +15465,6 @@ _sk_evenly_spaced_gradient_skx:
.byte 197,124,41,192 // vmovaps %ymm8,%ymm0
.byte 255,224 // jmpq *%rax
-HIDDEN _sk_gauss_a_to_rgba_skx
-.globl _sk_gauss_a_to_rgba_skx
-FUNCTION(_sk_gauss_a_to_rgba_skx)
-_sk_gauss_a_to_rgba_skx:
- .byte 196,226,125,24,5,27,247,2,0 // vbroadcastss 0x2f71b(%rip),%ymm0 # 356e4 <_sk_srcover_bgra_8888_sse2_lowp+0x3dc>
- .byte 98,242,101,56,168,5,21,247,2,0 // vfmadd213ps 0x2f715(%rip){1to8},%ymm3,%ymm0 # 356e8 <_sk_srcover_bgra_8888_sse2_lowp+0x3e0>
- .byte 98,242,101,56,168,5,15,247,2,0 // vfmadd213ps 0x2f70f(%rip){1to8},%ymm3,%ymm0 # 356ec <_sk_srcover_bgra_8888_sse2_lowp+0x3e4>
- .byte 98,242,101,56,168,5,9,247,2,0 // vfmadd213ps 0x2f709(%rip){1to8},%ymm3,%ymm0 # 356f0 <_sk_srcover_bgra_8888_sse2_lowp+0x3e8>
- .byte 98,242,101,56,168,5,3,247,2,0 // vfmadd213ps 0x2f703(%rip){1to8},%ymm3,%ymm0 # 356f4 <_sk_srcover_bgra_8888_sse2_lowp+0x3ec>
- .byte 72,173 // lods %ds:(%rsi),%rax
- .byte 197,252,40,200 // vmovaps %ymm0,%ymm1
- .byte 197,252,40,208 // vmovaps %ymm0,%ymm2
- .byte 197,252,40,216 // vmovaps %ymm0,%ymm3
- .byte 255,224 // jmpq *%rax
-
HIDDEN _sk_gradient_skx
.globl _sk_gradient_skx
FUNCTION(_sk_gradient_skx)
@@ -15487,11 +15472,11 @@ _sk_gradient_skx:
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 76,139,0 // mov (%rax),%r8
.byte 73,131,248,1 // cmp $0x1,%r8
- .byte 15,134,229,0,0,0 // jbe 60f5 <_sk_gradient_skx+0xf4>
+ .byte 15,134,229,0,0,0 // jbe 60b4 <_sk_gradient_skx+0xf4>
.byte 76,139,72,72 // mov 0x48(%rax),%r9
.byte 197,244,87,201 // vxorps %ymm1,%ymm1,%ymm1
.byte 65,186,1,0,0,0 // mov $0x1,%r10d
- .byte 196,226,125,24,21,149,245,2,0 // vbroadcastss 0x2f595(%rip),%ymm2 # 355bc <_sk_srcover_bgra_8888_sse2_lowp+0x2b4>
+ .byte 196,226,125,24,21,214,245,2,0 // vbroadcastss 0x2f5d6(%rip),%ymm2 # 355bc <_sk_srcover_bgra_8888_sse2_lowp+0x2b4>
.byte 196,65,53,239,201 // vpxor %ymm9,%ymm9,%ymm9
.byte 196,130,125,24,28,145 // vbroadcastss (%r9,%r10,4),%ymm3
.byte 98,241,100,40,194,192,2 // vcmpleps %ymm0,%ymm3,%k0
@@ -15500,10 +15485,10 @@ _sk_gradient_skx:
.byte 197,53,254,203 // vpaddd %ymm3,%ymm9,%ymm9
.byte 73,131,194,1 // add $0x1,%r10
.byte 77,57,208 // cmp %r10,%r8
- .byte 117,218 // jne 602c <_sk_gradient_skx+0x2b>
+ .byte 117,218 // jne 5feb <_sk_gradient_skx+0x2b>
.byte 76,139,72,8 // mov 0x8(%rax),%r9
.byte 73,131,248,8 // cmp $0x8,%r8
- .byte 15,134,158,0,0,0 // jbe 60fe <_sk_gradient_skx+0xfd>
+ .byte 15,134,158,0,0,0 // jbe 60bd <_sk_gradient_skx+0xfd>
.byte 197,245,118,201 // vpcmpeqd %ymm1,%ymm1,%ymm1
.byte 196,65,60,87,192 // vxorps %ymm8,%ymm8,%ymm8
.byte 196,2,117,146,4,137 // vgatherdps %ymm1,(%r9,%ymm9,4),%ymm8
@@ -15535,7 +15520,7 @@ _sk_gradient_skx:
.byte 196,65,20,87,237 // vxorps %ymm13,%ymm13,%ymm13
.byte 72,139,64,64 // mov 0x40(%rax),%rax
.byte 196,34,13,146,44,136 // vgatherdps %ymm14,(%rax,%ymm9,4),%ymm13
- .byte 235,77 // jmp 6142 <_sk_gradient_skx+0x141>
+ .byte 235,77 // jmp 6101 <_sk_gradient_skx+0x141>
.byte 76,139,72,8 // mov 0x8(%rax),%r9
.byte 196,65,52,87,201 // vxorps %ymm9,%ymm9,%ymm9
.byte 196,66,53,22,1 // vpermps (%r9),%ymm9,%ymm8
@@ -15591,24 +15576,24 @@ _sk_xy_to_unit_angle_skx:
.byte 196,65,52,95,226 // vmaxps %ymm10,%ymm9,%ymm12
.byte 196,65,36,94,220 // vdivps %ymm12,%ymm11,%ymm11
.byte 196,65,36,89,227 // vmulps %ymm11,%ymm11,%ymm12
- .byte 196,98,125,24,45,43,245,2,0 // vbroadcastss 0x2f52b(%rip),%ymm13 # 356f8 <_sk_srcover_bgra_8888_sse2_lowp+0x3f0>
- .byte 98,114,29,56,168,45,37,245,2,0 // vfmadd213ps 0x2f525(%rip){1to8},%ymm12,%ymm13 # 356fc <_sk_srcover_bgra_8888_sse2_lowp+0x3f4>
- .byte 98,114,29,56,168,45,31,245,2,0 // vfmadd213ps 0x2f51f(%rip){1to8},%ymm12,%ymm13 # 35700 <_sk_srcover_bgra_8888_sse2_lowp+0x3f8>
- .byte 98,114,29,56,168,45,25,245,2,0 // vfmadd213ps 0x2f519(%rip){1to8},%ymm12,%ymm13 # 35704 <_sk_srcover_bgra_8888_sse2_lowp+0x3fc>
+ .byte 196,98,125,24,45,88,245,2,0 // vbroadcastss 0x2f558(%rip),%ymm13 # 356e4 <_sk_srcover_bgra_8888_sse2_lowp+0x3dc>
+ .byte 98,114,29,56,168,45,82,245,2,0 // vfmadd213ps 0x2f552(%rip){1to8},%ymm12,%ymm13 # 356e8 <_sk_srcover_bgra_8888_sse2_lowp+0x3e0>
+ .byte 98,114,29,56,168,45,76,245,2,0 // vfmadd213ps 0x2f54c(%rip){1to8},%ymm12,%ymm13 # 356ec <_sk_srcover_bgra_8888_sse2_lowp+0x3e4>
+ .byte 98,114,29,56,168,45,70,245,2,0 // vfmadd213ps 0x2f546(%rip){1to8},%ymm12,%ymm13 # 356f0 <_sk_srcover_bgra_8888_sse2_lowp+0x3e8>
.byte 196,65,36,89,221 // vmulps %ymm13,%ymm11,%ymm11
.byte 98,209,52,40,194,194,1 // vcmpltps %ymm10,%ymm9,%k0
.byte 98,114,126,40,56,200 // vpmovm2d %k0,%ymm9
- .byte 196,98,125,24,21,2,245,2,0 // vbroadcastss 0x2f502(%rip),%ymm10 # 35708 <_sk_srcover_bgra_8888_sse2_lowp+0x400>
+ .byte 196,98,125,24,21,47,245,2,0 // vbroadcastss 0x2f52f(%rip),%ymm10 # 356f4 <_sk_srcover_bgra_8888_sse2_lowp+0x3ec>
.byte 196,65,44,92,211 // vsubps %ymm11,%ymm10,%ymm10
.byte 196,67,37,74,202,144 // vblendvps %ymm9,%ymm10,%ymm11,%ymm9
.byte 98,209,124,40,194,192,1 // vcmpltps %ymm8,%ymm0,%k0
.byte 98,242,126,40,56,192 // vpmovm2d %k0,%ymm0
- .byte 196,98,125,24,21,141,243,2,0 // vbroadcastss 0x2f38d(%rip),%ymm10 # 355b4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
+ .byte 196,98,125,24,21,206,243,2,0 // vbroadcastss 0x2f3ce(%rip),%ymm10 # 355b4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
.byte 196,65,44,92,209 // vsubps %ymm9,%ymm10,%ymm10
.byte 196,195,53,74,194,0 // vblendvps %ymm0,%ymm10,%ymm9,%ymm0
.byte 98,209,116,40,194,192,1 // vcmpltps %ymm8,%ymm1,%k0
.byte 98,114,126,40,56,200 // vpmovm2d %k0,%ymm9
- .byte 196,98,125,24,21,112,243,2,0 // vbroadcastss 0x2f370(%rip),%ymm10 # 355b8 <_sk_srcover_bgra_8888_sse2_lowp+0x2b0>
+ .byte 196,98,125,24,21,177,243,2,0 // vbroadcastss 0x2f3b1(%rip),%ymm10 # 355b8 <_sk_srcover_bgra_8888_sse2_lowp+0x2b0>
.byte 197,44,92,208 // vsubps %ymm0,%ymm10,%ymm10
.byte 196,195,125,74,194,144 // vblendvps %ymm9,%ymm10,%ymm0,%ymm0
.byte 98,209,124,40,194,192,3 // vcmpunordps %ymm8,%ymm0,%k0
@@ -15637,20 +15622,20 @@ _sk_xy_to_2pt_conical_quadratic_max_skx:
.byte 197,50,89,80,76 // vmulss 0x4c(%rax),%xmm9,%xmm10
.byte 196,66,125,24,210 // vbroadcastss %xmm10,%ymm10
.byte 197,44,88,208 // vaddps %ymm0,%ymm10,%ymm10
- .byte 98,113,44,56,89,21,108,244,2,0 // vmulps 0x2f46c(%rip){1to8},%ymm10,%ymm10 # 3570c <_sk_srcover_bgra_8888_sse2_lowp+0x404>
+ .byte 98,113,44,56,89,21,153,244,2,0 // vmulps 0x2f499(%rip){1to8},%ymm10,%ymm10 # 356f8 <_sk_srcover_bgra_8888_sse2_lowp+0x3f0>
.byte 197,116,89,217 // vmulps %ymm1,%ymm1,%ymm11
.byte 196,98,125,184,216 // vfmadd231ps %ymm0,%ymm0,%ymm11
.byte 196,193,50,89,193 // vmulss %xmm9,%xmm9,%xmm0
.byte 196,226,125,24,192 // vbroadcastss %xmm0,%ymm0
.byte 197,164,92,192 // vsubps %ymm0,%ymm11,%ymm0
- .byte 98,113,60,56,89,5,79,244,2,0 // vmulps 0x2f44f(%rip){1to8},%ymm8,%ymm8 # 35710 <_sk_srcover_bgra_8888_sse2_lowp+0x408>
+ .byte 98,113,60,56,89,5,124,244,2,0 // vmulps 0x2f47c(%rip){1to8},%ymm8,%ymm8 # 356fc <_sk_srcover_bgra_8888_sse2_lowp+0x3f4>
.byte 197,188,89,192 // vmulps %ymm0,%ymm8,%ymm0
.byte 196,194,45,184,194 // vfmadd231ps %ymm10,%ymm10,%ymm0
.byte 197,252,81,192 // vsqrtps %ymm0,%ymm0
.byte 196,98,125,24,64,68 // vbroadcastss 0x44(%rax),%ymm8
- .byte 98,113,44,56,87,13,54,244,2,0 // vxorps 0x2f436(%rip){1to8},%ymm10,%ymm9 # 35714 <_sk_srcover_bgra_8888_sse2_lowp+0x40c>
+ .byte 98,113,44,56,87,13,99,244,2,0 // vxorps 0x2f463(%rip){1to8},%ymm10,%ymm9 # 35700 <_sk_srcover_bgra_8888_sse2_lowp+0x3f8>
.byte 196,65,124,92,210 // vsubps %ymm10,%ymm0,%ymm10
- .byte 98,113,60,56,89,5,199,242,2,0 // vmulps 0x2f2c7(%rip){1to8},%ymm8,%ymm8 # 355b4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
+ .byte 98,113,60,56,89,5,8,243,2,0 // vmulps 0x2f308(%rip){1to8},%ymm8,%ymm8 # 355b4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
.byte 196,65,44,89,208 // vmulps %ymm8,%ymm10,%ymm10
.byte 197,180,92,192 // vsubps %ymm0,%ymm9,%ymm0
.byte 196,193,124,89,192 // vmulps %ymm8,%ymm0,%ymm0
@@ -15668,20 +15653,20 @@ _sk_xy_to_2pt_conical_quadratic_min_skx:
.byte 197,50,89,80,76 // vmulss 0x4c(%rax),%xmm9,%xmm10
.byte 196,66,125,24,210 // vbroadcastss %xmm10,%ymm10
.byte 197,44,88,208 // vaddps %ymm0,%ymm10,%ymm10
- .byte 98,113,44,56,89,21,228,243,2,0 // vmulps 0x2f3e4(%rip){1to8},%ymm10,%ymm10 # 3570c <_sk_srcover_bgra_8888_sse2_lowp+0x404>
+ .byte 98,113,44,56,89,21,17,244,2,0 // vmulps 0x2f411(%rip){1to8},%ymm10,%ymm10 # 356f8 <_sk_srcover_bgra_8888_sse2_lowp+0x3f0>
.byte 197,116,89,217 // vmulps %ymm1,%ymm1,%ymm11
.byte 196,98,125,184,216 // vfmadd231ps %ymm0,%ymm0,%ymm11
.byte 196,193,50,89,193 // vmulss %xmm9,%xmm9,%xmm0
.byte 196,226,125,24,192 // vbroadcastss %xmm0,%ymm0
.byte 197,164,92,192 // vsubps %ymm0,%ymm11,%ymm0
- .byte 98,113,60,56,89,5,199,243,2,0 // vmulps 0x2f3c7(%rip){1to8},%ymm8,%ymm8 # 35710 <_sk_srcover_bgra_8888_sse2_lowp+0x408>
+ .byte 98,113,60,56,89,5,244,243,2,0 // vmulps 0x2f3f4(%rip){1to8},%ymm8,%ymm8 # 356fc <_sk_srcover_bgra_8888_sse2_lowp+0x3f4>
.byte 197,188,89,192 // vmulps %ymm0,%ymm8,%ymm0
.byte 196,194,45,184,194 // vfmadd231ps %ymm10,%ymm10,%ymm0
.byte 197,252,81,192 // vsqrtps %ymm0,%ymm0
.byte 196,98,125,24,64,68 // vbroadcastss 0x44(%rax),%ymm8
- .byte 98,113,44,56,87,13,174,243,2,0 // vxorps 0x2f3ae(%rip){1to8},%ymm10,%ymm9 # 35714 <_sk_srcover_bgra_8888_sse2_lowp+0x40c>
+ .byte 98,113,44,56,87,13,219,243,2,0 // vxorps 0x2f3db(%rip){1to8},%ymm10,%ymm9 # 35700 <_sk_srcover_bgra_8888_sse2_lowp+0x3f8>
.byte 196,65,124,92,210 // vsubps %ymm10,%ymm0,%ymm10
- .byte 98,113,60,56,89,5,63,242,2,0 // vmulps 0x2f23f(%rip){1to8},%ymm8,%ymm8 # 355b4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
+ .byte 98,113,60,56,89,5,128,242,2,0 // vmulps 0x2f280(%rip){1to8},%ymm8,%ymm8 # 355b4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
.byte 196,65,44,89,208 // vmulps %ymm8,%ymm10,%ymm10
.byte 197,180,92,192 // vsubps %ymm0,%ymm9,%ymm0
.byte 196,193,124,89,192 // vmulps %ymm8,%ymm0,%ymm0
@@ -15698,13 +15683,13 @@ _sk_xy_to_2pt_conical_linear_skx:
.byte 197,58,89,72,76 // vmulss 0x4c(%rax),%xmm8,%xmm9
.byte 196,66,125,24,201 // vbroadcastss %xmm9,%ymm9
.byte 197,52,88,200 // vaddps %ymm0,%ymm9,%ymm9
- .byte 98,113,52,56,89,13,98,243,2,0 // vmulps 0x2f362(%rip){1to8},%ymm9,%ymm9 # 3570c <_sk_srcover_bgra_8888_sse2_lowp+0x404>
+ .byte 98,113,52,56,89,13,143,243,2,0 // vmulps 0x2f38f(%rip){1to8},%ymm9,%ymm9 # 356f8 <_sk_srcover_bgra_8888_sse2_lowp+0x3f0>
.byte 197,116,89,209 // vmulps %ymm1,%ymm1,%ymm10
.byte 196,98,125,184,208 // vfmadd231ps %ymm0,%ymm0,%ymm10
.byte 196,193,58,89,192 // vmulss %xmm8,%xmm8,%xmm0
.byte 196,226,125,24,192 // vbroadcastss %xmm0,%ymm0
.byte 197,172,92,192 // vsubps %ymm0,%ymm10,%ymm0
- .byte 98,241,124,56,87,5,73,243,2,0 // vxorps 0x2f349(%rip){1to8},%ymm0,%ymm0 # 35714 <_sk_srcover_bgra_8888_sse2_lowp+0x40c>
+ .byte 98,241,124,56,87,5,118,243,2,0 // vxorps 0x2f376(%rip){1to8},%ymm0,%ymm0 # 35700 <_sk_srcover_bgra_8888_sse2_lowp+0x3f8>
.byte 196,193,124,94,193 // vdivps %ymm9,%ymm0,%ymm0
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 255,224 // jmpq *%rax
@@ -15746,7 +15731,7 @@ HIDDEN _sk_save_xy_skx
FUNCTION(_sk_save_xy_skx)
_sk_save_xy_skx:
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 196,98,125,24,5,118,241,2,0 // vbroadcastss 0x2f176(%rip),%ymm8 # 355b4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
+ .byte 196,98,125,24,5,183,241,2,0 // vbroadcastss 0x2f1b7(%rip),%ymm8 # 355b4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
.byte 196,65,124,88,200 // vaddps %ymm8,%ymm0,%ymm9
.byte 196,67,125,8,209,1 // vroundps $0x1,%ymm9,%ymm10
.byte 196,65,52,92,202 // vsubps %ymm10,%ymm9,%ymm9
@@ -15781,8 +15766,8 @@ FUNCTION(_sk_bilinear_nx_skx)
_sk_bilinear_nx_skx:
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 197,252,16,0 // vmovups (%rax),%ymm0
- .byte 98,241,124,56,88,5,95,242,2,0 // vaddps 0x2f25f(%rip){1to8},%ymm0,%ymm0 # 35718 <_sk_srcover_bgra_8888_sse2_lowp+0x410>
- .byte 196,98,125,24,5,246,240,2,0 // vbroadcastss 0x2f0f6(%rip),%ymm8 # 355b8 <_sk_srcover_bgra_8888_sse2_lowp+0x2b0>
+ .byte 98,241,124,56,88,5,140,242,2,0 // vaddps 0x2f28c(%rip){1to8},%ymm0,%ymm0 # 35704 <_sk_srcover_bgra_8888_sse2_lowp+0x3fc>
+ .byte 196,98,125,24,5,55,241,2,0 // vbroadcastss 0x2f137(%rip),%ymm8 # 355b8 <_sk_srcover_bgra_8888_sse2_lowp+0x2b0>
.byte 197,60,92,128,128,0,0,0 // vsubps 0x80(%rax),%ymm8,%ymm8
.byte 197,124,17,128,0,1,0,0 // vmovups %ymm8,0x100(%rax)
.byte 72,173 // lods %ds:(%rsi),%rax
@@ -15795,7 +15780,7 @@ _sk_bilinear_px_skx:
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 197,252,16,0 // vmovups (%rax),%ymm0
.byte 197,124,16,128,128,0,0,0 // vmovups 0x80(%rax),%ymm8
- .byte 98,241,124,56,88,5,198,240,2,0 // vaddps 0x2f0c6(%rip){1to8},%ymm0,%ymm0 # 355b4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
+ .byte 98,241,124,56,88,5,7,241,2,0 // vaddps 0x2f107(%rip){1to8},%ymm0,%ymm0 # 355b4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
.byte 197,124,17,128,0,1,0,0 // vmovups %ymm8,0x100(%rax)
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 255,224 // jmpq *%rax
@@ -15806,8 +15791,8 @@ FUNCTION(_sk_bilinear_ny_skx)
_sk_bilinear_ny_skx:
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 197,252,16,72,64 // vmovups 0x40(%rax),%ymm1
- .byte 98,241,116,56,88,13,13,242,2,0 // vaddps 0x2f20d(%rip){1to8},%ymm1,%ymm1 # 35718 <_sk_srcover_bgra_8888_sse2_lowp+0x410>
- .byte 196,98,125,24,5,164,240,2,0 // vbroadcastss 0x2f0a4(%rip),%ymm8 # 355b8 <_sk_srcover_bgra_8888_sse2_lowp+0x2b0>
+ .byte 98,241,116,56,88,13,58,242,2,0 // vaddps 0x2f23a(%rip){1to8},%ymm1,%ymm1 # 35704 <_sk_srcover_bgra_8888_sse2_lowp+0x3fc>
+ .byte 196,98,125,24,5,229,240,2,0 // vbroadcastss 0x2f0e5(%rip),%ymm8 # 355b8 <_sk_srcover_bgra_8888_sse2_lowp+0x2b0>
.byte 197,60,92,128,192,0,0,0 // vsubps 0xc0(%rax),%ymm8,%ymm8
.byte 197,124,17,128,64,1,0,0 // vmovups %ymm8,0x140(%rax)
.byte 72,173 // lods %ds:(%rsi),%rax
@@ -15820,7 +15805,7 @@ _sk_bilinear_py_skx:
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 197,252,16,72,64 // vmovups 0x40(%rax),%ymm1
.byte 197,124,16,128,192,0,0,0 // vmovups 0xc0(%rax),%ymm8
- .byte 98,241,116,56,88,13,115,240,2,0 // vaddps 0x2f073(%rip){1to8},%ymm1,%ymm1 # 355b4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
+ .byte 98,241,116,56,88,13,180,240,2,0 // vaddps 0x2f0b4(%rip){1to8},%ymm1,%ymm1 # 355b4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
.byte 197,124,17,128,64,1,0,0 // vmovups %ymm8,0x140(%rax)
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 255,224 // jmpq *%rax
@@ -15831,12 +15816,12 @@ FUNCTION(_sk_bicubic_n3x_skx)
_sk_bicubic_n3x_skx:
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 197,252,16,0 // vmovups (%rax),%ymm0
- .byte 98,241,124,56,88,5,191,241,2,0 // vaddps 0x2f1bf(%rip){1to8},%ymm0,%ymm0 # 3571c <_sk_srcover_bgra_8888_sse2_lowp+0x414>
- .byte 196,98,125,24,5,82,240,2,0 // vbroadcastss 0x2f052(%rip),%ymm8 # 355b8 <_sk_srcover_bgra_8888_sse2_lowp+0x2b0>
+ .byte 98,241,124,56,88,5,236,241,2,0 // vaddps 0x2f1ec(%rip){1to8},%ymm0,%ymm0 # 35708 <_sk_srcover_bgra_8888_sse2_lowp+0x400>
+ .byte 196,98,125,24,5,147,240,2,0 // vbroadcastss 0x2f093(%rip),%ymm8 # 355b8 <_sk_srcover_bgra_8888_sse2_lowp+0x2b0>
.byte 197,60,92,128,128,0,0,0 // vsubps 0x80(%rax),%ymm8,%ymm8
.byte 196,65,60,89,200 // vmulps %ymm8,%ymm8,%ymm9
- .byte 196,98,125,24,21,164,241,2,0 // vbroadcastss 0x2f1a4(%rip),%ymm10 # 35720 <_sk_srcover_bgra_8888_sse2_lowp+0x418>
- .byte 98,114,61,56,168,21,166,240,2,0 // vfmadd213ps 0x2f0a6(%rip){1to8},%ymm8,%ymm10 # 3562c <_sk_srcover_bgra_8888_sse2_lowp+0x324>
+ .byte 196,98,125,24,21,209,241,2,0 // vbroadcastss 0x2f1d1(%rip),%ymm10 # 3570c <_sk_srcover_bgra_8888_sse2_lowp+0x404>
+ .byte 98,114,61,56,168,21,231,240,2,0 // vfmadd213ps 0x2f0e7(%rip){1to8},%ymm8,%ymm10 # 3562c <_sk_srcover_bgra_8888_sse2_lowp+0x324>
.byte 196,65,44,89,193 // vmulps %ymm9,%ymm10,%ymm8
.byte 197,124,17,128,0,1,0,0 // vmovups %ymm8,0x100(%rax)
.byte 72,173 // lods %ds:(%rsi),%rax
@@ -15848,13 +15833,13 @@ FUNCTION(_sk_bicubic_n1x_skx)
_sk_bicubic_n1x_skx:
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 197,252,16,0 // vmovups (%rax),%ymm0
- .byte 98,241,124,56,88,5,113,241,2,0 // vaddps 0x2f171(%rip){1to8},%ymm0,%ymm0 # 35718 <_sk_srcover_bgra_8888_sse2_lowp+0x410>
- .byte 196,98,125,24,5,8,240,2,0 // vbroadcastss 0x2f008(%rip),%ymm8 # 355b8 <_sk_srcover_bgra_8888_sse2_lowp+0x2b0>
+ .byte 98,241,124,56,88,5,158,241,2,0 // vaddps 0x2f19e(%rip){1to8},%ymm0,%ymm0 # 35704 <_sk_srcover_bgra_8888_sse2_lowp+0x3fc>
+ .byte 196,98,125,24,5,73,240,2,0 // vbroadcastss 0x2f049(%rip),%ymm8 # 355b8 <_sk_srcover_bgra_8888_sse2_lowp+0x2b0>
.byte 197,60,92,128,128,0,0,0 // vsubps 0x80(%rax),%ymm8,%ymm8
- .byte 196,98,125,24,13,99,241,2,0 // vbroadcastss 0x2f163(%rip),%ymm9 # 35724 <_sk_srcover_bgra_8888_sse2_lowp+0x41c>
- .byte 98,114,61,56,168,13,93,241,2,0 // vfmadd213ps 0x2f15d(%rip){1to8},%ymm8,%ymm9 # 35728 <_sk_srcover_bgra_8888_sse2_lowp+0x420>
- .byte 98,114,61,56,168,13,223,239,2,0 // vfmadd213ps 0x2efdf(%rip){1to8},%ymm8,%ymm9 # 355b4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
- .byte 98,114,61,56,168,13,77,241,2,0 // vfmadd213ps 0x2f14d(%rip){1to8},%ymm8,%ymm9 # 3572c <_sk_srcover_bgra_8888_sse2_lowp+0x424>
+ .byte 196,98,125,24,13,144,241,2,0 // vbroadcastss 0x2f190(%rip),%ymm9 # 35710 <_sk_srcover_bgra_8888_sse2_lowp+0x408>
+ .byte 98,114,61,56,168,13,138,241,2,0 // vfmadd213ps 0x2f18a(%rip){1to8},%ymm8,%ymm9 # 35714 <_sk_srcover_bgra_8888_sse2_lowp+0x40c>
+ .byte 98,114,61,56,168,13,32,240,2,0 // vfmadd213ps 0x2f020(%rip){1to8},%ymm8,%ymm9 # 355b4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
+ .byte 98,114,61,56,168,13,122,241,2,0 // vfmadd213ps 0x2f17a(%rip){1to8},%ymm8,%ymm9 # 35718 <_sk_srcover_bgra_8888_sse2_lowp+0x410>
.byte 197,124,17,136,0,1,0,0 // vmovups %ymm9,0x100(%rax)
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 255,224 // jmpq *%rax
@@ -15864,13 +15849,13 @@ HIDDEN _sk_bicubic_p1x_skx
FUNCTION(_sk_bicubic_p1x_skx)
_sk_bicubic_p1x_skx:
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 196,98,125,24,5,190,239,2,0 // vbroadcastss 0x2efbe(%rip),%ymm8 # 355b4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
+ .byte 196,98,125,24,5,255,239,2,0 // vbroadcastss 0x2efff(%rip),%ymm8 # 355b4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
.byte 197,188,88,0 // vaddps (%rax),%ymm8,%ymm0
.byte 197,124,16,136,128,0,0,0 // vmovups 0x80(%rax),%ymm9
- .byte 196,98,125,24,21,25,241,2,0 // vbroadcastss 0x2f119(%rip),%ymm10 # 35724 <_sk_srcover_bgra_8888_sse2_lowp+0x41c>
- .byte 98,114,53,56,168,21,19,241,2,0 // vfmadd213ps 0x2f113(%rip){1to8},%ymm9,%ymm10 # 35728 <_sk_srcover_bgra_8888_sse2_lowp+0x420>
+ .byte 196,98,125,24,21,70,241,2,0 // vbroadcastss 0x2f146(%rip),%ymm10 # 35710 <_sk_srcover_bgra_8888_sse2_lowp+0x408>
+ .byte 98,114,53,56,168,21,64,241,2,0 // vfmadd213ps 0x2f140(%rip){1to8},%ymm9,%ymm10 # 35714 <_sk_srcover_bgra_8888_sse2_lowp+0x40c>
.byte 196,66,53,168,208 // vfmadd213ps %ymm8,%ymm9,%ymm10
- .byte 98,114,53,56,168,21,8,241,2,0 // vfmadd213ps 0x2f108(%rip){1to8},%ymm9,%ymm10 # 3572c <_sk_srcover_bgra_8888_sse2_lowp+0x424>
+ .byte 98,114,53,56,168,21,53,241,2,0 // vfmadd213ps 0x2f135(%rip){1to8},%ymm9,%ymm10 # 35718 <_sk_srcover_bgra_8888_sse2_lowp+0x410>
.byte 197,124,17,144,0,1,0,0 // vmovups %ymm10,0x100(%rax)
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 255,224 // jmpq *%rax
@@ -15882,10 +15867,10 @@ _sk_bicubic_p3x_skx:
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 197,252,16,0 // vmovups (%rax),%ymm0
.byte 197,124,16,128,128,0,0,0 // vmovups 0x80(%rax),%ymm8
- .byte 98,241,124,56,88,5,224,240,2,0 // vaddps 0x2f0e0(%rip){1to8},%ymm0,%ymm0 # 35728 <_sk_srcover_bgra_8888_sse2_lowp+0x420>
+ .byte 98,241,124,56,88,5,13,241,2,0 // vaddps 0x2f10d(%rip){1to8},%ymm0,%ymm0 # 35714 <_sk_srcover_bgra_8888_sse2_lowp+0x40c>
.byte 196,65,60,89,200 // vmulps %ymm8,%ymm8,%ymm9
- .byte 196,98,125,24,21,202,240,2,0 // vbroadcastss 0x2f0ca(%rip),%ymm10 # 35720 <_sk_srcover_bgra_8888_sse2_lowp+0x418>
- .byte 98,114,61,56,168,21,204,239,2,0 // vfmadd213ps 0x2efcc(%rip){1to8},%ymm8,%ymm10 # 3562c <_sk_srcover_bgra_8888_sse2_lowp+0x324>
+ .byte 196,98,125,24,21,247,240,2,0 // vbroadcastss 0x2f0f7(%rip),%ymm10 # 3570c <_sk_srcover_bgra_8888_sse2_lowp+0x404>
+ .byte 98,114,61,56,168,21,13,240,2,0 // vfmadd213ps 0x2f00d(%rip){1to8},%ymm8,%ymm10 # 3562c <_sk_srcover_bgra_8888_sse2_lowp+0x324>
.byte 196,65,52,89,194 // vmulps %ymm10,%ymm9,%ymm8
.byte 197,124,17,128,0,1,0,0 // vmovups %ymm8,0x100(%rax)
.byte 72,173 // lods %ds:(%rsi),%rax
@@ -15897,12 +15882,12 @@ FUNCTION(_sk_bicubic_n3y_skx)
_sk_bicubic_n3y_skx:
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 197,252,16,72,64 // vmovups 0x40(%rax),%ymm1
- .byte 98,241,116,56,88,13,154,240,2,0 // vaddps 0x2f09a(%rip){1to8},%ymm1,%ymm1 # 3571c <_sk_srcover_bgra_8888_sse2_lowp+0x414>
- .byte 196,98,125,24,5,45,239,2,0 // vbroadcastss 0x2ef2d(%rip),%ymm8 # 355b8 <_sk_srcover_bgra_8888_sse2_lowp+0x2b0>
+ .byte 98,241,116,56,88,13,199,240,2,0 // vaddps 0x2f0c7(%rip){1to8},%ymm1,%ymm1 # 35708 <_sk_srcover_bgra_8888_sse2_lowp+0x400>
+ .byte 196,98,125,24,5,110,239,2,0 // vbroadcastss 0x2ef6e(%rip),%ymm8 # 355b8 <_sk_srcover_bgra_8888_sse2_lowp+0x2b0>
.byte 197,60,92,128,192,0,0,0 // vsubps 0xc0(%rax),%ymm8,%ymm8
.byte 196,65,60,89,200 // vmulps %ymm8,%ymm8,%ymm9
- .byte 196,98,125,24,21,127,240,2,0 // vbroadcastss 0x2f07f(%rip),%ymm10 # 35720 <_sk_srcover_bgra_8888_sse2_lowp+0x418>
- .byte 98,114,61,56,168,21,129,239,2,0 // vfmadd213ps 0x2ef81(%rip){1to8},%ymm8,%ymm10 # 3562c <_sk_srcover_bgra_8888_sse2_lowp+0x324>
+ .byte 196,98,125,24,21,172,240,2,0 // vbroadcastss 0x2f0ac(%rip),%ymm10 # 3570c <_sk_srcover_bgra_8888_sse2_lowp+0x404>
+ .byte 98,114,61,56,168,21,194,239,2,0 // vfmadd213ps 0x2efc2(%rip){1to8},%ymm8,%ymm10 # 3562c <_sk_srcover_bgra_8888_sse2_lowp+0x324>
.byte 196,65,44,89,193 // vmulps %ymm9,%ymm10,%ymm8
.byte 197,124,17,128,64,1,0,0 // vmovups %ymm8,0x140(%rax)
.byte 72,173 // lods %ds:(%rsi),%rax
@@ -15914,13 +15899,13 @@ FUNCTION(_sk_bicubic_n1y_skx)
_sk_bicubic_n1y_skx:
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 197,252,16,72,64 // vmovups 0x40(%rax),%ymm1
- .byte 98,241,116,56,88,13,75,240,2,0 // vaddps 0x2f04b(%rip){1to8},%ymm1,%ymm1 # 35718 <_sk_srcover_bgra_8888_sse2_lowp+0x410>
- .byte 196,98,125,24,5,226,238,2,0 // vbroadcastss 0x2eee2(%rip),%ymm8 # 355b8 <_sk_srcover_bgra_8888_sse2_lowp+0x2b0>
+ .byte 98,241,116,56,88,13,120,240,2,0 // vaddps 0x2f078(%rip){1to8},%ymm1,%ymm1 # 35704 <_sk_srcover_bgra_8888_sse2_lowp+0x3fc>
+ .byte 196,98,125,24,5,35,239,2,0 // vbroadcastss 0x2ef23(%rip),%ymm8 # 355b8 <_sk_srcover_bgra_8888_sse2_lowp+0x2b0>
.byte 197,60,92,128,192,0,0,0 // vsubps 0xc0(%rax),%ymm8,%ymm8
- .byte 196,98,125,24,13,61,240,2,0 // vbroadcastss 0x2f03d(%rip),%ymm9 # 35724 <_sk_srcover_bgra_8888_sse2_lowp+0x41c>
- .byte 98,114,61,56,168,13,55,240,2,0 // vfmadd213ps 0x2f037(%rip){1to8},%ymm8,%ymm9 # 35728 <_sk_srcover_bgra_8888_sse2_lowp+0x420>
- .byte 98,114,61,56,168,13,185,238,2,0 // vfmadd213ps 0x2eeb9(%rip){1to8},%ymm8,%ymm9 # 355b4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
- .byte 98,114,61,56,168,13,39,240,2,0 // vfmadd213ps 0x2f027(%rip){1to8},%ymm8,%ymm9 # 3572c <_sk_srcover_bgra_8888_sse2_lowp+0x424>
+ .byte 196,98,125,24,13,106,240,2,0 // vbroadcastss 0x2f06a(%rip),%ymm9 # 35710 <_sk_srcover_bgra_8888_sse2_lowp+0x408>
+ .byte 98,114,61,56,168,13,100,240,2,0 // vfmadd213ps 0x2f064(%rip){1to8},%ymm8,%ymm9 # 35714 <_sk_srcover_bgra_8888_sse2_lowp+0x40c>
+ .byte 98,114,61,56,168,13,250,238,2,0 // vfmadd213ps 0x2eefa(%rip){1to8},%ymm8,%ymm9 # 355b4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
+ .byte 98,114,61,56,168,13,84,240,2,0 // vfmadd213ps 0x2f054(%rip){1to8},%ymm8,%ymm9 # 35718 <_sk_srcover_bgra_8888_sse2_lowp+0x410>
.byte 197,124,17,136,64,1,0,0 // vmovups %ymm9,0x140(%rax)
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 255,224 // jmpq *%rax
@@ -15930,13 +15915,13 @@ HIDDEN _sk_bicubic_p1y_skx
FUNCTION(_sk_bicubic_p1y_skx)
_sk_bicubic_p1y_skx:
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 196,98,125,24,5,152,238,2,0 // vbroadcastss 0x2ee98(%rip),%ymm8 # 355b4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
+ .byte 196,98,125,24,5,217,238,2,0 // vbroadcastss 0x2eed9(%rip),%ymm8 # 355b4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
.byte 197,188,88,72,64 // vaddps 0x40(%rax),%ymm8,%ymm1
.byte 197,124,16,136,192,0,0,0 // vmovups 0xc0(%rax),%ymm9
- .byte 196,98,125,24,21,242,239,2,0 // vbroadcastss 0x2eff2(%rip),%ymm10 # 35724 <_sk_srcover_bgra_8888_sse2_lowp+0x41c>
- .byte 98,114,53,56,168,21,236,239,2,0 // vfmadd213ps 0x2efec(%rip){1to8},%ymm9,%ymm10 # 35728 <_sk_srcover_bgra_8888_sse2_lowp+0x420>
+ .byte 196,98,125,24,21,31,240,2,0 // vbroadcastss 0x2f01f(%rip),%ymm10 # 35710 <_sk_srcover_bgra_8888_sse2_lowp+0x408>
+ .byte 98,114,53,56,168,21,25,240,2,0 // vfmadd213ps 0x2f019(%rip){1to8},%ymm9,%ymm10 # 35714 <_sk_srcover_bgra_8888_sse2_lowp+0x40c>
.byte 196,66,53,168,208 // vfmadd213ps %ymm8,%ymm9,%ymm10
- .byte 98,114,53,56,168,21,225,239,2,0 // vfmadd213ps 0x2efe1(%rip){1to8},%ymm9,%ymm10 # 3572c <_sk_srcover_bgra_8888_sse2_lowp+0x424>
+ .byte 98,114,53,56,168,21,14,240,2,0 // vfmadd213ps 0x2f00e(%rip){1to8},%ymm9,%ymm10 # 35718 <_sk_srcover_bgra_8888_sse2_lowp+0x410>
.byte 197,124,17,144,64,1,0,0 // vmovups %ymm10,0x140(%rax)
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 255,224 // jmpq *%rax
@@ -15948,10 +15933,10 @@ _sk_bicubic_p3y_skx:
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 197,252,16,72,64 // vmovups 0x40(%rax),%ymm1
.byte 197,124,16,128,192,0,0,0 // vmovups 0xc0(%rax),%ymm8
- .byte 98,241,116,56,88,13,184,239,2,0 // vaddps 0x2efb8(%rip){1to8},%ymm1,%ymm1 # 35728 <_sk_srcover_bgra_8888_sse2_lowp+0x420>
+ .byte 98,241,116,56,88,13,229,239,2,0 // vaddps 0x2efe5(%rip){1to8},%ymm1,%ymm1 # 35714 <_sk_srcover_bgra_8888_sse2_lowp+0x40c>
.byte 196,65,60,89,200 // vmulps %ymm8,%ymm8,%ymm9
- .byte 196,98,125,24,21,162,239,2,0 // vbroadcastss 0x2efa2(%rip),%ymm10 # 35720 <_sk_srcover_bgra_8888_sse2_lowp+0x418>
- .byte 98,114,61,56,168,21,164,238,2,0 // vfmadd213ps 0x2eea4(%rip){1to8},%ymm8,%ymm10 # 3562c <_sk_srcover_bgra_8888_sse2_lowp+0x324>
+ .byte 196,98,125,24,21,207,239,2,0 // vbroadcastss 0x2efcf(%rip),%ymm10 # 3570c <_sk_srcover_bgra_8888_sse2_lowp+0x404>
+ .byte 98,114,61,56,168,21,229,238,2,0 // vfmadd213ps 0x2eee5(%rip){1to8},%ymm8,%ymm10 # 3562c <_sk_srcover_bgra_8888_sse2_lowp+0x324>
.byte 196,65,52,89,194 // vmulps %ymm10,%ymm9,%ymm8
.byte 197,124,17,128,64,1,0,0 // vmovups %ymm8,0x140(%rax)
.byte 72,173 // lods %ds:(%rsi),%rax
@@ -16077,7 +16062,7 @@ _sk_clut_3D_skx:
.byte 98,226,61,40,64,224 // vpmulld %ymm0,%ymm8,%ymm20
.byte 98,209,93,32,254,193 // vpaddd %ymm9,%ymm20,%ymm0
.byte 72,139,0 // mov (%rax),%rax
- .byte 98,98,125,40,88,29,172,237,2,0 // vpbroadcastd 0x2edac(%rip),%ymm27 # 35734 <_sk_srcover_bgra_8888_sse2_lowp+0x42c>
+ .byte 98,98,125,40,88,29,217,237,2,0 // vpbroadcastd 0x2edd9(%rip),%ymm27 # 35720 <_sk_srcover_bgra_8888_sse2_lowp+0x418>
.byte 98,146,125,40,64,195 // vpmulld %ymm27,%ymm0,%ymm0
.byte 196,65,45,239,210 // vpxor %ymm10,%ymm10,%ymm10
.byte 197,245,118,201 // vpcmpeqd %ymm1,%ymm1,%ymm1
@@ -16090,9 +16075,9 @@ _sk_clut_3D_skx:
.byte 196,65,37,118,219 // vpcmpeqd %ymm11,%ymm11,%ymm11
.byte 196,162,37,146,12,144 // vgatherdps %ymm11,(%rax,%ymm10,4),%ymm1
.byte 98,97,124,40,40,233 // vmovaps %ymm1,%ymm29
- .byte 196,98,125,24,21,98,237,2,0 // vbroadcastss 0x2ed62(%rip),%ymm10 # 35730 <_sk_srcover_bgra_8888_sse2_lowp+0x428>
+ .byte 196,98,125,24,21,143,237,2,0 // vbroadcastss 0x2ed8f(%rip),%ymm10 # 3571c <_sk_srcover_bgra_8888_sse2_lowp+0x414>
.byte 98,81,60,32,88,218 // vaddps %ymm10,%ymm24,%ymm11
- .byte 98,226,125,40,88,5,230,235,2,0 // vpbroadcastd 0x2ebe6(%rip),%ymm16 # 355c4 <_sk_srcover_bgra_8888_sse2_lowp+0x2bc>
+ .byte 98,226,125,40,88,5,39,236,2,0 // vpbroadcastd 0x2ec27(%rip),%ymm16 # 355c4 <_sk_srcover_bgra_8888_sse2_lowp+0x2bc>
.byte 98,177,125,40,254,192 // vpaddd %ymm16,%ymm0,%ymm0
.byte 197,244,87,201 // vxorps %ymm1,%ymm1,%ymm1
.byte 196,65,29,118,228 // vpcmpeqd %ymm12,%ymm12,%ymm12
@@ -16332,7 +16317,7 @@ _sk_clut_4D_skx:
.byte 98,162,45,40,64,229 // vpmulld %ymm21,%ymm10,%ymm20
.byte 98,241,93,32,254,193 // vpaddd %ymm1,%ymm20,%ymm0
.byte 72,139,0 // mov (%rax),%rax
- .byte 98,226,125,40,88,5,62,232,2,0 // vpbroadcastd 0x2e83e(%rip),%ymm16 # 35734 <_sk_srcover_bgra_8888_sse2_lowp+0x42c>
+ .byte 98,226,125,40,88,5,107,232,2,0 // vpbroadcastd 0x2e86b(%rip),%ymm16 # 35720 <_sk_srcover_bgra_8888_sse2_lowp+0x418>
.byte 98,50,125,40,64,216 // vpmulld %ymm16,%ymm0,%ymm11
.byte 196,65,28,87,228 // vxorps %ymm12,%ymm12,%ymm12
.byte 197,253,118,192 // vpcmpeqd %ymm0,%ymm0,%ymm0
@@ -16344,9 +16329,9 @@ _sk_clut_4D_skx:
.byte 196,65,29,118,228 // vpcmpeqd %ymm12,%ymm12,%ymm12
.byte 196,98,29,146,44,128 // vgatherdps %ymm12,(%rax,%ymm0,4),%ymm13
.byte 197,124,17,172,36,192,4,0,0 // vmovups %ymm13,0x4c0(%rsp)
- .byte 196,226,125,24,5,240,231,2,0 // vbroadcastss 0x2e7f0(%rip),%ymm0 # 35730 <_sk_srcover_bgra_8888_sse2_lowp+0x428>
+ .byte 196,226,125,24,5,29,232,2,0 // vbroadcastss 0x2e81d(%rip),%ymm0 # 3571c <_sk_srcover_bgra_8888_sse2_lowp+0x414>
.byte 98,113,28,32,88,224 // vaddps %ymm0,%ymm28,%ymm12
- .byte 98,226,125,40,88,13,116,230,2,0 // vpbroadcastd 0x2e674(%rip),%ymm17 # 355c4 <_sk_srcover_bgra_8888_sse2_lowp+0x2bc>
+ .byte 98,226,125,40,88,13,181,230,2,0 // vpbroadcastd 0x2e6b5(%rip),%ymm17 # 355c4 <_sk_srcover_bgra_8888_sse2_lowp+0x2bc>
.byte 98,49,37,40,254,217 // vpaddd %ymm17,%ymm11,%ymm11
.byte 197,236,87,210 // vxorps %ymm2,%ymm2,%ymm2
.byte 196,65,21,118,237 // vpcmpeqd %ymm13,%ymm13,%ymm13
@@ -16751,13 +16736,28 @@ _sk_clut_4D_skx:
.byte 197,228,92,214 // vsubps %ymm6,%ymm3,%ymm2
.byte 196,226,93,168,214 // vfmadd213ps %ymm6,%ymm4,%ymm2
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 196,226,125,24,29,18,221,2,0 // vbroadcastss 0x2dd12(%rip),%ymm3 # 355b8 <_sk_srcover_bgra_8888_sse2_lowp+0x2b0>
+ .byte 196,226,125,24,29,83,221,2,0 // vbroadcastss 0x2dd53(%rip),%ymm3 # 355b8 <_sk_srcover_bgra_8888_sse2_lowp+0x2b0>
.byte 98,145,124,40,40,227 // vmovaps %ymm27,%ymm4
.byte 197,252,16,108,36,128 // vmovups -0x80(%rsp),%ymm5
.byte 197,252,16,116,36,160 // vmovups -0x60(%rsp),%ymm6
.byte 197,252,16,124,36,224 // vmovups -0x20(%rsp),%ymm7
.byte 72,129,196,88,5,0,0 // add $0x558,%rsp
.byte 255,224 // jmpq *%rax
+
+HIDDEN _sk_gauss_a_to_rgba_skx
+.globl _sk_gauss_a_to_rgba_skx
+FUNCTION(_sk_gauss_a_to_rgba_skx)
+_sk_gauss_a_to_rgba_skx:
+ .byte 196,226,125,24,5,149,222,2,0 // vbroadcastss 0x2de95(%rip),%ymm0 # 35724 <_sk_srcover_bgra_8888_sse2_lowp+0x41c>
+ .byte 98,242,101,56,168,5,143,222,2,0 // vfmadd213ps 0x2de8f(%rip){1to8},%ymm3,%ymm0 # 35728 <_sk_srcover_bgra_8888_sse2_lowp+0x420>
+ .byte 98,242,101,56,168,5,137,222,2,0 // vfmadd213ps 0x2de89(%rip){1to8},%ymm3,%ymm0 # 3572c <_sk_srcover_bgra_8888_sse2_lowp+0x424>
+ .byte 98,242,101,56,168,5,131,222,2,0 // vfmadd213ps 0x2de83(%rip){1to8},%ymm3,%ymm0 # 35730 <_sk_srcover_bgra_8888_sse2_lowp+0x428>
+ .byte 98,242,101,56,168,5,125,222,2,0 // vfmadd213ps 0x2de7d(%rip){1to8},%ymm3,%ymm0 # 35734 <_sk_srcover_bgra_8888_sse2_lowp+0x42c>
+ .byte 72,173 // lods %ds:(%rsi),%rax
+ .byte 197,252,40,200 // vmovaps %ymm0,%ymm1
+ .byte 197,252,40,208 // vmovaps %ymm0,%ymm2
+ .byte 197,252,40,216 // vmovaps %ymm0,%ymm3
+ .byte 255,224 // jmpq *%rax
.byte 144 // nop
HIDDEN _sk_start_pipeline_hsw
@@ -22813,25 +22813,6 @@ _sk_evenly_spaced_gradient_hsw:
.byte 197,124,41,192 // vmovaps %ymm8,%ymm0
.byte 255,224 // jmpq *%rax
-HIDDEN _sk_gauss_a_to_rgba_hsw
-.globl _sk_gauss_a_to_rgba_hsw
-FUNCTION(_sk_gauss_a_to_rgba_hsw)
-_sk_gauss_a_to_rgba_hsw:
- .byte 196,226,125,24,5,126,127,2,0 // vbroadcastss 0x27f7e(%rip),%ymm0 # 356e8 <_sk_srcover_bgra_8888_sse2_lowp+0x3e0>
- .byte 196,226,125,24,13,113,127,2,0 // vbroadcastss 0x27f71(%rip),%ymm1 # 356e4 <_sk_srcover_bgra_8888_sse2_lowp+0x3dc>
- .byte 196,226,101,168,200 // vfmadd213ps %ymm0,%ymm3,%ymm1
- .byte 196,226,125,24,5,107,127,2,0 // vbroadcastss 0x27f6b(%rip),%ymm0 # 356ec <_sk_srcover_bgra_8888_sse2_lowp+0x3e4>
- .byte 196,226,101,184,193 // vfmadd231ps %ymm1,%ymm3,%ymm0
- .byte 196,226,125,24,13,97,127,2,0 // vbroadcastss 0x27f61(%rip),%ymm1 # 356f0 <_sk_srcover_bgra_8888_sse2_lowp+0x3e8>
- .byte 196,226,101,184,200 // vfmadd231ps %ymm0,%ymm3,%ymm1
- .byte 196,226,125,24,5,87,127,2,0 // vbroadcastss 0x27f57(%rip),%ymm0 # 356f4 <_sk_srcover_bgra_8888_sse2_lowp+0x3ec>
- .byte 196,226,101,184,193 // vfmadd231ps %ymm1,%ymm3,%ymm0
- .byte 72,173 // lods %ds:(%rsi),%rax
- .byte 197,252,40,200 // vmovaps %ymm0,%ymm1
- .byte 197,252,40,208 // vmovaps %ymm0,%ymm2
- .byte 197,252,40,216 // vmovaps %ymm0,%ymm3
- .byte 255,224 // jmpq *%rax
-
HIDDEN _sk_gradient_hsw
.globl _sk_gradient_hsw
FUNCTION(_sk_gradient_hsw)
@@ -22839,11 +22820,11 @@ _sk_gradient_hsw:
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 76,139,0 // mov (%rax),%r8
.byte 73,131,248,1 // cmp $0x1,%r8
- .byte 15,134,220,0,0,0 // jbe d89d <_sk_gradient_hsw+0xeb>
+ .byte 15,134,220,0,0,0 // jbe d84c <_sk_gradient_hsw+0xeb>
.byte 76,139,72,72 // mov 0x48(%rax),%r9
.byte 197,244,87,201 // vxorps %ymm1,%ymm1,%ymm1
.byte 65,186,1,0,0,0 // mov $0x1,%r10d
- .byte 196,226,125,24,21,228,125,2,0 // vbroadcastss 0x27de4(%rip),%ymm2 # 355bc <_sk_srcover_bgra_8888_sse2_lowp+0x2b4>
+ .byte 196,226,125,24,21,53,126,2,0 // vbroadcastss 0x27e35(%rip),%ymm2 # 355bc <_sk_srcover_bgra_8888_sse2_lowp+0x2b4>
.byte 196,65,53,239,201 // vpxor %ymm9,%ymm9,%ymm9
.byte 196,130,125,24,28,145 // vbroadcastss (%r9,%r10,4),%ymm3
.byte 197,228,194,216,2 // vcmpleps %ymm0,%ymm3,%ymm3
@@ -22851,10 +22832,10 @@ _sk_gradient_hsw:
.byte 197,53,254,203 // vpaddd %ymm3,%ymm9,%ymm9
.byte 73,255,194 // inc %r10
.byte 77,57,208 // cmp %r10,%r8
- .byte 117,227 // jne d7dd <_sk_gradient_hsw+0x2b>
+ .byte 117,227 // jne d78c <_sk_gradient_hsw+0x2b>
.byte 76,139,72,8 // mov 0x8(%rax),%r9
.byte 73,131,248,8 // cmp $0x8,%r8
- .byte 15,134,158,0,0,0 // jbe d8a6 <_sk_gradient_hsw+0xf4>
+ .byte 15,134,158,0,0,0 // jbe d855 <_sk_gradient_hsw+0xf4>
.byte 196,65,13,118,246 // vpcmpeqd %ymm14,%ymm14,%ymm14
.byte 196,65,36,87,219 // vxorps %ymm11,%ymm11,%ymm11
.byte 196,65,60,87,192 // vxorps %ymm8,%ymm8,%ymm8
@@ -22886,7 +22867,7 @@ _sk_gradient_hsw:
.byte 196,130,5,146,28,136 // vgatherdps %ymm15,(%r8,%ymm9,4),%ymm3
.byte 72,139,64,64 // mov 0x40(%rax),%rax
.byte 196,34,13,146,28,136 // vgatherdps %ymm14,(%rax,%ymm9,4),%ymm11
- .byte 235,77 // jmp d8ea <_sk_gradient_hsw+0x138>
+ .byte 235,77 // jmp d899 <_sk_gradient_hsw+0x138>
.byte 76,139,72,8 // mov 0x8(%rax),%r9
.byte 196,65,52,87,201 // vxorps %ymm9,%ymm9,%ymm9
.byte 196,66,53,22,1 // vpermps (%r9),%ymm9,%ymm8
@@ -22946,24 +22927,24 @@ _sk_xy_to_unit_angle_hsw:
.byte 196,65,52,95,226 // vmaxps %ymm10,%ymm9,%ymm12
.byte 196,65,36,94,220 // vdivps %ymm12,%ymm11,%ymm11
.byte 196,65,36,89,227 // vmulps %ymm11,%ymm11,%ymm12
- .byte 196,98,125,24,45,115,125,2,0 // vbroadcastss 0x27d73(%rip),%ymm13 # 356f8 <_sk_srcover_bgra_8888_sse2_lowp+0x3f0>
- .byte 196,98,125,24,53,110,125,2,0 // vbroadcastss 0x27d6e(%rip),%ymm14 # 356fc <_sk_srcover_bgra_8888_sse2_lowp+0x3f4>
+ .byte 196,98,125,24,45,176,125,2,0 // vbroadcastss 0x27db0(%rip),%ymm13 # 356e4 <_sk_srcover_bgra_8888_sse2_lowp+0x3dc>
+ .byte 196,98,125,24,53,171,125,2,0 // vbroadcastss 0x27dab(%rip),%ymm14 # 356e8 <_sk_srcover_bgra_8888_sse2_lowp+0x3e0>
.byte 196,66,29,184,245 // vfmadd231ps %ymm13,%ymm12,%ymm14
- .byte 196,98,125,24,45,100,125,2,0 // vbroadcastss 0x27d64(%rip),%ymm13 # 35700 <_sk_srcover_bgra_8888_sse2_lowp+0x3f8>
+ .byte 196,98,125,24,45,161,125,2,0 // vbroadcastss 0x27da1(%rip),%ymm13 # 356ec <_sk_srcover_bgra_8888_sse2_lowp+0x3e4>
.byte 196,66,29,184,238 // vfmadd231ps %ymm14,%ymm12,%ymm13
- .byte 196,98,125,24,53,90,125,2,0 // vbroadcastss 0x27d5a(%rip),%ymm14 # 35704 <_sk_srcover_bgra_8888_sse2_lowp+0x3fc>
+ .byte 196,98,125,24,53,151,125,2,0 // vbroadcastss 0x27d97(%rip),%ymm14 # 356f0 <_sk_srcover_bgra_8888_sse2_lowp+0x3e8>
.byte 196,66,29,184,245 // vfmadd231ps %ymm13,%ymm12,%ymm14
.byte 196,65,36,89,222 // vmulps %ymm14,%ymm11,%ymm11
.byte 196,65,52,194,202,1 // vcmpltps %ymm10,%ymm9,%ymm9
- .byte 196,98,125,24,21,69,125,2,0 // vbroadcastss 0x27d45(%rip),%ymm10 # 35708 <_sk_srcover_bgra_8888_sse2_lowp+0x400>
+ .byte 196,98,125,24,21,130,125,2,0 // vbroadcastss 0x27d82(%rip),%ymm10 # 356f4 <_sk_srcover_bgra_8888_sse2_lowp+0x3ec>
.byte 196,65,44,92,211 // vsubps %ymm11,%ymm10,%ymm10
.byte 196,67,37,74,202,144 // vblendvps %ymm9,%ymm10,%ymm11,%ymm9
.byte 196,193,124,194,192,1 // vcmpltps %ymm8,%ymm0,%ymm0
- .byte 196,98,125,24,21,215,123,2,0 // vbroadcastss 0x27bd7(%rip),%ymm10 # 355b4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
+ .byte 196,98,125,24,21,40,124,2,0 // vbroadcastss 0x27c28(%rip),%ymm10 # 355b4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
.byte 196,65,44,92,209 // vsubps %ymm9,%ymm10,%ymm10
.byte 196,195,53,74,194,0 // vblendvps %ymm0,%ymm10,%ymm9,%ymm0
.byte 196,65,116,194,200,1 // vcmpltps %ymm8,%ymm1,%ymm9
- .byte 196,98,125,24,21,193,123,2,0 // vbroadcastss 0x27bc1(%rip),%ymm10 # 355b8 <_sk_srcover_bgra_8888_sse2_lowp+0x2b0>
+ .byte 196,98,125,24,21,18,124,2,0 // vbroadcastss 0x27c12(%rip),%ymm10 # 355b8 <_sk_srcover_bgra_8888_sse2_lowp+0x2b0>
.byte 197,44,92,208 // vsubps %ymm0,%ymm10,%ymm10
.byte 196,195,125,74,194,144 // vblendvps %ymm9,%ymm10,%ymm0,%ymm0
.byte 196,65,124,194,200,3 // vcmpunordps %ymm8,%ymm0,%ymm9
@@ -22991,23 +22972,23 @@ _sk_xy_to_2pt_conical_quadratic_max_hsw:
.byte 197,50,89,80,76 // vmulss 0x4c(%rax),%xmm9,%xmm10
.byte 196,66,125,24,210 // vbroadcastss %xmm10,%ymm10
.byte 197,44,88,208 // vaddps %ymm0,%ymm10,%ymm10
- .byte 196,98,125,24,29,197,124,2,0 // vbroadcastss 0x27cc5(%rip),%ymm11 # 3570c <_sk_srcover_bgra_8888_sse2_lowp+0x404>
+ .byte 196,98,125,24,29,2,125,2,0 // vbroadcastss 0x27d02(%rip),%ymm11 # 356f8 <_sk_srcover_bgra_8888_sse2_lowp+0x3f0>
.byte 196,65,44,89,211 // vmulps %ymm11,%ymm10,%ymm10
.byte 197,116,89,217 // vmulps %ymm1,%ymm1,%ymm11
.byte 196,98,125,184,216 // vfmadd231ps %ymm0,%ymm0,%ymm11
.byte 196,193,50,89,193 // vmulss %xmm9,%xmm9,%xmm0
.byte 196,226,125,24,192 // vbroadcastss %xmm0,%ymm0
.byte 197,164,92,192 // vsubps %ymm0,%ymm11,%ymm0
- .byte 196,98,125,24,13,164,124,2,0 // vbroadcastss 0x27ca4(%rip),%ymm9 # 35710 <_sk_srcover_bgra_8888_sse2_lowp+0x408>
+ .byte 196,98,125,24,13,225,124,2,0 // vbroadcastss 0x27ce1(%rip),%ymm9 # 356fc <_sk_srcover_bgra_8888_sse2_lowp+0x3f4>
.byte 196,65,60,89,193 // vmulps %ymm9,%ymm8,%ymm8
.byte 197,188,89,192 // vmulps %ymm0,%ymm8,%ymm0
.byte 196,194,45,184,194 // vfmadd231ps %ymm10,%ymm10,%ymm0
.byte 197,252,81,192 // vsqrtps %ymm0,%ymm0
.byte 196,98,125,24,64,68 // vbroadcastss 0x44(%rax),%ymm8
- .byte 196,98,125,24,13,135,124,2,0 // vbroadcastss 0x27c87(%rip),%ymm9 # 35714 <_sk_srcover_bgra_8888_sse2_lowp+0x40c>
+ .byte 196,98,125,24,13,196,124,2,0 // vbroadcastss 0x27cc4(%rip),%ymm9 # 35700 <_sk_srcover_bgra_8888_sse2_lowp+0x3f8>
.byte 196,65,44,87,201 // vxorps %ymm9,%ymm10,%ymm9
.byte 196,65,124,92,210 // vsubps %ymm10,%ymm0,%ymm10
- .byte 196,98,125,24,29,20,123,2,0 // vbroadcastss 0x27b14(%rip),%ymm11 # 355b4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
+ .byte 196,98,125,24,29,101,123,2,0 // vbroadcastss 0x27b65(%rip),%ymm11 # 355b4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
.byte 196,65,60,89,195 // vmulps %ymm11,%ymm8,%ymm8
.byte 196,65,44,89,208 // vmulps %ymm8,%ymm10,%ymm10
.byte 197,180,92,192 // vsubps %ymm0,%ymm9,%ymm0
@@ -23026,23 +23007,23 @@ _sk_xy_to_2pt_conical_quadratic_min_hsw:
.byte 197,50,89,80,76 // vmulss 0x4c(%rax),%xmm9,%xmm10
.byte 196,66,125,24,210 // vbroadcastss %xmm10,%ymm10
.byte 197,44,88,208 // vaddps %ymm0,%ymm10,%ymm10
- .byte 196,98,125,24,29,45,124,2,0 // vbroadcastss 0x27c2d(%rip),%ymm11 # 3570c <_sk_srcover_bgra_8888_sse2_lowp+0x404>
+ .byte 196,98,125,24,29,106,124,2,0 // vbroadcastss 0x27c6a(%rip),%ymm11 # 356f8 <_sk_srcover_bgra_8888_sse2_lowp+0x3f0>
.byte 196,65,44,89,211 // vmulps %ymm11,%ymm10,%ymm10
.byte 197,116,89,217 // vmulps %ymm1,%ymm1,%ymm11
.byte 196,98,125,184,216 // vfmadd231ps %ymm0,%ymm0,%ymm11
.byte 196,193,50,89,193 // vmulss %xmm9,%xmm9,%xmm0
.byte 196,226,125,24,192 // vbroadcastss %xmm0,%ymm0
.byte 197,164,92,192 // vsubps %ymm0,%ymm11,%ymm0
- .byte 196,98,125,24,13,12,124,2,0 // vbroadcastss 0x27c0c(%rip),%ymm9 # 35710 <_sk_srcover_bgra_8888_sse2_lowp+0x408>
+ .byte 196,98,125,24,13,73,124,2,0 // vbroadcastss 0x27c49(%rip),%ymm9 # 356fc <_sk_srcover_bgra_8888_sse2_lowp+0x3f4>
.byte 196,65,60,89,193 // vmulps %ymm9,%ymm8,%ymm8
.byte 197,188,89,192 // vmulps %ymm0,%ymm8,%ymm0
.byte 196,194,45,184,194 // vfmadd231ps %ymm10,%ymm10,%ymm0
.byte 197,252,81,192 // vsqrtps %ymm0,%ymm0
.byte 196,98,125,24,64,68 // vbroadcastss 0x44(%rax),%ymm8
- .byte 196,98,125,24,13,239,123,2,0 // vbroadcastss 0x27bef(%rip),%ymm9 # 35714 <_sk_srcover_bgra_8888_sse2_lowp+0x40c>
+ .byte 196,98,125,24,13,44,124,2,0 // vbroadcastss 0x27c2c(%rip),%ymm9 # 35700 <_sk_srcover_bgra_8888_sse2_lowp+0x3f8>
.byte 196,65,44,87,201 // vxorps %ymm9,%ymm10,%ymm9
.byte 196,65,124,92,210 // vsubps %ymm10,%ymm0,%ymm10
- .byte 196,98,125,24,29,124,122,2,0 // vbroadcastss 0x27a7c(%rip),%ymm11 # 355b4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
+ .byte 196,98,125,24,29,205,122,2,0 // vbroadcastss 0x27acd(%rip),%ymm11 # 355b4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
.byte 196,65,60,89,195 // vmulps %ymm11,%ymm8,%ymm8
.byte 196,65,44,89,208 // vmulps %ymm8,%ymm10,%ymm10
.byte 197,180,92,192 // vsubps %ymm0,%ymm9,%ymm0
@@ -23060,14 +23041,14 @@ _sk_xy_to_2pt_conical_linear_hsw:
.byte 197,58,89,72,76 // vmulss 0x4c(%rax),%xmm8,%xmm9
.byte 196,66,125,24,201 // vbroadcastss %xmm9,%ymm9
.byte 197,52,88,200 // vaddps %ymm0,%ymm9,%ymm9
- .byte 196,98,125,24,21,155,123,2,0 // vbroadcastss 0x27b9b(%rip),%ymm10 # 3570c <_sk_srcover_bgra_8888_sse2_lowp+0x404>
+ .byte 196,98,125,24,21,216,123,2,0 // vbroadcastss 0x27bd8(%rip),%ymm10 # 356f8 <_sk_srcover_bgra_8888_sse2_lowp+0x3f0>
.byte 196,65,52,89,202 // vmulps %ymm10,%ymm9,%ymm9
.byte 197,116,89,209 // vmulps %ymm1,%ymm1,%ymm10
.byte 196,98,125,184,208 // vfmadd231ps %ymm0,%ymm0,%ymm10
.byte 196,193,58,89,192 // vmulss %xmm8,%xmm8,%xmm0
.byte 196,226,125,24,192 // vbroadcastss %xmm0,%ymm0
.byte 197,172,92,192 // vsubps %ymm0,%ymm10,%ymm0
- .byte 196,98,125,24,5,126,123,2,0 // vbroadcastss 0x27b7e(%rip),%ymm8 # 35714 <_sk_srcover_bgra_8888_sse2_lowp+0x40c>
+ .byte 196,98,125,24,5,187,123,2,0 // vbroadcastss 0x27bbb(%rip),%ymm8 # 35700 <_sk_srcover_bgra_8888_sse2_lowp+0x3f8>
.byte 196,193,124,87,192 // vxorps %ymm8,%ymm0,%ymm0
.byte 196,193,124,94,193 // vdivps %ymm9,%ymm0,%ymm0
.byte 72,173 // lods %ds:(%rsi),%rax
@@ -23110,7 +23091,7 @@ HIDDEN _sk_save_xy_hsw
FUNCTION(_sk_save_xy_hsw)
_sk_save_xy_hsw:
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 196,98,125,24,5,169,121,2,0 // vbroadcastss 0x279a9(%rip),%ymm8 # 355b4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
+ .byte 196,98,125,24,5,250,121,2,0 // vbroadcastss 0x279fa(%rip),%ymm8 # 355b4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
.byte 196,65,124,88,200 // vaddps %ymm8,%ymm0,%ymm9
.byte 196,67,125,8,209,1 // vroundps $0x1,%ymm9,%ymm10
.byte 196,65,52,92,202 // vsubps %ymm10,%ymm9,%ymm9
@@ -23144,9 +23125,9 @@ HIDDEN _sk_bilinear_nx_hsw
FUNCTION(_sk_bilinear_nx_hsw)
_sk_bilinear_nx_hsw:
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 196,226,125,24,5,151,122,2,0 // vbroadcastss 0x27a97(%rip),%ymm0 # 35718 <_sk_srcover_bgra_8888_sse2_lowp+0x410>
+ .byte 196,226,125,24,5,212,122,2,0 // vbroadcastss 0x27ad4(%rip),%ymm0 # 35704 <_sk_srcover_bgra_8888_sse2_lowp+0x3fc>
.byte 197,252,88,0 // vaddps (%rax),%ymm0,%ymm0
- .byte 196,98,125,24,5,42,121,2,0 // vbroadcastss 0x2792a(%rip),%ymm8 # 355b8 <_sk_srcover_bgra_8888_sse2_lowp+0x2b0>
+ .byte 196,98,125,24,5,123,121,2,0 // vbroadcastss 0x2797b(%rip),%ymm8 # 355b8 <_sk_srcover_bgra_8888_sse2_lowp+0x2b0>
.byte 197,60,92,128,128,0,0,0 // vsubps 0x80(%rax),%ymm8,%ymm8
.byte 197,124,17,128,0,1,0,0 // vmovups %ymm8,0x100(%rax)
.byte 72,173 // lods %ds:(%rsi),%rax
@@ -23157,7 +23138,7 @@ HIDDEN _sk_bilinear_px_hsw
FUNCTION(_sk_bilinear_px_hsw)
_sk_bilinear_px_hsw:
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 196,226,125,24,5,7,121,2,0 // vbroadcastss 0x27907(%rip),%ymm0 # 355b4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
+ .byte 196,226,125,24,5,88,121,2,0 // vbroadcastss 0x27958(%rip),%ymm0 # 355b4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
.byte 197,252,88,0 // vaddps (%rax),%ymm0,%ymm0
.byte 197,124,16,128,128,0,0,0 // vmovups 0x80(%rax),%ymm8
.byte 197,124,17,128,0,1,0,0 // vmovups %ymm8,0x100(%rax)
@@ -23169,9 +23150,9 @@ HIDDEN _sk_bilinear_ny_hsw
FUNCTION(_sk_bilinear_ny_hsw)
_sk_bilinear_ny_hsw:
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 196,226,125,24,13,72,122,2,0 // vbroadcastss 0x27a48(%rip),%ymm1 # 35718 <_sk_srcover_bgra_8888_sse2_lowp+0x410>
+ .byte 196,226,125,24,13,133,122,2,0 // vbroadcastss 0x27a85(%rip),%ymm1 # 35704 <_sk_srcover_bgra_8888_sse2_lowp+0x3fc>
.byte 197,244,88,72,64 // vaddps 0x40(%rax),%ymm1,%ymm1
- .byte 196,98,125,24,5,218,120,2,0 // vbroadcastss 0x278da(%rip),%ymm8 # 355b8 <_sk_srcover_bgra_8888_sse2_lowp+0x2b0>
+ .byte 196,98,125,24,5,43,121,2,0 // vbroadcastss 0x2792b(%rip),%ymm8 # 355b8 <_sk_srcover_bgra_8888_sse2_lowp+0x2b0>
.byte 197,60,92,128,192,0,0,0 // vsubps 0xc0(%rax),%ymm8,%ymm8
.byte 197,124,17,128,64,1,0,0 // vmovups %ymm8,0x140(%rax)
.byte 72,173 // lods %ds:(%rsi),%rax
@@ -23182,7 +23163,7 @@ HIDDEN _sk_bilinear_py_hsw
FUNCTION(_sk_bilinear_py_hsw)
_sk_bilinear_py_hsw:
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 196,226,125,24,13,183,120,2,0 // vbroadcastss 0x278b7(%rip),%ymm1 # 355b4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
+ .byte 196,226,125,24,13,8,121,2,0 // vbroadcastss 0x27908(%rip),%ymm1 # 355b4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
.byte 197,244,88,72,64 // vaddps 0x40(%rax),%ymm1,%ymm1
.byte 197,124,16,128,192,0,0,0 // vmovups 0xc0(%rax),%ymm8
.byte 197,124,17,128,64,1,0,0 // vmovups %ymm8,0x140(%rax)
@@ -23194,13 +23175,13 @@ HIDDEN _sk_bicubic_n3x_hsw
FUNCTION(_sk_bicubic_n3x_hsw)
_sk_bicubic_n3x_hsw:
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 196,226,125,24,5,251,121,2,0 // vbroadcastss 0x279fb(%rip),%ymm0 # 3571c <_sk_srcover_bgra_8888_sse2_lowp+0x414>
+ .byte 196,226,125,24,5,56,122,2,0 // vbroadcastss 0x27a38(%rip),%ymm0 # 35708 <_sk_srcover_bgra_8888_sse2_lowp+0x400>
.byte 197,252,88,0 // vaddps (%rax),%ymm0,%ymm0
- .byte 196,98,125,24,5,138,120,2,0 // vbroadcastss 0x2788a(%rip),%ymm8 # 355b8 <_sk_srcover_bgra_8888_sse2_lowp+0x2b0>
+ .byte 196,98,125,24,5,219,120,2,0 // vbroadcastss 0x278db(%rip),%ymm8 # 355b8 <_sk_srcover_bgra_8888_sse2_lowp+0x2b0>
.byte 197,60,92,128,128,0,0,0 // vsubps 0x80(%rax),%ymm8,%ymm8
.byte 196,65,60,89,200 // vmulps %ymm8,%ymm8,%ymm9
- .byte 196,98,125,24,21,232,120,2,0 // vbroadcastss 0x278e8(%rip),%ymm10 # 3562c <_sk_srcover_bgra_8888_sse2_lowp+0x324>
- .byte 196,98,125,24,29,211,121,2,0 // vbroadcastss 0x279d3(%rip),%ymm11 # 35720 <_sk_srcover_bgra_8888_sse2_lowp+0x418>
+ .byte 196,98,125,24,21,57,121,2,0 // vbroadcastss 0x27939(%rip),%ymm10 # 3562c <_sk_srcover_bgra_8888_sse2_lowp+0x324>
+ .byte 196,98,125,24,29,16,122,2,0 // vbroadcastss 0x27a10(%rip),%ymm11 # 3570c <_sk_srcover_bgra_8888_sse2_lowp+0x404>
.byte 196,66,61,168,218 // vfmadd213ps %ymm10,%ymm8,%ymm11
.byte 196,65,36,89,193 // vmulps %ymm9,%ymm11,%ymm8
.byte 197,124,17,128,0,1,0,0 // vmovups %ymm8,0x100(%rax)
@@ -23212,16 +23193,16 @@ HIDDEN _sk_bicubic_n1x_hsw
FUNCTION(_sk_bicubic_n1x_hsw)
_sk_bicubic_n1x_hsw:
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 196,226,125,24,5,170,121,2,0 // vbroadcastss 0x279aa(%rip),%ymm0 # 35718 <_sk_srcover_bgra_8888_sse2_lowp+0x410>
+ .byte 196,226,125,24,5,231,121,2,0 // vbroadcastss 0x279e7(%rip),%ymm0 # 35704 <_sk_srcover_bgra_8888_sse2_lowp+0x3fc>
.byte 197,252,88,0 // vaddps (%rax),%ymm0,%ymm0
- .byte 196,98,125,24,5,61,120,2,0 // vbroadcastss 0x2783d(%rip),%ymm8 # 355b8 <_sk_srcover_bgra_8888_sse2_lowp+0x2b0>
+ .byte 196,98,125,24,5,142,120,2,0 // vbroadcastss 0x2788e(%rip),%ymm8 # 355b8 <_sk_srcover_bgra_8888_sse2_lowp+0x2b0>
.byte 197,60,92,128,128,0,0,0 // vsubps 0x80(%rax),%ymm8,%ymm8
- .byte 196,98,125,24,13,156,121,2,0 // vbroadcastss 0x2799c(%rip),%ymm9 # 35728 <_sk_srcover_bgra_8888_sse2_lowp+0x420>
- .byte 196,98,125,24,21,143,121,2,0 // vbroadcastss 0x2798f(%rip),%ymm10 # 35724 <_sk_srcover_bgra_8888_sse2_lowp+0x41c>
+ .byte 196,98,125,24,13,217,121,2,0 // vbroadcastss 0x279d9(%rip),%ymm9 # 35714 <_sk_srcover_bgra_8888_sse2_lowp+0x40c>
+ .byte 196,98,125,24,21,204,121,2,0 // vbroadcastss 0x279cc(%rip),%ymm10 # 35710 <_sk_srcover_bgra_8888_sse2_lowp+0x408>
.byte 196,66,61,168,209 // vfmadd213ps %ymm9,%ymm8,%ymm10
- .byte 196,98,125,24,13,17,120,2,0 // vbroadcastss 0x27811(%rip),%ymm9 # 355b4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
+ .byte 196,98,125,24,13,98,120,2,0 // vbroadcastss 0x27862(%rip),%ymm9 # 355b4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
.byte 196,66,61,184,202 // vfmadd231ps %ymm10,%ymm8,%ymm9
- .byte 196,98,125,24,21,123,121,2,0 // vbroadcastss 0x2797b(%rip),%ymm10 # 3572c <_sk_srcover_bgra_8888_sse2_lowp+0x424>
+ .byte 196,98,125,24,21,184,121,2,0 // vbroadcastss 0x279b8(%rip),%ymm10 # 35718 <_sk_srcover_bgra_8888_sse2_lowp+0x410>
.byte 196,66,61,184,209 // vfmadd231ps %ymm9,%ymm8,%ymm10
.byte 197,124,17,144,0,1,0,0 // vmovups %ymm10,0x100(%rax)
.byte 72,173 // lods %ds:(%rsi),%rax
@@ -23232,14 +23213,14 @@ HIDDEN _sk_bicubic_p1x_hsw
FUNCTION(_sk_bicubic_p1x_hsw)
_sk_bicubic_p1x_hsw:
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 196,98,125,24,5,231,119,2,0 // vbroadcastss 0x277e7(%rip),%ymm8 # 355b4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
+ .byte 196,98,125,24,5,56,120,2,0 // vbroadcastss 0x27838(%rip),%ymm8 # 355b4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
.byte 197,188,88,0 // vaddps (%rax),%ymm8,%ymm0
.byte 197,124,16,136,128,0,0,0 // vmovups 0x80(%rax),%ymm9
- .byte 196,98,125,24,21,70,121,2,0 // vbroadcastss 0x27946(%rip),%ymm10 # 35728 <_sk_srcover_bgra_8888_sse2_lowp+0x420>
- .byte 196,98,125,24,29,57,121,2,0 // vbroadcastss 0x27939(%rip),%ymm11 # 35724 <_sk_srcover_bgra_8888_sse2_lowp+0x41c>
+ .byte 196,98,125,24,21,131,121,2,0 // vbroadcastss 0x27983(%rip),%ymm10 # 35714 <_sk_srcover_bgra_8888_sse2_lowp+0x40c>
+ .byte 196,98,125,24,29,118,121,2,0 // vbroadcastss 0x27976(%rip),%ymm11 # 35710 <_sk_srcover_bgra_8888_sse2_lowp+0x408>
.byte 196,66,53,168,218 // vfmadd213ps %ymm10,%ymm9,%ymm11
.byte 196,66,53,168,216 // vfmadd213ps %ymm8,%ymm9,%ymm11
- .byte 196,98,125,24,5,46,121,2,0 // vbroadcastss 0x2792e(%rip),%ymm8 # 3572c <_sk_srcover_bgra_8888_sse2_lowp+0x424>
+ .byte 196,98,125,24,5,107,121,2,0 // vbroadcastss 0x2796b(%rip),%ymm8 # 35718 <_sk_srcover_bgra_8888_sse2_lowp+0x410>
.byte 196,66,53,184,195 // vfmadd231ps %ymm11,%ymm9,%ymm8
.byte 197,124,17,128,0,1,0,0 // vmovups %ymm8,0x100(%rax)
.byte 72,173 // lods %ds:(%rsi),%rax
@@ -23250,12 +23231,12 @@ HIDDEN _sk_bicubic_p3x_hsw
FUNCTION(_sk_bicubic_p3x_hsw)
_sk_bicubic_p3x_hsw:
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 196,226,125,24,5,14,121,2,0 // vbroadcastss 0x2790e(%rip),%ymm0 # 35728 <_sk_srcover_bgra_8888_sse2_lowp+0x420>
+ .byte 196,226,125,24,5,75,121,2,0 // vbroadcastss 0x2794b(%rip),%ymm0 # 35714 <_sk_srcover_bgra_8888_sse2_lowp+0x40c>
.byte 197,252,88,0 // vaddps (%rax),%ymm0,%ymm0
.byte 197,124,16,128,128,0,0,0 // vmovups 0x80(%rax),%ymm8
.byte 196,65,60,89,200 // vmulps %ymm8,%ymm8,%ymm9
- .byte 196,98,125,24,21,248,119,2,0 // vbroadcastss 0x277f8(%rip),%ymm10 # 3562c <_sk_srcover_bgra_8888_sse2_lowp+0x324>
- .byte 196,98,125,24,29,227,120,2,0 // vbroadcastss 0x278e3(%rip),%ymm11 # 35720 <_sk_srcover_bgra_8888_sse2_lowp+0x418>
+ .byte 196,98,125,24,21,73,120,2,0 // vbroadcastss 0x27849(%rip),%ymm10 # 3562c <_sk_srcover_bgra_8888_sse2_lowp+0x324>
+ .byte 196,98,125,24,29,32,121,2,0 // vbroadcastss 0x27920(%rip),%ymm11 # 3570c <_sk_srcover_bgra_8888_sse2_lowp+0x404>
.byte 196,66,61,168,218 // vfmadd213ps %ymm10,%ymm8,%ymm11
.byte 196,65,52,89,195 // vmulps %ymm11,%ymm9,%ymm8
.byte 197,124,17,128,0,1,0,0 // vmovups %ymm8,0x100(%rax)
@@ -23267,13 +23248,13 @@ HIDDEN _sk_bicubic_n3y_hsw
FUNCTION(_sk_bicubic_n3y_hsw)
_sk_bicubic_n3y_hsw:
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 196,226,125,24,13,190,120,2,0 // vbroadcastss 0x278be(%rip),%ymm1 # 3571c <_sk_srcover_bgra_8888_sse2_lowp+0x414>
+ .byte 196,226,125,24,13,251,120,2,0 // vbroadcastss 0x278fb(%rip),%ymm1 # 35708 <_sk_srcover_bgra_8888_sse2_lowp+0x400>
.byte 197,244,88,72,64 // vaddps 0x40(%rax),%ymm1,%ymm1
- .byte 196,98,125,24,5,76,119,2,0 // vbroadcastss 0x2774c(%rip),%ymm8 # 355b8 <_sk_srcover_bgra_8888_sse2_lowp+0x2b0>
+ .byte 196,98,125,24,5,157,119,2,0 // vbroadcastss 0x2779d(%rip),%ymm8 # 355b8 <_sk_srcover_bgra_8888_sse2_lowp+0x2b0>
.byte 197,60,92,128,192,0,0,0 // vsubps 0xc0(%rax),%ymm8,%ymm8
.byte 196,65,60,89,200 // vmulps %ymm8,%ymm8,%ymm9
- .byte 196,98,125,24,21,170,119,2,0 // vbroadcastss 0x277aa(%rip),%ymm10 # 3562c <_sk_srcover_bgra_8888_sse2_lowp+0x324>
- .byte 196,98,125,24,29,149,120,2,0 // vbroadcastss 0x27895(%rip),%ymm11 # 35720 <_sk_srcover_bgra_8888_sse2_lowp+0x418>
+ .byte 196,98,125,24,21,251,119,2,0 // vbroadcastss 0x277fb(%rip),%ymm10 # 3562c <_sk_srcover_bgra_8888_sse2_lowp+0x324>
+ .byte 196,98,125,24,29,210,120,2,0 // vbroadcastss 0x278d2(%rip),%ymm11 # 3570c <_sk_srcover_bgra_8888_sse2_lowp+0x404>
.byte 196,66,61,168,218 // vfmadd213ps %ymm10,%ymm8,%ymm11
.byte 196,65,36,89,193 // vmulps %ymm9,%ymm11,%ymm8
.byte 197,124,17,128,64,1,0,0 // vmovups %ymm8,0x140(%rax)
@@ -23285,16 +23266,16 @@ HIDDEN _sk_bicubic_n1y_hsw
FUNCTION(_sk_bicubic_n1y_hsw)
_sk_bicubic_n1y_hsw:
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 196,226,125,24,13,108,120,2,0 // vbroadcastss 0x2786c(%rip),%ymm1 # 35718 <_sk_srcover_bgra_8888_sse2_lowp+0x410>
+ .byte 196,226,125,24,13,169,120,2,0 // vbroadcastss 0x278a9(%rip),%ymm1 # 35704 <_sk_srcover_bgra_8888_sse2_lowp+0x3fc>
.byte 197,244,88,72,64 // vaddps 0x40(%rax),%ymm1,%ymm1
- .byte 196,98,125,24,5,254,118,2,0 // vbroadcastss 0x276fe(%rip),%ymm8 # 355b8 <_sk_srcover_bgra_8888_sse2_lowp+0x2b0>
+ .byte 196,98,125,24,5,79,119,2,0 // vbroadcastss 0x2774f(%rip),%ymm8 # 355b8 <_sk_srcover_bgra_8888_sse2_lowp+0x2b0>
.byte 197,60,92,128,192,0,0,0 // vsubps 0xc0(%rax),%ymm8,%ymm8
- .byte 196,98,125,24,13,93,120,2,0 // vbroadcastss 0x2785d(%rip),%ymm9 # 35728 <_sk_srcover_bgra_8888_sse2_lowp+0x420>
- .byte 196,98,125,24,21,80,120,2,0 // vbroadcastss 0x27850(%rip),%ymm10 # 35724 <_sk_srcover_bgra_8888_sse2_lowp+0x41c>
+ .byte 196,98,125,24,13,154,120,2,0 // vbroadcastss 0x2789a(%rip),%ymm9 # 35714 <_sk_srcover_bgra_8888_sse2_lowp+0x40c>
+ .byte 196,98,125,24,21,141,120,2,0 // vbroadcastss 0x2788d(%rip),%ymm10 # 35710 <_sk_srcover_bgra_8888_sse2_lowp+0x408>
.byte 196,66,61,168,209 // vfmadd213ps %ymm9,%ymm8,%ymm10
- .byte 196,98,125,24,13,210,118,2,0 // vbroadcastss 0x276d2(%rip),%ymm9 # 355b4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
+ .byte 196,98,125,24,13,35,119,2,0 // vbroadcastss 0x27723(%rip),%ymm9 # 355b4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
.byte 196,66,61,184,202 // vfmadd231ps %ymm10,%ymm8,%ymm9
- .byte 196,98,125,24,21,60,120,2,0 // vbroadcastss 0x2783c(%rip),%ymm10 # 3572c <_sk_srcover_bgra_8888_sse2_lowp+0x424>
+ .byte 196,98,125,24,21,121,120,2,0 // vbroadcastss 0x27879(%rip),%ymm10 # 35718 <_sk_srcover_bgra_8888_sse2_lowp+0x410>
.byte 196,66,61,184,209 // vfmadd231ps %ymm9,%ymm8,%ymm10
.byte 197,124,17,144,64,1,0,0 // vmovups %ymm10,0x140(%rax)
.byte 72,173 // lods %ds:(%rsi),%rax
@@ -23305,14 +23286,14 @@ HIDDEN _sk_bicubic_p1y_hsw
FUNCTION(_sk_bicubic_p1y_hsw)
_sk_bicubic_p1y_hsw:
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 196,98,125,24,5,168,118,2,0 // vbroadcastss 0x276a8(%rip),%ymm8 # 355b4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
+ .byte 196,98,125,24,5,249,118,2,0 // vbroadcastss 0x276f9(%rip),%ymm8 # 355b4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
.byte 197,188,88,72,64 // vaddps 0x40(%rax),%ymm8,%ymm1
.byte 197,124,16,136,192,0,0,0 // vmovups 0xc0(%rax),%ymm9
- .byte 196,98,125,24,21,6,120,2,0 // vbroadcastss 0x27806(%rip),%ymm10 # 35728 <_sk_srcover_bgra_8888_sse2_lowp+0x420>
- .byte 196,98,125,24,29,249,119,2,0 // vbroadcastss 0x277f9(%rip),%ymm11 # 35724 <_sk_srcover_bgra_8888_sse2_lowp+0x41c>
+ .byte 196,98,125,24,21,67,120,2,0 // vbroadcastss 0x27843(%rip),%ymm10 # 35714 <_sk_srcover_bgra_8888_sse2_lowp+0x40c>
+ .byte 196,98,125,24,29,54,120,2,0 // vbroadcastss 0x27836(%rip),%ymm11 # 35710 <_sk_srcover_bgra_8888_sse2_lowp+0x408>
.byte 196,66,53,168,218 // vfmadd213ps %ymm10,%ymm9,%ymm11
.byte 196,66,53,168,216 // vfmadd213ps %ymm8,%ymm9,%ymm11
- .byte 196,98,125,24,5,238,119,2,0 // vbroadcastss 0x277ee(%rip),%ymm8 # 3572c <_sk_srcover_bgra_8888_sse2_lowp+0x424>
+ .byte 196,98,125,24,5,43,120,2,0 // vbroadcastss 0x2782b(%rip),%ymm8 # 35718 <_sk_srcover_bgra_8888_sse2_lowp+0x410>
.byte 196,66,53,184,195 // vfmadd231ps %ymm11,%ymm9,%ymm8
.byte 197,124,17,128,64,1,0,0 // vmovups %ymm8,0x140(%rax)
.byte 72,173 // lods %ds:(%rsi),%rax
@@ -23323,12 +23304,12 @@ HIDDEN _sk_bicubic_p3y_hsw
FUNCTION(_sk_bicubic_p3y_hsw)
_sk_bicubic_p3y_hsw:
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 196,226,125,24,13,206,119,2,0 // vbroadcastss 0x277ce(%rip),%ymm1 # 35728 <_sk_srcover_bgra_8888_sse2_lowp+0x420>
+ .byte 196,226,125,24,13,11,120,2,0 // vbroadcastss 0x2780b(%rip),%ymm1 # 35714 <_sk_srcover_bgra_8888_sse2_lowp+0x40c>
.byte 197,244,88,72,64 // vaddps 0x40(%rax),%ymm1,%ymm1
.byte 197,124,16,128,192,0,0,0 // vmovups 0xc0(%rax),%ymm8
.byte 196,65,60,89,200 // vmulps %ymm8,%ymm8,%ymm9
- .byte 196,98,125,24,21,183,118,2,0 // vbroadcastss 0x276b7(%rip),%ymm10 # 3562c <_sk_srcover_bgra_8888_sse2_lowp+0x324>
- .byte 196,98,125,24,29,162,119,2,0 // vbroadcastss 0x277a2(%rip),%ymm11 # 35720 <_sk_srcover_bgra_8888_sse2_lowp+0x418>
+ .byte 196,98,125,24,21,8,119,2,0 // vbroadcastss 0x27708(%rip),%ymm10 # 3562c <_sk_srcover_bgra_8888_sse2_lowp+0x324>
+ .byte 196,98,125,24,29,223,119,2,0 // vbroadcastss 0x277df(%rip),%ymm11 # 3570c <_sk_srcover_bgra_8888_sse2_lowp+0x404>
.byte 196,66,61,168,218 // vfmadd213ps %ymm10,%ymm8,%ymm11
.byte 196,65,52,89,195 // vmulps %ymm11,%ymm9,%ymm8
.byte 197,124,17,128,64,1,0,0 // vmovups %ymm8,0x140(%rax)
@@ -23468,7 +23449,7 @@ _sk_clut_3D_hsw:
.byte 196,98,93,64,218 // vpmulld %ymm2,%ymm4,%ymm11
.byte 72,139,0 // mov (%rax),%rax
.byte 197,165,254,193 // vpaddd %ymm1,%ymm11,%ymm0
- .byte 196,98,125,88,61,100,117,2,0 // vpbroadcastd 0x27564(%rip),%ymm15 # 35734 <_sk_srcover_bgra_8888_sse2_lowp+0x42c>
+ .byte 196,98,125,88,61,161,117,2,0 // vpbroadcastd 0x275a1(%rip),%ymm15 # 35720 <_sk_srcover_bgra_8888_sse2_lowp+0x418>
.byte 196,194,125,64,199 // vpmulld %ymm15,%ymm0,%ymm0
.byte 197,213,239,237 // vpxor %ymm5,%ymm5,%ymm5
.byte 197,237,118,210 // vpcmpeqd %ymm2,%ymm2,%ymm2
@@ -23480,13 +23461,13 @@ _sk_clut_3D_hsw:
.byte 197,213,118,237 // vpcmpeqd %ymm5,%ymm5,%ymm5
.byte 196,226,85,146,60,144 // vgatherdps %ymm5,(%rax,%ymm2,4),%ymm7
.byte 197,252,17,188,36,0,2,0,0 // vmovups %ymm7,0x200(%rsp)
- .byte 196,226,125,88,61,174,115,2,0 // vpbroadcastd 0x273ae(%rip),%ymm7 # 355c4 <_sk_srcover_bgra_8888_sse2_lowp+0x2bc>
+ .byte 196,226,125,88,61,255,115,2,0 // vpbroadcastd 0x273ff(%rip),%ymm7 # 355c4 <_sk_srcover_bgra_8888_sse2_lowp+0x2bc>
.byte 197,253,254,199 // vpaddd %ymm7,%ymm0,%ymm0
.byte 197,236,87,210 // vxorps %ymm2,%ymm2,%ymm2
.byte 197,213,118,237 // vpcmpeqd %ymm5,%ymm5,%ymm5
.byte 196,226,85,146,20,128 // vgatherdps %ymm5,(%rax,%ymm0,4),%ymm2
.byte 197,252,17,148,36,32,1,0,0 // vmovups %ymm2,0x120(%rsp)
- .byte 196,226,125,24,5,246,116,2,0 // vbroadcastss 0x274f6(%rip),%ymm0 # 35730 <_sk_srcover_bgra_8888_sse2_lowp+0x428>
+ .byte 196,226,125,24,5,51,117,2,0 // vbroadcastss 0x27533(%rip),%ymm0 # 3571c <_sk_srcover_bgra_8888_sse2_lowp+0x414>
.byte 197,172,88,232 // vaddps %ymm0,%ymm10,%ymm5
.byte 197,254,91,237 // vcvttps2dq %ymm5,%ymm5
.byte 196,226,93,64,213 // vpmulld %ymm5,%ymm4,%ymm2
@@ -23748,7 +23729,7 @@ _sk_clut_4D_hsw:
.byte 197,254,127,132,36,0,1,0,0 // vmovdqu %ymm0,0x100(%rsp)
.byte 196,98,109,64,200 // vpmulld %ymm0,%ymm2,%ymm9
.byte 197,181,254,199 // vpaddd %ymm7,%ymm9,%ymm0
- .byte 196,98,125,88,21,143,111,2,0 // vpbroadcastd 0x26f8f(%rip),%ymm10 # 35734 <_sk_srcover_bgra_8888_sse2_lowp+0x42c>
+ .byte 196,98,125,88,21,204,111,2,0 // vpbroadcastd 0x26fcc(%rip),%ymm10 # 35720 <_sk_srcover_bgra_8888_sse2_lowp+0x418>
.byte 196,194,125,64,194 // vpmulld %ymm10,%ymm0,%ymm0
.byte 197,213,118,237 // vpcmpeqd %ymm5,%ymm5,%ymm5
.byte 196,65,60,87,192 // vxorps %ymm8,%ymm8,%ymm8
@@ -23760,13 +23741,13 @@ _sk_clut_4D_hsw:
.byte 196,65,36,87,219 // vxorps %ymm11,%ymm11,%ymm11
.byte 196,98,61,146,28,168 // vgatherdps %ymm8,(%rax,%ymm5,4),%ymm11
.byte 197,124,17,156,36,192,0,0,0 // vmovups %ymm11,0xc0(%rsp)
- .byte 196,98,125,88,29,214,109,2,0 // vpbroadcastd 0x26dd6(%rip),%ymm11 # 355c4 <_sk_srcover_bgra_8888_sse2_lowp+0x2bc>
+ .byte 196,98,125,88,29,39,110,2,0 // vpbroadcastd 0x26e27(%rip),%ymm11 # 355c4 <_sk_srcover_bgra_8888_sse2_lowp+0x2bc>
.byte 196,193,125,254,195 // vpaddd %ymm11,%ymm0,%ymm0
.byte 196,65,61,118,192 // vpcmpeqd %ymm8,%ymm8,%ymm8
.byte 197,212,87,237 // vxorps %ymm5,%ymm5,%ymm5
.byte 196,226,61,146,44,128 // vgatherdps %ymm8,(%rax,%ymm0,4),%ymm5
.byte 197,252,17,108,36,32 // vmovups %ymm5,0x20(%rsp)
- .byte 196,226,125,24,5,31,111,2,0 // vbroadcastss 0x26f1f(%rip),%ymm0 # 35730 <_sk_srcover_bgra_8888_sse2_lowp+0x428>
+ .byte 196,226,125,24,5,92,111,2,0 // vbroadcastss 0x26f5c(%rip),%ymm0 # 3571c <_sk_srcover_bgra_8888_sse2_lowp+0x414>
.byte 197,116,88,192 // vaddps %ymm0,%ymm1,%ymm8
.byte 196,65,126,91,192 // vcvttps2dq %ymm8,%ymm8
.byte 196,194,109,64,232 // vpmulld %ymm8,%ymm2,%ymm5
@@ -24199,7 +24180,7 @@ _sk_clut_4D_hsw:
.byte 196,193,100,92,210 // vsubps %ymm10,%ymm3,%ymm2
.byte 196,194,77,168,210 // vfmadd213ps %ymm10,%ymm6,%ymm2
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 196,226,125,24,29,249,99,2,0 // vbroadcastss 0x263f9(%rip),%ymm3 # 355b8 <_sk_srcover_bgra_8888_sse2_lowp+0x2b0>
+ .byte 196,226,125,24,29,74,100,2,0 // vbroadcastss 0x2644a(%rip),%ymm3 # 355b8 <_sk_srcover_bgra_8888_sse2_lowp+0x2b0>
.byte 197,252,16,164,36,96,6,0,0 // vmovups 0x660(%rsp),%ymm4
.byte 197,252,16,172,36,128,6,0,0 // vmovups 0x680(%rsp),%ymm5
.byte 197,252,16,180,36,160,6,0,0 // vmovups 0x6a0(%rsp),%ymm6
@@ -24207,6 +24188,25 @@ _sk_clut_4D_hsw:
.byte 72,129,196,248,6,0,0 // add $0x6f8,%rsp
.byte 255,224 // jmpq *%rax
+HIDDEN _sk_gauss_a_to_rgba_hsw
+.globl _sk_gauss_a_to_rgba_hsw
+FUNCTION(_sk_gauss_a_to_rgba_hsw)
+_sk_gauss_a_to_rgba_hsw:
+ .byte 196,226,125,24,5,132,101,2,0 // vbroadcastss 0x26584(%rip),%ymm0 # 35728 <_sk_srcover_bgra_8888_sse2_lowp+0x420>
+ .byte 196,226,125,24,13,119,101,2,0 // vbroadcastss 0x26577(%rip),%ymm1 # 35724 <_sk_srcover_bgra_8888_sse2_lowp+0x41c>
+ .byte 196,226,101,168,200 // vfmadd213ps %ymm0,%ymm3,%ymm1
+ .byte 196,226,125,24,5,113,101,2,0 // vbroadcastss 0x26571(%rip),%ymm0 # 3572c <_sk_srcover_bgra_8888_sse2_lowp+0x424>
+ .byte 196,226,101,184,193 // vfmadd231ps %ymm1,%ymm3,%ymm0
+ .byte 196,226,125,24,13,103,101,2,0 // vbroadcastss 0x26567(%rip),%ymm1 # 35730 <_sk_srcover_bgra_8888_sse2_lowp+0x428>
+ .byte 196,226,101,184,200 // vfmadd231ps %ymm0,%ymm3,%ymm1
+ .byte 196,226,125,24,5,93,101,2,0 // vbroadcastss 0x2655d(%rip),%ymm0 # 35734 <_sk_srcover_bgra_8888_sse2_lowp+0x42c>
+ .byte 196,226,101,184,193 // vfmadd231ps %ymm1,%ymm3,%ymm0
+ .byte 72,173 // lods %ds:(%rsi),%rax
+ .byte 197,252,40,200 // vmovaps %ymm0,%ymm1
+ .byte 197,252,40,208 // vmovaps %ymm0,%ymm2
+ .byte 197,252,40,216 // vmovaps %ymm0,%ymm3
+ .byte 255,224 // jmpq *%rax
+
HIDDEN _sk_start_pipeline_avx
.globl _sk_start_pipeline_avx
FUNCTION(_sk_start_pipeline_avx)
@@ -30486,7 +30486,7 @@ _sk_store_f16_avx:
.byte 197,252,17,108,36,192 // vmovups %ymm5,-0x40(%rsp)
.byte 197,252,17,100,36,160 // vmovups %ymm4,-0x60(%rsp)
.byte 197,252,40,225 // vmovaps %ymm1,%ymm4
- .byte 196,98,125,24,5,236,254,1,0 // vbroadcastss 0x1feec(%rip),%ymm8 # 35714 <_sk_srcover_bgra_8888_sse2_lowp+0x40c>
+ .byte 196,98,125,24,5,216,254,1,0 // vbroadcastss 0x1fed8(%rip),%ymm8 # 35700 <_sk_srcover_bgra_8888_sse2_lowp+0x3f8>
.byte 196,65,124,84,216 // vandps %ymm8,%ymm0,%ymm11
.byte 196,98,125,24,21,18,255,1,0 // vbroadcastss 0x1ff12(%rip),%ymm10 # 35748 <_sk_srcover_bgra_8888_sse2_lowp+0x440>
.byte 196,65,124,84,226 // vandps %ymm10,%ymm0,%ymm12
@@ -31712,29 +31712,6 @@ _sk_evenly_spaced_gradient_avx:
.byte 93 // pop %rbp
.byte 255,224 // jmpq *%rax
-HIDDEN _sk_gauss_a_to_rgba_avx
-.globl _sk_gauss_a_to_rgba_avx
-FUNCTION(_sk_gauss_a_to_rgba_avx)
-_sk_gauss_a_to_rgba_avx:
- .byte 196,226,125,24,5,1,234,1,0 // vbroadcastss 0x1ea01(%rip),%ymm0 # 356e4 <_sk_srcover_bgra_8888_sse2_lowp+0x3dc>
- .byte 197,228,89,192 // vmulps %ymm0,%ymm3,%ymm0
- .byte 196,226,125,24,13,248,233,1,0 // vbroadcastss 0x1e9f8(%rip),%ymm1 # 356e8 <_sk_srcover_bgra_8888_sse2_lowp+0x3e0>
- .byte 197,252,88,193 // vaddps %ymm1,%ymm0,%ymm0
- .byte 197,252,89,195 // vmulps %ymm3,%ymm0,%ymm0
- .byte 196,226,125,24,13,235,233,1,0 // vbroadcastss 0x1e9eb(%rip),%ymm1 # 356ec <_sk_srcover_bgra_8888_sse2_lowp+0x3e4>
- .byte 197,252,88,193 // vaddps %ymm1,%ymm0,%ymm0
- .byte 197,252,89,195 // vmulps %ymm3,%ymm0,%ymm0
- .byte 196,226,125,24,13,222,233,1,0 // vbroadcastss 0x1e9de(%rip),%ymm1 # 356f0 <_sk_srcover_bgra_8888_sse2_lowp+0x3e8>
- .byte 197,252,88,193 // vaddps %ymm1,%ymm0,%ymm0
- .byte 197,252,89,195 // vmulps %ymm3,%ymm0,%ymm0
- .byte 196,226,125,24,13,209,233,1,0 // vbroadcastss 0x1e9d1(%rip),%ymm1 # 356f4 <_sk_srcover_bgra_8888_sse2_lowp+0x3ec>
- .byte 197,252,88,193 // vaddps %ymm1,%ymm0,%ymm0
- .byte 72,173 // lods %ds:(%rsi),%rax
- .byte 197,252,40,200 // vmovaps %ymm0,%ymm1
- .byte 197,252,40,208 // vmovaps %ymm0,%ymm2
- .byte 197,252,40,216 // vmovaps %ymm0,%ymm3
- .byte 255,224 // jmpq *%rax
-
HIDDEN _sk_gradient_avx
.globl _sk_gradient_avx
FUNCTION(_sk_gradient_avx)
@@ -31749,12 +31726,12 @@ _sk_gradient_avx:
.byte 76,139,0 // mov (%rax),%r8
.byte 197,244,87,201 // vxorps %ymm1,%ymm1,%ymm1
.byte 73,131,248,2 // cmp $0x2,%r8
- .byte 114,81 // jb 16da6 <_sk_gradient_avx+0x6f>
+ .byte 114,81 // jb 16d49 <_sk_gradient_avx+0x6f>
.byte 72,139,88,72 // mov 0x48(%rax),%rbx
.byte 73,255,200 // dec %r8
.byte 72,131,195,4 // add $0x4,%rbx
.byte 196,65,52,87,201 // vxorps %ymm9,%ymm9,%ymm9
- .byte 196,98,125,24,21,78,232,1,0 // vbroadcastss 0x1e84e(%rip),%ymm10 # 355bc <_sk_srcover_bgra_8888_sse2_lowp+0x2b4>
+ .byte 196,98,125,24,21,171,232,1,0 // vbroadcastss 0x1e8ab(%rip),%ymm10 # 355bc <_sk_srcover_bgra_8888_sse2_lowp+0x2b4>
.byte 197,244,87,201 // vxorps %ymm1,%ymm1,%ymm1
.byte 196,98,125,24,3 // vbroadcastss (%rbx),%ymm8
.byte 197,60,194,192,2 // vcmpleps %ymm0,%ymm8,%ymm8
@@ -31766,7 +31743,7 @@ _sk_gradient_avx:
.byte 196,227,117,24,202,1 // vinsertf128 $0x1,%xmm2,%ymm1,%ymm1
.byte 72,131,195,4 // add $0x4,%rbx
.byte 73,255,200 // dec %r8
- .byte 117,204 // jne 16d72 <_sk_gradient_avx+0x3b>
+ .byte 117,204 // jne 16d15 <_sk_gradient_avx+0x3b>
.byte 196,195,249,22,200,1 // vpextrq $0x1,%xmm1,%r8
.byte 69,137,193 // mov %r8d,%r9d
.byte 73,193,232,32 // shr $0x20,%r8
@@ -31948,27 +31925,27 @@ _sk_xy_to_unit_angle_avx:
.byte 196,65,52,95,226 // vmaxps %ymm10,%ymm9,%ymm12
.byte 196,65,36,94,220 // vdivps %ymm12,%ymm11,%ymm11
.byte 196,65,36,89,227 // vmulps %ymm11,%ymm11,%ymm12
- .byte 196,98,125,24,45,124,229,1,0 // vbroadcastss 0x1e57c(%rip),%ymm13 # 356f8 <_sk_srcover_bgra_8888_sse2_lowp+0x3f0>
+ .byte 196,98,125,24,45,197,229,1,0 // vbroadcastss 0x1e5c5(%rip),%ymm13 # 356e4 <_sk_srcover_bgra_8888_sse2_lowp+0x3dc>
.byte 196,65,28,89,237 // vmulps %ymm13,%ymm12,%ymm13
- .byte 196,98,125,24,53,114,229,1,0 // vbroadcastss 0x1e572(%rip),%ymm14 # 356fc <_sk_srcover_bgra_8888_sse2_lowp+0x3f4>
+ .byte 196,98,125,24,53,187,229,1,0 // vbroadcastss 0x1e5bb(%rip),%ymm14 # 356e8 <_sk_srcover_bgra_8888_sse2_lowp+0x3e0>
.byte 196,65,20,88,238 // vaddps %ymm14,%ymm13,%ymm13
.byte 196,65,28,89,237 // vmulps %ymm13,%ymm12,%ymm13
- .byte 196,98,125,24,53,99,229,1,0 // vbroadcastss 0x1e563(%rip),%ymm14 # 35700 <_sk_srcover_bgra_8888_sse2_lowp+0x3f8>
+ .byte 196,98,125,24,53,172,229,1,0 // vbroadcastss 0x1e5ac(%rip),%ymm14 # 356ec <_sk_srcover_bgra_8888_sse2_lowp+0x3e4>
.byte 196,65,20,88,238 // vaddps %ymm14,%ymm13,%ymm13
.byte 196,65,28,89,229 // vmulps %ymm13,%ymm12,%ymm12
- .byte 196,98,125,24,45,84,229,1,0 // vbroadcastss 0x1e554(%rip),%ymm13 # 35704 <_sk_srcover_bgra_8888_sse2_lowp+0x3fc>
+ .byte 196,98,125,24,45,157,229,1,0 // vbroadcastss 0x1e59d(%rip),%ymm13 # 356f0 <_sk_srcover_bgra_8888_sse2_lowp+0x3e8>
.byte 196,65,28,88,229 // vaddps %ymm13,%ymm12,%ymm12
.byte 196,65,36,89,220 // vmulps %ymm12,%ymm11,%ymm11
.byte 196,65,52,194,202,1 // vcmpltps %ymm10,%ymm9,%ymm9
- .byte 196,98,125,24,21,63,229,1,0 // vbroadcastss 0x1e53f(%rip),%ymm10 # 35708 <_sk_srcover_bgra_8888_sse2_lowp+0x400>
+ .byte 196,98,125,24,21,136,229,1,0 // vbroadcastss 0x1e588(%rip),%ymm10 # 356f4 <_sk_srcover_bgra_8888_sse2_lowp+0x3ec>
.byte 196,65,44,92,211 // vsubps %ymm11,%ymm10,%ymm10
.byte 196,67,37,74,202,144 // vblendvps %ymm9,%ymm10,%ymm11,%ymm9
.byte 196,193,124,194,192,1 // vcmpltps %ymm8,%ymm0,%ymm0
- .byte 196,98,125,24,21,209,227,1,0 // vbroadcastss 0x1e3d1(%rip),%ymm10 # 355b4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
+ .byte 196,98,125,24,21,46,228,1,0 // vbroadcastss 0x1e42e(%rip),%ymm10 # 355b4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
.byte 196,65,44,92,209 // vsubps %ymm9,%ymm10,%ymm10
.byte 196,195,53,74,194,0 // vblendvps %ymm0,%ymm10,%ymm9,%ymm0
.byte 196,65,116,194,200,1 // vcmpltps %ymm8,%ymm1,%ymm9
- .byte 196,98,125,24,21,187,227,1,0 // vbroadcastss 0x1e3bb(%rip),%ymm10 # 355b8 <_sk_srcover_bgra_8888_sse2_lowp+0x2b0>
+ .byte 196,98,125,24,21,24,228,1,0 // vbroadcastss 0x1e418(%rip),%ymm10 # 355b8 <_sk_srcover_bgra_8888_sse2_lowp+0x2b0>
.byte 197,44,92,208 // vsubps %ymm0,%ymm10,%ymm10
.byte 196,195,125,74,194,144 // vblendvps %ymm9,%ymm10,%ymm0,%ymm0
.byte 196,65,124,194,200,3 // vcmpunordps %ymm8,%ymm0,%ymm9
@@ -31998,7 +31975,7 @@ _sk_xy_to_2pt_conical_quadratic_max_avx:
.byte 196,67,121,4,210,0 // vpermilps $0x0,%xmm10,%xmm10
.byte 196,67,45,24,210,1 // vinsertf128 $0x1,%xmm10,%ymm10,%ymm10
.byte 197,44,88,208 // vaddps %ymm0,%ymm10,%ymm10
- .byte 196,98,125,24,29,181,228,1,0 // vbroadcastss 0x1e4b5(%rip),%ymm11 # 3570c <_sk_srcover_bgra_8888_sse2_lowp+0x404>
+ .byte 196,98,125,24,29,254,228,1,0 // vbroadcastss 0x1e4fe(%rip),%ymm11 # 356f8 <_sk_srcover_bgra_8888_sse2_lowp+0x3f0>
.byte 196,65,44,89,211 // vmulps %ymm11,%ymm10,%ymm10
.byte 197,252,89,192 // vmulps %ymm0,%ymm0,%ymm0
.byte 197,116,89,217 // vmulps %ymm1,%ymm1,%ymm11
@@ -32007,17 +31984,17 @@ _sk_xy_to_2pt_conical_quadratic_max_avx:
.byte 196,227,121,4,192,0 // vpermilps $0x0,%xmm0,%xmm0
.byte 196,227,125,24,192,1 // vinsertf128 $0x1,%xmm0,%ymm0,%ymm0
.byte 197,164,92,192 // vsubps %ymm0,%ymm11,%ymm0
- .byte 196,98,125,24,13,137,228,1,0 // vbroadcastss 0x1e489(%rip),%ymm9 # 35710 <_sk_srcover_bgra_8888_sse2_lowp+0x408>
+ .byte 196,98,125,24,13,210,228,1,0 // vbroadcastss 0x1e4d2(%rip),%ymm9 # 356fc <_sk_srcover_bgra_8888_sse2_lowp+0x3f4>
.byte 196,65,60,89,193 // vmulps %ymm9,%ymm8,%ymm8
.byte 197,188,89,192 // vmulps %ymm0,%ymm8,%ymm0
.byte 196,65,44,89,194 // vmulps %ymm10,%ymm10,%ymm8
.byte 196,193,124,88,192 // vaddps %ymm8,%ymm0,%ymm0
.byte 197,252,81,192 // vsqrtps %ymm0,%ymm0
.byte 196,98,125,24,64,68 // vbroadcastss 0x44(%rax),%ymm8
- .byte 196,98,125,24,13,103,228,1,0 // vbroadcastss 0x1e467(%rip),%ymm9 # 35714 <_sk_srcover_bgra_8888_sse2_lowp+0x40c>
+ .byte 196,98,125,24,13,176,228,1,0 // vbroadcastss 0x1e4b0(%rip),%ymm9 # 35700 <_sk_srcover_bgra_8888_sse2_lowp+0x3f8>
.byte 196,65,44,87,201 // vxorps %ymm9,%ymm10,%ymm9
.byte 196,65,124,92,210 // vsubps %ymm10,%ymm0,%ymm10
- .byte 196,98,125,24,29,244,226,1,0 // vbroadcastss 0x1e2f4(%rip),%ymm11 # 355b4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
+ .byte 196,98,125,24,29,81,227,1,0 // vbroadcastss 0x1e351(%rip),%ymm11 # 355b4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
.byte 196,65,60,89,195 // vmulps %ymm11,%ymm8,%ymm8
.byte 196,65,60,89,210 // vmulps %ymm10,%ymm8,%ymm10
.byte 197,180,92,192 // vsubps %ymm0,%ymm9,%ymm0
@@ -32037,7 +32014,7 @@ _sk_xy_to_2pt_conical_quadratic_min_avx:
.byte 196,67,121,4,210,0 // vpermilps $0x0,%xmm10,%xmm10
.byte 196,67,45,24,210,1 // vinsertf128 $0x1,%xmm10,%ymm10,%ymm10
.byte 197,44,88,208 // vaddps %ymm0,%ymm10,%ymm10
- .byte 196,98,125,24,29,7,228,1,0 // vbroadcastss 0x1e407(%rip),%ymm11 # 3570c <_sk_srcover_bgra_8888_sse2_lowp+0x404>
+ .byte 196,98,125,24,29,80,228,1,0 // vbroadcastss 0x1e450(%rip),%ymm11 # 356f8 <_sk_srcover_bgra_8888_sse2_lowp+0x3f0>
.byte 196,65,44,89,211 // vmulps %ymm11,%ymm10,%ymm10
.byte 197,252,89,192 // vmulps %ymm0,%ymm0,%ymm0
.byte 197,116,89,217 // vmulps %ymm1,%ymm1,%ymm11
@@ -32046,17 +32023,17 @@ _sk_xy_to_2pt_conical_quadratic_min_avx:
.byte 196,227,121,4,192,0 // vpermilps $0x0,%xmm0,%xmm0
.byte 196,227,125,24,192,1 // vinsertf128 $0x1,%xmm0,%ymm0,%ymm0
.byte 197,164,92,192 // vsubps %ymm0,%ymm11,%ymm0
- .byte 196,98,125,24,13,219,227,1,0 // vbroadcastss 0x1e3db(%rip),%ymm9 # 35710 <_sk_srcover_bgra_8888_sse2_lowp+0x408>
+ .byte 196,98,125,24,13,36,228,1,0 // vbroadcastss 0x1e424(%rip),%ymm9 # 356fc <_sk_srcover_bgra_8888_sse2_lowp+0x3f4>
.byte 196,65,60,89,193 // vmulps %ymm9,%ymm8,%ymm8
.byte 197,188,89,192 // vmulps %ymm0,%ymm8,%ymm0
.byte 196,65,44,89,194 // vmulps %ymm10,%ymm10,%ymm8
.byte 196,193,124,88,192 // vaddps %ymm8,%ymm0,%ymm0
.byte 197,252,81,192 // vsqrtps %ymm0,%ymm0
.byte 196,98,125,24,64,68 // vbroadcastss 0x44(%rax),%ymm8
- .byte 196,98,125,24,13,185,227,1,0 // vbroadcastss 0x1e3b9(%rip),%ymm9 # 35714 <_sk_srcover_bgra_8888_sse2_lowp+0x40c>
+ .byte 196,98,125,24,13,2,228,1,0 // vbroadcastss 0x1e402(%rip),%ymm9 # 35700 <_sk_srcover_bgra_8888_sse2_lowp+0x3f8>
.byte 196,65,44,87,201 // vxorps %ymm9,%ymm10,%ymm9
.byte 196,65,124,92,210 // vsubps %ymm10,%ymm0,%ymm10
- .byte 196,98,125,24,29,70,226,1,0 // vbroadcastss 0x1e246(%rip),%ymm11 # 355b4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
+ .byte 196,98,125,24,29,163,226,1,0 // vbroadcastss 0x1e2a3(%rip),%ymm11 # 355b4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
.byte 196,65,60,89,195 // vmulps %ymm11,%ymm8,%ymm8
.byte 196,65,60,89,210 // vmulps %ymm10,%ymm8,%ymm10
.byte 197,180,92,192 // vsubps %ymm0,%ymm9,%ymm0
@@ -32075,7 +32052,7 @@ _sk_xy_to_2pt_conical_linear_avx:
.byte 196,67,121,4,201,0 // vpermilps $0x0,%xmm9,%xmm9
.byte 196,67,53,24,201,1 // vinsertf128 $0x1,%xmm9,%ymm9,%ymm9
.byte 197,52,88,200 // vaddps %ymm0,%ymm9,%ymm9
- .byte 196,98,125,24,21,95,227,1,0 // vbroadcastss 0x1e35f(%rip),%ymm10 # 3570c <_sk_srcover_bgra_8888_sse2_lowp+0x404>
+ .byte 196,98,125,24,21,168,227,1,0 // vbroadcastss 0x1e3a8(%rip),%ymm10 # 356f8 <_sk_srcover_bgra_8888_sse2_lowp+0x3f0>
.byte 196,65,52,89,202 // vmulps %ymm10,%ymm9,%ymm9
.byte 197,252,89,192 // vmulps %ymm0,%ymm0,%ymm0
.byte 197,116,89,209 // vmulps %ymm1,%ymm1,%ymm10
@@ -32084,7 +32061,7 @@ _sk_xy_to_2pt_conical_linear_avx:
.byte 196,227,121,4,192,0 // vpermilps $0x0,%xmm0,%xmm0
.byte 196,227,125,24,192,1 // vinsertf128 $0x1,%xmm0,%ymm0,%ymm0
.byte 197,172,92,192 // vsubps %ymm0,%ymm10,%ymm0
- .byte 196,98,125,24,5,55,227,1,0 // vbroadcastss 0x1e337(%rip),%ymm8 # 35714 <_sk_srcover_bgra_8888_sse2_lowp+0x40c>
+ .byte 196,98,125,24,5,128,227,1,0 // vbroadcastss 0x1e380(%rip),%ymm8 # 35700 <_sk_srcover_bgra_8888_sse2_lowp+0x3f8>
.byte 196,193,124,87,192 // vxorps %ymm8,%ymm0,%ymm0
.byte 196,193,124,94,193 // vdivps %ymm9,%ymm0,%ymm0
.byte 72,173 // lods %ds:(%rsi),%rax
@@ -32128,7 +32105,7 @@ HIDDEN _sk_save_xy_avx
FUNCTION(_sk_save_xy_avx)
_sk_save_xy_avx:
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 196,98,125,24,5,93,225,1,0 // vbroadcastss 0x1e15d(%rip),%ymm8 # 355b4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
+ .byte 196,98,125,24,5,186,225,1,0 // vbroadcastss 0x1e1ba(%rip),%ymm8 # 355b4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
.byte 196,65,124,88,200 // vaddps %ymm8,%ymm0,%ymm9
.byte 196,67,125,8,209,1 // vroundps $0x1,%ymm9,%ymm10
.byte 196,65,52,92,202 // vsubps %ymm10,%ymm9,%ymm9
@@ -32165,9 +32142,9 @@ HIDDEN _sk_bilinear_nx_avx
FUNCTION(_sk_bilinear_nx_avx)
_sk_bilinear_nx_avx:
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 196,226,125,24,5,67,226,1,0 // vbroadcastss 0x1e243(%rip),%ymm0 # 35718 <_sk_srcover_bgra_8888_sse2_lowp+0x410>
+ .byte 196,226,125,24,5,140,226,1,0 // vbroadcastss 0x1e28c(%rip),%ymm0 # 35704 <_sk_srcover_bgra_8888_sse2_lowp+0x3fc>
.byte 197,252,88,0 // vaddps (%rax),%ymm0,%ymm0
- .byte 196,98,125,24,5,214,224,1,0 // vbroadcastss 0x1e0d6(%rip),%ymm8 # 355b8 <_sk_srcover_bgra_8888_sse2_lowp+0x2b0>
+ .byte 196,98,125,24,5,51,225,1,0 // vbroadcastss 0x1e133(%rip),%ymm8 # 355b8 <_sk_srcover_bgra_8888_sse2_lowp+0x2b0>
.byte 197,60,92,128,128,0,0,0 // vsubps 0x80(%rax),%ymm8,%ymm8
.byte 197,124,17,128,0,1,0,0 // vmovups %ymm8,0x100(%rax)
.byte 72,173 // lods %ds:(%rsi),%rax
@@ -32178,7 +32155,7 @@ HIDDEN _sk_bilinear_px_avx
FUNCTION(_sk_bilinear_px_avx)
_sk_bilinear_px_avx:
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 196,226,125,24,5,179,224,1,0 // vbroadcastss 0x1e0b3(%rip),%ymm0 # 355b4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
+ .byte 196,226,125,24,5,16,225,1,0 // vbroadcastss 0x1e110(%rip),%ymm0 # 355b4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
.byte 197,252,88,0 // vaddps (%rax),%ymm0,%ymm0
.byte 197,124,16,128,128,0,0,0 // vmovups 0x80(%rax),%ymm8
.byte 197,124,17,128,0,1,0,0 // vmovups %ymm8,0x100(%rax)
@@ -32190,9 +32167,9 @@ HIDDEN _sk_bilinear_ny_avx
FUNCTION(_sk_bilinear_ny_avx)
_sk_bilinear_ny_avx:
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 196,226,125,24,13,244,225,1,0 // vbroadcastss 0x1e1f4(%rip),%ymm1 # 35718 <_sk_srcover_bgra_8888_sse2_lowp+0x410>
+ .byte 196,226,125,24,13,61,226,1,0 // vbroadcastss 0x1e23d(%rip),%ymm1 # 35704 <_sk_srcover_bgra_8888_sse2_lowp+0x3fc>
.byte 197,244,88,72,64 // vaddps 0x40(%rax),%ymm1,%ymm1
- .byte 196,98,125,24,5,134,224,1,0 // vbroadcastss 0x1e086(%rip),%ymm8 # 355b8 <_sk_srcover_bgra_8888_sse2_lowp+0x2b0>
+ .byte 196,98,125,24,5,227,224,1,0 // vbroadcastss 0x1e0e3(%rip),%ymm8 # 355b8 <_sk_srcover_bgra_8888_sse2_lowp+0x2b0>
.byte 197,60,92,128,192,0,0,0 // vsubps 0xc0(%rax),%ymm8,%ymm8
.byte 197,124,17,128,64,1,0,0 // vmovups %ymm8,0x140(%rax)
.byte 72,173 // lods %ds:(%rsi),%rax
@@ -32203,7 +32180,7 @@ HIDDEN _sk_bilinear_py_avx
FUNCTION(_sk_bilinear_py_avx)
_sk_bilinear_py_avx:
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 196,226,125,24,13,99,224,1,0 // vbroadcastss 0x1e063(%rip),%ymm1 # 355b4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
+ .byte 196,226,125,24,13,192,224,1,0 // vbroadcastss 0x1e0c0(%rip),%ymm1 # 355b4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
.byte 197,244,88,72,64 // vaddps 0x40(%rax),%ymm1,%ymm1
.byte 197,124,16,128,192,0,0,0 // vmovups 0xc0(%rax),%ymm8
.byte 197,124,17,128,64,1,0,0 // vmovups %ymm8,0x140(%rax)
@@ -32215,14 +32192,14 @@ HIDDEN _sk_bicubic_n3x_avx
FUNCTION(_sk_bicubic_n3x_avx)
_sk_bicubic_n3x_avx:
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 196,226,125,24,5,167,225,1,0 // vbroadcastss 0x1e1a7(%rip),%ymm0 # 3571c <_sk_srcover_bgra_8888_sse2_lowp+0x414>
+ .byte 196,226,125,24,5,240,225,1,0 // vbroadcastss 0x1e1f0(%rip),%ymm0 # 35708 <_sk_srcover_bgra_8888_sse2_lowp+0x400>
.byte 197,252,88,0 // vaddps (%rax),%ymm0,%ymm0
- .byte 196,98,125,24,5,54,224,1,0 // vbroadcastss 0x1e036(%rip),%ymm8 # 355b8 <_sk_srcover_bgra_8888_sse2_lowp+0x2b0>
+ .byte 196,98,125,24,5,147,224,1,0 // vbroadcastss 0x1e093(%rip),%ymm8 # 355b8 <_sk_srcover_bgra_8888_sse2_lowp+0x2b0>
.byte 197,60,92,128,128,0,0,0 // vsubps 0x80(%rax),%ymm8,%ymm8
.byte 196,65,60,89,200 // vmulps %ymm8,%ymm8,%ymm9
- .byte 196,98,125,24,21,136,225,1,0 // vbroadcastss 0x1e188(%rip),%ymm10 # 35720 <_sk_srcover_bgra_8888_sse2_lowp+0x418>
+ .byte 196,98,125,24,21,209,225,1,0 // vbroadcastss 0x1e1d1(%rip),%ymm10 # 3570c <_sk_srcover_bgra_8888_sse2_lowp+0x404>
.byte 196,65,60,89,194 // vmulps %ymm10,%ymm8,%ymm8
- .byte 196,98,125,24,21,134,224,1,0 // vbroadcastss 0x1e086(%rip),%ymm10 # 3562c <_sk_srcover_bgra_8888_sse2_lowp+0x324>
+ .byte 196,98,125,24,21,227,224,1,0 // vbroadcastss 0x1e0e3(%rip),%ymm10 # 3562c <_sk_srcover_bgra_8888_sse2_lowp+0x324>
.byte 196,65,60,88,194 // vaddps %ymm10,%ymm8,%ymm8
.byte 196,65,52,89,192 // vmulps %ymm8,%ymm9,%ymm8
.byte 197,124,17,128,0,1,0,0 // vmovups %ymm8,0x100(%rax)
@@ -32234,19 +32211,19 @@ HIDDEN _sk_bicubic_n1x_avx
FUNCTION(_sk_bicubic_n1x_avx)
_sk_bicubic_n1x_avx:
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 196,226,125,24,5,81,225,1,0 // vbroadcastss 0x1e151(%rip),%ymm0 # 35718 <_sk_srcover_bgra_8888_sse2_lowp+0x410>
+ .byte 196,226,125,24,5,154,225,1,0 // vbroadcastss 0x1e19a(%rip),%ymm0 # 35704 <_sk_srcover_bgra_8888_sse2_lowp+0x3fc>
.byte 197,252,88,0 // vaddps (%rax),%ymm0,%ymm0
- .byte 196,98,125,24,5,228,223,1,0 // vbroadcastss 0x1dfe4(%rip),%ymm8 # 355b8 <_sk_srcover_bgra_8888_sse2_lowp+0x2b0>
+ .byte 196,98,125,24,5,65,224,1,0 // vbroadcastss 0x1e041(%rip),%ymm8 # 355b8 <_sk_srcover_bgra_8888_sse2_lowp+0x2b0>
.byte 197,60,92,128,128,0,0,0 // vsubps 0x80(%rax),%ymm8,%ymm8
- .byte 196,98,125,24,13,63,225,1,0 // vbroadcastss 0x1e13f(%rip),%ymm9 # 35724 <_sk_srcover_bgra_8888_sse2_lowp+0x41c>
+ .byte 196,98,125,24,13,136,225,1,0 // vbroadcastss 0x1e188(%rip),%ymm9 # 35710 <_sk_srcover_bgra_8888_sse2_lowp+0x408>
.byte 196,65,60,89,201 // vmulps %ymm9,%ymm8,%ymm9
- .byte 196,98,125,24,21,53,225,1,0 // vbroadcastss 0x1e135(%rip),%ymm10 # 35728 <_sk_srcover_bgra_8888_sse2_lowp+0x420>
+ .byte 196,98,125,24,21,126,225,1,0 // vbroadcastss 0x1e17e(%rip),%ymm10 # 35714 <_sk_srcover_bgra_8888_sse2_lowp+0x40c>
.byte 196,65,52,88,202 // vaddps %ymm10,%ymm9,%ymm9
.byte 196,65,60,89,201 // vmulps %ymm9,%ymm8,%ymm9
- .byte 196,98,125,24,21,174,223,1,0 // vbroadcastss 0x1dfae(%rip),%ymm10 # 355b4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
+ .byte 196,98,125,24,21,11,224,1,0 // vbroadcastss 0x1e00b(%rip),%ymm10 # 355b4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
.byte 196,65,52,88,202 // vaddps %ymm10,%ymm9,%ymm9
.byte 196,65,60,89,193 // vmulps %ymm9,%ymm8,%ymm8
- .byte 196,98,125,24,13,19,225,1,0 // vbroadcastss 0x1e113(%rip),%ymm9 # 3572c <_sk_srcover_bgra_8888_sse2_lowp+0x424>
+ .byte 196,98,125,24,13,92,225,1,0 // vbroadcastss 0x1e15c(%rip),%ymm9 # 35718 <_sk_srcover_bgra_8888_sse2_lowp+0x410>
.byte 196,65,60,88,193 // vaddps %ymm9,%ymm8,%ymm8
.byte 197,124,17,128,0,1,0,0 // vmovups %ymm8,0x100(%rax)
.byte 72,173 // lods %ds:(%rsi),%rax
@@ -32257,17 +32234,17 @@ HIDDEN _sk_bicubic_p1x_avx
FUNCTION(_sk_bicubic_p1x_avx)
_sk_bicubic_p1x_avx:
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 196,98,125,24,5,127,223,1,0 // vbroadcastss 0x1df7f(%rip),%ymm8 # 355b4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
+ .byte 196,98,125,24,5,220,223,1,0 // vbroadcastss 0x1dfdc(%rip),%ymm8 # 355b4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
.byte 197,188,88,0 // vaddps (%rax),%ymm8,%ymm0
.byte 197,124,16,136,128,0,0,0 // vmovups 0x80(%rax),%ymm9
- .byte 196,98,125,24,21,218,224,1,0 // vbroadcastss 0x1e0da(%rip),%ymm10 # 35724 <_sk_srcover_bgra_8888_sse2_lowp+0x41c>
+ .byte 196,98,125,24,21,35,225,1,0 // vbroadcastss 0x1e123(%rip),%ymm10 # 35710 <_sk_srcover_bgra_8888_sse2_lowp+0x408>
.byte 196,65,52,89,210 // vmulps %ymm10,%ymm9,%ymm10
- .byte 196,98,125,24,29,208,224,1,0 // vbroadcastss 0x1e0d0(%rip),%ymm11 # 35728 <_sk_srcover_bgra_8888_sse2_lowp+0x420>
+ .byte 196,98,125,24,29,25,225,1,0 // vbroadcastss 0x1e119(%rip),%ymm11 # 35714 <_sk_srcover_bgra_8888_sse2_lowp+0x40c>
.byte 196,65,44,88,211 // vaddps %ymm11,%ymm10,%ymm10
.byte 196,65,52,89,210 // vmulps %ymm10,%ymm9,%ymm10
.byte 196,65,44,88,192 // vaddps %ymm8,%ymm10,%ymm8
.byte 196,65,52,89,192 // vmulps %ymm8,%ymm9,%ymm8
- .byte 196,98,125,24,13,183,224,1,0 // vbroadcastss 0x1e0b7(%rip),%ymm9 # 3572c <_sk_srcover_bgra_8888_sse2_lowp+0x424>
+ .byte 196,98,125,24,13,0,225,1,0 // vbroadcastss 0x1e100(%rip),%ymm9 # 35718 <_sk_srcover_bgra_8888_sse2_lowp+0x410>
.byte 196,65,60,88,193 // vaddps %ymm9,%ymm8,%ymm8
.byte 197,124,17,128,0,1,0,0 // vmovups %ymm8,0x100(%rax)
.byte 72,173 // lods %ds:(%rsi),%rax
@@ -32278,13 +32255,13 @@ HIDDEN _sk_bicubic_p3x_avx
FUNCTION(_sk_bicubic_p3x_avx)
_sk_bicubic_p3x_avx:
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 196,226,125,24,5,151,224,1,0 // vbroadcastss 0x1e097(%rip),%ymm0 # 35728 <_sk_srcover_bgra_8888_sse2_lowp+0x420>
+ .byte 196,226,125,24,5,224,224,1,0 // vbroadcastss 0x1e0e0(%rip),%ymm0 # 35714 <_sk_srcover_bgra_8888_sse2_lowp+0x40c>
.byte 197,252,88,0 // vaddps (%rax),%ymm0,%ymm0
.byte 197,124,16,128,128,0,0,0 // vmovups 0x80(%rax),%ymm8
.byte 196,65,60,89,200 // vmulps %ymm8,%ymm8,%ymm9
- .byte 196,98,125,24,21,117,224,1,0 // vbroadcastss 0x1e075(%rip),%ymm10 # 35720 <_sk_srcover_bgra_8888_sse2_lowp+0x418>
+ .byte 196,98,125,24,21,190,224,1,0 // vbroadcastss 0x1e0be(%rip),%ymm10 # 3570c <_sk_srcover_bgra_8888_sse2_lowp+0x404>
.byte 196,65,60,89,194 // vmulps %ymm10,%ymm8,%ymm8
- .byte 196,98,125,24,21,115,223,1,0 // vbroadcastss 0x1df73(%rip),%ymm10 # 3562c <_sk_srcover_bgra_8888_sse2_lowp+0x324>
+ .byte 196,98,125,24,21,208,223,1,0 // vbroadcastss 0x1dfd0(%rip),%ymm10 # 3562c <_sk_srcover_bgra_8888_sse2_lowp+0x324>
.byte 196,65,60,88,194 // vaddps %ymm10,%ymm8,%ymm8
.byte 196,65,52,89,192 // vmulps %ymm8,%ymm9,%ymm8
.byte 197,124,17,128,0,1,0,0 // vmovups %ymm8,0x100(%rax)
@@ -32296,14 +32273,14 @@ HIDDEN _sk_bicubic_n3y_avx
FUNCTION(_sk_bicubic_n3y_avx)
_sk_bicubic_n3y_avx:
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 196,226,125,24,13,66,224,1,0 // vbroadcastss 0x1e042(%rip),%ymm1 # 3571c <_sk_srcover_bgra_8888_sse2_lowp+0x414>
+ .byte 196,226,125,24,13,139,224,1,0 // vbroadcastss 0x1e08b(%rip),%ymm1 # 35708 <_sk_srcover_bgra_8888_sse2_lowp+0x400>
.byte 197,244,88,72,64 // vaddps 0x40(%rax),%ymm1,%ymm1
- .byte 196,98,125,24,5,208,222,1,0 // vbroadcastss 0x1ded0(%rip),%ymm8 # 355b8 <_sk_srcover_bgra_8888_sse2_lowp+0x2b0>
+ .byte 196,98,125,24,5,45,223,1,0 // vbroadcastss 0x1df2d(%rip),%ymm8 # 355b8 <_sk_srcover_bgra_8888_sse2_lowp+0x2b0>
.byte 197,60,92,128,192,0,0,0 // vsubps 0xc0(%rax),%ymm8,%ymm8
.byte 196,65,60,89,200 // vmulps %ymm8,%ymm8,%ymm9
- .byte 196,98,125,24,21,34,224,1,0 // vbroadcastss 0x1e022(%rip),%ymm10 # 35720 <_sk_srcover_bgra_8888_sse2_lowp+0x418>
+ .byte 196,98,125,24,21,107,224,1,0 // vbroadcastss 0x1e06b(%rip),%ymm10 # 3570c <_sk_srcover_bgra_8888_sse2_lowp+0x404>
.byte 196,65,60,89,194 // vmulps %ymm10,%ymm8,%ymm8
- .byte 196,98,125,24,21,32,223,1,0 // vbroadcastss 0x1df20(%rip),%ymm10 # 3562c <_sk_srcover_bgra_8888_sse2_lowp+0x324>
+ .byte 196,98,125,24,21,125,223,1,0 // vbroadcastss 0x1df7d(%rip),%ymm10 # 3562c <_sk_srcover_bgra_8888_sse2_lowp+0x324>
.byte 196,65,60,88,194 // vaddps %ymm10,%ymm8,%ymm8
.byte 196,65,52,89,192 // vmulps %ymm8,%ymm9,%ymm8
.byte 197,124,17,128,64,1,0,0 // vmovups %ymm8,0x140(%rax)
@@ -32315,19 +32292,19 @@ HIDDEN _sk_bicubic_n1y_avx
FUNCTION(_sk_bicubic_n1y_avx)
_sk_bicubic_n1y_avx:
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 196,226,125,24,13,235,223,1,0 // vbroadcastss 0x1dfeb(%rip),%ymm1 # 35718 <_sk_srcover_bgra_8888_sse2_lowp+0x410>
+ .byte 196,226,125,24,13,52,224,1,0 // vbroadcastss 0x1e034(%rip),%ymm1 # 35704 <_sk_srcover_bgra_8888_sse2_lowp+0x3fc>
.byte 197,244,88,72,64 // vaddps 0x40(%rax),%ymm1,%ymm1
- .byte 196,98,125,24,5,125,222,1,0 // vbroadcastss 0x1de7d(%rip),%ymm8 # 355b8 <_sk_srcover_bgra_8888_sse2_lowp+0x2b0>
+ .byte 196,98,125,24,5,218,222,1,0 // vbroadcastss 0x1deda(%rip),%ymm8 # 355b8 <_sk_srcover_bgra_8888_sse2_lowp+0x2b0>
.byte 197,60,92,128,192,0,0,0 // vsubps 0xc0(%rax),%ymm8,%ymm8
- .byte 196,98,125,24,13,216,223,1,0 // vbroadcastss 0x1dfd8(%rip),%ymm9 # 35724 <_sk_srcover_bgra_8888_sse2_lowp+0x41c>
+ .byte 196,98,125,24,13,33,224,1,0 // vbroadcastss 0x1e021(%rip),%ymm9 # 35710 <_sk_srcover_bgra_8888_sse2_lowp+0x408>
.byte 196,65,60,89,201 // vmulps %ymm9,%ymm8,%ymm9
- .byte 196,98,125,24,21,206,223,1,0 // vbroadcastss 0x1dfce(%rip),%ymm10 # 35728 <_sk_srcover_bgra_8888_sse2_lowp+0x420>
+ .byte 196,98,125,24,21,23,224,1,0 // vbroadcastss 0x1e017(%rip),%ymm10 # 35714 <_sk_srcover_bgra_8888_sse2_lowp+0x40c>
.byte 196,65,52,88,202 // vaddps %ymm10,%ymm9,%ymm9
.byte 196,65,60,89,201 // vmulps %ymm9,%ymm8,%ymm9
- .byte 196,98,125,24,21,71,222,1,0 // vbroadcastss 0x1de47(%rip),%ymm10 # 355b4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
+ .byte 196,98,125,24,21,164,222,1,0 // vbroadcastss 0x1dea4(%rip),%ymm10 # 355b4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
.byte 196,65,52,88,202 // vaddps %ymm10,%ymm9,%ymm9
.byte 196,65,60,89,193 // vmulps %ymm9,%ymm8,%ymm8
- .byte 196,98,125,24,13,172,223,1,0 // vbroadcastss 0x1dfac(%rip),%ymm9 # 3572c <_sk_srcover_bgra_8888_sse2_lowp+0x424>
+ .byte 196,98,125,24,13,245,223,1,0 // vbroadcastss 0x1dff5(%rip),%ymm9 # 35718 <_sk_srcover_bgra_8888_sse2_lowp+0x410>
.byte 196,65,60,88,193 // vaddps %ymm9,%ymm8,%ymm8
.byte 197,124,17,128,64,1,0,0 // vmovups %ymm8,0x140(%rax)
.byte 72,173 // lods %ds:(%rsi),%rax
@@ -32338,17 +32315,17 @@ HIDDEN _sk_bicubic_p1y_avx
FUNCTION(_sk_bicubic_p1y_avx)
_sk_bicubic_p1y_avx:
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 196,98,125,24,5,24,222,1,0 // vbroadcastss 0x1de18(%rip),%ymm8 # 355b4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
+ .byte 196,98,125,24,5,117,222,1,0 // vbroadcastss 0x1de75(%rip),%ymm8 # 355b4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
.byte 197,188,88,72,64 // vaddps 0x40(%rax),%ymm8,%ymm1
.byte 197,124,16,136,192,0,0,0 // vmovups 0xc0(%rax),%ymm9
- .byte 196,98,125,24,21,114,223,1,0 // vbroadcastss 0x1df72(%rip),%ymm10 # 35724 <_sk_srcover_bgra_8888_sse2_lowp+0x41c>
+ .byte 196,98,125,24,21,187,223,1,0 // vbroadcastss 0x1dfbb(%rip),%ymm10 # 35710 <_sk_srcover_bgra_8888_sse2_lowp+0x408>
.byte 196,65,52,89,210 // vmulps %ymm10,%ymm9,%ymm10
- .byte 196,98,125,24,29,104,223,1,0 // vbroadcastss 0x1df68(%rip),%ymm11 # 35728 <_sk_srcover_bgra_8888_sse2_lowp+0x420>
+ .byte 196,98,125,24,29,177,223,1,0 // vbroadcastss 0x1dfb1(%rip),%ymm11 # 35714 <_sk_srcover_bgra_8888_sse2_lowp+0x40c>
.byte 196,65,44,88,211 // vaddps %ymm11,%ymm10,%ymm10
.byte 196,65,52,89,210 // vmulps %ymm10,%ymm9,%ymm10
.byte 196,65,44,88,192 // vaddps %ymm8,%ymm10,%ymm8
.byte 196,65,52,89,192 // vmulps %ymm8,%ymm9,%ymm8
- .byte 196,98,125,24,13,79,223,1,0 // vbroadcastss 0x1df4f(%rip),%ymm9 # 3572c <_sk_srcover_bgra_8888_sse2_lowp+0x424>
+ .byte 196,98,125,24,13,152,223,1,0 // vbroadcastss 0x1df98(%rip),%ymm9 # 35718 <_sk_srcover_bgra_8888_sse2_lowp+0x410>
.byte 196,65,60,88,193 // vaddps %ymm9,%ymm8,%ymm8
.byte 197,124,17,128,64,1,0,0 // vmovups %ymm8,0x140(%rax)
.byte 72,173 // lods %ds:(%rsi),%rax
@@ -32359,13 +32336,13 @@ HIDDEN _sk_bicubic_p3y_avx
FUNCTION(_sk_bicubic_p3y_avx)
_sk_bicubic_p3y_avx:
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 196,226,125,24,13,47,223,1,0 // vbroadcastss 0x1df2f(%rip),%ymm1 # 35728 <_sk_srcover_bgra_8888_sse2_lowp+0x420>
+ .byte 196,226,125,24,13,120,223,1,0 // vbroadcastss 0x1df78(%rip),%ymm1 # 35714 <_sk_srcover_bgra_8888_sse2_lowp+0x40c>
.byte 197,244,88,72,64 // vaddps 0x40(%rax),%ymm1,%ymm1
.byte 197,124,16,128,192,0,0,0 // vmovups 0xc0(%rax),%ymm8
.byte 196,65,60,89,200 // vmulps %ymm8,%ymm8,%ymm9
- .byte 196,98,125,24,21,12,223,1,0 // vbroadcastss 0x1df0c(%rip),%ymm10 # 35720 <_sk_srcover_bgra_8888_sse2_lowp+0x418>
+ .byte 196,98,125,24,21,85,223,1,0 // vbroadcastss 0x1df55(%rip),%ymm10 # 3570c <_sk_srcover_bgra_8888_sse2_lowp+0x404>
.byte 196,65,60,89,194 // vmulps %ymm10,%ymm8,%ymm8
- .byte 196,98,125,24,21,10,222,1,0 // vbroadcastss 0x1de0a(%rip),%ymm10 # 3562c <_sk_srcover_bgra_8888_sse2_lowp+0x324>
+ .byte 196,98,125,24,21,103,222,1,0 // vbroadcastss 0x1de67(%rip),%ymm10 # 3562c <_sk_srcover_bgra_8888_sse2_lowp+0x324>
.byte 196,65,60,88,194 // vaddps %ymm10,%ymm8,%ymm8
.byte 196,65,52,89,192 // vmulps %ymm8,%ymm9,%ymm8
.byte 197,124,17,128,64,1,0,0 // vmovups %ymm8,0x140(%rax)
@@ -32513,7 +32490,7 @@ _sk_clut_3D_avx:
.byte 72,139,0 // mov (%rax),%rax
.byte 197,217,254,207 // vpaddd %xmm7,%xmm4,%xmm1
.byte 197,249,254,193 // vpaddd %xmm1,%xmm0,%xmm0
- .byte 196,226,121,24,37,164,220,1,0 // vbroadcastss 0x1dca4(%rip),%xmm4 # 35734 <_sk_srcover_bgra_8888_sse2_lowp+0x42c>
+ .byte 196,226,121,24,37,237,220,1,0 // vbroadcastss 0x1dced(%rip),%xmm4 # 35720 <_sk_srcover_bgra_8888_sse2_lowp+0x418>
.byte 196,98,121,64,228 // vpmulld %xmm4,%xmm0,%xmm12
.byte 196,226,49,64,198 // vpmulld %xmm6,%xmm9,%xmm0
.byte 197,249,127,132,36,128,0,0,0 // vmovdqa %xmm0,0x80(%rsp)
@@ -32567,7 +32544,7 @@ _sk_clut_3D_avx:
.byte 196,161,122,16,60,128 // vmovss (%rax,%r8,4),%xmm7
.byte 196,227,73,33,247,48 // vinsertps $0x30,%xmm7,%xmm6,%xmm6
.byte 196,227,77,24,237,1 // vinsertf128 $0x1,%xmm5,%ymm6,%ymm5
- .byte 196,98,121,24,21,9,218,1,0 // vbroadcastss 0x1da09(%rip),%xmm10 # 355c4 <_sk_srcover_bgra_8888_sse2_lowp+0x2bc>
+ .byte 196,98,121,24,21,102,218,1,0 // vbroadcastss 0x1da66(%rip),%xmm10 # 355c4 <_sk_srcover_bgra_8888_sse2_lowp+0x2bc>
.byte 196,193,105,254,210 // vpaddd %xmm10,%xmm2,%xmm2
.byte 196,195,249,22,208,1 // vpextrq $0x1,%xmm2,%r8
.byte 196,193,249,126,209 // vmovq %xmm2,%r9
@@ -32595,7 +32572,7 @@ _sk_clut_3D_avx:
.byte 196,161,122,16,60,128 // vmovss (%rax,%r8,4),%xmm7
.byte 196,227,73,33,247,48 // vinsertps $0x30,%xmm7,%xmm6,%xmm6
.byte 196,227,77,24,210,1 // vinsertf128 $0x1,%xmm2,%ymm6,%ymm2
- .byte 196,226,125,24,61,225,218,1,0 // vbroadcastss 0x1dae1(%rip),%ymm7 # 35730 <_sk_srcover_bgra_8888_sse2_lowp+0x428>
+ .byte 196,226,125,24,61,42,219,1,0 // vbroadcastss 0x1db2a(%rip),%ymm7 # 3571c <_sk_srcover_bgra_8888_sse2_lowp+0x414>
.byte 197,148,88,247 // vaddps %ymm7,%ymm13,%ymm6
.byte 197,124,40,231 // vmovaps %ymm7,%ymm12
.byte 197,124,17,36,36 // vmovups %ymm12,(%rsp)
@@ -33338,7 +33315,7 @@ _sk_clut_4D_avx:
.byte 197,249,127,68,36,32 // vmovdqa %xmm0,0x20(%rsp)
.byte 197,225,254,216 // vpaddd %xmm0,%xmm3,%xmm3
.byte 197,233,254,195 // vpaddd %xmm3,%xmm2,%xmm0
- .byte 196,98,121,24,13,165,203,1,0 // vbroadcastss 0x1cba5(%rip),%xmm9 # 35734 <_sk_srcover_bgra_8888_sse2_lowp+0x42c>
+ .byte 196,98,121,24,13,238,203,1,0 // vbroadcastss 0x1cbee(%rip),%xmm9 # 35720 <_sk_srcover_bgra_8888_sse2_lowp+0x418>
.byte 196,194,121,64,209 // vpmulld %xmm9,%xmm0,%xmm2
.byte 196,226,81,64,199 // vpmulld %xmm7,%xmm5,%xmm0
.byte 197,249,127,132,36,96,1,0,0 // vmovdqa %xmm0,0x160(%rsp)
@@ -33395,7 +33372,7 @@ _sk_clut_4D_avx:
.byte 196,161,122,16,60,128 // vmovss (%rax,%r8,4),%xmm7
.byte 196,227,73,33,247,48 // vinsertps $0x30,%xmm7,%xmm6,%xmm6
.byte 196,227,77,24,237,1 // vinsertf128 $0x1,%xmm5,%ymm6,%ymm5
- .byte 196,98,121,24,21,250,200,1,0 // vbroadcastss 0x1c8fa(%rip),%xmm10 # 355c4 <_sk_srcover_bgra_8888_sse2_lowp+0x2bc>
+ .byte 196,98,121,24,21,87,201,1,0 // vbroadcastss 0x1c957(%rip),%xmm10 # 355c4 <_sk_srcover_bgra_8888_sse2_lowp+0x2bc>
.byte 196,193,121,254,194 // vpaddd %xmm10,%xmm0,%xmm0
.byte 196,195,249,22,192,1 // vpextrq $0x1,%xmm0,%r8
.byte 196,193,249,126,193 // vmovq %xmm0,%r9
@@ -33423,7 +33400,7 @@ _sk_clut_4D_avx:
.byte 196,161,122,16,52,128 // vmovss (%rax,%r8,4),%xmm6
.byte 196,227,105,33,214,48 // vinsertps $0x30,%xmm6,%xmm2,%xmm2
.byte 196,227,109,24,208,1 // vinsertf128 $0x1,%xmm0,%ymm2,%ymm2
- .byte 196,98,125,24,37,210,201,1,0 // vbroadcastss 0x1c9d2(%rip),%ymm12 # 35730 <_sk_srcover_bgra_8888_sse2_lowp+0x428>
+ .byte 196,98,125,24,37,27,202,1,0 // vbroadcastss 0x1ca1b(%rip),%ymm12 # 3571c <_sk_srcover_bgra_8888_sse2_lowp+0x414>
.byte 196,193,4,88,196 // vaddps %ymm12,%ymm15,%ymm0
.byte 197,124,17,36,36 // vmovups %ymm12,(%rsp)
.byte 197,254,91,192 // vcvttps2dq %ymm0,%ymm0
@@ -34821,7 +34798,7 @@ _sk_clut_4D_avx:
.byte 197,228,89,210 // vmulps %ymm2,%ymm3,%ymm2
.byte 197,220,88,210 // vaddps %ymm2,%ymm4,%ymm2
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 196,226,125,24,29,27,171,1,0 // vbroadcastss 0x1ab1b(%rip),%ymm3 # 355b8 <_sk_srcover_bgra_8888_sse2_lowp+0x2b0>
+ .byte 196,226,125,24,29,120,171,1,0 // vbroadcastss 0x1ab78(%rip),%ymm3 # 355b8 <_sk_srcover_bgra_8888_sse2_lowp+0x2b0>
.byte 197,252,16,164,36,64,2,0,0 // vmovups 0x240(%rsp),%ymm4
.byte 197,252,16,172,36,96,2,0,0 // vmovups 0x260(%rsp),%ymm5
.byte 197,252,16,180,36,128,2,0,0 // vmovups 0x280(%rsp),%ymm6
@@ -34833,6 +34810,29 @@ _sk_clut_4D_avx:
.byte 65,95 // pop %r15
.byte 255,224 // jmpq *%rax
+HIDDEN _sk_gauss_a_to_rgba_avx
+.globl _sk_gauss_a_to_rgba_avx
+FUNCTION(_sk_gauss_a_to_rgba_avx)
+_sk_gauss_a_to_rgba_avx:
+ .byte 196,226,125,24,5,167,172,1,0 // vbroadcastss 0x1aca7(%rip),%ymm0 # 35724 <_sk_srcover_bgra_8888_sse2_lowp+0x41c>
+ .byte 197,228,89,192 // vmulps %ymm0,%ymm3,%ymm0
+ .byte 196,226,125,24,13,158,172,1,0 // vbroadcastss 0x1ac9e(%rip),%ymm1 # 35728 <_sk_srcover_bgra_8888_sse2_lowp+0x420>
+ .byte 197,252,88,193 // vaddps %ymm1,%ymm0,%ymm0
+ .byte 197,252,89,195 // vmulps %ymm3,%ymm0,%ymm0
+ .byte 196,226,125,24,13,145,172,1,0 // vbroadcastss 0x1ac91(%rip),%ymm1 # 3572c <_sk_srcover_bgra_8888_sse2_lowp+0x424>
+ .byte 197,252,88,193 // vaddps %ymm1,%ymm0,%ymm0
+ .byte 197,252,89,195 // vmulps %ymm3,%ymm0,%ymm0
+ .byte 196,226,125,24,13,132,172,1,0 // vbroadcastss 0x1ac84(%rip),%ymm1 # 35730 <_sk_srcover_bgra_8888_sse2_lowp+0x428>
+ .byte 197,252,88,193 // vaddps %ymm1,%ymm0,%ymm0
+ .byte 197,252,89,195 // vmulps %ymm3,%ymm0,%ymm0
+ .byte 196,226,125,24,13,119,172,1,0 // vbroadcastss 0x1ac77(%rip),%ymm1 # 35734 <_sk_srcover_bgra_8888_sse2_lowp+0x42c>
+ .byte 197,252,88,193 // vaddps %ymm1,%ymm0,%ymm0
+ .byte 72,173 // lods %ds:(%rsi),%rax
+ .byte 197,252,40,200 // vmovaps %ymm0,%ymm1
+ .byte 197,252,40,208 // vmovaps %ymm0,%ymm2
+ .byte 197,252,40,216 // vmovaps %ymm0,%ymm3
+ .byte 255,224 // jmpq *%rax
+
HIDDEN _sk_start_pipeline_sse41
.globl _sk_start_pipeline_sse41
FUNCTION(_sk_start_pipeline_sse41)
@@ -40824,25 +40824,6 @@ _sk_evenly_spaced_gradient_sse41:
.byte 65,94 // pop %r14
.byte 255,224 // jmpq *%rax
-HIDDEN _sk_gauss_a_to_rgba_sse41
-.globl _sk_gauss_a_to_rgba_sse41
-FUNCTION(_sk_gauss_a_to_rgba_sse41)
-_sk_gauss_a_to_rgba_sse41:
- .byte 15,40,5,0,95,1,0 // movaps 0x15f00(%rip),%xmm0 # 363e0 <_sk_srcover_bgra_8888_sse2_lowp+0x10d8>
- .byte 15,89,195 // mulps %xmm3,%xmm0
- .byte 15,88,5,6,95,1,0 // addps 0x15f06(%rip),%xmm0 # 363f0 <_sk_srcover_bgra_8888_sse2_lowp+0x10e8>
- .byte 15,89,195 // mulps %xmm3,%xmm0
- .byte 15,88,5,12,95,1,0 // addps 0x15f0c(%rip),%xmm0 # 36400 <_sk_srcover_bgra_8888_sse2_lowp+0x10f8>
- .byte 15,89,195 // mulps %xmm3,%xmm0
- .byte 15,88,5,18,95,1,0 // addps 0x15f12(%rip),%xmm0 # 36410 <_sk_srcover_bgra_8888_sse2_lowp+0x1108>
- .byte 15,89,195 // mulps %xmm3,%xmm0
- .byte 15,88,5,24,95,1,0 // addps 0x15f18(%rip),%xmm0 # 36420 <_sk_srcover_bgra_8888_sse2_lowp+0x1118>
- .byte 72,173 // lods %ds:(%rsi),%rax
- .byte 15,40,200 // movaps %xmm0,%xmm1
- .byte 15,40,208 // movaps %xmm0,%xmm2
- .byte 15,40,216 // movaps %xmm0,%xmm3
- .byte 255,224 // jmpq *%rax
-
HIDDEN _sk_gradient_sse41
.globl _sk_gradient_sse41
FUNCTION(_sk_gradient_sse41)
@@ -40851,7 +40832,7 @@ _sk_gradient_sse41:
.byte 76,139,0 // mov (%rax),%r8
.byte 102,15,239,201 // pxor %xmm1,%xmm1
.byte 73,131,248,2 // cmp $0x2,%r8
- .byte 114,41 // jb 2054d <_sk_gradient_sse41+0x38>
+ .byte 114,41 // jb 20511 <_sk_gradient_sse41+0x38>
.byte 76,139,72,72 // mov 0x48(%rax),%r9
.byte 73,255,200 // dec %r8
.byte 73,131,193,4 // add $0x4,%r9
@@ -40862,7 +40843,7 @@ _sk_gradient_sse41:
.byte 102,15,250,202 // psubd %xmm2,%xmm1
.byte 73,131,193,4 // add $0x4,%r9
.byte 73,255,200 // dec %r8
- .byte 117,230 // jne 20533 <_sk_gradient_sse41+0x1e>
+ .byte 117,230 // jne 204f7 <_sk_gradient_sse41+0x1e>
.byte 65,86 // push %r14
.byte 83 // push %rbx
.byte 102,73,15,58,22,200,1 // pextrq $0x1,%xmm1,%r8
@@ -40993,26 +40974,26 @@ _sk_xy_to_unit_angle_sse41:
.byte 69,15,94,226 // divps %xmm10,%xmm12
.byte 69,15,40,236 // movaps %xmm12,%xmm13
.byte 69,15,89,237 // mulps %xmm13,%xmm13
- .byte 68,15,40,21,143,92,1,0 // movaps 0x15c8f(%rip),%xmm10 # 36430 <_sk_srcover_bgra_8888_sse2_lowp+0x1128>
+ .byte 68,15,40,21,123,92,1,0 // movaps 0x15c7b(%rip),%xmm10 # 363e0 <_sk_srcover_bgra_8888_sse2_lowp+0x10d8>
.byte 69,15,89,213 // mulps %xmm13,%xmm10
- .byte 68,15,88,21,147,92,1,0 // addps 0x15c93(%rip),%xmm10 # 36440 <_sk_srcover_bgra_8888_sse2_lowp+0x1138>
+ .byte 68,15,88,21,127,92,1,0 // addps 0x15c7f(%rip),%xmm10 # 363f0 <_sk_srcover_bgra_8888_sse2_lowp+0x10e8>
.byte 69,15,89,213 // mulps %xmm13,%xmm10
- .byte 68,15,88,21,151,92,1,0 // addps 0x15c97(%rip),%xmm10 # 36450 <_sk_srcover_bgra_8888_sse2_lowp+0x1148>
+ .byte 68,15,88,21,131,92,1,0 // addps 0x15c83(%rip),%xmm10 # 36400 <_sk_srcover_bgra_8888_sse2_lowp+0x10f8>
.byte 69,15,89,213 // mulps %xmm13,%xmm10
- .byte 68,15,88,21,155,92,1,0 // addps 0x15c9b(%rip),%xmm10 # 36460 <_sk_srcover_bgra_8888_sse2_lowp+0x1158>
+ .byte 68,15,88,21,135,92,1,0 // addps 0x15c87(%rip),%xmm10 # 36410 <_sk_srcover_bgra_8888_sse2_lowp+0x1108>
.byte 69,15,89,212 // mulps %xmm12,%xmm10
.byte 65,15,194,195,1 // cmpltps %xmm11,%xmm0
- .byte 68,15,40,29,154,92,1,0 // movaps 0x15c9a(%rip),%xmm11 # 36470 <_sk_srcover_bgra_8888_sse2_lowp+0x1168>
+ .byte 68,15,40,29,134,92,1,0 // movaps 0x15c86(%rip),%xmm11 # 36420 <_sk_srcover_bgra_8888_sse2_lowp+0x1118>
.byte 69,15,92,218 // subps %xmm10,%xmm11
.byte 102,69,15,56,20,211 // blendvps %xmm0,%xmm11,%xmm10
.byte 69,15,194,200,1 // cmpltps %xmm8,%xmm9
- .byte 68,15,40,29,83,86,1,0 // movaps 0x15653(%rip),%xmm11 # 35e40 <_sk_srcover_bgra_8888_sse2_lowp+0xb38>
+ .byte 68,15,40,29,143,86,1,0 // movaps 0x1568f(%rip),%xmm11 # 35e40 <_sk_srcover_bgra_8888_sse2_lowp+0xb38>
.byte 69,15,92,218 // subps %xmm10,%xmm11
.byte 65,15,40,193 // movaps %xmm9,%xmm0
.byte 102,69,15,56,20,211 // blendvps %xmm0,%xmm11,%xmm10
.byte 15,40,193 // movaps %xmm1,%xmm0
.byte 65,15,194,192,1 // cmpltps %xmm8,%xmm0
- .byte 68,15,40,13,69,86,1,0 // movaps 0x15645(%rip),%xmm9 # 35e50 <_sk_srcover_bgra_8888_sse2_lowp+0xb48>
+ .byte 68,15,40,13,129,86,1,0 // movaps 0x15681(%rip),%xmm9 # 35e50 <_sk_srcover_bgra_8888_sse2_lowp+0xb48>
.byte 69,15,92,202 // subps %xmm10,%xmm9
.byte 102,69,15,56,20,209 // blendvps %xmm0,%xmm9,%xmm10
.byte 69,15,194,194,7 // cmpordps %xmm10,%xmm8
@@ -41046,7 +41027,7 @@ _sk_xy_to_2pt_conical_quadratic_max_sse41:
.byte 243,69,15,89,203 // mulss %xmm11,%xmm9
.byte 69,15,198,201,0 // shufps $0x0,%xmm9,%xmm9
.byte 68,15,88,200 // addps %xmm0,%xmm9
- .byte 68,15,89,13,14,92,1,0 // mulps 0x15c0e(%rip),%xmm9 # 36480 <_sk_srcover_bgra_8888_sse2_lowp+0x1178>
+ .byte 68,15,89,13,250,91,1,0 // mulps 0x15bfa(%rip),%xmm9 # 36430 <_sk_srcover_bgra_8888_sse2_lowp+0x1128>
.byte 15,89,192 // mulps %xmm0,%xmm0
.byte 68,15,40,225 // movaps %xmm1,%xmm12
.byte 69,15,89,228 // mulps %xmm12,%xmm12
@@ -41054,7 +41035,7 @@ _sk_xy_to_2pt_conical_quadratic_max_sse41:
.byte 243,69,15,89,219 // mulss %xmm11,%xmm11
.byte 69,15,198,219,0 // shufps $0x0,%xmm11,%xmm11
.byte 69,15,92,227 // subps %xmm11,%xmm12
- .byte 68,15,89,21,249,91,1,0 // mulps 0x15bf9(%rip),%xmm10 # 36490 <_sk_srcover_bgra_8888_sse2_lowp+0x1188>
+ .byte 68,15,89,21,229,91,1,0 // mulps 0x15be5(%rip),%xmm10 # 36440 <_sk_srcover_bgra_8888_sse2_lowp+0x1138>
.byte 69,15,89,212 // mulps %xmm12,%xmm10
.byte 65,15,40,193 // movaps %xmm9,%xmm0
.byte 15,89,192 // mulps %xmm0,%xmm0
@@ -41063,8 +41044,8 @@ _sk_xy_to_2pt_conical_quadratic_max_sse41:
.byte 69,15,198,192,0 // shufps $0x0,%xmm8,%xmm8
.byte 65,15,40,194 // movaps %xmm10,%xmm0
.byte 65,15,92,193 // subps %xmm9,%xmm0
- .byte 68,15,87,13,161,90,1,0 // xorps 0x15aa1(%rip),%xmm9 # 36360 <_sk_srcover_bgra_8888_sse2_lowp+0x1058>
- .byte 68,15,89,5,121,85,1,0 // mulps 0x15579(%rip),%xmm8 # 35e40 <_sk_srcover_bgra_8888_sse2_lowp+0xb38>
+ .byte 68,15,87,13,221,90,1,0 // xorps 0x15add(%rip),%xmm9 # 36360 <_sk_srcover_bgra_8888_sse2_lowp+0x1058>
+ .byte 68,15,89,5,181,85,1,0 // mulps 0x155b5(%rip),%xmm8 # 35e40 <_sk_srcover_bgra_8888_sse2_lowp+0xb38>
.byte 65,15,89,192 // mulps %xmm8,%xmm0
.byte 69,15,92,202 // subps %xmm10,%xmm9
.byte 69,15,89,200 // mulps %xmm8,%xmm9
@@ -41085,7 +41066,7 @@ _sk_xy_to_2pt_conical_quadratic_min_sse41:
.byte 243,69,15,89,203 // mulss %xmm11,%xmm9
.byte 69,15,198,201,0 // shufps $0x0,%xmm9,%xmm9
.byte 68,15,88,200 // addps %xmm0,%xmm9
- .byte 68,15,89,13,112,91,1,0 // mulps 0x15b70(%rip),%xmm9 # 36480 <_sk_srcover_bgra_8888_sse2_lowp+0x1178>
+ .byte 68,15,89,13,92,91,1,0 // mulps 0x15b5c(%rip),%xmm9 # 36430 <_sk_srcover_bgra_8888_sse2_lowp+0x1128>
.byte 15,89,192 // mulps %xmm0,%xmm0
.byte 68,15,40,225 // movaps %xmm1,%xmm12
.byte 69,15,89,228 // mulps %xmm12,%xmm12
@@ -41093,7 +41074,7 @@ _sk_xy_to_2pt_conical_quadratic_min_sse41:
.byte 243,69,15,89,219 // mulss %xmm11,%xmm11
.byte 69,15,198,219,0 // shufps $0x0,%xmm11,%xmm11
.byte 69,15,92,227 // subps %xmm11,%xmm12
- .byte 68,15,89,21,91,91,1,0 // mulps 0x15b5b(%rip),%xmm10 # 36490 <_sk_srcover_bgra_8888_sse2_lowp+0x1188>
+ .byte 68,15,89,21,71,91,1,0 // mulps 0x15b47(%rip),%xmm10 # 36440 <_sk_srcover_bgra_8888_sse2_lowp+0x1138>
.byte 69,15,89,212 // mulps %xmm12,%xmm10
.byte 65,15,40,193 // movaps %xmm9,%xmm0
.byte 15,89,192 // mulps %xmm0,%xmm0
@@ -41102,8 +41083,8 @@ _sk_xy_to_2pt_conical_quadratic_min_sse41:
.byte 69,15,198,192,0 // shufps $0x0,%xmm8,%xmm8
.byte 65,15,40,194 // movaps %xmm10,%xmm0
.byte 65,15,92,193 // subps %xmm9,%xmm0
- .byte 68,15,87,13,3,90,1,0 // xorps 0x15a03(%rip),%xmm9 # 36360 <_sk_srcover_bgra_8888_sse2_lowp+0x1058>
- .byte 68,15,89,5,219,84,1,0 // mulps 0x154db(%rip),%xmm8 # 35e40 <_sk_srcover_bgra_8888_sse2_lowp+0xb38>
+ .byte 68,15,87,13,63,90,1,0 // xorps 0x15a3f(%rip),%xmm9 # 36360 <_sk_srcover_bgra_8888_sse2_lowp+0x1058>
+ .byte 68,15,89,5,23,85,1,0 // mulps 0x15517(%rip),%xmm8 # 35e40 <_sk_srcover_bgra_8888_sse2_lowp+0xb38>
.byte 65,15,89,192 // mulps %xmm8,%xmm0
.byte 69,15,92,202 // subps %xmm10,%xmm9
.byte 69,15,89,200 // mulps %xmm8,%xmm9
@@ -41121,7 +41102,7 @@ _sk_xy_to_2pt_conical_linear_sse41:
.byte 243,69,15,89,200 // mulss %xmm8,%xmm9
.byte 69,15,198,201,0 // shufps $0x0,%xmm9,%xmm9
.byte 68,15,88,200 // addps %xmm0,%xmm9
- .byte 68,15,89,13,227,90,1,0 // mulps 0x15ae3(%rip),%xmm9 # 36480 <_sk_srcover_bgra_8888_sse2_lowp+0x1178>
+ .byte 68,15,89,13,207,90,1,0 // mulps 0x15acf(%rip),%xmm9 # 36430 <_sk_srcover_bgra_8888_sse2_lowp+0x1128>
.byte 15,89,192 // mulps %xmm0,%xmm0
.byte 68,15,40,209 // movaps %xmm1,%xmm10
.byte 69,15,89,210 // mulps %xmm10,%xmm10
@@ -41129,7 +41110,7 @@ _sk_xy_to_2pt_conical_linear_sse41:
.byte 243,69,15,89,192 // mulss %xmm8,%xmm8
.byte 69,15,198,192,0 // shufps $0x0,%xmm8,%xmm8
.byte 65,15,92,192 // subps %xmm8,%xmm0
- .byte 15,87,5,159,89,1,0 // xorps 0x1599f(%rip),%xmm0 # 36360 <_sk_srcover_bgra_8888_sse2_lowp+0x1058>
+ .byte 15,87,5,219,89,1,0 // xorps 0x159db(%rip),%xmm0 # 36360 <_sk_srcover_bgra_8888_sse2_lowp+0x1058>
.byte 65,15,94,193 // divps %xmm9,%xmm0
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 255,224 // jmpq *%rax
@@ -41177,7 +41158,7 @@ HIDDEN _sk_save_xy_sse41
FUNCTION(_sk_save_xy_sse41)
_sk_save_xy_sse41:
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 68,15,40,5,254,83,1,0 // movaps 0x153fe(%rip),%xmm8 # 35e40 <_sk_srcover_bgra_8888_sse2_lowp+0xb38>
+ .byte 68,15,40,5,58,84,1,0 // movaps 0x1543a(%rip),%xmm8 # 35e40 <_sk_srcover_bgra_8888_sse2_lowp+0xb38>
.byte 15,17,0 // movups %xmm0,(%rax)
.byte 68,15,40,200 // movaps %xmm0,%xmm9
.byte 69,15,88,200 // addps %xmm8,%xmm9
@@ -41221,8 +41202,8 @@ _sk_bilinear_nx_sse41:
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 15,16,0 // movups (%rax),%xmm0
.byte 68,15,16,128,128,0,0,0 // movups 0x80(%rax),%xmm8
- .byte 15,88,5,199,89,1,0 // addps 0x159c7(%rip),%xmm0 # 364a0 <_sk_srcover_bgra_8888_sse2_lowp+0x1198>
- .byte 68,15,40,13,111,83,1,0 // movaps 0x1536f(%rip),%xmm9 # 35e50 <_sk_srcover_bgra_8888_sse2_lowp+0xb48>
+ .byte 15,88,5,179,89,1,0 // addps 0x159b3(%rip),%xmm0 # 36450 <_sk_srcover_bgra_8888_sse2_lowp+0x1148>
+ .byte 68,15,40,13,171,83,1,0 // movaps 0x153ab(%rip),%xmm9 # 35e50 <_sk_srcover_bgra_8888_sse2_lowp+0xb48>
.byte 69,15,92,200 // subps %xmm8,%xmm9
.byte 68,15,17,136,0,1,0,0 // movups %xmm9,0x100(%rax)
.byte 72,173 // lods %ds:(%rsi),%rax
@@ -41235,7 +41216,7 @@ _sk_bilinear_px_sse41:
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 15,16,0 // movups (%rax),%xmm0
.byte 68,15,16,128,128,0,0,0 // movups 0x80(%rax),%xmm8
- .byte 15,88,5,59,83,1,0 // addps 0x1533b(%rip),%xmm0 # 35e40 <_sk_srcover_bgra_8888_sse2_lowp+0xb38>
+ .byte 15,88,5,119,83,1,0 // addps 0x15377(%rip),%xmm0 # 35e40 <_sk_srcover_bgra_8888_sse2_lowp+0xb38>
.byte 68,15,17,128,0,1,0,0 // movups %xmm8,0x100(%rax)
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 255,224 // jmpq *%rax
@@ -41247,8 +41228,8 @@ _sk_bilinear_ny_sse41:
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 15,16,72,64 // movups 0x40(%rax),%xmm1
.byte 68,15,16,128,192,0,0,0 // movups 0xc0(%rax),%xmm8
- .byte 15,88,13,122,89,1,0 // addps 0x1597a(%rip),%xmm1 # 364a0 <_sk_srcover_bgra_8888_sse2_lowp+0x1198>
- .byte 68,15,40,13,34,83,1,0 // movaps 0x15322(%rip),%xmm9 # 35e50 <_sk_srcover_bgra_8888_sse2_lowp+0xb48>
+ .byte 15,88,13,102,89,1,0 // addps 0x15966(%rip),%xmm1 # 36450 <_sk_srcover_bgra_8888_sse2_lowp+0x1148>
+ .byte 68,15,40,13,94,83,1,0 // movaps 0x1535e(%rip),%xmm9 # 35e50 <_sk_srcover_bgra_8888_sse2_lowp+0xb48>
.byte 69,15,92,200 // subps %xmm8,%xmm9
.byte 68,15,17,136,64,1,0,0 // movups %xmm9,0x140(%rax)
.byte 72,173 // lods %ds:(%rsi),%rax
@@ -41261,7 +41242,7 @@ _sk_bilinear_py_sse41:
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 15,16,72,64 // movups 0x40(%rax),%xmm1
.byte 68,15,16,128,192,0,0,0 // movups 0xc0(%rax),%xmm8
- .byte 15,88,13,237,82,1,0 // addps 0x152ed(%rip),%xmm1 # 35e40 <_sk_srcover_bgra_8888_sse2_lowp+0xb38>
+ .byte 15,88,13,41,83,1,0 // addps 0x15329(%rip),%xmm1 # 35e40 <_sk_srcover_bgra_8888_sse2_lowp+0xb38>
.byte 68,15,17,128,64,1,0,0 // movups %xmm8,0x140(%rax)
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 255,224 // jmpq *%rax
@@ -41273,13 +41254,13 @@ _sk_bicubic_n3x_sse41:
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 15,16,0 // movups (%rax),%xmm0
.byte 68,15,16,128,128,0,0,0 // movups 0x80(%rax),%xmm8
- .byte 15,88,5,61,89,1,0 // addps 0x1593d(%rip),%xmm0 # 364b0 <_sk_srcover_bgra_8888_sse2_lowp+0x11a8>
- .byte 68,15,40,13,213,82,1,0 // movaps 0x152d5(%rip),%xmm9 # 35e50 <_sk_srcover_bgra_8888_sse2_lowp+0xb48>
+ .byte 15,88,5,41,89,1,0 // addps 0x15929(%rip),%xmm0 # 36460 <_sk_srcover_bgra_8888_sse2_lowp+0x1158>
+ .byte 68,15,40,13,17,83,1,0 // movaps 0x15311(%rip),%xmm9 # 35e50 <_sk_srcover_bgra_8888_sse2_lowp+0xb48>
.byte 69,15,92,200 // subps %xmm8,%xmm9
.byte 69,15,40,193 // movaps %xmm9,%xmm8
.byte 69,15,89,192 // mulps %xmm8,%xmm8
- .byte 68,15,89,13,49,89,1,0 // mulps 0x15931(%rip),%xmm9 # 364c0 <_sk_srcover_bgra_8888_sse2_lowp+0x11b8>
- .byte 68,15,88,13,185,84,1,0 // addps 0x154b9(%rip),%xmm9 # 36050 <_sk_srcover_bgra_8888_sse2_lowp+0xd48>
+ .byte 68,15,89,13,29,89,1,0 // mulps 0x1591d(%rip),%xmm9 # 36470 <_sk_srcover_bgra_8888_sse2_lowp+0x1168>
+ .byte 68,15,88,13,245,84,1,0 // addps 0x154f5(%rip),%xmm9 # 36050 <_sk_srcover_bgra_8888_sse2_lowp+0xd48>
.byte 69,15,89,200 // mulps %xmm8,%xmm9
.byte 68,15,17,136,0,1,0,0 // movups %xmm9,0x100(%rax)
.byte 72,173 // lods %ds:(%rsi),%rax
@@ -41292,16 +41273,16 @@ _sk_bicubic_n1x_sse41:
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 15,16,0 // movups (%rax),%xmm0
.byte 68,15,16,128,128,0,0,0 // movups 0x80(%rax),%xmm8
- .byte 15,88,5,229,88,1,0 // addps 0x158e5(%rip),%xmm0 # 364a0 <_sk_srcover_bgra_8888_sse2_lowp+0x1198>
- .byte 68,15,40,13,141,82,1,0 // movaps 0x1528d(%rip),%xmm9 # 35e50 <_sk_srcover_bgra_8888_sse2_lowp+0xb48>
+ .byte 15,88,5,209,88,1,0 // addps 0x158d1(%rip),%xmm0 # 36450 <_sk_srcover_bgra_8888_sse2_lowp+0x1148>
+ .byte 68,15,40,13,201,82,1,0 // movaps 0x152c9(%rip),%xmm9 # 35e50 <_sk_srcover_bgra_8888_sse2_lowp+0xb48>
.byte 69,15,92,200 // subps %xmm8,%xmm9
- .byte 68,15,40,5,1,89,1,0 // movaps 0x15901(%rip),%xmm8 # 364d0 <_sk_srcover_bgra_8888_sse2_lowp+0x11c8>
+ .byte 68,15,40,5,237,88,1,0 // movaps 0x158ed(%rip),%xmm8 # 36480 <_sk_srcover_bgra_8888_sse2_lowp+0x1178>
.byte 69,15,89,193 // mulps %xmm9,%xmm8
- .byte 68,15,88,5,5,89,1,0 // addps 0x15905(%rip),%xmm8 # 364e0 <_sk_srcover_bgra_8888_sse2_lowp+0x11d8>
+ .byte 68,15,88,5,241,88,1,0 // addps 0x158f1(%rip),%xmm8 # 36490 <_sk_srcover_bgra_8888_sse2_lowp+0x1188>
.byte 69,15,89,193 // mulps %xmm9,%xmm8
- .byte 68,15,88,5,89,82,1,0 // addps 0x15259(%rip),%xmm8 # 35e40 <_sk_srcover_bgra_8888_sse2_lowp+0xb38>
+ .byte 68,15,88,5,149,82,1,0 // addps 0x15295(%rip),%xmm8 # 35e40 <_sk_srcover_bgra_8888_sse2_lowp+0xb38>
.byte 69,15,89,193 // mulps %xmm9,%xmm8
- .byte 68,15,88,5,253,88,1,0 // addps 0x158fd(%rip),%xmm8 # 364f0 <_sk_srcover_bgra_8888_sse2_lowp+0x11e8>
+ .byte 68,15,88,5,233,88,1,0 // addps 0x158e9(%rip),%xmm8 # 364a0 <_sk_srcover_bgra_8888_sse2_lowp+0x1198>
.byte 68,15,17,128,0,1,0,0 // movups %xmm8,0x100(%rax)
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 255,224 // jmpq *%rax
@@ -41311,17 +41292,17 @@ HIDDEN _sk_bicubic_p1x_sse41
FUNCTION(_sk_bicubic_p1x_sse41)
_sk_bicubic_p1x_sse41:
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 68,15,40,5,55,82,1,0 // movaps 0x15237(%rip),%xmm8 # 35e40 <_sk_srcover_bgra_8888_sse2_lowp+0xb38>
+ .byte 68,15,40,5,115,82,1,0 // movaps 0x15273(%rip),%xmm8 # 35e40 <_sk_srcover_bgra_8888_sse2_lowp+0xb38>
.byte 15,16,0 // movups (%rax),%xmm0
.byte 68,15,16,136,128,0,0,0 // movups 0x80(%rax),%xmm9
.byte 65,15,88,192 // addps %xmm8,%xmm0
- .byte 68,15,40,21,176,88,1,0 // movaps 0x158b0(%rip),%xmm10 # 364d0 <_sk_srcover_bgra_8888_sse2_lowp+0x11c8>
+ .byte 68,15,40,21,156,88,1,0 // movaps 0x1589c(%rip),%xmm10 # 36480 <_sk_srcover_bgra_8888_sse2_lowp+0x1178>
.byte 69,15,89,209 // mulps %xmm9,%xmm10
- .byte 68,15,88,21,180,88,1,0 // addps 0x158b4(%rip),%xmm10 # 364e0 <_sk_srcover_bgra_8888_sse2_lowp+0x11d8>
+ .byte 68,15,88,21,160,88,1,0 // addps 0x158a0(%rip),%xmm10 # 36490 <_sk_srcover_bgra_8888_sse2_lowp+0x1188>
.byte 69,15,89,209 // mulps %xmm9,%xmm10
.byte 69,15,88,208 // addps %xmm8,%xmm10
.byte 69,15,89,209 // mulps %xmm9,%xmm10
- .byte 68,15,88,21,176,88,1,0 // addps 0x158b0(%rip),%xmm10 # 364f0 <_sk_srcover_bgra_8888_sse2_lowp+0x11e8>
+ .byte 68,15,88,21,156,88,1,0 // addps 0x1589c(%rip),%xmm10 # 364a0 <_sk_srcover_bgra_8888_sse2_lowp+0x1198>
.byte 68,15,17,144,0,1,0,0 // movups %xmm10,0x100(%rax)
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 255,224 // jmpq *%rax
@@ -41333,11 +41314,11 @@ _sk_bicubic_p3x_sse41:
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 15,16,0 // movups (%rax),%xmm0
.byte 68,15,16,128,128,0,0,0 // movups 0x80(%rax),%xmm8
- .byte 15,88,5,128,88,1,0 // addps 0x15880(%rip),%xmm0 # 364e0 <_sk_srcover_bgra_8888_sse2_lowp+0x11d8>
+ .byte 15,88,5,108,88,1,0 // addps 0x1586c(%rip),%xmm0 # 36490 <_sk_srcover_bgra_8888_sse2_lowp+0x1188>
.byte 69,15,40,200 // movaps %xmm8,%xmm9
.byte 69,15,89,201 // mulps %xmm9,%xmm9
- .byte 68,15,89,5,80,88,1,0 // mulps 0x15850(%rip),%xmm8 # 364c0 <_sk_srcover_bgra_8888_sse2_lowp+0x11b8>
- .byte 68,15,88,5,216,83,1,0 // addps 0x153d8(%rip),%xmm8 # 36050 <_sk_srcover_bgra_8888_sse2_lowp+0xd48>
+ .byte 68,15,89,5,60,88,1,0 // mulps 0x1583c(%rip),%xmm8 # 36470 <_sk_srcover_bgra_8888_sse2_lowp+0x1168>
+ .byte 68,15,88,5,20,84,1,0 // addps 0x15414(%rip),%xmm8 # 36050 <_sk_srcover_bgra_8888_sse2_lowp+0xd48>
.byte 69,15,89,193 // mulps %xmm9,%xmm8
.byte 68,15,17,128,0,1,0,0 // movups %xmm8,0x100(%rax)
.byte 72,173 // lods %ds:(%rsi),%rax
@@ -41350,13 +41331,13 @@ _sk_bicubic_n3y_sse41:
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 15,16,72,64 // movups 0x40(%rax),%xmm1
.byte 68,15,16,128,192,0,0,0 // movups 0xc0(%rax),%xmm8
- .byte 15,88,13,19,88,1,0 // addps 0x15813(%rip),%xmm1 # 364b0 <_sk_srcover_bgra_8888_sse2_lowp+0x11a8>
- .byte 68,15,40,13,171,81,1,0 // movaps 0x151ab(%rip),%xmm9 # 35e50 <_sk_srcover_bgra_8888_sse2_lowp+0xb48>
+ .byte 15,88,13,255,87,1,0 // addps 0x157ff(%rip),%xmm1 # 36460 <_sk_srcover_bgra_8888_sse2_lowp+0x1158>
+ .byte 68,15,40,13,231,81,1,0 // movaps 0x151e7(%rip),%xmm9 # 35e50 <_sk_srcover_bgra_8888_sse2_lowp+0xb48>
.byte 69,15,92,200 // subps %xmm8,%xmm9
.byte 69,15,40,193 // movaps %xmm9,%xmm8
.byte 69,15,89,192 // mulps %xmm8,%xmm8
- .byte 68,15,89,13,7,88,1,0 // mulps 0x15807(%rip),%xmm9 # 364c0 <_sk_srcover_bgra_8888_sse2_lowp+0x11b8>
- .byte 68,15,88,13,143,83,1,0 // addps 0x1538f(%rip),%xmm9 # 36050 <_sk_srcover_bgra_8888_sse2_lowp+0xd48>
+ .byte 68,15,89,13,243,87,1,0 // mulps 0x157f3(%rip),%xmm9 # 36470 <_sk_srcover_bgra_8888_sse2_lowp+0x1168>
+ .byte 68,15,88,13,203,83,1,0 // addps 0x153cb(%rip),%xmm9 # 36050 <_sk_srcover_bgra_8888_sse2_lowp+0xd48>
.byte 69,15,89,200 // mulps %xmm8,%xmm9
.byte 68,15,17,136,64,1,0,0 // movups %xmm9,0x140(%rax)
.byte 72,173 // lods %ds:(%rsi),%rax
@@ -41369,16 +41350,16 @@ _sk_bicubic_n1y_sse41:
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 15,16,72,64 // movups 0x40(%rax),%xmm1
.byte 68,15,16,128,192,0,0,0 // movups 0xc0(%rax),%xmm8
- .byte 15,88,13,186,87,1,0 // addps 0x157ba(%rip),%xmm1 # 364a0 <_sk_srcover_bgra_8888_sse2_lowp+0x1198>
- .byte 68,15,40,13,98,81,1,0 // movaps 0x15162(%rip),%xmm9 # 35e50 <_sk_srcover_bgra_8888_sse2_lowp+0xb48>
+ .byte 15,88,13,166,87,1,0 // addps 0x157a6(%rip),%xmm1 # 36450 <_sk_srcover_bgra_8888_sse2_lowp+0x1148>
+ .byte 68,15,40,13,158,81,1,0 // movaps 0x1519e(%rip),%xmm9 # 35e50 <_sk_srcover_bgra_8888_sse2_lowp+0xb48>
.byte 69,15,92,200 // subps %xmm8,%xmm9
- .byte 68,15,40,5,214,87,1,0 // movaps 0x157d6(%rip),%xmm8 # 364d0 <_sk_srcover_bgra_8888_sse2_lowp+0x11c8>
+ .byte 68,15,40,5,194,87,1,0 // movaps 0x157c2(%rip),%xmm8 # 36480 <_sk_srcover_bgra_8888_sse2_lowp+0x1178>
.byte 69,15,89,193 // mulps %xmm9,%xmm8
- .byte 68,15,88,5,218,87,1,0 // addps 0x157da(%rip),%xmm8 # 364e0 <_sk_srcover_bgra_8888_sse2_lowp+0x11d8>
+ .byte 68,15,88,5,198,87,1,0 // addps 0x157c6(%rip),%xmm8 # 36490 <_sk_srcover_bgra_8888_sse2_lowp+0x1188>
.byte 69,15,89,193 // mulps %xmm9,%xmm8
- .byte 68,15,88,5,46,81,1,0 // addps 0x1512e(%rip),%xmm8 # 35e40 <_sk_srcover_bgra_8888_sse2_lowp+0xb38>
+ .byte 68,15,88,5,106,81,1,0 // addps 0x1516a(%rip),%xmm8 # 35e40 <_sk_srcover_bgra_8888_sse2_lowp+0xb38>
.byte 69,15,89,193 // mulps %xmm9,%xmm8
- .byte 68,15,88,5,210,87,1,0 // addps 0x157d2(%rip),%xmm8 # 364f0 <_sk_srcover_bgra_8888_sse2_lowp+0x11e8>
+ .byte 68,15,88,5,190,87,1,0 // addps 0x157be(%rip),%xmm8 # 364a0 <_sk_srcover_bgra_8888_sse2_lowp+0x1198>
.byte 68,15,17,128,64,1,0,0 // movups %xmm8,0x140(%rax)
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 255,224 // jmpq *%rax
@@ -41388,17 +41369,17 @@ HIDDEN _sk_bicubic_p1y_sse41
FUNCTION(_sk_bicubic_p1y_sse41)
_sk_bicubic_p1y_sse41:
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 68,15,40,5,12,81,1,0 // movaps 0x1510c(%rip),%xmm8 # 35e40 <_sk_srcover_bgra_8888_sse2_lowp+0xb38>
+ .byte 68,15,40,5,72,81,1,0 // movaps 0x15148(%rip),%xmm8 # 35e40 <_sk_srcover_bgra_8888_sse2_lowp+0xb38>
.byte 15,16,72,64 // movups 0x40(%rax),%xmm1
.byte 68,15,16,136,192,0,0,0 // movups 0xc0(%rax),%xmm9
.byte 65,15,88,200 // addps %xmm8,%xmm1
- .byte 68,15,40,21,132,87,1,0 // movaps 0x15784(%rip),%xmm10 # 364d0 <_sk_srcover_bgra_8888_sse2_lowp+0x11c8>
+ .byte 68,15,40,21,112,87,1,0 // movaps 0x15770(%rip),%xmm10 # 36480 <_sk_srcover_bgra_8888_sse2_lowp+0x1178>
.byte 69,15,89,209 // mulps %xmm9,%xmm10
- .byte 68,15,88,21,136,87,1,0 // addps 0x15788(%rip),%xmm10 # 364e0 <_sk_srcover_bgra_8888_sse2_lowp+0x11d8>
+ .byte 68,15,88,21,116,87,1,0 // addps 0x15774(%rip),%xmm10 # 36490 <_sk_srcover_bgra_8888_sse2_lowp+0x1188>
.byte 69,15,89,209 // mulps %xmm9,%xmm10
.byte 69,15,88,208 // addps %xmm8,%xmm10
.byte 69,15,89,209 // mulps %xmm9,%xmm10
- .byte 68,15,88,21,132,87,1,0 // addps 0x15784(%rip),%xmm10 # 364f0 <_sk_srcover_bgra_8888_sse2_lowp+0x11e8>
+ .byte 68,15,88,21,112,87,1,0 // addps 0x15770(%rip),%xmm10 # 364a0 <_sk_srcover_bgra_8888_sse2_lowp+0x1198>
.byte 68,15,17,144,64,1,0,0 // movups %xmm10,0x140(%rax)
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 255,224 // jmpq *%rax
@@ -41410,11 +41391,11 @@ _sk_bicubic_p3y_sse41:
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 15,16,72,64 // movups 0x40(%rax),%xmm1
.byte 68,15,16,128,192,0,0,0 // movups 0xc0(%rax),%xmm8
- .byte 15,88,13,83,87,1,0 // addps 0x15753(%rip),%xmm1 # 364e0 <_sk_srcover_bgra_8888_sse2_lowp+0x11d8>
+ .byte 15,88,13,63,87,1,0 // addps 0x1573f(%rip),%xmm1 # 36490 <_sk_srcover_bgra_8888_sse2_lowp+0x1188>
.byte 69,15,40,200 // movaps %xmm8,%xmm9
.byte 69,15,89,201 // mulps %xmm9,%xmm9
- .byte 68,15,89,5,35,87,1,0 // mulps 0x15723(%rip),%xmm8 # 364c0 <_sk_srcover_bgra_8888_sse2_lowp+0x11b8>
- .byte 68,15,88,5,171,82,1,0 // addps 0x152ab(%rip),%xmm8 # 36050 <_sk_srcover_bgra_8888_sse2_lowp+0xd48>
+ .byte 68,15,89,5,15,87,1,0 // mulps 0x1570f(%rip),%xmm8 # 36470 <_sk_srcover_bgra_8888_sse2_lowp+0x1168>
+ .byte 68,15,88,5,231,82,1,0 // addps 0x152e7(%rip),%xmm8 # 36050 <_sk_srcover_bgra_8888_sse2_lowp+0xd48>
.byte 69,15,89,193 // mulps %xmm9,%xmm8
.byte 68,15,17,128,64,1,0,0 // movups %xmm8,0x140(%rax)
.byte 72,173 // lods %ds:(%rsi),%rax
@@ -41525,7 +41506,7 @@ _sk_clut_3D_sse41:
.byte 15,89,194 // mulps %xmm2,%xmm0
.byte 15,41,68,36,208 // movaps %xmm0,-0x30(%rsp)
.byte 243,15,91,240 // cvttps2dq %xmm0,%xmm6
- .byte 15,40,37,14,86,1,0 // movaps 0x1560e(%rip),%xmm4 # 36500 <_sk_srcover_bgra_8888_sse2_lowp+0x11f8>
+ .byte 15,40,37,250,85,1,0 // movaps 0x155fa(%rip),%xmm4 # 364b0 <_sk_srcover_bgra_8888_sse2_lowp+0x11a8>
.byte 15,88,196 // addps %xmm4,%xmm0
.byte 15,41,68,36,176 // movaps %xmm0,-0x50(%rsp)
.byte 102,65,15,110,208 // movd %r8d,%xmm2
@@ -41564,7 +41545,7 @@ _sk_clut_3D_sse41:
.byte 102,68,15,56,64,192 // pmulld %xmm0,%xmm8
.byte 102,65,15,111,216 // movdqa %xmm8,%xmm3
.byte 102,15,254,218 // paddd %xmm2,%xmm3
- .byte 102,68,15,111,37,101,85,1,0 // movdqa 0x15565(%rip),%xmm12 # 36510 <_sk_srcover_bgra_8888_sse2_lowp+0x1208>
+ .byte 102,68,15,111,37,81,85,1,0 // movdqa 0x15551(%rip),%xmm12 # 364c0 <_sk_srcover_bgra_8888_sse2_lowp+0x11b8>
.byte 102,65,15,56,64,220 // pmulld %xmm12,%xmm3
.byte 102,15,118,228 // pcmpeqd %xmm4,%xmm4
.byte 102,15,111,203 // movdqa %xmm3,%xmm1
@@ -41587,7 +41568,7 @@ _sk_clut_3D_sse41:
.byte 102,65,15,58,22,217,1 // pextrd $0x1,%xmm3,%r9d
.byte 102,65,15,58,22,218,2 // pextrd $0x2,%xmm3,%r10d
.byte 102,65,15,58,22,219,3 // pextrd $0x3,%xmm3,%r11d
- .byte 102,15,111,37,89,78,1,0 // movdqa 0x14e59(%rip),%xmm4 # 35e80 <_sk_srcover_bgra_8888_sse2_lowp+0xb78>
+ .byte 102,15,111,37,149,78,1,0 // movdqa 0x14e95(%rip),%xmm4 # 35e80 <_sk_srcover_bgra_8888_sse2_lowp+0xb78>
.byte 102,15,254,220 // paddd %xmm4,%xmm3
.byte 102,15,111,252 // movdqa %xmm4,%xmm7
.byte 102,73,15,58,22,222,1 // pextrq $0x1,%xmm3,%r14
@@ -41760,7 +41741,7 @@ _sk_clut_3D_sse41:
.byte 102,68,15,254,202 // paddd %xmm2,%xmm9
.byte 102,65,15,111,192 // movdqa %xmm8,%xmm0
.byte 102,65,15,254,193 // paddd %xmm9,%xmm0
- .byte 102,15,111,45,116,81,1,0 // movdqa 0x15174(%rip),%xmm5 # 36510 <_sk_srcover_bgra_8888_sse2_lowp+0x1208>
+ .byte 102,15,111,45,96,81,1,0 // movdqa 0x15160(%rip),%xmm5 # 364c0 <_sk_srcover_bgra_8888_sse2_lowp+0x11b8>
.byte 102,15,56,64,197 // pmulld %xmm5,%xmm0
.byte 102,15,111,200 // movdqa %xmm0,%xmm1
.byte 102,15,118,246 // pcmpeqd %xmm6,%xmm6
@@ -41781,7 +41762,7 @@ _sk_clut_3D_sse41:
.byte 102,65,15,58,22,193,1 // pextrd $0x1,%xmm0,%r9d
.byte 102,65,15,58,22,194,2 // pextrd $0x2,%xmm0,%r10d
.byte 102,65,15,58,22,195,3 // pextrd $0x3,%xmm0,%r11d
- .byte 102,15,111,61,117,74,1,0 // movdqa 0x14a75(%rip),%xmm7 # 35e80 <_sk_srcover_bgra_8888_sse2_lowp+0xb78>
+ .byte 102,15,111,61,177,74,1,0 // movdqa 0x14ab1(%rip),%xmm7 # 35e80 <_sk_srcover_bgra_8888_sse2_lowp+0xb78>
.byte 102,15,254,199 // paddd %xmm7,%xmm0
.byte 102,72,15,58,22,193,1 // pextrq $0x1,%xmm0,%rcx
.byte 102,72,15,126,195 // movq %xmm0,%rbx
@@ -41847,7 +41828,7 @@ _sk_clut_3D_sse41:
.byte 15,88,248 // addps %xmm0,%xmm7
.byte 102,68,15,254,210 // paddd %xmm2,%xmm10
.byte 102,69,15,254,194 // paddd %xmm10,%xmm8
- .byte 102,15,111,13,176,79,1,0 // movdqa 0x14fb0(%rip),%xmm1 # 36510 <_sk_srcover_bgra_8888_sse2_lowp+0x1208>
+ .byte 102,15,111,13,156,79,1,0 // movdqa 0x14f9c(%rip),%xmm1 # 364c0 <_sk_srcover_bgra_8888_sse2_lowp+0x11b8>
.byte 102,68,15,56,64,193 // pmulld %xmm1,%xmm8
.byte 102,65,15,111,192 // movdqa %xmm8,%xmm0
.byte 102,15,118,237 // pcmpeqd %xmm5,%xmm5
@@ -41868,7 +41849,7 @@ _sk_clut_3D_sse41:
.byte 102,69,15,58,22,193,1 // pextrd $0x1,%xmm8,%r9d
.byte 102,69,15,58,22,194,2 // pextrd $0x2,%xmm8,%r10d
.byte 102,69,15,58,22,195,3 // pextrd $0x3,%xmm8,%r11d
- .byte 102,15,111,21,171,72,1,0 // movdqa 0x148ab(%rip),%xmm2 # 35e80 <_sk_srcover_bgra_8888_sse2_lowp+0xb78>
+ .byte 102,15,111,21,231,72,1,0 // movdqa 0x148e7(%rip),%xmm2 # 35e80 <_sk_srcover_bgra_8888_sse2_lowp+0xb78>
.byte 102,68,15,254,194 // paddd %xmm2,%xmm8
.byte 102,76,15,58,22,193,1 // pextrq $0x1,%xmm8,%rcx
.byte 102,76,15,126,195 // movq %xmm8,%rbx
@@ -41995,7 +41976,7 @@ _sk_clut_4D_sse41:
.byte 15,89,203 // mulps %xmm3,%xmm1
.byte 15,41,76,36,48 // movaps %xmm1,0x30(%rsp)
.byte 243,15,91,249 // cvttps2dq %xmm1,%xmm7
- .byte 15,40,29,14,77,1,0 // movaps 0x14d0e(%rip),%xmm3 # 36500 <_sk_srcover_bgra_8888_sse2_lowp+0x11f8>
+ .byte 15,40,29,250,76,1,0 // movaps 0x14cfa(%rip),%xmm3 # 364b0 <_sk_srcover_bgra_8888_sse2_lowp+0x11a8>
.byte 15,88,203 // addps %xmm3,%xmm1
.byte 15,41,76,36,160 // movaps %xmm1,-0x60(%rsp)
.byte 102,65,15,110,232 // movd %r8d,%xmm5
@@ -42052,7 +42033,7 @@ _sk_clut_4D_sse41:
.byte 102,68,15,56,64,253 // pmulld %xmm5,%xmm15
.byte 102,65,15,111,223 // movdqa %xmm15,%xmm3
.byte 102,15,254,217 // paddd %xmm1,%xmm3
- .byte 102,68,15,111,29,13,76,1,0 // movdqa 0x14c0d(%rip),%xmm11 # 36510 <_sk_srcover_bgra_8888_sse2_lowp+0x1208>
+ .byte 102,68,15,111,29,249,75,1,0 // movdqa 0x14bf9(%rip),%xmm11 # 364c0 <_sk_srcover_bgra_8888_sse2_lowp+0x11b8>
.byte 102,65,15,56,64,219 // pmulld %xmm11,%xmm3
.byte 102,15,118,192 // pcmpeqd %xmm0,%xmm0
.byte 102,15,111,243 // movdqa %xmm3,%xmm6
@@ -42074,7 +42055,7 @@ _sk_clut_4D_sse41:
.byte 102,65,15,58,22,217,1 // pextrd $0x1,%xmm3,%r9d
.byte 102,65,15,58,22,218,2 // pextrd $0x2,%xmm3,%r10d
.byte 102,65,15,58,22,219,3 // pextrd $0x3,%xmm3,%r11d
- .byte 102,68,15,111,21,5,69,1,0 // movdqa 0x14505(%rip),%xmm10 # 35e80 <_sk_srcover_bgra_8888_sse2_lowp+0xb78>
+ .byte 102,68,15,111,21,65,69,1,0 // movdqa 0x14541(%rip),%xmm10 # 35e80 <_sk_srcover_bgra_8888_sse2_lowp+0xb78>
.byte 102,65,15,254,218 // paddd %xmm10,%xmm3
.byte 102,73,15,58,22,222,1 // pextrq $0x1,%xmm3,%r14
.byte 102,72,15,126,219 // movq %xmm3,%rbx
@@ -42092,7 +42073,7 @@ _sk_clut_4D_sse41:
.byte 102,65,15,254,201 // paddd %xmm9,%xmm1
.byte 102,65,15,56,64,203 // pmulld %xmm11,%xmm1
.byte 102,15,111,217 // movdqa %xmm1,%xmm3
- .byte 102,15,250,29,67,75,1,0 // psubd 0x14b43(%rip),%xmm3 # 36520 <_sk_srcover_bgra_8888_sse2_lowp+0x1218>
+ .byte 102,15,250,29,47,75,1,0 // psubd 0x14b2f(%rip),%xmm3 # 364d0 <_sk_srcover_bgra_8888_sse2_lowp+0x11c8>
.byte 102,73,15,58,22,222,1 // pextrq $0x1,%xmm3,%r14
.byte 102,72,15,126,219 // movq %xmm3,%rbx
.byte 65,137,223 // mov %ebx,%r15d
@@ -42147,7 +42128,7 @@ _sk_clut_4D_sse41:
.byte 102,65,15,254,199 // paddd %xmm15,%xmm0
.byte 102,65,15,56,64,195 // pmulld %xmm11,%xmm0
.byte 102,15,111,232 // movdqa %xmm0,%xmm5
- .byte 102,15,250,45,35,74,1,0 // psubd 0x14a23(%rip),%xmm5 # 36520 <_sk_srcover_bgra_8888_sse2_lowp+0x1218>
+ .byte 102,15,250,45,15,74,1,0 // psubd 0x14a0f(%rip),%xmm5 # 364d0 <_sk_srcover_bgra_8888_sse2_lowp+0x11c8>
.byte 102,69,15,118,192 // pcmpeqd %xmm8,%xmm8
.byte 102,72,15,58,22,233,1 // pextrq $0x1,%xmm5,%rcx
.byte 102,72,15,126,237 // movq %xmm5,%rbp
@@ -42272,7 +42253,7 @@ _sk_clut_4D_sse41:
.byte 72,193,233,32 // shr $0x20,%rcx
.byte 243,15,16,36,136 // movss (%rax,%rcx,4),%xmm4
.byte 102,68,15,58,33,220,48 // insertps $0x30,%xmm4,%xmm11
- .byte 102,15,111,61,247,64,1,0 // movdqa 0x140f7(%rip),%xmm7 # 35e80 <_sk_srcover_bgra_8888_sse2_lowp+0xb78>
+ .byte 102,15,111,61,51,65,1,0 // movdqa 0x14133(%rip),%xmm7 # 35e80 <_sk_srcover_bgra_8888_sse2_lowp+0xb78>
.byte 102,15,254,223 // paddd %xmm7,%xmm3
.byte 102,72,15,58,22,217,1 // pextrq $0x1,%xmm3,%rcx
.byte 102,72,15,126,221 // movq %xmm3,%rbp
@@ -42358,7 +42339,7 @@ _sk_clut_4D_sse41:
.byte 102,65,15,58,22,201,1 // pextrd $0x1,%xmm1,%r9d
.byte 102,65,15,58,22,202,2 // pextrd $0x2,%xmm1,%r10d
.byte 102,65,15,58,22,203,3 // pextrd $0x3,%xmm1,%r11d
- .byte 102,68,15,111,21,59,63,1,0 // movdqa 0x13f3b(%rip),%xmm10 # 35e80 <_sk_srcover_bgra_8888_sse2_lowp+0xb78>
+ .byte 102,68,15,111,21,119,63,1,0 // movdqa 0x13f77(%rip),%xmm10 # 35e80 <_sk_srcover_bgra_8888_sse2_lowp+0xb78>
.byte 102,65,15,254,202 // paddd %xmm10,%xmm1
.byte 102,72,15,58,22,201,1 // pextrq $0x1,%xmm1,%rcx
.byte 102,72,15,126,203 // movq %xmm1,%rbx
@@ -42454,7 +42435,7 @@ _sk_clut_4D_sse41:
.byte 102,15,111,124,36,192 // movdqa -0x40(%rsp),%xmm7
.byte 102,15,111,199 // movdqa %xmm7,%xmm0
.byte 102,15,254,195 // paddd %xmm3,%xmm0
- .byte 102,15,111,21,229,67,1,0 // movdqa 0x143e5(%rip),%xmm2 # 36510 <_sk_srcover_bgra_8888_sse2_lowp+0x1208>
+ .byte 102,15,111,21,209,67,1,0 // movdqa 0x143d1(%rip),%xmm2 # 364c0 <_sk_srcover_bgra_8888_sse2_lowp+0x11b8>
.byte 102,15,56,64,194 // pmulld %xmm2,%xmm0
.byte 102,15,111,200 // movdqa %xmm0,%xmm1
.byte 102,69,15,118,192 // pcmpeqd %xmm8,%xmm8
@@ -42475,7 +42456,7 @@ _sk_clut_4D_sse41:
.byte 102,65,15,58,22,193,1 // pextrd $0x1,%xmm0,%r9d
.byte 102,65,15,58,22,194,2 // pextrd $0x2,%xmm0,%r10d
.byte 102,65,15,58,22,195,3 // pextrd $0x3,%xmm0,%r11d
- .byte 102,15,111,37,228,60,1,0 // movdqa 0x13ce4(%rip),%xmm4 # 35e80 <_sk_srcover_bgra_8888_sse2_lowp+0xb78>
+ .byte 102,15,111,37,32,61,1,0 // movdqa 0x13d20(%rip),%xmm4 # 35e80 <_sk_srcover_bgra_8888_sse2_lowp+0xb78>
.byte 102,15,254,196 // paddd %xmm4,%xmm0
.byte 102,72,15,58,22,193,1 // pextrq $0x1,%xmm0,%rcx
.byte 102,72,15,126,195 // movq %xmm0,%rbx
@@ -42547,7 +42528,7 @@ _sk_clut_4D_sse41:
.byte 102,68,15,111,226 // movdqa %xmm2,%xmm12
.byte 102,65,15,56,64,204 // pmulld %xmm12,%xmm1
.byte 102,15,111,209 // movdqa %xmm1,%xmm2
- .byte 102,15,250,21,16,66,1,0 // psubd 0x14210(%rip),%xmm2 # 36520 <_sk_srcover_bgra_8888_sse2_lowp+0x1218>
+ .byte 102,15,250,21,252,65,1,0 // psubd 0x141fc(%rip),%xmm2 # 364d0 <_sk_srcover_bgra_8888_sse2_lowp+0x11c8>
.byte 102,72,15,58,22,209,1 // pextrq $0x1,%xmm2,%rcx
.byte 102,72,15,126,213 // movq %xmm2,%rbp
.byte 137,235 // mov %ebp,%ebx
@@ -42581,7 +42562,7 @@ _sk_clut_4D_sse41:
.byte 102,65,15,111,249 // movdqa %xmm9,%xmm7
.byte 102,69,15,56,64,236 // pmulld %xmm12,%xmm13
.byte 102,65,15,111,205 // movdqa %xmm13,%xmm1
- .byte 102,15,250,13,92,65,1,0 // psubd 0x1415c(%rip),%xmm1 # 36520 <_sk_srcover_bgra_8888_sse2_lowp+0x1218>
+ .byte 102,15,250,13,72,65,1,0 // psubd 0x14148(%rip),%xmm1 # 364d0 <_sk_srcover_bgra_8888_sse2_lowp+0x11c8>
.byte 102,72,15,58,22,201,1 // pextrq $0x1,%xmm1,%rcx
.byte 102,72,15,126,203 // movq %xmm1,%rbx
.byte 137,221 // mov %ebx,%ebp
@@ -42646,7 +42627,7 @@ _sk_clut_4D_sse41:
.byte 102,65,15,111,206 // movdqa %xmm14,%xmm1
.byte 102,15,111,108,36,192 // movdqa -0x40(%rsp),%xmm5
.byte 102,15,254,205 // paddd %xmm5,%xmm1
- .byte 102,15,111,37,243,63,1,0 // movdqa 0x13ff3(%rip),%xmm4 # 36510 <_sk_srcover_bgra_8888_sse2_lowp+0x1208>
+ .byte 102,15,111,37,223,63,1,0 // movdqa 0x13fdf(%rip),%xmm4 # 364c0 <_sk_srcover_bgra_8888_sse2_lowp+0x11b8>
.byte 102,15,56,64,204 // pmulld %xmm4,%xmm1
.byte 102,15,111,193 // movdqa %xmm1,%xmm0
.byte 102,15,118,246 // pcmpeqd %xmm6,%xmm6
@@ -42667,7 +42648,7 @@ _sk_clut_4D_sse41:
.byte 102,65,15,58,22,201,1 // pextrd $0x1,%xmm1,%r9d
.byte 102,65,15,58,22,202,2 // pextrd $0x2,%xmm1,%r10d
.byte 102,65,15,58,22,203,3 // pextrd $0x3,%xmm1,%r11d
- .byte 102,15,111,29,244,56,1,0 // movdqa 0x138f4(%rip),%xmm3 # 35e80 <_sk_srcover_bgra_8888_sse2_lowp+0xb78>
+ .byte 102,15,111,29,48,57,1,0 // movdqa 0x13930(%rip),%xmm3 # 35e80 <_sk_srcover_bgra_8888_sse2_lowp+0xb78>
.byte 102,15,254,203 // paddd %xmm3,%xmm1
.byte 102,72,15,58,22,201,1 // pextrq $0x1,%xmm1,%rcx
.byte 102,72,15,126,203 // movq %xmm1,%rbx
@@ -42739,7 +42720,7 @@ _sk_clut_4D_sse41:
.byte 102,15,56,64,239 // pmulld %xmm7,%xmm5
.byte 102,15,111,205 // movdqa %xmm5,%xmm1
.byte 102,15,111,193 // movdqa %xmm1,%xmm0
- .byte 102,15,250,5,36,62,1,0 // psubd 0x13e24(%rip),%xmm0 # 36520 <_sk_srcover_bgra_8888_sse2_lowp+0x1218>
+ .byte 102,15,250,5,16,62,1,0 // psubd 0x13e10(%rip),%xmm0 # 364d0 <_sk_srcover_bgra_8888_sse2_lowp+0x11c8>
.byte 102,72,15,58,22,193,1 // pextrq $0x1,%xmm0,%rcx
.byte 102,72,15,126,197 // movq %xmm0,%rbp
.byte 137,235 // mov %ebp,%ebx
@@ -42757,7 +42738,7 @@ _sk_clut_4D_sse41:
.byte 102,65,15,58,22,193,1 // pextrd $0x1,%xmm0,%r9d
.byte 102,65,15,58,22,194,2 // pextrd $0x2,%xmm0,%r10d
.byte 102,65,15,58,22,195,3 // pextrd $0x3,%xmm0,%r11d
- .byte 102,15,254,5,34,55,1,0 // paddd 0x13722(%rip),%xmm0 # 35e80 <_sk_srcover_bgra_8888_sse2_lowp+0xb78>
+ .byte 102,15,254,5,94,55,1,0 // paddd 0x1375e(%rip),%xmm0 # 35e80 <_sk_srcover_bgra_8888_sse2_lowp+0xb78>
.byte 102,72,15,58,22,193,1 // pextrq $0x1,%xmm0,%rcx
.byte 102,72,15,126,195 // movq %xmm0,%rbx
.byte 137,221 // mov %ebx,%ebp
@@ -42773,7 +42754,7 @@ _sk_clut_4D_sse41:
.byte 102,15,254,84,36,176 // paddd -0x50(%rsp),%xmm2
.byte 102,15,56,64,215 // pmulld %xmm7,%xmm2
.byte 102,15,111,194 // movdqa %xmm2,%xmm0
- .byte 102,15,250,5,107,61,1,0 // psubd 0x13d6b(%rip),%xmm0 # 36520 <_sk_srcover_bgra_8888_sse2_lowp+0x1218>
+ .byte 102,15,250,5,87,61,1,0 // psubd 0x13d57(%rip),%xmm0 # 364d0 <_sk_srcover_bgra_8888_sse2_lowp+0x11c8>
.byte 102,72,15,58,22,193,1 // pextrq $0x1,%xmm0,%rcx
.byte 102,72,15,126,195 // movq %xmm0,%rbx
.byte 137,221 // mov %ebx,%ebp
@@ -42791,7 +42772,7 @@ _sk_clut_4D_sse41:
.byte 102,65,15,58,22,199,1 // pextrd $0x1,%xmm0,%r15d
.byte 102,65,15,58,22,196,2 // pextrd $0x2,%xmm0,%r12d
.byte 102,65,15,58,22,198,3 // pextrd $0x3,%xmm0,%r14d
- .byte 102,15,254,5,105,54,1,0 // paddd 0x13669(%rip),%xmm0 # 35e80 <_sk_srcover_bgra_8888_sse2_lowp+0xb78>
+ .byte 102,15,254,5,165,54,1,0 // paddd 0x136a5(%rip),%xmm0 # 35e80 <_sk_srcover_bgra_8888_sse2_lowp+0xb78>
.byte 102,72,15,58,22,195,1 // pextrq $0x1,%xmm0,%rbx
.byte 102,72,15,126,197 // movq %xmm0,%rbp
.byte 137,233 // mov %ebp,%ecx
@@ -42854,7 +42835,7 @@ _sk_clut_4D_sse41:
.byte 15,89,212 // mulps %xmm4,%xmm2
.byte 65,15,88,211 // addps %xmm11,%xmm2
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 15,40,29,38,53,1,0 // movaps 0x13526(%rip),%xmm3 # 35e50 <_sk_srcover_bgra_8888_sse2_lowp+0xb48>
+ .byte 15,40,29,98,53,1,0 // movaps 0x13562(%rip),%xmm3 # 35e50 <_sk_srcover_bgra_8888_sse2_lowp+0xb48>
.byte 72,139,76,36,248 // mov -0x8(%rsp),%rcx
.byte 15,40,100,36,64 // movaps 0x40(%rsp),%xmm4
.byte 15,40,108,36,80 // movaps 0x50(%rsp),%xmm5
@@ -42869,6 +42850,25 @@ _sk_clut_4D_sse41:
.byte 93 // pop %rbp
.byte 255,224 // jmpq *%rax
+HIDDEN _sk_gauss_a_to_rgba_sse41
+.globl _sk_gauss_a_to_rgba_sse41
+FUNCTION(_sk_gauss_a_to_rgba_sse41)
+_sk_gauss_a_to_rgba_sse41:
+ .byte 15,40,5,191,59,1,0 // movaps 0x13bbf(%rip),%xmm0 # 364e0 <_sk_srcover_bgra_8888_sse2_lowp+0x11d8>
+ .byte 15,89,195 // mulps %xmm3,%xmm0
+ .byte 15,88,5,197,59,1,0 // addps 0x13bc5(%rip),%xmm0 # 364f0 <_sk_srcover_bgra_8888_sse2_lowp+0x11e8>
+ .byte 15,89,195 // mulps %xmm3,%xmm0
+ .byte 15,88,5,203,59,1,0 // addps 0x13bcb(%rip),%xmm0 # 36500 <_sk_srcover_bgra_8888_sse2_lowp+0x11f8>
+ .byte 15,89,195 // mulps %xmm3,%xmm0
+ .byte 15,88,5,209,59,1,0 // addps 0x13bd1(%rip),%xmm0 # 36510 <_sk_srcover_bgra_8888_sse2_lowp+0x1208>
+ .byte 15,89,195 // mulps %xmm3,%xmm0
+ .byte 15,88,5,215,59,1,0 // addps 0x13bd7(%rip),%xmm0 # 36520 <_sk_srcover_bgra_8888_sse2_lowp+0x1218>
+ .byte 72,173 // lods %ds:(%rsi),%rax
+ .byte 15,40,200 // movaps %xmm0,%xmm1
+ .byte 15,40,208 // movaps %xmm0,%xmm2
+ .byte 15,40,216 // movaps %xmm0,%xmm3
+ .byte 255,224 // jmpq *%rax
+
HIDDEN _sk_start_pipeline_sse2
.globl _sk_start_pipeline_sse2
FUNCTION(_sk_start_pipeline_sse2)
@@ -49231,25 +49231,6 @@ _sk_evenly_spaced_gradient_sse2:
.byte 65,94 // pop %r14
.byte 255,224 // jmpq *%rax
-HIDDEN _sk_gauss_a_to_rgba_sse2
-.globl _sk_gauss_a_to_rgba_sse2
-FUNCTION(_sk_gauss_a_to_rgba_sse2)
-_sk_gauss_a_to_rgba_sse2:
- .byte 15,40,5,106,220,0,0 // movaps 0xdc6a(%rip),%xmm0 # 363e0 <_sk_srcover_bgra_8888_sse2_lowp+0x10d8>
- .byte 15,89,195 // mulps %xmm3,%xmm0
- .byte 15,88,5,112,220,0,0 // addps 0xdc70(%rip),%xmm0 # 363f0 <_sk_srcover_bgra_8888_sse2_lowp+0x10e8>
- .byte 15,89,195 // mulps %xmm3,%xmm0
- .byte 15,88,5,118,220,0,0 // addps 0xdc76(%rip),%xmm0 # 36400 <_sk_srcover_bgra_8888_sse2_lowp+0x10f8>
- .byte 15,89,195 // mulps %xmm3,%xmm0
- .byte 15,88,5,124,220,0,0 // addps 0xdc7c(%rip),%xmm0 # 36410 <_sk_srcover_bgra_8888_sse2_lowp+0x1108>
- .byte 15,89,195 // mulps %xmm3,%xmm0
- .byte 15,88,5,130,220,0,0 // addps 0xdc82(%rip),%xmm0 # 36420 <_sk_srcover_bgra_8888_sse2_lowp+0x1118>
- .byte 72,173 // lods %ds:(%rsi),%rax
- .byte 15,40,200 // movaps %xmm0,%xmm1
- .byte 15,40,208 // movaps %xmm0,%xmm2
- .byte 15,40,216 // movaps %xmm0,%xmm3
- .byte 255,224 // jmpq *%rax
-
HIDDEN _sk_gradient_sse2
.globl _sk_gradient_sse2
FUNCTION(_sk_gradient_sse2)
@@ -49258,7 +49239,7 @@ _sk_gradient_sse2:
.byte 76,139,0 // mov (%rax),%r8
.byte 102,15,239,201 // pxor %xmm1,%xmm1
.byte 73,131,248,2 // cmp $0x2,%r8
- .byte 114,41 // jb 287e3 <_sk_gradient_sse2+0x38>
+ .byte 114,41 // jb 287a7 <_sk_gradient_sse2+0x38>
.byte 76,139,72,72 // mov 0x48(%rax),%r9
.byte 73,255,200 // dec %r8
.byte 73,131,193,4 // add $0x4,%r9
@@ -49269,7 +49250,7 @@ _sk_gradient_sse2:
.byte 102,15,250,202 // psubd %xmm2,%xmm1
.byte 73,131,193,4 // add $0x4,%r9
.byte 73,255,200 // dec %r8
- .byte 117,230 // jne 287c9 <_sk_gradient_sse2+0x1e>
+ .byte 117,230 // jne 2878d <_sk_gradient_sse2+0x1e>
.byte 65,86 // push %r14
.byte 83 // push %rbx
.byte 102,15,112,209,78 // pshufd $0x4e,%xmm1,%xmm2
@@ -49409,29 +49390,29 @@ _sk_xy_to_unit_angle_sse2:
.byte 69,15,94,220 // divps %xmm12,%xmm11
.byte 69,15,40,227 // movaps %xmm11,%xmm12
.byte 69,15,89,228 // mulps %xmm12,%xmm12
- .byte 68,15,40,45,18,218,0,0 // movaps 0xda12(%rip),%xmm13 # 36430 <_sk_srcover_bgra_8888_sse2_lowp+0x1128>
+ .byte 68,15,40,45,254,217,0,0 // movaps 0xd9fe(%rip),%xmm13 # 363e0 <_sk_srcover_bgra_8888_sse2_lowp+0x10d8>
.byte 69,15,89,236 // mulps %xmm12,%xmm13
- .byte 68,15,88,45,22,218,0,0 // addps 0xda16(%rip),%xmm13 # 36440 <_sk_srcover_bgra_8888_sse2_lowp+0x1138>
+ .byte 68,15,88,45,2,218,0,0 // addps 0xda02(%rip),%xmm13 # 363f0 <_sk_srcover_bgra_8888_sse2_lowp+0x10e8>
.byte 69,15,89,236 // mulps %xmm12,%xmm13
- .byte 68,15,88,45,26,218,0,0 // addps 0xda1a(%rip),%xmm13 # 36450 <_sk_srcover_bgra_8888_sse2_lowp+0x1148>
+ .byte 68,15,88,45,6,218,0,0 // addps 0xda06(%rip),%xmm13 # 36400 <_sk_srcover_bgra_8888_sse2_lowp+0x10f8>
.byte 69,15,89,236 // mulps %xmm12,%xmm13
- .byte 68,15,88,45,30,218,0,0 // addps 0xda1e(%rip),%xmm13 # 36460 <_sk_srcover_bgra_8888_sse2_lowp+0x1158>
+ .byte 68,15,88,45,10,218,0,0 // addps 0xda0a(%rip),%xmm13 # 36410 <_sk_srcover_bgra_8888_sse2_lowp+0x1108>
.byte 69,15,89,235 // mulps %xmm11,%xmm13
.byte 69,15,194,202,1 // cmpltps %xmm10,%xmm9
- .byte 68,15,40,21,29,218,0,0 // movaps 0xda1d(%rip),%xmm10 # 36470 <_sk_srcover_bgra_8888_sse2_lowp+0x1168>
+ .byte 68,15,40,21,9,218,0,0 // movaps 0xda09(%rip),%xmm10 # 36420 <_sk_srcover_bgra_8888_sse2_lowp+0x1118>
.byte 69,15,92,213 // subps %xmm13,%xmm10
.byte 69,15,84,209 // andps %xmm9,%xmm10
.byte 69,15,85,205 // andnps %xmm13,%xmm9
.byte 69,15,86,202 // orps %xmm10,%xmm9
.byte 68,15,194,192,1 // cmpltps %xmm0,%xmm8
- .byte 68,15,40,21,208,211,0,0 // movaps 0xd3d0(%rip),%xmm10 # 35e40 <_sk_srcover_bgra_8888_sse2_lowp+0xb38>
+ .byte 68,15,40,21,12,212,0,0 // movaps 0xd40c(%rip),%xmm10 # 35e40 <_sk_srcover_bgra_8888_sse2_lowp+0xb38>
.byte 69,15,92,209 // subps %xmm9,%xmm10
.byte 69,15,84,208 // andps %xmm8,%xmm10
.byte 69,15,85,193 // andnps %xmm9,%xmm8
.byte 69,15,86,194 // orps %xmm10,%xmm8
.byte 68,15,40,201 // movaps %xmm1,%xmm9
.byte 68,15,194,200,1 // cmpltps %xmm0,%xmm9
- .byte 68,15,40,21,191,211,0,0 // movaps 0xd3bf(%rip),%xmm10 # 35e50 <_sk_srcover_bgra_8888_sse2_lowp+0xb48>
+ .byte 68,15,40,21,251,211,0,0 // movaps 0xd3fb(%rip),%xmm10 # 35e50 <_sk_srcover_bgra_8888_sse2_lowp+0xb48>
.byte 69,15,92,208 // subps %xmm8,%xmm10
.byte 69,15,84,209 // andps %xmm9,%xmm10
.byte 69,15,85,200 // andnps %xmm8,%xmm9
@@ -49466,7 +49447,7 @@ _sk_xy_to_2pt_conical_quadratic_max_sse2:
.byte 243,69,15,89,203 // mulss %xmm11,%xmm9
.byte 69,15,198,201,0 // shufps $0x0,%xmm9,%xmm9
.byte 68,15,88,200 // addps %xmm0,%xmm9
- .byte 68,15,89,13,134,217,0,0 // mulps 0xd986(%rip),%xmm9 # 36480 <_sk_srcover_bgra_8888_sse2_lowp+0x1178>
+ .byte 68,15,89,13,114,217,0,0 // mulps 0xd972(%rip),%xmm9 # 36430 <_sk_srcover_bgra_8888_sse2_lowp+0x1128>
.byte 15,89,192 // mulps %xmm0,%xmm0
.byte 68,15,40,225 // movaps %xmm1,%xmm12
.byte 69,15,89,228 // mulps %xmm12,%xmm12
@@ -49474,7 +49455,7 @@ _sk_xy_to_2pt_conical_quadratic_max_sse2:
.byte 243,69,15,89,219 // mulss %xmm11,%xmm11
.byte 69,15,198,219,0 // shufps $0x0,%xmm11,%xmm11
.byte 69,15,92,227 // subps %xmm11,%xmm12
- .byte 68,15,89,21,113,217,0,0 // mulps 0xd971(%rip),%xmm10 # 36490 <_sk_srcover_bgra_8888_sse2_lowp+0x1188>
+ .byte 68,15,89,21,93,217,0,0 // mulps 0xd95d(%rip),%xmm10 # 36440 <_sk_srcover_bgra_8888_sse2_lowp+0x1138>
.byte 69,15,89,212 // mulps %xmm12,%xmm10
.byte 65,15,40,193 // movaps %xmm9,%xmm0
.byte 15,89,192 // mulps %xmm0,%xmm0
@@ -49483,8 +49464,8 @@ _sk_xy_to_2pt_conical_quadratic_max_sse2:
.byte 69,15,198,192,0 // shufps $0x0,%xmm8,%xmm8
.byte 65,15,40,194 // movaps %xmm10,%xmm0
.byte 65,15,92,193 // subps %xmm9,%xmm0
- .byte 68,15,87,13,25,216,0,0 // xorps 0xd819(%rip),%xmm9 # 36360 <_sk_srcover_bgra_8888_sse2_lowp+0x1058>
- .byte 68,15,89,5,241,210,0,0 // mulps 0xd2f1(%rip),%xmm8 # 35e40 <_sk_srcover_bgra_8888_sse2_lowp+0xb38>
+ .byte 68,15,87,13,85,216,0,0 // xorps 0xd855(%rip),%xmm9 # 36360 <_sk_srcover_bgra_8888_sse2_lowp+0x1058>
+ .byte 68,15,89,5,45,211,0,0 // mulps 0xd32d(%rip),%xmm8 # 35e40 <_sk_srcover_bgra_8888_sse2_lowp+0xb38>
.byte 65,15,89,192 // mulps %xmm8,%xmm0
.byte 69,15,92,202 // subps %xmm10,%xmm9
.byte 69,15,89,200 // mulps %xmm8,%xmm9
@@ -49505,7 +49486,7 @@ _sk_xy_to_2pt_conical_quadratic_min_sse2:
.byte 243,69,15,89,203 // mulss %xmm11,%xmm9
.byte 69,15,198,201,0 // shufps $0x0,%xmm9,%xmm9
.byte 68,15,88,200 // addps %xmm0,%xmm9
- .byte 68,15,89,13,232,216,0,0 // mulps 0xd8e8(%rip),%xmm9 # 36480 <_sk_srcover_bgra_8888_sse2_lowp+0x1178>
+ .byte 68,15,89,13,212,216,0,0 // mulps 0xd8d4(%rip),%xmm9 # 36430 <_sk_srcover_bgra_8888_sse2_lowp+0x1128>
.byte 15,89,192 // mulps %xmm0,%xmm0
.byte 68,15,40,225 // movaps %xmm1,%xmm12
.byte 69,15,89,228 // mulps %xmm12,%xmm12
@@ -49513,7 +49494,7 @@ _sk_xy_to_2pt_conical_quadratic_min_sse2:
.byte 243,69,15,89,219 // mulss %xmm11,%xmm11
.byte 69,15,198,219,0 // shufps $0x0,%xmm11,%xmm11
.byte 69,15,92,227 // subps %xmm11,%xmm12
- .byte 68,15,89,21,211,216,0,0 // mulps 0xd8d3(%rip),%xmm10 # 36490 <_sk_srcover_bgra_8888_sse2_lowp+0x1188>
+ .byte 68,15,89,21,191,216,0,0 // mulps 0xd8bf(%rip),%xmm10 # 36440 <_sk_srcover_bgra_8888_sse2_lowp+0x1138>
.byte 69,15,89,212 // mulps %xmm12,%xmm10
.byte 65,15,40,193 // movaps %xmm9,%xmm0
.byte 15,89,192 // mulps %xmm0,%xmm0
@@ -49522,8 +49503,8 @@ _sk_xy_to_2pt_conical_quadratic_min_sse2:
.byte 69,15,198,192,0 // shufps $0x0,%xmm8,%xmm8
.byte 65,15,40,194 // movaps %xmm10,%xmm0
.byte 65,15,92,193 // subps %xmm9,%xmm0
- .byte 68,15,87,13,123,215,0,0 // xorps 0xd77b(%rip),%xmm9 # 36360 <_sk_srcover_bgra_8888_sse2_lowp+0x1058>
- .byte 68,15,89,5,83,210,0,0 // mulps 0xd253(%rip),%xmm8 # 35e40 <_sk_srcover_bgra_8888_sse2_lowp+0xb38>
+ .byte 68,15,87,13,183,215,0,0 // xorps 0xd7b7(%rip),%xmm9 # 36360 <_sk_srcover_bgra_8888_sse2_lowp+0x1058>
+ .byte 68,15,89,5,143,210,0,0 // mulps 0xd28f(%rip),%xmm8 # 35e40 <_sk_srcover_bgra_8888_sse2_lowp+0xb38>
.byte 65,15,89,192 // mulps %xmm8,%xmm0
.byte 69,15,92,202 // subps %xmm10,%xmm9
.byte 69,15,89,200 // mulps %xmm8,%xmm9
@@ -49541,7 +49522,7 @@ _sk_xy_to_2pt_conical_linear_sse2:
.byte 243,69,15,89,200 // mulss %xmm8,%xmm9
.byte 69,15,198,201,0 // shufps $0x0,%xmm9,%xmm9
.byte 68,15,88,200 // addps %xmm0,%xmm9
- .byte 68,15,89,13,91,216,0,0 // mulps 0xd85b(%rip),%xmm9 # 36480 <_sk_srcover_bgra_8888_sse2_lowp+0x1178>
+ .byte 68,15,89,13,71,216,0,0 // mulps 0xd847(%rip),%xmm9 # 36430 <_sk_srcover_bgra_8888_sse2_lowp+0x1128>
.byte 15,89,192 // mulps %xmm0,%xmm0
.byte 68,15,40,209 // movaps %xmm1,%xmm10
.byte 69,15,89,210 // mulps %xmm10,%xmm10
@@ -49549,7 +49530,7 @@ _sk_xy_to_2pt_conical_linear_sse2:
.byte 243,69,15,89,192 // mulss %xmm8,%xmm8
.byte 69,15,198,192,0 // shufps $0x0,%xmm8,%xmm8
.byte 65,15,92,192 // subps %xmm8,%xmm0
- .byte 15,87,5,23,215,0,0 // xorps 0xd717(%rip),%xmm0 # 36360 <_sk_srcover_bgra_8888_sse2_lowp+0x1058>
+ .byte 15,87,5,83,215,0,0 // xorps 0xd753(%rip),%xmm0 # 36360 <_sk_srcover_bgra_8888_sse2_lowp+0x1058>
.byte 65,15,94,193 // divps %xmm9,%xmm0
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 255,224 // jmpq *%rax
@@ -49595,7 +49576,7 @@ HIDDEN _sk_save_xy_sse2
FUNCTION(_sk_save_xy_sse2)
_sk_save_xy_sse2:
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 68,15,40,5,126,209,0,0 // movaps 0xd17e(%rip),%xmm8 # 35e40 <_sk_srcover_bgra_8888_sse2_lowp+0xb38>
+ .byte 68,15,40,5,186,209,0,0 // movaps 0xd1ba(%rip),%xmm8 # 35e40 <_sk_srcover_bgra_8888_sse2_lowp+0xb38>
.byte 15,17,0 // movups %xmm0,(%rax)
.byte 68,15,40,200 // movaps %xmm0,%xmm9
.byte 69,15,88,200 // addps %xmm8,%xmm9
@@ -49603,7 +49584,7 @@ _sk_save_xy_sse2:
.byte 69,15,91,210 // cvtdq2ps %xmm10,%xmm10
.byte 69,15,40,217 // movaps %xmm9,%xmm11
.byte 69,15,194,218,1 // cmpltps %xmm10,%xmm11
- .byte 68,15,40,37,105,209,0,0 // movaps 0xd169(%rip),%xmm12 # 35e50 <_sk_srcover_bgra_8888_sse2_lowp+0xb48>
+ .byte 68,15,40,37,165,209,0,0 // movaps 0xd1a5(%rip),%xmm12 # 35e50 <_sk_srcover_bgra_8888_sse2_lowp+0xb48>
.byte 69,15,84,220 // andps %xmm12,%xmm11
.byte 69,15,92,211 // subps %xmm11,%xmm10
.byte 69,15,92,202 // subps %xmm10,%xmm9
@@ -49650,8 +49631,8 @@ _sk_bilinear_nx_sse2:
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 15,16,0 // movups (%rax),%xmm0
.byte 68,15,16,128,128,0,0,0 // movups 0x80(%rax),%xmm8
- .byte 15,88,5,25,215,0,0 // addps 0xd719(%rip),%xmm0 # 364a0 <_sk_srcover_bgra_8888_sse2_lowp+0x1198>
- .byte 68,15,40,13,193,208,0,0 // movaps 0xd0c1(%rip),%xmm9 # 35e50 <_sk_srcover_bgra_8888_sse2_lowp+0xb48>
+ .byte 15,88,5,5,215,0,0 // addps 0xd705(%rip),%xmm0 # 36450 <_sk_srcover_bgra_8888_sse2_lowp+0x1148>
+ .byte 68,15,40,13,253,208,0,0 // movaps 0xd0fd(%rip),%xmm9 # 35e50 <_sk_srcover_bgra_8888_sse2_lowp+0xb48>
.byte 69,15,92,200 // subps %xmm8,%xmm9
.byte 68,15,17,136,0,1,0,0 // movups %xmm9,0x100(%rax)
.byte 72,173 // lods %ds:(%rsi),%rax
@@ -49664,7 +49645,7 @@ _sk_bilinear_px_sse2:
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 15,16,0 // movups (%rax),%xmm0
.byte 68,15,16,128,128,0,0,0 // movups 0x80(%rax),%xmm8
- .byte 15,88,5,141,208,0,0 // addps 0xd08d(%rip),%xmm0 # 35e40 <_sk_srcover_bgra_8888_sse2_lowp+0xb38>
+ .byte 15,88,5,201,208,0,0 // addps 0xd0c9(%rip),%xmm0 # 35e40 <_sk_srcover_bgra_8888_sse2_lowp+0xb38>
.byte 68,15,17,128,0,1,0,0 // movups %xmm8,0x100(%rax)
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 255,224 // jmpq *%rax
@@ -49676,8 +49657,8 @@ _sk_bilinear_ny_sse2:
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 15,16,72,64 // movups 0x40(%rax),%xmm1
.byte 68,15,16,128,192,0,0,0 // movups 0xc0(%rax),%xmm8
- .byte 15,88,13,204,214,0,0 // addps 0xd6cc(%rip),%xmm1 # 364a0 <_sk_srcover_bgra_8888_sse2_lowp+0x1198>
- .byte 68,15,40,13,116,208,0,0 // movaps 0xd074(%rip),%xmm9 # 35e50 <_sk_srcover_bgra_8888_sse2_lowp+0xb48>
+ .byte 15,88,13,184,214,0,0 // addps 0xd6b8(%rip),%xmm1 # 36450 <_sk_srcover_bgra_8888_sse2_lowp+0x1148>
+ .byte 68,15,40,13,176,208,0,0 // movaps 0xd0b0(%rip),%xmm9 # 35e50 <_sk_srcover_bgra_8888_sse2_lowp+0xb48>
.byte 69,15,92,200 // subps %xmm8,%xmm9
.byte 68,15,17,136,64,1,0,0 // movups %xmm9,0x140(%rax)
.byte 72,173 // lods %ds:(%rsi),%rax
@@ -49690,7 +49671,7 @@ _sk_bilinear_py_sse2:
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 15,16,72,64 // movups 0x40(%rax),%xmm1
.byte 68,15,16,128,192,0,0,0 // movups 0xc0(%rax),%xmm8
- .byte 15,88,13,63,208,0,0 // addps 0xd03f(%rip),%xmm1 # 35e40 <_sk_srcover_bgra_8888_sse2_lowp+0xb38>
+ .byte 15,88,13,123,208,0,0 // addps 0xd07b(%rip),%xmm1 # 35e40 <_sk_srcover_bgra_8888_sse2_lowp+0xb38>
.byte 68,15,17,128,64,1,0,0 // movups %xmm8,0x140(%rax)
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 255,224 // jmpq *%rax
@@ -49702,13 +49683,13 @@ _sk_bicubic_n3x_sse2:
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 15,16,0 // movups (%rax),%xmm0
.byte 68,15,16,128,128,0,0,0 // movups 0x80(%rax),%xmm8
- .byte 15,88,5,143,214,0,0 // addps 0xd68f(%rip),%xmm0 # 364b0 <_sk_srcover_bgra_8888_sse2_lowp+0x11a8>
- .byte 68,15,40,13,39,208,0,0 // movaps 0xd027(%rip),%xmm9 # 35e50 <_sk_srcover_bgra_8888_sse2_lowp+0xb48>
+ .byte 15,88,5,123,214,0,0 // addps 0xd67b(%rip),%xmm0 # 36460 <_sk_srcover_bgra_8888_sse2_lowp+0x1158>
+ .byte 68,15,40,13,99,208,0,0 // movaps 0xd063(%rip),%xmm9 # 35e50 <_sk_srcover_bgra_8888_sse2_lowp+0xb48>
.byte 69,15,92,200 // subps %xmm8,%xmm9
.byte 69,15,40,193 // movaps %xmm9,%xmm8
.byte 69,15,89,192 // mulps %xmm8,%xmm8
- .byte 68,15,89,13,131,214,0,0 // mulps 0xd683(%rip),%xmm9 # 364c0 <_sk_srcover_bgra_8888_sse2_lowp+0x11b8>
- .byte 68,15,88,13,11,210,0,0 // addps 0xd20b(%rip),%xmm9 # 36050 <_sk_srcover_bgra_8888_sse2_lowp+0xd48>
+ .byte 68,15,89,13,111,214,0,0 // mulps 0xd66f(%rip),%xmm9 # 36470 <_sk_srcover_bgra_8888_sse2_lowp+0x1168>
+ .byte 68,15,88,13,71,210,0,0 // addps 0xd247(%rip),%xmm9 # 36050 <_sk_srcover_bgra_8888_sse2_lowp+0xd48>
.byte 69,15,89,200 // mulps %xmm8,%xmm9
.byte 68,15,17,136,0,1,0,0 // movups %xmm9,0x100(%rax)
.byte 72,173 // lods %ds:(%rsi),%rax
@@ -49721,16 +49702,16 @@ _sk_bicubic_n1x_sse2:
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 15,16,0 // movups (%rax),%xmm0
.byte 68,15,16,128,128,0,0,0 // movups 0x80(%rax),%xmm8
- .byte 15,88,5,55,214,0,0 // addps 0xd637(%rip),%xmm0 # 364a0 <_sk_srcover_bgra_8888_sse2_lowp+0x1198>
- .byte 68,15,40,13,223,207,0,0 // movaps 0xcfdf(%rip),%xmm9 # 35e50 <_sk_srcover_bgra_8888_sse2_lowp+0xb48>
+ .byte 15,88,5,35,214,0,0 // addps 0xd623(%rip),%xmm0 # 36450 <_sk_srcover_bgra_8888_sse2_lowp+0x1148>
+ .byte 68,15,40,13,27,208,0,0 // movaps 0xd01b(%rip),%xmm9 # 35e50 <_sk_srcover_bgra_8888_sse2_lowp+0xb48>
.byte 69,15,92,200 // subps %xmm8,%xmm9
- .byte 68,15,40,5,83,214,0,0 // movaps 0xd653(%rip),%xmm8 # 364d0 <_sk_srcover_bgra_8888_sse2_lowp+0x11c8>
+ .byte 68,15,40,5,63,214,0,0 // movaps 0xd63f(%rip),%xmm8 # 36480 <_sk_srcover_bgra_8888_sse2_lowp+0x1178>
.byte 69,15,89,193 // mulps %xmm9,%xmm8
- .byte 68,15,88,5,87,214,0,0 // addps 0xd657(%rip),%xmm8 # 364e0 <_sk_srcover_bgra_8888_sse2_lowp+0x11d8>
+ .byte 68,15,88,5,67,214,0,0 // addps 0xd643(%rip),%xmm8 # 36490 <_sk_srcover_bgra_8888_sse2_lowp+0x1188>
.byte 69,15,89,193 // mulps %xmm9,%xmm8
- .byte 68,15,88,5,171,207,0,0 // addps 0xcfab(%rip),%xmm8 # 35e40 <_sk_srcover_bgra_8888_sse2_lowp+0xb38>
+ .byte 68,15,88,5,231,207,0,0 // addps 0xcfe7(%rip),%xmm8 # 35e40 <_sk_srcover_bgra_8888_sse2_lowp+0xb38>
.byte 69,15,89,193 // mulps %xmm9,%xmm8
- .byte 68,15,88,5,79,214,0,0 // addps 0xd64f(%rip),%xmm8 # 364f0 <_sk_srcover_bgra_8888_sse2_lowp+0x11e8>
+ .byte 68,15,88,5,59,214,0,0 // addps 0xd63b(%rip),%xmm8 # 364a0 <_sk_srcover_bgra_8888_sse2_lowp+0x1198>
.byte 68,15,17,128,0,1,0,0 // movups %xmm8,0x100(%rax)
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 255,224 // jmpq *%rax
@@ -49740,17 +49721,17 @@ HIDDEN _sk_bicubic_p1x_sse2
FUNCTION(_sk_bicubic_p1x_sse2)
_sk_bicubic_p1x_sse2:
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 68,15,40,5,137,207,0,0 // movaps 0xcf89(%rip),%xmm8 # 35e40 <_sk_srcover_bgra_8888_sse2_lowp+0xb38>
+ .byte 68,15,40,5,197,207,0,0 // movaps 0xcfc5(%rip),%xmm8 # 35e40 <_sk_srcover_bgra_8888_sse2_lowp+0xb38>
.byte 15,16,0 // movups (%rax),%xmm0
.byte 68,15,16,136,128,0,0,0 // movups 0x80(%rax),%xmm9
.byte 65,15,88,192 // addps %xmm8,%xmm0
- .byte 68,15,40,21,2,214,0,0 // movaps 0xd602(%rip),%xmm10 # 364d0 <_sk_srcover_bgra_8888_sse2_lowp+0x11c8>
+ .byte 68,15,40,21,238,213,0,0 // movaps 0xd5ee(%rip),%xmm10 # 36480 <_sk_srcover_bgra_8888_sse2_lowp+0x1178>
.byte 69,15,89,209 // mulps %xmm9,%xmm10
- .byte 68,15,88,21,6,214,0,0 // addps 0xd606(%rip),%xmm10 # 364e0 <_sk_srcover_bgra_8888_sse2_lowp+0x11d8>
+ .byte 68,15,88,21,242,213,0,0 // addps 0xd5f2(%rip),%xmm10 # 36490 <_sk_srcover_bgra_8888_sse2_lowp+0x1188>
.byte 69,15,89,209 // mulps %xmm9,%xmm10
.byte 69,15,88,208 // addps %xmm8,%xmm10
.byte 69,15,89,209 // mulps %xmm9,%xmm10
- .byte 68,15,88,21,2,214,0,0 // addps 0xd602(%rip),%xmm10 # 364f0 <_sk_srcover_bgra_8888_sse2_lowp+0x11e8>
+ .byte 68,15,88,21,238,213,0,0 // addps 0xd5ee(%rip),%xmm10 # 364a0 <_sk_srcover_bgra_8888_sse2_lowp+0x1198>
.byte 68,15,17,144,0,1,0,0 // movups %xmm10,0x100(%rax)
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 255,224 // jmpq *%rax
@@ -49762,11 +49743,11 @@ _sk_bicubic_p3x_sse2:
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 15,16,0 // movups (%rax),%xmm0
.byte 68,15,16,128,128,0,0,0 // movups 0x80(%rax),%xmm8
- .byte 15,88,5,210,213,0,0 // addps 0xd5d2(%rip),%xmm0 # 364e0 <_sk_srcover_bgra_8888_sse2_lowp+0x11d8>
+ .byte 15,88,5,190,213,0,0 // addps 0xd5be(%rip),%xmm0 # 36490 <_sk_srcover_bgra_8888_sse2_lowp+0x1188>
.byte 69,15,40,200 // movaps %xmm8,%xmm9
.byte 69,15,89,201 // mulps %xmm9,%xmm9
- .byte 68,15,89,5,162,213,0,0 // mulps 0xd5a2(%rip),%xmm8 # 364c0 <_sk_srcover_bgra_8888_sse2_lowp+0x11b8>
- .byte 68,15,88,5,42,209,0,0 // addps 0xd12a(%rip),%xmm8 # 36050 <_sk_srcover_bgra_8888_sse2_lowp+0xd48>
+ .byte 68,15,89,5,142,213,0,0 // mulps 0xd58e(%rip),%xmm8 # 36470 <_sk_srcover_bgra_8888_sse2_lowp+0x1168>
+ .byte 68,15,88,5,102,209,0,0 // addps 0xd166(%rip),%xmm8 # 36050 <_sk_srcover_bgra_8888_sse2_lowp+0xd48>
.byte 69,15,89,193 // mulps %xmm9,%xmm8
.byte 68,15,17,128,0,1,0,0 // movups %xmm8,0x100(%rax)
.byte 72,173 // lods %ds:(%rsi),%rax
@@ -49779,13 +49760,13 @@ _sk_bicubic_n3y_sse2:
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 15,16,72,64 // movups 0x40(%rax),%xmm1
.byte 68,15,16,128,192,0,0,0 // movups 0xc0(%rax),%xmm8
- .byte 15,88,13,101,213,0,0 // addps 0xd565(%rip),%xmm1 # 364b0 <_sk_srcover_bgra_8888_sse2_lowp+0x11a8>
- .byte 68,15,40,13,253,206,0,0 // movaps 0xcefd(%rip),%xmm9 # 35e50 <_sk_srcover_bgra_8888_sse2_lowp+0xb48>
+ .byte 15,88,13,81,213,0,0 // addps 0xd551(%rip),%xmm1 # 36460 <_sk_srcover_bgra_8888_sse2_lowp+0x1158>
+ .byte 68,15,40,13,57,207,0,0 // movaps 0xcf39(%rip),%xmm9 # 35e50 <_sk_srcover_bgra_8888_sse2_lowp+0xb48>
.byte 69,15,92,200 // subps %xmm8,%xmm9
.byte 69,15,40,193 // movaps %xmm9,%xmm8
.byte 69,15,89,192 // mulps %xmm8,%xmm8
- .byte 68,15,89,13,89,213,0,0 // mulps 0xd559(%rip),%xmm9 # 364c0 <_sk_srcover_bgra_8888_sse2_lowp+0x11b8>
- .byte 68,15,88,13,225,208,0,0 // addps 0xd0e1(%rip),%xmm9 # 36050 <_sk_srcover_bgra_8888_sse2_lowp+0xd48>
+ .byte 68,15,89,13,69,213,0,0 // mulps 0xd545(%rip),%xmm9 # 36470 <_sk_srcover_bgra_8888_sse2_lowp+0x1168>
+ .byte 68,15,88,13,29,209,0,0 // addps 0xd11d(%rip),%xmm9 # 36050 <_sk_srcover_bgra_8888_sse2_lowp+0xd48>
.byte 69,15,89,200 // mulps %xmm8,%xmm9
.byte 68,15,17,136,64,1,0,0 // movups %xmm9,0x140(%rax)
.byte 72,173 // lods %ds:(%rsi),%rax
@@ -49798,16 +49779,16 @@ _sk_bicubic_n1y_sse2:
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 15,16,72,64 // movups 0x40(%rax),%xmm1
.byte 68,15,16,128,192,0,0,0 // movups 0xc0(%rax),%xmm8
- .byte 15,88,13,12,213,0,0 // addps 0xd50c(%rip),%xmm1 # 364a0 <_sk_srcover_bgra_8888_sse2_lowp+0x1198>
- .byte 68,15,40,13,180,206,0,0 // movaps 0xceb4(%rip),%xmm9 # 35e50 <_sk_srcover_bgra_8888_sse2_lowp+0xb48>
+ .byte 15,88,13,248,212,0,0 // addps 0xd4f8(%rip),%xmm1 # 36450 <_sk_srcover_bgra_8888_sse2_lowp+0x1148>
+ .byte 68,15,40,13,240,206,0,0 // movaps 0xcef0(%rip),%xmm9 # 35e50 <_sk_srcover_bgra_8888_sse2_lowp+0xb48>
.byte 69,15,92,200 // subps %xmm8,%xmm9
- .byte 68,15,40,5,40,213,0,0 // movaps 0xd528(%rip),%xmm8 # 364d0 <_sk_srcover_bgra_8888_sse2_lowp+0x11c8>
+ .byte 68,15,40,5,20,213,0,0 // movaps 0xd514(%rip),%xmm8 # 36480 <_sk_srcover_bgra_8888_sse2_lowp+0x1178>
.byte 69,15,89,193 // mulps %xmm9,%xmm8
- .byte 68,15,88,5,44,213,0,0 // addps 0xd52c(%rip),%xmm8 # 364e0 <_sk_srcover_bgra_8888_sse2_lowp+0x11d8>
+ .byte 68,15,88,5,24,213,0,0 // addps 0xd518(%rip),%xmm8 # 36490 <_sk_srcover_bgra_8888_sse2_lowp+0x1188>
.byte 69,15,89,193 // mulps %xmm9,%xmm8
- .byte 68,15,88,5,128,206,0,0 // addps 0xce80(%rip),%xmm8 # 35e40 <_sk_srcover_bgra_8888_sse2_lowp+0xb38>
+ .byte 68,15,88,5,188,206,0,0 // addps 0xcebc(%rip),%xmm8 # 35e40 <_sk_srcover_bgra_8888_sse2_lowp+0xb38>
.byte 69,15,89,193 // mulps %xmm9,%xmm8
- .byte 68,15,88,5,36,213,0,0 // addps 0xd524(%rip),%xmm8 # 364f0 <_sk_srcover_bgra_8888_sse2_lowp+0x11e8>
+ .byte 68,15,88,5,16,213,0,0 // addps 0xd510(%rip),%xmm8 # 364a0 <_sk_srcover_bgra_8888_sse2_lowp+0x1198>
.byte 68,15,17,128,64,1,0,0 // movups %xmm8,0x140(%rax)
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 255,224 // jmpq *%rax
@@ -49817,17 +49798,17 @@ HIDDEN _sk_bicubic_p1y_sse2
FUNCTION(_sk_bicubic_p1y_sse2)
_sk_bicubic_p1y_sse2:
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 68,15,40,5,94,206,0,0 // movaps 0xce5e(%rip),%xmm8 # 35e40 <_sk_srcover_bgra_8888_sse2_lowp+0xb38>
+ .byte 68,15,40,5,154,206,0,0 // movaps 0xce9a(%rip),%xmm8 # 35e40 <_sk_srcover_bgra_8888_sse2_lowp+0xb38>
.byte 15,16,72,64 // movups 0x40(%rax),%xmm1
.byte 68,15,16,136,192,0,0,0 // movups 0xc0(%rax),%xmm9
.byte 65,15,88,200 // addps %xmm8,%xmm1
- .byte 68,15,40,21,214,212,0,0 // movaps 0xd4d6(%rip),%xmm10 # 364d0 <_sk_srcover_bgra_8888_sse2_lowp+0x11c8>
+ .byte 68,15,40,21,194,212,0,0 // movaps 0xd4c2(%rip),%xmm10 # 36480 <_sk_srcover_bgra_8888_sse2_lowp+0x1178>
.byte 69,15,89,209 // mulps %xmm9,%xmm10
- .byte 68,15,88,21,218,212,0,0 // addps 0xd4da(%rip),%xmm10 # 364e0 <_sk_srcover_bgra_8888_sse2_lowp+0x11d8>
+ .byte 68,15,88,21,198,212,0,0 // addps 0xd4c6(%rip),%xmm10 # 36490 <_sk_srcover_bgra_8888_sse2_lowp+0x1188>
.byte 69,15,89,209 // mulps %xmm9,%xmm10
.byte 69,15,88,208 // addps %xmm8,%xmm10
.byte 69,15,89,209 // mulps %xmm9,%xmm10
- .byte 68,15,88,21,214,212,0,0 // addps 0xd4d6(%rip),%xmm10 # 364f0 <_sk_srcover_bgra_8888_sse2_lowp+0x11e8>
+ .byte 68,15,88,21,194,212,0,0 // addps 0xd4c2(%rip),%xmm10 # 364a0 <_sk_srcover_bgra_8888_sse2_lowp+0x1198>
.byte 68,15,17,144,64,1,0,0 // movups %xmm10,0x140(%rax)
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 255,224 // jmpq *%rax
@@ -49839,11 +49820,11 @@ _sk_bicubic_p3y_sse2:
.byte 72,173 // lods %ds:(%rsi),%rax
.byte 15,16,72,64 // movups 0x40(%rax),%xmm1
.byte 68,15,16,128,192,0,0,0 // movups 0xc0(%rax),%xmm8
- .byte 15,88,13,165,212,0,0 // addps 0xd4a5(%rip),%xmm1 # 364e0 <_sk_srcover_bgra_8888_sse2_lowp+0x11d8>
+ .byte 15,88,13,145,212,0,0 // addps 0xd491(%rip),%xmm1 # 36490 <_sk_srcover_bgra_8888_sse2_lowp+0x1188>
.byte 69,15,40,200 // movaps %xmm8,%xmm9
.byte 69,15,89,201 // mulps %xmm9,%xmm9
- .byte 68,15,89,5,117,212,0,0 // mulps 0xd475(%rip),%xmm8 # 364c0 <_sk_srcover_bgra_8888_sse2_lowp+0x11b8>
- .byte 68,15,88,5,253,207,0,0 // addps 0xcffd(%rip),%xmm8 # 36050 <_sk_srcover_bgra_8888_sse2_lowp+0xd48>
+ .byte 68,15,89,5,97,212,0,0 // mulps 0xd461(%rip),%xmm8 # 36470 <_sk_srcover_bgra_8888_sse2_lowp+0x1168>
+ .byte 68,15,88,5,57,208,0,0 // addps 0xd039(%rip),%xmm8 # 36050 <_sk_srcover_bgra_8888_sse2_lowp+0xd48>
.byte 69,15,89,193 // mulps %xmm9,%xmm8
.byte 68,15,17,128,64,1,0,0 // movups %xmm8,0x140(%rax)
.byte 72,173 // lods %ds:(%rsi),%rax
@@ -49988,7 +49969,7 @@ _sk_clut_3D_sse2:
.byte 102,65,15,254,205 // paddd %xmm13,%xmm1
.byte 102,68,15,127,108,36,208 // movdqa %xmm13,-0x30(%rsp)
.byte 102,15,254,217 // paddd %xmm1,%xmm3
- .byte 102,68,15,111,5,188,210,0,0 // movdqa 0xd2bc(%rip),%xmm8 # 36510 <_sk_srcover_bgra_8888_sse2_lowp+0x1208>
+ .byte 102,68,15,111,5,168,210,0,0 // movdqa 0xd2a8(%rip),%xmm8 # 364c0 <_sk_srcover_bgra_8888_sse2_lowp+0x11b8>
.byte 102,15,112,195,245 // pshufd $0xf5,%xmm3,%xmm0
.byte 102,65,15,244,216 // pmuludq %xmm8,%xmm3
.byte 102,65,15,244,192 // pmuludq %xmm8,%xmm0
@@ -50027,7 +50008,7 @@ _sk_clut_3D_sse2:
.byte 243,66,15,16,44,139 // movss (%rbx,%r9,4),%xmm5
.byte 15,20,236 // unpcklps %xmm4,%xmm5
.byte 102,15,20,221 // unpcklpd %xmm5,%xmm3
- .byte 102,68,15,111,37,115,203,0,0 // movdqa 0xcb73(%rip),%xmm12 # 35e80 <_sk_srcover_bgra_8888_sse2_lowp+0xb78>
+ .byte 102,68,15,111,37,175,203,0,0 // movdqa 0xcbaf(%rip),%xmm12 # 35e80 <_sk_srcover_bgra_8888_sse2_lowp+0xb78>
.byte 102,65,15,254,196 // paddd %xmm12,%xmm0
.byte 102,15,112,224,78 // pshufd $0x4e,%xmm0,%xmm4
.byte 102,73,15,126,224 // movq %xmm4,%r8
@@ -50043,7 +50024,7 @@ _sk_clut_3D_sse2:
.byte 243,66,15,16,36,139 // movss (%rbx,%r9,4),%xmm4
.byte 15,20,224 // unpcklps %xmm0,%xmm4
.byte 102,15,20,236 // unpcklpd %xmm4,%xmm5
- .byte 15,40,37,168,209,0,0 // movaps 0xd1a8(%rip),%xmm4 # 36500 <_sk_srcover_bgra_8888_sse2_lowp+0x11f8>
+ .byte 15,40,37,148,209,0,0 // movaps 0xd194(%rip),%xmm4 # 364b0 <_sk_srcover_bgra_8888_sse2_lowp+0x11a8>
.byte 68,15,88,220 // addps %xmm4,%xmm11
.byte 68,15,41,92,36,192 // movaps %xmm11,-0x40(%rsp)
.byte 68,15,40,223 // movaps %xmm7,%xmm11
@@ -50079,7 +50060,7 @@ _sk_clut_3D_sse2:
.byte 15,20,249 // unpcklps %xmm1,%xmm7
.byte 102,15,20,252 // unpcklpd %xmm4,%xmm7
.byte 102,15,111,202 // movdqa %xmm2,%xmm1
- .byte 102,15,250,13,29,209,0,0 // psubd 0xd11d(%rip),%xmm1 # 36520 <_sk_srcover_bgra_8888_sse2_lowp+0x1218>
+ .byte 102,15,250,13,9,209,0,0 // psubd 0xd109(%rip),%xmm1 # 364d0 <_sk_srcover_bgra_8888_sse2_lowp+0x11c8>
.byte 102,15,112,225,78 // pshufd $0x4e,%xmm1,%xmm4
.byte 102,73,15,126,224 // movq %xmm4,%r8
.byte 102,72,15,126,200 // movq %xmm1,%rax
@@ -50169,7 +50150,7 @@ _sk_clut_3D_sse2:
.byte 243,15,16,44,131 // movss (%rbx,%rax,4),%xmm5
.byte 15,20,233 // unpcklps %xmm1,%xmm5
.byte 102,15,20,221 // unpcklpd %xmm5,%xmm3
- .byte 102,68,15,111,45,229,200,0,0 // movdqa 0xc8e5(%rip),%xmm13 # 35e80 <_sk_srcover_bgra_8888_sse2_lowp+0xb78>
+ .byte 102,68,15,111,45,33,201,0,0 // movdqa 0xc921(%rip),%xmm13 # 35e80 <_sk_srcover_bgra_8888_sse2_lowp+0xb78>
.byte 102,65,15,254,197 // paddd %xmm13,%xmm0
.byte 102,15,112,200,78 // pshufd $0x4e,%xmm0,%xmm1
.byte 102,73,15,126,200 // movq %xmm1,%r8
@@ -50266,7 +50247,7 @@ _sk_clut_3D_sse2:
.byte 102,15,111,206 // movdqa %xmm6,%xmm1
.byte 102,65,15,254,202 // paddd %xmm10,%xmm1
.byte 102,15,112,209,245 // pshufd $0xf5,%xmm1,%xmm2
- .byte 102,15,111,29,184,205,0,0 // movdqa 0xcdb8(%rip),%xmm3 # 36510 <_sk_srcover_bgra_8888_sse2_lowp+0x1208>
+ .byte 102,15,111,29,164,205,0,0 // movdqa 0xcda4(%rip),%xmm3 # 364c0 <_sk_srcover_bgra_8888_sse2_lowp+0x11b8>
.byte 102,15,244,203 // pmuludq %xmm3,%xmm1
.byte 102,15,244,211 // pmuludq %xmm3,%xmm2
.byte 102,15,111,251 // movdqa %xmm3,%xmm7
@@ -50304,7 +50285,7 @@ _sk_clut_3D_sse2:
.byte 243,15,16,44,131 // movss (%rbx,%rax,4),%xmm5
.byte 15,20,236 // unpcklps %xmm4,%xmm5
.byte 102,15,20,213 // unpcklpd %xmm5,%xmm2
- .byte 102,15,111,5,120,198,0,0 // movdqa 0xc678(%rip),%xmm0 # 35e80 <_sk_srcover_bgra_8888_sse2_lowp+0xb78>
+ .byte 102,15,111,5,180,198,0,0 // movdqa 0xc6b4(%rip),%xmm0 # 35e80 <_sk_srcover_bgra_8888_sse2_lowp+0xb78>
.byte 102,15,254,216 // paddd %xmm0,%xmm3
.byte 102,15,112,227,78 // pshufd $0x4e,%xmm3,%xmm4
.byte 102,73,15,126,224 // movq %xmm4,%r8
@@ -50385,7 +50366,7 @@ _sk_clut_3D_sse2:
.byte 102,15,111,214 // movdqa %xmm6,%xmm2
.byte 102,65,15,254,212 // paddd %xmm12,%xmm2
.byte 102,15,112,194,245 // pshufd $0xf5,%xmm2,%xmm0
- .byte 102,15,111,13,149,203,0,0 // movdqa 0xcb95(%rip),%xmm1 # 36510 <_sk_srcover_bgra_8888_sse2_lowp+0x1208>
+ .byte 102,15,111,13,129,203,0,0 // movdqa 0xcb81(%rip),%xmm1 # 364c0 <_sk_srcover_bgra_8888_sse2_lowp+0x11b8>
.byte 102,15,244,209 // pmuludq %xmm1,%xmm2
.byte 102,15,244,193 // pmuludq %xmm1,%xmm0
.byte 102,15,111,241 // movdqa %xmm1,%xmm6
@@ -50407,7 +50388,7 @@ _sk_clut_3D_sse2:
.byte 68,15,20,209 // unpcklps %xmm1,%xmm10
.byte 102,68,15,20,210 // unpcklpd %xmm2,%xmm10
.byte 102,15,111,200 // movdqa %xmm0,%xmm1
- .byte 102,15,250,13,58,203,0,0 // psubd 0xcb3a(%rip),%xmm1 # 36520 <_sk_srcover_bgra_8888_sse2_lowp+0x1218>
+ .byte 102,15,250,13,38,203,0,0 // psubd 0xcb26(%rip),%xmm1 # 364d0 <_sk_srcover_bgra_8888_sse2_lowp+0x11c8>
.byte 102,15,112,209,78 // pshufd $0x4e,%xmm1,%xmm2
.byte 102,73,15,126,208 // movq %xmm2,%r8
.byte 102,72,15,126,200 // movq %xmm1,%rax
@@ -50422,7 +50403,7 @@ _sk_clut_3D_sse2:
.byte 243,15,16,20,131 // movss (%rbx,%rax,4),%xmm2
.byte 15,20,209 // unpcklps %xmm1,%xmm2
.byte 102,15,20,226 // unpcklpd %xmm2,%xmm4
- .byte 102,15,254,5,85,196,0,0 // paddd 0xc455(%rip),%xmm0 # 35e80 <_sk_srcover_bgra_8888_sse2_lowp+0xb78>
+ .byte 102,15,254,5,145,196,0,0 // paddd 0xc491(%rip),%xmm0 # 35e80 <_sk_srcover_bgra_8888_sse2_lowp+0xb78>
.byte 102,15,112,200,78 // pshufd $0x4e,%xmm0,%xmm1
.byte 102,73,15,126,200 // movq %xmm1,%r8
.byte 102,72,15,126,192 // movq %xmm0,%rax
@@ -50459,7 +50440,7 @@ _sk_clut_3D_sse2:
.byte 15,20,199 // unpcklps %xmm7,%xmm0
.byte 102,15,20,193 // unpcklpd %xmm1,%xmm0
.byte 102,15,111,202 // movdqa %xmm2,%xmm1
- .byte 102,15,250,13,68,202,0,0 // psubd 0xca44(%rip),%xmm1 # 36520 <_sk_srcover_bgra_8888_sse2_lowp+0x1218>
+ .byte 102,15,250,13,48,202,0,0 // psubd 0xca30(%rip),%xmm1 # 364d0 <_sk_srcover_bgra_8888_sse2_lowp+0x11c8>
.byte 102,15,112,249,78 // pshufd $0x4e,%xmm1,%xmm7
.byte 102,73,15,126,248 // movq %xmm7,%r8
.byte 102,72,15,126,200 // movq %xmm1,%rax
@@ -50474,7 +50455,7 @@ _sk_clut_3D_sse2:
.byte 243,15,16,52,131 // movss (%rbx,%rax,4),%xmm6
.byte 15,20,247 // unpcklps %xmm7,%xmm6
.byte 102,15,20,206 // unpcklpd %xmm6,%xmm1
- .byte 102,15,254,21,95,195,0,0 // paddd 0xc35f(%rip),%xmm2 # 35e80 <_sk_srcover_bgra_8888_sse2_lowp+0xb78>
+ .byte 102,15,254,21,155,195,0,0 // paddd 0xc39b(%rip),%xmm2 # 35e80 <_sk_srcover_bgra_8888_sse2_lowp+0xb78>
.byte 102,15,112,242,78 // pshufd $0x4e,%xmm2,%xmm6
.byte 102,73,15,126,240 // movq %xmm6,%r8
.byte 102,72,15,126,208 // movq %xmm2,%rax
@@ -50620,7 +50601,7 @@ _sk_clut_4D_sse2:
.byte 102,65,15,254,210 // paddd %xmm10,%xmm2
.byte 102,15,111,220 // movdqa %xmm4,%xmm3
.byte 102,15,254,218 // paddd %xmm2,%xmm3
- .byte 102,15,111,37,135,199,0,0 // movdqa 0xc787(%rip),%xmm4 # 36510 <_sk_srcover_bgra_8888_sse2_lowp+0x1208>
+ .byte 102,15,111,37,115,199,0,0 // movdqa 0xc773(%rip),%xmm4 # 364c0 <_sk_srcover_bgra_8888_sse2_lowp+0x11b8>
.byte 102,15,112,195,245 // pshufd $0xf5,%xmm3,%xmm0
.byte 102,15,244,220 // pmuludq %xmm4,%xmm3
.byte 102,15,244,196 // pmuludq %xmm4,%xmm0
@@ -50659,7 +50640,7 @@ _sk_clut_4D_sse2:
.byte 243,66,15,16,52,139 // movss (%rbx,%r9,4),%xmm6
.byte 15,20,244 // unpcklps %xmm4,%xmm6
.byte 102,15,20,238 // unpcklpd %xmm6,%xmm5
- .byte 102,15,254,5,65,192,0,0 // paddd 0xc041(%rip),%xmm0 # 35e80 <_sk_srcover_bgra_8888_sse2_lowp+0xb78>
+ .byte 102,15,254,5,125,192,0,0 // paddd 0xc07d(%rip),%xmm0 # 35e80 <_sk_srcover_bgra_8888_sse2_lowp+0xb78>
.byte 102,15,112,224,78 // pshufd $0x4e,%xmm0,%xmm4
.byte 102,73,15,126,224 // movq %xmm4,%r8
.byte 102,73,15,126,193 // movq %xmm0,%r9
@@ -50674,7 +50655,7 @@ _sk_clut_4D_sse2:
.byte 243,66,15,16,52,139 // movss (%rbx,%r9,4),%xmm6
.byte 15,20,244 // unpcklps %xmm4,%xmm6
.byte 102,15,20,222 // unpcklpd %xmm6,%xmm3
- .byte 15,40,53,123,198,0,0 // movaps 0xc67b(%rip),%xmm6 # 36500 <_sk_srcover_bgra_8888_sse2_lowp+0x11f8>
+ .byte 15,40,53,103,198,0,0 // movaps 0xc667(%rip),%xmm6 # 364b0 <_sk_srcover_bgra_8888_sse2_lowp+0x11a8>
.byte 68,15,88,198 // addps %xmm6,%xmm8
.byte 68,15,41,68,36,176 // movaps %xmm8,-0x50(%rsp)
.byte 68,15,88,254 // addps %xmm6,%xmm15
@@ -50692,7 +50673,7 @@ _sk_clut_4D_sse2:
.byte 102,65,15,254,215 // paddd %xmm15,%xmm2
.byte 102,68,15,127,124,36,224 // movdqa %xmm15,-0x20(%rsp)
.byte 102,15,112,194,245 // pshufd $0xf5,%xmm2,%xmm0
- .byte 102,15,111,13,49,198,0,0 // movdqa 0xc631(%rip),%xmm1 # 36510 <_sk_srcover_bgra_8888_sse2_lowp+0x1208>
+ .byte 102,15,111,13,29,198,0,0 // movdqa 0xc61d(%rip),%xmm1 # 364c0 <_sk_srcover_bgra_8888_sse2_lowp+0x11b8>
.byte 102,15,244,209 // pmuludq %xmm1,%xmm2
.byte 102,15,244,193 // pmuludq %xmm1,%xmm0
.byte 102,15,112,192,232 // pshufd $0xe8,%xmm0,%xmm0
@@ -50713,7 +50694,7 @@ _sk_clut_4D_sse2:
.byte 15,20,240 // unpcklps %xmm0,%xmm6
.byte 102,15,20,242 // unpcklpd %xmm2,%xmm6
.byte 102,15,111,193 // movdqa %xmm1,%xmm0
- .byte 102,15,250,5,220,197,0,0 // psubd 0xc5dc(%rip),%xmm0 # 36520 <_sk_srcover_bgra_8888_sse2_lowp+0x1218>
+ .byte 102,15,250,5,200,197,0,0 // psubd 0xc5c8(%rip),%xmm0 # 364d0 <_sk_srcover_bgra_8888_sse2_lowp+0x11c8>
.byte 102,15,112,208,78 // pshufd $0x4e,%xmm0,%xmm2
.byte 102,73,15,126,208 // movq %xmm2,%r8
.byte 102,72,15,126,192 // movq %xmm0,%rax
@@ -50728,7 +50709,7 @@ _sk_clut_4D_sse2:
.byte 243,68,15,16,28,131 // movss (%rbx,%rax,4),%xmm11
.byte 68,15,20,216 // unpcklps %xmm0,%xmm11
.byte 102,65,15,20,211 // unpcklpd %xmm11,%xmm2
- .byte 102,15,254,13,244,190,0,0 // paddd 0xbef4(%rip),%xmm1 # 35e80 <_sk_srcover_bgra_8888_sse2_lowp+0xb78>
+ .byte 102,15,254,13,48,191,0,0 // paddd 0xbf30(%rip),%xmm1 # 35e80 <_sk_srcover_bgra_8888_sse2_lowp+0xb78>
.byte 102,15,112,193,78 // pshufd $0x4e,%xmm1,%xmm0
.byte 102,73,15,126,192 // movq %xmm0,%r8
.byte 102,72,15,126,200 // movq %xmm1,%rax
@@ -50766,7 +50747,7 @@ _sk_clut_4D_sse2:
.byte 102,65,15,111,194 // movdqa %xmm10,%xmm0
.byte 102,15,254,68,36,160 // paddd -0x60(%rsp),%xmm0
.byte 102,15,112,216,245 // pshufd $0xf5,%xmm0,%xmm3
- .byte 102,15,111,37,219,196,0,0 // movdqa 0xc4db(%rip),%xmm4 # 36510 <_sk_srcover_bgra_8888_sse2_lowp+0x1208>
+ .byte 102,15,111,37,199,196,0,0 // movdqa 0xc4c7(%rip),%xmm4 # 364c0 <_sk_srcover_bgra_8888_sse2_lowp+0x11b8>
.byte 102,15,244,196 // pmuludq %xmm4,%xmm0
.byte 102,15,244,220 // pmuludq %xmm4,%xmm3
.byte 102,68,15,111,220 // movdqa %xmm4,%xmm11
@@ -50804,7 +50785,7 @@ _sk_clut_4D_sse2:
.byte 243,15,16,60,131 // movss (%rbx,%rax,4),%xmm7
.byte 15,20,253 // unpcklps %xmm5,%xmm7
.byte 102,15,20,199 // unpcklpd %xmm7,%xmm0
- .byte 102,68,15,111,5,151,189,0,0 // movdqa 0xbd97(%rip),%xmm8 # 35e80 <_sk_srcover_bgra_8888_sse2_lowp+0xb78>
+ .byte 102,68,15,111,5,211,189,0,0 // movdqa 0xbdd3(%rip),%xmm8 # 35e80 <_sk_srcover_bgra_8888_sse2_lowp+0xb78>
.byte 102,65,15,254,224 // paddd %xmm8,%xmm4
.byte 102,15,112,236,78 // pshufd $0x4e,%xmm4,%xmm5
.byte 102,73,15,126,232 // movq %xmm5,%r8
@@ -50950,7 +50931,7 @@ _sk_clut_4D_sse2:
.byte 243,15,16,36,131 // movss (%rbx,%rax,4),%xmm4
.byte 15,20,226 // unpcklps %xmm2,%xmm4
.byte 102,15,20,252 // unpcklpd %xmm4,%xmm7
- .byte 102,68,15,111,61,241,186,0,0 // movdqa 0xbaf1(%rip),%xmm15 # 35e80 <_sk_srcover_bgra_8888_sse2_lowp+0xb78>
+ .byte 102,68,15,111,61,45,187,0,0 // movdqa 0xbb2d(%rip),%xmm15 # 35e80 <_sk_srcover_bgra_8888_sse2_lowp+0xb78>
.byte 102,65,15,254,207 // paddd %xmm15,%xmm1
.byte 102,15,112,209,78 // pshufd $0x4e,%xmm1,%xmm2
.byte 102,73,15,126,208 // movq %xmm2,%r8
@@ -51033,7 +51014,7 @@ _sk_clut_4D_sse2:
.byte 102,65,15,111,217 // movdqa %xmm9,%xmm3
.byte 102,65,15,254,216 // paddd %xmm8,%xmm3
.byte 102,15,112,211,245 // pshufd $0xf5,%xmm3,%xmm2
- .byte 102,15,111,45,16,192,0,0 // movdqa 0xc010(%rip),%xmm5 # 36510 <_sk_srcover_bgra_8888_sse2_lowp+0x1208>
+ .byte 102,15,111,45,252,191,0,0 // movdqa 0xbffc(%rip),%xmm5 # 364c0 <_sk_srcover_bgra_8888_sse2_lowp+0x11b8>
.byte 102,15,244,221 // pmuludq %xmm5,%xmm3
.byte 102,15,244,213 // pmuludq %xmm5,%xmm2
.byte 102,15,112,234,232 // pshufd $0xe8,%xmm2,%xmm5
@@ -51054,7 +51035,7 @@ _sk_clut_4D_sse2:
.byte 68,15,20,198 // unpcklps %xmm6,%xmm8
.byte 102,68,15,20,197 // unpcklpd %xmm5,%xmm8
.byte 102,15,111,234 // movdqa %xmm2,%xmm5
- .byte 102,15,250,45,185,191,0,0 // psubd 0xbfb9(%rip),%xmm5 # 36520 <_sk_srcover_bgra_8888_sse2_lowp+0x1218>
+ .byte 102,15,250,45,165,191,0,0 // psubd 0xbfa5(%rip),%xmm5 # 364d0 <_sk_srcover_bgra_8888_sse2_lowp+0x11c8>
.byte 102,15,112,245,78 // pshufd $0x4e,%xmm5,%xmm6
.byte 102,73,15,126,240 // movq %xmm6,%r8
.byte 102,72,15,126,232 // movq %xmm5,%rax
@@ -51086,7 +51067,7 @@ _sk_clut_4D_sse2:
.byte 102,15,20,214 // unpcklpd %xmm6,%xmm2
.byte 102,69,15,254,205 // paddd %xmm13,%xmm9
.byte 102,65,15,112,233,245 // pshufd $0xf5,%xmm9,%xmm5
- .byte 102,15,111,29,23,191,0,0 // movdqa 0xbf17(%rip),%xmm3 # 36510 <_sk_srcover_bgra_8888_sse2_lowp+0x1208>
+ .byte 102,15,111,29,3,191,0,0 // movdqa 0xbf03(%rip),%xmm3 # 364c0 <_sk_srcover_bgra_8888_sse2_lowp+0x11b8>
.byte 102,68,15,244,203 // pmuludq %xmm3,%xmm9
.byte 102,15,244,235 // pmuludq %xmm3,%xmm5
.byte 102,15,112,237,232 // pshufd $0xe8,%xmm5,%xmm5
@@ -51107,7 +51088,7 @@ _sk_clut_4D_sse2:
.byte 69,15,20,233 // unpcklps %xmm9,%xmm13
.byte 102,68,15,20,237 // unpcklpd %xmm5,%xmm13
.byte 102,65,15,111,239 // movdqa %xmm15,%xmm5
- .byte 102,15,250,45,183,190,0,0 // psubd 0xbeb7(%rip),%xmm5 # 36520 <_sk_srcover_bgra_8888_sse2_lowp+0x1218>
+ .byte 102,15,250,45,163,190,0,0 // psubd 0xbea3(%rip),%xmm5 # 364d0 <_sk_srcover_bgra_8888_sse2_lowp+0x11c8>
.byte 102,15,112,221,78 // pshufd $0x4e,%xmm5,%xmm3
.byte 102,73,15,126,216 // movq %xmm3,%r8
.byte 102,72,15,126,232 // movq %xmm5,%rax
@@ -51122,7 +51103,7 @@ _sk_clut_4D_sse2:
.byte 243,15,16,44,131 // movss (%rbx,%rax,4),%xmm5
.byte 15,20,235 // unpcklps %xmm3,%xmm5
.byte 102,15,20,245 // unpcklpd %xmm5,%xmm6
- .byte 102,68,15,111,13,209,183,0,0 // movdqa 0xb7d1(%rip),%xmm9 # 35e80 <_sk_srcover_bgra_8888_sse2_lowp+0xb78>
+ .byte 102,68,15,111,13,13,184,0,0 // movdqa 0xb80d(%rip),%xmm9 # 35e80 <_sk_srcover_bgra_8888_sse2_lowp+0xb78>
.byte 102,69,15,254,249 // paddd %xmm9,%xmm15
.byte 102,65,15,112,223,78 // pshufd $0x4e,%xmm15,%xmm3
.byte 102,73,15,126,216 // movq %xmm3,%r8
@@ -51184,7 +51165,7 @@ _sk_clut_4D_sse2:
.byte 102,65,15,111,195 // movdqa %xmm11,%xmm0
.byte 102,15,254,195 // paddd %xmm3,%xmm0
.byte 102,15,112,200,245 // pshufd $0xf5,%xmm0,%xmm1
- .byte 102,15,111,21,82,189,0,0 // movdqa 0xbd52(%rip),%xmm2 # 36510 <_sk_srcover_bgra_8888_sse2_lowp+0x1208>
+ .byte 102,15,111,21,62,189,0,0 // movdqa 0xbd3e(%rip),%xmm2 # 364c0 <_sk_srcover_bgra_8888_sse2_lowp+0x11b8>
.byte 102,15,244,194 // pmuludq %xmm2,%xmm0
.byte 102,15,244,202 // pmuludq %xmm2,%xmm1
.byte 102,68,15,111,234 // movdqa %xmm2,%xmm13
@@ -51377,7 +51358,7 @@ _sk_clut_4D_sse2:
.byte 68,15,20,238 // unpcklps %xmm6,%xmm13
.byte 102,68,15,20,234 // unpcklpd %xmm2,%xmm13
.byte 102,15,111,212 // movdqa %xmm4,%xmm2
- .byte 102,15,250,21,238,185,0,0 // psubd 0xb9ee(%rip),%xmm2 # 36520 <_sk_srcover_bgra_8888_sse2_lowp+0x1218>
+ .byte 102,15,250,21,218,185,0,0 // psubd 0xb9da(%rip),%xmm2 # 364d0 <_sk_srcover_bgra_8888_sse2_lowp+0x11c8>
.byte 102,15,112,242,78 // pshufd $0x4e,%xmm2,%xmm6
.byte 102,73,15,126,240 // movq %xmm6,%r8
.byte 102,72,15,126,208 // movq %xmm2,%rax
@@ -51437,7 +51418,7 @@ _sk_clut_4D_sse2:
.byte 102,68,15,111,116,36,160 // movdqa -0x60(%rsp),%xmm14
.byte 102,65,15,254,198 // paddd %xmm14,%xmm0
.byte 102,15,112,200,245 // pshufd $0xf5,%xmm0,%xmm1
- .byte 102,68,15,111,5,205,184,0,0 // movdqa 0xb8cd(%rip),%xmm8 # 36510 <_sk_srcover_bgra_8888_sse2_lowp+0x1208>
+ .byte 102,68,15,111,5,185,184,0,0 // movdqa 0xb8b9(%rip),%xmm8 # 364c0 <_sk_srcover_bgra_8888_sse2_lowp+0x11b8>
.byte 102,65,15,244,192 // pmuludq %xmm8,%xmm0
.byte 102,65,15,244,200 // pmuludq %xmm8,%xmm1
.byte 102,65,15,111,240 // movdqa %xmm8,%xmm6
@@ -51475,7 +51456,7 @@ _sk_clut_4D_sse2:
.byte 243,15,16,44,131 // movss (%rbx,%rax,4),%xmm5
.byte 15,20,235 // unpcklps %xmm3,%xmm5
.byte 102,15,20,205 // unpcklpd %xmm5,%xmm1
- .byte 102,68,15,111,5,139,177,0,0 // movdqa 0xb18b(%rip),%xmm8 # 35e80 <_sk_srcover_bgra_8888_sse2_lowp+0xb78>
+ .byte 102,68,15,111,5,199,177,0,0 // movdqa 0xb1c7(%rip),%xmm8 # 35e80 <_sk_srcover_bgra_8888_sse2_lowp+0xb78>
.byte 102,65,15,254,208 // paddd %xmm8,%xmm2
.byte 102,15,112,218,78 // pshufd $0x4e,%xmm2,%xmm3
.byte 102,73,15,126,216 // movq %xmm3,%r8
@@ -51558,7 +51539,7 @@ _sk_clut_4D_sse2:
.byte 102,15,254,208 // paddd %xmm0,%xmm2
.byte 102,15,111,240 // movdqa %xmm0,%xmm6
.byte 102,15,112,194,245 // pshufd $0xf5,%xmm2,%xmm0
- .byte 102,15,111,37,167,182,0,0 // movdqa 0xb6a7(%rip),%xmm4 # 36510 <_sk_srcover_bgra_8888_sse2_lowp+0x1208>
+ .byte 102,15,111,37,147,182,0,0 // movdqa 0xb693(%rip),%xmm4 # 364c0 <_sk_srcover_bgra_8888_sse2_lowp+0x11b8>
.byte 102,15,244,212 // pmuludq %xmm4,%xmm2
.byte 102,15,244,196 // pmuludq %xmm4,%xmm0
.byte 102,15,112,200,232 // pshufd $0xe8,%xmm0,%xmm1
@@ -51579,7 +51560,7 @@ _sk_clut_4D_sse2:
.byte 68,15,20,193 // unpcklps %xmm1,%xmm8
.byte 102,68,15,20,194 // unpcklpd %xmm2,%xmm8
.byte 102,15,111,200 // movdqa %xmm0,%xmm1
- .byte 102,15,250,13,80,182,0,0 // psubd 0xb650(%rip),%xmm1 # 36520 <_sk_srcover_bgra_8888_sse2_lowp+0x1218>
+ .byte 102,15,250,13,60,182,0,0 // psubd 0xb63c(%rip),%xmm1 # 364d0 <_sk_srcover_bgra_8888_sse2_lowp+0x11c8>
.byte 102,15,112,209,78 // pshufd $0x4e,%xmm1,%xmm2
.byte 102,73,15,126,208 // movq %xmm2,%r8
.byte 102,72,15,126,200 // movq %xmm1,%rax
@@ -51594,7 +51575,7 @@ _sk_clut_4D_sse2:
.byte 243,15,16,20,131 // movss (%rbx,%rax,4),%xmm2
.byte 15,20,209 // unpcklps %xmm1,%xmm2
.byte 102,68,15,20,242 // unpcklpd %xmm2,%xmm14
- .byte 102,15,254,5,105,175,0,0 // paddd 0xaf69(%rip),%xmm0 # 35e80 <_sk_srcover_bgra_8888_sse2_lowp+0xb78>
+ .byte 102,15,254,5,165,175,0,0 // paddd 0xafa5(%rip),%xmm0 # 35e80 <_sk_srcover_bgra_8888_sse2_lowp+0xb78>
.byte 102,15,112,200,78 // pshufd $0x4e,%xmm0,%xmm1
.byte 102,73,15,126,200 // movq %xmm1,%r8
.byte 102,72,15,126,192 // movq %xmm0,%rax
@@ -51632,7 +51613,7 @@ _sk_clut_4D_sse2:
.byte 15,20,198 // unpcklps %xmm6,%xmm0
.byte 102,15,20,193 // unpcklpd %xmm1,%xmm0
.byte 102,15,111,202 // movdqa %xmm2,%xmm1
- .byte 102,15,250,13,88,181,0,0 // psubd 0xb558(%rip),%xmm1 # 36520 <_sk_srcover_bgra_8888_sse2_lowp+0x1218>
+ .byte 102,15,250,13,68,181,0,0 // psubd 0xb544(%rip),%xmm1 # 364d0 <_sk_srcover_bgra_8888_sse2_lowp+0x11c8>
.byte 102,15,112,241,78 // pshufd $0x4e,%xmm1,%xmm6
.byte 102,73,15,126,240 // movq %xmm6,%r8
.byte 102,72,15,126,200 // movq %xmm1,%rax
@@ -51647,7 +51628,7 @@ _sk_clut_4D_sse2:
.byte 243,15,16,36,131 // movss (%rbx,%rax,4),%xmm4
.byte 15,20,230 // unpcklps %xmm6,%xmm4
.byte 102,15,20,204 // unpcklpd %xmm4,%xmm1
- .byte 102,15,254,21,115,174,0,0 // paddd 0xae73(%rip),%xmm2 # 35e80 <_sk_srcover_bgra_8888_sse2_lowp+0xb78>
+ .byte 102,15,254,21,175,174,0,0 // paddd 0xaeaf(%rip),%xmm2 # 35e80 <_sk_srcover_bgra_8888_sse2_lowp+0xb78>
.byte 102,15,112,226,78 // pshufd $0x4e,%xmm2,%xmm4
.byte 102,73,15,126,224 // movq %xmm4,%r8
.byte 102,72,15,126,208 // movq %xmm2,%rax
@@ -51706,7 +51687,7 @@ _sk_clut_4D_sse2:
.byte 15,89,212 // mulps %xmm4,%xmm2
.byte 65,15,88,215 // addps %xmm15,%xmm2
.byte 72,173 // lods %ds:(%rsi),%rax
- .byte 15,40,29,95,173,0,0 // movaps 0xad5f(%rip),%xmm3 # 35e50 <_sk_srcover_bgra_8888_sse2_lowp+0xb48>
+ .byte 15,40,29,155,173,0,0 // movaps 0xad9b(%rip),%xmm3 # 35e50 <_sk_srcover_bgra_8888_sse2_lowp+0xb48>
.byte 15,40,100,36,96 // movaps 0x60(%rsp),%xmm4
.byte 15,40,108,36,112 // movaps 0x70(%rsp),%xmm5
.byte 15,40,180,36,128,0,0,0 // movaps 0x80(%rsp),%xmm6
@@ -51714,6 +51695,25 @@ _sk_clut_4D_sse2:
.byte 72,129,196,160,0,0,0 // add $0xa0,%rsp
.byte 91 // pop %rbx
.byte 255,224 // jmpq *%rax
+
+HIDDEN _sk_gauss_a_to_rgba_sse2
+.globl _sk_gauss_a_to_rgba_sse2
+FUNCTION(_sk_gauss_a_to_rgba_sse2)
+_sk_gauss_a_to_rgba_sse2:
+ .byte 15,40,5,0,180,0,0 // movaps 0xb400(%rip),%xmm0 # 364e0 <_sk_srcover_bgra_8888_sse2_lowp+0x11d8>
+ .byte 15,89,195 // mulps %xmm3,%xmm0
+ .byte 15,88,5,6,180,0,0 // addps 0xb406(%rip),%xmm0 # 364f0 <_sk_srcover_bgra_8888_sse2_lowp+0x11e8>
+ .byte 15,89,195 // mulps %xmm3,%xmm0
+ .byte 15,88,5,12,180,0,0 // addps 0xb40c(%rip),%xmm0 # 36500 <_sk_srcover_bgra_8888_sse2_lowp+0x11f8>
+ .byte 15,89,195 // mulps %xmm3,%xmm0
+ .byte 15,88,5,18,180,0,0 // addps 0xb412(%rip),%xmm0 # 36510 <_sk_srcover_bgra_8888_sse2_lowp+0x1208>
+ .byte 15,89,195 // mulps %xmm3,%xmm0
+ .byte 15,88,5,24,180,0,0 // addps 0xb418(%rip),%xmm0 # 36520 <_sk_srcover_bgra_8888_sse2_lowp+0x1218>
+ .byte 72,173 // lods %ds:(%rsi),%rax
+ .byte 15,40,200 // movaps %xmm0,%xmm1
+ .byte 15,40,208 // movaps %xmm0,%xmm2
+ .byte 15,40,216 // movaps %xmm0,%xmm3
+ .byte 255,224 // jmpq *%rax
.byte 144 // nop
.byte 144 // nop
.byte 144 // nop
@@ -62778,16 +62778,9 @@ BALIGN4
.byte 208 // (bad)
.byte 179,89 // mov $0x59,%bl
.byte 62,152 // ds cwtl
- .byte 221,147,61,45,16,17 // fstl 0x11102d3d(%rbx)
- .byte 192,18,120 // rclb $0x78,(%rdx)
- .byte 57,64,32 // cmp %eax,0x20(%rax)
- .byte 148 // xchg %eax,%esp
- .byte 90 // pop %rdx
- .byte 62,4,157 // ds add $0x9d,%al
- .byte 30 // (bad)
- .byte 62,0,24 // add %bl,%ds:(%rax)
- .byte 161,57,111,43,231,187,159,215,202 // movabs 0xcad79fbbe72b6f39,%eax
- .byte 60,212 // cmp $0xd4,%al
+ .byte 221,147,61,111,43,231 // fstl -0x18d490c3(%rbx)
+ .byte 187,159,215,202,60 // mov $0x3ccad79f,%ebx
+ .byte 212 // (bad)
.byte 100,84 // fs push %rsp
.byte 189,169,240,34,62 // mov $0x3e22f0a9,%ebp
.byte 0,0 // add %al,(%rax)
@@ -62798,26 +62791,25 @@ BALIGN4
.byte 0,0 // add %al,(%rax)
.byte 128,0,0 // addb $0x0,(%rax)
.byte 0,191,0,0,192,191 // add %bh,-0x40400000(%rdi)
- .byte 114,28 // jb 3573e <.literal4+0x18a>
+ .byte 114,28 // jb 3572a <.literal4+0x176>
.byte 199 // (bad)
.byte 62,85 // ds push %rbp
.byte 85 // push %rbp
.byte 149 // xchg %eax,%ebp
.byte 191,0,0,192,63 // mov $0x3fc00000,%edi
.byte 57,142,99,61,114,249 // cmp %ecx,-0x68dc29d(%rsi)
- .byte 127,63 // jg 35773 <_sk_srcover_bgra_8888_sse2_lowp+0x46b>
+ .byte 127,63 // jg 3575f <_sk_srcover_bgra_8888_sse2_lowp+0x457>
.byte 3,0 // add (%rax),%eax
.byte 0,0 // add %al,(%rax)
- .byte 109 // insl (%dx),%es:(%rdi)
- .byte 165 // movsl %ds:(%rsi),%es:(%rdi)
- .byte 144 // nop
- .byte 63 // (bad)
- .byte 252 // cld
- .byte 191,16,62,0,4 // mov $0x4003e10,%edi
+ .byte 45,16,17,192,18 // sub $0x12c01110,%eax
+ .byte 120,57 // js 35764 <_sk_srcover_bgra_8888_sse2_lowp+0x45c>
+ .byte 64,32,148,90,62,4,157,30 // and %dl,0x1e9d043e(%rdx,%rbx,2)
+ .byte 62,0,24 // add %bl,%ds:(%rax)
+ .byte 161,57,109,165,144,63,252,191,16 // movabs 0x10bffc3f90a56d39,%eax
+ .byte 62,0,4,0 // add %al,%ds:(%rax,%rax,1)
.byte 0,0 // add %al,(%rax)
.byte 0,0 // add %al,(%rax)
- .byte 0,56 // add %bh,(%rax)
- .byte 255 // (bad)
+ .byte 56,255 // cmp %bh,%bh
.byte 255 // (bad)
.byte 255 // (bad)
.byte 127,0 // jg 3574d <.literal4+0x199>
@@ -64364,28 +64356,7 @@ BALIGN16
.byte 221,147,61,152,221,147 // fstl -0x6c2267c3(%rbx)
.byte 61,152,221,147,61 // cmp $0x3d93dd98,%eax
.byte 152 // cwtl
- .byte 221,147,61,45,16,17 // fstl 0x11102d3d(%rbx)
- .byte 192,45,16,17,192,45,16 // shrb $0x10,0x2dc01110(%rip) # 2dc374fa <_sk_srcover_bgra_8888_sse2_lowp+0x2dc021f2>
- .byte 17,192 // adc %eax,%eax
- .byte 45,16,17,192,18 // sub $0x12c01110,%eax
- .byte 120,57 // js 3642c <.literal16+0x63c>
- .byte 64,18,120,57 // adc 0x39(%rax),%dil
- .byte 64,18,120,57 // adc 0x39(%rax),%dil
- .byte 64,18,120,57 // adc 0x39(%rax),%dil
- .byte 64,32,148,90,62,32,148,90 // and %dl,0x5a94203e(%rdx,%rbx,2)
- .byte 62,32,148,90,62,32,148,90 // and %dl,%ds:0x5a94203e(%rdx,%rbx,2)
- .byte 62,4,157 // ds add $0x9d,%al
- .byte 30 // (bad)
- .byte 62,4,157 // ds add $0x9d,%al
- .byte 30 // (bad)
- .byte 62,4,157 // ds add $0x9d,%al
- .byte 30 // (bad)
- .byte 62,4,157 // ds add $0x9d,%al
- .byte 30 // (bad)
- .byte 62,0,24 // add %bl,%ds:(%rax)
- .byte 161,57,0,24,161,57,0,24,161 // movabs 0xa1180039a1180039,%eax
- .byte 57,0 // cmp %eax,(%rax)
- .byte 24,161,57,111,43,231 // sbb %ah,-0x18d490c7(%rcx)
+ .byte 221,147,61,111,43,231 // fstl -0x18d490c3(%rbx)
.byte 187,111,43,231,187 // mov $0xbbe72b6f,%ebx
.byte 111 // outsl %ds:(%rsi),(%dx)
.byte 43,231 // sub %edi,%esp
@@ -64433,13 +64404,13 @@ BALIGN16
.byte 192,191,0,0,192,191,0 // sarb $0x0,-0x40400000(%rdi)
.byte 0,192 // add %al,%al
.byte 191,0,0,192,191 // mov $0xbfc00000,%edi
- .byte 114,28 // jb 364de <.literal16+0x6ee>
+ .byte 114,28 // jb 3648e <.literal16+0x69e>
.byte 199 // (bad)
- .byte 62,114,28 // jb,pt 364e2 <.literal16+0x6f2>
+ .byte 62,114,28 // jb,pt 36492 <.literal16+0x6a2>
.byte 199 // (bad)
- .byte 62,114,28 // jb,pt 364e6 <.literal16+0x6f6>
+ .byte 62,114,28 // jb,pt 36496 <.literal16+0x6a6>
.byte 199 // (bad)
- .byte 62,114,28 // jb,pt 364ea <.literal16+0x6fa>
+ .byte 62,114,28 // jb,pt 3649a <.literal16+0x6aa>
.byte 199 // (bad)
.byte 62,85 // ds push %rbp
.byte 85 // push %rbp
@@ -64458,15 +64429,15 @@ BALIGN16
.byte 0,192 // add %al,%al
.byte 63 // (bad)
.byte 57,142,99,61,57,142 // cmp %ecx,-0x71c6c29d(%rsi)
- .byte 99,61,57,142,99,61 // movslq 0x3d638e39(%rip),%edi # 3d66f335 <_sk_srcover_bgra_8888_sse2_lowp+0x3d63a02d>
+ .byte 99,61,57,142,99,61 // movslq 0x3d638e39(%rip),%edi # 3d66f2e5 <_sk_srcover_bgra_8888_sse2_lowp+0x3d639fdd>
.byte 57,142,99,61,114,249 // cmp %ecx,-0x68dc29d(%rsi)
- .byte 127,63 // jg 36543 <.literal16+0x753>
- .byte 114,249 // jb 364ff <.literal16+0x70f>
- .byte 127,63 // jg 36547 <.literal16+0x757>
- .byte 114,249 // jb 36503 <.literal16+0x713>
- .byte 127,63 // jg 3654b <.literal16+0x75b>
- .byte 114,249 // jb 36507 <.literal16+0x717>
- .byte 127,63 // jg 3654f <.literal16+0x75f>
+ .byte 127,63 // jg 364f3 <.literal16+0x703>
+ .byte 114,249 // jb 364af <.literal16+0x6bf>
+ .byte 127,63 // jg 364f7 <.literal16+0x707>
+ .byte 114,249 // jb 364b3 <.literal16+0x6c3>
+ .byte 127,63 // jg 364fb <.literal16+0x70b>
+ .byte 114,249 // jb 364b7 <.literal16+0x6c7>
+ .byte 127,63 // jg 364ff <.literal16+0x70f>
.byte 3,0 // add (%rax),%eax
.byte 0,0 // add %al,(%rax)
.byte 3,0 // add (%rax),%eax
@@ -64490,8 +64461,28 @@ BALIGN16
.byte 255 // (bad)
.byte 255 // (bad)
.byte 255 // (bad)
- .byte 255,0 // incl (%rax)
- .byte 0,255 // add %bh,%bh
+ .byte 255,45,16,17,192,45 // ljmp *0x2dc01110(%rip) # 2dc375f5 <_sk_srcover_bgra_8888_sse2_lowp+0x2dc022ed>
+ .byte 16,17 // adc %dl,(%rcx)
+ .byte 192,45,16,17,192,45,16 // shrb $0x10,0x2dc01110(%rip) # 2dc375fe <_sk_srcover_bgra_8888_sse2_lowp+0x2dc022f6>
+ .byte 17,192 // adc %eax,%eax
+ .byte 18,120,57 // adc 0x39(%rax),%bh
+ .byte 64,18,120,57 // adc 0x39(%rax),%dil
+ .byte 64,18,120,57 // adc 0x39(%rax),%dil
+ .byte 64,18,120,57 // adc 0x39(%rax),%dil
+ .byte 64,32,148,90,62,32,148,90 // and %dl,0x5a94203e(%rdx,%rbx,2)
+ .byte 62,32,148,90,62,32,148,90 // and %dl,%ds:0x5a94203e(%rdx,%rbx,2)
+ .byte 62,4,157 // ds add $0x9d,%al
+ .byte 30 // (bad)
+ .byte 62,4,157 // ds add $0x9d,%al
+ .byte 30 // (bad)
+ .byte 62,4,157 // ds add $0x9d,%al
+ .byte 30 // (bad)
+ .byte 62,4,157 // ds add $0x9d,%al
+ .byte 30 // (bad)
+ .byte 62,0,24 // add %bl,%ds:(%rax)
+ .byte 161,57,0,24,161,57,0,24,161 // movabs 0xa1180039a1180039,%eax
+ .byte 57,0 // cmp %eax,(%rax)
+ .byte 24,161,57,0,0,255 // sbb %ah,-0xffffc7(%rcx)
.byte 255,0 // incl (%rax)
.byte 0,255 // add %bh,%bh
.byte 255,0 // incl (%rax)
@@ -73210,37 +73201,6 @@ _sk_evenly_spaced_gradient_sse2:
.byte 93 // pop %ebp
.byte 195 // ret
-HIDDEN _sk_gauss_a_to_rgba_sse2
-.globl _sk_gauss_a_to_rgba_sse2
-FUNCTION(_sk_gauss_a_to_rgba_sse2)
-_sk_gauss_a_to_rgba_sse2:
- .byte 85 // push %ebp
- .byte 137,229 // mov %esp,%ebp
- .byte 131,236,8 // sub $0x8,%esp
- .byte 232,0,0,0,0 // call 697e <_sk_gauss_a_to_rgba_sse2+0xb>
- .byte 88 // pop %eax
- .byte 139,77,12 // mov 0xc(%ebp),%ecx
- .byte 15,40,128,226,121,0,0 // movaps 0x79e2(%eax),%xmm0
- .byte 15,89,195 // mulps %xmm3,%xmm0
- .byte 15,88,128,242,121,0,0 // addps 0x79f2(%eax),%xmm0
- .byte 15,89,195 // mulps %xmm3,%xmm0
- .byte 15,88,128,2,122,0,0 // addps 0x7a02(%eax),%xmm0
- .byte 15,89,195 // mulps %xmm3,%xmm0
- .byte 15,88,128,18,122,0,0 // addps 0x7a12(%eax),%xmm0
- .byte 15,89,195 // mulps %xmm3,%xmm0
- .byte 15,88,128,34,122,0,0 // addps 0x7a22(%eax),%xmm0
- .byte 141,65,4 // lea 0x4(%ecx),%eax
- .byte 131,236,8 // sub $0x8,%esp
- .byte 15,40,200 // movaps %xmm0,%xmm1
- .byte 15,40,208 // movaps %xmm0,%xmm2
- .byte 15,40,216 // movaps %xmm0,%xmm3
- .byte 80 // push %eax
- .byte 255,117,8 // pushl 0x8(%ebp)
- .byte 255,17 // call *(%ecx)
- .byte 131,196,24 // add $0x18,%esp
- .byte 93 // pop %ebp
- .byte 195 // ret
-
HIDDEN _sk_gradient_sse2
.globl _sk_gradient_sse2
FUNCTION(_sk_gradient_sse2)
@@ -73256,7 +73216,7 @@ _sk_gradient_sse2:
.byte 139,10 // mov (%edx),%ecx
.byte 102,15,239,201 // pxor %xmm1,%xmm1
.byte 131,249,2 // cmp $0x2,%ecx
- .byte 114,33 // jb 6a05 <_sk_gradient_sse2+0x3a>
+ .byte 114,33 // jb 69ad <_sk_gradient_sse2+0x3a>
.byte 139,114,36 // mov 0x24(%edx),%esi
.byte 73 // dec %ecx
.byte 131,198,4 // add $0x4,%esi
@@ -73267,7 +73227,7 @@ _sk_gradient_sse2:
.byte 102,15,250,202 // psubd %xmm2,%xmm1
.byte 131,198,4 // add $0x4,%esi
.byte 73 // dec %ecx
- .byte 117,234 // jne 69ef <_sk_gradient_sse2+0x24>
+ .byte 117,234 // jne 6997 <_sk_gradient_sse2+0x24>
.byte 102,15,126,206 // movd %xmm1,%esi
.byte 102,15,112,209,229 // pshufd $0xe5,%xmm1,%xmm2
.byte 102,15,112,217,78 // pshufd $0x4e,%xmm1,%xmm3
@@ -73420,7 +73380,7 @@ _sk_xy_to_unit_angle_sse2:
.byte 15,40,218 // movaps %xmm2,%xmm3
.byte 15,40,209 // movaps %xmm1,%xmm2
.byte 15,40,200 // movaps %xmm0,%xmm1
- .byte 232,0,0,0,0 // call 6c0d <_sk_xy_to_unit_angle_sse2+0x18>
+ .byte 232,0,0,0,0 // call 6bb5 <_sk_xy_to_unit_angle_sse2+0x18>
.byte 88 // pop %eax
.byte 15,87,237 // xorps %xmm5,%xmm5
.byte 15,92,233 // subps %xmm1,%xmm5
@@ -73435,30 +73395,30 @@ _sk_xy_to_unit_angle_sse2:
.byte 15,94,247 // divps %xmm7,%xmm6
.byte 15,40,254 // movaps %xmm6,%xmm7
.byte 15,89,255 // mulps %xmm7,%xmm7
- .byte 15,40,128,163,119,0,0 // movaps 0x77a3(%eax),%xmm0
+ .byte 15,40,128,171,119,0,0 // movaps 0x77ab(%eax),%xmm0
.byte 15,89,199 // mulps %xmm7,%xmm0
- .byte 15,88,128,179,119,0,0 // addps 0x77b3(%eax),%xmm0
+ .byte 15,88,128,187,119,0,0 // addps 0x77bb(%eax),%xmm0
.byte 15,89,199 // mulps %xmm7,%xmm0
- .byte 15,88,128,195,119,0,0 // addps 0x77c3(%eax),%xmm0
+ .byte 15,88,128,203,119,0,0 // addps 0x77cb(%eax),%xmm0
.byte 15,89,199 // mulps %xmm7,%xmm0
- .byte 15,88,128,211,119,0,0 // addps 0x77d3(%eax),%xmm0
+ .byte 15,88,128,219,119,0,0 // addps 0x77db(%eax),%xmm0
.byte 15,89,198 // mulps %xmm6,%xmm0
.byte 15,194,236,1 // cmpltps %xmm4,%xmm5
- .byte 15,40,176,227,119,0,0 // movaps 0x77e3(%eax),%xmm6
+ .byte 15,40,176,235,119,0,0 // movaps 0x77eb(%eax),%xmm6
.byte 15,92,240 // subps %xmm0,%xmm6
.byte 15,84,245 // andps %xmm5,%xmm6
.byte 15,85,232 // andnps %xmm0,%xmm5
.byte 15,87,228 // xorps %xmm4,%xmm4
.byte 15,86,238 // orps %xmm6,%xmm5
.byte 15,194,204,1 // cmpltps %xmm4,%xmm1
- .byte 15,40,128,163,113,0,0 // movaps 0x71a3(%eax),%xmm0
+ .byte 15,40,128,251,113,0,0 // movaps 0x71fb(%eax),%xmm0
.byte 15,92,197 // subps %xmm5,%xmm0
.byte 15,84,193 // andps %xmm1,%xmm0
.byte 15,85,205 // andnps %xmm5,%xmm1
.byte 15,86,200 // orps %xmm0,%xmm1
.byte 15,40,194 // movaps %xmm2,%xmm0
.byte 15,194,196,1 // cmpltps %xmm4,%xmm0
- .byte 15,40,168,179,113,0,0 // movaps 0x71b3(%eax),%xmm5
+ .byte 15,40,168,11,114,0,0 // movaps 0x720b(%eax),%xmm5
.byte 15,92,233 // subps %xmm1,%xmm5
.byte 15,84,232 // andps %xmm0,%xmm5
.byte 15,85,193 // andnps %xmm1,%xmm0
@@ -73519,15 +73479,15 @@ _sk_xy_to_2pt_conical_quadratic_max_sse2:
.byte 15,40,241 // movaps %xmm1,%xmm6
.byte 15,89,246 // mulps %xmm6,%xmm6
.byte 15,88,240 // addps %xmm0,%xmm6
- .byte 232,0,0,0,0 // call 6d2a <_sk_xy_to_2pt_conical_quadratic_max_sse2+0x31>
+ .byte 232,0,0,0,0 // call 6cd2 <_sk_xy_to_2pt_conical_quadratic_max_sse2+0x31>
.byte 90 // pop %edx
.byte 243,15,89,237 // mulss %xmm5,%xmm5
.byte 15,198,237,0 // shufps $0x0,%xmm5,%xmm5
.byte 15,92,245 // subps %xmm5,%xmm6
.byte 243,15,16,65,64 // movss 0x40(%ecx),%xmm0
.byte 15,198,192,0 // shufps $0x0,%xmm0,%xmm0
- .byte 15,89,162,214,118,0,0 // mulps 0x76d6(%edx),%xmm4
- .byte 15,89,130,230,118,0,0 // mulps 0x76e6(%edx),%xmm0
+ .byte 15,89,162,222,118,0,0 // mulps 0x76de(%edx),%xmm4
+ .byte 15,89,130,238,118,0,0 // mulps 0x76ee(%edx),%xmm0
.byte 15,89,198 // mulps %xmm6,%xmm0
.byte 15,40,236 // movaps %xmm4,%xmm5
.byte 15,89,237 // mulps %xmm5,%xmm5
@@ -73535,11 +73495,11 @@ _sk_xy_to_2pt_conical_quadratic_max_sse2:
.byte 15,81,237 // sqrtps %xmm5,%xmm5
.byte 15,40,197 // movaps %xmm5,%xmm0
.byte 15,92,196 // subps %xmm4,%xmm0
- .byte 15,87,162,134,117,0,0 // xorps 0x7586(%edx),%xmm4
+ .byte 15,87,162,222,117,0,0 // xorps 0x75de(%edx),%xmm4
.byte 15,92,229 // subps %xmm5,%xmm4
.byte 243,15,16,105,68 // movss 0x44(%ecx),%xmm5
.byte 15,198,237,0 // shufps $0x0,%xmm5,%xmm5
- .byte 15,89,170,134,112,0,0 // mulps 0x7086(%edx),%xmm5
+ .byte 15,89,170,222,112,0,0 // mulps 0x70de(%edx),%xmm5
.byte 15,89,197 // mulps %xmm5,%xmm0
.byte 15,89,229 // mulps %xmm5,%xmm4
.byte 15,95,196 // maxps %xmm4,%xmm0
@@ -73570,15 +73530,15 @@ _sk_xy_to_2pt_conical_quadratic_min_sse2:
.byte 15,40,241 // movaps %xmm1,%xmm6
.byte 15,89,246 // mulps %xmm6,%xmm6
.byte 15,88,240 // addps %xmm0,%xmm6
- .byte 232,0,0,0,0 // call 6dc8 <_sk_xy_to_2pt_conical_quadratic_min_sse2+0x31>
+ .byte 232,0,0,0,0 // call 6d70 <_sk_xy_to_2pt_conical_quadratic_min_sse2+0x31>
.byte 90 // pop %edx
.byte 243,15,89,237 // mulss %xmm5,%xmm5
.byte 15,198,237,0 // shufps $0x0,%xmm5,%xmm5
.byte 15,92,245 // subps %xmm5,%xmm6
.byte 243,15,16,65,64 // movss 0x40(%ecx),%xmm0
.byte 15,198,192,0 // shufps $0x0,%xmm0,%xmm0
- .byte 15,89,162,56,118,0,0 // mulps 0x7638(%edx),%xmm4
- .byte 15,89,130,72,118,0,0 // mulps 0x7648(%edx),%xmm0
+ .byte 15,89,162,64,118,0,0 // mulps 0x7640(%edx),%xmm4
+ .byte 15,89,130,80,118,0,0 // mulps 0x7650(%edx),%xmm0
.byte 15,89,198 // mulps %xmm6,%xmm0
.byte 15,40,236 // movaps %xmm4,%xmm5
.byte 15,89,237 // mulps %xmm5,%xmm5
@@ -73586,11 +73546,11 @@ _sk_xy_to_2pt_conical_quadratic_min_sse2:
.byte 15,81,237 // sqrtps %xmm5,%xmm5
.byte 15,40,197 // movaps %xmm5,%xmm0
.byte 15,92,196 // subps %xmm4,%xmm0
- .byte 15,87,162,232,116,0,0 // xorps 0x74e8(%edx),%xmm4
+ .byte 15,87,162,64,117,0,0 // xorps 0x7540(%edx),%xmm4
.byte 15,92,229 // subps %xmm5,%xmm4
.byte 243,15,16,105,68 // movss 0x44(%ecx),%xmm5
.byte 15,198,237,0 // shufps $0x0,%xmm5,%xmm5
- .byte 15,89,170,232,111,0,0 // mulps 0x6fe8(%edx),%xmm5
+ .byte 15,89,170,64,112,0,0 // mulps 0x7040(%edx),%xmm5
.byte 15,89,197 // mulps %xmm5,%xmm0
.byte 15,89,229 // mulps %xmm5,%xmm4
.byte 15,93,196 // minps %xmm4,%xmm0
@@ -73610,7 +73570,7 @@ _sk_xy_to_2pt_conical_linear_sse2:
.byte 85 // push %ebp
.byte 137,229 // mov %esp,%ebp
.byte 131,236,8 // sub $0x8,%esp
- .byte 232,0,0,0,0 // call 6e40 <_sk_xy_to_2pt_conical_linear_sse2+0xb>
+ .byte 232,0,0,0,0 // call 6de8 <_sk_xy_to_2pt_conical_linear_sse2+0xb>
.byte 89 // pop %ecx
.byte 139,69,12 // mov 0xc(%ebp),%eax
.byte 139,16 // mov (%eax),%edx
@@ -73619,7 +73579,7 @@ _sk_xy_to_2pt_conical_linear_sse2:
.byte 243,15,89,236 // mulss %xmm4,%xmm5
.byte 15,198,237,0 // shufps $0x0,%xmm5,%xmm5
.byte 15,88,232 // addps %xmm0,%xmm5
- .byte 15,89,169,192,117,0,0 // mulps 0x75c0(%ecx),%xmm5
+ .byte 15,89,169,200,117,0,0 // mulps 0x75c8(%ecx),%xmm5
.byte 15,89,192 // mulps %xmm0,%xmm0
.byte 15,40,241 // movaps %xmm1,%xmm6
.byte 15,89,246 // mulps %xmm6,%xmm6
@@ -73627,7 +73587,7 @@ _sk_xy_to_2pt_conical_linear_sse2:
.byte 243,15,89,228 // mulss %xmm4,%xmm4
.byte 15,198,228,0 // shufps $0x0,%xmm4,%xmm4
.byte 15,92,196 // subps %xmm4,%xmm0
- .byte 15,87,129,112,116,0,0 // xorps 0x7470(%ecx),%xmm0
+ .byte 15,87,129,200,116,0,0 // xorps 0x74c8(%ecx),%xmm0
.byte 15,94,197 // divps %xmm5,%xmm0
.byte 141,72,8 // lea 0x8(%eax),%ecx
.byte 131,236,8 // sub $0x8,%esp
@@ -73704,16 +73664,16 @@ _sk_save_xy_sse2:
.byte 131,236,24 // sub $0x18,%esp
.byte 15,41,93,232 // movaps %xmm3,-0x18(%ebp)
.byte 15,40,218 // movaps %xmm2,%xmm3
- .byte 232,0,0,0,0 // call 6f29 <_sk_save_xy_sse2+0x12>
+ .byte 232,0,0,0,0 // call 6ed1 <_sk_save_xy_sse2+0x12>
.byte 88 // pop %eax
- .byte 15,40,160,135,110,0,0 // movaps 0x6e87(%eax),%xmm4
+ .byte 15,40,160,223,110,0,0 // movaps 0x6edf(%eax),%xmm4
.byte 15,40,232 // movaps %xmm0,%xmm5
.byte 15,88,236 // addps %xmm4,%xmm5
.byte 243,15,91,245 // cvttps2dq %xmm5,%xmm6
.byte 15,91,246 // cvtdq2ps %xmm6,%xmm6
.byte 15,40,253 // movaps %xmm5,%xmm7
.byte 15,194,254,1 // cmpltps %xmm6,%xmm7
- .byte 15,40,144,151,110,0,0 // movaps 0x6e97(%eax),%xmm2
+ .byte 15,40,144,239,110,0,0 // movaps 0x6eef(%eax),%xmm2
.byte 15,84,250 // andps %xmm2,%xmm7
.byte 15,92,247 // subps %xmm7,%xmm6
.byte 15,92,238 // subps %xmm6,%xmm5
@@ -73788,15 +73748,15 @@ _sk_bilinear_nx_sse2:
.byte 137,229 // mov %esp,%ebp
.byte 86 // push %esi
.byte 80 // push %eax
- .byte 232,0,0,0,0 // call 7011 <_sk_bilinear_nx_sse2+0xa>
+ .byte 232,0,0,0,0 // call 6fb9 <_sk_bilinear_nx_sse2+0xa>
.byte 88 // pop %eax
.byte 139,77,8 // mov 0x8(%ebp),%ecx
.byte 139,85,12 // mov 0xc(%ebp),%edx
.byte 139,50 // mov (%edx),%esi
.byte 15,16,6 // movups (%esi),%xmm0
.byte 15,16,166,128,0,0,0 // movups 0x80(%esi),%xmm4
- .byte 15,88,128,15,116,0,0 // addps 0x740f(%eax),%xmm0
- .byte 15,40,168,175,109,0,0 // movaps 0x6daf(%eax),%xmm5
+ .byte 15,88,128,23,116,0,0 // addps 0x7417(%eax),%xmm0
+ .byte 15,40,168,7,110,0,0 // movaps 0x6e07(%eax),%xmm5
.byte 15,92,236 // subps %xmm4,%xmm5
.byte 15,17,174,0,1,0,0 // movups %xmm5,0x100(%esi)
.byte 141,66,8 // lea 0x8(%edx),%eax
@@ -73817,14 +73777,14 @@ _sk_bilinear_px_sse2:
.byte 137,229 // mov %esp,%ebp
.byte 86 // push %esi
.byte 80 // push %eax
- .byte 232,0,0,0,0 // call 7057 <_sk_bilinear_px_sse2+0xa>
+ .byte 232,0,0,0,0 // call 6fff <_sk_bilinear_px_sse2+0xa>
.byte 88 // pop %eax
.byte 139,77,8 // mov 0x8(%ebp),%ecx
.byte 139,85,12 // mov 0xc(%ebp),%edx
.byte 139,50 // mov (%edx),%esi
.byte 15,16,6 // movups (%esi),%xmm0
.byte 15,16,166,128,0,0,0 // movups 0x80(%esi),%xmm4
- .byte 15,88,128,89,109,0,0 // addps 0x6d59(%eax),%xmm0
+ .byte 15,88,128,177,109,0,0 // addps 0x6db1(%eax),%xmm0
.byte 15,17,166,0,1,0,0 // movups %xmm4,0x100(%esi)
.byte 141,66,8 // lea 0x8(%edx),%eax
.byte 131,236,8 // sub $0x8,%esp
@@ -73844,15 +73804,15 @@ _sk_bilinear_ny_sse2:
.byte 137,229 // mov %esp,%ebp
.byte 86 // push %esi
.byte 80 // push %eax
- .byte 232,0,0,0,0 // call 7093 <_sk_bilinear_ny_sse2+0xa>
+ .byte 232,0,0,0,0 // call 703b <_sk_bilinear_ny_sse2+0xa>
.byte 88 // pop %eax
.byte 139,77,8 // mov 0x8(%ebp),%ecx
.byte 139,85,12 // mov 0xc(%ebp),%edx
.byte 139,50 // mov (%edx),%esi
.byte 15,16,78,64 // movups 0x40(%esi),%xmm1
.byte 15,16,166,192,0,0,0 // movups 0xc0(%esi),%xmm4
- .byte 15,88,136,141,115,0,0 // addps 0x738d(%eax),%xmm1
- .byte 15,40,168,45,109,0,0 // movaps 0x6d2d(%eax),%xmm5
+ .byte 15,88,136,149,115,0,0 // addps 0x7395(%eax),%xmm1
+ .byte 15,40,168,133,109,0,0 // movaps 0x6d85(%eax),%xmm5
.byte 15,92,236 // subps %xmm4,%xmm5
.byte 15,17,174,64,1,0,0 // movups %xmm5,0x140(%esi)
.byte 141,66,8 // lea 0x8(%edx),%eax
@@ -73873,14 +73833,14 @@ _sk_bilinear_py_sse2:
.byte 137,229 // mov %esp,%ebp
.byte 86 // push %esi
.byte 80 // push %eax
- .byte 232,0,0,0,0 // call 70da <_sk_bilinear_py_sse2+0xa>
+ .byte 232,0,0,0,0 // call 7082 <_sk_bilinear_py_sse2+0xa>
.byte 88 // pop %eax
.byte 139,77,8 // mov 0x8(%ebp),%ecx
.byte 139,85,12 // mov 0xc(%ebp),%edx
.byte 139,50 // mov (%edx),%esi
.byte 15,16,78,64 // movups 0x40(%esi),%xmm1
.byte 15,16,166,192,0,0,0 // movups 0xc0(%esi),%xmm4
- .byte 15,88,136,214,108,0,0 // addps 0x6cd6(%eax),%xmm1
+ .byte 15,88,136,46,109,0,0 // addps 0x6d2e(%eax),%xmm1
.byte 15,17,166,64,1,0,0 // movups %xmm4,0x140(%esi)
.byte 141,66,8 // lea 0x8(%edx),%eax
.byte 131,236,8 // sub $0x8,%esp
@@ -73900,20 +73860,20 @@ _sk_bicubic_n3x_sse2:
.byte 137,229 // mov %esp,%ebp
.byte 86 // push %esi
.byte 80 // push %eax
- .byte 232,0,0,0,0 // call 7117 <_sk_bicubic_n3x_sse2+0xa>
+ .byte 232,0,0,0,0 // call 70bf <_sk_bicubic_n3x_sse2+0xa>
.byte 88 // pop %eax
.byte 139,77,8 // mov 0x8(%ebp),%ecx
.byte 139,85,12 // mov 0xc(%ebp),%edx
.byte 139,50 // mov (%edx),%esi
.byte 15,16,6 // movups (%esi),%xmm0
.byte 15,16,166,128,0,0,0 // movups 0x80(%esi),%xmm4
- .byte 15,88,128,25,115,0,0 // addps 0x7319(%eax),%xmm0
- .byte 15,40,168,169,108,0,0 // movaps 0x6ca9(%eax),%xmm5
+ .byte 15,88,128,33,115,0,0 // addps 0x7321(%eax),%xmm0
+ .byte 15,40,168,1,109,0,0 // movaps 0x6d01(%eax),%xmm5
.byte 15,92,236 // subps %xmm4,%xmm5
.byte 15,40,229 // movaps %xmm5,%xmm4
.byte 15,89,228 // mulps %xmm4,%xmm4
- .byte 15,89,168,41,115,0,0 // mulps 0x7329(%eax),%xmm5
- .byte 15,88,168,153,110,0,0 // addps 0x6e99(%eax),%xmm5
+ .byte 15,89,168,49,115,0,0 // mulps 0x7331(%eax),%xmm5
+ .byte 15,88,168,241,110,0,0 // addps 0x6ef1(%eax),%xmm5
.byte 15,89,236 // mulps %xmm4,%xmm5
.byte 15,17,174,0,1,0,0 // movups %xmm5,0x100(%esi)
.byte 141,66,8 // lea 0x8(%edx),%eax
@@ -73934,23 +73894,23 @@ _sk_bicubic_n1x_sse2:
.byte 137,229 // mov %esp,%ebp
.byte 86 // push %esi
.byte 80 // push %eax
- .byte 232,0,0,0,0 // call 7174 <_sk_bicubic_n1x_sse2+0xa>
+ .byte 232,0,0,0,0 // call 711c <_sk_bicubic_n1x_sse2+0xa>
.byte 88 // pop %eax
.byte 139,77,8 // mov 0x8(%ebp),%ecx
.byte 139,85,12 // mov 0xc(%ebp),%edx
.byte 139,50 // mov (%edx),%esi
.byte 15,16,6 // movups (%esi),%xmm0
.byte 15,16,166,128,0,0,0 // movups 0x80(%esi),%xmm4
- .byte 15,88,128,172,114,0,0 // addps 0x72ac(%eax),%xmm0
- .byte 15,40,168,76,108,0,0 // movaps 0x6c4c(%eax),%xmm5
+ .byte 15,88,128,180,114,0,0 // addps 0x72b4(%eax),%xmm0
+ .byte 15,40,168,164,108,0,0 // movaps 0x6ca4(%eax),%xmm5
.byte 15,92,236 // subps %xmm4,%xmm5
- .byte 15,40,160,220,114,0,0 // movaps 0x72dc(%eax),%xmm4
+ .byte 15,40,160,228,114,0,0 // movaps 0x72e4(%eax),%xmm4
.byte 15,89,229 // mulps %xmm5,%xmm4
- .byte 15,88,160,236,114,0,0 // addps 0x72ec(%eax),%xmm4
+ .byte 15,88,160,244,114,0,0 // addps 0x72f4(%eax),%xmm4
.byte 15,89,229 // mulps %xmm5,%xmm4
- .byte 15,88,160,60,108,0,0 // addps 0x6c3c(%eax),%xmm4
+ .byte 15,88,160,148,108,0,0 // addps 0x6c94(%eax),%xmm4
.byte 15,89,229 // mulps %xmm5,%xmm4
- .byte 15,88,160,252,114,0,0 // addps 0x72fc(%eax),%xmm4
+ .byte 15,88,160,4,115,0,0 // addps 0x7304(%eax),%xmm4
.byte 15,17,166,0,1,0,0 // movups %xmm4,0x100(%esi)
.byte 141,66,8 // lea 0x8(%edx),%eax
.byte 131,236,8 // sub $0x8,%esp
@@ -73970,22 +73930,22 @@ _sk_bicubic_p1x_sse2:
.byte 137,229 // mov %esp,%ebp
.byte 86 // push %esi
.byte 80 // push %eax
- .byte 232,0,0,0,0 // call 71df <_sk_bicubic_p1x_sse2+0xa>
+ .byte 232,0,0,0,0 // call 7187 <_sk_bicubic_p1x_sse2+0xa>
.byte 88 // pop %eax
.byte 139,77,8 // mov 0x8(%ebp),%ecx
.byte 139,85,12 // mov 0xc(%ebp),%edx
.byte 139,50 // mov (%edx),%esi
- .byte 15,40,160,209,107,0,0 // movaps 0x6bd1(%eax),%xmm4
+ .byte 15,40,160,41,108,0,0 // movaps 0x6c29(%eax),%xmm4
.byte 15,16,6 // movups (%esi),%xmm0
.byte 15,16,174,128,0,0,0 // movups 0x80(%esi),%xmm5
.byte 15,88,196 // addps %xmm4,%xmm0
- .byte 15,40,176,113,114,0,0 // movaps 0x7271(%eax),%xmm6
+ .byte 15,40,176,121,114,0,0 // movaps 0x7279(%eax),%xmm6
.byte 15,89,245 // mulps %xmm5,%xmm6
- .byte 15,88,176,129,114,0,0 // addps 0x7281(%eax),%xmm6
+ .byte 15,88,176,137,114,0,0 // addps 0x7289(%eax),%xmm6
.byte 15,89,245 // mulps %xmm5,%xmm6
.byte 15,88,244 // addps %xmm4,%xmm6
.byte 15,89,245 // mulps %xmm5,%xmm6
- .byte 15,88,176,145,114,0,0 // addps 0x7291(%eax),%xmm6
+ .byte 15,88,176,153,114,0,0 // addps 0x7299(%eax),%xmm6
.byte 15,17,182,0,1,0,0 // movups %xmm6,0x100(%esi)
.byte 141,66,8 // lea 0x8(%edx),%eax
.byte 131,236,8 // sub $0x8,%esp
@@ -74005,18 +73965,18 @@ _sk_bicubic_p3x_sse2:
.byte 137,229 // mov %esp,%ebp
.byte 86 // push %esi
.byte 80 // push %eax
- .byte 232,0,0,0,0 // call 723f <_sk_bicubic_p3x_sse2+0xa>
+ .byte 232,0,0,0,0 // call 71e7 <_sk_bicubic_p3x_sse2+0xa>
.byte 88 // pop %eax
.byte 139,77,8 // mov 0x8(%ebp),%ecx
.byte 139,85,12 // mov 0xc(%ebp),%edx
.byte 139,50 // mov (%edx),%esi
.byte 15,16,6 // movups (%esi),%xmm0
.byte 15,16,166,128,0,0,0 // movups 0x80(%esi),%xmm4
- .byte 15,88,128,33,114,0,0 // addps 0x7221(%eax),%xmm0
+ .byte 15,88,128,41,114,0,0 // addps 0x7229(%eax),%xmm0
.byte 15,40,236 // movaps %xmm4,%xmm5
.byte 15,89,237 // mulps %xmm5,%xmm5
- .byte 15,89,160,1,114,0,0 // mulps 0x7201(%eax),%xmm4
- .byte 15,88,160,113,109,0,0 // addps 0x6d71(%eax),%xmm4
+ .byte 15,89,160,9,114,0,0 // mulps 0x7209(%eax),%xmm4
+ .byte 15,88,160,201,109,0,0 // addps 0x6dc9(%eax),%xmm4
.byte 15,89,229 // mulps %xmm5,%xmm4
.byte 15,17,166,0,1,0,0 // movups %xmm4,0x100(%esi)
.byte 141,66,8 // lea 0x8(%edx),%eax
@@ -74037,20 +73997,20 @@ _sk_bicubic_n3y_sse2:
.byte 137,229 // mov %esp,%ebp
.byte 86 // push %esi
.byte 80 // push %eax
- .byte 232,0,0,0,0 // call 7292 <_sk_bicubic_n3y_sse2+0xa>
+ .byte 232,0,0,0,0 // call 723a <_sk_bicubic_n3y_sse2+0xa>
.byte 88 // pop %eax
.byte 139,77,8 // mov 0x8(%ebp),%ecx
.byte 139,85,12 // mov 0xc(%ebp),%edx
.byte 139,50 // mov (%edx),%esi
.byte 15,16,78,64 // movups 0x40(%esi),%xmm1
.byte 15,16,166,192,0,0,0 // movups 0xc0(%esi),%xmm4
- .byte 15,88,136,158,113,0,0 // addps 0x719e(%eax),%xmm1
- .byte 15,40,168,46,107,0,0 // movaps 0x6b2e(%eax),%xmm5
+ .byte 15,88,136,166,113,0,0 // addps 0x71a6(%eax),%xmm1
+ .byte 15,40,168,134,107,0,0 // movaps 0x6b86(%eax),%xmm5
.byte 15,92,236 // subps %xmm4,%xmm5
.byte 15,40,229 // movaps %xmm5,%xmm4
.byte 15,89,228 // mulps %xmm4,%xmm4
- .byte 15,89,168,174,113,0,0 // mulps 0x71ae(%eax),%xmm5
- .byte 15,88,168,30,109,0,0 // addps 0x6d1e(%eax),%xmm5
+ .byte 15,89,168,182,113,0,0 // mulps 0x71b6(%eax),%xmm5
+ .byte 15,88,168,118,109,0,0 // addps 0x6d76(%eax),%xmm5
.byte 15,89,236 // mulps %xmm4,%xmm5
.byte 15,17,174,64,1,0,0 // movups %xmm5,0x140(%esi)
.byte 141,66,8 // lea 0x8(%edx),%eax
@@ -74071,23 +74031,23 @@ _sk_bicubic_n1y_sse2:
.byte 137,229 // mov %esp,%ebp
.byte 86 // push %esi
.byte 80 // push %eax
- .byte 232,0,0,0,0 // call 72f0 <_sk_bicubic_n1y_sse2+0xa>
+ .byte 232,0,0,0,0 // call 7298 <_sk_bicubic_n1y_sse2+0xa>
.byte 88 // pop %eax
.byte 139,77,8 // mov 0x8(%ebp),%ecx
.byte 139,85,12 // mov 0xc(%ebp),%edx
.byte 139,50 // mov (%edx),%esi
.byte 15,16,78,64 // movups 0x40(%esi),%xmm1
.byte 15,16,166,192,0,0,0 // movups 0xc0(%esi),%xmm4
- .byte 15,88,136,48,113,0,0 // addps 0x7130(%eax),%xmm1
- .byte 15,40,168,208,106,0,0 // movaps 0x6ad0(%eax),%xmm5
+ .byte 15,88,136,56,113,0,0 // addps 0x7138(%eax),%xmm1
+ .byte 15,40,168,40,107,0,0 // movaps 0x6b28(%eax),%xmm5
.byte 15,92,236 // subps %xmm4,%xmm5
- .byte 15,40,160,96,113,0,0 // movaps 0x7160(%eax),%xmm4
+ .byte 15,40,160,104,113,0,0 // movaps 0x7168(%eax),%xmm4
.byte 15,89,229 // mulps %xmm5,%xmm4
- .byte 15,88,160,112,113,0,0 // addps 0x7170(%eax),%xmm4
+ .byte 15,88,160,120,113,0,0 // addps 0x7178(%eax),%xmm4
.byte 15,89,229 // mulps %xmm5,%xmm4
- .byte 15,88,160,192,106,0,0 // addps 0x6ac0(%eax),%xmm4
+ .byte 15,88,160,24,107,0,0 // addps 0x6b18(%eax),%xmm4
.byte 15,89,229 // mulps %xmm5,%xmm4
- .byte 15,88,160,128,113,0,0 // addps 0x7180(%eax),%xmm4
+ .byte 15,88,160,136,113,0,0 // addps 0x7188(%eax),%xmm4
.byte 15,17,166,64,1,0,0 // movups %xmm4,0x140(%esi)
.byte 141,66,8 // lea 0x8(%edx),%eax
.byte 131,236,8 // sub $0x8,%esp
@@ -74107,22 +74067,22 @@ _sk_bicubic_p1y_sse2:
.byte 137,229 // mov %esp,%ebp
.byte 86 // push %esi
.byte 80 // push %eax
- .byte 232,0,0,0,0 // call 735c <_sk_bicubic_p1y_sse2+0xa>
+ .byte 232,0,0,0,0 // call 7304 <_sk_bicubic_p1y_sse2+0xa>
.byte 88 // pop %eax
.byte 139,77,8 // mov 0x8(%ebp),%ecx
.byte 139,85,12 // mov 0xc(%ebp),%edx
.byte 139,50 // mov (%edx),%esi
- .byte 15,40,160,84,106,0,0 // movaps 0x6a54(%eax),%xmm4
+ .byte 15,40,160,172,106,0,0 // movaps 0x6aac(%eax),%xmm4
.byte 15,16,78,64 // movups 0x40(%esi),%xmm1
.byte 15,16,174,192,0,0,0 // movups 0xc0(%esi),%xmm5
.byte 15,88,204 // addps %xmm4,%xmm1
- .byte 15,40,176,244,112,0,0 // movaps 0x70f4(%eax),%xmm6
+ .byte 15,40,176,252,112,0,0 // movaps 0x70fc(%eax),%xmm6
.byte 15,89,245 // mulps %xmm5,%xmm6
- .byte 15,88,176,4,113,0,0 // addps 0x7104(%eax),%xmm6
+ .byte 15,88,176,12,113,0,0 // addps 0x710c(%eax),%xmm6
.byte 15,89,245 // mulps %xmm5,%xmm6
.byte 15,88,244 // addps %xmm4,%xmm6
.byte 15,89,245 // mulps %xmm5,%xmm6
- .byte 15,88,176,20,113,0,0 // addps 0x7114(%eax),%xmm6
+ .byte 15,88,176,28,113,0,0 // addps 0x711c(%eax),%xmm6
.byte 15,17,182,64,1,0,0 // movups %xmm6,0x140(%esi)
.byte 141,66,8 // lea 0x8(%edx),%eax
.byte 131,236,8 // sub $0x8,%esp
@@ -74142,18 +74102,18 @@ _sk_bicubic_p3y_sse2:
.byte 137,229 // mov %esp,%ebp
.byte 86 // push %esi
.byte 80 // push %eax
- .byte 232,0,0,0,0 // call 73bd <_sk_bicubic_p3y_sse2+0xa>
+ .byte 232,0,0,0,0 // call 7365 <_sk_bicubic_p3y_sse2+0xa>
.byte 88 // pop %eax
.byte 139,77,8 // mov 0x8(%ebp),%ecx
.byte 139,85,12 // mov 0xc(%ebp),%edx
.byte 139,50 // mov (%edx),%esi
.byte 15,16,78,64 // movups 0x40(%esi),%xmm1
.byte 15,16,166,192,0,0,0 // movups 0xc0(%esi),%xmm4
- .byte 15,88,136,163,112,0,0 // addps 0x70a3(%eax),%xmm1
+ .byte 15,88,136,171,112,0,0 // addps 0x70ab(%eax),%xmm1
.byte 15,40,236 // movaps %xmm4,%xmm5
.byte 15,89,237 // mulps %xmm5,%xmm5
- .byte 15,89,160,131,112,0,0 // mulps 0x7083(%eax),%xmm4
- .byte 15,88,160,243,107,0,0 // addps 0x6bf3(%eax),%xmm4
+ .byte 15,89,160,139,112,0,0 // mulps 0x708b(%eax),%xmm4
+ .byte 15,88,160,75,108,0,0 // addps 0x6c4b(%eax),%xmm4
.byte 15,89,229 // mulps %xmm5,%xmm4
.byte 15,17,166,64,1,0,0 // movups %xmm4,0x140(%esi)
.byte 141,66,8 // lea 0x8(%edx),%eax
@@ -74296,7 +74256,7 @@ _sk_clut_3D_sse2:
.byte 102,15,112,192,232 // pshufd $0xe8,%xmm0,%xmm0
.byte 102,15,98,200 // punpckldq %xmm0,%xmm1
.byte 102,15,127,77,136 // movdqa %xmm1,-0x78(%ebp)
- .byte 232,0,0,0,0 // call 75a3 <_sk_clut_3D_sse2+0xee>
+ .byte 232,0,0,0,0 // call 754b <_sk_clut_3D_sse2+0xee>
.byte 90 // pop %edx
.byte 243,15,91,196 // cvttps2dq %xmm4,%xmm0
.byte 102,15,127,133,8,255,255,255 // movdqa %xmm0,-0xf8(%ebp)
@@ -74304,7 +74264,7 @@ _sk_clut_3D_sse2:
.byte 102,15,254,216 // paddd %xmm0,%xmm3
.byte 102,15,111,193 // movdqa %xmm1,%xmm0
.byte 102,15,254,195 // paddd %xmm3,%xmm0
- .byte 102,15,111,162,237,110,0,0 // movdqa 0x6eed(%edx),%xmm4
+ .byte 102,15,111,162,245,110,0,0 // movdqa 0x6ef5(%edx),%xmm4
.byte 102,15,127,165,120,255,255,255 // movdqa %xmm4,-0x88(%ebp)
.byte 102,15,112,200,245 // pshufd $0xf5,%xmm0,%xmm1
.byte 102,15,244,196 // pmuludq %xmm4,%xmm0
@@ -74344,7 +74304,7 @@ _sk_clut_3D_sse2:
.byte 243,15,16,4,129 // movss (%ecx,%eax,4),%xmm0
.byte 15,20,248 // unpcklps %xmm0,%xmm7
.byte 102,15,20,252 // unpcklpd %xmm4,%xmm7
- .byte 102,15,111,130,93,104,0,0 // movdqa 0x685d(%edx),%xmm0
+ .byte 102,15,111,130,181,104,0,0 // movdqa 0x68b5(%edx),%xmm0
.byte 102,15,127,133,104,255,255,255 // movdqa %xmm0,-0x98(%ebp)
.byte 102,15,254,200 // paddd %xmm0,%xmm1
.byte 102,15,112,193,229 // pshufd $0xe5,%xmm1,%xmm0
@@ -74361,7 +74321,7 @@ _sk_clut_3D_sse2:
.byte 243,15,16,4,129 // movss (%ecx,%eax,4),%xmm0
.byte 15,20,240 // unpcklps %xmm0,%xmm6
.byte 102,15,20,241 // unpcklpd %xmm1,%xmm6
- .byte 15,40,130,221,110,0,0 // movaps 0x6edd(%edx),%xmm0
+ .byte 15,40,130,229,110,0,0 // movaps 0x6ee5(%edx),%xmm0
.byte 15,40,141,248,254,255,255 // movaps -0x108(%ebp),%xmm1
.byte 15,88,200 // addps %xmm0,%xmm1
.byte 15,41,77,200 // movaps %xmm1,-0x38(%ebp)
@@ -74981,7 +74941,7 @@ _sk_clut_4D_sse2:
.byte 102,15,112,201,232 // pshufd $0xe8,%xmm1,%xmm1
.byte 102,15,98,217 // punpckldq %xmm1,%xmm3
.byte 102,15,127,93,152 // movdqa %xmm3,-0x68(%ebp)
- .byte 232,0,0,0,0 // call 812f <_sk_clut_4D_sse2+0x165>
+ .byte 232,0,0,0,0 // call 80d7 <_sk_clut_4D_sse2+0x165>
.byte 89 // pop %ecx
.byte 15,40,197 // movaps %xmm5,%xmm0
.byte 15,41,133,168,254,255,255 // movaps %xmm0,-0x158(%ebp)
@@ -74992,7 +74952,7 @@ _sk_clut_4D_sse2:
.byte 102,15,111,212 // movdqa %xmm4,%xmm2
.byte 102,15,254,214 // paddd %xmm6,%xmm2
.byte 102,15,254,218 // paddd %xmm2,%xmm3
- .byte 102,15,111,161,97,99,0,0 // movdqa 0x6361(%ecx),%xmm4
+ .byte 102,15,111,161,105,99,0,0 // movdqa 0x6369(%ecx),%xmm4
.byte 102,15,112,203,245 // pshufd $0xf5,%xmm3,%xmm1
.byte 102,15,244,220 // pmuludq %xmm4,%xmm3
.byte 102,15,244,204 // pmuludq %xmm4,%xmm1
@@ -75034,7 +74994,7 @@ _sk_clut_4D_sse2:
.byte 15,20,223 // unpcklps %xmm7,%xmm3
.byte 102,15,20,222 // unpcklpd %xmm6,%xmm3
.byte 102,15,41,157,232,254,255,255 // movapd %xmm3,-0x118(%ebp)
- .byte 102,15,254,137,209,92,0,0 // paddd 0x5cd1(%ecx),%xmm1
+ .byte 102,15,254,137,41,93,0,0 // paddd 0x5d29(%ecx),%xmm1
.byte 102,15,112,241,229 // pshufd $0xe5,%xmm1,%xmm6
.byte 102,15,126,240 // movd %xmm6,%eax
.byte 102,15,112,241,78 // pshufd $0x4e,%xmm1,%xmm6
@@ -75049,7 +75009,7 @@ _sk_clut_4D_sse2:
.byte 243,15,16,60,130 // movss (%edx,%eax,4),%xmm7
.byte 15,20,223 // unpcklps %xmm7,%xmm3
.byte 102,15,20,222 // unpcklpd %xmm6,%xmm3
- .byte 15,40,185,81,99,0,0 // movaps 0x6351(%ecx),%xmm7
+ .byte 15,40,185,89,99,0,0 // movaps 0x6359(%ecx),%xmm7
.byte 15,88,199 // addps %xmm7,%xmm0
.byte 15,41,133,120,255,255,255 // movaps %xmm0,-0x88(%ebp)
.byte 15,40,133,248,254,255,255 // movaps -0x108(%ebp),%xmm0
@@ -75070,7 +75030,7 @@ _sk_clut_4D_sse2:
.byte 102,15,127,101,168 // movdqa %xmm4,-0x58(%ebp)
.byte 102,15,254,212 // paddd %xmm4,%xmm2
.byte 102,15,112,194,245 // pshufd $0xf5,%xmm2,%xmm0
- .byte 102,15,111,161,97,99,0,0 // movdqa 0x6361(%ecx),%xmm4
+ .byte 102,15,111,161,105,99,0,0 // movdqa 0x6369(%ecx),%xmm4
.byte 102,15,244,212 // pmuludq %xmm4,%xmm2
.byte 102,15,244,196 // pmuludq %xmm4,%xmm0
.byte 102,15,112,240,232 // pshufd $0xe8,%xmm0,%xmm6
@@ -75106,7 +75066,7 @@ _sk_clut_4D_sse2:
.byte 243,15,16,44,130 // movss (%edx,%eax,4),%xmm5
.byte 15,20,213 // unpcklps %xmm5,%xmm2
.byte 102,15,20,214 // unpcklpd %xmm6,%xmm2
- .byte 102,15,254,129,209,92,0,0 // paddd 0x5cd1(%ecx),%xmm0
+ .byte 102,15,254,129,41,93,0,0 // paddd 0x5d29(%ecx),%xmm0
.byte 102,15,112,232,229 // pshufd $0xe5,%xmm0,%xmm5
.byte 102,15,126,232 // movd %xmm5,%eax
.byte 102,15,112,232,78 // pshufd $0x4e,%xmm0,%xmm5
@@ -75190,7 +75150,7 @@ _sk_clut_4D_sse2:
.byte 243,15,16,44,130 // movss (%edx,%eax,4),%xmm5
.byte 15,20,245 // unpcklps %xmm5,%xmm6
.byte 102,15,20,240 // unpcklpd %xmm0,%xmm6
- .byte 102,15,254,137,209,92,0,0 // paddd 0x5cd1(%ecx),%xmm1
+ .byte 102,15,254,137,41,93,0,0 // paddd 0x5d29(%ecx),%xmm1
.byte 102,15,112,193,229 // pshufd $0xe5,%xmm1,%xmm0
.byte 102,15,126,192 // movd %xmm0,%eax
.byte 102,15,112,193,78 // pshufd $0x4e,%xmm1,%xmm0
@@ -75208,7 +75168,7 @@ _sk_clut_4D_sse2:
.byte 102,15,111,202 // movdqa %xmm2,%xmm1
.byte 102,15,254,77,168 // paddd -0x58(%ebp),%xmm1
.byte 102,15,112,193,245 // pshufd $0xf5,%xmm1,%xmm0
- .byte 102,15,111,145,97,99,0,0 // movdqa 0x6361(%ecx),%xmm2
+ .byte 102,15,111,145,105,99,0,0 // movdqa 0x6369(%ecx),%xmm2
.byte 102,15,244,202 // pmuludq %xmm2,%xmm1
.byte 102,15,244,194 // pmuludq %xmm2,%xmm0
.byte 102,15,112,192,232 // pshufd $0xe8,%xmm0,%xmm0
@@ -75244,7 +75204,7 @@ _sk_clut_4D_sse2:
.byte 243,15,16,4,130 // movss (%edx,%eax,4),%xmm0
.byte 15,20,216 // unpcklps %xmm0,%xmm3
.byte 102,15,20,217 // unpcklpd %xmm1,%xmm3
- .byte 102,15,254,169,209,92,0,0 // paddd 0x5cd1(%ecx),%xmm5
+ .byte 102,15,254,169,41,93,0,0 // paddd 0x5d29(%ecx),%xmm5
.byte 102,15,112,197,229 // pshufd $0xe5,%xmm5,%xmm0
.byte 102,15,126,192 // movd %xmm0,%eax
.byte 102,15,112,197,78 // pshufd $0x4e,%xmm5,%xmm0
@@ -75304,7 +75264,7 @@ _sk_clut_4D_sse2:
.byte 102,15,111,209 // movdqa %xmm1,%xmm2
.byte 102,15,254,85,152 // paddd -0x68(%ebp),%xmm2
.byte 102,15,112,194,245 // pshufd $0xf5,%xmm2,%xmm0
- .byte 102,15,111,153,97,99,0,0 // movdqa 0x6361(%ecx),%xmm3
+ .byte 102,15,111,153,105,99,0,0 // movdqa 0x6369(%ecx),%xmm3
.byte 102,15,244,211 // pmuludq %xmm3,%xmm2
.byte 102,15,244,195 // pmuludq %xmm3,%xmm0
.byte 102,15,111,251 // movdqa %xmm3,%xmm7
@@ -75343,7 +75303,7 @@ _sk_clut_4D_sse2:
.byte 243,15,16,44,130 // movss (%edx,%eax,4),%xmm5
.byte 15,20,229 // unpcklps %xmm5,%xmm4
.byte 102,15,20,227 // unpcklpd %xmm3,%xmm4
- .byte 102,15,254,129,209,92,0,0 // paddd 0x5cd1(%ecx),%xmm0
+ .byte 102,15,254,129,41,93,0,0 // paddd 0x5d29(%ecx),%xmm0
.byte 102,15,112,216,229 // pshufd $0xe5,%xmm0,%xmm3
.byte 102,15,126,216 // movd %xmm3,%eax
.byte 102,15,112,216,78 // pshufd $0x4e,%xmm0,%xmm3
@@ -75395,7 +75355,7 @@ _sk_clut_4D_sse2:
.byte 243,15,16,52,130 // movss (%edx,%eax,4),%xmm6
.byte 15,20,238 // unpcklps %xmm6,%xmm5
.byte 102,15,20,235 // unpcklpd %xmm3,%xmm5
- .byte 102,15,111,137,209,92,0,0 // movdqa 0x5cd1(%ecx),%xmm1
+ .byte 102,15,111,137,41,93,0,0 // movdqa 0x5d29(%ecx),%xmm1
.byte 102,15,254,249 // paddd %xmm1,%xmm7
.byte 102,15,112,223,229 // pshufd $0xe5,%xmm7,%xmm3
.byte 102,15,126,216 // movd %xmm3,%eax
@@ -75429,7 +75389,7 @@ _sk_clut_4D_sse2:
.byte 102,15,111,226 // movdqa %xmm2,%xmm4
.byte 102,15,254,69,152 // paddd -0x68(%ebp),%xmm0
.byte 102,15,112,208,245 // pshufd $0xf5,%xmm0,%xmm2
- .byte 102,15,111,153,97,99,0,0 // movdqa 0x6361(%ecx),%xmm3
+ .byte 102,15,111,153,105,99,0,0 // movdqa 0x6369(%ecx),%xmm3
.byte 102,15,244,195 // pmuludq %xmm3,%xmm0
.byte 102,15,244,211 // pmuludq %xmm3,%xmm2
.byte 102,15,112,218,232 // pshufd $0xe8,%xmm2,%xmm3
@@ -75486,7 +75446,7 @@ _sk_clut_4D_sse2:
.byte 102,15,111,212 // movdqa %xmm4,%xmm2
.byte 102,15,254,85,168 // paddd -0x58(%ebp),%xmm2
.byte 102,15,112,194,245 // pshufd $0xf5,%xmm2,%xmm0
- .byte 102,15,111,137,97,99,0,0 // movdqa 0x6361(%ecx),%xmm1
+ .byte 102,15,111,137,105,99,0,0 // movdqa 0x6369(%ecx),%xmm1
.byte 102,15,244,209 // pmuludq %xmm1,%xmm2
.byte 102,15,244,193 // pmuludq %xmm1,%xmm0
.byte 102,15,112,240,232 // pshufd $0xe8,%xmm0,%xmm6
@@ -75523,7 +75483,7 @@ _sk_clut_4D_sse2:
.byte 243,15,16,36,130 // movss (%edx,%eax,4),%xmm4
.byte 15,20,212 // unpcklps %xmm4,%xmm2
.byte 102,15,20,214 // unpcklpd %xmm6,%xmm2
- .byte 102,15,254,129,209,92,0,0 // paddd 0x5cd1(%ecx),%xmm0
+ .byte 102,15,254,129,41,93,0,0 // paddd 0x5d29(%ecx),%xmm0
.byte 102,15,112,224,229 // pshufd $0xe5,%xmm0,%xmm4
.byte 102,15,126,224 // movd %xmm4,%eax
.byte 102,15,112,224,78 // pshufd $0x4e,%xmm0,%xmm4
@@ -75591,7 +75551,7 @@ _sk_clut_4D_sse2:
.byte 102,15,111,93,152 // movdqa -0x68(%ebp),%xmm3
.byte 102,15,254,217 // paddd %xmm1,%xmm3
.byte 102,15,112,211,245 // pshufd $0xf5,%xmm3,%xmm2
- .byte 102,15,111,129,97,99,0,0 // movdqa 0x6361(%ecx),%xmm0
+ .byte 102,15,111,129,105,99,0,0 // movdqa 0x6369(%ecx),%xmm0
.byte 102,15,244,216 // pmuludq %xmm0,%xmm3
.byte 102,15,244,208 // pmuludq %xmm0,%xmm2
.byte 102,15,111,248 // movdqa %xmm0,%xmm7
@@ -75630,7 +75590,7 @@ _sk_clut_4D_sse2:
.byte 243,15,16,28,130 // movss (%edx,%eax,4),%xmm3
.byte 15,20,235 // unpcklps %xmm3,%xmm5
.byte 102,15,20,238 // unpcklpd %xmm6,%xmm5
- .byte 102,15,254,145,209,92,0,0 // paddd 0x5cd1(%ecx),%xmm2
+ .byte 102,15,254,145,41,93,0,0 // paddd 0x5d29(%ecx),%xmm2
.byte 102,15,112,218,229 // pshufd $0xe5,%xmm2,%xmm3
.byte 102,15,126,216 // movd %xmm3,%eax
.byte 102,15,112,218,78 // pshufd $0x4e,%xmm2,%xmm3
@@ -75682,7 +75642,7 @@ _sk_clut_4D_sse2:
.byte 243,15,16,4,130 // movss (%edx,%eax,4),%xmm0
.byte 15,20,208 // unpcklps %xmm0,%xmm2
.byte 102,15,20,215 // unpcklpd %xmm7,%xmm2
- .byte 102,15,111,137,209,92,0,0 // movdqa 0x5cd1(%ecx),%xmm1
+ .byte 102,15,111,137,41,93,0,0 // movdqa 0x5d29(%ecx),%xmm1
.byte 102,15,254,217 // paddd %xmm1,%xmm3
.byte 102,15,112,195,229 // pshufd $0xe5,%xmm3,%xmm0
.byte 102,15,126,192 // movd %xmm0,%eax
@@ -75717,7 +75677,7 @@ _sk_clut_4D_sse2:
.byte 102,15,111,194 // movdqa %xmm2,%xmm0
.byte 102,15,254,69,152 // paddd -0x68(%ebp),%xmm0
.byte 102,15,112,224,245 // pshufd $0xf5,%xmm0,%xmm4
- .byte 102,15,111,169,97,99,0,0 // movdqa 0x6361(%ecx),%xmm5
+ .byte 102,15,111,169,105,99,0,0 // movdqa 0x6369(%ecx),%xmm5
.byte 102,15,111,221 // movdqa %xmm5,%xmm3
.byte 102,15,244,195 // pmuludq %xmm3,%xmm0
.byte 102,15,244,227 // pmuludq %xmm3,%xmm4
@@ -75773,7 +75733,7 @@ _sk_clut_4D_sse2:
.byte 102,15,111,202 // movdqa %xmm2,%xmm1
.byte 102,15,254,77,168 // paddd -0x58(%ebp),%xmm1
.byte 102,15,112,193,245 // pshufd $0xf5,%xmm1,%xmm0
- .byte 102,15,111,145,97,99,0,0 // movdqa 0x6361(%ecx),%xmm2
+ .byte 102,15,111,145,105,99,0,0 // movdqa 0x6369(%ecx),%xmm2
.byte 102,15,244,202 // pmuludq %xmm2,%xmm1
.byte 102,15,244,194 // pmuludq %xmm2,%xmm0
.byte 102,15,112,192,232 // pshufd $0xe8,%xmm0,%xmm0
@@ -75809,7 +75769,7 @@ _sk_clut_4D_sse2:
.byte 243,15,16,4,130 // movss (%edx,%eax,4),%xmm0
.byte 15,20,216 // unpcklps %xmm0,%xmm3
.byte 102,15,20,217 // unpcklpd %xmm1,%xmm3
- .byte 102,15,254,185,209,92,0,0 // paddd 0x5cd1(%ecx),%xmm7
+ .byte 102,15,254,185,41,93,0,0 // paddd 0x5d29(%ecx),%xmm7
.byte 102,15,112,199,229 // pshufd $0xe5,%xmm7,%xmm0
.byte 102,15,126,192 // movd %xmm0,%eax
.byte 102,15,112,199,78 // pshufd $0x4e,%xmm7,%xmm0
@@ -75859,7 +75819,7 @@ _sk_clut_4D_sse2:
.byte 102,15,111,233 // movdqa %xmm1,%xmm5
.byte 102,15,254,69,152 // paddd -0x68(%ebp),%xmm0
.byte 102,15,112,200,245 // pshufd $0xf5,%xmm0,%xmm1
- .byte 102,15,111,145,97,99,0,0 // movdqa 0x6361(%ecx),%xmm2
+ .byte 102,15,111,145,105,99,0,0 // movdqa 0x6369(%ecx),%xmm2
.byte 102,15,244,194 // pmuludq %xmm2,%xmm0
.byte 102,15,244,202 // pmuludq %xmm2,%xmm1
.byte 102,15,111,250 // movdqa %xmm2,%xmm7
@@ -75898,7 +75858,7 @@ _sk_clut_4D_sse2:
.byte 243,15,16,36,130 // movss (%edx,%eax,4),%xmm4
.byte 15,20,204 // unpcklps %xmm4,%xmm1
.byte 102,15,20,203 // unpcklpd %xmm3,%xmm1
- .byte 102,15,254,145,209,92,0,0 // paddd 0x5cd1(%ecx),%xmm2
+ .byte 102,15,254,145,41,93,0,0 // paddd 0x5d29(%ecx),%xmm2
.byte 102,15,112,218,229 // pshufd $0xe5,%xmm2,%xmm3
.byte 102,15,126,216 // movd %xmm3,%eax
.byte 102,15,112,218,78 // pshufd $0x4e,%xmm2,%xmm3
@@ -75952,7 +75912,7 @@ _sk_clut_4D_sse2:
.byte 243,15,16,36,130 // movss (%edx,%eax,4),%xmm4
.byte 15,20,252 // unpcklps %xmm4,%xmm7
.byte 102,15,20,254 // unpcklpd %xmm6,%xmm7
- .byte 102,15,254,153,209,92,0,0 // paddd 0x5cd1(%ecx),%xmm3
+ .byte 102,15,254,153,41,93,0,0 // paddd 0x5d29(%ecx),%xmm3
.byte 102,15,112,227,229 // pshufd $0xe5,%xmm3,%xmm4
.byte 102,15,126,224 // movd %xmm4,%eax
.byte 102,15,112,227,78 // pshufd $0x4e,%xmm3,%xmm4
@@ -75985,7 +75945,7 @@ _sk_clut_4D_sse2:
.byte 102,15,254,208 // paddd %xmm0,%xmm2
.byte 102,15,111,216 // movdqa %xmm0,%xmm3
.byte 102,15,112,194,245 // pshufd $0xf5,%xmm2,%xmm0
- .byte 102,15,111,137,97,99,0,0 // movdqa 0x6361(%ecx),%xmm1
+ .byte 102,15,111,137,105,99,0,0 // movdqa 0x6369(%ecx),%xmm1
.byte 102,15,244,209 // pmuludq %xmm1,%xmm2
.byte 102,15,244,193 // pmuludq %xmm1,%xmm0
.byte 102,15,111,241 // movdqa %xmm1,%xmm6
@@ -76025,7 +75985,7 @@ _sk_clut_4D_sse2:
.byte 15,20,225 // unpcklps %xmm1,%xmm4
.byte 102,15,20,226 // unpcklpd %xmm2,%xmm4
.byte 102,15,41,165,88,255,255,255 // movapd %xmm4,-0xa8(%ebp)
- .byte 102,15,254,129,209,92,0,0 // paddd 0x5cd1(%ecx),%xmm0
+ .byte 102,15,254,129,41,93,0,0 // paddd 0x5d29(%ecx),%xmm0
.byte 102,15,112,200,229 // pshufd $0xe5,%xmm0,%xmm1
.byte 102,15,126,200 // movd %xmm1,%eax
.byte 102,15,112,200,78 // pshufd $0x4e,%xmm0,%xmm1
@@ -76079,7 +76039,7 @@ _sk_clut_4D_sse2:
.byte 243,15,16,52,130 // movss (%edx,%eax,4),%xmm6
.byte 15,20,206 // unpcklps %xmm6,%xmm1
.byte 102,15,20,203 // unpcklpd %xmm3,%xmm1
- .byte 102,15,254,145,209,92,0,0 // paddd 0x5cd1(%ecx),%xmm2
+ .byte 102,15,254,145,41,93,0,0 // paddd 0x5d29(%ecx),%xmm2
.byte 102,15,112,218,229 // pshufd $0xe5,%xmm2,%xmm3
.byte 102,15,126,216 // movd %xmm3,%eax
.byte 102,15,112,218,78 // pshufd $0x4e,%xmm2,%xmm3
@@ -76148,7 +76108,7 @@ _sk_clut_4D_sse2:
.byte 139,85,12 // mov 0xc(%ebp),%edx
.byte 141,66,8 // lea 0x8(%edx),%eax
.byte 131,236,8 // sub $0x8,%esp
- .byte 15,40,153,145,92,0,0 // movaps 0x5c91(%ecx),%xmm3
+ .byte 15,40,153,233,92,0,0 // movaps 0x5ce9(%ecx),%xmm3
.byte 80 // push %eax
.byte 255,117,8 // pushl 0x8(%ebp)
.byte 255,82,4 // call *0x4(%edx)
@@ -76158,6 +76118,37 @@ _sk_clut_4D_sse2:
.byte 91 // pop %ebx
.byte 93 // pop %ebp
.byte 195 // ret
+
+HIDDEN _sk_gauss_a_to_rgba_sse2
+.globl _sk_gauss_a_to_rgba_sse2
+FUNCTION(_sk_gauss_a_to_rgba_sse2)
+_sk_gauss_a_to_rgba_sse2:
+ .byte 85 // push %ebp
+ .byte 137,229 // mov %esp,%ebp
+ .byte 131,236,8 // sub $0x8,%esp
+ .byte 232,0,0,0,0 // call 952c <_sk_gauss_a_to_rgba_sse2+0xb>
+ .byte 88 // pop %eax
+ .byte 139,77,12 // mov 0xc(%ebp),%ecx
+ .byte 15,40,128,36,79,0,0 // movaps 0x4f24(%eax),%xmm0
+ .byte 15,89,195 // mulps %xmm3,%xmm0
+ .byte 15,88,128,52,79,0,0 // addps 0x4f34(%eax),%xmm0
+ .byte 15,89,195 // mulps %xmm3,%xmm0
+ .byte 15,88,128,68,79,0,0 // addps 0x4f44(%eax),%xmm0
+ .byte 15,89,195 // mulps %xmm3,%xmm0
+ .byte 15,88,128,84,79,0,0 // addps 0x4f54(%eax),%xmm0
+ .byte 15,89,195 // mulps %xmm3,%xmm0
+ .byte 15,88,128,100,79,0,0 // addps 0x4f64(%eax),%xmm0
+ .byte 141,65,4 // lea 0x4(%ecx),%eax
+ .byte 131,236,8 // sub $0x8,%esp
+ .byte 15,40,200 // movaps %xmm0,%xmm1
+ .byte 15,40,208 // movaps %xmm0,%xmm2
+ .byte 15,40,216 // movaps %xmm0,%xmm3
+ .byte 80 // push %eax
+ .byte 255,117,8 // pushl 0x8(%ebp)
+ .byte 255,17 // call *(%ecx)
+ .byte 131,196,24 // add $0x18,%esp
+ .byte 93 // pop %ebp
+ .byte 195 // ret
.byte 144 // nop
.byte 144 // nop
.byte 144 // nop
@@ -82226,47 +82217,20 @@ BALIGN16
.byte 0,0 // add %al,(%eax)
.byte 211,128,0,0,211,128 // roll %cl,-0x7f2d0000(%eax)
.byte 0,0 // add %al,(%eax)
- .byte 211,128,0,0,211,45 // roll %cl,0x2dd30000(%eax)
- .byte 16,17 // adc %dl,(%ecx)
- .byte 192,45,16,17,192,45,16 // shrb $0x10,0x2dc01110
- .byte 17,192 // adc %eax,%eax
- .byte 45,16,17,192,18 // sub $0x12c01110,%eax
- .byte 120,57 // js e3ac <.literal16+0x5fc>
- .byte 64 // inc %eax
- .byte 18,120,57 // adc 0x39(%eax),%bh
- .byte 64 // inc %eax
- .byte 18,120,57 // adc 0x39(%eax),%bh
- .byte 64 // inc %eax
- .byte 18,120,57 // adc 0x39(%eax),%bh
- .byte 64 // inc %eax
- .byte 32,148,90,62,32,148,90 // and %dl,0x5a94203e(%edx,%ebx,2)
- .byte 62,32,148,90,62,32,148,90 // and %dl,%ds:0x5a94203e(%edx,%ebx,2)
- .byte 62,4,157 // ds add $0x9d,%al
- .byte 30 // push %ds
- .byte 62,4,157 // ds add $0x9d,%al
- .byte 30 // push %ds
- .byte 62,4,157 // ds add $0x9d,%al
- .byte 30 // push %ds
- .byte 62,4,157 // ds add $0x9d,%al
- .byte 30 // push %ds
- .byte 62,0,24 // add %bl,%ds:(%eax)
- .byte 161,57,0,24,161 // mov 0xa1180039,%eax
- .byte 57,0 // cmp %eax,(%eax)
- .byte 24,161,57,0,24,161 // sbb %ah,-0x5ee7ffc7(%ecx)
- .byte 57,111,43 // cmp %ebp,0x2b(%edi)
- .byte 231,187 // out %eax,$0xbb
- .byte 111 // outsl %ds:(%esi),(%dx)
+ .byte 211,128,0,0,211,111 // roll %cl,0x6fd30000(%eax)
.byte 43,231 // sub %edi,%esp
.byte 187,111,43,231,187 // mov $0xbbe72b6f,%ebx
.byte 111 // outsl %ds:(%esi),(%dx)
.byte 43,231 // sub %edi,%esp
- .byte 187,159,215,202,60 // mov $0x3ccad79f,%ebx
+ .byte 187,111,43,231,187 // mov $0xbbe72b6f,%ebx
.byte 159 // lahf
.byte 215 // xlat %ds:(%ebx)
.byte 202,60,159 // lret $0x9f3c
.byte 215 // xlat %ds:(%ebx)
.byte 202,60,159 // lret $0x9f3c
.byte 215 // xlat %ds:(%ebx)
+ .byte 202,60,159 // lret $0x9f3c
+ .byte 215 // xlat %ds:(%ebx)
.byte 202,60,212 // lret $0xd43c
.byte 100,84 // fs push %esp
.byte 189,212,100,84,189 // mov $0xbd5464d4,%ebp
@@ -82302,13 +82266,13 @@ BALIGN16
.byte 192,191,0,0,192,191,0 // sarb $0x0,-0x40400000(%edi)
.byte 0,192 // add %al,%al
.byte 191,0,0,192,191 // mov $0xbfc00000,%edi
- .byte 114,28 // jb e45e <.literal16+0x6ae>
+ .byte 114,28 // jb e40e <.literal16+0x65e>
.byte 199 // (bad)
- .byte 62,114,28 // jb,pt e462 <.literal16+0x6b2>
+ .byte 62,114,28 // jb,pt e412 <.literal16+0x662>
.byte 199 // (bad)
- .byte 62,114,28 // jb,pt e466 <.literal16+0x6b6>
+ .byte 62,114,28 // jb,pt e416 <.literal16+0x666>
.byte 199 // (bad)
- .byte 62,114,28 // jb,pt e46a <.literal16+0x6ba>
+ .byte 62,114,28 // jb,pt e41a <.literal16+0x66a>
.byte 199 // (bad)
.byte 62,85 // ds push %ebp
.byte 85 // push %ebp
@@ -82329,13 +82293,13 @@ BALIGN16
.byte 57,142,99,61,57,142 // cmp %ecx,-0x71c6c29d(%esi)
.byte 99,61,57,142,99,61 // arpl %di,0x3d638e39
.byte 57,142,99,61,114,249 // cmp %ecx,-0x68dc29d(%esi)
- .byte 127,63 // jg e4c3 <.literal16+0x713>
- .byte 114,249 // jb e47f <.literal16+0x6cf>
- .byte 127,63 // jg e4c7 <.literal16+0x717>
- .byte 114,249 // jb e483 <.literal16+0x6d3>
- .byte 127,63 // jg e4cb <.literal16+0x71b>
- .byte 114,249 // jb e487 <.literal16+0x6d7>
- .byte 127,63 // jg e4cf <.literal16+0x71f>
+ .byte 127,63 // jg e473 <.literal16+0x6c3>
+ .byte 114,249 // jb e42f <.literal16+0x67f>
+ .byte 127,63 // jg e477 <.literal16+0x6c7>
+ .byte 114,249 // jb e433 <.literal16+0x683>
+ .byte 127,63 // jg e47b <.literal16+0x6cb>
+ .byte 114,249 // jb e437 <.literal16+0x687>
+ .byte 127,63 // jg e47f <.literal16+0x6cf>
.byte 3,0 // add (%eax),%eax
.byte 0,0 // add %al,(%eax)
.byte 3,0 // add (%eax),%eax
@@ -82344,25 +82308,53 @@ BALIGN16
.byte 0,0 // add %al,(%eax)
.byte 3,0 // add (%eax),%eax
.byte 0,0 // add %al,(%eax)
- .byte 255,0 // incl (%eax)
- .byte 255,0 // incl (%eax)
- .byte 255,0 // incl (%eax)
- .byte 255,0 // incl (%eax)
- .byte 255,0 // incl (%eax)
- .byte 255,0 // incl (%eax)
- .byte 255,0 // incl (%eax)
- .byte 255,0 // incl (%eax)
- .byte 254,0 // incb (%eax)
- .byte 254,0 // incb (%eax)
- .byte 254,0 // incb (%eax)
- .byte 254,0 // incb (%eax)
- .byte 254,0 // incb (%eax)
- .byte 254,0 // incb (%eax)
- .byte 254,0 // incb (%eax)
- .byte 254,0 // incb (%eax)
+ .byte 45,16,17,192,45 // sub $0x2dc01110,%eax
+ .byte 16,17 // adc %dl,(%ecx)
+ .byte 192,45,16,17,192,45,16 // shrb $0x10,0x2dc01110
+ .byte 17,192 // adc %eax,%eax
+ .byte 18,120,57 // adc 0x39(%eax),%bh
+ .byte 64 // inc %eax
+ .byte 18,120,57 // adc 0x39(%eax),%bh
+ .byte 64 // inc %eax
+ .byte 18,120,57 // adc 0x39(%eax),%bh
+ .byte 64 // inc %eax
+ .byte 18,120,57 // adc 0x39(%eax),%bh
+ .byte 64 // inc %eax
+ .byte 32,148,90,62,32,148,90 // and %dl,0x5a94203e(%edx,%ebx,2)
+ .byte 62,32,148,90,62,32,148,90 // and %dl,%ds:0x5a94203e(%edx,%ebx,2)
+ .byte 62,4,157 // ds add $0x9d,%al
+ .byte 30 // push %ds
+ .byte 62,4,157 // ds add $0x9d,%al
+ .byte 30 // push %ds
+ .byte 62,4,157 // ds add $0x9d,%al
+ .byte 30 // push %ds
+ .byte 62,4,157 // ds add $0x9d,%al
+ .byte 30 // push %ds
+ .byte 62,0,24 // add %bl,%ds:(%eax)
+ .byte 161,57,0,24,161 // mov 0xa1180039,%eax
+ .byte 57,0 // cmp %eax,(%eax)
+ .byte 24,161,57,0,24,161 // sbb %ah,-0x5ee7ffc7(%ecx)
+ .byte 57,255 // cmp %edi,%edi
+ .byte 0,255 // add %bh,%bh
+ .byte 0,255 // add %bh,%bh
+ .byte 0,255 // add %bh,%bh
+ .byte 0,255 // add %bh,%bh
+ .byte 0,255 // add %bh,%bh
+ .byte 0,255 // add %bh,%bh
+ .byte 0,255 // add %bh,%bh
+ .byte 0,254 // add %bh,%dh
+ .byte 0,254 // add %bh,%dh
+ .byte 0,254 // add %bh,%dh
+ .byte 0,254 // add %bh,%dh
+ .byte 0,254 // add %bh,%dh
+ .byte 0,254 // add %bh,%dh
+ .byte 0,254 // add %bh,%dh
+ .byte 0,254 // add %bh,%dh
+ .byte 0,0 // add %al,(%eax)
+ .byte 128,0,128 // addb $0x80,(%eax)
.byte 0,128,0,128,0,128 // add %al,-0x7fff8000(%eax)
.byte 0,128,0,128,0,128 // add %al,-0x7fff8000(%eax)
- .byte 0,128,0,128,254,1 // add %al,0x1fe8000(%eax)
+ .byte 254,1 // incb (%ecx)
.byte 254,1 // incb (%ecx)
.byte 254,1 // incb (%ecx)
.byte 254,1 // incb (%ecx)
diff --git a/src/jumper/SkJumper_generated_win.S b/src/jumper/SkJumper_generated_win.S
index 1365ba09a5..a8842f044c 100644
--- a/src/jumper/SkJumper_generated_win.S
+++ b/src/jumper/SkJumper_generated_win.S
@@ -5845,33 +5845,16 @@ _sk_evenly_spaced_gradient_hsw LABEL PROC
DB 197,124,41,192 ; vmovaps %ymm8,%ymm0
DB 255,224 ; jmpq *%rax
-PUBLIC _sk_gauss_a_to_rgba_hsw
-_sk_gauss_a_to_rgba_hsw LABEL PROC
- DB 196,226,125,24,5,154,133,2,0 ; vbroadcastss 0x2859a(%rip),%ymm0 # 2e524 <_sk_srcover_bgra_8888_sse2_lowp+0x3dc>
- DB 196,226,125,24,13,149,133,2,0 ; vbroadcastss 0x28595(%rip),%ymm1 # 2e528 <_sk_srcover_bgra_8888_sse2_lowp+0x3e0>
- DB 196,226,101,168,200 ; vfmadd213ps %ymm0,%ymm3,%ymm1
- DB 196,226,125,24,5,139,133,2,0 ; vbroadcastss 0x2858b(%rip),%ymm0 # 2e52c <_sk_srcover_bgra_8888_sse2_lowp+0x3e4>
- DB 196,226,101,184,193 ; vfmadd231ps %ymm1,%ymm3,%ymm0
- DB 196,226,125,24,13,129,133,2,0 ; vbroadcastss 0x28581(%rip),%ymm1 # 2e530 <_sk_srcover_bgra_8888_sse2_lowp+0x3e8>
- DB 196,226,101,184,200 ; vfmadd231ps %ymm0,%ymm3,%ymm1
- DB 196,226,125,24,5,119,133,2,0 ; vbroadcastss 0x28577(%rip),%ymm0 # 2e534 <_sk_srcover_bgra_8888_sse2_lowp+0x3ec>
- DB 196,226,101,184,193 ; vfmadd231ps %ymm1,%ymm3,%ymm0
- DB 72,173 ; lods %ds:(%rsi),%rax
- DB 197,252,40,200 ; vmovaps %ymm0,%ymm1
- DB 197,252,40,208 ; vmovaps %ymm0,%ymm2
- DB 197,252,40,216 ; vmovaps %ymm0,%ymm3
- DB 255,224 ; jmpq *%rax
-
PUBLIC _sk_gradient_hsw
_sk_gradient_hsw LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 76,139,0 ; mov (%rax),%r8
DB 73,131,248,1 ; cmp $0x1,%r8
- DB 15,134,220,0,0,0 ; jbe 60bd <_sk_gradient_hsw+0xeb>
+ DB 15,134,220,0,0,0 ; jbe 606c <_sk_gradient_hsw+0xeb>
DB 76,139,72,72 ; mov 0x48(%rax),%r9
DB 197,244,87,201 ; vxorps %ymm1,%ymm1,%ymm1
DB 65,186,1,0,0,0 ; mov $0x1,%r10d
- DB 196,226,125,24,21,4,132,2,0 ; vbroadcastss 0x28404(%rip),%ymm2 # 2e3fc <_sk_srcover_bgra_8888_sse2_lowp+0x2b4>
+ DB 196,226,125,24,21,85,132,2,0 ; vbroadcastss 0x28455(%rip),%ymm2 # 2e3fc <_sk_srcover_bgra_8888_sse2_lowp+0x2b4>
DB 196,65,53,239,201 ; vpxor %ymm9,%ymm9,%ymm9
DB 196,130,125,24,28,145 ; vbroadcastss (%r9,%r10,4),%ymm3
DB 197,228,194,216,2 ; vcmpleps %ymm0,%ymm3,%ymm3
@@ -5879,10 +5862,10 @@ _sk_gradient_hsw LABEL PROC
DB 197,53,254,203 ; vpaddd %ymm3,%ymm9,%ymm9
DB 73,255,194 ; inc %r10
DB 77,57,208 ; cmp %r10,%r8
- DB 117,227 ; jne 5ffd <_sk_gradient_hsw+0x2b>
+ DB 117,227 ; jne 5fac <_sk_gradient_hsw+0x2b>
DB 76,139,72,8 ; mov 0x8(%rax),%r9
DB 73,131,248,8 ; cmp $0x8,%r8
- DB 15,134,158,0,0,0 ; jbe 60c6 <_sk_gradient_hsw+0xf4>
+ DB 15,134,158,0,0,0 ; jbe 6075 <_sk_gradient_hsw+0xf4>
DB 196,65,13,118,246 ; vpcmpeqd %ymm14,%ymm14,%ymm14
DB 196,65,36,87,219 ; vxorps %ymm11,%ymm11,%ymm11
DB 196,65,60,87,192 ; vxorps %ymm8,%ymm8,%ymm8
@@ -5914,7 +5897,7 @@ _sk_gradient_hsw LABEL PROC
DB 196,130,5,146,28,136 ; vgatherdps %ymm15,(%r8,%ymm9,4),%ymm3
DB 72,139,64,64 ; mov 0x40(%rax),%rax
DB 196,34,13,146,28,136 ; vgatherdps %ymm14,(%rax,%ymm9,4),%ymm11
- DB 235,77 ; jmp 610a <_sk_gradient_hsw+0x138>
+ DB 235,77 ; jmp 60b9 <_sk_gradient_hsw+0x138>
DB 76,139,72,8 ; mov 0x8(%rax),%r9
DB 196,65,52,87,201 ; vxorps %ymm9,%ymm9,%ymm9
DB 196,66,53,22,1 ; vpermps (%r9),%ymm9,%ymm8
@@ -5970,24 +5953,24 @@ _sk_xy_to_unit_angle_hsw LABEL PROC
DB 196,65,52,95,226 ; vmaxps %ymm10,%ymm9,%ymm12
DB 196,65,36,94,220 ; vdivps %ymm12,%ymm11,%ymm11
DB 196,65,36,89,227 ; vmulps %ymm11,%ymm11,%ymm12
- DB 196,98,125,24,45,147,131,2,0 ; vbroadcastss 0x28393(%rip),%ymm13 # 2e538 <_sk_srcover_bgra_8888_sse2_lowp+0x3f0>
- DB 196,98,125,24,53,142,131,2,0 ; vbroadcastss 0x2838e(%rip),%ymm14 # 2e53c <_sk_srcover_bgra_8888_sse2_lowp+0x3f4>
+ DB 196,98,125,24,45,208,131,2,0 ; vbroadcastss 0x283d0(%rip),%ymm13 # 2e524 <_sk_srcover_bgra_8888_sse2_lowp+0x3dc>
+ DB 196,98,125,24,53,203,131,2,0 ; vbroadcastss 0x283cb(%rip),%ymm14 # 2e528 <_sk_srcover_bgra_8888_sse2_lowp+0x3e0>
DB 196,66,29,184,245 ; vfmadd231ps %ymm13,%ymm12,%ymm14
- DB 196,98,125,24,45,132,131,2,0 ; vbroadcastss 0x28384(%rip),%ymm13 # 2e540 <_sk_srcover_bgra_8888_sse2_lowp+0x3f8>
+ DB 196,98,125,24,45,193,131,2,0 ; vbroadcastss 0x283c1(%rip),%ymm13 # 2e52c <_sk_srcover_bgra_8888_sse2_lowp+0x3e4>
DB 196,66,29,184,238 ; vfmadd231ps %ymm14,%ymm12,%ymm13
- DB 196,98,125,24,53,122,131,2,0 ; vbroadcastss 0x2837a(%rip),%ymm14 # 2e544 <_sk_srcover_bgra_8888_sse2_lowp+0x3fc>
+ DB 196,98,125,24,53,183,131,2,0 ; vbroadcastss 0x283b7(%rip),%ymm14 # 2e530 <_sk_srcover_bgra_8888_sse2_lowp+0x3e8>
DB 196,66,29,184,245 ; vfmadd231ps %ymm13,%ymm12,%ymm14
DB 196,65,36,89,222 ; vmulps %ymm14,%ymm11,%ymm11
DB 196,65,52,194,202,1 ; vcmpltps %ymm10,%ymm9,%ymm9
- DB 196,98,125,24,21,101,131,2,0 ; vbroadcastss 0x28365(%rip),%ymm10 # 2e548 <_sk_srcover_bgra_8888_sse2_lowp+0x400>
+ DB 196,98,125,24,21,162,131,2,0 ; vbroadcastss 0x283a2(%rip),%ymm10 # 2e534 <_sk_srcover_bgra_8888_sse2_lowp+0x3ec>
DB 196,65,44,92,211 ; vsubps %ymm11,%ymm10,%ymm10
DB 196,67,37,74,202,144 ; vblendvps %ymm9,%ymm10,%ymm11,%ymm9
DB 196,193,124,194,192,1 ; vcmpltps %ymm8,%ymm0,%ymm0
- DB 196,98,125,24,21,247,129,2,0 ; vbroadcastss 0x281f7(%rip),%ymm10 # 2e3f4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
+ DB 196,98,125,24,21,72,130,2,0 ; vbroadcastss 0x28248(%rip),%ymm10 # 2e3f4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
DB 196,65,44,92,209 ; vsubps %ymm9,%ymm10,%ymm10
DB 196,195,53,74,194,0 ; vblendvps %ymm0,%ymm10,%ymm9,%ymm0
DB 196,65,116,194,200,1 ; vcmpltps %ymm8,%ymm1,%ymm9
- DB 196,98,125,24,21,225,129,2,0 ; vbroadcastss 0x281e1(%rip),%ymm10 # 2e3f8 <_sk_srcover_bgra_8888_sse2_lowp+0x2b0>
+ DB 196,98,125,24,21,50,130,2,0 ; vbroadcastss 0x28232(%rip),%ymm10 # 2e3f8 <_sk_srcover_bgra_8888_sse2_lowp+0x2b0>
DB 197,44,92,208 ; vsubps %ymm0,%ymm10,%ymm10
DB 196,195,125,74,194,144 ; vblendvps %ymm9,%ymm10,%ymm0,%ymm0
DB 196,65,124,194,200,3 ; vcmpunordps %ymm8,%ymm0,%ymm9
@@ -6011,23 +5994,23 @@ _sk_xy_to_2pt_conical_quadratic_max_hsw LABEL PROC
DB 197,50,89,80,76 ; vmulss 0x4c(%rax),%xmm9,%xmm10
DB 196,66,125,24,210 ; vbroadcastss %xmm10,%ymm10
DB 197,44,88,208 ; vaddps %ymm0,%ymm10,%ymm10
- DB 196,98,125,24,29,229,130,2,0 ; vbroadcastss 0x282e5(%rip),%ymm11 # 2e54c <_sk_srcover_bgra_8888_sse2_lowp+0x404>
+ DB 196,98,125,24,29,34,131,2,0 ; vbroadcastss 0x28322(%rip),%ymm11 # 2e538 <_sk_srcover_bgra_8888_sse2_lowp+0x3f0>
DB 196,65,44,89,211 ; vmulps %ymm11,%ymm10,%ymm10
DB 197,116,89,217 ; vmulps %ymm1,%ymm1,%ymm11
DB 196,98,125,184,216 ; vfmadd231ps %ymm0,%ymm0,%ymm11
DB 196,193,50,89,193 ; vmulss %xmm9,%xmm9,%xmm0
DB 196,226,125,24,192 ; vbroadcastss %xmm0,%ymm0
DB 197,164,92,192 ; vsubps %ymm0,%ymm11,%ymm0
- DB 196,98,125,24,13,196,130,2,0 ; vbroadcastss 0x282c4(%rip),%ymm9 # 2e550 <_sk_srcover_bgra_8888_sse2_lowp+0x408>
+ DB 196,98,125,24,13,1,131,2,0 ; vbroadcastss 0x28301(%rip),%ymm9 # 2e53c <_sk_srcover_bgra_8888_sse2_lowp+0x3f4>
DB 196,65,60,89,193 ; vmulps %ymm9,%ymm8,%ymm8
DB 197,188,89,192 ; vmulps %ymm0,%ymm8,%ymm0
DB 196,194,45,184,194 ; vfmadd231ps %ymm10,%ymm10,%ymm0
DB 197,252,81,192 ; vsqrtps %ymm0,%ymm0
DB 196,98,125,24,64,68 ; vbroadcastss 0x44(%rax),%ymm8
- DB 196,98,125,24,13,167,130,2,0 ; vbroadcastss 0x282a7(%rip),%ymm9 # 2e554 <_sk_srcover_bgra_8888_sse2_lowp+0x40c>
+ DB 196,98,125,24,13,228,130,2,0 ; vbroadcastss 0x282e4(%rip),%ymm9 # 2e540 <_sk_srcover_bgra_8888_sse2_lowp+0x3f8>
DB 196,65,44,87,201 ; vxorps %ymm9,%ymm10,%ymm9
DB 196,65,124,92,210 ; vsubps %ymm10,%ymm0,%ymm10
- DB 196,98,125,24,29,52,129,2,0 ; vbroadcastss 0x28134(%rip),%ymm11 # 2e3f4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
+ DB 196,98,125,24,29,133,129,2,0 ; vbroadcastss 0x28185(%rip),%ymm11 # 2e3f4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
DB 196,65,60,89,195 ; vmulps %ymm11,%ymm8,%ymm8
DB 196,65,44,89,208 ; vmulps %ymm8,%ymm10,%ymm10
DB 197,180,92,192 ; vsubps %ymm0,%ymm9,%ymm0
@@ -6044,23 +6027,23 @@ _sk_xy_to_2pt_conical_quadratic_min_hsw LABEL PROC
DB 197,50,89,80,76 ; vmulss 0x4c(%rax),%xmm9,%xmm10
DB 196,66,125,24,210 ; vbroadcastss %xmm10,%ymm10
DB 197,44,88,208 ; vaddps %ymm0,%ymm10,%ymm10
- DB 196,98,125,24,29,77,130,2,0 ; vbroadcastss 0x2824d(%rip),%ymm11 # 2e54c <_sk_srcover_bgra_8888_sse2_lowp+0x404>
+ DB 196,98,125,24,29,138,130,2,0 ; vbroadcastss 0x2828a(%rip),%ymm11 # 2e538 <_sk_srcover_bgra_8888_sse2_lowp+0x3f0>
DB 196,65,44,89,211 ; vmulps %ymm11,%ymm10,%ymm10
DB 197,116,89,217 ; vmulps %ymm1,%ymm1,%ymm11
DB 196,98,125,184,216 ; vfmadd231ps %ymm0,%ymm0,%ymm11
DB 196,193,50,89,193 ; vmulss %xmm9,%xmm9,%xmm0
DB 196,226,125,24,192 ; vbroadcastss %xmm0,%ymm0
DB 197,164,92,192 ; vsubps %ymm0,%ymm11,%ymm0
- DB 196,98,125,24,13,44,130,2,0 ; vbroadcastss 0x2822c(%rip),%ymm9 # 2e550 <_sk_srcover_bgra_8888_sse2_lowp+0x408>
+ DB 196,98,125,24,13,105,130,2,0 ; vbroadcastss 0x28269(%rip),%ymm9 # 2e53c <_sk_srcover_bgra_8888_sse2_lowp+0x3f4>
DB 196,65,60,89,193 ; vmulps %ymm9,%ymm8,%ymm8
DB 197,188,89,192 ; vmulps %ymm0,%ymm8,%ymm0
DB 196,194,45,184,194 ; vfmadd231ps %ymm10,%ymm10,%ymm0
DB 197,252,81,192 ; vsqrtps %ymm0,%ymm0
DB 196,98,125,24,64,68 ; vbroadcastss 0x44(%rax),%ymm8
- DB 196,98,125,24,13,15,130,2,0 ; vbroadcastss 0x2820f(%rip),%ymm9 # 2e554 <_sk_srcover_bgra_8888_sse2_lowp+0x40c>
+ DB 196,98,125,24,13,76,130,2,0 ; vbroadcastss 0x2824c(%rip),%ymm9 # 2e540 <_sk_srcover_bgra_8888_sse2_lowp+0x3f8>
DB 196,65,44,87,201 ; vxorps %ymm9,%ymm10,%ymm9
DB 196,65,124,92,210 ; vsubps %ymm10,%ymm0,%ymm10
- DB 196,98,125,24,29,156,128,2,0 ; vbroadcastss 0x2809c(%rip),%ymm11 # 2e3f4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
+ DB 196,98,125,24,29,237,128,2,0 ; vbroadcastss 0x280ed(%rip),%ymm11 # 2e3f4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
DB 196,65,60,89,195 ; vmulps %ymm11,%ymm8,%ymm8
DB 196,65,44,89,208 ; vmulps %ymm8,%ymm10,%ymm10
DB 197,180,92,192 ; vsubps %ymm0,%ymm9,%ymm0
@@ -6076,14 +6059,14 @@ _sk_xy_to_2pt_conical_linear_hsw LABEL PROC
DB 197,58,89,72,76 ; vmulss 0x4c(%rax),%xmm8,%xmm9
DB 196,66,125,24,201 ; vbroadcastss %xmm9,%ymm9
DB 197,52,88,200 ; vaddps %ymm0,%ymm9,%ymm9
- DB 196,98,125,24,21,187,129,2,0 ; vbroadcastss 0x281bb(%rip),%ymm10 # 2e54c <_sk_srcover_bgra_8888_sse2_lowp+0x404>
+ DB 196,98,125,24,21,248,129,2,0 ; vbroadcastss 0x281f8(%rip),%ymm10 # 2e538 <_sk_srcover_bgra_8888_sse2_lowp+0x3f0>
DB 196,65,52,89,202 ; vmulps %ymm10,%ymm9,%ymm9
DB 197,116,89,209 ; vmulps %ymm1,%ymm1,%ymm10
DB 196,98,125,184,208 ; vfmadd231ps %ymm0,%ymm0,%ymm10
DB 196,193,58,89,192 ; vmulss %xmm8,%xmm8,%xmm0
DB 196,226,125,24,192 ; vbroadcastss %xmm0,%ymm0
DB 197,172,92,192 ; vsubps %ymm0,%ymm10,%ymm0
- DB 196,98,125,24,5,158,129,2,0 ; vbroadcastss 0x2819e(%rip),%ymm8 # 2e554 <_sk_srcover_bgra_8888_sse2_lowp+0x40c>
+ DB 196,98,125,24,5,219,129,2,0 ; vbroadcastss 0x281db(%rip),%ymm8 # 2e540 <_sk_srcover_bgra_8888_sse2_lowp+0x3f8>
DB 196,193,124,87,192 ; vxorps %ymm8,%ymm0,%ymm0
DB 196,193,124,94,193 ; vdivps %ymm9,%ymm0,%ymm0
DB 72,173 ; lods %ds:(%rsi),%rax
@@ -6120,7 +6103,7 @@ _sk_apply_vector_mask_hsw LABEL PROC
PUBLIC _sk_save_xy_hsw
_sk_save_xy_hsw LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,98,125,24,5,201,127,2,0 ; vbroadcastss 0x27fc9(%rip),%ymm8 # 2e3f4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
+ DB 196,98,125,24,5,26,128,2,0 ; vbroadcastss 0x2801a(%rip),%ymm8 # 2e3f4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
DB 196,65,124,88,200 ; vaddps %ymm8,%ymm0,%ymm9
DB 196,67,125,8,209,1 ; vroundps $0x1,%ymm9,%ymm10
DB 196,65,52,92,202 ; vsubps %ymm10,%ymm9,%ymm9
@@ -6150,9 +6133,9 @@ _sk_accumulate_hsw LABEL PROC
PUBLIC _sk_bilinear_nx_hsw
_sk_bilinear_nx_hsw LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,5,183,128,2,0 ; vbroadcastss 0x280b7(%rip),%ymm0 # 2e558 <_sk_srcover_bgra_8888_sse2_lowp+0x410>
+ DB 196,226,125,24,5,244,128,2,0 ; vbroadcastss 0x280f4(%rip),%ymm0 # 2e544 <_sk_srcover_bgra_8888_sse2_lowp+0x3fc>
DB 197,252,88,0 ; vaddps (%rax),%ymm0,%ymm0
- DB 196,98,125,24,5,74,127,2,0 ; vbroadcastss 0x27f4a(%rip),%ymm8 # 2e3f8 <_sk_srcover_bgra_8888_sse2_lowp+0x2b0>
+ DB 196,98,125,24,5,155,127,2,0 ; vbroadcastss 0x27f9b(%rip),%ymm8 # 2e3f8 <_sk_srcover_bgra_8888_sse2_lowp+0x2b0>
DB 197,60,92,128,128,0,0,0 ; vsubps 0x80(%rax),%ymm8,%ymm8
DB 197,124,17,128,0,1,0,0 ; vmovups %ymm8,0x100(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
@@ -6161,7 +6144,7 @@ _sk_bilinear_nx_hsw LABEL PROC
PUBLIC _sk_bilinear_px_hsw
_sk_bilinear_px_hsw LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,5,39,127,2,0 ; vbroadcastss 0x27f27(%rip),%ymm0 # 2e3f4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
+ DB 196,226,125,24,5,120,127,2,0 ; vbroadcastss 0x27f78(%rip),%ymm0 # 2e3f4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
DB 197,252,88,0 ; vaddps (%rax),%ymm0,%ymm0
DB 197,124,16,128,128,0,0,0 ; vmovups 0x80(%rax),%ymm8
DB 197,124,17,128,0,1,0,0 ; vmovups %ymm8,0x100(%rax)
@@ -6171,9 +6154,9 @@ _sk_bilinear_px_hsw LABEL PROC
PUBLIC _sk_bilinear_ny_hsw
_sk_bilinear_ny_hsw LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,13,104,128,2,0 ; vbroadcastss 0x28068(%rip),%ymm1 # 2e558 <_sk_srcover_bgra_8888_sse2_lowp+0x410>
+ DB 196,226,125,24,13,165,128,2,0 ; vbroadcastss 0x280a5(%rip),%ymm1 # 2e544 <_sk_srcover_bgra_8888_sse2_lowp+0x3fc>
DB 197,244,88,72,64 ; vaddps 0x40(%rax),%ymm1,%ymm1
- DB 196,98,125,24,5,250,126,2,0 ; vbroadcastss 0x27efa(%rip),%ymm8 # 2e3f8 <_sk_srcover_bgra_8888_sse2_lowp+0x2b0>
+ DB 196,98,125,24,5,75,127,2,0 ; vbroadcastss 0x27f4b(%rip),%ymm8 # 2e3f8 <_sk_srcover_bgra_8888_sse2_lowp+0x2b0>
DB 197,60,92,128,192,0,0,0 ; vsubps 0xc0(%rax),%ymm8,%ymm8
DB 197,124,17,128,64,1,0,0 ; vmovups %ymm8,0x140(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
@@ -6182,7 +6165,7 @@ _sk_bilinear_ny_hsw LABEL PROC
PUBLIC _sk_bilinear_py_hsw
_sk_bilinear_py_hsw LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,13,215,126,2,0 ; vbroadcastss 0x27ed7(%rip),%ymm1 # 2e3f4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
+ DB 196,226,125,24,13,40,127,2,0 ; vbroadcastss 0x27f28(%rip),%ymm1 # 2e3f4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
DB 197,244,88,72,64 ; vaddps 0x40(%rax),%ymm1,%ymm1
DB 197,124,16,128,192,0,0,0 ; vmovups 0xc0(%rax),%ymm8
DB 197,124,17,128,64,1,0,0 ; vmovups %ymm8,0x140(%rax)
@@ -6192,13 +6175,13 @@ _sk_bilinear_py_hsw LABEL PROC
PUBLIC _sk_bicubic_n3x_hsw
_sk_bicubic_n3x_hsw LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,5,27,128,2,0 ; vbroadcastss 0x2801b(%rip),%ymm0 # 2e55c <_sk_srcover_bgra_8888_sse2_lowp+0x414>
+ DB 196,226,125,24,5,88,128,2,0 ; vbroadcastss 0x28058(%rip),%ymm0 # 2e548 <_sk_srcover_bgra_8888_sse2_lowp+0x400>
DB 197,252,88,0 ; vaddps (%rax),%ymm0,%ymm0
- DB 196,98,125,24,5,170,126,2,0 ; vbroadcastss 0x27eaa(%rip),%ymm8 # 2e3f8 <_sk_srcover_bgra_8888_sse2_lowp+0x2b0>
+ DB 196,98,125,24,5,251,126,2,0 ; vbroadcastss 0x27efb(%rip),%ymm8 # 2e3f8 <_sk_srcover_bgra_8888_sse2_lowp+0x2b0>
DB 197,60,92,128,128,0,0,0 ; vsubps 0x80(%rax),%ymm8,%ymm8
DB 196,65,60,89,200 ; vmulps %ymm8,%ymm8,%ymm9
- DB 196,98,125,24,21,8,127,2,0 ; vbroadcastss 0x27f08(%rip),%ymm10 # 2e46c <_sk_srcover_bgra_8888_sse2_lowp+0x324>
- DB 196,98,125,24,29,243,127,2,0 ; vbroadcastss 0x27ff3(%rip),%ymm11 # 2e560 <_sk_srcover_bgra_8888_sse2_lowp+0x418>
+ DB 196,98,125,24,21,89,127,2,0 ; vbroadcastss 0x27f59(%rip),%ymm10 # 2e46c <_sk_srcover_bgra_8888_sse2_lowp+0x324>
+ DB 196,98,125,24,29,48,128,2,0 ; vbroadcastss 0x28030(%rip),%ymm11 # 2e54c <_sk_srcover_bgra_8888_sse2_lowp+0x404>
DB 196,66,61,168,218 ; vfmadd213ps %ymm10,%ymm8,%ymm11
DB 196,65,36,89,193 ; vmulps %ymm9,%ymm11,%ymm8
DB 197,124,17,128,0,1,0,0 ; vmovups %ymm8,0x100(%rax)
@@ -6208,16 +6191,16 @@ _sk_bicubic_n3x_hsw LABEL PROC
PUBLIC _sk_bicubic_n1x_hsw
_sk_bicubic_n1x_hsw LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,5,202,127,2,0 ; vbroadcastss 0x27fca(%rip),%ymm0 # 2e558 <_sk_srcover_bgra_8888_sse2_lowp+0x410>
+ DB 196,226,125,24,5,7,128,2,0 ; vbroadcastss 0x28007(%rip),%ymm0 # 2e544 <_sk_srcover_bgra_8888_sse2_lowp+0x3fc>
DB 197,252,88,0 ; vaddps (%rax),%ymm0,%ymm0
- DB 196,98,125,24,5,93,126,2,0 ; vbroadcastss 0x27e5d(%rip),%ymm8 # 2e3f8 <_sk_srcover_bgra_8888_sse2_lowp+0x2b0>
+ DB 196,98,125,24,5,174,126,2,0 ; vbroadcastss 0x27eae(%rip),%ymm8 # 2e3f8 <_sk_srcover_bgra_8888_sse2_lowp+0x2b0>
DB 197,60,92,128,128,0,0,0 ; vsubps 0x80(%rax),%ymm8,%ymm8
- DB 196,98,125,24,13,184,127,2,0 ; vbroadcastss 0x27fb8(%rip),%ymm9 # 2e564 <_sk_srcover_bgra_8888_sse2_lowp+0x41c>
- DB 196,98,125,24,21,179,127,2,0 ; vbroadcastss 0x27fb3(%rip),%ymm10 # 2e568 <_sk_srcover_bgra_8888_sse2_lowp+0x420>
+ DB 196,98,125,24,13,245,127,2,0 ; vbroadcastss 0x27ff5(%rip),%ymm9 # 2e550 <_sk_srcover_bgra_8888_sse2_lowp+0x408>
+ DB 196,98,125,24,21,240,127,2,0 ; vbroadcastss 0x27ff0(%rip),%ymm10 # 2e554 <_sk_srcover_bgra_8888_sse2_lowp+0x40c>
DB 196,66,61,168,209 ; vfmadd213ps %ymm9,%ymm8,%ymm10
- DB 196,98,125,24,13,49,126,2,0 ; vbroadcastss 0x27e31(%rip),%ymm9 # 2e3f4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
+ DB 196,98,125,24,13,130,126,2,0 ; vbroadcastss 0x27e82(%rip),%ymm9 # 2e3f4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
DB 196,66,61,184,202 ; vfmadd231ps %ymm10,%ymm8,%ymm9
- DB 196,98,125,24,21,155,127,2,0 ; vbroadcastss 0x27f9b(%rip),%ymm10 # 2e56c <_sk_srcover_bgra_8888_sse2_lowp+0x424>
+ DB 196,98,125,24,21,216,127,2,0 ; vbroadcastss 0x27fd8(%rip),%ymm10 # 2e558 <_sk_srcover_bgra_8888_sse2_lowp+0x410>
DB 196,66,61,184,209 ; vfmadd231ps %ymm9,%ymm8,%ymm10
DB 197,124,17,144,0,1,0,0 ; vmovups %ymm10,0x100(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
@@ -6226,14 +6209,14 @@ _sk_bicubic_n1x_hsw LABEL PROC
PUBLIC _sk_bicubic_p1x_hsw
_sk_bicubic_p1x_hsw LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,98,125,24,5,7,126,2,0 ; vbroadcastss 0x27e07(%rip),%ymm8 # 2e3f4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
+ DB 196,98,125,24,5,88,126,2,0 ; vbroadcastss 0x27e58(%rip),%ymm8 # 2e3f4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
DB 197,188,88,0 ; vaddps (%rax),%ymm8,%ymm0
DB 197,124,16,136,128,0,0,0 ; vmovups 0x80(%rax),%ymm9
- DB 196,98,125,24,21,98,127,2,0 ; vbroadcastss 0x27f62(%rip),%ymm10 # 2e564 <_sk_srcover_bgra_8888_sse2_lowp+0x41c>
- DB 196,98,125,24,29,93,127,2,0 ; vbroadcastss 0x27f5d(%rip),%ymm11 # 2e568 <_sk_srcover_bgra_8888_sse2_lowp+0x420>
+ DB 196,98,125,24,21,159,127,2,0 ; vbroadcastss 0x27f9f(%rip),%ymm10 # 2e550 <_sk_srcover_bgra_8888_sse2_lowp+0x408>
+ DB 196,98,125,24,29,154,127,2,0 ; vbroadcastss 0x27f9a(%rip),%ymm11 # 2e554 <_sk_srcover_bgra_8888_sse2_lowp+0x40c>
DB 196,66,53,168,218 ; vfmadd213ps %ymm10,%ymm9,%ymm11
DB 196,66,53,168,216 ; vfmadd213ps %ymm8,%ymm9,%ymm11
- DB 196,98,125,24,5,78,127,2,0 ; vbroadcastss 0x27f4e(%rip),%ymm8 # 2e56c <_sk_srcover_bgra_8888_sse2_lowp+0x424>
+ DB 196,98,125,24,5,139,127,2,0 ; vbroadcastss 0x27f8b(%rip),%ymm8 # 2e558 <_sk_srcover_bgra_8888_sse2_lowp+0x410>
DB 196,66,53,184,195 ; vfmadd231ps %ymm11,%ymm9,%ymm8
DB 197,124,17,128,0,1,0,0 ; vmovups %ymm8,0x100(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
@@ -6242,12 +6225,12 @@ _sk_bicubic_p1x_hsw LABEL PROC
PUBLIC _sk_bicubic_p3x_hsw
_sk_bicubic_p3x_hsw LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,5,42,127,2,0 ; vbroadcastss 0x27f2a(%rip),%ymm0 # 2e564 <_sk_srcover_bgra_8888_sse2_lowp+0x41c>
+ DB 196,226,125,24,5,103,127,2,0 ; vbroadcastss 0x27f67(%rip),%ymm0 # 2e550 <_sk_srcover_bgra_8888_sse2_lowp+0x408>
DB 197,252,88,0 ; vaddps (%rax),%ymm0,%ymm0
DB 197,124,16,128,128,0,0,0 ; vmovups 0x80(%rax),%ymm8
DB 196,65,60,89,200 ; vmulps %ymm8,%ymm8,%ymm9
- DB 196,98,125,24,21,24,126,2,0 ; vbroadcastss 0x27e18(%rip),%ymm10 # 2e46c <_sk_srcover_bgra_8888_sse2_lowp+0x324>
- DB 196,98,125,24,29,3,127,2,0 ; vbroadcastss 0x27f03(%rip),%ymm11 # 2e560 <_sk_srcover_bgra_8888_sse2_lowp+0x418>
+ DB 196,98,125,24,21,105,126,2,0 ; vbroadcastss 0x27e69(%rip),%ymm10 # 2e46c <_sk_srcover_bgra_8888_sse2_lowp+0x324>
+ DB 196,98,125,24,29,64,127,2,0 ; vbroadcastss 0x27f40(%rip),%ymm11 # 2e54c <_sk_srcover_bgra_8888_sse2_lowp+0x404>
DB 196,66,61,168,218 ; vfmadd213ps %ymm10,%ymm8,%ymm11
DB 196,65,52,89,195 ; vmulps %ymm11,%ymm9,%ymm8
DB 197,124,17,128,0,1,0,0 ; vmovups %ymm8,0x100(%rax)
@@ -6257,13 +6240,13 @@ _sk_bicubic_p3x_hsw LABEL PROC
PUBLIC _sk_bicubic_n3y_hsw
_sk_bicubic_n3y_hsw LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,13,222,126,2,0 ; vbroadcastss 0x27ede(%rip),%ymm1 # 2e55c <_sk_srcover_bgra_8888_sse2_lowp+0x414>
+ DB 196,226,125,24,13,27,127,2,0 ; vbroadcastss 0x27f1b(%rip),%ymm1 # 2e548 <_sk_srcover_bgra_8888_sse2_lowp+0x400>
DB 197,244,88,72,64 ; vaddps 0x40(%rax),%ymm1,%ymm1
- DB 196,98,125,24,5,108,125,2,0 ; vbroadcastss 0x27d6c(%rip),%ymm8 # 2e3f8 <_sk_srcover_bgra_8888_sse2_lowp+0x2b0>
+ DB 196,98,125,24,5,189,125,2,0 ; vbroadcastss 0x27dbd(%rip),%ymm8 # 2e3f8 <_sk_srcover_bgra_8888_sse2_lowp+0x2b0>
DB 197,60,92,128,192,0,0,0 ; vsubps 0xc0(%rax),%ymm8,%ymm8
DB 196,65,60,89,200 ; vmulps %ymm8,%ymm8,%ymm9
- DB 196,98,125,24,21,202,125,2,0 ; vbroadcastss 0x27dca(%rip),%ymm10 # 2e46c <_sk_srcover_bgra_8888_sse2_lowp+0x324>
- DB 196,98,125,24,29,181,126,2,0 ; vbroadcastss 0x27eb5(%rip),%ymm11 # 2e560 <_sk_srcover_bgra_8888_sse2_lowp+0x418>
+ DB 196,98,125,24,21,27,126,2,0 ; vbroadcastss 0x27e1b(%rip),%ymm10 # 2e46c <_sk_srcover_bgra_8888_sse2_lowp+0x324>
+ DB 196,98,125,24,29,242,126,2,0 ; vbroadcastss 0x27ef2(%rip),%ymm11 # 2e54c <_sk_srcover_bgra_8888_sse2_lowp+0x404>
DB 196,66,61,168,218 ; vfmadd213ps %ymm10,%ymm8,%ymm11
DB 196,65,36,89,193 ; vmulps %ymm9,%ymm11,%ymm8
DB 197,124,17,128,64,1,0,0 ; vmovups %ymm8,0x140(%rax)
@@ -6273,16 +6256,16 @@ _sk_bicubic_n3y_hsw LABEL PROC
PUBLIC _sk_bicubic_n1y_hsw
_sk_bicubic_n1y_hsw LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,13,140,126,2,0 ; vbroadcastss 0x27e8c(%rip),%ymm1 # 2e558 <_sk_srcover_bgra_8888_sse2_lowp+0x410>
+ DB 196,226,125,24,13,201,126,2,0 ; vbroadcastss 0x27ec9(%rip),%ymm1 # 2e544 <_sk_srcover_bgra_8888_sse2_lowp+0x3fc>
DB 197,244,88,72,64 ; vaddps 0x40(%rax),%ymm1,%ymm1
- DB 196,98,125,24,5,30,125,2,0 ; vbroadcastss 0x27d1e(%rip),%ymm8 # 2e3f8 <_sk_srcover_bgra_8888_sse2_lowp+0x2b0>
+ DB 196,98,125,24,5,111,125,2,0 ; vbroadcastss 0x27d6f(%rip),%ymm8 # 2e3f8 <_sk_srcover_bgra_8888_sse2_lowp+0x2b0>
DB 197,60,92,128,192,0,0,0 ; vsubps 0xc0(%rax),%ymm8,%ymm8
- DB 196,98,125,24,13,121,126,2,0 ; vbroadcastss 0x27e79(%rip),%ymm9 # 2e564 <_sk_srcover_bgra_8888_sse2_lowp+0x41c>
- DB 196,98,125,24,21,116,126,2,0 ; vbroadcastss 0x27e74(%rip),%ymm10 # 2e568 <_sk_srcover_bgra_8888_sse2_lowp+0x420>
+ DB 196,98,125,24,13,182,126,2,0 ; vbroadcastss 0x27eb6(%rip),%ymm9 # 2e550 <_sk_srcover_bgra_8888_sse2_lowp+0x408>
+ DB 196,98,125,24,21,177,126,2,0 ; vbroadcastss 0x27eb1(%rip),%ymm10 # 2e554 <_sk_srcover_bgra_8888_sse2_lowp+0x40c>
DB 196,66,61,168,209 ; vfmadd213ps %ymm9,%ymm8,%ymm10
- DB 196,98,125,24,13,242,124,2,0 ; vbroadcastss 0x27cf2(%rip),%ymm9 # 2e3f4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
+ DB 196,98,125,24,13,67,125,2,0 ; vbroadcastss 0x27d43(%rip),%ymm9 # 2e3f4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
DB 196,66,61,184,202 ; vfmadd231ps %ymm10,%ymm8,%ymm9
- DB 196,98,125,24,21,92,126,2,0 ; vbroadcastss 0x27e5c(%rip),%ymm10 # 2e56c <_sk_srcover_bgra_8888_sse2_lowp+0x424>
+ DB 196,98,125,24,21,153,126,2,0 ; vbroadcastss 0x27e99(%rip),%ymm10 # 2e558 <_sk_srcover_bgra_8888_sse2_lowp+0x410>
DB 196,66,61,184,209 ; vfmadd231ps %ymm9,%ymm8,%ymm10
DB 197,124,17,144,64,1,0,0 ; vmovups %ymm10,0x140(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
@@ -6291,14 +6274,14 @@ _sk_bicubic_n1y_hsw LABEL PROC
PUBLIC _sk_bicubic_p1y_hsw
_sk_bicubic_p1y_hsw LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,98,125,24,5,200,124,2,0 ; vbroadcastss 0x27cc8(%rip),%ymm8 # 2e3f4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
+ DB 196,98,125,24,5,25,125,2,0 ; vbroadcastss 0x27d19(%rip),%ymm8 # 2e3f4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
DB 197,188,88,72,64 ; vaddps 0x40(%rax),%ymm8,%ymm1
DB 197,124,16,136,192,0,0,0 ; vmovups 0xc0(%rax),%ymm9
- DB 196,98,125,24,21,34,126,2,0 ; vbroadcastss 0x27e22(%rip),%ymm10 # 2e564 <_sk_srcover_bgra_8888_sse2_lowp+0x41c>
- DB 196,98,125,24,29,29,126,2,0 ; vbroadcastss 0x27e1d(%rip),%ymm11 # 2e568 <_sk_srcover_bgra_8888_sse2_lowp+0x420>
+ DB 196,98,125,24,21,95,126,2,0 ; vbroadcastss 0x27e5f(%rip),%ymm10 # 2e550 <_sk_srcover_bgra_8888_sse2_lowp+0x408>
+ DB 196,98,125,24,29,90,126,2,0 ; vbroadcastss 0x27e5a(%rip),%ymm11 # 2e554 <_sk_srcover_bgra_8888_sse2_lowp+0x40c>
DB 196,66,53,168,218 ; vfmadd213ps %ymm10,%ymm9,%ymm11
DB 196,66,53,168,216 ; vfmadd213ps %ymm8,%ymm9,%ymm11
- DB 196,98,125,24,5,14,126,2,0 ; vbroadcastss 0x27e0e(%rip),%ymm8 # 2e56c <_sk_srcover_bgra_8888_sse2_lowp+0x424>
+ DB 196,98,125,24,5,75,126,2,0 ; vbroadcastss 0x27e4b(%rip),%ymm8 # 2e558 <_sk_srcover_bgra_8888_sse2_lowp+0x410>
DB 196,66,53,184,195 ; vfmadd231ps %ymm11,%ymm9,%ymm8
DB 197,124,17,128,64,1,0,0 ; vmovups %ymm8,0x140(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
@@ -6307,12 +6290,12 @@ _sk_bicubic_p1y_hsw LABEL PROC
PUBLIC _sk_bicubic_p3y_hsw
_sk_bicubic_p3y_hsw LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,13,234,125,2,0 ; vbroadcastss 0x27dea(%rip),%ymm1 # 2e564 <_sk_srcover_bgra_8888_sse2_lowp+0x41c>
+ DB 196,226,125,24,13,39,126,2,0 ; vbroadcastss 0x27e27(%rip),%ymm1 # 2e550 <_sk_srcover_bgra_8888_sse2_lowp+0x408>
DB 197,244,88,72,64 ; vaddps 0x40(%rax),%ymm1,%ymm1
DB 197,124,16,128,192,0,0,0 ; vmovups 0xc0(%rax),%ymm8
DB 196,65,60,89,200 ; vmulps %ymm8,%ymm8,%ymm9
- DB 196,98,125,24,21,215,124,2,0 ; vbroadcastss 0x27cd7(%rip),%ymm10 # 2e46c <_sk_srcover_bgra_8888_sse2_lowp+0x324>
- DB 196,98,125,24,29,194,125,2,0 ; vbroadcastss 0x27dc2(%rip),%ymm11 # 2e560 <_sk_srcover_bgra_8888_sse2_lowp+0x418>
+ DB 196,98,125,24,21,40,125,2,0 ; vbroadcastss 0x27d28(%rip),%ymm10 # 2e46c <_sk_srcover_bgra_8888_sse2_lowp+0x324>
+ DB 196,98,125,24,29,255,125,2,0 ; vbroadcastss 0x27dff(%rip),%ymm11 # 2e54c <_sk_srcover_bgra_8888_sse2_lowp+0x404>
DB 196,66,61,168,218 ; vfmadd213ps %ymm10,%ymm8,%ymm11
DB 196,65,52,89,195 ; vmulps %ymm11,%ymm9,%ymm8
DB 197,124,17,128,64,1,0,0 ; vmovups %ymm8,0x140(%rax)
@@ -6440,7 +6423,7 @@ _sk_clut_3D_hsw LABEL PROC
DB 196,98,93,64,218 ; vpmulld %ymm2,%ymm4,%ymm11
DB 72,139,0 ; mov (%rax),%rax
DB 197,165,254,193 ; vpaddd %ymm1,%ymm11,%ymm0
- DB 196,98,125,88,61,145,123,2,0 ; vpbroadcastd 0x27b91(%rip),%ymm15 # 2e574 <_sk_srcover_bgra_8888_sse2_lowp+0x42c>
+ DB 196,98,125,88,61,206,123,2,0 ; vpbroadcastd 0x27bce(%rip),%ymm15 # 2e560 <_sk_srcover_bgra_8888_sse2_lowp+0x418>
DB 196,194,125,64,199 ; vpmulld %ymm15,%ymm0,%ymm0
DB 197,213,239,237 ; vpxor %ymm5,%ymm5,%ymm5
DB 197,237,118,210 ; vpcmpeqd %ymm2,%ymm2,%ymm2
@@ -6452,13 +6435,13 @@ _sk_clut_3D_hsw LABEL PROC
DB 197,213,118,237 ; vpcmpeqd %ymm5,%ymm5,%ymm5
DB 196,226,85,146,60,144 ; vgatherdps %ymm5,(%rax,%ymm2,4),%ymm7
DB 197,252,17,188,36,128,2,0,0 ; vmovups %ymm7,0x280(%rsp)
- DB 196,226,125,88,61,219,121,2,0 ; vpbroadcastd 0x279db(%rip),%ymm7 # 2e404 <_sk_srcover_bgra_8888_sse2_lowp+0x2bc>
+ DB 196,226,125,88,61,44,122,2,0 ; vpbroadcastd 0x27a2c(%rip),%ymm7 # 2e404 <_sk_srcover_bgra_8888_sse2_lowp+0x2bc>
DB 197,253,254,199 ; vpaddd %ymm7,%ymm0,%ymm0
DB 197,236,87,210 ; vxorps %ymm2,%ymm2,%ymm2
DB 197,213,118,237 ; vpcmpeqd %ymm5,%ymm5,%ymm5
DB 196,226,85,146,20,128 ; vgatherdps %ymm5,(%rax,%ymm0,4),%ymm2
DB 197,252,17,148,36,160,1,0,0 ; vmovups %ymm2,0x1a0(%rsp)
- DB 196,226,125,24,5,35,123,2,0 ; vbroadcastss 0x27b23(%rip),%ymm0 # 2e570 <_sk_srcover_bgra_8888_sse2_lowp+0x428>
+ DB 196,226,125,24,5,96,123,2,0 ; vbroadcastss 0x27b60(%rip),%ymm0 # 2e55c <_sk_srcover_bgra_8888_sse2_lowp+0x414>
DB 197,172,88,232 ; vaddps %ymm0,%ymm10,%ymm5
DB 197,254,91,237 ; vcvttps2dq %ymm5,%ymm5
DB 196,226,93,64,213 ; vpmulld %ymm5,%ymm4,%ymm2
@@ -6718,7 +6701,7 @@ _sk_clut_4D_hsw LABEL PROC
DB 197,254,127,132,36,128,1,0,0 ; vmovdqu %ymm0,0x180(%rsp)
DB 196,98,109,64,200 ; vpmulld %ymm0,%ymm2,%ymm9
DB 197,181,254,199 ; vpaddd %ymm7,%ymm9,%ymm0
- DB 196,98,125,88,21,165,117,2,0 ; vpbroadcastd 0x275a5(%rip),%ymm10 # 2e574 <_sk_srcover_bgra_8888_sse2_lowp+0x42c>
+ DB 196,98,125,88,21,226,117,2,0 ; vpbroadcastd 0x275e2(%rip),%ymm10 # 2e560 <_sk_srcover_bgra_8888_sse2_lowp+0x418>
DB 196,194,125,64,194 ; vpmulld %ymm10,%ymm0,%ymm0
DB 197,213,118,237 ; vpcmpeqd %ymm5,%ymm5,%ymm5
DB 196,65,60,87,192 ; vxorps %ymm8,%ymm8,%ymm8
@@ -6730,13 +6713,13 @@ _sk_clut_4D_hsw LABEL PROC
DB 196,65,36,87,219 ; vxorps %ymm11,%ymm11,%ymm11
DB 196,98,61,146,28,168 ; vgatherdps %ymm8,(%rax,%ymm5,4),%ymm11
DB 197,124,17,156,36,64,1,0,0 ; vmovups %ymm11,0x140(%rsp)
- DB 196,98,125,88,29,236,115,2,0 ; vpbroadcastd 0x273ec(%rip),%ymm11 # 2e404 <_sk_srcover_bgra_8888_sse2_lowp+0x2bc>
+ DB 196,98,125,88,29,61,116,2,0 ; vpbroadcastd 0x2743d(%rip),%ymm11 # 2e404 <_sk_srcover_bgra_8888_sse2_lowp+0x2bc>
DB 196,193,125,254,195 ; vpaddd %ymm11,%ymm0,%ymm0
DB 196,65,61,118,192 ; vpcmpeqd %ymm8,%ymm8,%ymm8
DB 197,212,87,237 ; vxorps %ymm5,%ymm5,%ymm5
DB 196,226,61,146,44,128 ; vgatherdps %ymm8,(%rax,%ymm0,4),%ymm5
DB 197,252,17,172,36,160,0,0,0 ; vmovups %ymm5,0xa0(%rsp)
- DB 196,226,125,24,5,50,117,2,0 ; vbroadcastss 0x27532(%rip),%ymm0 # 2e570 <_sk_srcover_bgra_8888_sse2_lowp+0x428>
+ DB 196,226,125,24,5,111,117,2,0 ; vbroadcastss 0x2756f(%rip),%ymm0 # 2e55c <_sk_srcover_bgra_8888_sse2_lowp+0x414>
DB 197,116,88,192 ; vaddps %ymm0,%ymm1,%ymm8
DB 196,65,126,91,192 ; vcvttps2dq %ymm8,%ymm8
DB 196,194,109,64,232 ; vpmulld %ymm8,%ymm2,%ymm5
@@ -7169,13 +7152,30 @@ _sk_clut_4D_hsw LABEL PROC
DB 196,193,100,92,210 ; vsubps %ymm10,%ymm3,%ymm2
DB 196,194,77,168,210 ; vfmadd213ps %ymm10,%ymm6,%ymm2
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,29,222,105,2,0 ; vbroadcastss 0x269de(%rip),%ymm3 # 2e3f8 <_sk_srcover_bgra_8888_sse2_lowp+0x2b0>
+ DB 196,226,125,24,29,47,106,2,0 ; vbroadcastss 0x26a2f(%rip),%ymm3 # 2e3f8 <_sk_srcover_bgra_8888_sse2_lowp+0x2b0>
DB 197,252,16,164,36,224,6,0,0 ; vmovups 0x6e0(%rsp),%ymm4
DB 197,252,16,172,36,0,7,0,0 ; vmovups 0x700(%rsp),%ymm5
DB 197,252,16,180,36,32,7,0,0 ; vmovups 0x720(%rsp),%ymm6
DB 197,252,16,188,36,64,7,0,0 ; vmovups 0x740(%rsp),%ymm7
DB 72,129,196,120,7,0,0 ; add $0x778,%rsp
DB 255,224 ; jmpq *%rax
+
+PUBLIC _sk_gauss_a_to_rgba_hsw
+_sk_gauss_a_to_rgba_hsw LABEL PROC
+ DB 196,226,125,24,5,101,107,2,0 ; vbroadcastss 0x26b65(%rip),%ymm0 # 2e564 <_sk_srcover_bgra_8888_sse2_lowp+0x41c>
+ DB 196,226,125,24,13,96,107,2,0 ; vbroadcastss 0x26b60(%rip),%ymm1 # 2e568 <_sk_srcover_bgra_8888_sse2_lowp+0x420>
+ DB 196,226,101,168,200 ; vfmadd213ps %ymm0,%ymm3,%ymm1
+ DB 196,226,125,24,5,86,107,2,0 ; vbroadcastss 0x26b56(%rip),%ymm0 # 2e56c <_sk_srcover_bgra_8888_sse2_lowp+0x424>
+ DB 196,226,101,184,193 ; vfmadd231ps %ymm1,%ymm3,%ymm0
+ DB 196,226,125,24,13,76,107,2,0 ; vbroadcastss 0x26b4c(%rip),%ymm1 # 2e570 <_sk_srcover_bgra_8888_sse2_lowp+0x428>
+ DB 196,226,101,184,200 ; vfmadd231ps %ymm0,%ymm3,%ymm1
+ DB 196,226,125,24,5,66,107,2,0 ; vbroadcastss 0x26b42(%rip),%ymm0 # 2e574 <_sk_srcover_bgra_8888_sse2_lowp+0x42c>
+ DB 196,226,101,184,193 ; vfmadd231ps %ymm1,%ymm3,%ymm0
+ DB 72,173 ; lods %ds:(%rsi),%rax
+ DB 197,252,40,200 ; vmovaps %ymm0,%ymm1
+ DB 197,252,40,208 ; vmovaps %ymm0,%ymm2
+ DB 197,252,40,216 ; vmovaps %ymm0,%ymm3
+ DB 255,224 ; jmpq *%rax
DB 144 ; nop
PUBLIC _sk_start_pipeline_avx
@@ -13294,7 +13294,7 @@ _sk_store_f16_avx LABEL PROC
DB 197,252,17,108,36,64 ; vmovups %ymm5,0x40(%rsp)
DB 197,252,17,100,36,32 ; vmovups %ymm4,0x20(%rsp)
DB 197,252,40,225 ; vmovaps %ymm1,%ymm4
- DB 196,98,125,24,5,197,3,2,0 ; vbroadcastss 0x203c5(%rip),%ymm8 # 2e554 <_sk_srcover_bgra_8888_sse2_lowp+0x40c>
+ DB 196,98,125,24,5,177,3,2,0 ; vbroadcastss 0x203b1(%rip),%ymm8 # 2e540 <_sk_srcover_bgra_8888_sse2_lowp+0x3f8>
DB 196,65,124,84,216 ; vandps %ymm8,%ymm0,%ymm11
DB 196,98,125,24,21,227,3,2,0 ; vbroadcastss 0x203e3(%rip),%ymm10 # 2e580 <_sk_srcover_bgra_8888_sse2_lowp+0x438>
DB 196,65,124,84,226 ; vandps %ymm10,%ymm0,%ymm12
@@ -14478,27 +14478,6 @@ _sk_evenly_spaced_gradient_avx LABEL PROC
DB 93 ; pop %rbp
DB 255,224 ; jmpq *%rax
-PUBLIC _sk_gauss_a_to_rgba_avx
-_sk_gauss_a_to_rgba_avx LABEL PROC
- DB 196,226,125,24,5,203,238,1,0 ; vbroadcastss 0x1eecb(%rip),%ymm0 # 2e528 <_sk_srcover_bgra_8888_sse2_lowp+0x3e0>
- DB 197,228,89,192 ; vmulps %ymm0,%ymm3,%ymm0
- DB 196,226,125,24,13,186,238,1,0 ; vbroadcastss 0x1eeba(%rip),%ymm1 # 2e524 <_sk_srcover_bgra_8888_sse2_lowp+0x3dc>
- DB 197,252,88,193 ; vaddps %ymm1,%ymm0,%ymm0
- DB 197,252,89,195 ; vmulps %ymm3,%ymm0,%ymm0
- DB 196,226,125,24,13,177,238,1,0 ; vbroadcastss 0x1eeb1(%rip),%ymm1 # 2e52c <_sk_srcover_bgra_8888_sse2_lowp+0x3e4>
- DB 197,252,88,193 ; vaddps %ymm1,%ymm0,%ymm0
- DB 197,252,89,195 ; vmulps %ymm3,%ymm0,%ymm0
- DB 196,226,125,24,13,164,238,1,0 ; vbroadcastss 0x1eea4(%rip),%ymm1 # 2e530 <_sk_srcover_bgra_8888_sse2_lowp+0x3e8>
- DB 197,252,88,193 ; vaddps %ymm1,%ymm0,%ymm0
- DB 197,252,89,195 ; vmulps %ymm3,%ymm0,%ymm0
- DB 196,226,125,24,13,151,238,1,0 ; vbroadcastss 0x1ee97(%rip),%ymm1 # 2e534 <_sk_srcover_bgra_8888_sse2_lowp+0x3ec>
- DB 197,252,88,193 ; vaddps %ymm1,%ymm0,%ymm0
- DB 72,173 ; lods %ds:(%rsi),%rax
- DB 197,252,40,200 ; vmovaps %ymm0,%ymm1
- DB 197,252,40,208 ; vmovaps %ymm0,%ymm2
- DB 197,252,40,216 ; vmovaps %ymm0,%ymm3
- DB 255,224 ; jmpq *%rax
-
PUBLIC _sk_gradient_avx
_sk_gradient_avx LABEL PROC
DB 65,87 ; push %r15
@@ -14512,12 +14491,12 @@ _sk_gradient_avx LABEL PROC
DB 76,139,0 ; mov (%rax),%r8
DB 197,244,87,201 ; vxorps %ymm1,%ymm1,%ymm1
DB 73,131,248,2 ; cmp $0x2,%r8
- DB 114,81 ; jb f723 <_sk_gradient_avx+0x72>
+ DB 114,81 ; jb f6c6 <_sk_gradient_avx+0x72>
DB 72,139,88,72 ; mov 0x48(%rax),%rbx
DB 73,255,200 ; dec %r8
DB 72,131,195,4 ; add $0x4,%rbx
DB 196,65,52,87,201 ; vxorps %ymm9,%ymm9,%ymm9
- DB 196,98,125,24,21,17,237,1,0 ; vbroadcastss 0x1ed11(%rip),%ymm10 # 2e3fc <_sk_srcover_bgra_8888_sse2_lowp+0x2b4>
+ DB 196,98,125,24,21,110,237,1,0 ; vbroadcastss 0x1ed6e(%rip),%ymm10 # 2e3fc <_sk_srcover_bgra_8888_sse2_lowp+0x2b4>
DB 197,244,87,201 ; vxorps %ymm1,%ymm1,%ymm1
DB 196,98,125,24,3 ; vbroadcastss (%rbx),%ymm8
DB 197,60,194,192,2 ; vcmpleps %ymm0,%ymm8,%ymm8
@@ -14529,7 +14508,7 @@ _sk_gradient_avx LABEL PROC
DB 196,227,117,24,202,1 ; vinsertf128 $0x1,%xmm2,%ymm1,%ymm1
DB 72,131,195,4 ; add $0x4,%rbx
DB 73,255,200 ; dec %r8
- DB 117,204 ; jne f6ef <_sk_gradient_avx+0x3e>
+ DB 117,204 ; jne f692 <_sk_gradient_avx+0x3e>
DB 196,195,249,22,200,1 ; vpextrq $0x1,%xmm1,%r8
DB 69,137,193 ; mov %r8d,%r9d
DB 73,193,232,32 ; shr $0x20,%r8
@@ -14708,27 +14687,27 @@ _sk_xy_to_unit_angle_avx LABEL PROC
DB 196,65,52,95,226 ; vmaxps %ymm10,%ymm9,%ymm12
DB 196,65,36,94,220 ; vdivps %ymm12,%ymm11,%ymm11
DB 196,65,36,89,227 ; vmulps %ymm11,%ymm11,%ymm12
- DB 196,98,125,24,45,60,234,1,0 ; vbroadcastss 0x1ea3c(%rip),%ymm13 # 2e538 <_sk_srcover_bgra_8888_sse2_lowp+0x3f0>
+ DB 196,98,125,24,45,133,234,1,0 ; vbroadcastss 0x1ea85(%rip),%ymm13 # 2e524 <_sk_srcover_bgra_8888_sse2_lowp+0x3dc>
DB 196,65,28,89,237 ; vmulps %ymm13,%ymm12,%ymm13
- DB 196,98,125,24,53,50,234,1,0 ; vbroadcastss 0x1ea32(%rip),%ymm14 # 2e53c <_sk_srcover_bgra_8888_sse2_lowp+0x3f4>
+ DB 196,98,125,24,53,123,234,1,0 ; vbroadcastss 0x1ea7b(%rip),%ymm14 # 2e528 <_sk_srcover_bgra_8888_sse2_lowp+0x3e0>
DB 196,65,20,88,238 ; vaddps %ymm14,%ymm13,%ymm13
DB 196,65,28,89,237 ; vmulps %ymm13,%ymm12,%ymm13
- DB 196,98,125,24,53,35,234,1,0 ; vbroadcastss 0x1ea23(%rip),%ymm14 # 2e540 <_sk_srcover_bgra_8888_sse2_lowp+0x3f8>
+ DB 196,98,125,24,53,108,234,1,0 ; vbroadcastss 0x1ea6c(%rip),%ymm14 # 2e52c <_sk_srcover_bgra_8888_sse2_lowp+0x3e4>
DB 196,65,20,88,238 ; vaddps %ymm14,%ymm13,%ymm13
DB 196,65,28,89,229 ; vmulps %ymm13,%ymm12,%ymm12
- DB 196,98,125,24,45,20,234,1,0 ; vbroadcastss 0x1ea14(%rip),%ymm13 # 2e544 <_sk_srcover_bgra_8888_sse2_lowp+0x3fc>
+ DB 196,98,125,24,45,93,234,1,0 ; vbroadcastss 0x1ea5d(%rip),%ymm13 # 2e530 <_sk_srcover_bgra_8888_sse2_lowp+0x3e8>
DB 196,65,28,88,229 ; vaddps %ymm13,%ymm12,%ymm12
DB 196,65,36,89,220 ; vmulps %ymm12,%ymm11,%ymm11
DB 196,65,52,194,202,1 ; vcmpltps %ymm10,%ymm9,%ymm9
- DB 196,98,125,24,21,255,233,1,0 ; vbroadcastss 0x1e9ff(%rip),%ymm10 # 2e548 <_sk_srcover_bgra_8888_sse2_lowp+0x400>
+ DB 196,98,125,24,21,72,234,1,0 ; vbroadcastss 0x1ea48(%rip),%ymm10 # 2e534 <_sk_srcover_bgra_8888_sse2_lowp+0x3ec>
DB 196,65,44,92,211 ; vsubps %ymm11,%ymm10,%ymm10
DB 196,67,37,74,202,144 ; vblendvps %ymm9,%ymm10,%ymm11,%ymm9
DB 196,193,124,194,192,1 ; vcmpltps %ymm8,%ymm0,%ymm0
- DB 196,98,125,24,21,145,232,1,0 ; vbroadcastss 0x1e891(%rip),%ymm10 # 2e3f4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
+ DB 196,98,125,24,21,238,232,1,0 ; vbroadcastss 0x1e8ee(%rip),%ymm10 # 2e3f4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
DB 196,65,44,92,209 ; vsubps %ymm9,%ymm10,%ymm10
DB 196,195,53,74,194,0 ; vblendvps %ymm0,%ymm10,%ymm9,%ymm0
DB 196,65,116,194,200,1 ; vcmpltps %ymm8,%ymm1,%ymm9
- DB 196,98,125,24,21,123,232,1,0 ; vbroadcastss 0x1e87b(%rip),%ymm10 # 2e3f8 <_sk_srcover_bgra_8888_sse2_lowp+0x2b0>
+ DB 196,98,125,24,21,216,232,1,0 ; vbroadcastss 0x1e8d8(%rip),%ymm10 # 2e3f8 <_sk_srcover_bgra_8888_sse2_lowp+0x2b0>
DB 197,44,92,208 ; vsubps %ymm0,%ymm10,%ymm10
DB 196,195,125,74,194,144 ; vblendvps %ymm9,%ymm10,%ymm0,%ymm0
DB 196,65,124,194,200,3 ; vcmpunordps %ymm8,%ymm0,%ymm9
@@ -14754,7 +14733,7 @@ _sk_xy_to_2pt_conical_quadratic_max_avx LABEL PROC
DB 196,67,121,4,210,0 ; vpermilps $0x0,%xmm10,%xmm10
DB 196,67,45,24,210,1 ; vinsertf128 $0x1,%xmm10,%ymm10,%ymm10
DB 197,44,88,208 ; vaddps %ymm0,%ymm10,%ymm10
- DB 196,98,125,24,29,117,233,1,0 ; vbroadcastss 0x1e975(%rip),%ymm11 # 2e54c <_sk_srcover_bgra_8888_sse2_lowp+0x404>
+ DB 196,98,125,24,29,190,233,1,0 ; vbroadcastss 0x1e9be(%rip),%ymm11 # 2e538 <_sk_srcover_bgra_8888_sse2_lowp+0x3f0>
DB 196,65,44,89,211 ; vmulps %ymm11,%ymm10,%ymm10
DB 197,252,89,192 ; vmulps %ymm0,%ymm0,%ymm0
DB 197,116,89,217 ; vmulps %ymm1,%ymm1,%ymm11
@@ -14763,17 +14742,17 @@ _sk_xy_to_2pt_conical_quadratic_max_avx LABEL PROC
DB 196,227,121,4,192,0 ; vpermilps $0x0,%xmm0,%xmm0
DB 196,227,125,24,192,1 ; vinsertf128 $0x1,%xmm0,%ymm0,%ymm0
DB 197,164,92,192 ; vsubps %ymm0,%ymm11,%ymm0
- DB 196,98,125,24,13,73,233,1,0 ; vbroadcastss 0x1e949(%rip),%ymm9 # 2e550 <_sk_srcover_bgra_8888_sse2_lowp+0x408>
+ DB 196,98,125,24,13,146,233,1,0 ; vbroadcastss 0x1e992(%rip),%ymm9 # 2e53c <_sk_srcover_bgra_8888_sse2_lowp+0x3f4>
DB 196,65,60,89,193 ; vmulps %ymm9,%ymm8,%ymm8
DB 197,188,89,192 ; vmulps %ymm0,%ymm8,%ymm0
DB 196,65,44,89,194 ; vmulps %ymm10,%ymm10,%ymm8
DB 196,193,124,88,192 ; vaddps %ymm8,%ymm0,%ymm0
DB 197,252,81,192 ; vsqrtps %ymm0,%ymm0
DB 196,98,125,24,64,68 ; vbroadcastss 0x44(%rax),%ymm8
- DB 196,98,125,24,13,39,233,1,0 ; vbroadcastss 0x1e927(%rip),%ymm9 # 2e554 <_sk_srcover_bgra_8888_sse2_lowp+0x40c>
+ DB 196,98,125,24,13,112,233,1,0 ; vbroadcastss 0x1e970(%rip),%ymm9 # 2e540 <_sk_srcover_bgra_8888_sse2_lowp+0x3f8>
DB 196,65,44,87,201 ; vxorps %ymm9,%ymm10,%ymm9
DB 196,65,124,92,210 ; vsubps %ymm10,%ymm0,%ymm10
- DB 196,98,125,24,29,180,231,1,0 ; vbroadcastss 0x1e7b4(%rip),%ymm11 # 2e3f4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
+ DB 196,98,125,24,29,17,232,1,0 ; vbroadcastss 0x1e811(%rip),%ymm11 # 2e3f4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
DB 196,65,60,89,195 ; vmulps %ymm11,%ymm8,%ymm8
DB 196,65,60,89,210 ; vmulps %ymm10,%ymm8,%ymm10
DB 197,180,92,192 ; vsubps %ymm0,%ymm9,%ymm0
@@ -14791,7 +14770,7 @@ _sk_xy_to_2pt_conical_quadratic_min_avx LABEL PROC
DB 196,67,121,4,210,0 ; vpermilps $0x0,%xmm10,%xmm10
DB 196,67,45,24,210,1 ; vinsertf128 $0x1,%xmm10,%ymm10,%ymm10
DB 197,44,88,208 ; vaddps %ymm0,%ymm10,%ymm10
- DB 196,98,125,24,29,199,232,1,0 ; vbroadcastss 0x1e8c7(%rip),%ymm11 # 2e54c <_sk_srcover_bgra_8888_sse2_lowp+0x404>
+ DB 196,98,125,24,29,16,233,1,0 ; vbroadcastss 0x1e910(%rip),%ymm11 # 2e538 <_sk_srcover_bgra_8888_sse2_lowp+0x3f0>
DB 196,65,44,89,211 ; vmulps %ymm11,%ymm10,%ymm10
DB 197,252,89,192 ; vmulps %ymm0,%ymm0,%ymm0
DB 197,116,89,217 ; vmulps %ymm1,%ymm1,%ymm11
@@ -14800,17 +14779,17 @@ _sk_xy_to_2pt_conical_quadratic_min_avx LABEL PROC
DB 196,227,121,4,192,0 ; vpermilps $0x0,%xmm0,%xmm0
DB 196,227,125,24,192,1 ; vinsertf128 $0x1,%xmm0,%ymm0,%ymm0
DB 197,164,92,192 ; vsubps %ymm0,%ymm11,%ymm0
- DB 196,98,125,24,13,155,232,1,0 ; vbroadcastss 0x1e89b(%rip),%ymm9 # 2e550 <_sk_srcover_bgra_8888_sse2_lowp+0x408>
+ DB 196,98,125,24,13,228,232,1,0 ; vbroadcastss 0x1e8e4(%rip),%ymm9 # 2e53c <_sk_srcover_bgra_8888_sse2_lowp+0x3f4>
DB 196,65,60,89,193 ; vmulps %ymm9,%ymm8,%ymm8
DB 197,188,89,192 ; vmulps %ymm0,%ymm8,%ymm0
DB 196,65,44,89,194 ; vmulps %ymm10,%ymm10,%ymm8
DB 196,193,124,88,192 ; vaddps %ymm8,%ymm0,%ymm0
DB 197,252,81,192 ; vsqrtps %ymm0,%ymm0
DB 196,98,125,24,64,68 ; vbroadcastss 0x44(%rax),%ymm8
- DB 196,98,125,24,13,121,232,1,0 ; vbroadcastss 0x1e879(%rip),%ymm9 # 2e554 <_sk_srcover_bgra_8888_sse2_lowp+0x40c>
+ DB 196,98,125,24,13,194,232,1,0 ; vbroadcastss 0x1e8c2(%rip),%ymm9 # 2e540 <_sk_srcover_bgra_8888_sse2_lowp+0x3f8>
DB 196,65,44,87,201 ; vxorps %ymm9,%ymm10,%ymm9
DB 196,65,124,92,210 ; vsubps %ymm10,%ymm0,%ymm10
- DB 196,98,125,24,29,6,231,1,0 ; vbroadcastss 0x1e706(%rip),%ymm11 # 2e3f4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
+ DB 196,98,125,24,29,99,231,1,0 ; vbroadcastss 0x1e763(%rip),%ymm11 # 2e3f4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
DB 196,65,60,89,195 ; vmulps %ymm11,%ymm8,%ymm8
DB 196,65,60,89,210 ; vmulps %ymm10,%ymm8,%ymm10
DB 197,180,92,192 ; vsubps %ymm0,%ymm9,%ymm0
@@ -14827,7 +14806,7 @@ _sk_xy_to_2pt_conical_linear_avx LABEL PROC
DB 196,67,121,4,201,0 ; vpermilps $0x0,%xmm9,%xmm9
DB 196,67,53,24,201,1 ; vinsertf128 $0x1,%xmm9,%ymm9,%ymm9
DB 197,52,88,200 ; vaddps %ymm0,%ymm9,%ymm9
- DB 196,98,125,24,21,31,232,1,0 ; vbroadcastss 0x1e81f(%rip),%ymm10 # 2e54c <_sk_srcover_bgra_8888_sse2_lowp+0x404>
+ DB 196,98,125,24,21,104,232,1,0 ; vbroadcastss 0x1e868(%rip),%ymm10 # 2e538 <_sk_srcover_bgra_8888_sse2_lowp+0x3f0>
DB 196,65,52,89,202 ; vmulps %ymm10,%ymm9,%ymm9
DB 197,252,89,192 ; vmulps %ymm0,%ymm0,%ymm0
DB 197,116,89,209 ; vmulps %ymm1,%ymm1,%ymm10
@@ -14836,7 +14815,7 @@ _sk_xy_to_2pt_conical_linear_avx LABEL PROC
DB 196,227,121,4,192,0 ; vpermilps $0x0,%xmm0,%xmm0
DB 196,227,125,24,192,1 ; vinsertf128 $0x1,%xmm0,%ymm0,%ymm0
DB 197,172,92,192 ; vsubps %ymm0,%ymm10,%ymm0
- DB 196,98,125,24,5,247,231,1,0 ; vbroadcastss 0x1e7f7(%rip),%ymm8 # 2e554 <_sk_srcover_bgra_8888_sse2_lowp+0x40c>
+ DB 196,98,125,24,5,64,232,1,0 ; vbroadcastss 0x1e840(%rip),%ymm8 # 2e540 <_sk_srcover_bgra_8888_sse2_lowp+0x3f8>
DB 196,193,124,87,192 ; vxorps %ymm8,%ymm0,%ymm0
DB 196,193,124,94,193 ; vdivps %ymm9,%ymm0,%ymm0
DB 72,173 ; lods %ds:(%rsi),%rax
@@ -14874,7 +14853,7 @@ _sk_apply_vector_mask_avx LABEL PROC
PUBLIC _sk_save_xy_avx
_sk_save_xy_avx LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,98,125,24,5,29,230,1,0 ; vbroadcastss 0x1e61d(%rip),%ymm8 # 2e3f4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
+ DB 196,98,125,24,5,122,230,1,0 ; vbroadcastss 0x1e67a(%rip),%ymm8 # 2e3f4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
DB 196,65,124,88,200 ; vaddps %ymm8,%ymm0,%ymm9
DB 196,67,125,8,209,1 ; vroundps $0x1,%ymm9,%ymm10
DB 196,65,52,92,202 ; vsubps %ymm10,%ymm9,%ymm9
@@ -14907,9 +14886,9 @@ _sk_accumulate_avx LABEL PROC
PUBLIC _sk_bilinear_nx_avx
_sk_bilinear_nx_avx LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,5,3,231,1,0 ; vbroadcastss 0x1e703(%rip),%ymm0 # 2e558 <_sk_srcover_bgra_8888_sse2_lowp+0x410>
+ DB 196,226,125,24,5,76,231,1,0 ; vbroadcastss 0x1e74c(%rip),%ymm0 # 2e544 <_sk_srcover_bgra_8888_sse2_lowp+0x3fc>
DB 197,252,88,0 ; vaddps (%rax),%ymm0,%ymm0
- DB 196,98,125,24,5,150,229,1,0 ; vbroadcastss 0x1e596(%rip),%ymm8 # 2e3f8 <_sk_srcover_bgra_8888_sse2_lowp+0x2b0>
+ DB 196,98,125,24,5,243,229,1,0 ; vbroadcastss 0x1e5f3(%rip),%ymm8 # 2e3f8 <_sk_srcover_bgra_8888_sse2_lowp+0x2b0>
DB 197,60,92,128,128,0,0,0 ; vsubps 0x80(%rax),%ymm8,%ymm8
DB 197,124,17,128,0,1,0,0 ; vmovups %ymm8,0x100(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
@@ -14918,7 +14897,7 @@ _sk_bilinear_nx_avx LABEL PROC
PUBLIC _sk_bilinear_px_avx
_sk_bilinear_px_avx LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,5,115,229,1,0 ; vbroadcastss 0x1e573(%rip),%ymm0 # 2e3f4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
+ DB 196,226,125,24,5,208,229,1,0 ; vbroadcastss 0x1e5d0(%rip),%ymm0 # 2e3f4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
DB 197,252,88,0 ; vaddps (%rax),%ymm0,%ymm0
DB 197,124,16,128,128,0,0,0 ; vmovups 0x80(%rax),%ymm8
DB 197,124,17,128,0,1,0,0 ; vmovups %ymm8,0x100(%rax)
@@ -14928,9 +14907,9 @@ _sk_bilinear_px_avx LABEL PROC
PUBLIC _sk_bilinear_ny_avx
_sk_bilinear_ny_avx LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,13,180,230,1,0 ; vbroadcastss 0x1e6b4(%rip),%ymm1 # 2e558 <_sk_srcover_bgra_8888_sse2_lowp+0x410>
+ DB 196,226,125,24,13,253,230,1,0 ; vbroadcastss 0x1e6fd(%rip),%ymm1 # 2e544 <_sk_srcover_bgra_8888_sse2_lowp+0x3fc>
DB 197,244,88,72,64 ; vaddps 0x40(%rax),%ymm1,%ymm1
- DB 196,98,125,24,5,70,229,1,0 ; vbroadcastss 0x1e546(%rip),%ymm8 # 2e3f8 <_sk_srcover_bgra_8888_sse2_lowp+0x2b0>
+ DB 196,98,125,24,5,163,229,1,0 ; vbroadcastss 0x1e5a3(%rip),%ymm8 # 2e3f8 <_sk_srcover_bgra_8888_sse2_lowp+0x2b0>
DB 197,60,92,128,192,0,0,0 ; vsubps 0xc0(%rax),%ymm8,%ymm8
DB 197,124,17,128,64,1,0,0 ; vmovups %ymm8,0x140(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
@@ -14939,7 +14918,7 @@ _sk_bilinear_ny_avx LABEL PROC
PUBLIC _sk_bilinear_py_avx
_sk_bilinear_py_avx LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,13,35,229,1,0 ; vbroadcastss 0x1e523(%rip),%ymm1 # 2e3f4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
+ DB 196,226,125,24,13,128,229,1,0 ; vbroadcastss 0x1e580(%rip),%ymm1 # 2e3f4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
DB 197,244,88,72,64 ; vaddps 0x40(%rax),%ymm1,%ymm1
DB 197,124,16,128,192,0,0,0 ; vmovups 0xc0(%rax),%ymm8
DB 197,124,17,128,64,1,0,0 ; vmovups %ymm8,0x140(%rax)
@@ -14949,14 +14928,14 @@ _sk_bilinear_py_avx LABEL PROC
PUBLIC _sk_bicubic_n3x_avx
_sk_bicubic_n3x_avx LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,5,103,230,1,0 ; vbroadcastss 0x1e667(%rip),%ymm0 # 2e55c <_sk_srcover_bgra_8888_sse2_lowp+0x414>
+ DB 196,226,125,24,5,176,230,1,0 ; vbroadcastss 0x1e6b0(%rip),%ymm0 # 2e548 <_sk_srcover_bgra_8888_sse2_lowp+0x400>
DB 197,252,88,0 ; vaddps (%rax),%ymm0,%ymm0
- DB 196,98,125,24,5,246,228,1,0 ; vbroadcastss 0x1e4f6(%rip),%ymm8 # 2e3f8 <_sk_srcover_bgra_8888_sse2_lowp+0x2b0>
+ DB 196,98,125,24,5,83,229,1,0 ; vbroadcastss 0x1e553(%rip),%ymm8 # 2e3f8 <_sk_srcover_bgra_8888_sse2_lowp+0x2b0>
DB 197,60,92,128,128,0,0,0 ; vsubps 0x80(%rax),%ymm8,%ymm8
DB 196,65,60,89,200 ; vmulps %ymm8,%ymm8,%ymm9
- DB 196,98,125,24,21,72,230,1,0 ; vbroadcastss 0x1e648(%rip),%ymm10 # 2e560 <_sk_srcover_bgra_8888_sse2_lowp+0x418>
+ DB 196,98,125,24,21,145,230,1,0 ; vbroadcastss 0x1e691(%rip),%ymm10 # 2e54c <_sk_srcover_bgra_8888_sse2_lowp+0x404>
DB 196,65,60,89,194 ; vmulps %ymm10,%ymm8,%ymm8
- DB 196,98,125,24,21,70,229,1,0 ; vbroadcastss 0x1e546(%rip),%ymm10 # 2e46c <_sk_srcover_bgra_8888_sse2_lowp+0x324>
+ DB 196,98,125,24,21,163,229,1,0 ; vbroadcastss 0x1e5a3(%rip),%ymm10 # 2e46c <_sk_srcover_bgra_8888_sse2_lowp+0x324>
DB 196,65,60,88,194 ; vaddps %ymm10,%ymm8,%ymm8
DB 196,65,52,89,192 ; vmulps %ymm8,%ymm9,%ymm8
DB 197,124,17,128,0,1,0,0 ; vmovups %ymm8,0x100(%rax)
@@ -14966,19 +14945,19 @@ _sk_bicubic_n3x_avx LABEL PROC
PUBLIC _sk_bicubic_n1x_avx
_sk_bicubic_n1x_avx LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,5,17,230,1,0 ; vbroadcastss 0x1e611(%rip),%ymm0 # 2e558 <_sk_srcover_bgra_8888_sse2_lowp+0x410>
+ DB 196,226,125,24,5,90,230,1,0 ; vbroadcastss 0x1e65a(%rip),%ymm0 # 2e544 <_sk_srcover_bgra_8888_sse2_lowp+0x3fc>
DB 197,252,88,0 ; vaddps (%rax),%ymm0,%ymm0
- DB 196,98,125,24,5,164,228,1,0 ; vbroadcastss 0x1e4a4(%rip),%ymm8 # 2e3f8 <_sk_srcover_bgra_8888_sse2_lowp+0x2b0>
+ DB 196,98,125,24,5,1,229,1,0 ; vbroadcastss 0x1e501(%rip),%ymm8 # 2e3f8 <_sk_srcover_bgra_8888_sse2_lowp+0x2b0>
DB 197,60,92,128,128,0,0,0 ; vsubps 0x80(%rax),%ymm8,%ymm8
- DB 196,98,125,24,13,3,230,1,0 ; vbroadcastss 0x1e603(%rip),%ymm9 # 2e568 <_sk_srcover_bgra_8888_sse2_lowp+0x420>
+ DB 196,98,125,24,13,76,230,1,0 ; vbroadcastss 0x1e64c(%rip),%ymm9 # 2e554 <_sk_srcover_bgra_8888_sse2_lowp+0x40c>
DB 196,65,60,89,201 ; vmulps %ymm9,%ymm8,%ymm9
- DB 196,98,125,24,21,241,229,1,0 ; vbroadcastss 0x1e5f1(%rip),%ymm10 # 2e564 <_sk_srcover_bgra_8888_sse2_lowp+0x41c>
+ DB 196,98,125,24,21,58,230,1,0 ; vbroadcastss 0x1e63a(%rip),%ymm10 # 2e550 <_sk_srcover_bgra_8888_sse2_lowp+0x408>
DB 196,65,52,88,202 ; vaddps %ymm10,%ymm9,%ymm9
DB 196,65,60,89,201 ; vmulps %ymm9,%ymm8,%ymm9
- DB 196,98,125,24,21,110,228,1,0 ; vbroadcastss 0x1e46e(%rip),%ymm10 # 2e3f4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
+ DB 196,98,125,24,21,203,228,1,0 ; vbroadcastss 0x1e4cb(%rip),%ymm10 # 2e3f4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
DB 196,65,52,88,202 ; vaddps %ymm10,%ymm9,%ymm9
DB 196,65,60,89,193 ; vmulps %ymm9,%ymm8,%ymm8
- DB 196,98,125,24,13,211,229,1,0 ; vbroadcastss 0x1e5d3(%rip),%ymm9 # 2e56c <_sk_srcover_bgra_8888_sse2_lowp+0x424>
+ DB 196,98,125,24,13,28,230,1,0 ; vbroadcastss 0x1e61c(%rip),%ymm9 # 2e558 <_sk_srcover_bgra_8888_sse2_lowp+0x410>
DB 196,65,60,88,193 ; vaddps %ymm9,%ymm8,%ymm8
DB 197,124,17,128,0,1,0,0 ; vmovups %ymm8,0x100(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
@@ -14987,17 +14966,17 @@ _sk_bicubic_n1x_avx LABEL PROC
PUBLIC _sk_bicubic_p1x_avx
_sk_bicubic_p1x_avx LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,98,125,24,5,63,228,1,0 ; vbroadcastss 0x1e43f(%rip),%ymm8 # 2e3f4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
+ DB 196,98,125,24,5,156,228,1,0 ; vbroadcastss 0x1e49c(%rip),%ymm8 # 2e3f4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
DB 197,188,88,0 ; vaddps (%rax),%ymm8,%ymm0
DB 197,124,16,136,128,0,0,0 ; vmovups 0x80(%rax),%ymm9
- DB 196,98,125,24,21,158,229,1,0 ; vbroadcastss 0x1e59e(%rip),%ymm10 # 2e568 <_sk_srcover_bgra_8888_sse2_lowp+0x420>
+ DB 196,98,125,24,21,231,229,1,0 ; vbroadcastss 0x1e5e7(%rip),%ymm10 # 2e554 <_sk_srcover_bgra_8888_sse2_lowp+0x40c>
DB 196,65,52,89,210 ; vmulps %ymm10,%ymm9,%ymm10
- DB 196,98,125,24,29,140,229,1,0 ; vbroadcastss 0x1e58c(%rip),%ymm11 # 2e564 <_sk_srcover_bgra_8888_sse2_lowp+0x41c>
+ DB 196,98,125,24,29,213,229,1,0 ; vbroadcastss 0x1e5d5(%rip),%ymm11 # 2e550 <_sk_srcover_bgra_8888_sse2_lowp+0x408>
DB 196,65,44,88,211 ; vaddps %ymm11,%ymm10,%ymm10
DB 196,65,52,89,210 ; vmulps %ymm10,%ymm9,%ymm10
DB 196,65,44,88,192 ; vaddps %ymm8,%ymm10,%ymm8
DB 196,65,52,89,192 ; vmulps %ymm8,%ymm9,%ymm8
- DB 196,98,125,24,13,119,229,1,0 ; vbroadcastss 0x1e577(%rip),%ymm9 # 2e56c <_sk_srcover_bgra_8888_sse2_lowp+0x424>
+ DB 196,98,125,24,13,192,229,1,0 ; vbroadcastss 0x1e5c0(%rip),%ymm9 # 2e558 <_sk_srcover_bgra_8888_sse2_lowp+0x410>
DB 196,65,60,88,193 ; vaddps %ymm9,%ymm8,%ymm8
DB 197,124,17,128,0,1,0,0 ; vmovups %ymm8,0x100(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
@@ -15006,13 +14985,13 @@ _sk_bicubic_p1x_avx LABEL PROC
PUBLIC _sk_bicubic_p3x_avx
_sk_bicubic_p3x_avx LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,5,83,229,1,0 ; vbroadcastss 0x1e553(%rip),%ymm0 # 2e564 <_sk_srcover_bgra_8888_sse2_lowp+0x41c>
+ DB 196,226,125,24,5,156,229,1,0 ; vbroadcastss 0x1e59c(%rip),%ymm0 # 2e550 <_sk_srcover_bgra_8888_sse2_lowp+0x408>
DB 197,252,88,0 ; vaddps (%rax),%ymm0,%ymm0
DB 197,124,16,128,128,0,0,0 ; vmovups 0x80(%rax),%ymm8
DB 196,65,60,89,200 ; vmulps %ymm8,%ymm8,%ymm9
- DB 196,98,125,24,21,53,229,1,0 ; vbroadcastss 0x1e535(%rip),%ymm10 # 2e560 <_sk_srcover_bgra_8888_sse2_lowp+0x418>
+ DB 196,98,125,24,21,126,229,1,0 ; vbroadcastss 0x1e57e(%rip),%ymm10 # 2e54c <_sk_srcover_bgra_8888_sse2_lowp+0x404>
DB 196,65,60,89,194 ; vmulps %ymm10,%ymm8,%ymm8
- DB 196,98,125,24,21,51,228,1,0 ; vbroadcastss 0x1e433(%rip),%ymm10 # 2e46c <_sk_srcover_bgra_8888_sse2_lowp+0x324>
+ DB 196,98,125,24,21,144,228,1,0 ; vbroadcastss 0x1e490(%rip),%ymm10 # 2e46c <_sk_srcover_bgra_8888_sse2_lowp+0x324>
DB 196,65,60,88,194 ; vaddps %ymm10,%ymm8,%ymm8
DB 196,65,52,89,192 ; vmulps %ymm8,%ymm9,%ymm8
DB 197,124,17,128,0,1,0,0 ; vmovups %ymm8,0x100(%rax)
@@ -15022,14 +15001,14 @@ _sk_bicubic_p3x_avx LABEL PROC
PUBLIC _sk_bicubic_n3y_avx
_sk_bicubic_n3y_avx LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,13,2,229,1,0 ; vbroadcastss 0x1e502(%rip),%ymm1 # 2e55c <_sk_srcover_bgra_8888_sse2_lowp+0x414>
+ DB 196,226,125,24,13,75,229,1,0 ; vbroadcastss 0x1e54b(%rip),%ymm1 # 2e548 <_sk_srcover_bgra_8888_sse2_lowp+0x400>
DB 197,244,88,72,64 ; vaddps 0x40(%rax),%ymm1,%ymm1
- DB 196,98,125,24,5,144,227,1,0 ; vbroadcastss 0x1e390(%rip),%ymm8 # 2e3f8 <_sk_srcover_bgra_8888_sse2_lowp+0x2b0>
+ DB 196,98,125,24,5,237,227,1,0 ; vbroadcastss 0x1e3ed(%rip),%ymm8 # 2e3f8 <_sk_srcover_bgra_8888_sse2_lowp+0x2b0>
DB 197,60,92,128,192,0,0,0 ; vsubps 0xc0(%rax),%ymm8,%ymm8
DB 196,65,60,89,200 ; vmulps %ymm8,%ymm8,%ymm9
- DB 196,98,125,24,21,226,228,1,0 ; vbroadcastss 0x1e4e2(%rip),%ymm10 # 2e560 <_sk_srcover_bgra_8888_sse2_lowp+0x418>
+ DB 196,98,125,24,21,43,229,1,0 ; vbroadcastss 0x1e52b(%rip),%ymm10 # 2e54c <_sk_srcover_bgra_8888_sse2_lowp+0x404>
DB 196,65,60,89,194 ; vmulps %ymm10,%ymm8,%ymm8
- DB 196,98,125,24,21,224,227,1,0 ; vbroadcastss 0x1e3e0(%rip),%ymm10 # 2e46c <_sk_srcover_bgra_8888_sse2_lowp+0x324>
+ DB 196,98,125,24,21,61,228,1,0 ; vbroadcastss 0x1e43d(%rip),%ymm10 # 2e46c <_sk_srcover_bgra_8888_sse2_lowp+0x324>
DB 196,65,60,88,194 ; vaddps %ymm10,%ymm8,%ymm8
DB 196,65,52,89,192 ; vmulps %ymm8,%ymm9,%ymm8
DB 197,124,17,128,64,1,0,0 ; vmovups %ymm8,0x140(%rax)
@@ -15039,19 +15018,19 @@ _sk_bicubic_n3y_avx LABEL PROC
PUBLIC _sk_bicubic_n1y_avx
_sk_bicubic_n1y_avx LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,13,171,228,1,0 ; vbroadcastss 0x1e4ab(%rip),%ymm1 # 2e558 <_sk_srcover_bgra_8888_sse2_lowp+0x410>
+ DB 196,226,125,24,13,244,228,1,0 ; vbroadcastss 0x1e4f4(%rip),%ymm1 # 2e544 <_sk_srcover_bgra_8888_sse2_lowp+0x3fc>
DB 197,244,88,72,64 ; vaddps 0x40(%rax),%ymm1,%ymm1
- DB 196,98,125,24,5,61,227,1,0 ; vbroadcastss 0x1e33d(%rip),%ymm8 # 2e3f8 <_sk_srcover_bgra_8888_sse2_lowp+0x2b0>
+ DB 196,98,125,24,5,154,227,1,0 ; vbroadcastss 0x1e39a(%rip),%ymm8 # 2e3f8 <_sk_srcover_bgra_8888_sse2_lowp+0x2b0>
DB 197,60,92,128,192,0,0,0 ; vsubps 0xc0(%rax),%ymm8,%ymm8
- DB 196,98,125,24,13,156,228,1,0 ; vbroadcastss 0x1e49c(%rip),%ymm9 # 2e568 <_sk_srcover_bgra_8888_sse2_lowp+0x420>
+ DB 196,98,125,24,13,229,228,1,0 ; vbroadcastss 0x1e4e5(%rip),%ymm9 # 2e554 <_sk_srcover_bgra_8888_sse2_lowp+0x40c>
DB 196,65,60,89,201 ; vmulps %ymm9,%ymm8,%ymm9
- DB 196,98,125,24,21,138,228,1,0 ; vbroadcastss 0x1e48a(%rip),%ymm10 # 2e564 <_sk_srcover_bgra_8888_sse2_lowp+0x41c>
+ DB 196,98,125,24,21,211,228,1,0 ; vbroadcastss 0x1e4d3(%rip),%ymm10 # 2e550 <_sk_srcover_bgra_8888_sse2_lowp+0x408>
DB 196,65,52,88,202 ; vaddps %ymm10,%ymm9,%ymm9
DB 196,65,60,89,201 ; vmulps %ymm9,%ymm8,%ymm9
- DB 196,98,125,24,21,7,227,1,0 ; vbroadcastss 0x1e307(%rip),%ymm10 # 2e3f4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
+ DB 196,98,125,24,21,100,227,1,0 ; vbroadcastss 0x1e364(%rip),%ymm10 # 2e3f4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
DB 196,65,52,88,202 ; vaddps %ymm10,%ymm9,%ymm9
DB 196,65,60,89,193 ; vmulps %ymm9,%ymm8,%ymm8
- DB 196,98,125,24,13,108,228,1,0 ; vbroadcastss 0x1e46c(%rip),%ymm9 # 2e56c <_sk_srcover_bgra_8888_sse2_lowp+0x424>
+ DB 196,98,125,24,13,181,228,1,0 ; vbroadcastss 0x1e4b5(%rip),%ymm9 # 2e558 <_sk_srcover_bgra_8888_sse2_lowp+0x410>
DB 196,65,60,88,193 ; vaddps %ymm9,%ymm8,%ymm8
DB 197,124,17,128,64,1,0,0 ; vmovups %ymm8,0x140(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
@@ -15060,17 +15039,17 @@ _sk_bicubic_n1y_avx LABEL PROC
PUBLIC _sk_bicubic_p1y_avx
_sk_bicubic_p1y_avx LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,98,125,24,5,216,226,1,0 ; vbroadcastss 0x1e2d8(%rip),%ymm8 # 2e3f4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
+ DB 196,98,125,24,5,53,227,1,0 ; vbroadcastss 0x1e335(%rip),%ymm8 # 2e3f4 <_sk_srcover_bgra_8888_sse2_lowp+0x2ac>
DB 197,188,88,72,64 ; vaddps 0x40(%rax),%ymm8,%ymm1
DB 197,124,16,136,192,0,0,0 ; vmovups 0xc0(%rax),%ymm9
- DB 196,98,125,24,21,54,228,1,0 ; vbroadcastss 0x1e436(%rip),%ymm10 # 2e568 <_sk_srcover_bgra_8888_sse2_lowp+0x420>
+ DB 196,98,125,24,21,127,228,1,0 ; vbroadcastss 0x1e47f(%rip),%ymm10 # 2e554 <_sk_srcover_bgra_8888_sse2_lowp+0x40c>
DB 196,65,52,89,210 ; vmulps %ymm10,%ymm9,%ymm10
- DB 196,98,125,24,29,36,228,1,0 ; vbroadcastss 0x1e424(%rip),%ymm11 # 2e564 <_sk_srcover_bgra_8888_sse2_lowp+0x41c>
+ DB 196,98,125,24,29,109,228,1,0 ; vbroadcastss 0x1e46d(%rip),%ymm11 # 2e550 <_sk_srcover_bgra_8888_sse2_lowp+0x408>
DB 196,65,44,88,211 ; vaddps %ymm11,%ymm10,%ymm10
DB 196,65,52,89,210 ; vmulps %ymm10,%ymm9,%ymm10
DB 196,65,44,88,192 ; vaddps %ymm8,%ymm10,%ymm8
DB 196,65,52,89,192 ; vmulps %ymm8,%ymm9,%ymm8
- DB 196,98,125,24,13,15,228,1,0 ; vbroadcastss 0x1e40f(%rip),%ymm9 # 2e56c <_sk_srcover_bgra_8888_sse2_lowp+0x424>
+ DB 196,98,125,24,13,88,228,1,0 ; vbroadcastss 0x1e458(%rip),%ymm9 # 2e558 <_sk_srcover_bgra_8888_sse2_lowp+0x410>
DB 196,65,60,88,193 ; vaddps %ymm9,%ymm8,%ymm8
DB 197,124,17,128,64,1,0,0 ; vmovups %ymm8,0x140(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
@@ -15079,13 +15058,13 @@ _sk_bicubic_p1y_avx LABEL PROC
PUBLIC _sk_bicubic_p3y_avx
_sk_bicubic_p3y_avx LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,13,235,227,1,0 ; vbroadcastss 0x1e3eb(%rip),%ymm1 # 2e564 <_sk_srcover_bgra_8888_sse2_lowp+0x41c>
+ DB 196,226,125,24,13,52,228,1,0 ; vbroadcastss 0x1e434(%rip),%ymm1 # 2e550 <_sk_srcover_bgra_8888_sse2_lowp+0x408>
DB 197,244,88,72,64 ; vaddps 0x40(%rax),%ymm1,%ymm1
DB 197,124,16,128,192,0,0,0 ; vmovups 0xc0(%rax),%ymm8
DB 196,65,60,89,200 ; vmulps %ymm8,%ymm8,%ymm9
- DB 196,98,125,24,21,204,227,1,0 ; vbroadcastss 0x1e3cc(%rip),%ymm10 # 2e560 <_sk_srcover_bgra_8888_sse2_lowp+0x418>
+ DB 196,98,125,24,21,21,228,1,0 ; vbroadcastss 0x1e415(%rip),%ymm10 # 2e54c <_sk_srcover_bgra_8888_sse2_lowp+0x404>
DB 196,65,60,89,194 ; vmulps %ymm10,%ymm8,%ymm8
- DB 196,98,125,24,21,202,226,1,0 ; vbroadcastss 0x1e2ca(%rip),%ymm10 # 2e46c <_sk_srcover_bgra_8888_sse2_lowp+0x324>
+ DB 196,98,125,24,21,39,227,1,0 ; vbroadcastss 0x1e327(%rip),%ymm10 # 2e46c <_sk_srcover_bgra_8888_sse2_lowp+0x324>
DB 196,65,60,88,194 ; vaddps %ymm10,%ymm8,%ymm8
DB 196,65,52,89,192 ; vmulps %ymm8,%ymm9,%ymm8
DB 197,124,17,128,64,1,0,0 ; vmovups %ymm8,0x140(%rax)
@@ -15221,7 +15200,7 @@ _sk_clut_3D_avx LABEL PROC
DB 72,139,0 ; mov (%rax),%rax
DB 197,217,254,207 ; vpaddd %xmm7,%xmm4,%xmm1
DB 197,249,254,193 ; vpaddd %xmm1,%xmm0,%xmm0
- DB 196,226,121,24,37,110,225,1,0 ; vbroadcastss 0x1e16e(%rip),%xmm4 # 2e574 <_sk_srcover_bgra_8888_sse2_lowp+0x42c>
+ DB 196,226,121,24,37,183,225,1,0 ; vbroadcastss 0x1e1b7(%rip),%xmm4 # 2e560 <_sk_srcover_bgra_8888_sse2_lowp+0x418>
DB 196,98,121,64,228 ; vpmulld %xmm4,%xmm0,%xmm12
DB 196,226,49,64,198 ; vpmulld %xmm6,%xmm9,%xmm0
DB 197,249,127,132,36,0,1,0,0 ; vmovdqa %xmm0,0x100(%rsp)
@@ -15275,7 +15254,7 @@ _sk_clut_3D_avx LABEL PROC
DB 196,161,122,16,60,128 ; vmovss (%rax,%r8,4),%xmm7
DB 196,227,73,33,247,48 ; vinsertps $0x30,%xmm7,%xmm6,%xmm6
DB 196,227,77,24,237,1 ; vinsertf128 $0x1,%xmm5,%ymm6,%ymm5
- DB 196,98,121,24,21,211,222,1,0 ; vbroadcastss 0x1ded3(%rip),%xmm10 # 2e404 <_sk_srcover_bgra_8888_sse2_lowp+0x2bc>
+ DB 196,98,121,24,21,48,223,1,0 ; vbroadcastss 0x1df30(%rip),%xmm10 # 2e404 <_sk_srcover_bgra_8888_sse2_lowp+0x2bc>
DB 196,193,105,254,210 ; vpaddd %xmm10,%xmm2,%xmm2
DB 196,195,249,22,208,1 ; vpextrq $0x1,%xmm2,%r8
DB 196,193,249,126,209 ; vmovq %xmm2,%r9
@@ -15303,7 +15282,7 @@ _sk_clut_3D_avx LABEL PROC
DB 196,161,122,16,60,128 ; vmovss (%rax,%r8,4),%xmm7
DB 196,227,73,33,247,48 ; vinsertps $0x30,%xmm7,%xmm6,%xmm6
DB 196,227,77,24,210,1 ; vinsertf128 $0x1,%xmm2,%ymm6,%ymm2
- DB 196,226,125,24,61,171,223,1,0 ; vbroadcastss 0x1dfab(%rip),%ymm7 # 2e570 <_sk_srcover_bgra_8888_sse2_lowp+0x428>
+ DB 196,226,125,24,61,244,223,1,0 ; vbroadcastss 0x1dff4(%rip),%ymm7 # 2e55c <_sk_srcover_bgra_8888_sse2_lowp+0x414>
DB 197,148,88,247 ; vaddps %ymm7,%ymm13,%ymm6
DB 197,124,40,231 ; vmovaps %ymm7,%ymm12
DB 197,124,17,164,36,128,0,0,0 ; vmovups %ymm12,0x80(%rsp)
@@ -16044,7 +16023,7 @@ _sk_clut_4D_avx LABEL PROC
DB 197,249,127,132,36,160,0,0,0 ; vmovdqa %xmm0,0xa0(%rsp)
DB 197,225,254,216 ; vpaddd %xmm0,%xmm3,%xmm3
DB 197,233,254,195 ; vpaddd %xmm3,%xmm2,%xmm0
- DB 196,98,121,24,13,60,208,1,0 ; vbroadcastss 0x1d03c(%rip),%xmm9 # 2e574 <_sk_srcover_bgra_8888_sse2_lowp+0x42c>
+ DB 196,98,121,24,13,133,208,1,0 ; vbroadcastss 0x1d085(%rip),%xmm9 # 2e560 <_sk_srcover_bgra_8888_sse2_lowp+0x418>
DB 196,194,121,64,209 ; vpmulld %xmm9,%xmm0,%xmm2
DB 196,226,81,64,199 ; vpmulld %xmm7,%xmm5,%xmm0
DB 197,249,127,132,36,224,1,0,0 ; vmovdqa %xmm0,0x1e0(%rsp)
@@ -16101,7 +16080,7 @@ _sk_clut_4D_avx LABEL PROC
DB 196,161,122,16,60,128 ; vmovss (%rax,%r8,4),%xmm7
DB 196,227,73,33,247,48 ; vinsertps $0x30,%xmm7,%xmm6,%xmm6
DB 196,227,77,24,237,1 ; vinsertf128 $0x1,%xmm5,%ymm6,%ymm5
- DB 196,98,121,24,21,145,205,1,0 ; vbroadcastss 0x1cd91(%rip),%xmm10 # 2e404 <_sk_srcover_bgra_8888_sse2_lowp+0x2bc>
+ DB 196,98,121,24,21,238,205,1,0 ; vbroadcastss 0x1cdee(%rip),%xmm10 # 2e404 <_sk_srcover_bgra_8888_sse2_lowp+0x2bc>
DB 196,193,121,254,194 ; vpaddd %xmm10,%xmm0,%xmm0
DB 196,195,249,22,192,1 ; vpextrq $0x1,%xmm0,%r8
DB 196,193,249,126,193 ; vmovq %xmm0,%r9
@@ -16129,7 +16108,7 @@ _sk_clut_4D_avx LABEL PROC
DB 196,161,122,16,52,128 ; vmovss (%rax,%r8,4),%xmm6
DB 196,227,105,33,214,48 ; vinsertps $0x30,%xmm6,%xmm2,%xmm2
DB 196,227,109,24,208,1 ; vinsertf128 $0x1,%xmm0,%ymm2,%ymm2
- DB 196,98,125,24,37,105,206,1,0 ; vbroadcastss 0x1ce69(%rip),%ymm12 # 2e570 <_sk_srcover_bgra_8888_sse2_lowp+0x428>
+ DB 196,98,125,24,37,178,206,1,0 ; vbroadcastss 0x1ceb2(%rip),%ymm12 # 2e55c <_sk_srcover_bgra_8888_sse2_lowp+0x414>
DB 196,193,4,88,196 ; vaddps %ymm12,%ymm15,%ymm0
DB 197,124,17,164,36,128,0,0,0 ; vmovups %ymm12,0x80(%rsp)
DB 197,254,91,192 ; vcvttps2dq %ymm0,%ymm0
@@ -17527,7 +17506,7 @@ _sk_clut_4D_avx LABEL PROC
DB 197,228,89,210 ; vmulps %ymm2,%ymm3,%ymm2
DB 197,220,88,210 ; vaddps %ymm2,%ymm4,%ymm2
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 196,226,125,24,29,107,175,1,0 ; vbroadcastss 0x1af6b(%rip),%ymm3 # 2e3f8 <_sk_srcover_bgra_8888_sse2_lowp+0x2b0>
+ DB 196,226,125,24,29,200,175,1,0 ; vbroadcastss 0x1afc8(%rip),%ymm3 # 2e3f8 <_sk_srcover_bgra_8888_sse2_lowp+0x2b0>
DB 197,252,16,164,36,192,2,0,0 ; vmovups 0x2c0(%rsp),%ymm4
DB 197,252,16,172,36,224,2,0,0 ; vmovups 0x2e0(%rsp),%ymm5
DB 197,252,16,180,36,0,3,0,0 ; vmovups 0x300(%rsp),%ymm6
@@ -17539,6 +17518,27 @@ _sk_clut_4D_avx LABEL PROC
DB 65,95 ; pop %r15
DB 255,224 ; jmpq *%rax
+PUBLIC _sk_gauss_a_to_rgba_avx
+_sk_gauss_a_to_rgba_avx LABEL PROC
+ DB 196,226,125,24,5,251,176,1,0 ; vbroadcastss 0x1b0fb(%rip),%ymm0 # 2e568 <_sk_srcover_bgra_8888_sse2_lowp+0x420>
+ DB 197,228,89,192 ; vmulps %ymm0,%ymm3,%ymm0
+ DB 196,226,125,24,13,234,176,1,0 ; vbroadcastss 0x1b0ea(%rip),%ymm1 # 2e564 <_sk_srcover_bgra_8888_sse2_lowp+0x41c>
+ DB 197,252,88,193 ; vaddps %ymm1,%ymm0,%ymm0
+ DB 197,252,89,195 ; vmulps %ymm3,%ymm0,%ymm0
+ DB 196,226,125,24,13,225,176,1,0 ; vbroadcastss 0x1b0e1(%rip),%ymm1 # 2e56c <_sk_srcover_bgra_8888_sse2_lowp+0x424>
+ DB 197,252,88,193 ; vaddps %ymm1,%ymm0,%ymm0
+ DB 197,252,89,195 ; vmulps %ymm3,%ymm0,%ymm0
+ DB 196,226,125,24,13,212,176,1,0 ; vbroadcastss 0x1b0d4(%rip),%ymm1 # 2e570 <_sk_srcover_bgra_8888_sse2_lowp+0x428>
+ DB 197,252,88,193 ; vaddps %ymm1,%ymm0,%ymm0
+ DB 197,252,89,195 ; vmulps %ymm3,%ymm0,%ymm0
+ DB 196,226,125,24,13,199,176,1,0 ; vbroadcastss 0x1b0c7(%rip),%ymm1 # 2e574 <_sk_srcover_bgra_8888_sse2_lowp+0x42c>
+ DB 197,252,88,193 ; vaddps %ymm1,%ymm0,%ymm0
+ DB 72,173 ; lods %ds:(%rsi),%rax
+ DB 197,252,40,200 ; vmovaps %ymm0,%ymm1
+ DB 197,252,40,208 ; vmovaps %ymm0,%ymm2
+ DB 197,252,40,216 ; vmovaps %ymm0,%ymm3
+ DB 255,224 ; jmpq *%rax
+
PUBLIC _sk_start_pipeline_sse41
_sk_start_pipeline_sse41 LABEL PROC
DB 85 ; push %rbp
@@ -23324,23 +23324,6 @@ _sk_evenly_spaced_gradient_sse41 LABEL PROC
DB 65,94 ; pop %r14
DB 255,224 ; jmpq *%rax
-PUBLIC _sk_gauss_a_to_rgba_sse41
-_sk_gauss_a_to_rgba_sse41 LABEL PROC
- DB 15,40,5,71,98,1,0 ; movaps 0x16247(%rip),%xmm0 # 2f200 <_sk_srcover_bgra_8888_sse2_lowp+0x10b8>
- DB 15,89,195 ; mulps %xmm3,%xmm0
- DB 15,88,5,77,98,1,0 ; addps 0x1624d(%rip),%xmm0 # 2f210 <_sk_srcover_bgra_8888_sse2_lowp+0x10c8>
- DB 15,89,195 ; mulps %xmm3,%xmm0
- DB 15,88,5,83,98,1,0 ; addps 0x16253(%rip),%xmm0 # 2f220 <_sk_srcover_bgra_8888_sse2_lowp+0x10d8>
- DB 15,89,195 ; mulps %xmm3,%xmm0
- DB 15,88,5,89,98,1,0 ; addps 0x16259(%rip),%xmm0 # 2f230 <_sk_srcover_bgra_8888_sse2_lowp+0x10e8>
- DB 15,89,195 ; mulps %xmm3,%xmm0
- DB 15,88,5,95,98,1,0 ; addps 0x1625f(%rip),%xmm0 # 2f240 <_sk_srcover_bgra_8888_sse2_lowp+0x10f8>
- DB 72,173 ; lods %ds:(%rsi),%rax
- DB 15,40,200 ; movaps %xmm0,%xmm1
- DB 15,40,208 ; movaps %xmm0,%xmm2
- DB 15,40,216 ; movaps %xmm0,%xmm3
- DB 255,224 ; jmpq *%rax
-
PUBLIC _sk_gradient_sse41
_sk_gradient_sse41 LABEL PROC
DB 65,86 ; push %r14
@@ -23349,7 +23332,7 @@ _sk_gradient_sse41 LABEL PROC
DB 76,139,0 ; mov (%rax),%r8
DB 102,15,239,201 ; pxor %xmm1,%xmm1
DB 73,131,248,2 ; cmp $0x2,%r8
- DB 114,41 ; jb 19029 <_sk_gradient_sse41+0x3b>
+ DB 114,41 ; jb 18fed <_sk_gradient_sse41+0x3b>
DB 76,139,72,72 ; mov 0x48(%rax),%r9
DB 73,255,200 ; dec %r8
DB 73,131,193,4 ; add $0x4,%r9
@@ -23360,7 +23343,7 @@ _sk_gradient_sse41 LABEL PROC
DB 102,15,250,202 ; psubd %xmm2,%xmm1
DB 73,131,193,4 ; add $0x4,%r9
DB 73,255,200 ; dec %r8
- DB 117,230 ; jne 1900f <_sk_gradient_sse41+0x21>
+ DB 117,230 ; jne 18fd3 <_sk_gradient_sse41+0x21>
DB 102,73,15,58,22,200,1 ; pextrq $0x1,%xmm1,%r8
DB 69,137,193 ; mov %r8d,%r9d
DB 73,193,232,32 ; shr $0x20,%r8
@@ -23485,26 +23468,26 @@ _sk_xy_to_unit_angle_sse41 LABEL PROC
DB 69,15,94,226 ; divps %xmm10,%xmm12
DB 69,15,40,236 ; movaps %xmm12,%xmm13
DB 69,15,89,237 ; mulps %xmm13,%xmm13
- DB 68,15,40,21,214,95,1,0 ; movaps 0x15fd6(%rip),%xmm10 # 2f250 <_sk_srcover_bgra_8888_sse2_lowp+0x1108>
+ DB 68,15,40,21,194,95,1,0 ; movaps 0x15fc2(%rip),%xmm10 # 2f200 <_sk_srcover_bgra_8888_sse2_lowp+0x10b8>
DB 69,15,89,213 ; mulps %xmm13,%xmm10
- DB 68,15,88,21,218,95,1,0 ; addps 0x15fda(%rip),%xmm10 # 2f260 <_sk_srcover_bgra_8888_sse2_lowp+0x1118>
+ DB 68,15,88,21,198,95,1,0 ; addps 0x15fc6(%rip),%xmm10 # 2f210 <_sk_srcover_bgra_8888_sse2_lowp+0x10c8>
DB 69,15,89,213 ; mulps %xmm13,%xmm10
- DB 68,15,88,21,222,95,1,0 ; addps 0x15fde(%rip),%xmm10 # 2f270 <_sk_srcover_bgra_8888_sse2_lowp+0x1128>
+ DB 68,15,88,21,202,95,1,0 ; addps 0x15fca(%rip),%xmm10 # 2f220 <_sk_srcover_bgra_8888_sse2_lowp+0x10d8>
DB 69,15,89,213 ; mulps %xmm13,%xmm10
- DB 68,15,88,21,226,95,1,0 ; addps 0x15fe2(%rip),%xmm10 # 2f280 <_sk_srcover_bgra_8888_sse2_lowp+0x1138>
+ DB 68,15,88,21,206,95,1,0 ; addps 0x15fce(%rip),%xmm10 # 2f230 <_sk_srcover_bgra_8888_sse2_lowp+0x10e8>
DB 69,15,89,212 ; mulps %xmm12,%xmm10
DB 65,15,194,195,1 ; cmpltps %xmm11,%xmm0
- DB 68,15,40,29,225,95,1,0 ; movaps 0x15fe1(%rip),%xmm11 # 2f290 <_sk_srcover_bgra_8888_sse2_lowp+0x1148>
+ DB 68,15,40,29,205,95,1,0 ; movaps 0x15fcd(%rip),%xmm11 # 2f240 <_sk_srcover_bgra_8888_sse2_lowp+0x10f8>
DB 69,15,92,218 ; subps %xmm10,%xmm11
DB 102,69,15,56,20,211 ; blendvps %xmm0,%xmm11,%xmm10
DB 69,15,194,200,1 ; cmpltps %xmm8,%xmm9
- DB 68,15,40,29,154,89,1,0 ; movaps 0x1599a(%rip),%xmm11 # 2ec60 <_sk_srcover_bgra_8888_sse2_lowp+0xb18>
+ DB 68,15,40,29,214,89,1,0 ; movaps 0x159d6(%rip),%xmm11 # 2ec60 <_sk_srcover_bgra_8888_sse2_lowp+0xb18>
DB 69,15,92,218 ; subps %xmm10,%xmm11
DB 65,15,40,193 ; movaps %xmm9,%xmm0
DB 102,69,15,56,20,211 ; blendvps %xmm0,%xmm11,%xmm10
DB 15,40,193 ; movaps %xmm1,%xmm0
DB 65,15,194,192,1 ; cmpltps %xmm8,%xmm0
- DB 68,15,40,13,140,89,1,0 ; movaps 0x1598c(%rip),%xmm9 # 2ec70 <_sk_srcover_bgra_8888_sse2_lowp+0xb28>
+ DB 68,15,40,13,200,89,1,0 ; movaps 0x159c8(%rip),%xmm9 # 2ec70 <_sk_srcover_bgra_8888_sse2_lowp+0xb28>
DB 69,15,92,202 ; subps %xmm10,%xmm9
DB 102,69,15,56,20,209 ; blendvps %xmm0,%xmm9,%xmm10
DB 69,15,194,194,7 ; cmpordps %xmm10,%xmm8
@@ -23534,7 +23517,7 @@ _sk_xy_to_2pt_conical_quadratic_max_sse41 LABEL PROC
DB 243,69,15,89,203 ; mulss %xmm11,%xmm9
DB 69,15,198,201,0 ; shufps $0x0,%xmm9,%xmm9
DB 68,15,88,200 ; addps %xmm0,%xmm9
- DB 68,15,89,13,85,95,1,0 ; mulps 0x15f55(%rip),%xmm9 # 2f2a0 <_sk_srcover_bgra_8888_sse2_lowp+0x1158>
+ DB 68,15,89,13,65,95,1,0 ; mulps 0x15f41(%rip),%xmm9 # 2f250 <_sk_srcover_bgra_8888_sse2_lowp+0x1108>
DB 15,89,192 ; mulps %xmm0,%xmm0
DB 68,15,40,225 ; movaps %xmm1,%xmm12
DB 69,15,89,228 ; mulps %xmm12,%xmm12
@@ -23542,7 +23525,7 @@ _sk_xy_to_2pt_conical_quadratic_max_sse41 LABEL PROC
DB 243,69,15,89,219 ; mulss %xmm11,%xmm11
DB 69,15,198,219,0 ; shufps $0x0,%xmm11,%xmm11
DB 69,15,92,227 ; subps %xmm11,%xmm12
- DB 68,15,89,21,64,95,1,0 ; mulps 0x15f40(%rip),%xmm10 # 2f2b0 <_sk_srcover_bgra_8888_sse2_lowp+0x1168>
+ DB 68,15,89,21,44,95,1,0 ; mulps 0x15f2c(%rip),%xmm10 # 2f260 <_sk_srcover_bgra_8888_sse2_lowp+0x1118>
DB 69,15,89,212 ; mulps %xmm12,%xmm10
DB 65,15,40,193 ; movaps %xmm9,%xmm0
DB 15,89,192 ; mulps %xmm0,%xmm0
@@ -23551,8 +23534,8 @@ _sk_xy_to_2pt_conical_quadratic_max_sse41 LABEL PROC
DB 69,15,198,192,0 ; shufps $0x0,%xmm8,%xmm8
DB 65,15,40,194 ; movaps %xmm10,%xmm0
DB 65,15,92,193 ; subps %xmm9,%xmm0
- DB 68,15,87,13,232,93,1,0 ; xorps 0x15de8(%rip),%xmm9 # 2f180 <_sk_srcover_bgra_8888_sse2_lowp+0x1038>
- DB 68,15,89,5,192,88,1,0 ; mulps 0x158c0(%rip),%xmm8 # 2ec60 <_sk_srcover_bgra_8888_sse2_lowp+0xb18>
+ DB 68,15,87,13,36,94,1,0 ; xorps 0x15e24(%rip),%xmm9 # 2f180 <_sk_srcover_bgra_8888_sse2_lowp+0x1038>
+ DB 68,15,89,5,252,88,1,0 ; mulps 0x158fc(%rip),%xmm8 # 2ec60 <_sk_srcover_bgra_8888_sse2_lowp+0xb18>
DB 65,15,89,192 ; mulps %xmm8,%xmm0
DB 69,15,92,202 ; subps %xmm10,%xmm9
DB 69,15,89,200 ; mulps %xmm8,%xmm9
@@ -23571,7 +23554,7 @@ _sk_xy_to_2pt_conical_quadratic_min_sse41 LABEL PROC
DB 243,69,15,89,203 ; mulss %xmm11,%xmm9
DB 69,15,198,201,0 ; shufps $0x0,%xmm9,%xmm9
DB 68,15,88,200 ; addps %xmm0,%xmm9
- DB 68,15,89,13,183,94,1,0 ; mulps 0x15eb7(%rip),%xmm9 # 2f2a0 <_sk_srcover_bgra_8888_sse2_lowp+0x1158>
+ DB 68,15,89,13,163,94,1,0 ; mulps 0x15ea3(%rip),%xmm9 # 2f250 <_sk_srcover_bgra_8888_sse2_lowp+0x1108>
DB 15,89,192 ; mulps %xmm0,%xmm0
DB 68,15,40,225 ; movaps %xmm1,%xmm12
DB 69,15,89,228 ; mulps %xmm12,%xmm12
@@ -23579,7 +23562,7 @@ _sk_xy_to_2pt_conical_quadratic_min_sse41 LABEL PROC
DB 243,69,15,89,219 ; mulss %xmm11,%xmm11
DB 69,15,198,219,0 ; shufps $0x0,%xmm11,%xmm11
DB 69,15,92,227 ; subps %xmm11,%xmm12
- DB 68,15,89,21,162,94,1,0 ; mulps 0x15ea2(%rip),%xmm10 # 2f2b0 <_sk_srcover_bgra_8888_sse2_lowp+0x1168>
+ DB 68,15,89,21,142,94,1,0 ; mulps 0x15e8e(%rip),%xmm10 # 2f260 <_sk_srcover_bgra_8888_sse2_lowp+0x1118>
DB 69,15,89,212 ; mulps %xmm12,%xmm10
DB 65,15,40,193 ; movaps %xmm9,%xmm0
DB 15,89,192 ; mulps %xmm0,%xmm0
@@ -23588,8 +23571,8 @@ _sk_xy_to_2pt_conical_quadratic_min_sse41 LABEL PROC
DB 69,15,198,192,0 ; shufps $0x0,%xmm8,%xmm8
DB 65,15,40,194 ; movaps %xmm10,%xmm0
DB 65,15,92,193 ; subps %xmm9,%xmm0
- DB 68,15,87,13,74,93,1,0 ; xorps 0x15d4a(%rip),%xmm9 # 2f180 <_sk_srcover_bgra_8888_sse2_lowp+0x1038>
- DB 68,15,89,5,34,88,1,0 ; mulps 0x15822(%rip),%xmm8 # 2ec60 <_sk_srcover_bgra_8888_sse2_lowp+0xb18>
+ DB 68,15,87,13,134,93,1,0 ; xorps 0x15d86(%rip),%xmm9 # 2f180 <_sk_srcover_bgra_8888_sse2_lowp+0x1038>
+ DB 68,15,89,5,94,88,1,0 ; mulps 0x1585e(%rip),%xmm8 # 2ec60 <_sk_srcover_bgra_8888_sse2_lowp+0xb18>
DB 65,15,89,192 ; mulps %xmm8,%xmm0
DB 69,15,92,202 ; subps %xmm10,%xmm9
DB 69,15,89,200 ; mulps %xmm8,%xmm9
@@ -23605,7 +23588,7 @@ _sk_xy_to_2pt_conical_linear_sse41 LABEL PROC
DB 243,69,15,89,200 ; mulss %xmm8,%xmm9
DB 69,15,198,201,0 ; shufps $0x0,%xmm9,%xmm9
DB 68,15,88,200 ; addps %xmm0,%xmm9
- DB 68,15,89,13,42,94,1,0 ; mulps 0x15e2a(%rip),%xmm9 # 2f2a0 <_sk_srcover_bgra_8888_sse2_lowp+0x1158>
+ DB 68,15,89,13,22,94,1,0 ; mulps 0x15e16(%rip),%xmm9 # 2f250 <_sk_srcover_bgra_8888_sse2_lowp+0x1108>
DB 15,89,192 ; mulps %xmm0,%xmm0
DB 68,15,40,209 ; movaps %xmm1,%xmm10
DB 69,15,89,210 ; mulps %xmm10,%xmm10
@@ -23613,7 +23596,7 @@ _sk_xy_to_2pt_conical_linear_sse41 LABEL PROC
DB 243,69,15,89,192 ; mulss %xmm8,%xmm8
DB 69,15,198,192,0 ; shufps $0x0,%xmm8,%xmm8
DB 65,15,92,192 ; subps %xmm8,%xmm0
- DB 15,87,5,230,92,1,0 ; xorps 0x15ce6(%rip),%xmm0 # 2f180 <_sk_srcover_bgra_8888_sse2_lowp+0x1038>
+ DB 15,87,5,34,93,1,0 ; xorps 0x15d22(%rip),%xmm0 # 2f180 <_sk_srcover_bgra_8888_sse2_lowp+0x1038>
DB 65,15,94,193 ; divps %xmm9,%xmm0
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
@@ -23655,7 +23638,7 @@ _sk_apply_vector_mask_sse41 LABEL PROC
PUBLIC _sk_save_xy_sse41
_sk_save_xy_sse41 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 68,15,40,5,69,87,1,0 ; movaps 0x15745(%rip),%xmm8 # 2ec60 <_sk_srcover_bgra_8888_sse2_lowp+0xb18>
+ DB 68,15,40,5,129,87,1,0 ; movaps 0x15781(%rip),%xmm8 # 2ec60 <_sk_srcover_bgra_8888_sse2_lowp+0xb18>
DB 15,17,0 ; movups %xmm0,(%rax)
DB 68,15,40,200 ; movaps %xmm0,%xmm9
DB 69,15,88,200 ; addps %xmm8,%xmm9
@@ -23695,8 +23678,8 @@ _sk_bilinear_nx_sse41 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 15,16,0 ; movups (%rax),%xmm0
DB 68,15,16,128,128,0,0,0 ; movups 0x80(%rax),%xmm8
- DB 15,88,5,14,93,1,0 ; addps 0x15d0e(%rip),%xmm0 # 2f2c0 <_sk_srcover_bgra_8888_sse2_lowp+0x1178>
- DB 68,15,40,13,182,86,1,0 ; movaps 0x156b6(%rip),%xmm9 # 2ec70 <_sk_srcover_bgra_8888_sse2_lowp+0xb28>
+ DB 15,88,5,250,92,1,0 ; addps 0x15cfa(%rip),%xmm0 # 2f270 <_sk_srcover_bgra_8888_sse2_lowp+0x1128>
+ DB 68,15,40,13,242,86,1,0 ; movaps 0x156f2(%rip),%xmm9 # 2ec70 <_sk_srcover_bgra_8888_sse2_lowp+0xb28>
DB 69,15,92,200 ; subps %xmm8,%xmm9
DB 68,15,17,136,0,1,0,0 ; movups %xmm9,0x100(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
@@ -23707,7 +23690,7 @@ _sk_bilinear_px_sse41 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 15,16,0 ; movups (%rax),%xmm0
DB 68,15,16,128,128,0,0,0 ; movups 0x80(%rax),%xmm8
- DB 15,88,5,130,86,1,0 ; addps 0x15682(%rip),%xmm0 # 2ec60 <_sk_srcover_bgra_8888_sse2_lowp+0xb18>
+ DB 15,88,5,190,86,1,0 ; addps 0x156be(%rip),%xmm0 # 2ec60 <_sk_srcover_bgra_8888_sse2_lowp+0xb18>
DB 68,15,17,128,0,1,0,0 ; movups %xmm8,0x100(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
@@ -23717,8 +23700,8 @@ _sk_bilinear_ny_sse41 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 15,16,72,64 ; movups 0x40(%rax),%xmm1
DB 68,15,16,128,192,0,0,0 ; movups 0xc0(%rax),%xmm8
- DB 15,88,13,193,92,1,0 ; addps 0x15cc1(%rip),%xmm1 # 2f2c0 <_sk_srcover_bgra_8888_sse2_lowp+0x1178>
- DB 68,15,40,13,105,86,1,0 ; movaps 0x15669(%rip),%xmm9 # 2ec70 <_sk_srcover_bgra_8888_sse2_lowp+0xb28>
+ DB 15,88,13,173,92,1,0 ; addps 0x15cad(%rip),%xmm1 # 2f270 <_sk_srcover_bgra_8888_sse2_lowp+0x1128>
+ DB 68,15,40,13,165,86,1,0 ; movaps 0x156a5(%rip),%xmm9 # 2ec70 <_sk_srcover_bgra_8888_sse2_lowp+0xb28>
DB 69,15,92,200 ; subps %xmm8,%xmm9
DB 68,15,17,136,64,1,0,0 ; movups %xmm9,0x140(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
@@ -23729,7 +23712,7 @@ _sk_bilinear_py_sse41 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 15,16,72,64 ; movups 0x40(%rax),%xmm1
DB 68,15,16,128,192,0,0,0 ; movups 0xc0(%rax),%xmm8
- DB 15,88,13,52,86,1,0 ; addps 0x15634(%rip),%xmm1 # 2ec60 <_sk_srcover_bgra_8888_sse2_lowp+0xb18>
+ DB 15,88,13,112,86,1,0 ; addps 0x15670(%rip),%xmm1 # 2ec60 <_sk_srcover_bgra_8888_sse2_lowp+0xb18>
DB 68,15,17,128,64,1,0,0 ; movups %xmm8,0x140(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
@@ -23739,13 +23722,13 @@ _sk_bicubic_n3x_sse41 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 15,16,0 ; movups (%rax),%xmm0
DB 68,15,16,128,128,0,0,0 ; movups 0x80(%rax),%xmm8
- DB 15,88,5,132,92,1,0 ; addps 0x15c84(%rip),%xmm0 # 2f2d0 <_sk_srcover_bgra_8888_sse2_lowp+0x1188>
- DB 68,15,40,13,28,86,1,0 ; movaps 0x1561c(%rip),%xmm9 # 2ec70 <_sk_srcover_bgra_8888_sse2_lowp+0xb28>
+ DB 15,88,5,112,92,1,0 ; addps 0x15c70(%rip),%xmm0 # 2f280 <_sk_srcover_bgra_8888_sse2_lowp+0x1138>
+ DB 68,15,40,13,88,86,1,0 ; movaps 0x15658(%rip),%xmm9 # 2ec70 <_sk_srcover_bgra_8888_sse2_lowp+0xb28>
DB 69,15,92,200 ; subps %xmm8,%xmm9
DB 69,15,40,193 ; movaps %xmm9,%xmm8
DB 69,15,89,192 ; mulps %xmm8,%xmm8
- DB 68,15,89,13,120,92,1,0 ; mulps 0x15c78(%rip),%xmm9 # 2f2e0 <_sk_srcover_bgra_8888_sse2_lowp+0x1198>
- DB 68,15,88,13,0,88,1,0 ; addps 0x15800(%rip),%xmm9 # 2ee70 <_sk_srcover_bgra_8888_sse2_lowp+0xd28>
+ DB 68,15,89,13,100,92,1,0 ; mulps 0x15c64(%rip),%xmm9 # 2f290 <_sk_srcover_bgra_8888_sse2_lowp+0x1148>
+ DB 68,15,88,13,60,88,1,0 ; addps 0x1583c(%rip),%xmm9 # 2ee70 <_sk_srcover_bgra_8888_sse2_lowp+0xd28>
DB 69,15,89,200 ; mulps %xmm8,%xmm9
DB 68,15,17,136,0,1,0,0 ; movups %xmm9,0x100(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
@@ -23756,16 +23739,16 @@ _sk_bicubic_n1x_sse41 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 15,16,0 ; movups (%rax),%xmm0
DB 68,15,16,128,128,0,0,0 ; movups 0x80(%rax),%xmm8
- DB 15,88,5,44,92,1,0 ; addps 0x15c2c(%rip),%xmm0 # 2f2c0 <_sk_srcover_bgra_8888_sse2_lowp+0x1178>
- DB 68,15,40,13,212,85,1,0 ; movaps 0x155d4(%rip),%xmm9 # 2ec70 <_sk_srcover_bgra_8888_sse2_lowp+0xb28>
+ DB 15,88,5,24,92,1,0 ; addps 0x15c18(%rip),%xmm0 # 2f270 <_sk_srcover_bgra_8888_sse2_lowp+0x1128>
+ DB 68,15,40,13,16,86,1,0 ; movaps 0x15610(%rip),%xmm9 # 2ec70 <_sk_srcover_bgra_8888_sse2_lowp+0xb28>
DB 69,15,92,200 ; subps %xmm8,%xmm9
- DB 68,15,40,5,72,92,1,0 ; movaps 0x15c48(%rip),%xmm8 # 2f2f0 <_sk_srcover_bgra_8888_sse2_lowp+0x11a8>
+ DB 68,15,40,5,52,92,1,0 ; movaps 0x15c34(%rip),%xmm8 # 2f2a0 <_sk_srcover_bgra_8888_sse2_lowp+0x1158>
DB 69,15,89,193 ; mulps %xmm9,%xmm8
- DB 68,15,88,5,76,92,1,0 ; addps 0x15c4c(%rip),%xmm8 # 2f300 <_sk_srcover_bgra_8888_sse2_lowp+0x11b8>
+ DB 68,15,88,5,56,92,1,0 ; addps 0x15c38(%rip),%xmm8 # 2f2b0 <_sk_srcover_bgra_8888_sse2_lowp+0x1168>
DB 69,15,89,193 ; mulps %xmm9,%xmm8
- DB 68,15,88,5,160,85,1,0 ; addps 0x155a0(%rip),%xmm8 # 2ec60 <_sk_srcover_bgra_8888_sse2_lowp+0xb18>
+ DB 68,15,88,5,220,85,1,0 ; addps 0x155dc(%rip),%xmm8 # 2ec60 <_sk_srcover_bgra_8888_sse2_lowp+0xb18>
DB 69,15,89,193 ; mulps %xmm9,%xmm8
- DB 68,15,88,5,68,92,1,0 ; addps 0x15c44(%rip),%xmm8 # 2f310 <_sk_srcover_bgra_8888_sse2_lowp+0x11c8>
+ DB 68,15,88,5,48,92,1,0 ; addps 0x15c30(%rip),%xmm8 # 2f2c0 <_sk_srcover_bgra_8888_sse2_lowp+0x1178>
DB 68,15,17,128,0,1,0,0 ; movups %xmm8,0x100(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
@@ -23773,17 +23756,17 @@ _sk_bicubic_n1x_sse41 LABEL PROC
PUBLIC _sk_bicubic_p1x_sse41
_sk_bicubic_p1x_sse41 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 68,15,40,5,126,85,1,0 ; movaps 0x1557e(%rip),%xmm8 # 2ec60 <_sk_srcover_bgra_8888_sse2_lowp+0xb18>
+ DB 68,15,40,5,186,85,1,0 ; movaps 0x155ba(%rip),%xmm8 # 2ec60 <_sk_srcover_bgra_8888_sse2_lowp+0xb18>
DB 15,16,0 ; movups (%rax),%xmm0
DB 68,15,16,136,128,0,0,0 ; movups 0x80(%rax),%xmm9
DB 65,15,88,192 ; addps %xmm8,%xmm0
- DB 68,15,40,21,247,91,1,0 ; movaps 0x15bf7(%rip),%xmm10 # 2f2f0 <_sk_srcover_bgra_8888_sse2_lowp+0x11a8>
+ DB 68,15,40,21,227,91,1,0 ; movaps 0x15be3(%rip),%xmm10 # 2f2a0 <_sk_srcover_bgra_8888_sse2_lowp+0x1158>
DB 69,15,89,209 ; mulps %xmm9,%xmm10
- DB 68,15,88,21,251,91,1,0 ; addps 0x15bfb(%rip),%xmm10 # 2f300 <_sk_srcover_bgra_8888_sse2_lowp+0x11b8>
+ DB 68,15,88,21,231,91,1,0 ; addps 0x15be7(%rip),%xmm10 # 2f2b0 <_sk_srcover_bgra_8888_sse2_lowp+0x1168>
DB 69,15,89,209 ; mulps %xmm9,%xmm10
DB 69,15,88,208 ; addps %xmm8,%xmm10
DB 69,15,89,209 ; mulps %xmm9,%xmm10
- DB 68,15,88,21,247,91,1,0 ; addps 0x15bf7(%rip),%xmm10 # 2f310 <_sk_srcover_bgra_8888_sse2_lowp+0x11c8>
+ DB 68,15,88,21,227,91,1,0 ; addps 0x15be3(%rip),%xmm10 # 2f2c0 <_sk_srcover_bgra_8888_sse2_lowp+0x1178>
DB 68,15,17,144,0,1,0,0 ; movups %xmm10,0x100(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
@@ -23793,11 +23776,11 @@ _sk_bicubic_p3x_sse41 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 15,16,0 ; movups (%rax),%xmm0
DB 68,15,16,128,128,0,0,0 ; movups 0x80(%rax),%xmm8
- DB 15,88,5,199,91,1,0 ; addps 0x15bc7(%rip),%xmm0 # 2f300 <_sk_srcover_bgra_8888_sse2_lowp+0x11b8>
+ DB 15,88,5,179,91,1,0 ; addps 0x15bb3(%rip),%xmm0 # 2f2b0 <_sk_srcover_bgra_8888_sse2_lowp+0x1168>
DB 69,15,40,200 ; movaps %xmm8,%xmm9
DB 69,15,89,201 ; mulps %xmm9,%xmm9
- DB 68,15,89,5,151,91,1,0 ; mulps 0x15b97(%rip),%xmm8 # 2f2e0 <_sk_srcover_bgra_8888_sse2_lowp+0x1198>
- DB 68,15,88,5,31,87,1,0 ; addps 0x1571f(%rip),%xmm8 # 2ee70 <_sk_srcover_bgra_8888_sse2_lowp+0xd28>
+ DB 68,15,89,5,131,91,1,0 ; mulps 0x15b83(%rip),%xmm8 # 2f290 <_sk_srcover_bgra_8888_sse2_lowp+0x1148>
+ DB 68,15,88,5,91,87,1,0 ; addps 0x1575b(%rip),%xmm8 # 2ee70 <_sk_srcover_bgra_8888_sse2_lowp+0xd28>
DB 69,15,89,193 ; mulps %xmm9,%xmm8
DB 68,15,17,128,0,1,0,0 ; movups %xmm8,0x100(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
@@ -23808,13 +23791,13 @@ _sk_bicubic_n3y_sse41 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 15,16,72,64 ; movups 0x40(%rax),%xmm1
DB 68,15,16,128,192,0,0,0 ; movups 0xc0(%rax),%xmm8
- DB 15,88,13,90,91,1,0 ; addps 0x15b5a(%rip),%xmm1 # 2f2d0 <_sk_srcover_bgra_8888_sse2_lowp+0x1188>
- DB 68,15,40,13,242,84,1,0 ; movaps 0x154f2(%rip),%xmm9 # 2ec70 <_sk_srcover_bgra_8888_sse2_lowp+0xb28>
+ DB 15,88,13,70,91,1,0 ; addps 0x15b46(%rip),%xmm1 # 2f280 <_sk_srcover_bgra_8888_sse2_lowp+0x1138>
+ DB 68,15,40,13,46,85,1,0 ; movaps 0x1552e(%rip),%xmm9 # 2ec70 <_sk_srcover_bgra_8888_sse2_lowp+0xb28>
DB 69,15,92,200 ; subps %xmm8,%xmm9
DB 69,15,40,193 ; movaps %xmm9,%xmm8
DB 69,15,89,192 ; mulps %xmm8,%xmm8
- DB 68,15,89,13,78,91,1,0 ; mulps 0x15b4e(%rip),%xmm9 # 2f2e0 <_sk_srcover_bgra_8888_sse2_lowp+0x1198>
- DB 68,15,88,13,214,86,1,0 ; addps 0x156d6(%rip),%xmm9 # 2ee70 <_sk_srcover_bgra_8888_sse2_lowp+0xd28>
+ DB 68,15,89,13,58,91,1,0 ; mulps 0x15b3a(%rip),%xmm9 # 2f290 <_sk_srcover_bgra_8888_sse2_lowp+0x1148>
+ DB 68,15,88,13,18,87,1,0 ; addps 0x15712(%rip),%xmm9 # 2ee70 <_sk_srcover_bgra_8888_sse2_lowp+0xd28>
DB 69,15,89,200 ; mulps %xmm8,%xmm9
DB 68,15,17,136,64,1,0,0 ; movups %xmm9,0x140(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
@@ -23825,16 +23808,16 @@ _sk_bicubic_n1y_sse41 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 15,16,72,64 ; movups 0x40(%rax),%xmm1
DB 68,15,16,128,192,0,0,0 ; movups 0xc0(%rax),%xmm8
- DB 15,88,13,1,91,1,0 ; addps 0x15b01(%rip),%xmm1 # 2f2c0 <_sk_srcover_bgra_8888_sse2_lowp+0x1178>
- DB 68,15,40,13,169,84,1,0 ; movaps 0x154a9(%rip),%xmm9 # 2ec70 <_sk_srcover_bgra_8888_sse2_lowp+0xb28>
+ DB 15,88,13,237,90,1,0 ; addps 0x15aed(%rip),%xmm1 # 2f270 <_sk_srcover_bgra_8888_sse2_lowp+0x1128>
+ DB 68,15,40,13,229,84,1,0 ; movaps 0x154e5(%rip),%xmm9 # 2ec70 <_sk_srcover_bgra_8888_sse2_lowp+0xb28>
DB 69,15,92,200 ; subps %xmm8,%xmm9
- DB 68,15,40,5,29,91,1,0 ; movaps 0x15b1d(%rip),%xmm8 # 2f2f0 <_sk_srcover_bgra_8888_sse2_lowp+0x11a8>
+ DB 68,15,40,5,9,91,1,0 ; movaps 0x15b09(%rip),%xmm8 # 2f2a0 <_sk_srcover_bgra_8888_sse2_lowp+0x1158>
DB 69,15,89,193 ; mulps %xmm9,%xmm8
- DB 68,15,88,5,33,91,1,0 ; addps 0x15b21(%rip),%xmm8 # 2f300 <_sk_srcover_bgra_8888_sse2_lowp+0x11b8>
+ DB 68,15,88,5,13,91,1,0 ; addps 0x15b0d(%rip),%xmm8 # 2f2b0 <_sk_srcover_bgra_8888_sse2_lowp+0x1168>
DB 69,15,89,193 ; mulps %xmm9,%xmm8
- DB 68,15,88,5,117,84,1,0 ; addps 0x15475(%rip),%xmm8 # 2ec60 <_sk_srcover_bgra_8888_sse2_lowp+0xb18>
+ DB 68,15,88,5,177,84,1,0 ; addps 0x154b1(%rip),%xmm8 # 2ec60 <_sk_srcover_bgra_8888_sse2_lowp+0xb18>
DB 69,15,89,193 ; mulps %xmm9,%xmm8
- DB 68,15,88,5,25,91,1,0 ; addps 0x15b19(%rip),%xmm8 # 2f310 <_sk_srcover_bgra_8888_sse2_lowp+0x11c8>
+ DB 68,15,88,5,5,91,1,0 ; addps 0x15b05(%rip),%xmm8 # 2f2c0 <_sk_srcover_bgra_8888_sse2_lowp+0x1178>
DB 68,15,17,128,64,1,0,0 ; movups %xmm8,0x140(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
@@ -23842,17 +23825,17 @@ _sk_bicubic_n1y_sse41 LABEL PROC
PUBLIC _sk_bicubic_p1y_sse41
_sk_bicubic_p1y_sse41 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 68,15,40,5,83,84,1,0 ; movaps 0x15453(%rip),%xmm8 # 2ec60 <_sk_srcover_bgra_8888_sse2_lowp+0xb18>
+ DB 68,15,40,5,143,84,1,0 ; movaps 0x1548f(%rip),%xmm8 # 2ec60 <_sk_srcover_bgra_8888_sse2_lowp+0xb18>
DB 15,16,72,64 ; movups 0x40(%rax),%xmm1
DB 68,15,16,136,192,0,0,0 ; movups 0xc0(%rax),%xmm9
DB 65,15,88,200 ; addps %xmm8,%xmm1
- DB 68,15,40,21,203,90,1,0 ; movaps 0x15acb(%rip),%xmm10 # 2f2f0 <_sk_srcover_bgra_8888_sse2_lowp+0x11a8>
+ DB 68,15,40,21,183,90,1,0 ; movaps 0x15ab7(%rip),%xmm10 # 2f2a0 <_sk_srcover_bgra_8888_sse2_lowp+0x1158>
DB 69,15,89,209 ; mulps %xmm9,%xmm10
- DB 68,15,88,21,207,90,1,0 ; addps 0x15acf(%rip),%xmm10 # 2f300 <_sk_srcover_bgra_8888_sse2_lowp+0x11b8>
+ DB 68,15,88,21,187,90,1,0 ; addps 0x15abb(%rip),%xmm10 # 2f2b0 <_sk_srcover_bgra_8888_sse2_lowp+0x1168>
DB 69,15,89,209 ; mulps %xmm9,%xmm10
DB 69,15,88,208 ; addps %xmm8,%xmm10
DB 69,15,89,209 ; mulps %xmm9,%xmm10
- DB 68,15,88,21,203,90,1,0 ; addps 0x15acb(%rip),%xmm10 # 2f310 <_sk_srcover_bgra_8888_sse2_lowp+0x11c8>
+ DB 68,15,88,21,183,90,1,0 ; addps 0x15ab7(%rip),%xmm10 # 2f2c0 <_sk_srcover_bgra_8888_sse2_lowp+0x1178>
DB 68,15,17,144,64,1,0,0 ; movups %xmm10,0x140(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
@@ -23862,11 +23845,11 @@ _sk_bicubic_p3y_sse41 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 15,16,72,64 ; movups 0x40(%rax),%xmm1
DB 68,15,16,128,192,0,0,0 ; movups 0xc0(%rax),%xmm8
- DB 15,88,13,154,90,1,0 ; addps 0x15a9a(%rip),%xmm1 # 2f300 <_sk_srcover_bgra_8888_sse2_lowp+0x11b8>
+ DB 15,88,13,134,90,1,0 ; addps 0x15a86(%rip),%xmm1 # 2f2b0 <_sk_srcover_bgra_8888_sse2_lowp+0x1168>
DB 69,15,40,200 ; movaps %xmm8,%xmm9
DB 69,15,89,201 ; mulps %xmm9,%xmm9
- DB 68,15,89,5,106,90,1,0 ; mulps 0x15a6a(%rip),%xmm8 # 2f2e0 <_sk_srcover_bgra_8888_sse2_lowp+0x1198>
- DB 68,15,88,5,242,85,1,0 ; addps 0x155f2(%rip),%xmm8 # 2ee70 <_sk_srcover_bgra_8888_sse2_lowp+0xd28>
+ DB 68,15,89,5,86,90,1,0 ; mulps 0x15a56(%rip),%xmm8 # 2f290 <_sk_srcover_bgra_8888_sse2_lowp+0x1148>
+ DB 68,15,88,5,46,86,1,0 ; addps 0x1562e(%rip),%xmm8 # 2ee70 <_sk_srcover_bgra_8888_sse2_lowp+0xd28>
DB 69,15,89,193 ; mulps %xmm9,%xmm8
DB 68,15,17,128,64,1,0,0 ; movups %xmm8,0x140(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
@@ -23961,7 +23944,7 @@ _sk_clut_3D_sse41 LABEL PROC
DB 15,89,194 ; mulps %xmm2,%xmm0
DB 15,41,68,36,80 ; movaps %xmm0,0x50(%rsp)
DB 243,15,91,240 ; cvttps2dq %xmm0,%xmm6
- DB 15,40,37,109,89,1,0 ; movaps 0x1596d(%rip),%xmm4 # 2f320 <_sk_srcover_bgra_8888_sse2_lowp+0x11d8>
+ DB 15,40,37,89,89,1,0 ; movaps 0x15959(%rip),%xmm4 # 2f2d0 <_sk_srcover_bgra_8888_sse2_lowp+0x1188>
DB 15,88,196 ; addps %xmm4,%xmm0
DB 15,41,68,36,48 ; movaps %xmm0,0x30(%rsp)
DB 102,65,15,110,208 ; movd %r8d,%xmm2
@@ -24000,7 +23983,7 @@ _sk_clut_3D_sse41 LABEL PROC
DB 102,68,15,56,64,192 ; pmulld %xmm0,%xmm8
DB 102,65,15,111,216 ; movdqa %xmm8,%xmm3
DB 102,15,254,218 ; paddd %xmm2,%xmm3
- DB 102,68,15,111,37,196,88,1,0 ; movdqa 0x158c4(%rip),%xmm12 # 2f330 <_sk_srcover_bgra_8888_sse2_lowp+0x11e8>
+ DB 102,68,15,111,37,176,88,1,0 ; movdqa 0x158b0(%rip),%xmm12 # 2f2e0 <_sk_srcover_bgra_8888_sse2_lowp+0x1198>
DB 102,65,15,56,64,220 ; pmulld %xmm12,%xmm3
DB 102,15,118,228 ; pcmpeqd %xmm4,%xmm4
DB 102,15,111,203 ; movdqa %xmm3,%xmm1
@@ -24023,7 +24006,7 @@ _sk_clut_3D_sse41 LABEL PROC
DB 102,65,15,58,22,217,1 ; pextrd $0x1,%xmm3,%r9d
DB 102,65,15,58,22,218,2 ; pextrd $0x2,%xmm3,%r10d
DB 102,65,15,58,22,219,3 ; pextrd $0x3,%xmm3,%r11d
- DB 102,15,111,37,184,81,1,0 ; movdqa 0x151b8(%rip),%xmm4 # 2eca0 <_sk_srcover_bgra_8888_sse2_lowp+0xb58>
+ DB 102,15,111,37,244,81,1,0 ; movdqa 0x151f4(%rip),%xmm4 # 2eca0 <_sk_srcover_bgra_8888_sse2_lowp+0xb58>
DB 102,15,254,220 ; paddd %xmm4,%xmm3
DB 102,15,111,252 ; movdqa %xmm4,%xmm7
DB 102,73,15,58,22,222,1 ; pextrq $0x1,%xmm3,%r14
@@ -24196,7 +24179,7 @@ _sk_clut_3D_sse41 LABEL PROC
DB 102,68,15,254,202 ; paddd %xmm2,%xmm9
DB 102,65,15,111,192 ; movdqa %xmm8,%xmm0
DB 102,65,15,254,193 ; paddd %xmm9,%xmm0
- DB 102,15,111,45,211,84,1,0 ; movdqa 0x154d3(%rip),%xmm5 # 2f330 <_sk_srcover_bgra_8888_sse2_lowp+0x11e8>
+ DB 102,15,111,45,191,84,1,0 ; movdqa 0x154bf(%rip),%xmm5 # 2f2e0 <_sk_srcover_bgra_8888_sse2_lowp+0x1198>
DB 102,15,56,64,197 ; pmulld %xmm5,%xmm0
DB 102,15,111,200 ; movdqa %xmm0,%xmm1
DB 102,15,118,246 ; pcmpeqd %xmm6,%xmm6
@@ -24217,7 +24200,7 @@ _sk_clut_3D_sse41 LABEL PROC
DB 102,65,15,58,22,193,1 ; pextrd $0x1,%xmm0,%r9d
DB 102,65,15,58,22,194,2 ; pextrd $0x2,%xmm0,%r10d
DB 102,65,15,58,22,195,3 ; pextrd $0x3,%xmm0,%r11d
- DB 102,15,111,61,212,77,1,0 ; movdqa 0x14dd4(%rip),%xmm7 # 2eca0 <_sk_srcover_bgra_8888_sse2_lowp+0xb58>
+ DB 102,15,111,61,16,78,1,0 ; movdqa 0x14e10(%rip),%xmm7 # 2eca0 <_sk_srcover_bgra_8888_sse2_lowp+0xb58>
DB 102,15,254,199 ; paddd %xmm7,%xmm0
DB 102,72,15,58,22,193,1 ; pextrq $0x1,%xmm0,%rcx
DB 102,72,15,126,195 ; movq %xmm0,%rbx
@@ -24283,7 +24266,7 @@ _sk_clut_3D_sse41 LABEL PROC
DB 15,88,248 ; addps %xmm0,%xmm7
DB 102,68,15,254,210 ; paddd %xmm2,%xmm10
DB 102,69,15,254,194 ; paddd %xmm10,%xmm8
- DB 102,15,111,13,15,83,1,0 ; movdqa 0x1530f(%rip),%xmm1 # 2f330 <_sk_srcover_bgra_8888_sse2_lowp+0x11e8>
+ DB 102,15,111,13,251,82,1,0 ; movdqa 0x152fb(%rip),%xmm1 # 2f2e0 <_sk_srcover_bgra_8888_sse2_lowp+0x1198>
DB 102,68,15,56,64,193 ; pmulld %xmm1,%xmm8
DB 102,65,15,111,192 ; movdqa %xmm8,%xmm0
DB 102,15,118,237 ; pcmpeqd %xmm5,%xmm5
@@ -24304,7 +24287,7 @@ _sk_clut_3D_sse41 LABEL PROC
DB 102,69,15,58,22,193,1 ; pextrd $0x1,%xmm8,%r9d
DB 102,69,15,58,22,194,2 ; pextrd $0x2,%xmm8,%r10d
DB 102,69,15,58,22,195,3 ; pextrd $0x3,%xmm8,%r11d
- DB 102,15,111,21,10,76,1,0 ; movdqa 0x14c0a(%rip),%xmm2 # 2eca0 <_sk_srcover_bgra_8888_sse2_lowp+0xb58>
+ DB 102,15,111,21,70,76,1,0 ; movdqa 0x14c46(%rip),%xmm2 # 2eca0 <_sk_srcover_bgra_8888_sse2_lowp+0xb58>
DB 102,68,15,254,194 ; paddd %xmm2,%xmm8
DB 102,76,15,58,22,193,1 ; pextrq $0x1,%xmm8,%rcx
DB 102,76,15,126,195 ; movq %xmm8,%rbx
@@ -24429,7 +24412,7 @@ _sk_clut_4D_sse41 LABEL PROC
DB 15,89,203 ; mulps %xmm3,%xmm1
DB 15,41,140,36,176,0,0,0 ; movaps %xmm1,0xb0(%rsp)
DB 243,15,91,249 ; cvttps2dq %xmm1,%xmm7
- DB 15,40,29,81,80,1,0 ; movaps 0x15051(%rip),%xmm3 # 2f320 <_sk_srcover_bgra_8888_sse2_lowp+0x11d8>
+ DB 15,40,29,61,80,1,0 ; movaps 0x1503d(%rip),%xmm3 # 2f2d0 <_sk_srcover_bgra_8888_sse2_lowp+0x1188>
DB 15,88,203 ; addps %xmm3,%xmm1
DB 15,41,76,36,32 ; movaps %xmm1,0x20(%rsp)
DB 102,65,15,110,232 ; movd %r8d,%xmm5
@@ -24486,7 +24469,7 @@ _sk_clut_4D_sse41 LABEL PROC
DB 102,68,15,56,64,253 ; pmulld %xmm5,%xmm15
DB 102,65,15,111,223 ; movdqa %xmm15,%xmm3
DB 102,15,254,217 ; paddd %xmm1,%xmm3
- DB 102,68,15,111,29,75,79,1,0 ; movdqa 0x14f4b(%rip),%xmm11 # 2f330 <_sk_srcover_bgra_8888_sse2_lowp+0x11e8>
+ DB 102,68,15,111,29,55,79,1,0 ; movdqa 0x14f37(%rip),%xmm11 # 2f2e0 <_sk_srcover_bgra_8888_sse2_lowp+0x1198>
DB 102,65,15,56,64,219 ; pmulld %xmm11,%xmm3
DB 102,15,118,192 ; pcmpeqd %xmm0,%xmm0
DB 102,15,111,243 ; movdqa %xmm3,%xmm6
@@ -24508,7 +24491,7 @@ _sk_clut_4D_sse41 LABEL PROC
DB 102,65,15,58,22,217,1 ; pextrd $0x1,%xmm3,%r9d
DB 102,65,15,58,22,218,2 ; pextrd $0x2,%xmm3,%r10d
DB 102,65,15,58,22,219,3 ; pextrd $0x3,%xmm3,%r11d
- DB 102,68,15,111,21,67,72,1,0 ; movdqa 0x14843(%rip),%xmm10 # 2eca0 <_sk_srcover_bgra_8888_sse2_lowp+0xb58>
+ DB 102,68,15,111,21,127,72,1,0 ; movdqa 0x1487f(%rip),%xmm10 # 2eca0 <_sk_srcover_bgra_8888_sse2_lowp+0xb58>
DB 102,65,15,254,218 ; paddd %xmm10,%xmm3
DB 102,73,15,58,22,222,1 ; pextrq $0x1,%xmm3,%r14
DB 102,72,15,126,219 ; movq %xmm3,%rbx
@@ -24526,7 +24509,7 @@ _sk_clut_4D_sse41 LABEL PROC
DB 102,65,15,254,201 ; paddd %xmm9,%xmm1
DB 102,65,15,56,64,203 ; pmulld %xmm11,%xmm1
DB 102,15,111,217 ; movdqa %xmm1,%xmm3
- DB 102,15,250,29,129,78,1,0 ; psubd 0x14e81(%rip),%xmm3 # 2f340 <_sk_srcover_bgra_8888_sse2_lowp+0x11f8>
+ DB 102,15,250,29,109,78,1,0 ; psubd 0x14e6d(%rip),%xmm3 # 2f2f0 <_sk_srcover_bgra_8888_sse2_lowp+0x11a8>
DB 102,73,15,58,22,222,1 ; pextrq $0x1,%xmm3,%r14
DB 102,72,15,126,219 ; movq %xmm3,%rbx
DB 65,137,223 ; mov %ebx,%r15d
@@ -24581,7 +24564,7 @@ _sk_clut_4D_sse41 LABEL PROC
DB 102,65,15,254,199 ; paddd %xmm15,%xmm0
DB 102,65,15,56,64,195 ; pmulld %xmm11,%xmm0
DB 102,15,111,232 ; movdqa %xmm0,%xmm5
- DB 102,15,250,45,97,77,1,0 ; psubd 0x14d61(%rip),%xmm5 # 2f340 <_sk_srcover_bgra_8888_sse2_lowp+0x11f8>
+ DB 102,15,250,45,77,77,1,0 ; psubd 0x14d4d(%rip),%xmm5 # 2f2f0 <_sk_srcover_bgra_8888_sse2_lowp+0x11a8>
DB 102,69,15,118,192 ; pcmpeqd %xmm8,%xmm8
DB 102,72,15,58,22,233,1 ; pextrq $0x1,%xmm5,%rcx
DB 102,72,15,126,237 ; movq %xmm5,%rbp
@@ -24706,7 +24689,7 @@ _sk_clut_4D_sse41 LABEL PROC
DB 72,193,233,32 ; shr $0x20,%rcx
DB 243,15,16,36,136 ; movss (%rax,%rcx,4),%xmm4
DB 102,68,15,58,33,220,48 ; insertps $0x30,%xmm4,%xmm11
- DB 102,15,111,61,52,68,1,0 ; movdqa 0x14434(%rip),%xmm7 # 2eca0 <_sk_srcover_bgra_8888_sse2_lowp+0xb58>
+ DB 102,15,111,61,112,68,1,0 ; movdqa 0x14470(%rip),%xmm7 # 2eca0 <_sk_srcover_bgra_8888_sse2_lowp+0xb58>
DB 102,15,254,223 ; paddd %xmm7,%xmm3
DB 102,72,15,58,22,217,1 ; pextrq $0x1,%xmm3,%rcx
DB 102,72,15,126,221 ; movq %xmm3,%rbp
@@ -24792,7 +24775,7 @@ _sk_clut_4D_sse41 LABEL PROC
DB 102,65,15,58,22,201,1 ; pextrd $0x1,%xmm1,%r9d
DB 102,65,15,58,22,202,2 ; pextrd $0x2,%xmm1,%r10d
DB 102,65,15,58,22,203,3 ; pextrd $0x3,%xmm1,%r11d
- DB 102,68,15,111,21,116,66,1,0 ; movdqa 0x14274(%rip),%xmm10 # 2eca0 <_sk_srcover_bgra_8888_sse2_lowp+0xb58>
+ DB 102,68,15,111,21,176,66,1,0 ; movdqa 0x142b0(%rip),%xmm10 # 2eca0 <_sk_srcover_bgra_8888_sse2_lowp+0xb58>
DB 102,65,15,254,202 ; paddd %xmm10,%xmm1
DB 102,72,15,58,22,201,1 ; pextrq $0x1,%xmm1,%rcx
DB 102,72,15,126,203 ; movq %xmm1,%rbx
@@ -24888,7 +24871,7 @@ _sk_clut_4D_sse41 LABEL PROC
DB 102,15,111,124,36,64 ; movdqa 0x40(%rsp),%xmm7
DB 102,15,111,199 ; movdqa %xmm7,%xmm0
DB 102,15,254,195 ; paddd %xmm3,%xmm0
- DB 102,15,111,21,24,71,1,0 ; movdqa 0x14718(%rip),%xmm2 # 2f330 <_sk_srcover_bgra_8888_sse2_lowp+0x11e8>
+ DB 102,15,111,21,4,71,1,0 ; movdqa 0x14704(%rip),%xmm2 # 2f2e0 <_sk_srcover_bgra_8888_sse2_lowp+0x1198>
DB 102,15,56,64,194 ; pmulld %xmm2,%xmm0
DB 102,15,111,200 ; movdqa %xmm0,%xmm1
DB 102,69,15,118,192 ; pcmpeqd %xmm8,%xmm8
@@ -24909,7 +24892,7 @@ _sk_clut_4D_sse41 LABEL PROC
DB 102,65,15,58,22,193,1 ; pextrd $0x1,%xmm0,%r9d
DB 102,65,15,58,22,194,2 ; pextrd $0x2,%xmm0,%r10d
DB 102,65,15,58,22,195,3 ; pextrd $0x3,%xmm0,%r11d
- DB 102,15,111,37,23,64,1,0 ; movdqa 0x14017(%rip),%xmm4 # 2eca0 <_sk_srcover_bgra_8888_sse2_lowp+0xb58>
+ DB 102,15,111,37,83,64,1,0 ; movdqa 0x14053(%rip),%xmm4 # 2eca0 <_sk_srcover_bgra_8888_sse2_lowp+0xb58>
DB 102,15,254,196 ; paddd %xmm4,%xmm0
DB 102,72,15,58,22,193,1 ; pextrq $0x1,%xmm0,%rcx
DB 102,72,15,126,195 ; movq %xmm0,%rbx
@@ -24981,7 +24964,7 @@ _sk_clut_4D_sse41 LABEL PROC
DB 102,68,15,111,226 ; movdqa %xmm2,%xmm12
DB 102,65,15,56,64,204 ; pmulld %xmm12,%xmm1
DB 102,15,111,209 ; movdqa %xmm1,%xmm2
- DB 102,15,250,21,67,69,1,0 ; psubd 0x14543(%rip),%xmm2 # 2f340 <_sk_srcover_bgra_8888_sse2_lowp+0x11f8>
+ DB 102,15,250,21,47,69,1,0 ; psubd 0x1452f(%rip),%xmm2 # 2f2f0 <_sk_srcover_bgra_8888_sse2_lowp+0x11a8>
DB 102,72,15,58,22,209,1 ; pextrq $0x1,%xmm2,%rcx
DB 102,72,15,126,213 ; movq %xmm2,%rbp
DB 137,235 ; mov %ebp,%ebx
@@ -25015,7 +24998,7 @@ _sk_clut_4D_sse41 LABEL PROC
DB 102,65,15,111,249 ; movdqa %xmm9,%xmm7
DB 102,69,15,56,64,236 ; pmulld %xmm12,%xmm13
DB 102,65,15,111,205 ; movdqa %xmm13,%xmm1
- DB 102,15,250,13,143,68,1,0 ; psubd 0x1448f(%rip),%xmm1 # 2f340 <_sk_srcover_bgra_8888_sse2_lowp+0x11f8>
+ DB 102,15,250,13,123,68,1,0 ; psubd 0x1447b(%rip),%xmm1 # 2f2f0 <_sk_srcover_bgra_8888_sse2_lowp+0x11a8>
DB 102,72,15,58,22,201,1 ; pextrq $0x1,%xmm1,%rcx
DB 102,72,15,126,203 ; movq %xmm1,%rbx
DB 137,221 ; mov %ebx,%ebp
@@ -25080,7 +25063,7 @@ _sk_clut_4D_sse41 LABEL PROC
DB 102,65,15,111,206 ; movdqa %xmm14,%xmm1
DB 102,15,111,108,36,64 ; movdqa 0x40(%rsp),%xmm5
DB 102,15,254,205 ; paddd %xmm5,%xmm1
- DB 102,15,111,37,35,67,1,0 ; movdqa 0x14323(%rip),%xmm4 # 2f330 <_sk_srcover_bgra_8888_sse2_lowp+0x11e8>
+ DB 102,15,111,37,15,67,1,0 ; movdqa 0x1430f(%rip),%xmm4 # 2f2e0 <_sk_srcover_bgra_8888_sse2_lowp+0x1198>
DB 102,15,56,64,204 ; pmulld %xmm4,%xmm1
DB 102,15,111,193 ; movdqa %xmm1,%xmm0
DB 102,15,118,246 ; pcmpeqd %xmm6,%xmm6
@@ -25101,7 +25084,7 @@ _sk_clut_4D_sse41 LABEL PROC
DB 102,65,15,58,22,201,1 ; pextrd $0x1,%xmm1,%r9d
DB 102,65,15,58,22,202,2 ; pextrd $0x2,%xmm1,%r10d
DB 102,65,15,58,22,203,3 ; pextrd $0x3,%xmm1,%r11d
- DB 102,15,111,29,36,60,1,0 ; movdqa 0x13c24(%rip),%xmm3 # 2eca0 <_sk_srcover_bgra_8888_sse2_lowp+0xb58>
+ DB 102,15,111,29,96,60,1,0 ; movdqa 0x13c60(%rip),%xmm3 # 2eca0 <_sk_srcover_bgra_8888_sse2_lowp+0xb58>
DB 102,15,254,203 ; paddd %xmm3,%xmm1
DB 102,72,15,58,22,201,1 ; pextrq $0x1,%xmm1,%rcx
DB 102,72,15,126,203 ; movq %xmm1,%rbx
@@ -25173,7 +25156,7 @@ _sk_clut_4D_sse41 LABEL PROC
DB 102,15,56,64,239 ; pmulld %xmm7,%xmm5
DB 102,15,111,205 ; movdqa %xmm5,%xmm1
DB 102,15,111,193 ; movdqa %xmm1,%xmm0
- DB 102,15,250,5,84,65,1,0 ; psubd 0x14154(%rip),%xmm0 # 2f340 <_sk_srcover_bgra_8888_sse2_lowp+0x11f8>
+ DB 102,15,250,5,64,65,1,0 ; psubd 0x14140(%rip),%xmm0 # 2f2f0 <_sk_srcover_bgra_8888_sse2_lowp+0x11a8>
DB 102,72,15,58,22,193,1 ; pextrq $0x1,%xmm0,%rcx
DB 102,72,15,126,197 ; movq %xmm0,%rbp
DB 137,235 ; mov %ebp,%ebx
@@ -25191,7 +25174,7 @@ _sk_clut_4D_sse41 LABEL PROC
DB 102,65,15,58,22,193,1 ; pextrd $0x1,%xmm0,%r9d
DB 102,65,15,58,22,194,2 ; pextrd $0x2,%xmm0,%r10d
DB 102,65,15,58,22,195,3 ; pextrd $0x3,%xmm0,%r11d
- DB 102,15,254,5,82,58,1,0 ; paddd 0x13a52(%rip),%xmm0 # 2eca0 <_sk_srcover_bgra_8888_sse2_lowp+0xb58>
+ DB 102,15,254,5,142,58,1,0 ; paddd 0x13a8e(%rip),%xmm0 # 2eca0 <_sk_srcover_bgra_8888_sse2_lowp+0xb58>
DB 102,72,15,58,22,193,1 ; pextrq $0x1,%xmm0,%rcx
DB 102,72,15,126,195 ; movq %xmm0,%rbx
DB 137,221 ; mov %ebx,%ebp
@@ -25207,7 +25190,7 @@ _sk_clut_4D_sse41 LABEL PROC
DB 102,15,254,84,36,48 ; paddd 0x30(%rsp),%xmm2
DB 102,15,56,64,215 ; pmulld %xmm7,%xmm2
DB 102,15,111,194 ; movdqa %xmm2,%xmm0
- DB 102,15,250,5,155,64,1,0 ; psubd 0x1409b(%rip),%xmm0 # 2f340 <_sk_srcover_bgra_8888_sse2_lowp+0x11f8>
+ DB 102,15,250,5,135,64,1,0 ; psubd 0x14087(%rip),%xmm0 # 2f2f0 <_sk_srcover_bgra_8888_sse2_lowp+0x11a8>
DB 102,72,15,58,22,193,1 ; pextrq $0x1,%xmm0,%rcx
DB 102,72,15,126,195 ; movq %xmm0,%rbx
DB 137,221 ; mov %ebx,%ebp
@@ -25225,7 +25208,7 @@ _sk_clut_4D_sse41 LABEL PROC
DB 102,65,15,58,22,199,1 ; pextrd $0x1,%xmm0,%r15d
DB 102,65,15,58,22,196,2 ; pextrd $0x2,%xmm0,%r12d
DB 102,65,15,58,22,198,3 ; pextrd $0x3,%xmm0,%r14d
- DB 102,15,254,5,153,57,1,0 ; paddd 0x13999(%rip),%xmm0 # 2eca0 <_sk_srcover_bgra_8888_sse2_lowp+0xb58>
+ DB 102,15,254,5,213,57,1,0 ; paddd 0x139d5(%rip),%xmm0 # 2eca0 <_sk_srcover_bgra_8888_sse2_lowp+0xb58>
DB 102,72,15,58,22,195,1 ; pextrq $0x1,%xmm0,%rbx
DB 102,72,15,126,197 ; movq %xmm0,%rbp
DB 137,233 ; mov %ebp,%ecx
@@ -25288,7 +25271,7 @@ _sk_clut_4D_sse41 LABEL PROC
DB 15,89,212 ; mulps %xmm4,%xmm2
DB 65,15,88,211 ; addps %xmm11,%xmm2
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 15,40,29,81,56,1,0 ; movaps 0x13851(%rip),%xmm3 # 2ec70 <_sk_srcover_bgra_8888_sse2_lowp+0xb28>
+ DB 15,40,29,141,56,1,0 ; movaps 0x1388d(%rip),%xmm3 # 2ec70 <_sk_srcover_bgra_8888_sse2_lowp+0xb28>
DB 72,139,76,36,120 ; mov 0x78(%rsp),%rcx
DB 15,40,164,36,192,0,0,0 ; movaps 0xc0(%rsp),%xmm4
DB 15,40,172,36,208,0,0,0 ; movaps 0xd0(%rsp),%xmm5
@@ -25303,6 +25286,23 @@ _sk_clut_4D_sse41 LABEL PROC
DB 93 ; pop %rbp
DB 255,224 ; jmpq *%rax
+PUBLIC _sk_gauss_a_to_rgba_sse41
+_sk_gauss_a_to_rgba_sse41 LABEL PROC
+ DB 15,40,5,222,62,1,0 ; movaps 0x13ede(%rip),%xmm0 # 2f300 <_sk_srcover_bgra_8888_sse2_lowp+0x11b8>
+ DB 15,89,195 ; mulps %xmm3,%xmm0
+ DB 15,88,5,228,62,1,0 ; addps 0x13ee4(%rip),%xmm0 # 2f310 <_sk_srcover_bgra_8888_sse2_lowp+0x11c8>
+ DB 15,89,195 ; mulps %xmm3,%xmm0
+ DB 15,88,5,234,62,1,0 ; addps 0x13eea(%rip),%xmm0 # 2f320 <_sk_srcover_bgra_8888_sse2_lowp+0x11d8>
+ DB 15,89,195 ; mulps %xmm3,%xmm0
+ DB 15,88,5,240,62,1,0 ; addps 0x13ef0(%rip),%xmm0 # 2f330 <_sk_srcover_bgra_8888_sse2_lowp+0x11e8>
+ DB 15,89,195 ; mulps %xmm3,%xmm0
+ DB 15,88,5,246,62,1,0 ; addps 0x13ef6(%rip),%xmm0 # 2f340 <_sk_srcover_bgra_8888_sse2_lowp+0x11f8>
+ DB 72,173 ; lods %ds:(%rsi),%rax
+ DB 15,40,200 ; movaps %xmm0,%xmm1
+ DB 15,40,208 ; movaps %xmm0,%xmm2
+ DB 15,40,216 ; movaps %xmm0,%xmm3
+ DB 255,224 ; jmpq *%rax
+
PUBLIC _sk_start_pipeline_sse2
_sk_start_pipeline_sse2 LABEL PROC
DB 85 ; push %rbp
@@ -31459,23 +31459,6 @@ _sk_evenly_spaced_gradient_sse2 LABEL PROC
DB 65,94 ; pop %r14
DB 255,224 ; jmpq *%rax
-PUBLIC _sk_gauss_a_to_rgba_sse2
-_sk_gauss_a_to_rgba_sse2 LABEL PROC
- DB 15,40,5,162,222,0,0 ; movaps 0xdea2(%rip),%xmm0 # 2f200 <_sk_srcover_bgra_8888_sse2_lowp+0x10b8>
- DB 15,89,195 ; mulps %xmm3,%xmm0
- DB 15,88,5,168,222,0,0 ; addps 0xdea8(%rip),%xmm0 # 2f210 <_sk_srcover_bgra_8888_sse2_lowp+0x10c8>
- DB 15,89,195 ; mulps %xmm3,%xmm0
- DB 15,88,5,174,222,0,0 ; addps 0xdeae(%rip),%xmm0 # 2f220 <_sk_srcover_bgra_8888_sse2_lowp+0x10d8>
- DB 15,89,195 ; mulps %xmm3,%xmm0
- DB 15,88,5,180,222,0,0 ; addps 0xdeb4(%rip),%xmm0 # 2f230 <_sk_srcover_bgra_8888_sse2_lowp+0x10e8>
- DB 15,89,195 ; mulps %xmm3,%xmm0
- DB 15,88,5,186,222,0,0 ; addps 0xdeba(%rip),%xmm0 # 2f240 <_sk_srcover_bgra_8888_sse2_lowp+0x10f8>
- DB 72,173 ; lods %ds:(%rsi),%rax
- DB 15,40,200 ; movaps %xmm0,%xmm1
- DB 15,40,208 ; movaps %xmm0,%xmm2
- DB 15,40,216 ; movaps %xmm0,%xmm3
- DB 255,224 ; jmpq *%rax
-
PUBLIC _sk_gradient_sse2
_sk_gradient_sse2 LABEL PROC
DB 65,86 ; push %r14
@@ -31484,7 +31467,7 @@ _sk_gradient_sse2 LABEL PROC
DB 76,139,0 ; mov (%rax),%r8
DB 102,15,239,201 ; pxor %xmm1,%xmm1
DB 73,131,248,2 ; cmp $0x2,%r8
- DB 114,41 ; jb 213ce <_sk_gradient_sse2+0x3b>
+ DB 114,41 ; jb 21392 <_sk_gradient_sse2+0x3b>
DB 76,139,72,72 ; mov 0x48(%rax),%r9
DB 73,255,200 ; dec %r8
DB 73,131,193,4 ; add $0x4,%r9
@@ -31495,7 +31478,7 @@ _sk_gradient_sse2 LABEL PROC
DB 102,15,250,202 ; psubd %xmm2,%xmm1
DB 73,131,193,4 ; add $0x4,%r9
DB 73,255,200 ; dec %r8
- DB 117,230 ; jne 213b4 <_sk_gradient_sse2+0x21>
+ DB 117,230 ; jne 21378 <_sk_gradient_sse2+0x21>
DB 102,15,112,209,78 ; pshufd $0x4e,%xmm1,%xmm2
DB 102,73,15,126,209 ; movq %xmm2,%r9
DB 69,137,200 ; mov %r9d,%r8d
@@ -31629,29 +31612,29 @@ _sk_xy_to_unit_angle_sse2 LABEL PROC
DB 69,15,94,220 ; divps %xmm12,%xmm11
DB 69,15,40,227 ; movaps %xmm11,%xmm12
DB 69,15,89,228 ; mulps %xmm12,%xmm12
- DB 68,15,40,45,74,220,0,0 ; movaps 0xdc4a(%rip),%xmm13 # 2f250 <_sk_srcover_bgra_8888_sse2_lowp+0x1108>
+ DB 68,15,40,45,54,220,0,0 ; movaps 0xdc36(%rip),%xmm13 # 2f200 <_sk_srcover_bgra_8888_sse2_lowp+0x10b8>
DB 69,15,89,236 ; mulps %xmm12,%xmm13
- DB 68,15,88,45,78,220,0,0 ; addps 0xdc4e(%rip),%xmm13 # 2f260 <_sk_srcover_bgra_8888_sse2_lowp+0x1118>
+ DB 68,15,88,45,58,220,0,0 ; addps 0xdc3a(%rip),%xmm13 # 2f210 <_sk_srcover_bgra_8888_sse2_lowp+0x10c8>
DB 69,15,89,236 ; mulps %xmm12,%xmm13
- DB 68,15,88,45,82,220,0,0 ; addps 0xdc52(%rip),%xmm13 # 2f270 <_sk_srcover_bgra_8888_sse2_lowp+0x1128>
+ DB 68,15,88,45,62,220,0,0 ; addps 0xdc3e(%rip),%xmm13 # 2f220 <_sk_srcover_bgra_8888_sse2_lowp+0x10d8>
DB 69,15,89,236 ; mulps %xmm12,%xmm13
- DB 68,15,88,45,86,220,0,0 ; addps 0xdc56(%rip),%xmm13 # 2f280 <_sk_srcover_bgra_8888_sse2_lowp+0x1138>
+ DB 68,15,88,45,66,220,0,0 ; addps 0xdc42(%rip),%xmm13 # 2f230 <_sk_srcover_bgra_8888_sse2_lowp+0x10e8>
DB 69,15,89,235 ; mulps %xmm11,%xmm13
DB 69,15,194,202,1 ; cmpltps %xmm10,%xmm9
- DB 68,15,40,21,85,220,0,0 ; movaps 0xdc55(%rip),%xmm10 # 2f290 <_sk_srcover_bgra_8888_sse2_lowp+0x1148>
+ DB 68,15,40,21,65,220,0,0 ; movaps 0xdc41(%rip),%xmm10 # 2f240 <_sk_srcover_bgra_8888_sse2_lowp+0x10f8>
DB 69,15,92,213 ; subps %xmm13,%xmm10
DB 69,15,84,209 ; andps %xmm9,%xmm10
DB 69,15,85,205 ; andnps %xmm13,%xmm9
DB 69,15,86,202 ; orps %xmm10,%xmm9
DB 68,15,194,192,1 ; cmpltps %xmm0,%xmm8
- DB 68,15,40,21,8,214,0,0 ; movaps 0xd608(%rip),%xmm10 # 2ec60 <_sk_srcover_bgra_8888_sse2_lowp+0xb18>
+ DB 68,15,40,21,68,214,0,0 ; movaps 0xd644(%rip),%xmm10 # 2ec60 <_sk_srcover_bgra_8888_sse2_lowp+0xb18>
DB 69,15,92,209 ; subps %xmm9,%xmm10
DB 69,15,84,208 ; andps %xmm8,%xmm10
DB 69,15,85,193 ; andnps %xmm9,%xmm8
DB 69,15,86,194 ; orps %xmm10,%xmm8
DB 68,15,40,201 ; movaps %xmm1,%xmm9
DB 68,15,194,200,1 ; cmpltps %xmm0,%xmm9
- DB 68,15,40,21,247,213,0,0 ; movaps 0xd5f7(%rip),%xmm10 # 2ec70 <_sk_srcover_bgra_8888_sse2_lowp+0xb28>
+ DB 68,15,40,21,51,214,0,0 ; movaps 0xd633(%rip),%xmm10 # 2ec70 <_sk_srcover_bgra_8888_sse2_lowp+0xb28>
DB 69,15,92,208 ; subps %xmm8,%xmm10
DB 69,15,84,209 ; andps %xmm9,%xmm10
DB 69,15,85,200 ; andnps %xmm8,%xmm9
@@ -31682,7 +31665,7 @@ _sk_xy_to_2pt_conical_quadratic_max_sse2 LABEL PROC
DB 243,69,15,89,203 ; mulss %xmm11,%xmm9
DB 69,15,198,201,0 ; shufps $0x0,%xmm9,%xmm9
DB 68,15,88,200 ; addps %xmm0,%xmm9
- DB 68,15,89,13,190,219,0,0 ; mulps 0xdbbe(%rip),%xmm9 # 2f2a0 <_sk_srcover_bgra_8888_sse2_lowp+0x1158>
+ DB 68,15,89,13,170,219,0,0 ; mulps 0xdbaa(%rip),%xmm9 # 2f250 <_sk_srcover_bgra_8888_sse2_lowp+0x1108>
DB 15,89,192 ; mulps %xmm0,%xmm0
DB 68,15,40,225 ; movaps %xmm1,%xmm12
DB 69,15,89,228 ; mulps %xmm12,%xmm12
@@ -31690,7 +31673,7 @@ _sk_xy_to_2pt_conical_quadratic_max_sse2 LABEL PROC
DB 243,69,15,89,219 ; mulss %xmm11,%xmm11
DB 69,15,198,219,0 ; shufps $0x0,%xmm11,%xmm11
DB 69,15,92,227 ; subps %xmm11,%xmm12
- DB 68,15,89,21,169,219,0,0 ; mulps 0xdba9(%rip),%xmm10 # 2f2b0 <_sk_srcover_bgra_8888_sse2_lowp+0x1168>
+ DB 68,15,89,21,149,219,0,0 ; mulps 0xdb95(%rip),%xmm10 # 2f260 <_sk_srcover_bgra_8888_sse2_lowp+0x1118>
DB 69,15,89,212 ; mulps %xmm12,%xmm10
DB 65,15,40,193 ; movaps %xmm9,%xmm0
DB 15,89,192 ; mulps %xmm0,%xmm0
@@ -31699,8 +31682,8 @@ _sk_xy_to_2pt_conical_quadratic_max_sse2 LABEL PROC
DB 69,15,198,192,0 ; shufps $0x0,%xmm8,%xmm8
DB 65,15,40,194 ; movaps %xmm10,%xmm0
DB 65,15,92,193 ; subps %xmm9,%xmm0
- DB 68,15,87,13,81,218,0,0 ; xorps 0xda51(%rip),%xmm9 # 2f180 <_sk_srcover_bgra_8888_sse2_lowp+0x1038>
- DB 68,15,89,5,41,213,0,0 ; mulps 0xd529(%rip),%xmm8 # 2ec60 <_sk_srcover_bgra_8888_sse2_lowp+0xb18>
+ DB 68,15,87,13,141,218,0,0 ; xorps 0xda8d(%rip),%xmm9 # 2f180 <_sk_srcover_bgra_8888_sse2_lowp+0x1038>
+ DB 68,15,89,5,101,213,0,0 ; mulps 0xd565(%rip),%xmm8 # 2ec60 <_sk_srcover_bgra_8888_sse2_lowp+0xb18>
DB 65,15,89,192 ; mulps %xmm8,%xmm0
DB 69,15,92,202 ; subps %xmm10,%xmm9
DB 69,15,89,200 ; mulps %xmm8,%xmm9
@@ -31719,7 +31702,7 @@ _sk_xy_to_2pt_conical_quadratic_min_sse2 LABEL PROC
DB 243,69,15,89,203 ; mulss %xmm11,%xmm9
DB 69,15,198,201,0 ; shufps $0x0,%xmm9,%xmm9
DB 68,15,88,200 ; addps %xmm0,%xmm9
- DB 68,15,89,13,32,219,0,0 ; mulps 0xdb20(%rip),%xmm9 # 2f2a0 <_sk_srcover_bgra_8888_sse2_lowp+0x1158>
+ DB 68,15,89,13,12,219,0,0 ; mulps 0xdb0c(%rip),%xmm9 # 2f250 <_sk_srcover_bgra_8888_sse2_lowp+0x1108>
DB 15,89,192 ; mulps %xmm0,%xmm0
DB 68,15,40,225 ; movaps %xmm1,%xmm12
DB 69,15,89,228 ; mulps %xmm12,%xmm12
@@ -31727,7 +31710,7 @@ _sk_xy_to_2pt_conical_quadratic_min_sse2 LABEL PROC
DB 243,69,15,89,219 ; mulss %xmm11,%xmm11
DB 69,15,198,219,0 ; shufps $0x0,%xmm11,%xmm11
DB 69,15,92,227 ; subps %xmm11,%xmm12
- DB 68,15,89,21,11,219,0,0 ; mulps 0xdb0b(%rip),%xmm10 # 2f2b0 <_sk_srcover_bgra_8888_sse2_lowp+0x1168>
+ DB 68,15,89,21,247,218,0,0 ; mulps 0xdaf7(%rip),%xmm10 # 2f260 <_sk_srcover_bgra_8888_sse2_lowp+0x1118>
DB 69,15,89,212 ; mulps %xmm12,%xmm10
DB 65,15,40,193 ; movaps %xmm9,%xmm0
DB 15,89,192 ; mulps %xmm0,%xmm0
@@ -31736,8 +31719,8 @@ _sk_xy_to_2pt_conical_quadratic_min_sse2 LABEL PROC
DB 69,15,198,192,0 ; shufps $0x0,%xmm8,%xmm8
DB 65,15,40,194 ; movaps %xmm10,%xmm0
DB 65,15,92,193 ; subps %xmm9,%xmm0
- DB 68,15,87,13,179,217,0,0 ; xorps 0xd9b3(%rip),%xmm9 # 2f180 <_sk_srcover_bgra_8888_sse2_lowp+0x1038>
- DB 68,15,89,5,139,212,0,0 ; mulps 0xd48b(%rip),%xmm8 # 2ec60 <_sk_srcover_bgra_8888_sse2_lowp+0xb18>
+ DB 68,15,87,13,239,217,0,0 ; xorps 0xd9ef(%rip),%xmm9 # 2f180 <_sk_srcover_bgra_8888_sse2_lowp+0x1038>
+ DB 68,15,89,5,199,212,0,0 ; mulps 0xd4c7(%rip),%xmm8 # 2ec60 <_sk_srcover_bgra_8888_sse2_lowp+0xb18>
DB 65,15,89,192 ; mulps %xmm8,%xmm0
DB 69,15,92,202 ; subps %xmm10,%xmm9
DB 69,15,89,200 ; mulps %xmm8,%xmm9
@@ -31753,7 +31736,7 @@ _sk_xy_to_2pt_conical_linear_sse2 LABEL PROC
DB 243,69,15,89,200 ; mulss %xmm8,%xmm9
DB 69,15,198,201,0 ; shufps $0x0,%xmm9,%xmm9
DB 68,15,88,200 ; addps %xmm0,%xmm9
- DB 68,15,89,13,147,218,0,0 ; mulps 0xda93(%rip),%xmm9 # 2f2a0 <_sk_srcover_bgra_8888_sse2_lowp+0x1158>
+ DB 68,15,89,13,127,218,0,0 ; mulps 0xda7f(%rip),%xmm9 # 2f250 <_sk_srcover_bgra_8888_sse2_lowp+0x1108>
DB 15,89,192 ; mulps %xmm0,%xmm0
DB 68,15,40,209 ; movaps %xmm1,%xmm10
DB 69,15,89,210 ; mulps %xmm10,%xmm10
@@ -31761,7 +31744,7 @@ _sk_xy_to_2pt_conical_linear_sse2 LABEL PROC
DB 243,69,15,89,192 ; mulss %xmm8,%xmm8
DB 69,15,198,192,0 ; shufps $0x0,%xmm8,%xmm8
DB 65,15,92,192 ; subps %xmm8,%xmm0
- DB 15,87,5,79,217,0,0 ; xorps 0xd94f(%rip),%xmm0 # 2f180 <_sk_srcover_bgra_8888_sse2_lowp+0x1038>
+ DB 15,87,5,139,217,0,0 ; xorps 0xd98b(%rip),%xmm0 # 2f180 <_sk_srcover_bgra_8888_sse2_lowp+0x1038>
DB 65,15,94,193 ; divps %xmm9,%xmm0
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
@@ -31801,7 +31784,7 @@ _sk_apply_vector_mask_sse2 LABEL PROC
PUBLIC _sk_save_xy_sse2
_sk_save_xy_sse2 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 68,15,40,5,182,211,0,0 ; movaps 0xd3b6(%rip),%xmm8 # 2ec60 <_sk_srcover_bgra_8888_sse2_lowp+0xb18>
+ DB 68,15,40,5,242,211,0,0 ; movaps 0xd3f2(%rip),%xmm8 # 2ec60 <_sk_srcover_bgra_8888_sse2_lowp+0xb18>
DB 15,17,0 ; movups %xmm0,(%rax)
DB 68,15,40,200 ; movaps %xmm0,%xmm9
DB 69,15,88,200 ; addps %xmm8,%xmm9
@@ -31809,7 +31792,7 @@ _sk_save_xy_sse2 LABEL PROC
DB 69,15,91,210 ; cvtdq2ps %xmm10,%xmm10
DB 69,15,40,217 ; movaps %xmm9,%xmm11
DB 69,15,194,218,1 ; cmpltps %xmm10,%xmm11
- DB 68,15,40,37,161,211,0,0 ; movaps 0xd3a1(%rip),%xmm12 # 2ec70 <_sk_srcover_bgra_8888_sse2_lowp+0xb28>
+ DB 68,15,40,37,221,211,0,0 ; movaps 0xd3dd(%rip),%xmm12 # 2ec70 <_sk_srcover_bgra_8888_sse2_lowp+0xb28>
DB 69,15,84,220 ; andps %xmm12,%xmm11
DB 69,15,92,211 ; subps %xmm11,%xmm10
DB 69,15,92,202 ; subps %xmm10,%xmm9
@@ -31852,8 +31835,8 @@ _sk_bilinear_nx_sse2 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 15,16,0 ; movups (%rax),%xmm0
DB 68,15,16,128,128,0,0,0 ; movups 0x80(%rax),%xmm8
- DB 15,88,5,81,217,0,0 ; addps 0xd951(%rip),%xmm0 # 2f2c0 <_sk_srcover_bgra_8888_sse2_lowp+0x1178>
- DB 68,15,40,13,249,210,0,0 ; movaps 0xd2f9(%rip),%xmm9 # 2ec70 <_sk_srcover_bgra_8888_sse2_lowp+0xb28>
+ DB 15,88,5,61,217,0,0 ; addps 0xd93d(%rip),%xmm0 # 2f270 <_sk_srcover_bgra_8888_sse2_lowp+0x1128>
+ DB 68,15,40,13,53,211,0,0 ; movaps 0xd335(%rip),%xmm9 # 2ec70 <_sk_srcover_bgra_8888_sse2_lowp+0xb28>
DB 69,15,92,200 ; subps %xmm8,%xmm9
DB 68,15,17,136,0,1,0,0 ; movups %xmm9,0x100(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
@@ -31864,7 +31847,7 @@ _sk_bilinear_px_sse2 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 15,16,0 ; movups (%rax),%xmm0
DB 68,15,16,128,128,0,0,0 ; movups 0x80(%rax),%xmm8
- DB 15,88,5,197,210,0,0 ; addps 0xd2c5(%rip),%xmm0 # 2ec60 <_sk_srcover_bgra_8888_sse2_lowp+0xb18>
+ DB 15,88,5,1,211,0,0 ; addps 0xd301(%rip),%xmm0 # 2ec60 <_sk_srcover_bgra_8888_sse2_lowp+0xb18>
DB 68,15,17,128,0,1,0,0 ; movups %xmm8,0x100(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
@@ -31874,8 +31857,8 @@ _sk_bilinear_ny_sse2 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 15,16,72,64 ; movups 0x40(%rax),%xmm1
DB 68,15,16,128,192,0,0,0 ; movups 0xc0(%rax),%xmm8
- DB 15,88,13,4,217,0,0 ; addps 0xd904(%rip),%xmm1 # 2f2c0 <_sk_srcover_bgra_8888_sse2_lowp+0x1178>
- DB 68,15,40,13,172,210,0,0 ; movaps 0xd2ac(%rip),%xmm9 # 2ec70 <_sk_srcover_bgra_8888_sse2_lowp+0xb28>
+ DB 15,88,13,240,216,0,0 ; addps 0xd8f0(%rip),%xmm1 # 2f270 <_sk_srcover_bgra_8888_sse2_lowp+0x1128>
+ DB 68,15,40,13,232,210,0,0 ; movaps 0xd2e8(%rip),%xmm9 # 2ec70 <_sk_srcover_bgra_8888_sse2_lowp+0xb28>
DB 69,15,92,200 ; subps %xmm8,%xmm9
DB 68,15,17,136,64,1,0,0 ; movups %xmm9,0x140(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
@@ -31886,7 +31869,7 @@ _sk_bilinear_py_sse2 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 15,16,72,64 ; movups 0x40(%rax),%xmm1
DB 68,15,16,128,192,0,0,0 ; movups 0xc0(%rax),%xmm8
- DB 15,88,13,119,210,0,0 ; addps 0xd277(%rip),%xmm1 # 2ec60 <_sk_srcover_bgra_8888_sse2_lowp+0xb18>
+ DB 15,88,13,179,210,0,0 ; addps 0xd2b3(%rip),%xmm1 # 2ec60 <_sk_srcover_bgra_8888_sse2_lowp+0xb18>
DB 68,15,17,128,64,1,0,0 ; movups %xmm8,0x140(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
@@ -31896,13 +31879,13 @@ _sk_bicubic_n3x_sse2 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 15,16,0 ; movups (%rax),%xmm0
DB 68,15,16,128,128,0,0,0 ; movups 0x80(%rax),%xmm8
- DB 15,88,5,199,216,0,0 ; addps 0xd8c7(%rip),%xmm0 # 2f2d0 <_sk_srcover_bgra_8888_sse2_lowp+0x1188>
- DB 68,15,40,13,95,210,0,0 ; movaps 0xd25f(%rip),%xmm9 # 2ec70 <_sk_srcover_bgra_8888_sse2_lowp+0xb28>
+ DB 15,88,5,179,216,0,0 ; addps 0xd8b3(%rip),%xmm0 # 2f280 <_sk_srcover_bgra_8888_sse2_lowp+0x1138>
+ DB 68,15,40,13,155,210,0,0 ; movaps 0xd29b(%rip),%xmm9 # 2ec70 <_sk_srcover_bgra_8888_sse2_lowp+0xb28>
DB 69,15,92,200 ; subps %xmm8,%xmm9
DB 69,15,40,193 ; movaps %xmm9,%xmm8
DB 69,15,89,192 ; mulps %xmm8,%xmm8
- DB 68,15,89,13,187,216,0,0 ; mulps 0xd8bb(%rip),%xmm9 # 2f2e0 <_sk_srcover_bgra_8888_sse2_lowp+0x1198>
- DB 68,15,88,13,67,212,0,0 ; addps 0xd443(%rip),%xmm9 # 2ee70 <_sk_srcover_bgra_8888_sse2_lowp+0xd28>
+ DB 68,15,89,13,167,216,0,0 ; mulps 0xd8a7(%rip),%xmm9 # 2f290 <_sk_srcover_bgra_8888_sse2_lowp+0x1148>
+ DB 68,15,88,13,127,212,0,0 ; addps 0xd47f(%rip),%xmm9 # 2ee70 <_sk_srcover_bgra_8888_sse2_lowp+0xd28>
DB 69,15,89,200 ; mulps %xmm8,%xmm9
DB 68,15,17,136,0,1,0,0 ; movups %xmm9,0x100(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
@@ -31913,16 +31896,16 @@ _sk_bicubic_n1x_sse2 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 15,16,0 ; movups (%rax),%xmm0
DB 68,15,16,128,128,0,0,0 ; movups 0x80(%rax),%xmm8
- DB 15,88,5,111,216,0,0 ; addps 0xd86f(%rip),%xmm0 # 2f2c0 <_sk_srcover_bgra_8888_sse2_lowp+0x1178>
- DB 68,15,40,13,23,210,0,0 ; movaps 0xd217(%rip),%xmm9 # 2ec70 <_sk_srcover_bgra_8888_sse2_lowp+0xb28>
+ DB 15,88,5,91,216,0,0 ; addps 0xd85b(%rip),%xmm0 # 2f270 <_sk_srcover_bgra_8888_sse2_lowp+0x1128>
+ DB 68,15,40,13,83,210,0,0 ; movaps 0xd253(%rip),%xmm9 # 2ec70 <_sk_srcover_bgra_8888_sse2_lowp+0xb28>
DB 69,15,92,200 ; subps %xmm8,%xmm9
- DB 68,15,40,5,139,216,0,0 ; movaps 0xd88b(%rip),%xmm8 # 2f2f0 <_sk_srcover_bgra_8888_sse2_lowp+0x11a8>
+ DB 68,15,40,5,119,216,0,0 ; movaps 0xd877(%rip),%xmm8 # 2f2a0 <_sk_srcover_bgra_8888_sse2_lowp+0x1158>
DB 69,15,89,193 ; mulps %xmm9,%xmm8
- DB 68,15,88,5,143,216,0,0 ; addps 0xd88f(%rip),%xmm8 # 2f300 <_sk_srcover_bgra_8888_sse2_lowp+0x11b8>
+ DB 68,15,88,5,123,216,0,0 ; addps 0xd87b(%rip),%xmm8 # 2f2b0 <_sk_srcover_bgra_8888_sse2_lowp+0x1168>
DB 69,15,89,193 ; mulps %xmm9,%xmm8
- DB 68,15,88,5,227,209,0,0 ; addps 0xd1e3(%rip),%xmm8 # 2ec60 <_sk_srcover_bgra_8888_sse2_lowp+0xb18>
+ DB 68,15,88,5,31,210,0,0 ; addps 0xd21f(%rip),%xmm8 # 2ec60 <_sk_srcover_bgra_8888_sse2_lowp+0xb18>
DB 69,15,89,193 ; mulps %xmm9,%xmm8
- DB 68,15,88,5,135,216,0,0 ; addps 0xd887(%rip),%xmm8 # 2f310 <_sk_srcover_bgra_8888_sse2_lowp+0x11c8>
+ DB 68,15,88,5,115,216,0,0 ; addps 0xd873(%rip),%xmm8 # 2f2c0 <_sk_srcover_bgra_8888_sse2_lowp+0x1178>
DB 68,15,17,128,0,1,0,0 ; movups %xmm8,0x100(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
@@ -31930,17 +31913,17 @@ _sk_bicubic_n1x_sse2 LABEL PROC
PUBLIC _sk_bicubic_p1x_sse2
_sk_bicubic_p1x_sse2 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 68,15,40,5,193,209,0,0 ; movaps 0xd1c1(%rip),%xmm8 # 2ec60 <_sk_srcover_bgra_8888_sse2_lowp+0xb18>
+ DB 68,15,40,5,253,209,0,0 ; movaps 0xd1fd(%rip),%xmm8 # 2ec60 <_sk_srcover_bgra_8888_sse2_lowp+0xb18>
DB 15,16,0 ; movups (%rax),%xmm0
DB 68,15,16,136,128,0,0,0 ; movups 0x80(%rax),%xmm9
DB 65,15,88,192 ; addps %xmm8,%xmm0
- DB 68,15,40,21,58,216,0,0 ; movaps 0xd83a(%rip),%xmm10 # 2f2f0 <_sk_srcover_bgra_8888_sse2_lowp+0x11a8>
+ DB 68,15,40,21,38,216,0,0 ; movaps 0xd826(%rip),%xmm10 # 2f2a0 <_sk_srcover_bgra_8888_sse2_lowp+0x1158>
DB 69,15,89,209 ; mulps %xmm9,%xmm10
- DB 68,15,88,21,62,216,0,0 ; addps 0xd83e(%rip),%xmm10 # 2f300 <_sk_srcover_bgra_8888_sse2_lowp+0x11b8>
+ DB 68,15,88,21,42,216,0,0 ; addps 0xd82a(%rip),%xmm10 # 2f2b0 <_sk_srcover_bgra_8888_sse2_lowp+0x1168>
DB 69,15,89,209 ; mulps %xmm9,%xmm10
DB 69,15,88,208 ; addps %xmm8,%xmm10
DB 69,15,89,209 ; mulps %xmm9,%xmm10
- DB 68,15,88,21,58,216,0,0 ; addps 0xd83a(%rip),%xmm10 # 2f310 <_sk_srcover_bgra_8888_sse2_lowp+0x11c8>
+ DB 68,15,88,21,38,216,0,0 ; addps 0xd826(%rip),%xmm10 # 2f2c0 <_sk_srcover_bgra_8888_sse2_lowp+0x1178>
DB 68,15,17,144,0,1,0,0 ; movups %xmm10,0x100(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
@@ -31950,11 +31933,11 @@ _sk_bicubic_p3x_sse2 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 15,16,0 ; movups (%rax),%xmm0
DB 68,15,16,128,128,0,0,0 ; movups 0x80(%rax),%xmm8
- DB 15,88,5,10,216,0,0 ; addps 0xd80a(%rip),%xmm0 # 2f300 <_sk_srcover_bgra_8888_sse2_lowp+0x11b8>
+ DB 15,88,5,246,215,0,0 ; addps 0xd7f6(%rip),%xmm0 # 2f2b0 <_sk_srcover_bgra_8888_sse2_lowp+0x1168>
DB 69,15,40,200 ; movaps %xmm8,%xmm9
DB 69,15,89,201 ; mulps %xmm9,%xmm9
- DB 68,15,89,5,218,215,0,0 ; mulps 0xd7da(%rip),%xmm8 # 2f2e0 <_sk_srcover_bgra_8888_sse2_lowp+0x1198>
- DB 68,15,88,5,98,211,0,0 ; addps 0xd362(%rip),%xmm8 # 2ee70 <_sk_srcover_bgra_8888_sse2_lowp+0xd28>
+ DB 68,15,89,5,198,215,0,0 ; mulps 0xd7c6(%rip),%xmm8 # 2f290 <_sk_srcover_bgra_8888_sse2_lowp+0x1148>
+ DB 68,15,88,5,158,211,0,0 ; addps 0xd39e(%rip),%xmm8 # 2ee70 <_sk_srcover_bgra_8888_sse2_lowp+0xd28>
DB 69,15,89,193 ; mulps %xmm9,%xmm8
DB 68,15,17,128,0,1,0,0 ; movups %xmm8,0x100(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
@@ -31965,13 +31948,13 @@ _sk_bicubic_n3y_sse2 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 15,16,72,64 ; movups 0x40(%rax),%xmm1
DB 68,15,16,128,192,0,0,0 ; movups 0xc0(%rax),%xmm8
- DB 15,88,13,157,215,0,0 ; addps 0xd79d(%rip),%xmm1 # 2f2d0 <_sk_srcover_bgra_8888_sse2_lowp+0x1188>
- DB 68,15,40,13,53,209,0,0 ; movaps 0xd135(%rip),%xmm9 # 2ec70 <_sk_srcover_bgra_8888_sse2_lowp+0xb28>
+ DB 15,88,13,137,215,0,0 ; addps 0xd789(%rip),%xmm1 # 2f280 <_sk_srcover_bgra_8888_sse2_lowp+0x1138>
+ DB 68,15,40,13,113,209,0,0 ; movaps 0xd171(%rip),%xmm9 # 2ec70 <_sk_srcover_bgra_8888_sse2_lowp+0xb28>
DB 69,15,92,200 ; subps %xmm8,%xmm9
DB 69,15,40,193 ; movaps %xmm9,%xmm8
DB 69,15,89,192 ; mulps %xmm8,%xmm8
- DB 68,15,89,13,145,215,0,0 ; mulps 0xd791(%rip),%xmm9 # 2f2e0 <_sk_srcover_bgra_8888_sse2_lowp+0x1198>
- DB 68,15,88,13,25,211,0,0 ; addps 0xd319(%rip),%xmm9 # 2ee70 <_sk_srcover_bgra_8888_sse2_lowp+0xd28>
+ DB 68,15,89,13,125,215,0,0 ; mulps 0xd77d(%rip),%xmm9 # 2f290 <_sk_srcover_bgra_8888_sse2_lowp+0x1148>
+ DB 68,15,88,13,85,211,0,0 ; addps 0xd355(%rip),%xmm9 # 2ee70 <_sk_srcover_bgra_8888_sse2_lowp+0xd28>
DB 69,15,89,200 ; mulps %xmm8,%xmm9
DB 68,15,17,136,64,1,0,0 ; movups %xmm9,0x140(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
@@ -31982,16 +31965,16 @@ _sk_bicubic_n1y_sse2 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 15,16,72,64 ; movups 0x40(%rax),%xmm1
DB 68,15,16,128,192,0,0,0 ; movups 0xc0(%rax),%xmm8
- DB 15,88,13,68,215,0,0 ; addps 0xd744(%rip),%xmm1 # 2f2c0 <_sk_srcover_bgra_8888_sse2_lowp+0x1178>
- DB 68,15,40,13,236,208,0,0 ; movaps 0xd0ec(%rip),%xmm9 # 2ec70 <_sk_srcover_bgra_8888_sse2_lowp+0xb28>
+ DB 15,88,13,48,215,0,0 ; addps 0xd730(%rip),%xmm1 # 2f270 <_sk_srcover_bgra_8888_sse2_lowp+0x1128>
+ DB 68,15,40,13,40,209,0,0 ; movaps 0xd128(%rip),%xmm9 # 2ec70 <_sk_srcover_bgra_8888_sse2_lowp+0xb28>
DB 69,15,92,200 ; subps %xmm8,%xmm9
- DB 68,15,40,5,96,215,0,0 ; movaps 0xd760(%rip),%xmm8 # 2f2f0 <_sk_srcover_bgra_8888_sse2_lowp+0x11a8>
+ DB 68,15,40,5,76,215,0,0 ; movaps 0xd74c(%rip),%xmm8 # 2f2a0 <_sk_srcover_bgra_8888_sse2_lowp+0x1158>
DB 69,15,89,193 ; mulps %xmm9,%xmm8
- DB 68,15,88,5,100,215,0,0 ; addps 0xd764(%rip),%xmm8 # 2f300 <_sk_srcover_bgra_8888_sse2_lowp+0x11b8>
+ DB 68,15,88,5,80,215,0,0 ; addps 0xd750(%rip),%xmm8 # 2f2b0 <_sk_srcover_bgra_8888_sse2_lowp+0x1168>
DB 69,15,89,193 ; mulps %xmm9,%xmm8
- DB 68,15,88,5,184,208,0,0 ; addps 0xd0b8(%rip),%xmm8 # 2ec60 <_sk_srcover_bgra_8888_sse2_lowp+0xb18>
+ DB 68,15,88,5,244,208,0,0 ; addps 0xd0f4(%rip),%xmm8 # 2ec60 <_sk_srcover_bgra_8888_sse2_lowp+0xb18>
DB 69,15,89,193 ; mulps %xmm9,%xmm8
- DB 68,15,88,5,92,215,0,0 ; addps 0xd75c(%rip),%xmm8 # 2f310 <_sk_srcover_bgra_8888_sse2_lowp+0x11c8>
+ DB 68,15,88,5,72,215,0,0 ; addps 0xd748(%rip),%xmm8 # 2f2c0 <_sk_srcover_bgra_8888_sse2_lowp+0x1178>
DB 68,15,17,128,64,1,0,0 ; movups %xmm8,0x140(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
@@ -31999,17 +31982,17 @@ _sk_bicubic_n1y_sse2 LABEL PROC
PUBLIC _sk_bicubic_p1y_sse2
_sk_bicubic_p1y_sse2 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 68,15,40,5,150,208,0,0 ; movaps 0xd096(%rip),%xmm8 # 2ec60 <_sk_srcover_bgra_8888_sse2_lowp+0xb18>
+ DB 68,15,40,5,210,208,0,0 ; movaps 0xd0d2(%rip),%xmm8 # 2ec60 <_sk_srcover_bgra_8888_sse2_lowp+0xb18>
DB 15,16,72,64 ; movups 0x40(%rax),%xmm1
DB 68,15,16,136,192,0,0,0 ; movups 0xc0(%rax),%xmm9
DB 65,15,88,200 ; addps %xmm8,%xmm1
- DB 68,15,40,21,14,215,0,0 ; movaps 0xd70e(%rip),%xmm10 # 2f2f0 <_sk_srcover_bgra_8888_sse2_lowp+0x11a8>
+ DB 68,15,40,21,250,214,0,0 ; movaps 0xd6fa(%rip),%xmm10 # 2f2a0 <_sk_srcover_bgra_8888_sse2_lowp+0x1158>
DB 69,15,89,209 ; mulps %xmm9,%xmm10
- DB 68,15,88,21,18,215,0,0 ; addps 0xd712(%rip),%xmm10 # 2f300 <_sk_srcover_bgra_8888_sse2_lowp+0x11b8>
+ DB 68,15,88,21,254,214,0,0 ; addps 0xd6fe(%rip),%xmm10 # 2f2b0 <_sk_srcover_bgra_8888_sse2_lowp+0x1168>
DB 69,15,89,209 ; mulps %xmm9,%xmm10
DB 69,15,88,208 ; addps %xmm8,%xmm10
DB 69,15,89,209 ; mulps %xmm9,%xmm10
- DB 68,15,88,21,14,215,0,0 ; addps 0xd70e(%rip),%xmm10 # 2f310 <_sk_srcover_bgra_8888_sse2_lowp+0x11c8>
+ DB 68,15,88,21,250,214,0,0 ; addps 0xd6fa(%rip),%xmm10 # 2f2c0 <_sk_srcover_bgra_8888_sse2_lowp+0x1178>
DB 68,15,17,144,64,1,0,0 ; movups %xmm10,0x140(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
DB 255,224 ; jmpq *%rax
@@ -32019,11 +32002,11 @@ _sk_bicubic_p3y_sse2 LABEL PROC
DB 72,173 ; lods %ds:(%rsi),%rax
DB 15,16,72,64 ; movups 0x40(%rax),%xmm1
DB 68,15,16,128,192,0,0,0 ; movups 0xc0(%rax),%xmm8
- DB 15,88,13,221,214,0,0 ; addps 0xd6dd(%rip),%xmm1 # 2f300 <_sk_srcover_bgra_8888_sse2_lowp+0x11b8>
+ DB 15,88,13,201,214,0,0 ; addps 0xd6c9(%rip),%xmm1 # 2f2b0 <_sk_srcover_bgra_8888_sse2_lowp+0x1168>
DB 69,15,40,200 ; movaps %xmm8,%xmm9
DB 69,15,89,201 ; mulps %xmm9,%xmm9
- DB 68,15,89,5,173,214,0,0 ; mulps 0xd6ad(%rip),%xmm8 # 2f2e0 <_sk_srcover_bgra_8888_sse2_lowp+0x1198>
- DB 68,15,88,5,53,210,0,0 ; addps 0xd235(%rip),%xmm8 # 2ee70 <_sk_srcover_bgra_8888_sse2_lowp+0xd28>
+ DB 68,15,89,5,153,214,0,0 ; mulps 0xd699(%rip),%xmm8 # 2f290 <_sk_srcover_bgra_8888_sse2_lowp+0x1148>
+ DB 68,15,88,5,113,210,0,0 ; addps 0xd271(%rip),%xmm8 # 2ee70 <_sk_srcover_bgra_8888_sse2_lowp+0xd28>
DB 69,15,89,193 ; mulps %xmm9,%xmm8
DB 68,15,17,128,64,1,0,0 ; movups %xmm8,0x140(%rax)
DB 72,173 ; lods %ds:(%rsi),%rax
@@ -32152,7 +32135,7 @@ _sk_clut_3D_sse2 LABEL PROC
DB 102,65,15,254,205 ; paddd %xmm13,%xmm1
DB 102,68,15,127,108,36,80 ; movdqa %xmm13,0x50(%rsp)
DB 102,15,254,217 ; paddd %xmm1,%xmm3
- DB 102,68,15,111,5,10,213,0,0 ; movdqa 0xd50a(%rip),%xmm8 # 2f330 <_sk_srcover_bgra_8888_sse2_lowp+0x11e8>
+ DB 102,68,15,111,5,246,212,0,0 ; movdqa 0xd4f6(%rip),%xmm8 # 2f2e0 <_sk_srcover_bgra_8888_sse2_lowp+0x1198>
DB 102,15,112,195,245 ; pshufd $0xf5,%xmm3,%xmm0
DB 102,65,15,244,216 ; pmuludq %xmm8,%xmm3
DB 102,65,15,244,192 ; pmuludq %xmm8,%xmm0
@@ -32191,7 +32174,7 @@ _sk_clut_3D_sse2 LABEL PROC
DB 243,66,15,16,44,139 ; movss (%rbx,%r9,4),%xmm5
DB 15,20,236 ; unpcklps %xmm4,%xmm5
DB 102,15,20,221 ; unpcklpd %xmm5,%xmm3
- DB 102,68,15,111,37,193,205,0,0 ; movdqa 0xcdc1(%rip),%xmm12 # 2eca0 <_sk_srcover_bgra_8888_sse2_lowp+0xb58>
+ DB 102,68,15,111,37,253,205,0,0 ; movdqa 0xcdfd(%rip),%xmm12 # 2eca0 <_sk_srcover_bgra_8888_sse2_lowp+0xb58>
DB 102,65,15,254,196 ; paddd %xmm12,%xmm0
DB 102,15,112,224,78 ; pshufd $0x4e,%xmm0,%xmm4
DB 102,73,15,126,224 ; movq %xmm4,%r8
@@ -32207,7 +32190,7 @@ _sk_clut_3D_sse2 LABEL PROC
DB 243,66,15,16,36,139 ; movss (%rbx,%r9,4),%xmm4
DB 15,20,224 ; unpcklps %xmm0,%xmm4
DB 102,15,20,236 ; unpcklpd %xmm4,%xmm5
- DB 15,40,37,246,211,0,0 ; movaps 0xd3f6(%rip),%xmm4 # 2f320 <_sk_srcover_bgra_8888_sse2_lowp+0x11d8>
+ DB 15,40,37,226,211,0,0 ; movaps 0xd3e2(%rip),%xmm4 # 2f2d0 <_sk_srcover_bgra_8888_sse2_lowp+0x1188>
DB 68,15,88,220 ; addps %xmm4,%xmm11
DB 68,15,41,92,36,64 ; movaps %xmm11,0x40(%rsp)
DB 68,15,40,223 ; movaps %xmm7,%xmm11
@@ -32243,7 +32226,7 @@ _sk_clut_3D_sse2 LABEL PROC
DB 15,20,249 ; unpcklps %xmm1,%xmm7
DB 102,15,20,252 ; unpcklpd %xmm4,%xmm7
DB 102,15,111,202 ; movdqa %xmm2,%xmm1
- DB 102,15,250,13,107,211,0,0 ; psubd 0xd36b(%rip),%xmm1 # 2f340 <_sk_srcover_bgra_8888_sse2_lowp+0x11f8>
+ DB 102,15,250,13,87,211,0,0 ; psubd 0xd357(%rip),%xmm1 # 2f2f0 <_sk_srcover_bgra_8888_sse2_lowp+0x11a8>
DB 102,15,112,225,78 ; pshufd $0x4e,%xmm1,%xmm4
DB 102,73,15,126,224 ; movq %xmm4,%r8
DB 102,72,15,126,200 ; movq %xmm1,%rax
@@ -32333,7 +32316,7 @@ _sk_clut_3D_sse2 LABEL PROC
DB 243,15,16,44,131 ; movss (%rbx,%rax,4),%xmm5
DB 15,20,233 ; unpcklps %xmm1,%xmm5
DB 102,15,20,221 ; unpcklpd %xmm5,%xmm3
- DB 102,68,15,111,45,51,203,0,0 ; movdqa 0xcb33(%rip),%xmm13 # 2eca0 <_sk_srcover_bgra_8888_sse2_lowp+0xb58>
+ DB 102,68,15,111,45,111,203,0,0 ; movdqa 0xcb6f(%rip),%xmm13 # 2eca0 <_sk_srcover_bgra_8888_sse2_lowp+0xb58>
DB 102,65,15,254,197 ; paddd %xmm13,%xmm0
DB 102,15,112,200,78 ; pshufd $0x4e,%xmm0,%xmm1
DB 102,73,15,126,200 ; movq %xmm1,%r8
@@ -32430,7 +32413,7 @@ _sk_clut_3D_sse2 LABEL PROC
DB 102,15,111,206 ; movdqa %xmm6,%xmm1
DB 102,65,15,254,202 ; paddd %xmm10,%xmm1
DB 102,15,112,209,245 ; pshufd $0xf5,%xmm1,%xmm2
- DB 102,15,111,29,8,208,0,0 ; movdqa 0xd008(%rip),%xmm3 # 2f330 <_sk_srcover_bgra_8888_sse2_lowp+0x11e8>
+ DB 102,15,111,29,244,207,0,0 ; movdqa 0xcff4(%rip),%xmm3 # 2f2e0 <_sk_srcover_bgra_8888_sse2_lowp+0x1198>
DB 102,15,244,203 ; pmuludq %xmm3,%xmm1
DB 102,15,244,211 ; pmuludq %xmm3,%xmm2
DB 102,15,111,251 ; movdqa %xmm3,%xmm7
@@ -32468,7 +32451,7 @@ _sk_clut_3D_sse2 LABEL PROC
DB 243,15,16,44,131 ; movss (%rbx,%rax,4),%xmm5
DB 15,20,236 ; unpcklps %xmm4,%xmm5
DB 102,15,20,213 ; unpcklpd %xmm5,%xmm2
- DB 102,15,111,5,200,200,0,0 ; movdqa 0xc8c8(%rip),%xmm0 # 2eca0 <_sk_srcover_bgra_8888_sse2_lowp+0xb58>
+ DB 102,15,111,5,4,201,0,0 ; movdqa 0xc904(%rip),%xmm0 # 2eca0 <_sk_srcover_bgra_8888_sse2_lowp+0xb58>
DB 102,15,254,216 ; paddd %xmm0,%xmm3
DB 102,15,112,227,78 ; pshufd $0x4e,%xmm3,%xmm4
DB 102,73,15,126,224 ; movq %xmm4,%r8
@@ -32549,7 +32532,7 @@ _sk_clut_3D_sse2 LABEL PROC
DB 102,15,111,214 ; movdqa %xmm6,%xmm2
DB 102,65,15,254,212 ; paddd %xmm12,%xmm2
DB 102,15,112,194,245 ; pshufd $0xf5,%xmm2,%xmm0
- DB 102,15,111,13,230,205,0,0 ; movdqa 0xcde6(%rip),%xmm1 # 2f330 <_sk_srcover_bgra_8888_sse2_lowp+0x11e8>
+ DB 102,15,111,13,210,205,0,0 ; movdqa 0xcdd2(%rip),%xmm1 # 2f2e0 <_sk_srcover_bgra_8888_sse2_lowp+0x1198>
DB 102,15,244,209 ; pmuludq %xmm1,%xmm2
DB 102,15,244,193 ; pmuludq %xmm1,%xmm0
DB 102,15,111,241 ; movdqa %xmm1,%xmm6
@@ -32571,7 +32554,7 @@ _sk_clut_3D_sse2 LABEL PROC
DB 68,15,20,209 ; unpcklps %xmm1,%xmm10
DB 102,68,15,20,210 ; unpcklpd %xmm2,%xmm10
DB 102,15,111,200 ; movdqa %xmm0,%xmm1
- DB 102,15,250,13,139,205,0,0 ; psubd 0xcd8b(%rip),%xmm1 # 2f340 <_sk_srcover_bgra_8888_sse2_lowp+0x11f8>
+ DB 102,15,250,13,119,205,0,0 ; psubd 0xcd77(%rip),%xmm1 # 2f2f0 <_sk_srcover_bgra_8888_sse2_lowp+0x11a8>
DB 102,15,112,209,78 ; pshufd $0x4e,%xmm1,%xmm2
DB 102,73,15,126,208 ; movq %xmm2,%r8
DB 102,72,15,126,200 ; movq %xmm1,%rax
@@ -32586,7 +32569,7 @@ _sk_clut_3D_sse2 LABEL PROC
DB 243,15,16,20,131 ; movss (%rbx,%rax,4),%xmm2
DB 15,20,209 ; unpcklps %xmm1,%xmm2
DB 102,15,20,226 ; unpcklpd %xmm2,%xmm4
- DB 102,15,254,5,166,198,0,0 ; paddd 0xc6a6(%rip),%xmm0 # 2eca0 <_sk_srcover_bgra_8888_sse2_lowp+0xb58>
+ DB 102,15,254,5,226,198,0,0 ; paddd 0xc6e2(%rip),%xmm0 # 2eca0 <_sk_srcover_bgra_8888_sse2_lowp+0xb58>
DB 102,15,112,200,78 ; pshufd $0x4e,%xmm0,%xmm1
DB 102,73,15,126,200 ; movq %xmm1,%r8
DB 102,72,15,126,192 ; movq %xmm0,%rax
@@ -32623,7 +32606,7 @@ _sk_clut_3D_sse2 LABEL PROC
DB 15,20,199 ; unpcklps %xmm7,%xmm0
DB 102,15,20,193 ; unpcklpd %xmm1,%xmm0
DB 102,15,111,202 ; movdqa %xmm2,%xmm1
- DB 102,15,250,13,149,204,0,0 ; psubd 0xcc95(%rip),%xmm1 # 2f340 <_sk_srcover_bgra_8888_sse2_lowp+0x11f8>
+ DB 102,15,250,13,129,204,0,0 ; psubd 0xcc81(%rip),%xmm1 # 2f2f0 <_sk_srcover_bgra_8888_sse2_lowp+0x11a8>
DB 102,15,112,249,78 ; pshufd $0x4e,%xmm1,%xmm7
DB 102,73,15,126,248 ; movq %xmm7,%r8
DB 102,72,15,126,200 ; movq %xmm1,%rax
@@ -32638,7 +32621,7 @@ _sk_clut_3D_sse2 LABEL PROC
DB 243,15,16,52,131 ; movss (%rbx,%rax,4),%xmm6
DB 15,20,247 ; unpcklps %xmm7,%xmm6
DB 102,15,20,206 ; unpcklpd %xmm6,%xmm1
- DB 102,15,254,21,176,197,0,0 ; paddd 0xc5b0(%rip),%xmm2 # 2eca0 <_sk_srcover_bgra_8888_sse2_lowp+0xb58>
+ DB 102,15,254,21,236,197,0,0 ; paddd 0xc5ec(%rip),%xmm2 # 2eca0 <_sk_srcover_bgra_8888_sse2_lowp+0xb58>
DB 102,15,112,242,78 ; pshufd $0x4e,%xmm2,%xmm6
DB 102,73,15,126,240 ; movq %xmm6,%r8
DB 102,72,15,126,208 ; movq %xmm2,%rax
@@ -32782,7 +32765,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 102,65,15,254,210 ; paddd %xmm10,%xmm2
DB 102,15,111,220 ; movdqa %xmm4,%xmm3
DB 102,15,254,218 ; paddd %xmm2,%xmm3
- DB 102,15,111,37,185,201,0,0 ; movdqa 0xc9b9(%rip),%xmm4 # 2f330 <_sk_srcover_bgra_8888_sse2_lowp+0x11e8>
+ DB 102,15,111,37,165,201,0,0 ; movdqa 0xc9a5(%rip),%xmm4 # 2f2e0 <_sk_srcover_bgra_8888_sse2_lowp+0x1198>
DB 102,15,112,195,245 ; pshufd $0xf5,%xmm3,%xmm0
DB 102,15,244,220 ; pmuludq %xmm4,%xmm3
DB 102,15,244,196 ; pmuludq %xmm4,%xmm0
@@ -32821,7 +32804,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 243,66,15,16,52,139 ; movss (%rbx,%r9,4),%xmm6
DB 15,20,244 ; unpcklps %xmm4,%xmm6
DB 102,15,20,238 ; unpcklpd %xmm6,%xmm5
- DB 102,15,254,5,115,194,0,0 ; paddd 0xc273(%rip),%xmm0 # 2eca0 <_sk_srcover_bgra_8888_sse2_lowp+0xb58>
+ DB 102,15,254,5,175,194,0,0 ; paddd 0xc2af(%rip),%xmm0 # 2eca0 <_sk_srcover_bgra_8888_sse2_lowp+0xb58>
DB 102,15,112,224,78 ; pshufd $0x4e,%xmm0,%xmm4
DB 102,73,15,126,224 ; movq %xmm4,%r8
DB 102,73,15,126,193 ; movq %xmm0,%r9
@@ -32836,7 +32819,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 243,66,15,16,52,139 ; movss (%rbx,%r9,4),%xmm6
DB 15,20,244 ; unpcklps %xmm4,%xmm6
DB 102,15,20,222 ; unpcklpd %xmm6,%xmm3
- DB 15,40,53,173,200,0,0 ; movaps 0xc8ad(%rip),%xmm6 # 2f320 <_sk_srcover_bgra_8888_sse2_lowp+0x11d8>
+ DB 15,40,53,153,200,0,0 ; movaps 0xc899(%rip),%xmm6 # 2f2d0 <_sk_srcover_bgra_8888_sse2_lowp+0x1188>
DB 68,15,88,198 ; addps %xmm6,%xmm8
DB 68,15,41,68,36,48 ; movaps %xmm8,0x30(%rsp)
DB 68,15,88,254 ; addps %xmm6,%xmm15
@@ -32854,7 +32837,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 102,65,15,254,215 ; paddd %xmm15,%xmm2
DB 102,68,15,127,124,36,96 ; movdqa %xmm15,0x60(%rsp)
DB 102,15,112,194,245 ; pshufd $0xf5,%xmm2,%xmm0
- DB 102,15,111,13,96,200,0,0 ; movdqa 0xc860(%rip),%xmm1 # 2f330 <_sk_srcover_bgra_8888_sse2_lowp+0x11e8>
+ DB 102,15,111,13,76,200,0,0 ; movdqa 0xc84c(%rip),%xmm1 # 2f2e0 <_sk_srcover_bgra_8888_sse2_lowp+0x1198>
DB 102,15,244,209 ; pmuludq %xmm1,%xmm2
DB 102,15,244,193 ; pmuludq %xmm1,%xmm0
DB 102,15,112,192,232 ; pshufd $0xe8,%xmm0,%xmm0
@@ -32875,7 +32858,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 15,20,240 ; unpcklps %xmm0,%xmm6
DB 102,15,20,242 ; unpcklpd %xmm2,%xmm6
DB 102,15,111,193 ; movdqa %xmm1,%xmm0
- DB 102,15,250,5,11,200,0,0 ; psubd 0xc80b(%rip),%xmm0 # 2f340 <_sk_srcover_bgra_8888_sse2_lowp+0x11f8>
+ DB 102,15,250,5,247,199,0,0 ; psubd 0xc7f7(%rip),%xmm0 # 2f2f0 <_sk_srcover_bgra_8888_sse2_lowp+0x11a8>
DB 102,15,112,208,78 ; pshufd $0x4e,%xmm0,%xmm2
DB 102,73,15,126,208 ; movq %xmm2,%r8
DB 102,72,15,126,192 ; movq %xmm0,%rax
@@ -32890,7 +32873,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 243,68,15,16,28,131 ; movss (%rbx,%rax,4),%xmm11
DB 68,15,20,216 ; unpcklps %xmm0,%xmm11
DB 102,65,15,20,211 ; unpcklpd %xmm11,%xmm2
- DB 102,15,254,13,35,193,0,0 ; paddd 0xc123(%rip),%xmm1 # 2eca0 <_sk_srcover_bgra_8888_sse2_lowp+0xb58>
+ DB 102,15,254,13,95,193,0,0 ; paddd 0xc15f(%rip),%xmm1 # 2eca0 <_sk_srcover_bgra_8888_sse2_lowp+0xb58>
DB 102,15,112,193,78 ; pshufd $0x4e,%xmm1,%xmm0
DB 102,73,15,126,192 ; movq %xmm0,%r8
DB 102,72,15,126,200 ; movq %xmm1,%rax
@@ -32928,7 +32911,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 102,65,15,111,194 ; movdqa %xmm10,%xmm0
DB 102,15,254,68,36,32 ; paddd 0x20(%rsp),%xmm0
DB 102,15,112,216,245 ; pshufd $0xf5,%xmm0,%xmm3
- DB 102,15,111,37,7,199,0,0 ; movdqa 0xc707(%rip),%xmm4 # 2f330 <_sk_srcover_bgra_8888_sse2_lowp+0x11e8>
+ DB 102,15,111,37,243,198,0,0 ; movdqa 0xc6f3(%rip),%xmm4 # 2f2e0 <_sk_srcover_bgra_8888_sse2_lowp+0x1198>
DB 102,15,244,196 ; pmuludq %xmm4,%xmm0
DB 102,15,244,220 ; pmuludq %xmm4,%xmm3
DB 102,68,15,111,220 ; movdqa %xmm4,%xmm11
@@ -32966,7 +32949,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 243,15,16,60,131 ; movss (%rbx,%rax,4),%xmm7
DB 15,20,253 ; unpcklps %xmm5,%xmm7
DB 102,15,20,199 ; unpcklpd %xmm7,%xmm0
- DB 102,68,15,111,5,195,191,0,0 ; movdqa 0xbfc3(%rip),%xmm8 # 2eca0 <_sk_srcover_bgra_8888_sse2_lowp+0xb58>
+ DB 102,68,15,111,5,255,191,0,0 ; movdqa 0xbfff(%rip),%xmm8 # 2eca0 <_sk_srcover_bgra_8888_sse2_lowp+0xb58>
DB 102,65,15,254,224 ; paddd %xmm8,%xmm4
DB 102,15,112,236,78 ; pshufd $0x4e,%xmm4,%xmm5
DB 102,73,15,126,232 ; movq %xmm5,%r8
@@ -33112,7 +33095,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 243,15,16,36,131 ; movss (%rbx,%rax,4),%xmm4
DB 15,20,226 ; unpcklps %xmm2,%xmm4
DB 102,15,20,252 ; unpcklpd %xmm4,%xmm7
- DB 102,68,15,111,61,18,189,0,0 ; movdqa 0xbd12(%rip),%xmm15 # 2eca0 <_sk_srcover_bgra_8888_sse2_lowp+0xb58>
+ DB 102,68,15,111,61,78,189,0,0 ; movdqa 0xbd4e(%rip),%xmm15 # 2eca0 <_sk_srcover_bgra_8888_sse2_lowp+0xb58>
DB 102,65,15,254,207 ; paddd %xmm15,%xmm1
DB 102,15,112,209,78 ; pshufd $0x4e,%xmm1,%xmm2
DB 102,73,15,126,208 ; movq %xmm2,%r8
@@ -33195,7 +33178,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 102,65,15,111,217 ; movdqa %xmm9,%xmm3
DB 102,65,15,254,216 ; paddd %xmm8,%xmm3
DB 102,15,112,211,245 ; pshufd $0xf5,%xmm3,%xmm2
- DB 102,15,111,45,43,194,0,0 ; movdqa 0xc22b(%rip),%xmm5 # 2f330 <_sk_srcover_bgra_8888_sse2_lowp+0x11e8>
+ DB 102,15,111,45,23,194,0,0 ; movdqa 0xc217(%rip),%xmm5 # 2f2e0 <_sk_srcover_bgra_8888_sse2_lowp+0x1198>
DB 102,15,244,221 ; pmuludq %xmm5,%xmm3
DB 102,15,244,213 ; pmuludq %xmm5,%xmm2
DB 102,15,112,234,232 ; pshufd $0xe8,%xmm2,%xmm5
@@ -33216,7 +33199,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 68,15,20,198 ; unpcklps %xmm6,%xmm8
DB 102,68,15,20,197 ; unpcklpd %xmm5,%xmm8
DB 102,15,111,234 ; movdqa %xmm2,%xmm5
- DB 102,15,250,45,212,193,0,0 ; psubd 0xc1d4(%rip),%xmm5 # 2f340 <_sk_srcover_bgra_8888_sse2_lowp+0x11f8>
+ DB 102,15,250,45,192,193,0,0 ; psubd 0xc1c0(%rip),%xmm5 # 2f2f0 <_sk_srcover_bgra_8888_sse2_lowp+0x11a8>
DB 102,15,112,245,78 ; pshufd $0x4e,%xmm5,%xmm6
DB 102,73,15,126,240 ; movq %xmm6,%r8
DB 102,72,15,126,232 ; movq %xmm5,%rax
@@ -33248,7 +33231,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 102,15,20,214 ; unpcklpd %xmm6,%xmm2
DB 102,69,15,254,205 ; paddd %xmm13,%xmm9
DB 102,65,15,112,233,245 ; pshufd $0xf5,%xmm9,%xmm5
- DB 102,15,111,29,50,193,0,0 ; movdqa 0xc132(%rip),%xmm3 # 2f330 <_sk_srcover_bgra_8888_sse2_lowp+0x11e8>
+ DB 102,15,111,29,30,193,0,0 ; movdqa 0xc11e(%rip),%xmm3 # 2f2e0 <_sk_srcover_bgra_8888_sse2_lowp+0x1198>
DB 102,68,15,244,203 ; pmuludq %xmm3,%xmm9
DB 102,15,244,235 ; pmuludq %xmm3,%xmm5
DB 102,15,112,237,232 ; pshufd $0xe8,%xmm5,%xmm5
@@ -33269,7 +33252,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 69,15,20,233 ; unpcklps %xmm9,%xmm13
DB 102,68,15,20,237 ; unpcklpd %xmm5,%xmm13
DB 102,65,15,111,239 ; movdqa %xmm15,%xmm5
- DB 102,15,250,45,210,192,0,0 ; psubd 0xc0d2(%rip),%xmm5 # 2f340 <_sk_srcover_bgra_8888_sse2_lowp+0x11f8>
+ DB 102,15,250,45,190,192,0,0 ; psubd 0xc0be(%rip),%xmm5 # 2f2f0 <_sk_srcover_bgra_8888_sse2_lowp+0x11a8>
DB 102,15,112,221,78 ; pshufd $0x4e,%xmm5,%xmm3
DB 102,73,15,126,216 ; movq %xmm3,%r8
DB 102,72,15,126,232 ; movq %xmm5,%rax
@@ -33284,7 +33267,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 243,15,16,44,131 ; movss (%rbx,%rax,4),%xmm5
DB 15,20,235 ; unpcklps %xmm3,%xmm5
DB 102,15,20,245 ; unpcklpd %xmm5,%xmm6
- DB 102,68,15,111,13,236,185,0,0 ; movdqa 0xb9ec(%rip),%xmm9 # 2eca0 <_sk_srcover_bgra_8888_sse2_lowp+0xb58>
+ DB 102,68,15,111,13,40,186,0,0 ; movdqa 0xba28(%rip),%xmm9 # 2eca0 <_sk_srcover_bgra_8888_sse2_lowp+0xb58>
DB 102,69,15,254,249 ; paddd %xmm9,%xmm15
DB 102,65,15,112,223,78 ; pshufd $0x4e,%xmm15,%xmm3
DB 102,73,15,126,216 ; movq %xmm3,%r8
@@ -33346,7 +33329,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 102,65,15,111,195 ; movdqa %xmm11,%xmm0
DB 102,15,254,195 ; paddd %xmm3,%xmm0
DB 102,15,112,200,245 ; pshufd $0xf5,%xmm0,%xmm1
- DB 102,15,111,21,102,191,0,0 ; movdqa 0xbf66(%rip),%xmm2 # 2f330 <_sk_srcover_bgra_8888_sse2_lowp+0x11e8>
+ DB 102,15,111,21,82,191,0,0 ; movdqa 0xbf52(%rip),%xmm2 # 2f2e0 <_sk_srcover_bgra_8888_sse2_lowp+0x1198>
DB 102,15,244,194 ; pmuludq %xmm2,%xmm0
DB 102,15,244,202 ; pmuludq %xmm2,%xmm1
DB 102,68,15,111,234 ; movdqa %xmm2,%xmm13
@@ -33539,7 +33522,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 68,15,20,238 ; unpcklps %xmm6,%xmm13
DB 102,68,15,20,234 ; unpcklpd %xmm2,%xmm13
DB 102,15,111,212 ; movdqa %xmm4,%xmm2
- DB 102,15,250,21,255,187,0,0 ; psubd 0xbbff(%rip),%xmm2 # 2f340 <_sk_srcover_bgra_8888_sse2_lowp+0x11f8>
+ DB 102,15,250,21,235,187,0,0 ; psubd 0xbbeb(%rip),%xmm2 # 2f2f0 <_sk_srcover_bgra_8888_sse2_lowp+0x11a8>
DB 102,15,112,242,78 ; pshufd $0x4e,%xmm2,%xmm6
DB 102,73,15,126,240 ; movq %xmm6,%r8
DB 102,72,15,126,208 ; movq %xmm2,%rax
@@ -33599,7 +33582,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 102,68,15,111,116,36,32 ; movdqa 0x20(%rsp),%xmm14
DB 102,65,15,254,198 ; paddd %xmm14,%xmm0
DB 102,15,112,200,245 ; pshufd $0xf5,%xmm0,%xmm1
- DB 102,68,15,111,5,220,186,0,0 ; movdqa 0xbadc(%rip),%xmm8 # 2f330 <_sk_srcover_bgra_8888_sse2_lowp+0x11e8>
+ DB 102,68,15,111,5,200,186,0,0 ; movdqa 0xbac8(%rip),%xmm8 # 2f2e0 <_sk_srcover_bgra_8888_sse2_lowp+0x1198>
DB 102,65,15,244,192 ; pmuludq %xmm8,%xmm0
DB 102,65,15,244,200 ; pmuludq %xmm8,%xmm1
DB 102,65,15,111,240 ; movdqa %xmm8,%xmm6
@@ -33637,7 +33620,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 243,15,16,44,131 ; movss (%rbx,%rax,4),%xmm5
DB 15,20,235 ; unpcklps %xmm3,%xmm5
DB 102,15,20,205 ; unpcklpd %xmm5,%xmm1
- DB 102,68,15,111,5,154,179,0,0 ; movdqa 0xb39a(%rip),%xmm8 # 2eca0 <_sk_srcover_bgra_8888_sse2_lowp+0xb58>
+ DB 102,68,15,111,5,214,179,0,0 ; movdqa 0xb3d6(%rip),%xmm8 # 2eca0 <_sk_srcover_bgra_8888_sse2_lowp+0xb58>
DB 102,65,15,254,208 ; paddd %xmm8,%xmm2
DB 102,15,112,218,78 ; pshufd $0x4e,%xmm2,%xmm3
DB 102,73,15,126,216 ; movq %xmm3,%r8
@@ -33720,7 +33703,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 102,15,254,208 ; paddd %xmm0,%xmm2
DB 102,15,111,240 ; movdqa %xmm0,%xmm6
DB 102,15,112,194,245 ; pshufd $0xf5,%xmm2,%xmm0
- DB 102,15,111,37,180,184,0,0 ; movdqa 0xb8b4(%rip),%xmm4 # 2f330 <_sk_srcover_bgra_8888_sse2_lowp+0x11e8>
+ DB 102,15,111,37,160,184,0,0 ; movdqa 0xb8a0(%rip),%xmm4 # 2f2e0 <_sk_srcover_bgra_8888_sse2_lowp+0x1198>
DB 102,15,244,212 ; pmuludq %xmm4,%xmm2
DB 102,15,244,196 ; pmuludq %xmm4,%xmm0
DB 102,15,112,200,232 ; pshufd $0xe8,%xmm0,%xmm1
@@ -33741,7 +33724,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 68,15,20,193 ; unpcklps %xmm1,%xmm8
DB 102,68,15,20,194 ; unpcklpd %xmm2,%xmm8
DB 102,15,111,200 ; movdqa %xmm0,%xmm1
- DB 102,15,250,13,93,184,0,0 ; psubd 0xb85d(%rip),%xmm1 # 2f340 <_sk_srcover_bgra_8888_sse2_lowp+0x11f8>
+ DB 102,15,250,13,73,184,0,0 ; psubd 0xb849(%rip),%xmm1 # 2f2f0 <_sk_srcover_bgra_8888_sse2_lowp+0x11a8>
DB 102,15,112,209,78 ; pshufd $0x4e,%xmm1,%xmm2
DB 102,73,15,126,208 ; movq %xmm2,%r8
DB 102,72,15,126,200 ; movq %xmm1,%rax
@@ -33756,7 +33739,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 243,15,16,20,131 ; movss (%rbx,%rax,4),%xmm2
DB 15,20,209 ; unpcklps %xmm1,%xmm2
DB 102,68,15,20,242 ; unpcklpd %xmm2,%xmm14
- DB 102,15,254,5,118,177,0,0 ; paddd 0xb176(%rip),%xmm0 # 2eca0 <_sk_srcover_bgra_8888_sse2_lowp+0xb58>
+ DB 102,15,254,5,178,177,0,0 ; paddd 0xb1b2(%rip),%xmm0 # 2eca0 <_sk_srcover_bgra_8888_sse2_lowp+0xb58>
DB 102,15,112,200,78 ; pshufd $0x4e,%xmm0,%xmm1
DB 102,73,15,126,200 ; movq %xmm1,%r8
DB 102,72,15,126,192 ; movq %xmm0,%rax
@@ -33794,7 +33777,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 15,20,198 ; unpcklps %xmm6,%xmm0
DB 102,15,20,193 ; unpcklpd %xmm1,%xmm0
DB 102,15,111,202 ; movdqa %xmm2,%xmm1
- DB 102,15,250,13,101,183,0,0 ; psubd 0xb765(%rip),%xmm1 # 2f340 <_sk_srcover_bgra_8888_sse2_lowp+0x11f8>
+ DB 102,15,250,13,81,183,0,0 ; psubd 0xb751(%rip),%xmm1 # 2f2f0 <_sk_srcover_bgra_8888_sse2_lowp+0x11a8>
DB 102,15,112,241,78 ; pshufd $0x4e,%xmm1,%xmm6
DB 102,73,15,126,240 ; movq %xmm6,%r8
DB 102,72,15,126,200 ; movq %xmm1,%rax
@@ -33809,7 +33792,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 243,15,16,36,131 ; movss (%rbx,%rax,4),%xmm4
DB 15,20,230 ; unpcklps %xmm6,%xmm4
DB 102,15,20,204 ; unpcklpd %xmm4,%xmm1
- DB 102,15,254,21,128,176,0,0 ; paddd 0xb080(%rip),%xmm2 # 2eca0 <_sk_srcover_bgra_8888_sse2_lowp+0xb58>
+ DB 102,15,254,21,188,176,0,0 ; paddd 0xb0bc(%rip),%xmm2 # 2eca0 <_sk_srcover_bgra_8888_sse2_lowp+0xb58>
DB 102,15,112,226,78 ; pshufd $0x4e,%xmm2,%xmm4
DB 102,73,15,126,224 ; movq %xmm4,%r8
DB 102,72,15,126,208 ; movq %xmm2,%rax
@@ -33868,7 +33851,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 15,89,212 ; mulps %xmm4,%xmm2
DB 65,15,88,215 ; addps %xmm15,%xmm2
DB 72,173 ; lods %ds:(%rsi),%rax
- DB 15,40,29,102,175,0,0 ; movaps 0xaf66(%rip),%xmm3 # 2ec70 <_sk_srcover_bgra_8888_sse2_lowp+0xb28>
+ DB 15,40,29,162,175,0,0 ; movaps 0xafa2(%rip),%xmm3 # 2ec70 <_sk_srcover_bgra_8888_sse2_lowp+0xb28>
DB 15,40,164,36,224,0,0,0 ; movaps 0xe0(%rsp),%xmm4
DB 15,40,172,36,240,0,0,0 ; movaps 0xf0(%rsp),%xmm5
DB 15,40,180,36,0,1,0,0 ; movaps 0x100(%rsp),%xmm6
@@ -33877,6 +33860,23 @@ _sk_clut_4D_sse2 LABEL PROC
DB 91 ; pop %rbx
DB 255,224 ; jmpq *%rax
+PUBLIC _sk_gauss_a_to_rgba_sse2
+_sk_gauss_a_to_rgba_sse2 LABEL PROC
+ DB 15,40,5,1,182,0,0 ; movaps 0xb601(%rip),%xmm0 # 2f300 <_sk_srcover_bgra_8888_sse2_lowp+0x11b8>
+ DB 15,89,195 ; mulps %xmm3,%xmm0
+ DB 15,88,5,7,182,0,0 ; addps 0xb607(%rip),%xmm0 # 2f310 <_sk_srcover_bgra_8888_sse2_lowp+0x11c8>
+ DB 15,89,195 ; mulps %xmm3,%xmm0
+ DB 15,88,5,13,182,0,0 ; addps 0xb60d(%rip),%xmm0 # 2f320 <_sk_srcover_bgra_8888_sse2_lowp+0x11d8>
+ DB 15,89,195 ; mulps %xmm3,%xmm0
+ DB 15,88,5,19,182,0,0 ; addps 0xb613(%rip),%xmm0 # 2f330 <_sk_srcover_bgra_8888_sse2_lowp+0x11e8>
+ DB 15,89,195 ; mulps %xmm3,%xmm0
+ DB 15,88,5,25,182,0,0 ; addps 0xb619(%rip),%xmm0 # 2f340 <_sk_srcover_bgra_8888_sse2_lowp+0x11f8>
+ DB 72,173 ; lods %ds:(%rsi),%rax
+ DB 15,40,200 ; movaps %xmm0,%xmm1
+ DB 15,40,208 ; movaps %xmm0,%xmm2
+ DB 15,40,216 ; movaps %xmm0,%xmm3
+ DB 255,224 ; jmpq *%rax
+
PUBLIC _sk_start_pipeline_hsw_lowp
_sk_start_pipeline_hsw_lowp LABEL PROC
DB 85 ; push %rbp
@@ -44645,15 +44645,9 @@ ALIGN 4
DB 55 ; (bad)
DB 63 ; (bad)
DB 152 ; cwtl
- DB 221,147,61,18,120,57 ; fstl 0x3978123d(%rbx)
- DB 64,45,16,17,192,32 ; rex sub $0x20c01110,%eax
- DB 148 ; xchg %eax,%esp
- DB 90 ; pop %rdx
- DB 62,4,157 ; ds add $0x9d,%al
- DB 30 ; (bad)
- DB 62,0,24 ; add %bl,%ds:(%rax)
- DB 161,57,111,43,231,187,159,215,202 ; movabs 0xcad79fbbe72b6f39,%eax
- DB 60,212 ; cmp $0xd4,%al
+ DB 221,147,61,111,43,231 ; fstl -0x18d490c3(%rbx)
+ DB 187,159,215,202,60 ; mov $0x3ccad79f,%ebx
+ DB 212 ; (bad)
DB 100,84 ; fs push %rsp
DB 189,169,240,34,62 ; mov $0x3e22f0a9,%ebp
DB 0,0 ; add %al,(%rax)
@@ -44664,20 +44658,25 @@ ALIGN 4
DB 0,0 ; add %al,(%rax)
DB 128,0,0 ; addb $0x0,(%rax)
DB 0,191,0,0,192,191 ; add %bh,-0x40400000(%rdi)
- DB 114,28 ; jb 2e57e <.literal4+0x18a>
+ DB 114,28 ; jb 2e56a <.literal4+0x176>
DB 199 ; (bad)
DB 62,0,0 ; add %al,%ds:(%rax)
DB 192,63,85 ; sarb $0x55,(%rdi)
DB 85 ; push %rbp
DB 149 ; xchg %eax,%ebp
DB 191,57,142,99,61 ; mov $0x3d638e39,%edi
- DB 114,249 ; jb 2e56b <.literal4+0x177>
- DB 127,63 ; jg 2e5b3 <_sk_srcover_bgra_8888_sse2_lowp+0x46b>
+ DB 114,249 ; jb 2e557 <.literal4+0x163>
+ DB 127,63 ; jg 2e59f <_sk_srcover_bgra_8888_sse2_lowp+0x457>
DB 3,0 ; add (%rax),%eax
DB 0,0 ; add %al,(%rax)
- DB 0,4,0 ; add %al,(%rax,%rax,1)
- DB 0,0 ; add %al,(%rax)
- DB 0,0 ; add %al,(%rax)
+ DB 18,120,57 ; adc 0x39(%rax),%bh
+ DB 64,45,16,17,192,32 ; rex sub $0x20c01110,%eax
+ DB 148 ; xchg %eax,%esp
+ DB 90 ; pop %rdx
+ DB 62,4,157 ; ds add $0x9d,%al
+ DB 30 ; (bad)
+ DB 62,0,24 ; add %bl,%ds:(%rax)
+ DB 161,57,0,4,0,0,0,0,0 ; movabs 0x40039,%eax
DB 56,255 ; cmp %bh,%bh
DB 255 ; (bad)
DB 255 ; (bad)
@@ -46211,28 +46210,7 @@ ALIGN 16
DB 221,147,61,152,221,147 ; fstl -0x6c2267c3(%rbx)
DB 61,152,221,147,61 ; cmp $0x3d93dd98,%eax
DB 152 ; cwtl
- DB 221,147,61,45,16,17 ; fstl 0x11102d3d(%rbx)
- DB 192,45,16,17,192,45,16 ; shrb $0x10,0x2dc01110(%rip) # 2dc3031a <_sk_srcover_bgra_8888_sse2_lowp+0x2dc021d2>
- DB 17,192 ; adc %eax,%eax
- DB 45,16,17,192,18 ; sub $0x12c01110,%eax
- DB 120,57 ; js 2f24c <.literal16+0x63c>
- DB 64,18,120,57 ; adc 0x39(%rax),%dil
- DB 64,18,120,57 ; adc 0x39(%rax),%dil
- DB 64,18,120,57 ; adc 0x39(%rax),%dil
- DB 64,32,148,90,62,32,148,90 ; and %dl,0x5a94203e(%rdx,%rbx,2)
- DB 62,32,148,90,62,32,148,90 ; and %dl,%ds:0x5a94203e(%rdx,%rbx,2)
- DB 62,4,157 ; ds add $0x9d,%al
- DB 30 ; (bad)
- DB 62,4,157 ; ds add $0x9d,%al
- DB 30 ; (bad)
- DB 62,4,157 ; ds add $0x9d,%al
- DB 30 ; (bad)
- DB 62,4,157 ; ds add $0x9d,%al
- DB 30 ; (bad)
- DB 62,0,24 ; add %bl,%ds:(%rax)
- DB 161,57,0,24,161,57,0,24,161 ; movabs 0xa1180039a1180039,%eax
- DB 57,0 ; cmp %eax,(%rax)
- DB 24,161,57,111,43,231 ; sbb %ah,-0x18d490c7(%rcx)
+ DB 221,147,61,111,43,231 ; fstl -0x18d490c3(%rbx)
DB 187,111,43,231,187 ; mov $0xbbe72b6f,%ebx
DB 111 ; outsl %ds:(%rsi),(%dx)
DB 43,231 ; sub %edi,%esp
@@ -46280,13 +46258,13 @@ ALIGN 16
DB 192,191,0,0,192,191,0 ; sarb $0x0,-0x40400000(%rdi)
DB 0,192 ; add %al,%al
DB 191,0,0,192,191 ; mov $0xbfc00000,%edi
- DB 114,28 ; jb 2f2fe <.literal16+0x6ee>
+ DB 114,28 ; jb 2f2ae <.literal16+0x69e>
DB 199 ; (bad)
- DB 62,114,28 ; jb,pt 2f302 <.literal16+0x6f2>
+ DB 62,114,28 ; jb,pt 2f2b2 <.literal16+0x6a2>
DB 199 ; (bad)
- DB 62,114,28 ; jb,pt 2f306 <.literal16+0x6f6>
+ DB 62,114,28 ; jb,pt 2f2b6 <.literal16+0x6a6>
DB 199 ; (bad)
- DB 62,114,28 ; jb,pt 2f30a <.literal16+0x6fa>
+ DB 62,114,28 ; jb,pt 2f2ba <.literal16+0x6aa>
DB 199 ; (bad)
DB 62,85 ; ds push %rbp
DB 85 ; push %rbp
@@ -46305,15 +46283,15 @@ ALIGN 16
DB 0,192 ; add %al,%al
DB 63 ; (bad)
DB 57,142,99,61,57,142 ; cmp %ecx,-0x71c6c29d(%rsi)
- DB 99,61,57,142,99,61 ; movslq 0x3d638e39(%rip),%edi # 3d668155 <_sk_srcover_bgra_8888_sse2_lowp+0x3d63a00d>
+ DB 99,61,57,142,99,61 ; movslq 0x3d638e39(%rip),%edi # 3d668105 <_sk_srcover_bgra_8888_sse2_lowp+0x3d639fbd>
DB 57,142,99,61,114,249 ; cmp %ecx,-0x68dc29d(%rsi)
- DB 127,63 ; jg 2f363 <.literal16+0x753>
- DB 114,249 ; jb 2f31f <.literal16+0x70f>
- DB 127,63 ; jg 2f367 <.literal16+0x757>
- DB 114,249 ; jb 2f323 <.literal16+0x713>
- DB 127,63 ; jg 2f36b <.literal16+0x75b>
- DB 114,249 ; jb 2f327 <.literal16+0x717>
- DB 127,63 ; jg 2f36f <.literal16+0x75f>
+ DB 127,63 ; jg 2f313 <.literal16+0x703>
+ DB 114,249 ; jb 2f2cf <.literal16+0x6bf>
+ DB 127,63 ; jg 2f317 <.literal16+0x707>
+ DB 114,249 ; jb 2f2d3 <.literal16+0x6c3>
+ DB 127,63 ; jg 2f31b <.literal16+0x70b>
+ DB 114,249 ; jb 2f2d7 <.literal16+0x6c7>
+ DB 127,63 ; jg 2f31f <.literal16+0x70f>
DB 3,0 ; add (%rax),%eax
DB 0,0 ; add %al,(%rax)
DB 3,0 ; add (%rax),%eax
@@ -46337,8 +46315,28 @@ ALIGN 16
DB 255 ; (bad)
DB 255 ; (bad)
DB 255 ; (bad)
- DB 255,0 ; incl (%rax)
- DB 0,255 ; add %bh,%bh
+ DB 255,45,16,17,192,45 ; ljmp *0x2dc01110(%rip) # 2dc30415 <_sk_srcover_bgra_8888_sse2_lowp+0x2dc022cd>
+ DB 16,17 ; adc %dl,(%rcx)
+ DB 192,45,16,17,192,45,16 ; shrb $0x10,0x2dc01110(%rip) # 2dc3041e <_sk_srcover_bgra_8888_sse2_lowp+0x2dc022d6>
+ DB 17,192 ; adc %eax,%eax
+ DB 18,120,57 ; adc 0x39(%rax),%bh
+ DB 64,18,120,57 ; adc 0x39(%rax),%dil
+ DB 64,18,120,57 ; adc 0x39(%rax),%dil
+ DB 64,18,120,57 ; adc 0x39(%rax),%dil
+ DB 64,32,148,90,62,32,148,90 ; and %dl,0x5a94203e(%rdx,%rbx,2)
+ DB 62,32,148,90,62,32,148,90 ; and %dl,%ds:0x5a94203e(%rdx,%rbx,2)
+ DB 62,4,157 ; ds add $0x9d,%al
+ DB 30 ; (bad)
+ DB 62,4,157 ; ds add $0x9d,%al
+ DB 30 ; (bad)
+ DB 62,4,157 ; ds add $0x9d,%al
+ DB 30 ; (bad)
+ DB 62,4,157 ; ds add $0x9d,%al
+ DB 30 ; (bad)
+ DB 62,0,24 ; add %bl,%ds:(%rax)
+ DB 161,57,0,24,161,57,0,24,161 ; movabs 0xa1180039a1180039,%eax
+ DB 57,0 ; cmp %eax,(%rax)
+ DB 24,161,57,0,0,255 ; sbb %ah,-0xffffc7(%rcx)
DB 255,0 ; incl (%rax)
DB 0,255 ; add %bh,%bh
DB 255,0 ; incl (%rax)
@@ -54810,35 +54808,6 @@ _sk_evenly_spaced_gradient_sse2 LABEL PROC
DB 93 ; pop %ebp
DB 195 ; ret
-PUBLIC _sk_gauss_a_to_rgba_sse2
-_sk_gauss_a_to_rgba_sse2 LABEL PROC
- DB 85 ; push %ebp
- DB 137,229 ; mov %esp,%ebp
- DB 131,236,8 ; sub $0x8,%esp
- DB 232,0,0,0,0 ; call 698e <_sk_gauss_a_to_rgba_sse2+0xb>
- DB 88 ; pop %eax
- DB 139,77,12 ; mov 0xc(%ebp),%ecx
- DB 15,40,128,242,121,0,0 ; movaps 0x79f2(%eax),%xmm0
- DB 15,89,195 ; mulps %xmm3,%xmm0
- DB 15,88,128,2,122,0,0 ; addps 0x7a02(%eax),%xmm0
- DB 15,89,195 ; mulps %xmm3,%xmm0
- DB 15,88,128,18,122,0,0 ; addps 0x7a12(%eax),%xmm0
- DB 15,89,195 ; mulps %xmm3,%xmm0
- DB 15,88,128,34,122,0,0 ; addps 0x7a22(%eax),%xmm0
- DB 15,89,195 ; mulps %xmm3,%xmm0
- DB 15,88,128,50,122,0,0 ; addps 0x7a32(%eax),%xmm0
- DB 141,65,4 ; lea 0x4(%ecx),%eax
- DB 131,236,8 ; sub $0x8,%esp
- DB 15,40,200 ; movaps %xmm0,%xmm1
- DB 15,40,208 ; movaps %xmm0,%xmm2
- DB 15,40,216 ; movaps %xmm0,%xmm3
- DB 80 ; push %eax
- DB 255,117,8 ; pushl 0x8(%ebp)
- DB 255,17 ; call *(%ecx)
- DB 131,196,24 ; add $0x18,%esp
- DB 93 ; pop %ebp
- DB 195 ; ret
-
PUBLIC _sk_gradient_sse2
_sk_gradient_sse2 LABEL PROC
DB 85 ; push %ebp
@@ -54852,7 +54821,7 @@ _sk_gradient_sse2 LABEL PROC
DB 139,10 ; mov (%edx),%ecx
DB 102,15,239,201 ; pxor %xmm1,%xmm1
DB 131,249,2 ; cmp $0x2,%ecx
- DB 114,33 ; jb 6a15 <_sk_gradient_sse2+0x3a>
+ DB 114,33 ; jb 69bd <_sk_gradient_sse2+0x3a>
DB 139,114,36 ; mov 0x24(%edx),%esi
DB 73 ; dec %ecx
DB 131,198,4 ; add $0x4,%esi
@@ -54863,7 +54832,7 @@ _sk_gradient_sse2 LABEL PROC
DB 102,15,250,202 ; psubd %xmm2,%xmm1
DB 131,198,4 ; add $0x4,%esi
DB 73 ; dec %ecx
- DB 117,234 ; jne 69ff <_sk_gradient_sse2+0x24>
+ DB 117,234 ; jne 69a7 <_sk_gradient_sse2+0x24>
DB 102,15,126,206 ; movd %xmm1,%esi
DB 102,15,112,209,229 ; pshufd $0xe5,%xmm1,%xmm2
DB 102,15,112,217,78 ; pshufd $0x4e,%xmm1,%xmm3
@@ -55012,7 +54981,7 @@ _sk_xy_to_unit_angle_sse2 LABEL PROC
DB 15,40,218 ; movaps %xmm2,%xmm3
DB 15,40,209 ; movaps %xmm1,%xmm2
DB 15,40,200 ; movaps %xmm0,%xmm1
- DB 232,0,0,0,0 ; call 6c1d <_sk_xy_to_unit_angle_sse2+0x18>
+ DB 232,0,0,0,0 ; call 6bc5 <_sk_xy_to_unit_angle_sse2+0x18>
DB 88 ; pop %eax
DB 15,87,237 ; xorps %xmm5,%xmm5
DB 15,92,233 ; subps %xmm1,%xmm5
@@ -55027,30 +54996,30 @@ _sk_xy_to_unit_angle_sse2 LABEL PROC
DB 15,94,247 ; divps %xmm7,%xmm6
DB 15,40,254 ; movaps %xmm6,%xmm7
DB 15,89,255 ; mulps %xmm7,%xmm7
- DB 15,40,128,179,119,0,0 ; movaps 0x77b3(%eax),%xmm0
+ DB 15,40,128,187,119,0,0 ; movaps 0x77bb(%eax),%xmm0
DB 15,89,199 ; mulps %xmm7,%xmm0
- DB 15,88,128,195,119,0,0 ; addps 0x77c3(%eax),%xmm0
+ DB 15,88,128,203,119,0,0 ; addps 0x77cb(%eax),%xmm0
DB 15,89,199 ; mulps %xmm7,%xmm0
- DB 15,88,128,211,119,0,0 ; addps 0x77d3(%eax),%xmm0
+ DB 15,88,128,219,119,0,0 ; addps 0x77db(%eax),%xmm0
DB 15,89,199 ; mulps %xmm7,%xmm0
- DB 15,88,128,227,119,0,0 ; addps 0x77e3(%eax),%xmm0
+ DB 15,88,128,235,119,0,0 ; addps 0x77eb(%eax),%xmm0
DB 15,89,198 ; mulps %xmm6,%xmm0
DB 15,194,236,1 ; cmpltps %xmm4,%xmm5
- DB 15,40,176,243,119,0,0 ; movaps 0x77f3(%eax),%xmm6
+ DB 15,40,176,251,119,0,0 ; movaps 0x77fb(%eax),%xmm6
DB 15,92,240 ; subps %xmm0,%xmm6
DB 15,84,245 ; andps %xmm5,%xmm6
DB 15,85,232 ; andnps %xmm0,%xmm5
DB 15,87,228 ; xorps %xmm4,%xmm4
DB 15,86,238 ; orps %xmm6,%xmm5
DB 15,194,204,1 ; cmpltps %xmm4,%xmm1
- DB 15,40,128,179,113,0,0 ; movaps 0x71b3(%eax),%xmm0
+ DB 15,40,128,11,114,0,0 ; movaps 0x720b(%eax),%xmm0
DB 15,92,197 ; subps %xmm5,%xmm0
DB 15,84,193 ; andps %xmm1,%xmm0
DB 15,85,205 ; andnps %xmm5,%xmm1
DB 15,86,200 ; orps %xmm0,%xmm1
DB 15,40,194 ; movaps %xmm2,%xmm0
DB 15,194,196,1 ; cmpltps %xmm4,%xmm0
- DB 15,40,168,195,113,0,0 ; movaps 0x71c3(%eax),%xmm5
+ DB 15,40,168,27,114,0,0 ; movaps 0x721b(%eax),%xmm5
DB 15,92,233 ; subps %xmm1,%xmm5
DB 15,84,232 ; andps %xmm0,%xmm5
DB 15,85,193 ; andnps %xmm1,%xmm0
@@ -55107,15 +55076,15 @@ _sk_xy_to_2pt_conical_quadratic_max_sse2 LABEL PROC
DB 15,40,241 ; movaps %xmm1,%xmm6
DB 15,89,246 ; mulps %xmm6,%xmm6
DB 15,88,240 ; addps %xmm0,%xmm6
- DB 232,0,0,0,0 ; call 6d3a <_sk_xy_to_2pt_conical_quadratic_max_sse2+0x31>
+ DB 232,0,0,0,0 ; call 6ce2 <_sk_xy_to_2pt_conical_quadratic_max_sse2+0x31>
DB 90 ; pop %edx
DB 243,15,89,237 ; mulss %xmm5,%xmm5
DB 15,198,237,0 ; shufps $0x0,%xmm5,%xmm5
DB 15,92,245 ; subps %xmm5,%xmm6
DB 243,15,16,65,64 ; movss 0x40(%ecx),%xmm0
DB 15,198,192,0 ; shufps $0x0,%xmm0,%xmm0
- DB 15,89,162,230,118,0,0 ; mulps 0x76e6(%edx),%xmm4
- DB 15,89,130,246,118,0,0 ; mulps 0x76f6(%edx),%xmm0
+ DB 15,89,162,238,118,0,0 ; mulps 0x76ee(%edx),%xmm4
+ DB 15,89,130,254,118,0,0 ; mulps 0x76fe(%edx),%xmm0
DB 15,89,198 ; mulps %xmm6,%xmm0
DB 15,40,236 ; movaps %xmm4,%xmm5
DB 15,89,237 ; mulps %xmm5,%xmm5
@@ -55123,11 +55092,11 @@ _sk_xy_to_2pt_conical_quadratic_max_sse2 LABEL PROC
DB 15,81,237 ; sqrtps %xmm5,%xmm5
DB 15,40,197 ; movaps %xmm5,%xmm0
DB 15,92,196 ; subps %xmm4,%xmm0
- DB 15,87,162,150,117,0,0 ; xorps 0x7596(%edx),%xmm4
+ DB 15,87,162,238,117,0,0 ; xorps 0x75ee(%edx),%xmm4
DB 15,92,229 ; subps %xmm5,%xmm4
DB 243,15,16,105,68 ; movss 0x44(%ecx),%xmm5
DB 15,198,237,0 ; shufps $0x0,%xmm5,%xmm5
- DB 15,89,170,150,112,0,0 ; mulps 0x7096(%edx),%xmm5
+ DB 15,89,170,238,112,0,0 ; mulps 0x70ee(%edx),%xmm5
DB 15,89,197 ; mulps %xmm5,%xmm0
DB 15,89,229 ; mulps %xmm5,%xmm4
DB 15,95,196 ; maxps %xmm4,%xmm0
@@ -55156,15 +55125,15 @@ _sk_xy_to_2pt_conical_quadratic_min_sse2 LABEL PROC
DB 15,40,241 ; movaps %xmm1,%xmm6
DB 15,89,246 ; mulps %xmm6,%xmm6
DB 15,88,240 ; addps %xmm0,%xmm6
- DB 232,0,0,0,0 ; call 6dd8 <_sk_xy_to_2pt_conical_quadratic_min_sse2+0x31>
+ DB 232,0,0,0,0 ; call 6d80 <_sk_xy_to_2pt_conical_quadratic_min_sse2+0x31>
DB 90 ; pop %edx
DB 243,15,89,237 ; mulss %xmm5,%xmm5
DB 15,198,237,0 ; shufps $0x0,%xmm5,%xmm5
DB 15,92,245 ; subps %xmm5,%xmm6
DB 243,15,16,65,64 ; movss 0x40(%ecx),%xmm0
DB 15,198,192,0 ; shufps $0x0,%xmm0,%xmm0
- DB 15,89,162,72,118,0,0 ; mulps 0x7648(%edx),%xmm4
- DB 15,89,130,88,118,0,0 ; mulps 0x7658(%edx),%xmm0
+ DB 15,89,162,80,118,0,0 ; mulps 0x7650(%edx),%xmm4
+ DB 15,89,130,96,118,0,0 ; mulps 0x7660(%edx),%xmm0
DB 15,89,198 ; mulps %xmm6,%xmm0
DB 15,40,236 ; movaps %xmm4,%xmm5
DB 15,89,237 ; mulps %xmm5,%xmm5
@@ -55172,11 +55141,11 @@ _sk_xy_to_2pt_conical_quadratic_min_sse2 LABEL PROC
DB 15,81,237 ; sqrtps %xmm5,%xmm5
DB 15,40,197 ; movaps %xmm5,%xmm0
DB 15,92,196 ; subps %xmm4,%xmm0
- DB 15,87,162,248,116,0,0 ; xorps 0x74f8(%edx),%xmm4
+ DB 15,87,162,80,117,0,0 ; xorps 0x7550(%edx),%xmm4
DB 15,92,229 ; subps %xmm5,%xmm4
DB 243,15,16,105,68 ; movss 0x44(%ecx),%xmm5
DB 15,198,237,0 ; shufps $0x0,%xmm5,%xmm5
- DB 15,89,170,248,111,0,0 ; mulps 0x6ff8(%edx),%xmm5
+ DB 15,89,170,80,112,0,0 ; mulps 0x7050(%edx),%xmm5
DB 15,89,197 ; mulps %xmm5,%xmm0
DB 15,89,229 ; mulps %xmm5,%xmm4
DB 15,93,196 ; minps %xmm4,%xmm0
@@ -55194,7 +55163,7 @@ _sk_xy_to_2pt_conical_linear_sse2 LABEL PROC
DB 85 ; push %ebp
DB 137,229 ; mov %esp,%ebp
DB 131,236,8 ; sub $0x8,%esp
- DB 232,0,0,0,0 ; call 6e50 <_sk_xy_to_2pt_conical_linear_sse2+0xb>
+ DB 232,0,0,0,0 ; call 6df8 <_sk_xy_to_2pt_conical_linear_sse2+0xb>
DB 89 ; pop %ecx
DB 139,69,12 ; mov 0xc(%ebp),%eax
DB 139,16 ; mov (%eax),%edx
@@ -55203,7 +55172,7 @@ _sk_xy_to_2pt_conical_linear_sse2 LABEL PROC
DB 243,15,89,236 ; mulss %xmm4,%xmm5
DB 15,198,237,0 ; shufps $0x0,%xmm5,%xmm5
DB 15,88,232 ; addps %xmm0,%xmm5
- DB 15,89,169,208,117,0,0 ; mulps 0x75d0(%ecx),%xmm5
+ DB 15,89,169,216,117,0,0 ; mulps 0x75d8(%ecx),%xmm5
DB 15,89,192 ; mulps %xmm0,%xmm0
DB 15,40,241 ; movaps %xmm1,%xmm6
DB 15,89,246 ; mulps %xmm6,%xmm6
@@ -55211,7 +55180,7 @@ _sk_xy_to_2pt_conical_linear_sse2 LABEL PROC
DB 243,15,89,228 ; mulss %xmm4,%xmm4
DB 15,198,228,0 ; shufps $0x0,%xmm4,%xmm4
DB 15,92,196 ; subps %xmm4,%xmm0
- DB 15,87,129,128,116,0,0 ; xorps 0x7480(%ecx),%xmm0
+ DB 15,87,129,216,116,0,0 ; xorps 0x74d8(%ecx),%xmm0
DB 15,94,197 ; divps %xmm5,%xmm0
DB 141,72,8 ; lea 0x8(%eax),%ecx
DB 131,236,8 ; sub $0x8,%esp
@@ -55282,16 +55251,16 @@ _sk_save_xy_sse2 LABEL PROC
DB 131,236,24 ; sub $0x18,%esp
DB 15,41,93,232 ; movaps %xmm3,-0x18(%ebp)
DB 15,40,218 ; movaps %xmm2,%xmm3
- DB 232,0,0,0,0 ; call 6f39 <_sk_save_xy_sse2+0x12>
+ DB 232,0,0,0,0 ; call 6ee1 <_sk_save_xy_sse2+0x12>
DB 88 ; pop %eax
- DB 15,40,160,151,110,0,0 ; movaps 0x6e97(%eax),%xmm4
+ DB 15,40,160,239,110,0,0 ; movaps 0x6eef(%eax),%xmm4
DB 15,40,232 ; movaps %xmm0,%xmm5
DB 15,88,236 ; addps %xmm4,%xmm5
DB 243,15,91,245 ; cvttps2dq %xmm5,%xmm6
DB 15,91,246 ; cvtdq2ps %xmm6,%xmm6
DB 15,40,253 ; movaps %xmm5,%xmm7
DB 15,194,254,1 ; cmpltps %xmm6,%xmm7
- DB 15,40,144,167,110,0,0 ; movaps 0x6ea7(%eax),%xmm2
+ DB 15,40,144,255,110,0,0 ; movaps 0x6eff(%eax),%xmm2
DB 15,84,250 ; andps %xmm2,%xmm7
DB 15,92,247 ; subps %xmm7,%xmm6
DB 15,92,238 ; subps %xmm6,%xmm5
@@ -55362,15 +55331,15 @@ _sk_bilinear_nx_sse2 LABEL PROC
DB 137,229 ; mov %esp,%ebp
DB 86 ; push %esi
DB 80 ; push %eax
- DB 232,0,0,0,0 ; call 7021 <_sk_bilinear_nx_sse2+0xa>
+ DB 232,0,0,0,0 ; call 6fc9 <_sk_bilinear_nx_sse2+0xa>
DB 88 ; pop %eax
DB 139,77,8 ; mov 0x8(%ebp),%ecx
DB 139,85,12 ; mov 0xc(%ebp),%edx
DB 139,50 ; mov (%edx),%esi
DB 15,16,6 ; movups (%esi),%xmm0
DB 15,16,166,128,0,0,0 ; movups 0x80(%esi),%xmm4
- DB 15,88,128,31,116,0,0 ; addps 0x741f(%eax),%xmm0
- DB 15,40,168,191,109,0,0 ; movaps 0x6dbf(%eax),%xmm5
+ DB 15,88,128,39,116,0,0 ; addps 0x7427(%eax),%xmm0
+ DB 15,40,168,23,110,0,0 ; movaps 0x6e17(%eax),%xmm5
DB 15,92,236 ; subps %xmm4,%xmm5
DB 15,17,174,0,1,0,0 ; movups %xmm5,0x100(%esi)
DB 141,66,8 ; lea 0x8(%edx),%eax
@@ -55389,14 +55358,14 @@ _sk_bilinear_px_sse2 LABEL PROC
DB 137,229 ; mov %esp,%ebp
DB 86 ; push %esi
DB 80 ; push %eax
- DB 232,0,0,0,0 ; call 7067 <_sk_bilinear_px_sse2+0xa>
+ DB 232,0,0,0,0 ; call 700f <_sk_bilinear_px_sse2+0xa>
DB 88 ; pop %eax
DB 139,77,8 ; mov 0x8(%ebp),%ecx
DB 139,85,12 ; mov 0xc(%ebp),%edx
DB 139,50 ; mov (%edx),%esi
DB 15,16,6 ; movups (%esi),%xmm0
DB 15,16,166,128,0,0,0 ; movups 0x80(%esi),%xmm4
- DB 15,88,128,105,109,0,0 ; addps 0x6d69(%eax),%xmm0
+ DB 15,88,128,193,109,0,0 ; addps 0x6dc1(%eax),%xmm0
DB 15,17,166,0,1,0,0 ; movups %xmm4,0x100(%esi)
DB 141,66,8 ; lea 0x8(%edx),%eax
DB 131,236,8 ; sub $0x8,%esp
@@ -55414,15 +55383,15 @@ _sk_bilinear_ny_sse2 LABEL PROC
DB 137,229 ; mov %esp,%ebp
DB 86 ; push %esi
DB 80 ; push %eax
- DB 232,0,0,0,0 ; call 70a3 <_sk_bilinear_ny_sse2+0xa>
+ DB 232,0,0,0,0 ; call 704b <_sk_bilinear_ny_sse2+0xa>
DB 88 ; pop %eax
DB 139,77,8 ; mov 0x8(%ebp),%ecx
DB 139,85,12 ; mov 0xc(%ebp),%edx
DB 139,50 ; mov (%edx),%esi
DB 15,16,78,64 ; movups 0x40(%esi),%xmm1
DB 15,16,166,192,0,0,0 ; movups 0xc0(%esi),%xmm4
- DB 15,88,136,157,115,0,0 ; addps 0x739d(%eax),%xmm1
- DB 15,40,168,61,109,0,0 ; movaps 0x6d3d(%eax),%xmm5
+ DB 15,88,136,165,115,0,0 ; addps 0x73a5(%eax),%xmm1
+ DB 15,40,168,149,109,0,0 ; movaps 0x6d95(%eax),%xmm5
DB 15,92,236 ; subps %xmm4,%xmm5
DB 15,17,174,64,1,0,0 ; movups %xmm5,0x140(%esi)
DB 141,66,8 ; lea 0x8(%edx),%eax
@@ -55441,14 +55410,14 @@ _sk_bilinear_py_sse2 LABEL PROC
DB 137,229 ; mov %esp,%ebp
DB 86 ; push %esi
DB 80 ; push %eax
- DB 232,0,0,0,0 ; call 70ea <_sk_bilinear_py_sse2+0xa>
+ DB 232,0,0,0,0 ; call 7092 <_sk_bilinear_py_sse2+0xa>
DB 88 ; pop %eax
DB 139,77,8 ; mov 0x8(%ebp),%ecx
DB 139,85,12 ; mov 0xc(%ebp),%edx
DB 139,50 ; mov (%edx),%esi
DB 15,16,78,64 ; movups 0x40(%esi),%xmm1
DB 15,16,166,192,0,0,0 ; movups 0xc0(%esi),%xmm4
- DB 15,88,136,230,108,0,0 ; addps 0x6ce6(%eax),%xmm1
+ DB 15,88,136,62,109,0,0 ; addps 0x6d3e(%eax),%xmm1
DB 15,17,166,64,1,0,0 ; movups %xmm4,0x140(%esi)
DB 141,66,8 ; lea 0x8(%edx),%eax
DB 131,236,8 ; sub $0x8,%esp
@@ -55466,20 +55435,20 @@ _sk_bicubic_n3x_sse2 LABEL PROC
DB 137,229 ; mov %esp,%ebp
DB 86 ; push %esi
DB 80 ; push %eax
- DB 232,0,0,0,0 ; call 7127 <_sk_bicubic_n3x_sse2+0xa>
+ DB 232,0,0,0,0 ; call 70cf <_sk_bicubic_n3x_sse2+0xa>
DB 88 ; pop %eax
DB 139,77,8 ; mov 0x8(%ebp),%ecx
DB 139,85,12 ; mov 0xc(%ebp),%edx
DB 139,50 ; mov (%edx),%esi
DB 15,16,6 ; movups (%esi),%xmm0
DB 15,16,166,128,0,0,0 ; movups 0x80(%esi),%xmm4
- DB 15,88,128,41,115,0,0 ; addps 0x7329(%eax),%xmm0
- DB 15,40,168,185,108,0,0 ; movaps 0x6cb9(%eax),%xmm5
+ DB 15,88,128,49,115,0,0 ; addps 0x7331(%eax),%xmm0
+ DB 15,40,168,17,109,0,0 ; movaps 0x6d11(%eax),%xmm5
DB 15,92,236 ; subps %xmm4,%xmm5
DB 15,40,229 ; movaps %xmm5,%xmm4
DB 15,89,228 ; mulps %xmm4,%xmm4
- DB 15,89,168,57,115,0,0 ; mulps 0x7339(%eax),%xmm5
- DB 15,88,168,169,110,0,0 ; addps 0x6ea9(%eax),%xmm5
+ DB 15,89,168,65,115,0,0 ; mulps 0x7341(%eax),%xmm5
+ DB 15,88,168,1,111,0,0 ; addps 0x6f01(%eax),%xmm5
DB 15,89,236 ; mulps %xmm4,%xmm5
DB 15,17,174,0,1,0,0 ; movups %xmm5,0x100(%esi)
DB 141,66,8 ; lea 0x8(%edx),%eax
@@ -55498,23 +55467,23 @@ _sk_bicubic_n1x_sse2 LABEL PROC
DB 137,229 ; mov %esp,%ebp
DB 86 ; push %esi
DB 80 ; push %eax
- DB 232,0,0,0,0 ; call 7184 <_sk_bicubic_n1x_sse2+0xa>
+ DB 232,0,0,0,0 ; call 712c <_sk_bicubic_n1x_sse2+0xa>
DB 88 ; pop %eax
DB 139,77,8 ; mov 0x8(%ebp),%ecx
DB 139,85,12 ; mov 0xc(%ebp),%edx
DB 139,50 ; mov (%edx),%esi
DB 15,16,6 ; movups (%esi),%xmm0
DB 15,16,166,128,0,0,0 ; movups 0x80(%esi),%xmm4
- DB 15,88,128,188,114,0,0 ; addps 0x72bc(%eax),%xmm0
- DB 15,40,168,92,108,0,0 ; movaps 0x6c5c(%eax),%xmm5
+ DB 15,88,128,196,114,0,0 ; addps 0x72c4(%eax),%xmm0
+ DB 15,40,168,180,108,0,0 ; movaps 0x6cb4(%eax),%xmm5
DB 15,92,236 ; subps %xmm4,%xmm5
- DB 15,40,160,236,114,0,0 ; movaps 0x72ec(%eax),%xmm4
+ DB 15,40,160,244,114,0,0 ; movaps 0x72f4(%eax),%xmm4
DB 15,89,229 ; mulps %xmm5,%xmm4
- DB 15,88,160,252,114,0,0 ; addps 0x72fc(%eax),%xmm4
+ DB 15,88,160,4,115,0,0 ; addps 0x7304(%eax),%xmm4
DB 15,89,229 ; mulps %xmm5,%xmm4
- DB 15,88,160,76,108,0,0 ; addps 0x6c4c(%eax),%xmm4
+ DB 15,88,160,164,108,0,0 ; addps 0x6ca4(%eax),%xmm4
DB 15,89,229 ; mulps %xmm5,%xmm4
- DB 15,88,160,12,115,0,0 ; addps 0x730c(%eax),%xmm4
+ DB 15,88,160,20,115,0,0 ; addps 0x7314(%eax),%xmm4
DB 15,17,166,0,1,0,0 ; movups %xmm4,0x100(%esi)
DB 141,66,8 ; lea 0x8(%edx),%eax
DB 131,236,8 ; sub $0x8,%esp
@@ -55532,22 +55501,22 @@ _sk_bicubic_p1x_sse2 LABEL PROC
DB 137,229 ; mov %esp,%ebp
DB 86 ; push %esi
DB 80 ; push %eax
- DB 232,0,0,0,0 ; call 71ef <_sk_bicubic_p1x_sse2+0xa>
+ DB 232,0,0,0,0 ; call 7197 <_sk_bicubic_p1x_sse2+0xa>
DB 88 ; pop %eax
DB 139,77,8 ; mov 0x8(%ebp),%ecx
DB 139,85,12 ; mov 0xc(%ebp),%edx
DB 139,50 ; mov (%edx),%esi
- DB 15,40,160,225,107,0,0 ; movaps 0x6be1(%eax),%xmm4
+ DB 15,40,160,57,108,0,0 ; movaps 0x6c39(%eax),%xmm4
DB 15,16,6 ; movups (%esi),%xmm0
DB 15,16,174,128,0,0,0 ; movups 0x80(%esi),%xmm5
DB 15,88,196 ; addps %xmm4,%xmm0
- DB 15,40,176,129,114,0,0 ; movaps 0x7281(%eax),%xmm6
+ DB 15,40,176,137,114,0,0 ; movaps 0x7289(%eax),%xmm6
DB 15,89,245 ; mulps %xmm5,%xmm6
- DB 15,88,176,145,114,0,0 ; addps 0x7291(%eax),%xmm6
+ DB 15,88,176,153,114,0,0 ; addps 0x7299(%eax),%xmm6
DB 15,89,245 ; mulps %xmm5,%xmm6
DB 15,88,244 ; addps %xmm4,%xmm6
DB 15,89,245 ; mulps %xmm5,%xmm6
- DB 15,88,176,161,114,0,0 ; addps 0x72a1(%eax),%xmm6
+ DB 15,88,176,169,114,0,0 ; addps 0x72a9(%eax),%xmm6
DB 15,17,182,0,1,0,0 ; movups %xmm6,0x100(%esi)
DB 141,66,8 ; lea 0x8(%edx),%eax
DB 131,236,8 ; sub $0x8,%esp
@@ -55565,18 +55534,18 @@ _sk_bicubic_p3x_sse2 LABEL PROC
DB 137,229 ; mov %esp,%ebp
DB 86 ; push %esi
DB 80 ; push %eax
- DB 232,0,0,0,0 ; call 724f <_sk_bicubic_p3x_sse2+0xa>
+ DB 232,0,0,0,0 ; call 71f7 <_sk_bicubic_p3x_sse2+0xa>
DB 88 ; pop %eax
DB 139,77,8 ; mov 0x8(%ebp),%ecx
DB 139,85,12 ; mov 0xc(%ebp),%edx
DB 139,50 ; mov (%edx),%esi
DB 15,16,6 ; movups (%esi),%xmm0
DB 15,16,166,128,0,0,0 ; movups 0x80(%esi),%xmm4
- DB 15,88,128,49,114,0,0 ; addps 0x7231(%eax),%xmm0
+ DB 15,88,128,57,114,0,0 ; addps 0x7239(%eax),%xmm0
DB 15,40,236 ; movaps %xmm4,%xmm5
DB 15,89,237 ; mulps %xmm5,%xmm5
- DB 15,89,160,17,114,0,0 ; mulps 0x7211(%eax),%xmm4
- DB 15,88,160,129,109,0,0 ; addps 0x6d81(%eax),%xmm4
+ DB 15,89,160,25,114,0,0 ; mulps 0x7219(%eax),%xmm4
+ DB 15,88,160,217,109,0,0 ; addps 0x6dd9(%eax),%xmm4
DB 15,89,229 ; mulps %xmm5,%xmm4
DB 15,17,166,0,1,0,0 ; movups %xmm4,0x100(%esi)
DB 141,66,8 ; lea 0x8(%edx),%eax
@@ -55595,20 +55564,20 @@ _sk_bicubic_n3y_sse2 LABEL PROC
DB 137,229 ; mov %esp,%ebp
DB 86 ; push %esi
DB 80 ; push %eax
- DB 232,0,0,0,0 ; call 72a2 <_sk_bicubic_n3y_sse2+0xa>
+ DB 232,0,0,0,0 ; call 724a <_sk_bicubic_n3y_sse2+0xa>
DB 88 ; pop %eax
DB 139,77,8 ; mov 0x8(%ebp),%ecx
DB 139,85,12 ; mov 0xc(%ebp),%edx
DB 139,50 ; mov (%edx),%esi
DB 15,16,78,64 ; movups 0x40(%esi),%xmm1
DB 15,16,166,192,0,0,0 ; movups 0xc0(%esi),%xmm4
- DB 15,88,136,174,113,0,0 ; addps 0x71ae(%eax),%xmm1
- DB 15,40,168,62,107,0,0 ; movaps 0x6b3e(%eax),%xmm5
+ DB 15,88,136,182,113,0,0 ; addps 0x71b6(%eax),%xmm1
+ DB 15,40,168,150,107,0,0 ; movaps 0x6b96(%eax),%xmm5
DB 15,92,236 ; subps %xmm4,%xmm5
DB 15,40,229 ; movaps %xmm5,%xmm4
DB 15,89,228 ; mulps %xmm4,%xmm4
- DB 15,89,168,190,113,0,0 ; mulps 0x71be(%eax),%xmm5
- DB 15,88,168,46,109,0,0 ; addps 0x6d2e(%eax),%xmm5
+ DB 15,89,168,198,113,0,0 ; mulps 0x71c6(%eax),%xmm5
+ DB 15,88,168,134,109,0,0 ; addps 0x6d86(%eax),%xmm5
DB 15,89,236 ; mulps %xmm4,%xmm5
DB 15,17,174,64,1,0,0 ; movups %xmm5,0x140(%esi)
DB 141,66,8 ; lea 0x8(%edx),%eax
@@ -55627,23 +55596,23 @@ _sk_bicubic_n1y_sse2 LABEL PROC
DB 137,229 ; mov %esp,%ebp
DB 86 ; push %esi
DB 80 ; push %eax
- DB 232,0,0,0,0 ; call 7300 <_sk_bicubic_n1y_sse2+0xa>
+ DB 232,0,0,0,0 ; call 72a8 <_sk_bicubic_n1y_sse2+0xa>
DB 88 ; pop %eax
DB 139,77,8 ; mov 0x8(%ebp),%ecx
DB 139,85,12 ; mov 0xc(%ebp),%edx
DB 139,50 ; mov (%edx),%esi
DB 15,16,78,64 ; movups 0x40(%esi),%xmm1
DB 15,16,166,192,0,0,0 ; movups 0xc0(%esi),%xmm4
- DB 15,88,136,64,113,0,0 ; addps 0x7140(%eax),%xmm1
- DB 15,40,168,224,106,0,0 ; movaps 0x6ae0(%eax),%xmm5
+ DB 15,88,136,72,113,0,0 ; addps 0x7148(%eax),%xmm1
+ DB 15,40,168,56,107,0,0 ; movaps 0x6b38(%eax),%xmm5
DB 15,92,236 ; subps %xmm4,%xmm5
- DB 15,40,160,112,113,0,0 ; movaps 0x7170(%eax),%xmm4
+ DB 15,40,160,120,113,0,0 ; movaps 0x7178(%eax),%xmm4
DB 15,89,229 ; mulps %xmm5,%xmm4
- DB 15,88,160,128,113,0,0 ; addps 0x7180(%eax),%xmm4
+ DB 15,88,160,136,113,0,0 ; addps 0x7188(%eax),%xmm4
DB 15,89,229 ; mulps %xmm5,%xmm4
- DB 15,88,160,208,106,0,0 ; addps 0x6ad0(%eax),%xmm4
+ DB 15,88,160,40,107,0,0 ; addps 0x6b28(%eax),%xmm4
DB 15,89,229 ; mulps %xmm5,%xmm4
- DB 15,88,160,144,113,0,0 ; addps 0x7190(%eax),%xmm4
+ DB 15,88,160,152,113,0,0 ; addps 0x7198(%eax),%xmm4
DB 15,17,166,64,1,0,0 ; movups %xmm4,0x140(%esi)
DB 141,66,8 ; lea 0x8(%edx),%eax
DB 131,236,8 ; sub $0x8,%esp
@@ -55661,22 +55630,22 @@ _sk_bicubic_p1y_sse2 LABEL PROC
DB 137,229 ; mov %esp,%ebp
DB 86 ; push %esi
DB 80 ; push %eax
- DB 232,0,0,0,0 ; call 736c <_sk_bicubic_p1y_sse2+0xa>
+ DB 232,0,0,0,0 ; call 7314 <_sk_bicubic_p1y_sse2+0xa>
DB 88 ; pop %eax
DB 139,77,8 ; mov 0x8(%ebp),%ecx
DB 139,85,12 ; mov 0xc(%ebp),%edx
DB 139,50 ; mov (%edx),%esi
- DB 15,40,160,100,106,0,0 ; movaps 0x6a64(%eax),%xmm4
+ DB 15,40,160,188,106,0,0 ; movaps 0x6abc(%eax),%xmm4
DB 15,16,78,64 ; movups 0x40(%esi),%xmm1
DB 15,16,174,192,0,0,0 ; movups 0xc0(%esi),%xmm5
DB 15,88,204 ; addps %xmm4,%xmm1
- DB 15,40,176,4,113,0,0 ; movaps 0x7104(%eax),%xmm6
+ DB 15,40,176,12,113,0,0 ; movaps 0x710c(%eax),%xmm6
DB 15,89,245 ; mulps %xmm5,%xmm6
- DB 15,88,176,20,113,0,0 ; addps 0x7114(%eax),%xmm6
+ DB 15,88,176,28,113,0,0 ; addps 0x711c(%eax),%xmm6
DB 15,89,245 ; mulps %xmm5,%xmm6
DB 15,88,244 ; addps %xmm4,%xmm6
DB 15,89,245 ; mulps %xmm5,%xmm6
- DB 15,88,176,36,113,0,0 ; addps 0x7124(%eax),%xmm6
+ DB 15,88,176,44,113,0,0 ; addps 0x712c(%eax),%xmm6
DB 15,17,182,64,1,0,0 ; movups %xmm6,0x140(%esi)
DB 141,66,8 ; lea 0x8(%edx),%eax
DB 131,236,8 ; sub $0x8,%esp
@@ -55694,18 +55663,18 @@ _sk_bicubic_p3y_sse2 LABEL PROC
DB 137,229 ; mov %esp,%ebp
DB 86 ; push %esi
DB 80 ; push %eax
- DB 232,0,0,0,0 ; call 73cd <_sk_bicubic_p3y_sse2+0xa>
+ DB 232,0,0,0,0 ; call 7375 <_sk_bicubic_p3y_sse2+0xa>
DB 88 ; pop %eax
DB 139,77,8 ; mov 0x8(%ebp),%ecx
DB 139,85,12 ; mov 0xc(%ebp),%edx
DB 139,50 ; mov (%edx),%esi
DB 15,16,78,64 ; movups 0x40(%esi),%xmm1
DB 15,16,166,192,0,0,0 ; movups 0xc0(%esi),%xmm4
- DB 15,88,136,179,112,0,0 ; addps 0x70b3(%eax),%xmm1
+ DB 15,88,136,187,112,0,0 ; addps 0x70bb(%eax),%xmm1
DB 15,40,236 ; movaps %xmm4,%xmm5
DB 15,89,237 ; mulps %xmm5,%xmm5
- DB 15,89,160,147,112,0,0 ; mulps 0x7093(%eax),%xmm4
- DB 15,88,160,3,108,0,0 ; addps 0x6c03(%eax),%xmm4
+ DB 15,89,160,155,112,0,0 ; mulps 0x709b(%eax),%xmm4
+ DB 15,88,160,91,108,0,0 ; addps 0x6c5b(%eax),%xmm4
DB 15,89,229 ; mulps %xmm5,%xmm4
DB 15,17,166,64,1,0,0 ; movups %xmm4,0x140(%esi)
DB 141,66,8 ; lea 0x8(%edx),%eax
@@ -55844,7 +55813,7 @@ _sk_clut_3D_sse2 LABEL PROC
DB 102,15,112,192,232 ; pshufd $0xe8,%xmm0,%xmm0
DB 102,15,98,200 ; punpckldq %xmm0,%xmm1
DB 102,15,127,77,136 ; movdqa %xmm1,-0x78(%ebp)
- DB 232,0,0,0,0 ; call 75b3 <_sk_clut_3D_sse2+0xee>
+ DB 232,0,0,0,0 ; call 755b <_sk_clut_3D_sse2+0xee>
DB 90 ; pop %edx
DB 243,15,91,196 ; cvttps2dq %xmm4,%xmm0
DB 102,15,127,133,8,255,255,255 ; movdqa %xmm0,-0xf8(%ebp)
@@ -55852,7 +55821,7 @@ _sk_clut_3D_sse2 LABEL PROC
DB 102,15,254,216 ; paddd %xmm0,%xmm3
DB 102,15,111,193 ; movdqa %xmm1,%xmm0
DB 102,15,254,195 ; paddd %xmm3,%xmm0
- DB 102,15,111,162,253,110,0,0 ; movdqa 0x6efd(%edx),%xmm4
+ DB 102,15,111,162,5,111,0,0 ; movdqa 0x6f05(%edx),%xmm4
DB 102,15,127,165,120,255,255,255 ; movdqa %xmm4,-0x88(%ebp)
DB 102,15,112,200,245 ; pshufd $0xf5,%xmm0,%xmm1
DB 102,15,244,196 ; pmuludq %xmm4,%xmm0
@@ -55892,7 +55861,7 @@ _sk_clut_3D_sse2 LABEL PROC
DB 243,15,16,4,129 ; movss (%ecx,%eax,4),%xmm0
DB 15,20,248 ; unpcklps %xmm0,%xmm7
DB 102,15,20,252 ; unpcklpd %xmm4,%xmm7
- DB 102,15,111,130,109,104,0,0 ; movdqa 0x686d(%edx),%xmm0
+ DB 102,15,111,130,197,104,0,0 ; movdqa 0x68c5(%edx),%xmm0
DB 102,15,127,133,104,255,255,255 ; movdqa %xmm0,-0x98(%ebp)
DB 102,15,254,200 ; paddd %xmm0,%xmm1
DB 102,15,112,193,229 ; pshufd $0xe5,%xmm1,%xmm0
@@ -55909,7 +55878,7 @@ _sk_clut_3D_sse2 LABEL PROC
DB 243,15,16,4,129 ; movss (%ecx,%eax,4),%xmm0
DB 15,20,240 ; unpcklps %xmm0,%xmm6
DB 102,15,20,241 ; unpcklpd %xmm1,%xmm6
- DB 15,40,130,237,110,0,0 ; movaps 0x6eed(%edx),%xmm0
+ DB 15,40,130,245,110,0,0 ; movaps 0x6ef5(%edx),%xmm0
DB 15,40,141,248,254,255,255 ; movaps -0x108(%ebp),%xmm1
DB 15,88,200 ; addps %xmm0,%xmm1
DB 15,41,77,200 ; movaps %xmm1,-0x38(%ebp)
@@ -56527,7 +56496,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 102,15,112,201,232 ; pshufd $0xe8,%xmm1,%xmm1
DB 102,15,98,217 ; punpckldq %xmm1,%xmm3
DB 102,15,127,93,152 ; movdqa %xmm3,-0x68(%ebp)
- DB 232,0,0,0,0 ; call 813f <_sk_clut_4D_sse2+0x165>
+ DB 232,0,0,0,0 ; call 80e7 <_sk_clut_4D_sse2+0x165>
DB 89 ; pop %ecx
DB 15,40,197 ; movaps %xmm5,%xmm0
DB 15,41,133,168,254,255,255 ; movaps %xmm0,-0x158(%ebp)
@@ -56538,7 +56507,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 102,15,111,212 ; movdqa %xmm4,%xmm2
DB 102,15,254,214 ; paddd %xmm6,%xmm2
DB 102,15,254,218 ; paddd %xmm2,%xmm3
- DB 102,15,111,161,113,99,0,0 ; movdqa 0x6371(%ecx),%xmm4
+ DB 102,15,111,161,121,99,0,0 ; movdqa 0x6379(%ecx),%xmm4
DB 102,15,112,203,245 ; pshufd $0xf5,%xmm3,%xmm1
DB 102,15,244,220 ; pmuludq %xmm4,%xmm3
DB 102,15,244,204 ; pmuludq %xmm4,%xmm1
@@ -56580,7 +56549,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 15,20,223 ; unpcklps %xmm7,%xmm3
DB 102,15,20,222 ; unpcklpd %xmm6,%xmm3
DB 102,15,41,157,232,254,255,255 ; movapd %xmm3,-0x118(%ebp)
- DB 102,15,254,137,225,92,0,0 ; paddd 0x5ce1(%ecx),%xmm1
+ DB 102,15,254,137,57,93,0,0 ; paddd 0x5d39(%ecx),%xmm1
DB 102,15,112,241,229 ; pshufd $0xe5,%xmm1,%xmm6
DB 102,15,126,240 ; movd %xmm6,%eax
DB 102,15,112,241,78 ; pshufd $0x4e,%xmm1,%xmm6
@@ -56595,7 +56564,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 243,15,16,60,130 ; movss (%edx,%eax,4),%xmm7
DB 15,20,223 ; unpcklps %xmm7,%xmm3
DB 102,15,20,222 ; unpcklpd %xmm6,%xmm3
- DB 15,40,185,97,99,0,0 ; movaps 0x6361(%ecx),%xmm7
+ DB 15,40,185,105,99,0,0 ; movaps 0x6369(%ecx),%xmm7
DB 15,88,199 ; addps %xmm7,%xmm0
DB 15,41,133,120,255,255,255 ; movaps %xmm0,-0x88(%ebp)
DB 15,40,133,248,254,255,255 ; movaps -0x108(%ebp),%xmm0
@@ -56616,7 +56585,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 102,15,127,101,168 ; movdqa %xmm4,-0x58(%ebp)
DB 102,15,254,212 ; paddd %xmm4,%xmm2
DB 102,15,112,194,245 ; pshufd $0xf5,%xmm2,%xmm0
- DB 102,15,111,161,113,99,0,0 ; movdqa 0x6371(%ecx),%xmm4
+ DB 102,15,111,161,121,99,0,0 ; movdqa 0x6379(%ecx),%xmm4
DB 102,15,244,212 ; pmuludq %xmm4,%xmm2
DB 102,15,244,196 ; pmuludq %xmm4,%xmm0
DB 102,15,112,240,232 ; pshufd $0xe8,%xmm0,%xmm6
@@ -56652,7 +56621,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 243,15,16,44,130 ; movss (%edx,%eax,4),%xmm5
DB 15,20,213 ; unpcklps %xmm5,%xmm2
DB 102,15,20,214 ; unpcklpd %xmm6,%xmm2
- DB 102,15,254,129,225,92,0,0 ; paddd 0x5ce1(%ecx),%xmm0
+ DB 102,15,254,129,57,93,0,0 ; paddd 0x5d39(%ecx),%xmm0
DB 102,15,112,232,229 ; pshufd $0xe5,%xmm0,%xmm5
DB 102,15,126,232 ; movd %xmm5,%eax
DB 102,15,112,232,78 ; pshufd $0x4e,%xmm0,%xmm5
@@ -56736,7 +56705,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 243,15,16,44,130 ; movss (%edx,%eax,4),%xmm5
DB 15,20,245 ; unpcklps %xmm5,%xmm6
DB 102,15,20,240 ; unpcklpd %xmm0,%xmm6
- DB 102,15,254,137,225,92,0,0 ; paddd 0x5ce1(%ecx),%xmm1
+ DB 102,15,254,137,57,93,0,0 ; paddd 0x5d39(%ecx),%xmm1
DB 102,15,112,193,229 ; pshufd $0xe5,%xmm1,%xmm0
DB 102,15,126,192 ; movd %xmm0,%eax
DB 102,15,112,193,78 ; pshufd $0x4e,%xmm1,%xmm0
@@ -56754,7 +56723,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 102,15,111,202 ; movdqa %xmm2,%xmm1
DB 102,15,254,77,168 ; paddd -0x58(%ebp),%xmm1
DB 102,15,112,193,245 ; pshufd $0xf5,%xmm1,%xmm0
- DB 102,15,111,145,113,99,0,0 ; movdqa 0x6371(%ecx),%xmm2
+ DB 102,15,111,145,121,99,0,0 ; movdqa 0x6379(%ecx),%xmm2
DB 102,15,244,202 ; pmuludq %xmm2,%xmm1
DB 102,15,244,194 ; pmuludq %xmm2,%xmm0
DB 102,15,112,192,232 ; pshufd $0xe8,%xmm0,%xmm0
@@ -56790,7 +56759,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 243,15,16,4,130 ; movss (%edx,%eax,4),%xmm0
DB 15,20,216 ; unpcklps %xmm0,%xmm3
DB 102,15,20,217 ; unpcklpd %xmm1,%xmm3
- DB 102,15,254,169,225,92,0,0 ; paddd 0x5ce1(%ecx),%xmm5
+ DB 102,15,254,169,57,93,0,0 ; paddd 0x5d39(%ecx),%xmm5
DB 102,15,112,197,229 ; pshufd $0xe5,%xmm5,%xmm0
DB 102,15,126,192 ; movd %xmm0,%eax
DB 102,15,112,197,78 ; pshufd $0x4e,%xmm5,%xmm0
@@ -56850,7 +56819,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 102,15,111,209 ; movdqa %xmm1,%xmm2
DB 102,15,254,85,152 ; paddd -0x68(%ebp),%xmm2
DB 102,15,112,194,245 ; pshufd $0xf5,%xmm2,%xmm0
- DB 102,15,111,153,113,99,0,0 ; movdqa 0x6371(%ecx),%xmm3
+ DB 102,15,111,153,121,99,0,0 ; movdqa 0x6379(%ecx),%xmm3
DB 102,15,244,211 ; pmuludq %xmm3,%xmm2
DB 102,15,244,195 ; pmuludq %xmm3,%xmm0
DB 102,15,111,251 ; movdqa %xmm3,%xmm7
@@ -56889,7 +56858,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 243,15,16,44,130 ; movss (%edx,%eax,4),%xmm5
DB 15,20,229 ; unpcklps %xmm5,%xmm4
DB 102,15,20,227 ; unpcklpd %xmm3,%xmm4
- DB 102,15,254,129,225,92,0,0 ; paddd 0x5ce1(%ecx),%xmm0
+ DB 102,15,254,129,57,93,0,0 ; paddd 0x5d39(%ecx),%xmm0
DB 102,15,112,216,229 ; pshufd $0xe5,%xmm0,%xmm3
DB 102,15,126,216 ; movd %xmm3,%eax
DB 102,15,112,216,78 ; pshufd $0x4e,%xmm0,%xmm3
@@ -56941,7 +56910,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 243,15,16,52,130 ; movss (%edx,%eax,4),%xmm6
DB 15,20,238 ; unpcklps %xmm6,%xmm5
DB 102,15,20,235 ; unpcklpd %xmm3,%xmm5
- DB 102,15,111,137,225,92,0,0 ; movdqa 0x5ce1(%ecx),%xmm1
+ DB 102,15,111,137,57,93,0,0 ; movdqa 0x5d39(%ecx),%xmm1
DB 102,15,254,249 ; paddd %xmm1,%xmm7
DB 102,15,112,223,229 ; pshufd $0xe5,%xmm7,%xmm3
DB 102,15,126,216 ; movd %xmm3,%eax
@@ -56975,7 +56944,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 102,15,111,226 ; movdqa %xmm2,%xmm4
DB 102,15,254,69,152 ; paddd -0x68(%ebp),%xmm0
DB 102,15,112,208,245 ; pshufd $0xf5,%xmm0,%xmm2
- DB 102,15,111,153,113,99,0,0 ; movdqa 0x6371(%ecx),%xmm3
+ DB 102,15,111,153,121,99,0,0 ; movdqa 0x6379(%ecx),%xmm3
DB 102,15,244,195 ; pmuludq %xmm3,%xmm0
DB 102,15,244,211 ; pmuludq %xmm3,%xmm2
DB 102,15,112,218,232 ; pshufd $0xe8,%xmm2,%xmm3
@@ -57032,7 +57001,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 102,15,111,212 ; movdqa %xmm4,%xmm2
DB 102,15,254,85,168 ; paddd -0x58(%ebp),%xmm2
DB 102,15,112,194,245 ; pshufd $0xf5,%xmm2,%xmm0
- DB 102,15,111,137,113,99,0,0 ; movdqa 0x6371(%ecx),%xmm1
+ DB 102,15,111,137,121,99,0,0 ; movdqa 0x6379(%ecx),%xmm1
DB 102,15,244,209 ; pmuludq %xmm1,%xmm2
DB 102,15,244,193 ; pmuludq %xmm1,%xmm0
DB 102,15,112,240,232 ; pshufd $0xe8,%xmm0,%xmm6
@@ -57069,7 +57038,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 243,15,16,36,130 ; movss (%edx,%eax,4),%xmm4
DB 15,20,212 ; unpcklps %xmm4,%xmm2
DB 102,15,20,214 ; unpcklpd %xmm6,%xmm2
- DB 102,15,254,129,225,92,0,0 ; paddd 0x5ce1(%ecx),%xmm0
+ DB 102,15,254,129,57,93,0,0 ; paddd 0x5d39(%ecx),%xmm0
DB 102,15,112,224,229 ; pshufd $0xe5,%xmm0,%xmm4
DB 102,15,126,224 ; movd %xmm4,%eax
DB 102,15,112,224,78 ; pshufd $0x4e,%xmm0,%xmm4
@@ -57137,7 +57106,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 102,15,111,93,152 ; movdqa -0x68(%ebp),%xmm3
DB 102,15,254,217 ; paddd %xmm1,%xmm3
DB 102,15,112,211,245 ; pshufd $0xf5,%xmm3,%xmm2
- DB 102,15,111,129,113,99,0,0 ; movdqa 0x6371(%ecx),%xmm0
+ DB 102,15,111,129,121,99,0,0 ; movdqa 0x6379(%ecx),%xmm0
DB 102,15,244,216 ; pmuludq %xmm0,%xmm3
DB 102,15,244,208 ; pmuludq %xmm0,%xmm2
DB 102,15,111,248 ; movdqa %xmm0,%xmm7
@@ -57176,7 +57145,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 243,15,16,28,130 ; movss (%edx,%eax,4),%xmm3
DB 15,20,235 ; unpcklps %xmm3,%xmm5
DB 102,15,20,238 ; unpcklpd %xmm6,%xmm5
- DB 102,15,254,145,225,92,0,0 ; paddd 0x5ce1(%ecx),%xmm2
+ DB 102,15,254,145,57,93,0,0 ; paddd 0x5d39(%ecx),%xmm2
DB 102,15,112,218,229 ; pshufd $0xe5,%xmm2,%xmm3
DB 102,15,126,216 ; movd %xmm3,%eax
DB 102,15,112,218,78 ; pshufd $0x4e,%xmm2,%xmm3
@@ -57228,7 +57197,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 243,15,16,4,130 ; movss (%edx,%eax,4),%xmm0
DB 15,20,208 ; unpcklps %xmm0,%xmm2
DB 102,15,20,215 ; unpcklpd %xmm7,%xmm2
- DB 102,15,111,137,225,92,0,0 ; movdqa 0x5ce1(%ecx),%xmm1
+ DB 102,15,111,137,57,93,0,0 ; movdqa 0x5d39(%ecx),%xmm1
DB 102,15,254,217 ; paddd %xmm1,%xmm3
DB 102,15,112,195,229 ; pshufd $0xe5,%xmm3,%xmm0
DB 102,15,126,192 ; movd %xmm0,%eax
@@ -57263,7 +57232,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 102,15,111,194 ; movdqa %xmm2,%xmm0
DB 102,15,254,69,152 ; paddd -0x68(%ebp),%xmm0
DB 102,15,112,224,245 ; pshufd $0xf5,%xmm0,%xmm4
- DB 102,15,111,169,113,99,0,0 ; movdqa 0x6371(%ecx),%xmm5
+ DB 102,15,111,169,121,99,0,0 ; movdqa 0x6379(%ecx),%xmm5
DB 102,15,111,221 ; movdqa %xmm5,%xmm3
DB 102,15,244,195 ; pmuludq %xmm3,%xmm0
DB 102,15,244,227 ; pmuludq %xmm3,%xmm4
@@ -57319,7 +57288,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 102,15,111,202 ; movdqa %xmm2,%xmm1
DB 102,15,254,77,168 ; paddd -0x58(%ebp),%xmm1
DB 102,15,112,193,245 ; pshufd $0xf5,%xmm1,%xmm0
- DB 102,15,111,145,113,99,0,0 ; movdqa 0x6371(%ecx),%xmm2
+ DB 102,15,111,145,121,99,0,0 ; movdqa 0x6379(%ecx),%xmm2
DB 102,15,244,202 ; pmuludq %xmm2,%xmm1
DB 102,15,244,194 ; pmuludq %xmm2,%xmm0
DB 102,15,112,192,232 ; pshufd $0xe8,%xmm0,%xmm0
@@ -57355,7 +57324,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 243,15,16,4,130 ; movss (%edx,%eax,4),%xmm0
DB 15,20,216 ; unpcklps %xmm0,%xmm3
DB 102,15,20,217 ; unpcklpd %xmm1,%xmm3
- DB 102,15,254,185,225,92,0,0 ; paddd 0x5ce1(%ecx),%xmm7
+ DB 102,15,254,185,57,93,0,0 ; paddd 0x5d39(%ecx),%xmm7
DB 102,15,112,199,229 ; pshufd $0xe5,%xmm7,%xmm0
DB 102,15,126,192 ; movd %xmm0,%eax
DB 102,15,112,199,78 ; pshufd $0x4e,%xmm7,%xmm0
@@ -57405,7 +57374,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 102,15,111,233 ; movdqa %xmm1,%xmm5
DB 102,15,254,69,152 ; paddd -0x68(%ebp),%xmm0
DB 102,15,112,200,245 ; pshufd $0xf5,%xmm0,%xmm1
- DB 102,15,111,145,113,99,0,0 ; movdqa 0x6371(%ecx),%xmm2
+ DB 102,15,111,145,121,99,0,0 ; movdqa 0x6379(%ecx),%xmm2
DB 102,15,244,194 ; pmuludq %xmm2,%xmm0
DB 102,15,244,202 ; pmuludq %xmm2,%xmm1
DB 102,15,111,250 ; movdqa %xmm2,%xmm7
@@ -57444,7 +57413,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 243,15,16,36,130 ; movss (%edx,%eax,4),%xmm4
DB 15,20,204 ; unpcklps %xmm4,%xmm1
DB 102,15,20,203 ; unpcklpd %xmm3,%xmm1
- DB 102,15,254,145,225,92,0,0 ; paddd 0x5ce1(%ecx),%xmm2
+ DB 102,15,254,145,57,93,0,0 ; paddd 0x5d39(%ecx),%xmm2
DB 102,15,112,218,229 ; pshufd $0xe5,%xmm2,%xmm3
DB 102,15,126,216 ; movd %xmm3,%eax
DB 102,15,112,218,78 ; pshufd $0x4e,%xmm2,%xmm3
@@ -57498,7 +57467,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 243,15,16,36,130 ; movss (%edx,%eax,4),%xmm4
DB 15,20,252 ; unpcklps %xmm4,%xmm7
DB 102,15,20,254 ; unpcklpd %xmm6,%xmm7
- DB 102,15,254,153,225,92,0,0 ; paddd 0x5ce1(%ecx),%xmm3
+ DB 102,15,254,153,57,93,0,0 ; paddd 0x5d39(%ecx),%xmm3
DB 102,15,112,227,229 ; pshufd $0xe5,%xmm3,%xmm4
DB 102,15,126,224 ; movd %xmm4,%eax
DB 102,15,112,227,78 ; pshufd $0x4e,%xmm3,%xmm4
@@ -57531,7 +57500,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 102,15,254,208 ; paddd %xmm0,%xmm2
DB 102,15,111,216 ; movdqa %xmm0,%xmm3
DB 102,15,112,194,245 ; pshufd $0xf5,%xmm2,%xmm0
- DB 102,15,111,137,113,99,0,0 ; movdqa 0x6371(%ecx),%xmm1
+ DB 102,15,111,137,121,99,0,0 ; movdqa 0x6379(%ecx),%xmm1
DB 102,15,244,209 ; pmuludq %xmm1,%xmm2
DB 102,15,244,193 ; pmuludq %xmm1,%xmm0
DB 102,15,111,241 ; movdqa %xmm1,%xmm6
@@ -57571,7 +57540,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 15,20,225 ; unpcklps %xmm1,%xmm4
DB 102,15,20,226 ; unpcklpd %xmm2,%xmm4
DB 102,15,41,165,88,255,255,255 ; movapd %xmm4,-0xa8(%ebp)
- DB 102,15,254,129,225,92,0,0 ; paddd 0x5ce1(%ecx),%xmm0
+ DB 102,15,254,129,57,93,0,0 ; paddd 0x5d39(%ecx),%xmm0
DB 102,15,112,200,229 ; pshufd $0xe5,%xmm0,%xmm1
DB 102,15,126,200 ; movd %xmm1,%eax
DB 102,15,112,200,78 ; pshufd $0x4e,%xmm0,%xmm1
@@ -57625,7 +57594,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 243,15,16,52,130 ; movss (%edx,%eax,4),%xmm6
DB 15,20,206 ; unpcklps %xmm6,%xmm1
DB 102,15,20,203 ; unpcklpd %xmm3,%xmm1
- DB 102,15,254,145,225,92,0,0 ; paddd 0x5ce1(%ecx),%xmm2
+ DB 102,15,254,145,57,93,0,0 ; paddd 0x5d39(%ecx),%xmm2
DB 102,15,112,218,229 ; pshufd $0xe5,%xmm2,%xmm3
DB 102,15,126,216 ; movd %xmm3,%eax
DB 102,15,112,218,78 ; pshufd $0x4e,%xmm2,%xmm3
@@ -57694,7 +57663,7 @@ _sk_clut_4D_sse2 LABEL PROC
DB 139,85,12 ; mov 0xc(%ebp),%edx
DB 141,66,8 ; lea 0x8(%edx),%eax
DB 131,236,8 ; sub $0x8,%esp
- DB 15,40,153,161,92,0,0 ; movaps 0x5ca1(%ecx),%xmm3
+ DB 15,40,153,249,92,0,0 ; movaps 0x5cf9(%ecx),%xmm3
DB 80 ; push %eax
DB 255,117,8 ; pushl 0x8(%ebp)
DB 255,82,4 ; call *0x4(%edx)
@@ -57704,6 +57673,35 @@ _sk_clut_4D_sse2 LABEL PROC
DB 91 ; pop %ebx
DB 93 ; pop %ebp
DB 195 ; ret
+
+PUBLIC _sk_gauss_a_to_rgba_sse2
+_sk_gauss_a_to_rgba_sse2 LABEL PROC
+ DB 85 ; push %ebp
+ DB 137,229 ; mov %esp,%ebp
+ DB 131,236,8 ; sub $0x8,%esp
+ DB 232,0,0,0,0 ; call 953c <_sk_gauss_a_to_rgba_sse2+0xb>
+ DB 88 ; pop %eax
+ DB 139,77,12 ; mov 0xc(%ebp),%ecx
+ DB 15,40,128,52,79,0,0 ; movaps 0x4f34(%eax),%xmm0
+ DB 15,89,195 ; mulps %xmm3,%xmm0
+ DB 15,88,128,68,79,0,0 ; addps 0x4f44(%eax),%xmm0
+ DB 15,89,195 ; mulps %xmm3,%xmm0
+ DB 15,88,128,84,79,0,0 ; addps 0x4f54(%eax),%xmm0
+ DB 15,89,195 ; mulps %xmm3,%xmm0
+ DB 15,88,128,100,79,0,0 ; addps 0x4f64(%eax),%xmm0
+ DB 15,89,195 ; mulps %xmm3,%xmm0
+ DB 15,88,128,116,79,0,0 ; addps 0x4f74(%eax),%xmm0
+ DB 141,65,4 ; lea 0x4(%ecx),%eax
+ DB 131,236,8 ; sub $0x8,%esp
+ DB 15,40,200 ; movaps %xmm0,%xmm1
+ DB 15,40,208 ; movaps %xmm0,%xmm2
+ DB 15,40,216 ; movaps %xmm0,%xmm3
+ DB 80 ; push %eax
+ DB 255,117,8 ; pushl 0x8(%ebp)
+ DB 255,17 ; call *(%ecx)
+ DB 131,196,24 ; add $0x18,%esp
+ DB 93 ; pop %ebp
+ DB 195 ; ret
DB 144 ; nop
DB 144 ; nop
DB 144 ; nop
@@ -63645,47 +63643,20 @@ ALIGN 16
DB 0,0 ; add %al,(%eax)
DB 211,128,0,0,211,128 ; roll %cl,-0x7f2d0000(%eax)
DB 0,0 ; add %al,(%eax)
- DB 211,128,0,0,211,45 ; roll %cl,0x2dd30000(%eax)
- DB 16,17 ; adc %dl,(%ecx)
- DB 192,45,16,17,192,45,16 ; shrb $0x10,0x2dc01110
- DB 17,192 ; adc %eax,%eax
- DB 45,16,17,192,18 ; sub $0x12c01110,%eax
- DB 120,57 ; js e3cc <.literal16+0x5fc>
- DB 64 ; inc %eax
- DB 18,120,57 ; adc 0x39(%eax),%bh
- DB 64 ; inc %eax
- DB 18,120,57 ; adc 0x39(%eax),%bh
- DB 64 ; inc %eax
- DB 18,120,57 ; adc 0x39(%eax),%bh
- DB 64 ; inc %eax
- DB 32,148,90,62,32,148,90 ; and %dl,0x5a94203e(%edx,%ebx,2)
- DB 62,32,148,90,62,32,148,90 ; and %dl,%ds:0x5a94203e(%edx,%ebx,2)
- DB 62,4,157 ; ds add $0x9d,%al
- DB 30 ; push %ds
- DB 62,4,157 ; ds add $0x9d,%al
- DB 30 ; push %ds
- DB 62,4,157 ; ds add $0x9d,%al
- DB 30 ; push %ds
- DB 62,4,157 ; ds add $0x9d,%al
- DB 30 ; push %ds
- DB 62,0,24 ; add %bl,%ds:(%eax)
- DB 161,57,0,24,161 ; mov 0xa1180039,%eax
- DB 57,0 ; cmp %eax,(%eax)
- DB 24,161,57,0,24,161 ; sbb %ah,-0x5ee7ffc7(%ecx)
- DB 57,111,43 ; cmp %ebp,0x2b(%edi)
- DB 231,187 ; out %eax,$0xbb
- DB 111 ; outsl %ds:(%esi),(%dx)
+ DB 211,128,0,0,211,111 ; roll %cl,0x6fd30000(%eax)
DB 43,231 ; sub %edi,%esp
DB 187,111,43,231,187 ; mov $0xbbe72b6f,%ebx
DB 111 ; outsl %ds:(%esi),(%dx)
DB 43,231 ; sub %edi,%esp
- DB 187,159,215,202,60 ; mov $0x3ccad79f,%ebx
+ DB 187,111,43,231,187 ; mov $0xbbe72b6f,%ebx
DB 159 ; lahf
DB 215 ; xlat %ds:(%ebx)
DB 202,60,159 ; lret $0x9f3c
DB 215 ; xlat %ds:(%ebx)
DB 202,60,159 ; lret $0x9f3c
DB 215 ; xlat %ds:(%ebx)
+ DB 202,60,159 ; lret $0x9f3c
+ DB 215 ; xlat %ds:(%ebx)
DB 202,60,212 ; lret $0xd43c
DB 100,84 ; fs push %esp
DB 189,212,100,84,189 ; mov $0xbd5464d4,%ebp
@@ -63721,13 +63692,13 @@ ALIGN 16
DB 192,191,0,0,192,191,0 ; sarb $0x0,-0x40400000(%edi)
DB 0,192 ; add %al,%al
DB 191,0,0,192,191 ; mov $0xbfc00000,%edi
- DB 114,28 ; jb e47e <.literal16+0x6ae>
+ DB 114,28 ; jb e42e <.literal16+0x65e>
DB 199 ; (bad)
- DB 62,114,28 ; jb,pt e482 <.literal16+0x6b2>
+ DB 62,114,28 ; jb,pt e432 <.literal16+0x662>
DB 199 ; (bad)
- DB 62,114,28 ; jb,pt e486 <.literal16+0x6b6>
+ DB 62,114,28 ; jb,pt e436 <.literal16+0x666>
DB 199 ; (bad)
- DB 62,114,28 ; jb,pt e48a <.literal16+0x6ba>
+ DB 62,114,28 ; jb,pt e43a <.literal16+0x66a>
DB 199 ; (bad)
DB 62,85 ; ds push %ebp
DB 85 ; push %ebp
@@ -63748,13 +63719,13 @@ ALIGN 16
DB 57,142,99,61,57,142 ; cmp %ecx,-0x71c6c29d(%esi)
DB 99,61,57,142,99,61 ; arpl %di,0x3d638e39
DB 57,142,99,61,114,249 ; cmp %ecx,-0x68dc29d(%esi)
- DB 127,63 ; jg e4e3 <.literal16+0x713>
- DB 114,249 ; jb e49f <.literal16+0x6cf>
- DB 127,63 ; jg e4e7 <.literal16+0x717>
- DB 114,249 ; jb e4a3 <.literal16+0x6d3>
- DB 127,63 ; jg e4eb <.literal16+0x71b>
- DB 114,249 ; jb e4a7 <.literal16+0x6d7>
- DB 127,63 ; jg e4ef <.literal16+0x71f>
+ DB 127,63 ; jg e493 <.literal16+0x6c3>
+ DB 114,249 ; jb e44f <.literal16+0x67f>
+ DB 127,63 ; jg e497 <.literal16+0x6c7>
+ DB 114,249 ; jb e453 <.literal16+0x683>
+ DB 127,63 ; jg e49b <.literal16+0x6cb>
+ DB 114,249 ; jb e457 <.literal16+0x687>
+ DB 127,63 ; jg e49f <.literal16+0x6cf>
DB 3,0 ; add (%eax),%eax
DB 0,0 ; add %al,(%eax)
DB 3,0 ; add (%eax),%eax
@@ -63763,25 +63734,53 @@ ALIGN 16
DB 0,0 ; add %al,(%eax)
DB 3,0 ; add (%eax),%eax
DB 0,0 ; add %al,(%eax)
- DB 255,0 ; incl (%eax)
- DB 255,0 ; incl (%eax)
- DB 255,0 ; incl (%eax)
- DB 255,0 ; incl (%eax)
- DB 255,0 ; incl (%eax)
- DB 255,0 ; incl (%eax)
- DB 255,0 ; incl (%eax)
- DB 255,0 ; incl (%eax)
- DB 254,0 ; incb (%eax)
- DB 254,0 ; incb (%eax)
- DB 254,0 ; incb (%eax)
- DB 254,0 ; incb (%eax)
- DB 254,0 ; incb (%eax)
- DB 254,0 ; incb (%eax)
- DB 254,0 ; incb (%eax)
- DB 254,0 ; incb (%eax)
+ DB 45,16,17,192,45 ; sub $0x2dc01110,%eax
+ DB 16,17 ; adc %dl,(%ecx)
+ DB 192,45,16,17,192,45,16 ; shrb $0x10,0x2dc01110
+ DB 17,192 ; adc %eax,%eax
+ DB 18,120,57 ; adc 0x39(%eax),%bh
+ DB 64 ; inc %eax
+ DB 18,120,57 ; adc 0x39(%eax),%bh
+ DB 64 ; inc %eax
+ DB 18,120,57 ; adc 0x39(%eax),%bh
+ DB 64 ; inc %eax
+ DB 18,120,57 ; adc 0x39(%eax),%bh
+ DB 64 ; inc %eax
+ DB 32,148,90,62,32,148,90 ; and %dl,0x5a94203e(%edx,%ebx,2)
+ DB 62,32,148,90,62,32,148,90 ; and %dl,%ds:0x5a94203e(%edx,%ebx,2)
+ DB 62,4,157 ; ds add $0x9d,%al
+ DB 30 ; push %ds
+ DB 62,4,157 ; ds add $0x9d,%al
+ DB 30 ; push %ds
+ DB 62,4,157 ; ds add $0x9d,%al
+ DB 30 ; push %ds
+ DB 62,4,157 ; ds add $0x9d,%al
+ DB 30 ; push %ds
+ DB 62,0,24 ; add %bl,%ds:(%eax)
+ DB 161,57,0,24,161 ; mov 0xa1180039,%eax
+ DB 57,0 ; cmp %eax,(%eax)
+ DB 24,161,57,0,24,161 ; sbb %ah,-0x5ee7ffc7(%ecx)
+ DB 57,255 ; cmp %edi,%edi
+ DB 0,255 ; add %bh,%bh
+ DB 0,255 ; add %bh,%bh
+ DB 0,255 ; add %bh,%bh
+ DB 0,255 ; add %bh,%bh
+ DB 0,255 ; add %bh,%bh
+ DB 0,255 ; add %bh,%bh
+ DB 0,255 ; add %bh,%bh
+ DB 0,254 ; add %bh,%dh
+ DB 0,254 ; add %bh,%dh
+ DB 0,254 ; add %bh,%dh
+ DB 0,254 ; add %bh,%dh
+ DB 0,254 ; add %bh,%dh
+ DB 0,254 ; add %bh,%dh
+ DB 0,254 ; add %bh,%dh
+ DB 0,254 ; add %bh,%dh
+ DB 0,0 ; add %al,(%eax)
+ DB 128,0,128 ; addb $0x80,(%eax)
DB 0,128,0,128,0,128 ; add %al,-0x7fff8000(%eax)
DB 0,128,0,128,0,128 ; add %al,-0x7fff8000(%eax)
- DB 0,128,0,128,254,1 ; add %al,0x1fe8000(%eax)
+ DB 254,1 ; incb (%ecx)
DB 254,1 ; incb (%ecx)
DB 254,1 ; incb (%ecx)
DB 254,1 ; incb (%ecx)
diff --git a/src/jumper/SkJumper_stages.cpp b/src/jumper/SkJumper_stages.cpp
index 9224f2a57f..7c769fd6e3 100644
--- a/src/jumper/SkJumper_stages.cpp
+++ b/src/jumper/SkJumper_stages.cpp
@@ -1198,23 +1198,6 @@ STAGE(evenly_spaced_gradient, const SkJumper_GradientCtx* c) {
gradient_lookup(c, idx, t, &r, &g, &b, &a);
}
-// TODO: move this somewhere not in the middle of the gradients...
-STAGE(gauss_a_to_rgba, Ctx::None) {
- // x = 1 - x;
- // exp(-x * x * 4) - 0.018f;
- // ... now approximate with quartic
- //
- const float c4 = -2.26661229133605957031f;
- const float c3 = 2.89795351028442382812f;
- const float c2 = 0.21345567703247070312f;
- const float c1 = 0.15489584207534790039f;
- const float c0 = 0.00030726194381713867f;
- a = mad(a, mad(a, mad(a, mad(a, c4, c3), c2), c1), c0);
- r = a;
- g = a;
- b = a;
-}
-
STAGE(gradient, const SkJumper_GradientCtx* c) {
auto t = r;
U32 idx = 0;
@@ -1503,3 +1486,19 @@ STAGE(clut_4D, const SkJumper_ColorLookupTableCtx* ctx) {
// "a" was really CMYK's K, so we just set alpha opaque.
a = 1.0f;
}
+
+STAGE(gauss_a_to_rgba, Ctx::None) {
+ // x = 1 - x;
+ // exp(-x * x * 4) - 0.018f;
+ // ... now approximate with quartic
+ //
+ const float c4 = -2.26661229133605957031f;
+ const float c3 = 2.89795351028442382812f;
+ const float c2 = 0.21345567703247070312f;
+ const float c1 = 0.15489584207534790039f;
+ const float c0 = 0.00030726194381713867f;
+ a = mad(a, mad(a, mad(a, mad(a, c4, c3), c2), c1), c0);
+ r = a;
+ g = a;
+ b = a;
+}