summaryrefslogtreecommitdiffstats
path: root/gfx/cairo/pixman-16-bit-pipeline.patch
diff options
context:
space:
mode:
Diffstat (limited to 'gfx/cairo/pixman-16-bit-pipeline.patch')
-rw-r--r--gfx/cairo/pixman-16-bit-pipeline.patch1242
1 files changed, 1242 insertions, 0 deletions
diff --git a/gfx/cairo/pixman-16-bit-pipeline.patch b/gfx/cairo/pixman-16-bit-pipeline.patch
new file mode 100644
index 000000000..8a7878ca2
--- /dev/null
+++ b/gfx/cairo/pixman-16-bit-pipeline.patch
@@ -0,0 +1,1242 @@
+diff --git a/gfx/cairo/libpixman/src/pixman-access.c b/gfx/cairo/libpixman/src/pixman-access.c
+--- a/gfx/cairo/libpixman/src/pixman-access.c
++++ b/gfx/cairo/libpixman/src/pixman-access.c
+@@ -933,16 +933,54 @@ store_scanline_x2b10g10r10 (bits_image_t
+ {
+ WRITE (image, pixel++,
+ ((values[i] >> 38) & 0x3ff) |
+ ((values[i] >> 12) & 0xffc00) |
+ ((values[i] << 14) & 0x3ff00000));
+ }
+ }
+
++static void
++store_scanline_16 (bits_image_t * image,
++ int x,
++ int y,
++ int width,
++ const uint32_t *v)
++{
++ uint16_t *bits = (uint16_t*)(image->bits + image->rowstride * y);
++ uint16_t *values = (uint16_t *)v;
++ uint16_t *pixel = bits + x;
++ int i;
++
++ for (i = 0; i < width; ++i)
++ {
++ WRITE (image, pixel++, values[i]);
++ }
++}
++
++static void
++fetch_scanline_16 (pixman_image_t *image,
++ int x,
++ int y,
++ int width,
++ uint32_t * b,
++ const uint32_t *mask)
++{
++ const uint16_t *bits = (uint16_t*)(image->bits.bits + y * image->bits.rowstride);
++ const uint16_t *pixel = bits + x;
++ int i;
++ uint16_t *buffer = (uint16_t *)b;
++
++ for (i = 0; i < width; ++i)
++ {
++ *buffer++ = READ (image, pixel++);
++ }
++}
++
++
+ /*
+ * Contracts a 64bpp image to 32bpp and then stores it using a regular 32-bit
+ * store proc. Despite the type, this function expects a uint64_t buffer.
+ */
+ static void
+ store_scanline_generic_64 (bits_image_t * image,
+ int x,
+ int y,
+@@ -1044,32 +1082,47 @@ fetch_pixel_generic_lossy_32 (bits_image
+ pixman_contract (&result, &pixel64, 1);
+
+ return result;
+ }
+
+ typedef struct
+ {
+ pixman_format_code_t format;
++ fetch_scanline_t fetch_scanline_16;
+ fetch_scanline_t fetch_scanline_32;
+ fetch_scanline_t fetch_scanline_64;
+ fetch_pixel_32_t fetch_pixel_32;
+ fetch_pixel_64_t fetch_pixel_64;
++ store_scanline_t store_scanline_16;
+ store_scanline_t store_scanline_32;
+ store_scanline_t store_scanline_64;
+ } format_info_t;
+
+ #define FORMAT_INFO(format) \
+ { \
+ PIXMAN_ ## format, \
++ NULL, \
+ fetch_scanline_ ## format, \
+ fetch_scanline_generic_64, \
+ fetch_pixel_ ## format, fetch_pixel_generic_64, \
++ NULL, \
+ store_scanline_ ## format, store_scanline_generic_64 \
+ }
++#define FORMAT_INFO16(format) \
++ { \
++ PIXMAN_ ## format, \
++ fetch_scanline_16, \
++ fetch_scanline_ ## format, \
++ fetch_scanline_generic_64, \
++ fetch_pixel_ ## format, fetch_pixel_generic_64, \
++ store_scanline_16, \
++ store_scanline_ ## format, store_scanline_generic_64 \
++ }
++
+
+ static const format_info_t accessors[] =
+ {
+ /* 32 bpp formats */
+ FORMAT_INFO (a8r8g8b8),
+ FORMAT_INFO (x8r8g8b8),
+ FORMAT_INFO (a8b8g8r8),
+ FORMAT_INFO (x8b8g8r8),
+@@ -1079,18 +1132,18 @@ static const format_info_t accessors[] =
+ FORMAT_INFO (r8g8b8x8),
+ FORMAT_INFO (x14r6g6b6),
+
+ /* 24bpp formats */
+ FORMAT_INFO (r8g8b8),
+ FORMAT_INFO (b8g8r8),
+
+ /* 16bpp formats */
+- FORMAT_INFO (r5g6b5),
+- FORMAT_INFO (b5g6r5),
++ FORMAT_INFO16 (r5g6b5),
++ FORMAT_INFO16 (b5g6r5),
+
+ FORMAT_INFO (a1r5g5b5),
+ FORMAT_INFO (x1r5g5b5),
+ FORMAT_INFO (a1b5g5r5),
+ FORMAT_INFO (x1b5g5r5),
+ FORMAT_INFO (a4r4g4b4),
+ FORMAT_INFO (x4r4g4b4),
+ FORMAT_INFO (a4b4g4r4),
+@@ -1132,62 +1185,64 @@ static const format_info_t accessors[] =
+
+ /* 1bpp formats */
+ FORMAT_INFO (a1),
+ FORMAT_INFO (g1),
+
+ /* Wide formats */
+
+ { PIXMAN_a2r10g10b10,
+- NULL, fetch_scanline_a2r10g10b10,
++ NULL, NULL, fetch_scanline_a2r10g10b10,
+ fetch_pixel_generic_lossy_32, fetch_pixel_a2r10g10b10,
+ NULL, store_scanline_a2r10g10b10 },
+
+ { PIXMAN_x2r10g10b10,
+- NULL, fetch_scanline_x2r10g10b10,
++ NULL, NULL, fetch_scanline_x2r10g10b10,
+ fetch_pixel_generic_lossy_32, fetch_pixel_x2r10g10b10,
+ NULL, store_scanline_x2r10g10b10 },
+
+ { PIXMAN_a2b10g10r10,
+- NULL, fetch_scanline_a2b10g10r10,
++ NULL, NULL, fetch_scanline_a2b10g10r10,
+ fetch_pixel_generic_lossy_32, fetch_pixel_a2b10g10r10,
+ NULL, store_scanline_a2b10g10r10 },
+
+ { PIXMAN_x2b10g10r10,
+- NULL, fetch_scanline_x2b10g10r10,
++ NULL, NULL, fetch_scanline_x2b10g10r10,
+ fetch_pixel_generic_lossy_32, fetch_pixel_x2b10g10r10,
+ NULL, store_scanline_x2b10g10r10 },
+
+ /* YUV formats */
+ { PIXMAN_yuy2,
+- fetch_scanline_yuy2, fetch_scanline_generic_64,
++ NULL, fetch_scanline_yuy2, fetch_scanline_generic_64,
+ fetch_pixel_yuy2, fetch_pixel_generic_64,
+ NULL, NULL },
+
+ { PIXMAN_yv12,
+- fetch_scanline_yv12, fetch_scanline_generic_64,
++ NULL, fetch_scanline_yv12, fetch_scanline_generic_64,
+ fetch_pixel_yv12, fetch_pixel_generic_64,
+ NULL, NULL },
+
+ { PIXMAN_null },
+ };
+
+ static void
+ setup_accessors (bits_image_t *image)
+ {
+ const format_info_t *info = accessors;
+
+ while (info->format != PIXMAN_null)
+ {
+ if (info->format == image->format)
+ {
++ image->fetch_scanline_16 = info->fetch_scanline_16;
+ image->fetch_scanline_32 = info->fetch_scanline_32;
+ image->fetch_scanline_64 = info->fetch_scanline_64;
+ image->fetch_pixel_32 = info->fetch_pixel_32;
+ image->fetch_pixel_64 = info->fetch_pixel_64;
++ image->store_scanline_16 = info->store_scanline_16;
+ image->store_scanline_32 = info->store_scanline_32;
+ image->store_scanline_64 = info->store_scanline_64;
+
+ return;
+ }
+
+ info++;
+ }
+diff --git a/gfx/cairo/libpixman/src/pixman-bits-image.c b/gfx/cairo/libpixman/src/pixman-bits-image.c
+--- a/gfx/cairo/libpixman/src/pixman-bits-image.c
++++ b/gfx/cairo/libpixman/src/pixman-bits-image.c
+@@ -1247,16 +1247,31 @@ src_get_scanline_wide (pixman_iter_t *it
+
+ void
+ _pixman_bits_image_src_iter_init (pixman_image_t *image, pixman_iter_t *iter)
+ {
+ if (iter->flags & ITER_NARROW)
+ iter->get_scanline = src_get_scanline_narrow;
+ else
+ iter->get_scanline = src_get_scanline_wide;
++
++}
++
++static uint32_t *
++dest_get_scanline_16 (pixman_iter_t *iter, const uint32_t *mask)
++{
++ pixman_image_t *image = iter->image;
++ int x = iter->x;
++ int y = iter->y;
++ int width = iter->width;
++ uint32_t * buffer = iter->buffer;
++
++ image->bits.fetch_scanline_16 (image, x, y, width, buffer, mask);
++
++ return iter->buffer;
+ }
+
+ static uint32_t *
+ dest_get_scanline_narrow (pixman_iter_t *iter, const uint32_t *mask)
+ {
+ pixman_image_t *image = iter->image;
+ int x = iter->x;
+ int y = iter->y;
+@@ -1327,16 +1342,30 @@ dest_get_scanline_wide (pixman_iter_t *i
+ free (alpha);
+ }
+ }
+
+ return iter->buffer;
+ }
+
+ static void
++dest_write_back_16 (pixman_iter_t *iter)
++{
++ bits_image_t * image = &iter->image->bits;
++ int x = iter->x;
++ int y = iter->y;
++ int width = iter->width;
++ const uint32_t *buffer = iter->buffer;
++
++ image->store_scanline_16 (image, x, y, width, buffer);
++
++ iter->y++;
++}
++
++static void
+ dest_write_back_narrow (pixman_iter_t *iter)
+ {
+ bits_image_t * image = &iter->image->bits;
+ int x = iter->x;
+ int y = iter->y;
+ int width = iter->width;
+ const uint32_t *buffer = iter->buffer;
+
+@@ -1375,28 +1404,41 @@ dest_write_back_wide (pixman_iter_t *ite
+ }
+
+ iter->y++;
+ }
+
+ void
+ _pixman_bits_image_dest_iter_init (pixman_image_t *image, pixman_iter_t *iter)
+ {
+- if (iter->flags & ITER_NARROW)
++ if (iter->flags & ITER_16)
++ {
++ if ((iter->flags & (ITER_IGNORE_RGB | ITER_IGNORE_ALPHA)) ==
++ (ITER_IGNORE_RGB | ITER_IGNORE_ALPHA))
++ {
++ iter->get_scanline = _pixman_iter_get_scanline_noop;
++ }
++ else
++ {
++ iter->get_scanline = dest_get_scanline_16;
++ }
++ iter->write_back = dest_write_back_16;
++ }
++ else if (iter->flags & ITER_NARROW)
+ {
+ if ((iter->flags & (ITER_IGNORE_RGB | ITER_IGNORE_ALPHA)) ==
+ (ITER_IGNORE_RGB | ITER_IGNORE_ALPHA))
+ {
+ iter->get_scanline = _pixman_iter_get_scanline_noop;
+ }
+ else
+ {
+ iter->get_scanline = dest_get_scanline_narrow;
+ }
+-
++
+ iter->write_back = dest_write_back_narrow;
+ }
+ else
+ {
+ iter->get_scanline = dest_get_scanline_wide;
+ iter->write_back = dest_write_back_wide;
+ }
+ }
+diff --git a/gfx/cairo/libpixman/src/pixman-combine16.c b/gfx/cairo/libpixman/src/pixman-combine16.c
+new file mode 100644
+--- /dev/null
++++ b/gfx/cairo/libpixman/src/pixman-combine16.c
+@@ -0,0 +1,124 @@
++#ifdef HAVE_CONFIG_H
++#include <config.h>
++#endif
++
++#include <math.h>
++#include <string.h>
++
++#include "pixman-private.h"
++
++#include "pixman-combine32.h"
++
++static force_inline uint32_t
++combine_mask (const uint32_t src, const uint32_t mask)
++{
++ uint32_t s, m;
++
++ m = mask >> A_SHIFT;
++
++ if (!m)
++ return 0;
++ s = src;
++
++ UN8x4_MUL_UN8 (s, m);
++
++ return s;
++}
++
++static inline uint32_t convert_0565_to_8888(uint16_t color)
++{
++ return CONVERT_0565_TO_8888(color);
++}
++
++static inline uint16_t convert_8888_to_0565(uint32_t color)
++{
++ return CONVERT_8888_TO_0565(color);
++}
++
++static void
++combine_src_u (pixman_implementation_t *imp,
++ pixman_op_t op,
++ uint32_t * dest,
++ const uint32_t * src,
++ const uint32_t * mask,
++ int width)
++{
++ int i;
++
++ if (!mask)
++ memcpy (dest, src, width * sizeof (uint16_t));
++ else
++ {
++ uint16_t *d = (uint16_t*)dest;
++ uint16_t *src16 = (uint16_t*)src;
++ for (i = 0; i < width; ++i)
++ {
++ if ((*mask & 0xff000000) == 0xff000000) {
++ // it's likely worth special casing
++ // fully opaque because it avoids
++ // the cost of conversion as well the multiplication
++ *(d + i) = *src16;
++ } else {
++ // the mask is still 32bits
++ uint32_t s = combine_mask (convert_0565_to_8888(*src16), *mask);
++ *(d + i) = convert_8888_to_0565(s);
++ }
++ mask++;
++ src16++;
++ }
++ }
++
++}
++
++static void
++combine_over_u (pixman_implementation_t *imp,
++ pixman_op_t op,
++ uint32_t * dest,
++ const uint32_t * src,
++ const uint32_t * mask,
++ int width)
++{
++ int i;
++
++ if (!mask)
++ memcpy (dest, src, width * sizeof (uint16_t));
++ else
++ {
++ uint16_t *d = (uint16_t*)dest;
++ uint16_t *src16 = (uint16_t*)src;
++ for (i = 0; i < width; ++i)
++ {
++ if ((*mask & 0xff000000) == 0xff000000) {
++ // it's likely worth special casing
++ // fully opaque because it avoids
++ // the cost of conversion as well the multiplication
++ *(d + i) = *src16;
++ } else if ((*mask & 0xff000000) == 0x00000000) {
++ // keep the dest the same
++ } else {
++ // the mask is still 32bits
++ uint32_t s = combine_mask (convert_0565_to_8888(*src16), *mask);
++ uint32_t ia = ALPHA_8 (~s);
++ uint32_t d32 = convert_0565_to_8888(*(d + i));
++ UN8x4_MUL_UN8_ADD_UN8x4 (d32, ia, s);
++ *(d + i) = convert_8888_to_0565(d32);
++ }
++ mask++;
++ src16++;
++ }
++ }
++
++}
++
++
++void
++_pixman_setup_combiner_functions_16 (pixman_implementation_t *imp)
++{
++ int i;
++ for (i = 0; i < PIXMAN_N_OPERATORS; i++) {
++ imp->combine_16[i] = NULL;
++ }
++ imp->combine_16[PIXMAN_OP_SRC] = combine_src_u;
++ imp->combine_16[PIXMAN_OP_OVER] = combine_over_u;
++}
++
+diff --git a/gfx/cairo/libpixman/src/pixman-general.c b/gfx/cairo/libpixman/src/pixman-general.c
+--- a/gfx/cairo/libpixman/src/pixman-general.c
++++ b/gfx/cairo/libpixman/src/pixman-general.c
+@@ -106,46 +106,61 @@ general_composite_rect (pixman_implemen
+ PIXMAN_COMPOSITE_ARGS (info);
+ uint64_t stack_scanline_buffer[(SCANLINE_BUFFER_LENGTH * 3 + 7) / 8];
+ uint8_t *scanline_buffer = (uint8_t *) stack_scanline_buffer;
+ uint8_t *src_buffer, *mask_buffer, *dest_buffer;
+ pixman_iter_t src_iter, mask_iter, dest_iter;
+ pixman_combine_32_func_t compose;
+ pixman_bool_t component_alpha;
+ iter_flags_t narrow, src_flags;
++ iter_flags_t rgb16;
+ int Bpp;
+ int i;
+
+ if ((src_image->common.flags & FAST_PATH_NARROW_FORMAT) &&
+ (!mask_image || mask_image->common.flags & FAST_PATH_NARROW_FORMAT) &&
+ (dest_image->common.flags & FAST_PATH_NARROW_FORMAT))
+ {
+ narrow = ITER_NARROW;
+ Bpp = 4;
+ }
+ else
+ {
+ narrow = 0;
+ Bpp = 8;
+ }
+
++ // XXX: This special casing is bad. Ideally, we'd keep the general code general perhaps
++ // by having it deal more specifically with different intermediate formats
++ if (
++ (dest_image->common.flags & FAST_PATH_16_FORMAT && (src_image->type == LINEAR || src_image->type == RADIAL)) &&
++ ( op == PIXMAN_OP_SRC ||
++ (op == PIXMAN_OP_OVER && (src_image->common.flags & FAST_PATH_IS_OPAQUE))
++ )
++ ) {
++ rgb16 = ITER_16;
++ } else {
++ rgb16 = 0;
++ }
++
++
+ if (width * Bpp > SCANLINE_BUFFER_LENGTH)
+ {
+ scanline_buffer = pixman_malloc_abc (width, 3, Bpp);
+
+ if (!scanline_buffer)
+ return;
+ }
+
+ src_buffer = scanline_buffer;
+ mask_buffer = src_buffer + width * Bpp;
+ dest_buffer = mask_buffer + width * Bpp;
+
+ /* src iter */
+- src_flags = narrow | op_flags[op].src;
++ src_flags = narrow | op_flags[op].src | rgb16;
+
+ _pixman_implementation_src_iter_init (imp->toplevel, &src_iter, src_image,
+ src_x, src_y, width, height,
+ src_buffer, src_flags);
+
+ /* mask iter */
+ if ((src_flags & (ITER_IGNORE_ALPHA | ITER_IGNORE_RGB)) ==
+ (ITER_IGNORE_ALPHA | ITER_IGNORE_RGB))
+@@ -164,20 +179,20 @@ general_composite_rect (pixman_implemen
+
+ _pixman_implementation_src_iter_init (
+ imp->toplevel, &mask_iter, mask_image, mask_x, mask_y, width, height,
+ mask_buffer, narrow | (component_alpha? 0 : ITER_IGNORE_RGB));
+
+ /* dest iter */
+ _pixman_implementation_dest_iter_init (
+ imp->toplevel, &dest_iter, dest_image, dest_x, dest_y, width, height,
+- dest_buffer, narrow | op_flags[op].dst);
++ dest_buffer, narrow | op_flags[op].dst | rgb16);
+
+ compose = _pixman_implementation_lookup_combiner (
+- imp->toplevel, op, component_alpha, narrow);
++ imp->toplevel, op, component_alpha, narrow, !!rgb16);
+
+ if (!compose)
+ return;
+
+ for (i = 0; i < height; ++i)
+ {
+ uint32_t *s, *m, *d;
+
+@@ -234,16 +249,17 @@ general_fill (pixman_implementation_t *i
+ return FALSE;
+ }
+
+ pixman_implementation_t *
+ _pixman_implementation_create_general (void)
+ {
+ pixman_implementation_t *imp = _pixman_implementation_create (NULL, general_fast_path);
+
++ _pixman_setup_combiner_functions_16 (imp);
+ _pixman_setup_combiner_functions_32 (imp);
+ _pixman_setup_combiner_functions_64 (imp);
+
+ imp->blt = general_blt;
+ imp->fill = general_fill;
+ imp->src_iter_init = general_src_iter_init;
+ imp->dest_iter_init = general_dest_iter_init;
+
+diff --git a/gfx/cairo/libpixman/src/pixman-image.c b/gfx/cairo/libpixman/src/pixman-image.c
+--- a/gfx/cairo/libpixman/src/pixman-image.c
++++ b/gfx/cairo/libpixman/src/pixman-image.c
+@@ -451,16 +451,20 @@ compute_image_info (pixman_image_t *imag
+ flags |= FAST_PATH_IS_OPAQUE;
+ }
+
+ if (image->bits.read_func || image->bits.write_func)
+ flags &= ~FAST_PATH_NO_ACCESSORS;
+
+ if (PIXMAN_FORMAT_IS_WIDE (image->bits.format))
+ flags &= ~FAST_PATH_NARROW_FORMAT;
++
++ if (image->bits.format == PIXMAN_r5g6b5)
++ flags |= FAST_PATH_16_FORMAT;
++
+ break;
+
+ case RADIAL:
+ code = PIXMAN_unknown;
+
+ /*
+ * As explained in pixman-radial-gradient.c, every point of
+ * the plane has a valid associated radius (and thus will be
+diff --git a/gfx/cairo/libpixman/src/pixman-implementation.c b/gfx/cairo/libpixman/src/pixman-implementation.c
+--- a/gfx/cairo/libpixman/src/pixman-implementation.c
++++ b/gfx/cairo/libpixman/src/pixman-implementation.c
+@@ -101,45 +101,51 @@ pixman_implementation_t *
+ imp->fill = delegate_fill;
+ imp->src_iter_init = delegate_src_iter_init;
+ imp->dest_iter_init = delegate_dest_iter_init;
+
+ imp->fast_paths = fast_paths;
+
+ for (i = 0; i < PIXMAN_N_OPERATORS; ++i)
+ {
++ imp->combine_16[i] = NULL;
+ imp->combine_32[i] = NULL;
+ imp->combine_64[i] = NULL;
+ imp->combine_32_ca[i] = NULL;
+ imp->combine_64_ca[i] = NULL;
+ }
+
+ return imp;
+ }
+
+ pixman_combine_32_func_t
+ _pixman_implementation_lookup_combiner (pixman_implementation_t *imp,
+ pixman_op_t op,
+ pixman_bool_t component_alpha,
+- pixman_bool_t narrow)
++ pixman_bool_t narrow,
++ pixman_bool_t rgb16)
+ {
+ pixman_combine_32_func_t f;
+
+ do
+ {
+ pixman_combine_32_func_t (*combiners[]) =
+ {
+ (pixman_combine_32_func_t *)imp->combine_64,
+ (pixman_combine_32_func_t *)imp->combine_64_ca,
+ imp->combine_32,
+ imp->combine_32_ca,
++ (pixman_combine_32_func_t *)imp->combine_16,
++ NULL,
+ };
+-
+- f = combiners[component_alpha | (narrow << 1)][op];
+-
++ if (rgb16) {
++ f = combiners[4][op];
++ } else {
++ f = combiners[component_alpha + (narrow << 1)][op];
++ }
+ imp = imp->delegate;
+ }
+ while (!f);
+
+ return f;
+ }
+
+ pixman_bool_t
+diff --git a/gfx/cairo/libpixman/src/pixman-linear-gradient.c b/gfx/cairo/libpixman/src/pixman-linear-gradient.c
+--- a/gfx/cairo/libpixman/src/pixman-linear-gradient.c
++++ b/gfx/cairo/libpixman/src/pixman-linear-gradient.c
+@@ -217,42 +217,185 @@ linear_get_scanline_narrow (pixman_iter_
+ }
+ }
+
+ iter->y++;
+
+ return iter->buffer;
+ }
+
++static uint16_t convert_8888_to_0565(uint32_t color)
++{
++ return CONVERT_8888_TO_0565(color);
++}
++
++static uint32_t *
++linear_get_scanline_16 (pixman_iter_t *iter,
++ const uint32_t *mask)
++{
++ pixman_image_t *image = iter->image;
++ int x = iter->x;
++ int y = iter->y;
++ int width = iter->width;
++ uint16_t * buffer = (uint16_t*)iter->buffer;
++
++ pixman_vector_t v, unit;
++ pixman_fixed_32_32_t l;
++ pixman_fixed_48_16_t dx, dy;
++ gradient_t *gradient = (gradient_t *)image;
++ linear_gradient_t *linear = (linear_gradient_t *)image;
++ uint16_t *end = buffer + width;
++ pixman_gradient_walker_t walker;
++
++ _pixman_gradient_walker_init (&walker, gradient, image->common.repeat);
++
++ /* reference point is the center of the pixel */
++ v.vector[0] = pixman_int_to_fixed (x) + pixman_fixed_1 / 2;
++ v.vector[1] = pixman_int_to_fixed (y) + pixman_fixed_1 / 2;
++ v.vector[2] = pixman_fixed_1;
++
++ if (image->common.transform)
++ {
++ if (!pixman_transform_point_3d (image->common.transform, &v))
++ return iter->buffer;
++
++ unit.vector[0] = image->common.transform->matrix[0][0];
++ unit.vector[1] = image->common.transform->matrix[1][0];
++ unit.vector[2] = image->common.transform->matrix[2][0];
++ }
++ else
++ {
++ unit.vector[0] = pixman_fixed_1;
++ unit.vector[1] = 0;
++ unit.vector[2] = 0;
++ }
++
++ dx = linear->p2.x - linear->p1.x;
++ dy = linear->p2.y - linear->p1.y;
++
++ l = dx * dx + dy * dy;
++
++ if (l == 0 || unit.vector[2] == 0)
++ {
++ /* affine transformation only */
++ pixman_fixed_32_32_t t, next_inc;
++ double inc;
++
++ if (l == 0 || v.vector[2] == 0)
++ {
++ t = 0;
++ inc = 0;
++ }
++ else
++ {
++ double invden, v2;
++
++ invden = pixman_fixed_1 * (double) pixman_fixed_1 /
++ (l * (double) v.vector[2]);
++ v2 = v.vector[2] * (1. / pixman_fixed_1);
++ t = ((dx * v.vector[0] + dy * v.vector[1]) -
++ (dx * linear->p1.x + dy * linear->p1.y) * v2) * invden;
++ inc = (dx * unit.vector[0] + dy * unit.vector[1]) * invden;
++ }
++ next_inc = 0;
++
++ if (((pixman_fixed_32_32_t )(inc * width)) == 0)
++ {
++ register uint16_t color;
++
++ color = convert_8888_to_0565(_pixman_gradient_walker_pixel (&walker, t));
++ while (buffer < end)
++ *buffer++ = color;
++ }
++ else
++ {
++ int i;
++
++ i = 0;
++ while (buffer < end)
++ {
++ if (!mask || *mask++)
++ {
++ *buffer = convert_8888_to_0565(_pixman_gradient_walker_pixel (&walker,
++ t + next_inc));
++ }
++ i++;
++ next_inc = inc * i;
++ buffer++;
++ }
++ }
++ }
++ else
++ {
++ /* projective transformation */
++ double t;
++
++ t = 0;
++
++ while (buffer < end)
++ {
++ if (!mask || *mask++)
++ {
++ if (v.vector[2] != 0)
++ {
++ double invden, v2;
++
++ invden = pixman_fixed_1 * (double) pixman_fixed_1 /
++ (l * (double) v.vector[2]);
++ v2 = v.vector[2] * (1. / pixman_fixed_1);
++ t = ((dx * v.vector[0] + dy * v.vector[1]) -
++ (dx * linear->p1.x + dy * linear->p1.y) * v2) * invden;
++ }
++
++ *buffer = convert_8888_to_0565(_pixman_gradient_walker_pixel (&walker, t));
++ }
++
++ ++buffer;
++
++ v.vector[0] += unit.vector[0];
++ v.vector[1] += unit.vector[1];
++ v.vector[2] += unit.vector[2];
++ }
++ }
++
++ iter->y++;
++
++ return iter->buffer;
++}
++
+ static uint32_t *
+ linear_get_scanline_wide (pixman_iter_t *iter, const uint32_t *mask)
+ {
+ uint32_t *buffer = linear_get_scanline_narrow (iter, NULL);
+
+ pixman_expand ((uint64_t *)buffer, buffer, PIXMAN_a8r8g8b8, iter->width);
+
+ return buffer;
+ }
+
+ void
+ _pixman_linear_gradient_iter_init (pixman_image_t *image, pixman_iter_t *iter)
+ {
+ if (linear_gradient_is_horizontal (
+ iter->image, iter->x, iter->y, iter->width, iter->height))
+ {
+- if (iter->flags & ITER_NARROW)
++ if (iter->flags & ITER_16)
++ linear_get_scanline_16 (iter, NULL);
++ else if (iter->flags & ITER_NARROW)
+ linear_get_scanline_narrow (iter, NULL);
+ else
+ linear_get_scanline_wide (iter, NULL);
+
+ iter->get_scanline = _pixman_iter_get_scanline_noop;
+ }
+ else
+ {
+- if (iter->flags & ITER_NARROW)
++ if (iter->flags & ITER_16)
++ iter->get_scanline = linear_get_scanline_16;
++ else if (iter->flags & ITER_NARROW)
+ iter->get_scanline = linear_get_scanline_narrow;
+ else
+ iter->get_scanline = linear_get_scanline_wide;
+ }
+ }
+
+ PIXMAN_EXPORT pixman_image_t *
+ pixman_image_create_linear_gradient (pixman_point_fixed_t * p1,
+diff --git a/gfx/cairo/libpixman/src/pixman-private.h b/gfx/cairo/libpixman/src/pixman-private.h
+--- a/gfx/cairo/libpixman/src/pixman-private.h
++++ b/gfx/cairo/libpixman/src/pixman-private.h
+@@ -152,24 +152,28 @@ struct bits_image
+ int height;
+ uint32_t * bits;
+ uint32_t * free_me;
+ int rowstride; /* in number of uint32_t's */
+
+ fetch_scanline_t get_scanline_32;
+ fetch_scanline_t get_scanline_64;
+
++ fetch_scanline_t fetch_scanline_16;
++
+ fetch_scanline_t fetch_scanline_32;
+ fetch_pixel_32_t fetch_pixel_32;
+ store_scanline_t store_scanline_32;
+
+ fetch_scanline_t fetch_scanline_64;
+ fetch_pixel_64_t fetch_pixel_64;
+ store_scanline_t store_scanline_64;
+
++ store_scanline_t store_scanline_16;
++
+ /* Used for indirect access to the bits */
+ pixman_read_memory_func_t read_func;
+ pixman_write_memory_func_t write_func;
+ };
+
+ union pixman_image
+ {
+ image_type_t type;
+@@ -202,17 +206,24 @@ typedef enum
+ * destination.
+ *
+ * When he destination is xRGB, this is useful knowledge, because then
+ * we can treat it as if it were ARGB, which means in some cases we can
+ * avoid copying it to a temporary buffer.
+ */
+ ITER_LOCALIZED_ALPHA = (1 << 1),
+ ITER_IGNORE_ALPHA = (1 << 2),
+- ITER_IGNORE_RGB = (1 << 3)
++ ITER_IGNORE_RGB = (1 << 3),
++
++ /* With the addition of ITER_16 we now have two flags that to represent
++ * 3 pipelines. This means that there can be an invalid state when
++ * both ITER_NARROW and ITER_16 are set. In this case
++ * ITER_16 overrides NARROW and we should use the 16 bit pipeline.
++ * Note: ITER_16 still has a 32 bit mask, which is a bit weird. */
++ ITER_16 = (1 << 4)
+ } iter_flags_t;
+
+ struct pixman_iter_t
+ {
+ /* These are initialized by _pixman_implementation_{src,dest}_init */
+ pixman_image_t * image;
+ uint32_t * buffer;
+ int x, y;
+@@ -429,16 +440,17 @@ typedef pixman_bool_t (*pixman_fill_func
+ int x,
+ int y,
+ int width,
+ int height,
+ uint32_t xor);
+ typedef void (*pixman_iter_init_func_t) (pixman_implementation_t *imp,
+ pixman_iter_t *iter);
+
++void _pixman_setup_combiner_functions_16 (pixman_implementation_t *imp);
+ void _pixman_setup_combiner_functions_32 (pixman_implementation_t *imp);
+ void _pixman_setup_combiner_functions_64 (pixman_implementation_t *imp);
+
+ typedef struct
+ {
+ pixman_op_t op;
+ pixman_format_code_t src_format;
+ uint32_t src_flags;
+@@ -459,32 +471,34 @@ struct pixman_implementation_t
+ pixman_fill_func_t fill;
+ pixman_iter_init_func_t src_iter_init;
+ pixman_iter_init_func_t dest_iter_init;
+
+ pixman_combine_32_func_t combine_32[PIXMAN_N_OPERATORS];
+ pixman_combine_32_func_t combine_32_ca[PIXMAN_N_OPERATORS];
+ pixman_combine_64_func_t combine_64[PIXMAN_N_OPERATORS];
+ pixman_combine_64_func_t combine_64_ca[PIXMAN_N_OPERATORS];
++ pixman_combine_64_func_t combine_16[PIXMAN_N_OPERATORS];
+ };
+
+ uint32_t
+ _pixman_image_get_solid (pixman_implementation_t *imp,
+ pixman_image_t * image,
+ pixman_format_code_t format);
+
+ pixman_implementation_t *
+ _pixman_implementation_create (pixman_implementation_t *delegate,
+ const pixman_fast_path_t *fast_paths);
+
+ pixman_combine_32_func_t
+ _pixman_implementation_lookup_combiner (pixman_implementation_t *imp,
+ pixman_op_t op,
+ pixman_bool_t component_alpha,
+- pixman_bool_t wide);
++ pixman_bool_t wide,
++ pixman_bool_t rgb16);
+
+ pixman_bool_t
+ _pixman_implementation_blt (pixman_implementation_t *imp,
+ uint32_t * src_bits,
+ uint32_t * dst_bits,
+ int src_stride,
+ int dst_stride,
+ int src_bpp,
+@@ -613,16 +627,17 @@ uint32_t *
+ #define FAST_PATH_Y_UNIT_ZERO (1 << 18)
+ #define FAST_PATH_BILINEAR_FILTER (1 << 19)
+ #define FAST_PATH_ROTATE_90_TRANSFORM (1 << 20)
+ #define FAST_PATH_ROTATE_180_TRANSFORM (1 << 21)
+ #define FAST_PATH_ROTATE_270_TRANSFORM (1 << 22)
+ #define FAST_PATH_SAMPLES_COVER_CLIP_NEAREST (1 << 23)
+ #define FAST_PATH_SAMPLES_COVER_CLIP_BILINEAR (1 << 24)
+ #define FAST_PATH_BITS_IMAGE (1 << 25)
++#define FAST_PATH_16_FORMAT (1 << 26)
+
+ #define FAST_PATH_PAD_REPEAT \
+ (FAST_PATH_NO_NONE_REPEAT | \
+ FAST_PATH_NO_NORMAL_REPEAT | \
+ FAST_PATH_NO_REFLECT_REPEAT)
+
+ #define FAST_PATH_NORMAL_REPEAT \
+ (FAST_PATH_NO_NONE_REPEAT | \
+diff --git a/gfx/cairo/libpixman/src/pixman-radial-gradient.c b/gfx/cairo/libpixman/src/pixman-radial-gradient.c
+--- a/gfx/cairo/libpixman/src/pixman-radial-gradient.c
++++ b/gfx/cairo/libpixman/src/pixman-radial-gradient.c
+@@ -395,35 +395,289 @@ radial_get_scanline_narrow (pixman_iter_
+ v.vector[2] += unit.vector[2];
+ }
+ }
+
+ iter->y++;
+ return iter->buffer;
+ }
+
++static uint16_t convert_8888_to_0565(uint32_t color)
++{
++ return CONVERT_8888_TO_0565(color);
++}
++
++static uint32_t *
++radial_get_scanline_16 (pixman_iter_t *iter, const uint32_t *mask)
++{
++ /*
++ * Implementation of radial gradients following the PDF specification.
++ * See section 8.7.4.5.4 Type 3 (Radial) Shadings of the PDF Reference
++ * Manual (PDF 32000-1:2008 at the time of this writing).
++ *
++ * In the radial gradient problem we are given two circles (c₁,r₁) and
++ * (c₂,r₂) that define the gradient itself.
++ *
++ * Mathematically the gradient can be defined as the family of circles
++ *
++ * ((1-t)·c₁ + t·(c₂), (1-t)·r₁ + t·r₂)
++ *
++ * excluding those circles whose radius would be < 0. When a point
++ * belongs to more than one circle, the one with a bigger t is the only
++ * one that contributes to its color. When a point does not belong
++ * to any of the circles, it is transparent black, i.e. RGBA (0, 0, 0, 0).
++ * Further limitations on the range of values for t are imposed when
++ * the gradient is not repeated, namely t must belong to [0,1].
++ *
++ * The graphical result is the same as drawing the valid (radius > 0)
++ * circles with increasing t in [-inf, +inf] (or in [0,1] if the gradient
++ * is not repeated) using SOURCE operator composition.
++ *
++ * It looks like a cone pointing towards the viewer if the ending circle
++ * is smaller than the starting one, a cone pointing inside the page if
++ * the starting circle is the smaller one and like a cylinder if they
++ * have the same radius.
++ *
++ * What we actually do is, given the point whose color we are interested
++ * in, compute the t values for that point, solving for t in:
++ *
++ * length((1-t)·c₁ + t·(c₂) - p) = (1-t)·r₁ + t·r₂
++ *
++ * Let's rewrite it in a simpler way, by defining some auxiliary
++ * variables:
++ *
++ * cd = c₂ - c₁
++ * pd = p - c₁
++ * dr = r₂ - r₁
++ * length(t·cd - pd) = r₁ + t·dr
++ *
++ * which actually means
++ *
++ * hypot(t·cdx - pdx, t·cdy - pdy) = r₁ + t·dr
++ *
++ * or
++ *
++ * ⎷((t·cdx - pdx)² + (t·cdy - pdy)²) = r₁ + t·dr.
++ *
++ * If we impose (as stated earlier) that r₁ + t·dr >= 0, it becomes:
++ *
++ * (t·cdx - pdx)² + (t·cdy - pdy)² = (r₁ + t·dr)²
++ *
++ * where we can actually expand the squares and solve for t:
++ *
++ * t²cdx² - 2t·cdx·pdx + pdx² + t²cdy² - 2t·cdy·pdy + pdy² =
++ * = r₁² + 2·r₁·t·dr + t²·dr²
++ *
++ * (cdx² + cdy² - dr²)t² - 2(cdx·pdx + cdy·pdy + r₁·dr)t +
++ * (pdx² + pdy² - r₁²) = 0
++ *
++ * A = cdx² + cdy² - dr²
++ * B = pdx·cdx + pdy·cdy + r₁·dr
++ * C = pdx² + pdy² - r₁²
++ * At² - 2Bt + C = 0
++ *
++ * The solutions (unless the equation degenerates because of A = 0) are:
++ *
++ * t = (B ± ⎷(B² - A·C)) / A
++ *
++ * The solution we are going to prefer is the bigger one, unless the
++ * radius associated to it is negative (or it falls outside the valid t
++ * range).
++ *
++ * Additional observations (useful for optimizations):
++ * A does not depend on p
++ *
++ * A < 0 <=> one of the two circles completely contains the other one
++ * <=> for every p, the radiuses associated with the two t solutions
++ * have opposite sign
++ */
++ pixman_image_t *image = iter->image;
++ int x = iter->x;
++ int y = iter->y;
++ int width = iter->width;
++ uint16_t *buffer = iter->buffer;
++
++ gradient_t *gradient = (gradient_t *)image;
++ radial_gradient_t *radial = (radial_gradient_t *)image;
++ uint16_t *end = buffer + width;
++ pixman_gradient_walker_t walker;
++ pixman_vector_t v, unit;
++
++ /* reference point is the center of the pixel */
++ v.vector[0] = pixman_int_to_fixed (x) + pixman_fixed_1 / 2;
++ v.vector[1] = pixman_int_to_fixed (y) + pixman_fixed_1 / 2;
++ v.vector[2] = pixman_fixed_1;
++
++ _pixman_gradient_walker_init (&walker, gradient, image->common.repeat);
++
++ if (image->common.transform)
++ {
++ if (!pixman_transform_point_3d (image->common.transform, &v))
++ return iter->buffer;
++
++ unit.vector[0] = image->common.transform->matrix[0][0];
++ unit.vector[1] = image->common.transform->matrix[1][0];
++ unit.vector[2] = image->common.transform->matrix[2][0];
++ }
++ else
++ {
++ unit.vector[0] = pixman_fixed_1;
++ unit.vector[1] = 0;
++ unit.vector[2] = 0;
++ }
++
++ if (unit.vector[2] == 0 && v.vector[2] == pixman_fixed_1)
++ {
++ /*
++ * Given:
++ *
++ * t = (B ± ⎷(B² - A·C)) / A
++ *
++ * where
++ *
++ * A = cdx² + cdy² - dr²
++ * B = pdx·cdx + pdy·cdy + r₁·dr
++ * C = pdx² + pdy² - r₁²
++ * det = B² - A·C
++ *
++ * Since we have an affine transformation, we know that (pdx, pdy)
++ * increase linearly with each pixel,
++ *
++ * pdx = pdx₀ + n·ux,
++ * pdy = pdy₀ + n·uy,
++ *
++ * we can then express B, C and det through multiple differentiation.
++ */
++ pixman_fixed_32_32_t b, db, c, dc, ddc;
++
++ /* warning: this computation may overflow */
++ v.vector[0] -= radial->c1.x;
++ v.vector[1] -= radial->c1.y;
++
++ /*
++ * B and C are computed and updated exactly.
++ * If fdot was used instead of dot, in the worst case it would
++ * lose 11 bits of precision in each of the multiplication and
++ * summing up would zero out all the bit that were preserved,
++ * thus making the result 0 instead of the correct one.
++ * This would mean a worst case of unbound relative error or
++ * about 2^10 absolute error
++ */
++ b = dot (v.vector[0], v.vector[1], radial->c1.radius,
++ radial->delta.x, radial->delta.y, radial->delta.radius);
++ db = dot (unit.vector[0], unit.vector[1], 0,
++ radial->delta.x, radial->delta.y, 0);
++
++ c = dot (v.vector[0], v.vector[1],
++ -((pixman_fixed_48_16_t) radial->c1.radius),
++ v.vector[0], v.vector[1], radial->c1.radius);
++ dc = dot (2 * (pixman_fixed_48_16_t) v.vector[0] + unit.vector[0],
++ 2 * (pixman_fixed_48_16_t) v.vector[1] + unit.vector[1],
++ 0,
++ unit.vector[0], unit.vector[1], 0);
++ ddc = 2 * dot (unit.vector[0], unit.vector[1], 0,
++ unit.vector[0], unit.vector[1], 0);
++
++ while (buffer < end)
++ {
++ if (!mask || *mask++)
++ {
++ *buffer = convert_8888_to_0565(
++ radial_compute_color (radial->a, b, c,
++ radial->inva,
++ radial->delta.radius,
++ radial->mindr,
++ &walker,
++ image->common.repeat));
++ }
++
++ b += db;
++ c += dc;
++ dc += ddc;
++ ++buffer;
++ }
++ }
++ else
++ {
++ /* projective */
++ /* Warning:
++ * error propagation guarantees are much looser than in the affine case
++ */
++ while (buffer < end)
++ {
++ if (!mask || *mask++)
++ {
++ if (v.vector[2] != 0)
++ {
++ double pdx, pdy, invv2, b, c;
++
++ invv2 = 1. * pixman_fixed_1 / v.vector[2];
++
++ pdx = v.vector[0] * invv2 - radial->c1.x;
++ /* / pixman_fixed_1 */
++
++ pdy = v.vector[1] * invv2 - radial->c1.y;
++ /* / pixman_fixed_1 */
++
++ b = fdot (pdx, pdy, radial->c1.radius,
++ radial->delta.x, radial->delta.y,
++ radial->delta.radius);
++ /* / pixman_fixed_1 / pixman_fixed_1 */
++
++ c = fdot (pdx, pdy, -radial->c1.radius,
++ pdx, pdy, radial->c1.radius);
++ /* / pixman_fixed_1 / pixman_fixed_1 */
++
++ *buffer = convert_8888_to_0565 (
++ radial_compute_color (radial->a, b, c,
++ radial->inva,
++ radial->delta.radius,
++ radial->mindr,
++ &walker,
++ image->common.repeat));
++ }
++ else
++ {
++ *buffer = 0;
++ }
++ }
++
++ ++buffer;
++
++ v.vector[0] += unit.vector[0];
++ v.vector[1] += unit.vector[1];
++ v.vector[2] += unit.vector[2];
++ }
++ }
++
++ iter->y++;
++ return iter->buffer;
++}
+ static uint32_t *
+ radial_get_scanline_wide (pixman_iter_t *iter, const uint32_t *mask)
+ {
+ uint32_t *buffer = radial_get_scanline_narrow (iter, NULL);
+
+ pixman_expand ((uint64_t *)buffer, buffer, PIXMAN_a8r8g8b8, iter->width);
+
+ return buffer;
+ }
+
+ void
+ _pixman_radial_gradient_iter_init (pixman_image_t *image, pixman_iter_t *iter)
+ {
+- if (iter->flags & ITER_NARROW)
++ if (iter->flags & ITER_16)
++ iter->get_scanline = radial_get_scanline_16;
++ else if (iter->flags & ITER_NARROW)
+ iter->get_scanline = radial_get_scanline_narrow;
+ else
+ iter->get_scanline = radial_get_scanline_wide;
+ }
+
++
+ PIXMAN_EXPORT pixman_image_t *
+ pixman_image_create_radial_gradient (pixman_point_fixed_t * inner,
+ pixman_point_fixed_t * outer,
+ pixman_fixed_t inner_radius,
+ pixman_fixed_t outer_radius,
+ const pixman_gradient_stop_t *stops,
+ int n_stops)
+ {