Pass TRUE instead of FALSE to do what the comment says.

[chaz/openbox] / render / gradient.c
diff --git a/render/gradient.c b/render/gradient.c

index d2cb6814cc9336b792e19e9a3ce5e01807d15c1d..fc75047f3a570b3f266025fb1c30206893bac1bc 100644 (file)
--- a/render/gradient.c
+++ b/render/gradient.c
@@ -2,7 +2,7 @@
  
     gradient.c for the Openbox window manager
     Copyright (c) 2006        Mikael Magnusson
  
     gradient.c for the Openbox window manager
     Copyright (c) 2006        Mikael Magnusson
-   Copyright (c) 2003        Ben Jansens
+   Copyright (c) 2003-2008   Dana Jansens
     Copyright (c) 2003        Derek Foreman
  
     This program is free software; you can redistribute it and/or modify
     Copyright (c) 2003        Derek Foreman
  
     This program is free software; you can redistribute it and/or modify
@@ -22,8 +22,11 @@
  #include "gradient.h"
  #include "color.h"
  #include <glib.h>
  #include "gradient.h"
  #include "color.h"
  #include <glib.h>
+#include <string.h>
  
  
-static void highlight(RrPixel32 *x, RrPixel32 *y, gboolean raised);
+static void highlight(RrSurface *s, RrPixel32 *x, RrPixel32 *y,
+                      gboolean raised);
+static void gradient_parentrelative(RrAppearance *a, gint w, gint h);
  static void gradient_solid(RrAppearance *l, gint w, gint h);
  static void gradient_splitvertical(RrAppearance *a, gint w, gint h);
  static void gradient_vertical(RrSurface *sf, gint w, gint h);
  static void gradient_solid(RrAppearance *l, gint w, gint h);
  static void gradient_splitvertical(RrAppearance *a, gint w, gint h);
  static void gradient_vertical(RrSurface *sf, gint w, gint h);
@@ -41,6 +44,9 @@ void RrRender(RrAppearance *a, gint w, gint h)
      gint off, x;
  
      switch (a->surface.grad) {
      gint off, x;
  
      switch (a->surface.grad) {
+    case RR_SURFACE_PARENTREL:
+        gradient_parentrelative(a, w, h);
+        break;
      case RR_SURFACE_SOLID:
          gradient_solid(a, w, h);
          break;
      case RR_SURFACE_SOLID:
          gradient_solid(a, w, h);
          break;
@@ -69,7 +75,7 @@ void RrRender(RrAppearance *a, gint w, gint h)
          g_assert_not_reached(); /* unhandled gradient */
          return;
      }
          g_assert_not_reached(); /* unhandled gradient */
          return;
      }
-  
+
      if (a->surface.interlaced) {
          gint i;
          RrPixel32 *p;
      if (a->surface.interlaced) {
          gint i;
          RrPixel32 *p;
@@ -106,29 +112,29 @@ void RrRender(RrAppearance *a, gint w, gint h)
      if (a->surface.relief != RR_RELIEF_FLAT) {
          if (a->surface.bevel == RR_BEVEL_1) {
              for (off = 1, x = 1; x < w - 1; ++x, off++)
      if (a->surface.relief != RR_RELIEF_FLAT) {
          if (a->surface.bevel == RR_BEVEL_1) {
              for (off = 1, x = 1; x < w - 1; ++x, off++)
-                highlight(data + off,
+                highlight(&a->surface, data + off,
                            data + off + (h-1) * w,
                            a->surface.relief==RR_RELIEF_RAISED);
              for (off = 0, x = 0; x < h; ++x, off++)
                            data + off + (h-1) * w,
                            a->surface.relief==RR_RELIEF_RAISED);
              for (off = 0, x = 0; x < h; ++x, off++)
-                highlight(data + off * w,
+                highlight(&a->surface, data + off * w,
                            data + off * w + w - 1,
                            a->surface.relief==RR_RELIEF_RAISED);
          }
  
          if (a->surface.bevel == RR_BEVEL_2) {
              for (off = 2, x = 2; x < w - 2; ++x, off++)
                            data + off * w + w - 1,
                            a->surface.relief==RR_RELIEF_RAISED);
          }
  
          if (a->surface.bevel == RR_BEVEL_2) {
              for (off = 2, x = 2; x < w - 2; ++x, off++)
-                highlight(data + off + w,
+                highlight(&a->surface, data + off + w,
                            data + off + (h-2) * w,
                            a->surface.relief==RR_RELIEF_RAISED);
              for (off = 1, x = 1; x < h-1; ++x, off++)
                            data + off + (h-2) * w,
                            a->surface.relief==RR_RELIEF_RAISED);
              for (off = 1, x = 1; x < h-1; ++x, off++)
-                highlight(data + off * w + 1,
+                highlight(&a->surface, data + off * w + 1,
                            data + off * w + w - 2,
                            a->surface.relief==RR_RELIEF_RAISED);
          }
      }
  }
  
                            data + off * w + w - 2,
                            a->surface.relief==RR_RELIEF_RAISED);
          }
      }
  }
  
-static void highlight(RrPixel32 *x, RrPixel32 *y, gboolean raised)
+static void highlight(RrSurface *s, RrPixel32 *x, RrPixel32 *y, gboolean raised)
  {
      gint r, g, b;
  
  {
      gint r, g, b;
  
@@ -140,24 +146,25 @@ static void highlight(RrPixel32 *x, RrPixel32 *y, gboolean raised)
          up = y;
          down = x;
      }
          up = y;
          down = x;
      }
+
      r = (*up >> RrDefaultRedOffset) & 0xFF;
      r = (*up >> RrDefaultRedOffset) & 0xFF;
-    r += r >> 1;
+    r += (r * s->bevel_light_adjust) >> 8;
      g = (*up >> RrDefaultGreenOffset) & 0xFF;
      g = (*up >> RrDefaultGreenOffset) & 0xFF;
-    g += g >> 1;
+    g += (g * s->bevel_light_adjust) >> 8;
      b = (*up >> RrDefaultBlueOffset) & 0xFF;
      b = (*up >> RrDefaultBlueOffset) & 0xFF;
-    b += b >> 1;
+    b += (b * s->bevel_light_adjust) >> 8;
      if (r > 0xFF) r = 0xFF;
      if (g > 0xFF) g = 0xFF;
      if (b > 0xFF) b = 0xFF;
      *up = (r << RrDefaultRedOffset) + (g << RrDefaultGreenOffset)
          + (b << RrDefaultBlueOffset);
      if (r > 0xFF) r = 0xFF;
      if (g > 0xFF) g = 0xFF;
      if (b > 0xFF) b = 0xFF;
      *up = (r << RrDefaultRedOffset) + (g << RrDefaultGreenOffset)
          + (b << RrDefaultBlueOffset);
-  
+
      r = (*down >> RrDefaultRedOffset) & 0xFF;
      r = (*down >> RrDefaultRedOffset) & 0xFF;
-    r = (r >> 1) + (r >> 2);
+    r -= (r * s->bevel_dark_adjust) >> 8;
      g = (*down >> RrDefaultGreenOffset) & 0xFF;
      g = (*down >> RrDefaultGreenOffset) & 0xFF;
-    g = (g >> 1) + (g >> 2);
+    g -= (g * s->bevel_dark_adjust) >> 8;
      b = (*down >> RrDefaultBlueOffset) & 0xFF;
      b = (*down >> RrDefaultBlueOffset) & 0xFF;
-    b = (b >> 1) + (b >> 2);
+    b -= (b * s->bevel_dark_adjust) >> 8;
      *down = (r << RrDefaultRedOffset) + (g << RrDefaultGreenOffset)
          + (b << RrDefaultBlueOffset);
  }
      *down = (r << RrDefaultRedOffset) + (g << RrDefaultGreenOffset)
          + (b << RrDefaultBlueOffset);
  }
@@ -168,11 +175,11 @@ static void create_bevel_colors(RrAppearance *l)
  
      /* light color */
      r = l->surface.primary->r;
  
      /* light color */
      r = l->surface.primary->r;
-    r += r >> 1;
+    r += (r * l->surface.bevel_light_adjust) >> 8;
      g = l->surface.primary->g;
      g = l->surface.primary->g;
-    g += g >> 1;
+    g += (g * l->surface.bevel_light_adjust) >> 8;
      b = l->surface.primary->b;
      b = l->surface.primary->b;
-    b += b >> 1;
+    b += (b * l->surface.bevel_light_adjust) >> 8;
      if (r > 0xFF) r = 0xFF;
      if (g > 0xFF) g = 0xFF;
      if (b > 0xFF) b = 0xFF;
      if (r > 0xFF) r = 0xFF;
      if (g > 0xFF) g = 0xFF;
      if (b > 0xFF) b = 0xFF;
@@ -181,16 +188,135 @@ static void create_bevel_colors(RrAppearance *l)
  
      /* dark color */
      r = l->surface.primary->r;
  
      /* dark color */
      r = l->surface.primary->r;
-    r = (r >> 1) + (r >> 2);
+    r -= (r * l->surface.bevel_dark_adjust) >> 8;
      g = l->surface.primary->g;
      g = l->surface.primary->g;
-    g = (g >> 1) + (g >> 2);
+    g -= (g * l->surface.bevel_dark_adjust) >> 8;
      b = l->surface.primary->b;
      b = l->surface.primary->b;
-    b = (b >> 1) + (b >> 2);
+    b -= (b * l->surface.bevel_dark_adjust) >> 8;
      g_assert(!l->surface.bevel_dark);
      l->surface.bevel_dark = RrColorNew(l->inst, r, g, b);
  }
  
      g_assert(!l->surface.bevel_dark);
      l->surface.bevel_dark = RrColorNew(l->inst, r, g, b);
  }
  
-static void gradient_solid(RrAppearance *l, gint w, gint h) 
+/*! Repeat the first pixel over the entire block of memory
+  @param start The block of memory. start[0] will be copied
+         to the rest of the block.
+  @param w The width of the block of memory (including the already-set first
+           element)
+*/
+static inline void repeat_pixel(RrPixel32 *start, gint w)
+{
+    gint x;
+    RrPixel32 *dest;
+
+    dest = start + 1;
+
+    /* for really small things, just copy ourselves */
+    if (w < 8) {
+        for (x = w-1; x > 0; --x)
+            *(dest++) = *start;
+    }
+
+    /* for >= 8, then use O(log n) memcpy's... */
+    else {
+        gchar *cdest;
+        gint lenbytes;
+
+        /* copy the first 3 * 32 bits (3 words) ourselves - then we have
+           3 + the original 1 = 4 words to make copies of at a time
+
+           this is faster than doing memcpy for 1 or 2 words at a time
+        */
+        for (x = 3; x > 0; --x)
+            *(dest++) = *start;
+
+        /* cdest is a pointer to the pixel data that is typed char* so that
+           adding 1 to its position moves it only one byte
+
+           lenbytes is the amount of bytes that we will be copying each
+           iteration.  this doubles each time through the loop.
+
+           x is the number of bytes left to copy into.  lenbytes will always
+           be bounded by x
+
+           this loop will run O(log n) times (n is the number of bytes we
+           need to copy into), since the size of the copy is doubled each
+           iteration.  it seems that gcc does some nice optimizations to make
+           this memcpy very fast on hardware with support for vector operations
+           such as mmx or sse.  here is an idea of the kind of speed up we are
+           getting by doing this (splitvertical3 switches from doing
+           "*(data++) = color" n times to doing this memcpy thing log n times):
+
+           %   cumulative   self              self     total           
+           time   seconds   seconds    calls  ms/call  ms/call  name    
+           49.44      0.88     0.88     1063     0.83     0.83  splitvertical1
+           47.19      1.72     0.84     1063     0.79     0.79  splitvertical2
+            2.81      1.77     0.05     1063     0.05     0.05  splitvertical3
+        */
+        cdest = (gchar*)dest;
+        lenbytes = 4 * sizeof(RrPixel32);
+        for (x = (w - 4) * sizeof(RrPixel32); x > 0;) {
+            memcpy(cdest, start, lenbytes);
+            x -= lenbytes;
+            cdest += lenbytes;
+            lenbytes <<= 1;
+            if (lenbytes > x)
+                lenbytes = x;
+        }
+    }
+}
+
+static void gradient_parentrelative(RrAppearance *a, gint w, gint h)
+{
+    RrPixel32 *source, *dest;
+    gint sw, sh, partial_w, partial_h, i;
+
+    g_assert (a->surface.parent);
+    g_assert (a->surface.parent->w);
+
+    sw = a->surface.parent->w;
+    sh = a->surface.parent->h;
+
+    /* This is a little hack. When a texture is parentrelative, and the same
+       area as the parent, and has a bevel, it will draw its bevel on top
+       of the parent's, amplifying it. So instead, rerender the child with
+       the parent's settings, but the child's bevel and interlace */
+    if (a->surface.relief != RR_RELIEF_FLAT &&
+        (a->surface.parent->surface.relief != RR_RELIEF_FLAT ||
+         a->surface.parent->surface.border) &&
+        !a->surface.parentx && !a->surface.parenty &&
+        sw == w && sh == h)
+    {
+        RrSurface old = a->surface;
+        a->surface = a->surface.parent->surface;
+
+        /* turn these off for the parent */
+        a->surface.relief = RR_RELIEF_FLAT;
+        a->surface.border = FALSE;
+
+        a->surface.pixel_data = old.pixel_data;
+
+        RrRender(a, w, h);
+        a->surface = old;
+    } else {
+        source = (a->surface.parent->surface.pixel_data +
+                  a->surface.parentx + sw * a->surface.parenty);
+        dest = a->surface.pixel_data;
+
+        if (a->surface.parentx + w > sw) {
+            partial_w = sw - a->surface.parentx;
+        } else partial_w = w;
+
+        if (a->surface.parenty + h > sh) {
+            partial_h = sh - a->surface.parenty;
+        } else partial_h = h;
+
+        for (i = 0; i < partial_h; i++, source += sw, dest += w) {
+            memcpy(dest, source, partial_w * sizeof(RrPixel32));
+        }
+    }
+}
+
+static void gradient_solid(RrAppearance *l, gint w, gint h)
  {
      gint i;
      RrPixel32 pix;
  {
      gint i;
      RrPixel32 pix;
@@ -222,7 +348,7 @@ static void gradient_solid(RrAppearance *l, gint w, gint h)
                        left, bottom, right, bottom);
              XDrawLine(RrDisplay(l->inst), l->pixmap, RrColorGC(sp->bevel_dark),
                        right, bottom, right, top);
                        left, bottom, right, bottom);
              XDrawLine(RrDisplay(l->inst), l->pixmap, RrColorGC(sp->bevel_dark),
                        right, bottom, right, top);
-                
+
              XDrawLine(RrDisplay(l->inst), l->pixmap,RrColorGC(sp->bevel_light),
                        left, top, right, top);
              XDrawLine(RrDisplay(l->inst), l->pixmap,RrColorGC(sp->bevel_light),
              XDrawLine(RrDisplay(l->inst), l->pixmap,RrColorGC(sp->bevel_light),
                        left, top, right, top);
              XDrawLine(RrDisplay(l->inst), l->pixmap,RrColorGC(sp->bevel_light),
@@ -253,7 +379,7 @@ static void gradient_solid(RrAppearance *l, gint w, gint h)
                        left, bottom, right, bottom);
              XDrawLine(RrDisplay(l->inst), l->pixmap,RrColorGC(sp->bevel_light),
                        right, bottom, right, top);
                        left, bottom, right, bottom);
              XDrawLine(RrDisplay(l->inst), l->pixmap,RrColorGC(sp->bevel_light),
                        right, bottom, right, top);
-      
+
              XDrawLine(RrDisplay(l->inst), l->pixmap, RrColorGC(sp->bevel_dark),
                        left, top, right, top);
              XDrawLine(RrDisplay(l->inst), l->pixmap, RrColorGC(sp->bevel_dark),
              XDrawLine(RrDisplay(l->inst), l->pixmap, RrColorGC(sp->bevel_dark),
                        left, top, right, top);
              XDrawLine(RrDisplay(l->inst), l->pixmap, RrColorGC(sp->bevel_dark),
@@ -281,7 +407,7 @@ static void gradient_solid(RrAppearance *l, gint w, gint h)
                             left, top, right, bottom);
          }
          break;
                             left, top, right, bottom);
          }
          break;
-    default:  
+    default:
          g_assert_not_reached(); /* unhandled ReliefType */
      }
  }
          g_assert_not_reached(); /* unhandled ReliefType */
      }
  }
@@ -365,146 +491,172 @@ static void gradient_solid(RrAppearance *l, gint w, gint h)
  
  static void gradient_splitvertical(RrAppearance *a, gint w, gint h)
  {
  
  static void gradient_splitvertical(RrAppearance *a, gint w, gint h)
  {
-    gint x, y1, y3, r, g, b;
+    gint y1, y2, y3;
      RrSurface *sf = &a->surface;
      RrSurface *sf = &a->surface;
-    RrPixel32 *data = sf->pixel_data;
-    RrPixel32 current;
-    RrColor *primary_light, *secondary_light;
-
-    r = sf->primary->r;
-    r += r >> 2;
-    g = sf->primary->g;
-    g += g >> 2;
-    b = sf->primary->b;
-    b += b >> 2;
-    if (r > 0xFF) r = 0xFF;
-    if (g > 0xFF) g = 0xFF;
-    if (b > 0xFF) b = 0xFF;
-      primary_light = RrColorNew(a->inst, r, g, b);
-
-    r = sf->secondary->r;
-    r += r >> 4;
-    g = sf->secondary->g;
-    g += g >> 4;
-    b = sf->secondary->b;
-    b += b >> 4;
-    if (r > 0xFF) r = 0xFF;
-    if (g > 0xFF) g = 0xFF;
-    if (b > 0xFF) b = 0xFF;
-    secondary_light = RrColorNew(a->inst, r, g, b);
+    RrPixel32 *data;
+    gint y1sz, y2sz, y3sz;
  
      VARS(y1);
  
      VARS(y1);
-    SETUP(y1, primary_light, sf->primary, (h / 2) -1);
-  
+    VARS(y2);
      VARS(y3);
      VARS(y3);
-    SETUP(y3, sf->secondary, secondary_light,  (h / 2) -1);
  
  
-    for (y1 = h - 1; y1 > (h / 2) -1; --y1) {  /* 0 -> h-1 */
-        current = COLOR(y1);
-        for (x = w - 1; x >= 0; --x)  /* 0 -> w */
-            *(data++) = current;
+    /* if h <= 5, then a 0 or 1px middle gradient.
+       if h > 5, then always a 1px middle gradient.
+    */
+    if (h <= 5) {
+        y1sz = MAX(h/2, 0);
+        y2sz = (h < 3 ? 0 : h % 2);
+        y3sz = MAX(h/2, 1);
+    }
+    else {
+        y1sz = h/2 - (1 - (h % 2));
+        y2sz = 1;
+        y3sz = h/2;
+    }
  
  
-        NEXT(y1);
+    SETUP(y1, sf->split_primary, sf->primary, y1sz);
+    if (y2sz) {
+        /* setup to get the colors _in between_ these other 2 */
+        SETUP(y2, sf->primary, sf->secondary, y2sz + 2);
+        NEXT(y2); /* skip the first one, it's the same as the last of y1 */
      }
      }
+    SETUP(y3, sf->secondary, sf->split_secondary,  y3sz);
  
  
-    
-    for (y3 = (h / 2) - 1; y3 > 0; --y3) {
-        current = COLOR(y3);
-        for (x = w - 1; x >= 0; --x)
-            *(data++) = current;
+    /* find the color for the first pixel of each row first */
+    data = sf->pixel_data;
  
  
+    for (y1 = y1sz-1; y1 > 0; --y1) {
+        *data = COLOR(y1);
+        data += w;
+        NEXT(y1);
+    }
+    *data = COLOR(y1);
+    data += w;
+    for (y2 = y2sz-1; y2 > 0; --y2) {
+        *data = COLOR(y2);
+        data += w;
+        NEXT(y2);
+    }
+    *data = COLOR(y2);
+    data += w;
+    for (y3 = y3sz-1; y3 > 0; --y3) {
+        *data = COLOR(y3);
+        data += w;
          NEXT(y3);
      }
          NEXT(y3);
      }
+    *data = COLOR(y3);
  
  
-    current = COLOR(y3);
-    for (x = w - 1; x >= 0; --x)  /* 0 -> w */
-        *(data++) = current;
-
-    RrColorFree(primary_light);
-    RrColorFree(secondary_light);
+    /* copy the first pixels into the whole rows */
+    data = sf->pixel_data;
+    for (y1 = h; y1 > 0; --y1) {
+        repeat_pixel(data, w);
+        data += w;
+    }
  }
  
  static void gradient_horizontal(RrSurface *sf, gint w, gint h)
  {
  }
  
  static void gradient_horizontal(RrSurface *sf, gint w, gint h)
  {
-    gint x, y;
+    gint x, y, cpbytes;
      RrPixel32 *data = sf->pixel_data, *datav;
      RrPixel32 *data = sf->pixel_data, *datav;
-    RrPixel32 current;
+    gchar *datac;
  
      VARS(x);
      SETUP(x, sf->primary, sf->secondary, w);
  
  
      VARS(x);
      SETUP(x, sf->primary, sf->secondary, w);
  
-    for (x = w - 1; x > 0; --x) {  /* 0 -> w-1 */
-        current = COLOR(x);
-        datav = data;
-        for (y = h - 1; y >= 0; --y) {  /* 0 -> h */
-            *datav = current;
-            datav += w;
-        }
-        ++data;
-
+    /* set the color values for the first row */
+    datav = data;
+    for (x = w - 1; x > 0; --x) {  /* 0 -> w - 1 */
+        *datav = COLOR(x);
+        ++datav;
          NEXT(x);
      }
          NEXT(x);
      }
-    current = COLOR(x);
-    for (y = h - 1; y >= 0; --y)  /* 0 -> h */
-        *(data + y * w) = current;
+    *datav = COLOR(x);
+    ++datav;
+
+    /* copy the first row to the rest in O(log n) copies */
+    datac = (gchar*)datav;
+    cpbytes = 1 * w * sizeof(RrPixel32);
+    for (y = (h - 1) * w * sizeof(RrPixel32); y > 0;) {
+        memcpy(datac, data, cpbytes);
+        y -= cpbytes;
+        datac += cpbytes;
+        cpbytes <<= 1;
+        if (cpbytes > y)
+            cpbytes = y;
+    }
  }
  
  static void gradient_mirrorhorizontal(RrSurface *sf, gint w, gint h)
  {
  }
  
  static void gradient_mirrorhorizontal(RrSurface *sf, gint w, gint h)
  {
-    gint x, y;
+    gint x, y, half1, half2, cpbytes;
      RrPixel32 *data = sf->pixel_data, *datav;
      RrPixel32 *data = sf->pixel_data, *datav;
-    RrPixel32 current;
+    gchar *datac;
  
      VARS(x);
  
      VARS(x);
-    SETUP(x, sf->primary, sf->secondary, w/2);
-
-    for (x = w - 1; x > w/2-1; --x) {  /* 0 -> w-1 */
-        current = COLOR(x);
-        datav = data;
-        for (y = h - 1; y >= 0; --y) {  /* 0 -> h */
-            *datav = current;
-            datav += w;
-        }
-        ++data;
  
  
+    half1 = (w + 1) / 2;
+    half2 = w / 2;
+
+    /* set the color values for the first row */
+
+    SETUP(x, sf->primary, sf->secondary, half1);
+    datav = data;
+    for (x = half1 - 1; x > 0; --x) {  /* 0 -> half1 - 1 */
+        *datav = COLOR(x);
+        ++datav;
          NEXT(x);
      }
          NEXT(x);
      }
-    SETUP(x, sf->secondary, sf->primary, w/2);
-    for (x = w/2 - 1; x > 0; --x) {  /* 0 -> w-1 */
-        current = COLOR(x);
-        datav = data;
-        for (y = h - 1; y >= 0; --y) {  /* 0 -> h */
-            *datav = current;
-            datav += w;
+    *datav = COLOR(x);
+    ++datav;
+
+    if (half2 > 0) {
+        SETUP(x, sf->secondary, sf->primary, half2);
+        for (x = half2 - 1; x > 0; --x) {  /* 0 -> half2 - 1 */
+            *datav = COLOR(x);
+            ++datav;
+            NEXT(x);
          }
          }
-        ++data;
+        *datav = COLOR(x);
+        ++datav;
+    }
  
  
-        NEXT(x);
+    /* copy the first row to the rest in O(log n) copies */
+    datac = (gchar*)datav;
+    cpbytes = 1 * w * sizeof(RrPixel32);
+    for (y = (h - 1) * w * sizeof(RrPixel32); y > 0;) {
+        memcpy(datac, data, cpbytes);
+        y -= cpbytes;
+        datac += cpbytes;
+        cpbytes <<= 1;
+        if (cpbytes > y)
+            cpbytes = y;
      }
      }
-    current = COLOR(x);
-    for (y = h - 1; y >= 0; --y)  /* 0 -> h */
-        *(data + y * w) = current;
  }
  
  static void gradient_vertical(RrSurface *sf, gint w, gint h)
  {
  }
  
  static void gradient_vertical(RrSurface *sf, gint w, gint h)
  {
-    gint x, y;
-    RrPixel32 *data = sf->pixel_data;
-    RrPixel32 current;
+    gint y;
+    RrPixel32 *data;
  
      VARS(y);
      SETUP(y, sf->primary, sf->secondary, h);
  
  
      VARS(y);
      SETUP(y, sf->primary, sf->secondary, h);
  
-    for (y = h - 1; y > 0; --y) {  /* 0 -> h-1 */
-        current = COLOR(y);
-        for (x = w - 1; x >= 0; --x)  /* 0 -> w */
-            *(data++) = current;
+    /* find the color for the first pixel of each row first */
+    data = sf->pixel_data;
  
  
+    for (y = h - 1; y > 0; --y) {  /* 0 -> h-1 */
+        *data = COLOR(y);
+        data += w;
          NEXT(y);
      }
          NEXT(y);
      }
-    current = COLOR(y);
-    for (x = w - 1; x >= 0; --x)  /* 0 -> w */
-        *(data++) = current;
+    *data = COLOR(y);
+
+    /* copy the first pixels into the whole rows */
+    data = sf->pixel_data;
+    for (y = h; y > 0; --y) {
+        repeat_pixel(data, w);
+        data += w;
+    }
  }
  
  
  }
  
  
@@ -549,7 +701,7 @@ static void gradient_diagonal(RrSurface *sf, gint w, gint h)
  
      for (x = w - 1; x > 0; --x) {  /* 0 -> w-1 */
          *(data++) = COLOR(x);
  
      for (x = w - 1; x > 0; --x) {  /* 0 -> w-1 */
          *(data++) = COLOR(x);
-        
+
          NEXT(x);
      }
      *data = COLOR(x);
          NEXT(x);
      }
      *data = COLOR(x);
@@ -596,20 +748,19 @@ static void gradient_crossdiagonal(RrSurface *sf, gint w, gint h)
  
      for (x = w - 1; x > 0; --x) {  /* 0 -> w-1 */
          *(data++) = COLOR(x);
  
      for (x = w - 1; x > 0; --x) {  /* 0 -> w-1 */
          *(data++) = COLOR(x);
-        
+
          NEXT(x);
      }
      *data = COLOR(x);
  }
  
          NEXT(x);
      }
      *data = COLOR(x);
  }
  
-static void gradient_pyramid(RrSurface *sf, gint inw, gint inh)
+static void gradient_pyramid(RrSurface *sf, gint w, gint h)
  {
  {
-    gint x, y, w = (inw >> 1) + 1, h = (inh >> 1) + 1;
-    RrPixel32 *data = sf->pixel_data;
-    RrPixel32 *end = data + inw*inh - 1;
-    RrPixel32 current;
+    RrPixel32 *ldata, *rdata;
+    RrPixel32 *cp;
      RrColor left, right;
      RrColor extracorner;
      RrColor left, right;
      RrColor extracorner;
+    gint x, y, halfw, halfh, midx, midy;
  
      VARS(lefty);
      VARS(righty);
  
      VARS(lefty);
      VARS(righty);
@@ -619,54 +770,64 @@ static void gradient_pyramid(RrSurface *sf, gint inw, gint inh)
      extracorner.g = (sf->primary->g + sf->secondary->g) / 2;
      extracorner.b = (sf->primary->b + sf->secondary->b) / 2;
  
      extracorner.g = (sf->primary->g + sf->secondary->g) / 2;
      extracorner.b = (sf->primary->b + sf->secondary->b) / 2;
  
-    SETUP(lefty, (&extracorner), sf->secondary, h);
-    SETUP(righty, sf->primary, (&extracorner), h);
+    halfw = w >> 1;
+    halfh = h >> 1;
+    midx = w - halfw - halfw; /* 0 or 1, depending if w is even or odd */
+    midy = h - halfh - halfh;   /* 0 or 1, depending if h is even or odd */
+
+    SETUP(lefty, sf->primary, (&extracorner), halfh + midy);
+    SETUP(righty, (&extracorner), sf->secondary, halfh + midy);
+
+    /* draw the top half
+
+       it is faster to draw both top quarters together than to draw one and
+       then copy it over to the other side.
+    */
+
+    ldata = sf->pixel_data;
+    rdata = ldata + w - 1;
+    for (y = halfh + midy; y > 0; --y) {  /* 0 -> (h+1)/2 */
+        RrPixel32 c;
  
  
-    for (y = h - 1; y > 0; --y) {  /* 0 -> h-1 */
          COLOR_RR(lefty, (&left));
          COLOR_RR(righty, (&right));
  
          COLOR_RR(lefty, (&left));
          COLOR_RR(righty, (&right));
  
-        SETUP(x, (&left), (&right), w);
+        SETUP(x, (&left), (&right), halfw + midx);
  
  
-        for (x = w - 1; x > 0; --x) {  /* 0 -> w-1 */
-            current = COLOR(x);
-            *(data+x) = current;
-            *(data+inw-x) = current;
-            *(end-x) = current;
-            *(end-(inw-x)) = current;
+        for (x = halfw + midx - 1; x > 0; --x) {  /* 0 -> (w+1)/2 */
+            c = COLOR(x);
+            *(ldata++) = *(rdata--) = c;
  
              NEXT(x);
          }
  
              NEXT(x);
          }
-        current = COLOR(x);
-        *(data+x) = current;
-        *(data+inw-x) = current;
-        *(end-x) = current;
-        *(end-(inw-x)) = current;
-
-        data+=inw;
-        end-=inw;
+        c = COLOR(x);
+        *ldata = *rdata = c;
+        ldata += halfw + 1;
+        rdata += halfw - 1 + midx + w;
  
          NEXT(lefty);
          NEXT(righty);
      }
  
          NEXT(lefty);
          NEXT(righty);
      }
-    COLOR_RR(lefty, (&left));
-    COLOR_RR(righty, (&right));
  
  
-    SETUP(x, (&left), (&right), w);
-
-    for (x = w - 1; x > 0; --x) {  /* 0 -> w-1 */
-        current = COLOR(x);
-        *(data+x) = current;
-        *(data+inw-x) = current;
-        *(end-x) = current;
-        *(end-(inw-x)) = current;
-        
-        NEXT(x);
+    /* copy the top half into the bottom half, mirroring it, so we can only
+       copy one row at a time
+
+       it is faster to move the writing pointer forward and the reading
+       pointer backward
+
+       this is the current code, moving the write pointer forward and read
+       pointer backward
+       41.78      4.26     1.78      504     3.53     3.53  gradient_pyramid2
+       this is the opposite, moving the read pointer forward and the write
+       pointer backward
+       42.27      4.40     1.86      504     3.69     3.69  gradient_pyramid2
+       
+    */
+    ldata = sf->pixel_data + (halfh - 1) * w;
+    cp = ldata + (midy + 1) * w;
+    for (y = halfh; y > 0; --y) {
+        memcpy(cp, ldata, w * sizeof(RrPixel32));
+        ldata -= w;
+        cp += w;
      }
      }
-    current = COLOR(x);
-    *(data+x) = current;
-    *(data+inw-x) = current;
-    *(end-x) = current;
-    *(end-(inw-x)) = current;
  }
  }
-