revised palette conversion subsystem to make a little more sense

CVS patchset: 2539 CVS date: 2002/08/28 03:32:48
author: Mike Melanson <mike@multimedia.cx> 2002-08-28 03:32:48 +0000
committer: Mike Melanson <mike@multimedia.cx> 2002-08-28 03:32:48 +0000
commit: d1606decedff8ef07319d9ea4830ececf69f62d0 (patch)
tree: be6bc8b8ed1236513b6cf7fdbcaf028df4c79ef5
parent: 28280f2f9870a7854ffdd4bccd48bb62468ce6ee (diff)
download: xine-lib-d1606decedff8ef07319d9ea4830ececf69f62d0.tar.gz
xine-lib-d1606decedff8ef07319d9ea4830ececf69f62d0.tar.bz2
6 files changed, 116 insertions, 259 deletions
diff --git a/src/libxinevdec/fli.c b/src/libxinevdec/fli.c
index 9737dbc9c..3527692c0 100644
--- a/src/libxinevdec/fli.c
+++ b/src/libxinevdec/fli.c
@@ -23,7 +23,7 @@
  * avoid when implementing a FLI decoder, visit:
  *   http://www.pcisys.net/~melanson/codecs/
  * 
- * $Id: fli.c,v 1.2 2002/07/15 21:42:34 esnel Exp $
+ * $Id: fli.c,v 1.3 2002/08/28 03:37:17 tmmm Exp $
  */
 
 #include <stdio.h>
@@ -183,7 +183,7 @@ void decode_fli_frame(fli_decoder_t *this) {
         stream_ptr += 2;
         if (line_packets < 0) {
           line_packets = -line_packets;
-          y_ptr += (line_packets * this->yuv_planes.row_stride);
+          y_ptr += (line_packets * this->yuv_planes.row_width);
           ghost_y_ptr += (line_packets * this->width);
         } else {
           pixel_ptr = y_ptr;
@@ -232,18 +232,7 @@ void decode_fli_frame(fli_decoder_t *this) {
             }
           }
 
-          // take care of the extra 2 pixels on the C lines
-          this->yuv_planes.u[pixel_ptr] =
-            this->yuv_planes.u[pixel_ptr - 1];
-          this->yuv_planes.u[pixel_ptr + 1] =
-            this->yuv_planes.u[pixel_ptr - 2];
-
-          this->yuv_planes.v[pixel_ptr] =
-            this->yuv_planes.v[pixel_ptr - 1];
-          this->yuv_planes.v[pixel_ptr + 1] =
-            this->yuv_planes.v[pixel_ptr - 2];
-
-          y_ptr += this->yuv_planes.row_stride;
+          y_ptr += this->yuv_planes.row_width;
           ghost_y_ptr += this->width;
           compressed_lines--;
         }
@@ -254,7 +243,7 @@ void decode_fli_frame(fli_decoder_t *this) {
       /* line compressed */
       starting_line = LE_16(&this->buf[stream_ptr]);
       stream_ptr += 2;
-      y_ptr = starting_line * this->yuv_planes.row_stride;
+      y_ptr = starting_line * this->yuv_planes.row_width;
       ghost_y_ptr = starting_line * this->width;
 
       compressed_lines = LE_16(&this->buf[stream_ptr]);
@@ -299,18 +288,7 @@ void decode_fli_frame(fli_decoder_t *this) {
           }
         }
 
-        // take care of the extra 2 pixels on the C lines
-        this->yuv_planes.u[pixel_ptr] =
-          this->yuv_planes.u[pixel_ptr - 1];
-        this->yuv_planes.u[pixel_ptr + 1] =
-          this->yuv_planes.u[pixel_ptr - 2];
-
-        this->yuv_planes.v[pixel_ptr] =
-          this->yuv_planes.v[pixel_ptr - 1];
-        this->yuv_planes.v[pixel_ptr + 1] =
-          this->yuv_planes.v[pixel_ptr - 2];
-
-        y_ptr += this->yuv_planes.row_stride;
+        y_ptr += this->yuv_planes.row_width;
         ghost_y_ptr += this->width;
         compressed_lines--;
       }
@@ -362,18 +340,7 @@ void decode_fli_frame(fli_decoder_t *this) {
           }
         }
 
-        // take care of the extra 2 pixels on the C lines
-        this->yuv_planes.u[pixel_ptr] =
-          this->yuv_planes.u[pixel_ptr - 1];
-        this->yuv_planes.u[pixel_ptr + 1] =
-          this->yuv_planes.u[pixel_ptr - 2];
-
-        this->yuv_planes.v[pixel_ptr] =
-          this->yuv_planes.v[pixel_ptr - 1];
-        this->yuv_planes.v[pixel_ptr + 1] =
-          this->yuv_planes.v[pixel_ptr - 2];
-
-        y_ptr += this->yuv_planes.row_stride;
+        y_ptr += this->yuv_planes.row_width;
         ghost_y_ptr += this->width;
       }
       break;
@@ -419,18 +386,6 @@ void decode_fli_frame(fli_decoder_t *this) {
         pixel_ptr++;
       }
 
-      // take care of the extra 2 pixels on the C lines
-      this->yuv_planes.u[pixel_ptr] =
-        this->yuv_planes.u[pixel_ptr - 1];
-      this->yuv_planes.u[pixel_ptr + 1] =
-        this->yuv_planes.u[pixel_ptr - 2];
-
-      // take care of the extra 2 pixels on the C lines
-      this->yuv_planes.v[pixel_ptr] =
-        this->yuv_planes.v[pixel_ptr - 1];
-      this->yuv_planes.v[pixel_ptr + 1] =
-        this->yuv_planes.v[pixel_ptr - 2];
-
       pixel_ptr += 2;
     }
   }
diff --git a/src/libxinevdec/idcinvideo.c b/src/libxinevdec/idcinvideo.c
index 725eff548..dde1c8562 100644
--- a/src/libxinevdec/idcinvideo.c
+++ b/src/libxinevdec/idcinvideo.c
@@ -21,7 +21,7 @@
  * the Id CIN format, visit:
  *   http://www.csse.monash.edu.au/~timf/
  * 
- * $Id: idcinvideo.c,v 1.1 2002/08/12 00:16:54 tmmm Exp $
+ * $Id: idcinvideo.c,v 1.2 2002/08/28 03:37:17 tmmm Exp $
  */
 
 #include <stdio.h>
@@ -91,7 +91,6 @@ void huff_decode(idcinvideo_decoder_t *this) {
   int prev;
   unsigned char v = 0;
   int bit_pos, node_num, dat_pos;
-  int width_countdown = this->width;
   int plane_ptr = 0;
 
   prev = bit_pos = dat_pos = 0;
@@ -118,12 +117,6 @@ void huff_decode(idcinvideo_decoder_t *this) {
     this->yuv_planes.u[plane_ptr] = this->yuv_palette[node_num * 4 + 1];
     this->yuv_planes.v[plane_ptr] = this->yuv_palette[node_num * 4 + 2];
     plane_ptr++;
-    width_countdown--;
-    if (!width_countdown) {
-      FINISH_LINE(this->yuv_planes, plane_ptr - this->width);
-      width_countdown = this->width;
-      plane_ptr += 2;
-    }
 
     prev = node_num;
   }
diff --git a/src/libxinevdec/msrle.c b/src/libxinevdec/msrle.c
index 982d689dc..0d748c580 100644
--- a/src/libxinevdec/msrle.c
+++ b/src/libxinevdec/msrle.c
@@ -21,7 +21,7 @@
  * For more information on the MS RLE format, visit:
  *   http://www.pcisys.net/~melanson/codecs/
  * 
- * $Id: msrle.c,v 1.3 2002/07/20 04:24:59 tmmm Exp $
+ * $Id: msrle.c,v 1.4 2002/08/28 03:37:17 tmmm Exp $
  */
 
 #include <stdio.h>
@@ -78,9 +78,9 @@ void decode_msrle8(msrle_decoder_t *this) {
   unsigned char extra_byte;
   unsigned char stream_byte;
   int pixel_ptr = 0;
-  int row_dec = this->yuv_planes.row_stride;
+  int row_dec = this->yuv_planes.row_width;
   int row_ptr = (this->height - 1) * row_dec;
-  int frame_size = this->yuv_planes.row_stride * this->height;
+  int frame_size = this->yuv_planes.row_width * this->height;
   unsigned char y, u, v;
 
   while (row_ptr >= 0) {
@@ -90,22 +90,13 @@ void decode_msrle8(msrle_decoder_t *this) {
       /* fetch the next byte to see how to handle escape code */
       FETCH_NEXT_STREAM_BYTE();
       if (stream_byte == 0) {
-        /* take care of the extra 2 pixels on the C lines */
-        FINISH_LINE(this->yuv_planes, row_ptr);
-
         /* line is done, goto the next one */
         row_ptr -= row_dec;
         pixel_ptr = 0;
       } else if (stream_byte == 1) {
-        /* take care of the extra 2 pixels on the C lines */
-        FINISH_LINE(this->yuv_planes, row_ptr);
-
         /* decode is done */
         return;
       } else if (stream_byte == 2) {
-        /* take care of the extra 2 pixels on the C lines */
-        FINISH_LINE(this->yuv_planes, row_ptr);
-
         /* reposition frame decode coordinates */
         FETCH_NEXT_STREAM_BYTE();
         pixel_ptr += stream_byte;
diff --git a/src/libxinevdec/rgb.c b/src/libxinevdec/rgb.c
index 3c6368ee0..7b01fcbb7 100644
--- a/src/libxinevdec/rgb.c
+++ b/src/libxinevdec/rgb.c
@@ -21,7 +21,7 @@
  * Actually, this decoder just converts a raw RGB image to a YUY2 map
  * suitable for display under xine.
  * 
- * $Id: rgb.c,v 1.3 2002/07/20 04:24:59 tmmm Exp $
+ * $Id: rgb.c,v 1.4 2002/08/28 03:37:17 tmmm Exp $
  */
 
 #include <stdio.h>
@@ -162,9 +162,9 @@ static void rgb_decode_data (video_decoder_t *this_gen,
 
       /* iterate through each row */
       buf_ptr = 0;
-      row_ptr = this->yuv_planes.row_stride *
+      row_ptr = this->yuv_planes.row_width *
         (this->yuv_planes.row_count - 1);
-      for (; row_ptr >= 0; row_ptr -= this->yuv_planes.row_stride) {
+      for (; row_ptr >= 0; row_ptr -= this->yuv_planes.row_width) {
         for (pixel_ptr = 0; pixel_ptr < this->width; pixel_ptr++) {
 
           if (this->bytes_per_pixel == 1) {
@@ -206,9 +206,6 @@ static void rgb_decode_data (video_decoder_t *this_gen,
 
           }
         }
-
-        /* take care of the extra 2 pixels on the C lines */
-        FINISH_LINE(this->yuv_planes, row_ptr);
       }
 
       yuv444_to_yuy2(&this->yuv_planes, img->base[0], img->pitches[0]);
diff --git a/src/xine-utils/color.c b/src/xine-utils/color.c
index 8696c31dd..b99e663b1 100644
--- a/src/xine-utils/color.c
+++ b/src/xine-utils/color.c
@@ -37,25 +37,8 @@
  * COMPUTE_Y(r, g, b), COMPUTE_U(r, g, b), COMPUTE_V(r, g, b) macros found
  * in xineutils.h
  *
- * The yuv_planes_t structure has 3 other fields: row_width and row_count,
- * which are equivalent to the frame width and height, respectively, and
- * row_stride, which is 2 bytes longer than the row_width. This is because
- * each row in each plane is actually 2 bytes longer than the width. For
- * example, if the row_width is 8 then the row_stride is 10 and each
- * plane's byte map is laid out as follows:
- *
- *   byte  0: p0  p1  p2  p3  p4  p5  p6  p7  p7  p6
- *   byte 10: p8  p9 p10 p11 p12 p13 p14 p15 p15 p14 
- *   byte 20: ...
- *
- * The extra 2 samples are necessary for the final conversion. The extra
- * 2 samples are simply mirrored from the last 2 samples on the line.
- * This library provides a macro called FINISH_LINE() to mirror the last
- * 2 samples in each color plane. To use it, call the macro with the YUV
- * planes structure and the index of the first byte on the row. For
- * example, in the above example, call FINISH_LINE() with a yuv_planes
- * structure and the index 10 in order to finish (mirror the last 2 samples)
- * on the second line.
+ * The yuv_planes_t structure has 2 other fields: row_width and row_count
+ * which are equivalent to the frame width and height, respectively.
  *
  * When an image has been fully decoded into the yuv_planes_t structure,
  * call yuv444_to_yuy2() with the structure and the final (pre-allocated)
@@ -76,7 +59,7 @@
  * instructions), these macros will automatically map to those special
  * instructions.
  *
- * $Id: color.c,v 1.5 2002/07/20 04:20:56 tmmm Exp $
+ * $Id: color.c,v 1.6 2002/08/28 03:32:48 tmmm Exp $
  */
 
 #include "xine_internal.h"
@@ -152,17 +135,17 @@ void (*yuv444_to_yuy2) (yuv_planes_t *yuv_planes, unsigned char *yuy2_map, int p
  * init_yuv_planes
  *
  * This function initializes a yuv_planes_t structure based on the width
- * and height passed to it. The width must be divisible by 4 or the
- * final conversion function will not work.
+ * and height passed to it. The width must be divisible by 2.
  */
 void init_yuv_planes(yuv_planes_t *yuv_planes, int width, int height) {
 
   int plane_size;
 
   yuv_planes->row_width = width;
-  yuv_planes->row_stride = width + 2;
   yuv_planes->row_count = height;
-  plane_size = yuv_planes->row_stride * yuv_planes->row_count;
+  /* add 6 extra bytes to the plane size to account for residual filtering
+   * on the C planes */
+  plane_size = yuv_planes->row_width * yuv_planes->row_count + 6;
 
   yuv_planes->y = xine_xmalloc(plane_size);
   yuv_planes->u = xine_xmalloc(plane_size);
@@ -197,15 +180,16 @@ void free_yuv_planes(yuv_planes_t *yuv_planes) {
  *
  *   YUY2 map: Y0 U0 Y1 V1  Y2 U2 Y3 V3
  */
-void yuv444_to_yuy2_c(yuv_planes_t *yuv_planes, unsigned char *yuy2_map, int pitch) {
+void yuv444_to_yuy2_c(yuv_planes_t *yuv_planes, unsigned char *yuy2_map, 
+  int pitch) {
 
   int row_ptr, pixel_ptr;
   int yuy2_index;
 
   /* copy the Y samples */
   yuy2_index = 0;
-  for (row_ptr = 0; row_ptr < yuv_planes->row_stride * yuv_planes->row_count;
-    row_ptr += yuv_planes->row_stride) {
+  for (row_ptr = 0; row_ptr < yuv_planes->row_width * yuv_planes->row_count;
+    row_ptr += yuv_planes->row_width) {
     for (pixel_ptr = 0; pixel_ptr <  yuv_planes->row_width;
       pixel_ptr++, yuy2_index += 2)
       yuy2_map[yuy2_index] = yuv_planes->y[row_ptr + pixel_ptr];
@@ -215,8 +199,8 @@ void yuv444_to_yuy2_c(yuv_planes_t *yuv_planes, unsigned char *yuy2_map, int pit
 
   /* copy the C samples */
   yuy2_index = 1;
-  for (row_ptr = 0; row_ptr < yuv_planes->row_stride * yuv_planes->row_count;
-    row_ptr += yuv_planes->row_stride) {
+  for (row_ptr = 0; row_ptr < yuv_planes->row_width * yuv_planes->row_count;
+    row_ptr += yuv_planes->row_width) {
 
     for (pixel_ptr = 0; pixel_ptr <  yuv_planes->row_width;) {
       yuy2_map[yuy2_index] = yuv_planes->u[row_ptr + pixel_ptr];
@@ -300,15 +284,20 @@ void yuv444_to_yuy2_c(yuv_planes_t *yuv_planes, unsigned char *yuy2_map, int pit
  * [C2..C5] and once for [C4..C7]. After computing 3 filtered samples,
  * increment the plane pointer by 6 and repeat the whole process.
  *
- * There is a special case when the row width is not evenly divisible by
- * 6. In the special case, the plane pointer must be backed up by a few
- * samples so that the filter can be computed 1 or 2 more times in order to
- * pad out the line.    
+ * There is a special case when the filter hits the end of the line since
+ * it is always necessary to rely on phantom samples beyond the end of the
+ * line in order to compute the final 1-3 C samples of a line. This function
+ * uses zeros in those phantom positions in order to compute the final 
+ * samples. However, the function might read up to 6 samples from the next
+ * line which might not exist if the filter is already operating on the 
+ * last line of the plane. This is why the planes are allocated to be 6 
+ * bytes larger than width * height.
  *
  */
-void yuv444_to_yuy2_mmx(yuv_planes_t *yuv_planes, unsigned char *yuy2_map, int pitch) {
+void yuv444_to_yuy2_mmx(yuv_planes_t *yuv_planes, unsigned char *yuy2_map,
+  int pitch) {
 #ifdef ARCH_X86
-  int i, j, k;
+  int h, i, j, k;
   unsigned char *source_plane;
   unsigned char *dest_plane;
   unsigned char vector[8];
@@ -318,22 +307,37 @@ void yuv444_to_yuy2_mmx(yuv_planes_t *yuv_planes, unsigned char *yuy2_map, int p
     0x03, 0x00,
     0x01, 0x00
   };
-
-  /* special case work variables */
-  int width_mod;
-  int secondary_samples;
-  int rewind_bytes;
-  int toss_out_shift;
+  unsigned char advance2_andmask[] = {
+    0xFF, 0xFF,
+    0x00, 0x00,
+    0x00, 0x00,
+    0x00, 0x00
+  };
+  unsigned char advance4_andmask[] = {
+    0xFF, 0xFF,
+    0xFF, 0xFF,
+    0x00, 0x00,
+    0x00, 0x00
+  };
+  unsigned char advance6_andmask[] = {
+    0xFF, 0xFF,
+    0xFF, 0xFF,
+    0xFF, 0xFF,
+    0x00, 0x00
+  };
+  int block_loops = yuv_planes->row_width / 6;
+  int filter_loops;
+  int advance_count;
   int row_inc = (pitch - 2 * yuv_planes->row_width);
 
-  width_mod = yuv_planes->row_width % 6;
-  secondary_samples = width_mod / 2;
-  rewind_bytes = 6 - width_mod;
-  toss_out_shift = rewind_bytes * 8;
-
-  /* set up some MMX registers: mm0 = 0, mm7 = color filter */
+  /* set up some MMX registers: 
+   * mm0 = 0, mm7 = color filter,
+   * mm4..6 = advance 2,4,6 and masks */
   pxor_r2r(mm0, mm0);
   movq_m2r(*filter, mm7);
+  movq_m2r(*advance2_andmask, mm4);
+  movq_m2r(*advance4_andmask, mm5);
+  movq_m2r(*advance6_andmask, mm6);
 
   /* copy the Y samples */
   source_plane = yuv_planes->y;
@@ -356,141 +360,70 @@ void yuv444_to_yuy2_mmx(yuv_planes_t *yuv_planes, unsigned char *yuy2_map, int p
       dest_plane += 8;
     }
 
-    /* account for extra 2 samples */
-    source_plane += 2;
     dest_plane += row_inc;
   }
 
-  /* figure out the U samples */
-  source_plane = yuv_planes->u;
-  dest_plane = yuy2_map + 1;
-  for (i = 0; i < yuv_planes->row_count; i++) {
-
-    /* iterate through blocks of 6 samples */
-    for (j = 0; j < yuv_planes->row_width / 6; j++) {
+  /* figure out the C samples */
+  for (h = 0; h < 2; h++) {
 
-      movq_m2r(*source_plane, mm1); /* load 8 U samples */
-      source_plane += 6;
-
-      for (k = 0; k < 3; k++)
-      {
-        movq_r2r(mm1, mm2);      /* make a copy */
-
-        punpcklbw_r2r(mm0, mm2); /* interleave lower 4 samples with zeros */
-        pmaddwd_r2r(mm7, mm2);   /* apply the filter */
-        movq_r2r(mm2, mm3);      /* copy result to mm3 */
-        psrlq_i2r(32, mm3);      /* move the upper sum down */
-        paddd_r2r(mm3, mm2);     /* mm2 += mm3 */
-        psrlq_i2r(3, mm2);       /* final phase of the filter */
-
-        movq_r2m(mm2, *vector);
-        dest_plane[0] = vector[0];
-        dest_plane += 4;
-
-        psrlq_i2r(16, mm1);      /* toss out 2 U samples and loop again */
-      }
+    /* select the color plane for this iteration */
+    if (h == 0) {
+      source_plane = yuv_planes->u;
+      dest_plane = yuy2_map + 1;
+    } else {
+      source_plane = yuv_planes->v;
+      dest_plane = yuy2_map + 3;
     }
 
-    /* special case time: secondary samples */
-    if (width_mod) {
-      source_plane -= rewind_bytes;
-      movq_m2r(*source_plane, mm1); /* load 8 U samples */
-      source_plane += 8;
-
-      /* toss out 1-2 U samples before starting */
-      /* (psrlq_m2r does not work like I expect it to, so this looks weird) */
-      if (toss_out_shift == 16)
-        psrlq_i2r(16, mm1);
-      else
-        psrlq_i2r(32, mm1);
-
-      for (k = 0; k < secondary_samples; k++)
-      {
-        movq_r2r(mm1, mm2);      /* make a copy */
-
-        punpcklbw_r2r(mm0, mm2); /* interleave lower 4 samples with zeros */
-        pmaddwd_r2r(mm7, mm2);   /* apply the filter */
-        movq_r2r(mm2, mm3);      /* copy result to mm3 */
-        psrlq_i2r(32, mm3);      /* move the upper sum down */
-        paddd_r2r(mm3, mm2);     /* mm2 += mm3 */
-        psrlq_i2r(3, mm2);       /* final phase of the filter */
-
-        movq_r2m(mm2, *vector);
-        dest_plane[0] = vector[0];
-        dest_plane += 4;
-
-        psrlq_i2r(16, mm1);      /* toss out 2 U samples and loop again */
-      }
-    } else
-      source_plane += 2;
-
-    dest_plane += row_inc;
-  }
-
-  /* figure out the V samples */
-  source_plane = yuv_planes->v;
-  dest_plane = yuy2_map + 3;
-  for (i = 0; i < yuv_planes->row_count; i++) {
-
-    /* iterate through blocks of 6 samples */
-    for (j = 0; j < yuv_planes->row_width / 6; j++) {
+    for (i = 0; i < yuv_planes->row_count; i++) {
 
-      movq_m2r(*source_plane, mm1); /* load 8 V samples */
-      source_plane += 6;
+      filter_loops = 3;
 
-      for (k = 0; k < 3; k++)
-      {
-        movq_r2r(mm1, mm2);      /* make a copy */
+      /* iterate through blocks of 6 samples */
+      for (j = 0; j <= block_loops; j++) {
 
-        punpcklbw_r2r(mm0, mm2); /* interleave lower 4 samples with zeros */
-        pmaddwd_r2r(mm7, mm2);   /* apply the filter */
-        movq_r2r(mm2, mm3);      /* copy result to mm3 */
-        psrlq_i2r(32, mm3);      /* move the upper sum down */
-        paddd_r2r(mm3, mm2);     /* mm2 += mm3 */
-        psrlq_i2r(3, mm2);       /* final phase of the filter */
+        /* special case for end-of-line residual */
+        if (j != block_loops) {
+          movq_m2r(*source_plane, mm1); /* load 8 C samples */
+          source_plane += 6;
+        } else {
+          advance_count = yuv_planes->row_width % 6;
+          if (!advance_count)
+            advance_count = 6;
+          filter_loops = advance_count / 2;
 
-        movq_r2m(mm2, *vector);
-        dest_plane[0] = vector[0];
-        dest_plane += 4;
+          movq_m2r(*source_plane, mm1); /* load 8 C samples */
+          source_plane += advance_count;
 
-        psrlq_i2r(16, mm1);      /* toss out 2 V samples and loop again */
+          /* zero out the rest of the samples */
+/*
+          if (advance_count == 2)
+            pand_r2r(mm4, mm1);
+          else if (advance_count == 4)
+            pand_r2r(mm5, mm1);
+          else if (advance_count == 6)
+            pand_r2r(mm6, mm1);
+*/
+        }
+
+        for (k = 0; k < filter_loops; k++) {
+          movq_r2r(mm1, mm2);      /* make a copy */
+
+          punpcklbw_r2r(mm0, mm2); /* interleave lower 4 samples with zeros */
+          pmaddwd_r2r(mm7, mm2);   /* apply the filter */
+          movq_r2r(mm2, mm3);      /* copy result to mm3 */
+          psrlq_i2r(32, mm3);      /* move the upper sum down */
+          paddd_r2r(mm3, mm2);     /* mm2 += mm3 */
+          psrlq_i2r(3, mm2);       /* divide by 8 */
+
+          movq_r2m(mm2, *vector);
+          dest_plane[0] = vector[0];
+          dest_plane += 4;
+
+          psrlq_i2r(16, mm1);      /* toss out 2 C samples and loop again */
+        }
       }
     }
-
-    /* special case time: secondary samples */
-    if (width_mod) {
-      source_plane -= rewind_bytes;
-      movq_m2r(*source_plane, mm1); /* load 8 V samples */
-      source_plane += 8;
-
-      /* toss out 1-2 V samples before starting */
-      /* (psrlq_m2r does not work like I expect it to, so this looks weird) */
-      if (toss_out_shift == 16)
-        psrlq_i2r(16, mm1);
-      else
-        psrlq_i2r(32, mm1);
-
-      for (k = 0; k < secondary_samples; k++)
-      {
-        movq_r2r(mm1, mm2);      /* make a copy */
-
-        punpcklbw_r2r(mm0, mm2); /* interleave lower 4 samples with zeros */
-        pmaddwd_r2r(mm7, mm2);   /* apply the filter */
-        movq_r2r(mm2, mm3);      /* copy result to mm3 */
-        psrlq_i2r(32, mm3);      /* move the upper sum down */
-        paddd_r2r(mm3, mm2);     /* mm2 += mm3 */
-        psrlq_i2r(3, mm2);       /* final phase of the filter */
-
-        movq_r2m(mm2, *vector);
-        dest_plane[0] = vector[0];
-        dest_plane += 4;
-
-        psrlq_i2r(16, mm1);      /* toss out 2 V samples and loop again */
-      }
-    } else
-      source_plane += 2;
-
-    dest_plane += row_inc;
   }
 
   /* be a good MMX citizen and empty MMX state */
diff --git a/src/xine-utils/xineutils.h b/src/xine-utils/xineutils.h
index 66f704861..cd44dca80 100644
--- a/src/xine-utils/xineutils.h
+++ b/src/xine-utils/xineutils.h
@@ -17,7 +17,7 @@
  * along with this program; if not, write to the Free Software
  * Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA  02111-1307, USA
  *
- * $Id: xineutils.h,v 1.20 2002/07/24 08:00:13 f1rmb Exp $
+ * $Id: xineutils.h,v 1.21 2002/08/28 03:32:48 tmmm Exp $
  *
  */
 #ifndef XINEUTILS_H
@@ -728,7 +728,6 @@ typedef struct yuv_planes_s {
   unsigned char *u;
   unsigned char *v;
   unsigned int row_width;    /* frame width */
-  unsigned int row_stride;   /* frame width + 2 */
   unsigned int row_count;    /* frame height */
 
 } yuv_planes_t;
@@ -753,17 +752,6 @@ extern void (*yuv444_to_yuy2)
   (unsigned char) \
   ((v_r_table[r] + v_g_table[g] + v_b_table[b]) / SCALEFACTOR + CENTERSAMPLE)
 
-#define FINISH_LINE(yuv_planes, row_ptr) \
-  yuv_planes.u[row_ptr + yuv_planes.row_width] = \
-    yuv_planes.u[row_ptr + yuv_planes.row_width - 1]; \
-  yuv_planes.u[row_ptr + yuv_planes.row_width + 1] = \
-    yuv_planes.u[row_ptr + yuv_planes.row_width - 2]; \
- \
-  yuv_planes.v[row_ptr + yuv_planes.row_width] = \
-    yuv_planes.v[row_ptr + yuv_planes.row_width - 1]; \
-  yuv_planes.v[row_ptr + yuv_planes.row_width + 1] = \
-    yuv_planes.v[row_ptr + yuv_planes.row_width - 2];
-
 #define UNPACK_BGR15(packed_pixel, r, g, b) \
   b = (packed_pixel & 0x7C00) >> 7; \
   g = (packed_pixel & 0x03E0) >> 2; \
author	Mike Melanson <mike@multimedia.cx>	2002-08-28 03:32:48 +0000
committer	Mike Melanson <mike@multimedia.cx>	2002-08-28 03:32:48 +0000
commit	d1606decedff8ef07319d9ea4830ececf69f62d0 (patch)
tree	be6bc8b8ed1236513b6cf7fdbcaf028df4c79ef5
parent	28280f2f9870a7854ffdd4bccd48bb62468ce6ee (diff)
download	xine-lib-d1606decedff8ef07319d9ea4830ececf69f62d0.tar.gz xine-lib-d1606decedff8ef07319d9ea4830ececf69f62d0.tar.bz2