third_party/libyuv/source/convert.cc - vendor/opensource/webrtc - Git at Google

 /*
  *  Copyright (c) 2011 The LibYuv project authors. All Rights Reserved.
  *
  *  Use of this source code is governed by a BSD-style license
  *  that can be found in the LICENSE file in the root of the source
  *  tree. An additional intellectual property rights grant can be found
  *  in the file PATENTS.  All contributing project authors may
  *  be found in the AUTHORS file in the root of the source tree.
  */

 #include "libyuv/convert.h"

 //#define SCALEOPT //Currently for windows only. June 2010

 #ifdef SCALEOPT
 #include <emmintrin.h>
 #endif

 #include "conversion_tables.h"
 #include "libyuv/basic_types.h"
 #include "libyuv/cpu_id.h"
 #include "libyuv/format_conversion.h"
 #include "libyuv/planar_functions.h"
 #include "libyuv/rotate.h"
 #include "row.h"
 #include "libyuv/video_common.h"

 #ifdef __cplusplus
 namespace libyuv {
 extern "C" {
 #endif

 static __inline uint8 Clip(int32 val) {
   if (val < 0) {
     return (uint8) 0;
   } else if (val > 255){
     return (uint8) 255;
   }
   return (uint8) val;
 }

 // TODO(fbarchard): rewrite with row functions
 int I420ToRGB24(const uint8* src_y, int src_stride_y,
                 const uint8* src_u, int src_stride_u,
                 const uint8* src_v, int src_stride_v,
                 uint8* dst_frame, int dst_stride_frame,
                 int width, int height) {
   if (src_y == NULL || src_u == NULL || src_v == NULL || dst_frame == NULL) {
     return -1;
   }
   // TODO(fbarchard): support inversion
   uint8* out = dst_frame;
   uint8* out2 = out + dst_stride_frame;
   int h, w;
   int tmp_r, tmp_g, tmp_b;
   const uint8 *y1, *y2 ,*u, *v;
   y1 = src_y;
   y2 = y1 + src_stride_y;
   u = src_u;
   v = src_v;
   for (h = ((height + 1) >> 1); h > 0; h--){
     // 2 rows at a time, 2 y's at a time
     for (w = 0; w < ((width + 1) >> 1); w++){
       // Vertical and horizontal sub-sampling
       tmp_r = (int32)((mapYc[y1[0]] + mapVcr[v[0]] + 128) >> 8);
       tmp_g = (int32)((mapYc[y1[0]] + mapUcg[u[0]] + mapVcg[v[0]] + 128) >> 8);
       tmp_b = (int32)((mapYc[y1[0]] + mapUcb[u[0]] + 128) >> 8);
       out[0] = Clip(tmp_b);
       out[1] = Clip(tmp_g);
       out[2] = Clip(tmp_r);

       tmp_r = (int32)((mapYc[y1[1]] + mapVcr[v[0]] + 128) >> 8);
       tmp_g = (int32)((mapYc[y1[1]] + mapUcg[u[0]] + mapVcg[v[0]] + 128) >> 8);
       tmp_b = (int32)((mapYc[y1[1]] + mapUcb[u[0]] + 128) >> 8);
       out[3] = Clip(tmp_b);
       out[4] = Clip(tmp_g);
       out[5] = Clip(tmp_r);

       tmp_r = (int32)((mapYc[y2[0]] + mapVcr[v[0]] + 128) >> 8);
       tmp_g = (int32)((mapYc[y2[0]] + mapUcg[u[0]] + mapVcg[v[0]] + 128) >> 8);
       tmp_b = (int32)((mapYc[y2[0]] + mapUcb[u[0]] + 128) >> 8);
       out2[0] = Clip(tmp_b);
       out2[1] = Clip(tmp_g);
       out2[2] = Clip(tmp_r);

       tmp_r = (int32)((mapYc[y2[1]] + mapVcr[v[0]] + 128) >> 8);
       tmp_g = (int32)((mapYc[y2[1]] + mapUcg[u[0]] + mapVcg[v[0]] + 128) >> 8);
       tmp_b = (int32)((mapYc[y2[1]] + mapUcb[u[0]] + 128) >> 8);
       out2[3] = Clip(tmp_b);
       out2[4] = Clip(tmp_g);
       out2[5] = Clip(tmp_r);

       out += 6;
       out2 += 6;
       y1 += 2;
       y2 += 2;
       u++;
       v++;
     }
     y1 += 2 * src_stride_y - width;
     y2 += 2 * src_stride_y - width;
     u += src_stride_u - ((width + 1) >> 1);
     v += src_stride_v - ((width + 1) >> 1);
     out += dst_stride_frame;
     out2 += dst_stride_frame;
   }
   return 0;
 }

 // same as RGB24 but r,g,b instead of b,g,r
 // TODO(fbarchard): rewrite with row functions
 int I420ToRAW(const uint8* src_y, int src_stride_y,
               const uint8* src_u, int src_stride_u,
               const uint8* src_v, int src_stride_v,
               uint8* dst_frame, int dst_stride_frame,
               int width, int height) {
   if (src_y == NULL || src_u == NULL || src_v == NULL || dst_frame == NULL) {
     return -1;
   }

   // RGB orientation - bottom up
   // TODO(fbarchard): support inversion
   uint8* out = dst_frame + dst_stride_frame * height - dst_stride_frame;
   uint8* out2 = out - dst_stride_frame;
   int h, w;
   int tmp_r, tmp_g, tmp_b;
   const uint8 *y1, *y2 ,*u, *v;
   y1 = src_y;
   y2 = y1 + src_stride_y;
   u = src_u;
   v = src_v;
   for (h = ((height + 1) >> 1); h > 0; h--){
     // 2 rows at a time, 2 y's at a time
     for (w = 0; w < ((width + 1) >> 1); w++){
       // Vertical and horizontal sub-sampling
       tmp_r = (int32)((mapYc[y1[0]] + mapVcr[v[0]] + 128) >> 8);
       tmp_g = (int32)((mapYc[y1[0]] + mapUcg[u[0]] + mapVcg[v[0]] + 128) >> 8);
       tmp_b = (int32)((mapYc[y1[0]] + mapUcb[u[0]] + 128) >> 8);
       out[0] = Clip(tmp_r);
       out[1] = Clip(tmp_g);
       out[2] = Clip(tmp_b);

       tmp_r = (int32)((mapYc[y1[1]] + mapVcr[v[0]] + 128) >> 8);
       tmp_g = (int32)((mapYc[y1[1]] + mapUcg[u[0]] + mapVcg[v[0]] + 128) >> 8);
       tmp_b = (int32)((mapYc[y1[1]] + mapUcb[u[0]] + 128) >> 8);
       out[3] = Clip(tmp_r);
       out[4] = Clip(tmp_g);
       out[5] = Clip(tmp_b);

       tmp_r = (int32)((mapYc[y2[0]] + mapVcr[v[0]] + 128) >> 8);
       tmp_g = (int32)((mapYc[y2[0]] + mapUcg[u[0]] + mapVcg[v[0]] + 128) >> 8);
       tmp_b = (int32)((mapYc[y2[0]] + mapUcb[u[0]] + 128) >> 8);
       out2[0] = Clip(tmp_r);
       out2[1] = Clip(tmp_g);
       out2[2] = Clip(tmp_b);

       tmp_r = (int32)((mapYc[y2[1]] + mapVcr[v[0]] + 128) >> 8);
       tmp_g = (int32)((mapYc[y2[1]] + mapUcg[u[0]] + mapVcg[v[0]] + 128) >> 8);
       tmp_b = (int32)((mapYc[y2[1]] + mapUcb[u[0]] + 128) >> 8);
       out2[3] = Clip(tmp_r);
       out2[4] = Clip(tmp_g);
       out2[5] = Clip(tmp_b);

       out += 6;
       out2 += 6;
       y1 += 2;
       y2 += 2;
       u++;
       v++;
     }
     y1 += src_stride_y + src_stride_y - width;
     y2 += src_stride_y + src_stride_y - width;
     u += src_stride_u - ((width + 1) >> 1);
     v += src_stride_v - ((width + 1) >> 1);
     out -= dst_stride_frame * 3;
     out2 -= dst_stride_frame * 3;
   } // end height for
   return 0;
 }

 // Little Endian...
 // TODO(fbarchard): rewrite with row functions
 int I420ToARGB4444(const uint8* src_y, int src_stride_y,
                    const uint8* src_u, int src_stride_u,
                    const uint8* src_v, int src_stride_v,
                    uint8* dst_frame, int dst_stride_frame,
                    int width, int height) {
   if (src_y == NULL || src_u == NULL || src_v == NULL || dst_frame == NULL) {
     return -1;
   }

   // RGB orientation - bottom up
   uint8* out = dst_frame + dst_stride_frame * (height - 1);
   uint8* out2 = out - dst_stride_frame;
   int tmp_r, tmp_g, tmp_b;
   const uint8 *y1,*y2, *u, *v;
   y1 = src_y;
   y2 = y1 + src_stride_y;
   u = src_u;
   v = src_v;
   int h, w;

   for (h = ((height + 1) >> 1); h > 0; h--) {
     // 2 rows at a time, 2 y's at a time
     for (w = 0; w < ((width + 1) >> 1); w++) {
         // Vertical and horizontal sub-sampling
         // Convert to RGB888 and re-scale to 4 bits
         tmp_r = (int32)((mapYc[y1[0]] + mapVcr[v[0]] + 128) >> 8);
         tmp_g = (int32)((mapYc[y1[0]] + mapUcg[u[0]] + mapVcg[v[0]] + 128) >> 8);
         tmp_b = (int32)((mapYc[y1[0]] + mapUcb[u[0]] + 128) >> 8);
         out[0] =(uint8)((Clip(tmp_g) & 0xf0) + (Clip(tmp_b) >> 4));
         out[1] = (uint8)(0xf0 + (Clip(tmp_r) >> 4));

         tmp_r = (int32)((mapYc[y1[1]] + mapVcr[v[0]] + 128) >> 8);
         tmp_g = (int32)((mapYc[y1[1]] + mapUcg[u[0]] + mapVcg[v[0]] + 128) >> 8);
         tmp_b = (int32)((mapYc[y1[1]] + mapUcb[u[0]] + 128) >> 8);
         out[2] = (uint8)((Clip(tmp_g) & 0xf0 ) + (Clip(tmp_b) >> 4));
         out[3] = (uint8)(0xf0 + (Clip(tmp_r) >> 4));

         tmp_r = (int32)((mapYc[y2[0]] + mapVcr[v[0]] + 128) >> 8);
         tmp_g = (int32)((mapYc[y2[0]] + mapUcg[u[0]] + mapVcg[v[0]] + 128) >> 8);
         tmp_b = (int32)((mapYc[y2[0]] + mapUcb[u[0]] + 128) >> 8);
         out2[0] = (uint8)((Clip(tmp_g) & 0xf0 ) + (Clip(tmp_b) >> 4));
         out2[1] = (uint8) (0xf0 + (Clip(tmp_r) >> 4));

         tmp_r = (int32)((mapYc[y2[1]] + mapVcr[v[0]] + 128) >> 8);
         tmp_g = (int32)((mapYc[y2[1]] + mapUcg[u[0]] + mapVcg[v[0]] + 128) >> 8);
         tmp_b = (int32)((mapYc[y2[1]] + mapUcb[u[0]] + 128) >> 8);
         out2[2] = (uint8)((Clip(tmp_g) & 0xf0 ) + (Clip(tmp_b) >> 4));
         out2[3] = (uint8)(0xf0 + (Clip(tmp_r) >> 4));

         out += 4;
         out2 += 4;
         y1 += 2;
         y2 += 2;
         u++;
         v++;
     }
     y1 += 2 * src_stride_y - width;
     y2 += 2 * src_stride_y - width;
     u += src_stride_u - ((width + 1) >> 1);
     v += src_stride_v - ((width + 1) >> 1);
     out -= (dst_stride_frame + width) * 2;
     out2 -= (dst_stride_frame + width) * 2;
   } // end height for
   return 0;
 }

 // TODO(fbarchard): rewrite with row functions
 int I420ToRGB565(const uint8* src_y, int src_stride_y,
                  const uint8* src_u, int src_stride_u,
                  const uint8* src_v, int src_stride_v,
                  uint8* dst_frame, int dst_stride_frame,
                  int width, int height) {
   if (src_y == NULL || src_u == NULL || src_v == NULL || dst_frame == NULL) {
     return -1;
   }

   // Negative height means invert the image.
   if (height < 0) {
     height = -height;
     src_y = src_y + (height - 1) * src_stride_y;
     src_u = src_u + (height - 1) * src_stride_u;
     src_v = src_v + (height - 1) * src_stride_v;
     src_stride_y = -src_stride_y;
     src_stride_u = -src_stride_u;
     src_stride_v = -src_stride_v;
   }
   uint16* out = (uint16*)(dst_frame) + dst_stride_frame * (height - 1);
   uint16* out2 = out - dst_stride_frame;

   int tmp_r, tmp_g, tmp_b;
   const uint8* y1,* y2, * u, * v;
   y1 = src_y;
   y2 = y1 + src_stride_y;
   u = src_u;
   v = src_v;
   int h, w;

   for (h = ((height + 1) >> 1); h > 0; h--){
     // 2 rows at a time, 2 y's at a time
     for (w = 0; w < ((width + 1) >> 1); w++){
       // Vertical and horizontal sub-sampling
       // 1. Convert to RGB888
       // 2. Shift to adequate location (in the 16 bit word) - RGB 565

       tmp_r = (int32)((mapYc[y1[0]] + mapVcr[v[0]] + 128) >> 8);
       tmp_g = (int32)((mapYc[y1[0]] + mapUcg[u[0]] + mapVcg[v[0]] + 128) >> 8);
       tmp_b = (int32)((mapYc[y1[0]] + mapUcb[u[0]] + 128) >> 8);
       out[0]  = (uint16)((Clip(tmp_r) & 0xf8) << 8) + ((Clip(tmp_g)
                           & 0xfc) << 3) + (Clip(tmp_b) >> 3);

       tmp_r = (int32)((mapYc[y1[1]] + mapVcr[v[0]] + 128) >> 8);
       tmp_g = (int32)((mapYc[y1[1]] + mapUcg[u[0]] + mapVcg[v[0]] + 128) >> 8);
       tmp_b = (int32)((mapYc[y1[1]] + mapUcb[u[0]] + 128) >> 8);
       out[1] = (uint16)((Clip(tmp_r) & 0xf8) << 8) + ((Clip(tmp_g)
                          & 0xfc) << 3) + (Clip(tmp_b ) >> 3);

       tmp_r = (int32)((mapYc[y2[0]] + mapVcr[v[0]] + 128) >> 8);
       tmp_g = (int32)((mapYc[y2[0]] + mapUcg[u[0]] + mapVcg[v[0]] + 128) >> 8);
       tmp_b = (int32)((mapYc[y2[0]] + mapUcb[u[0]] + 128) >> 8);
       out2[0] = (uint16)((Clip(tmp_r) & 0xf8) << 8) + ((Clip(tmp_g)
                           & 0xfc) << 3) + (Clip(tmp_b) >> 3);

       tmp_r = (int32)((mapYc[y2[1]] + mapVcr[v[0]] + 128) >> 8);
       tmp_g = (int32)((mapYc[y2[1]] + mapUcg[u[0]] + mapVcg[v[0]] + 128) >> 8);
       tmp_b = (int32)((mapYc[y2[1]] + mapUcb[u[0]] + 128) >> 8);
       out2[1] = (uint16)((Clip(tmp_r) & 0xf8) << 8) + ((Clip(tmp_g)
                           & 0xfc) << 3) + (Clip(tmp_b) >> 3);

       y1 += 2;
       y2 += 2;
       out += 2;
       out2 += 2;
       u++;
       v++;
     }
     y1 += 2 * src_stride_y - width;
     y2 += 2 * src_stride_y - width;
     u += src_stride_u - ((width + 1) >> 1);
     v += src_stride_v - ((width + 1) >> 1);
     out -= 2 * dst_stride_frame + width;
     out2 -=  2 * dst_stride_frame + width;
   }
   return 0;
 }

 // TODO(fbarchard): rewrite with row functions
 int I420ToARGB1555(const uint8* src_y, int src_stride_y,
                    const uint8* src_u, int src_stride_u,
                    const uint8* src_v, int src_stride_v,
                    uint8* dst_frame, int dst_stride_frame,
                    int width, int height) {
   if (src_y == NULL || src_u == NULL || src_v == NULL || dst_frame == NULL) {
     return -1;
   }
   uint16* out = (uint16*)(dst_frame) + dst_stride_frame * (height - 1);
   uint16* out2 = out - dst_stride_frame ;
   int32 tmp_r, tmp_g, tmp_b;
   const uint8 *y1,*y2, *u, *v;
   int h, w;

   y1 = src_y;
   y2 = y1 + src_stride_y;
   u = src_u;
   v = src_v;

   for (h = ((height + 1) >> 1); h > 0; h--){
     // 2 rows at a time, 2 y's at a time
     for (w = 0; w < ((width + 1) >> 1); w++){
       // Vertical and horizontal sub-sampling
       // 1. Convert to RGB888
       // 2. Shift to adequate location (in the 16 bit word) - RGB 555
       // 3. Add 1 for alpha value
       tmp_r = (int32)((mapYc[y1[0]] + mapVcr[v[0]] + 128) >> 8);
       tmp_g = (int32)((mapYc[y1[0]] + mapUcg[u[0]] + mapVcg[v[0]] + 128) >> 8);
       tmp_b = (int32)((mapYc[y1[0]] + mapUcb[u[0]] + 128) >> 8);
       out[0]  = (uint16)(0x8000 + ((Clip(tmp_r) & 0xf8) << 10) +
                 ((Clip(tmp_g) & 0xf8) << 3) + (Clip(tmp_b) >> 3));

       tmp_r = (int32)((mapYc[y1[1]] + mapVcr[v[0]] + 128) >> 8);
       tmp_g = (int32)((mapYc[y1[1]] + mapUcg[u[0]] + mapVcg[v[0]]  + 128) >> 8);
       tmp_b = (int32)((mapYc[y1[1]] + mapUcb[u[0]] + 128) >> 8);
       out[1]  = (uint16)(0x8000 + ((Clip(tmp_r) & 0xf8) << 10) +
                 ((Clip(tmp_g) & 0xf8) << 3)  + (Clip(tmp_b) >> 3));

       tmp_r = (int32)((mapYc[y2[0]] + mapVcr[v[0]] + 128) >> 8);
       tmp_g = (int32)((mapYc[y2[0]] + mapUcg[u[0]] + mapVcg[v[0]] + 128) >> 8);
       tmp_b = (int32)((mapYc[y2[0]] + mapUcb[u[0]] + 128) >> 8);
       out2[0]  = (uint16)(0x8000 + ((Clip(tmp_r) & 0xf8) << 10) +
                  ((Clip(tmp_g) & 0xf8) << 3) + (Clip(tmp_b) >> 3));

       tmp_r = (int32)((mapYc[y2[1]] + mapVcr[v[0]] + 128) >> 8);
       tmp_g = (int32)((mapYc[y2[1]] + mapUcg[u[0]] + mapVcg[v[0]] + 128) >> 8);
       tmp_b = (int32)((mapYc[y2[1]] + mapUcb[u[0]] + 128) >> 8);
       out2[1]  = (uint16)(0x8000 + ((Clip(tmp_r) & 0xf8) << 10) +
                  ((Clip(tmp_g) & 0xf8) << 3)  + (Clip(tmp_b) >> 3));

       y1 += 2;
       y2 += 2;
       out += 2;
       out2 += 2;
       u++;
       v++;
     }
     y1 += 2 * src_stride_y - width;
     y2 += 2 * src_stride_y - width;
     u += src_stride_u - ((width + 1) >> 1);
     v += src_stride_v - ((width + 1) >> 1);
     out -= 2 * dst_stride_frame + width;
     out2 -=  2 * dst_stride_frame + width;
   }
   return 0;
 }

 // YUY2 - Macro-pixel = 2 image pixels
 // Y0U0Y1V0....Y2U2Y3V2...Y4U4Y5V4....

 #if defined(_M_IX86) && !defined(YUV_DISABLE_ASM)
 #define HAS_I42XTOYUY2ROW_SSE2
 __declspec(naked)
 static void I42xToYUY2Row_SSE2(const uint8* src_y,
                                const uint8* src_u,
                                const uint8* src_v,
                                uint8* dst_frame, int width) {
   __asm {
     push       esi
     push       edi
     mov        eax, [esp + 8 + 4]    // src_y
     mov        esi, [esp + 8 + 8]    // src_u
     mov        edx, [esp + 8 + 12]   // src_v
     mov        edi, [esp + 8 + 16]   // dst_frame
     mov        ecx, [esp + 8 + 20]   // width
     sub        edx, esi

   convertloop:
     movdqa     xmm0, [eax] // Y
     lea        eax, [eax + 16]
     movq       xmm2, qword ptr [esi] // U
     movq       xmm3, qword ptr [esi + edx] // V
     lea        esi, [esi + 8]
     punpcklbw  xmm2, xmm3 // UV
     movdqa     xmm1, xmm0
     punpcklbw  xmm0, xmm2 // YUYV
     punpckhbw  xmm1, xmm2
     movdqa     [edi], xmm0
     movdqa     [edi + 16], xmm1
     lea        edi, [edi + 32]
     sub        ecx, 16
     ja         convertloop

     pop        edi
     pop        esi
     ret
   }
 }
 #elif (defined(__x86_64__) || defined(__i386__)) && !defined(YUV_DISABLE_ASM)
 #define HAS_I42XTOYUY2ROW_SSE2
 static void I42xToYUY2Row_SSE2(const uint8* src_y,
                                const uint8* src_u,
                                const uint8* src_v,
                                uint8* dst_frame, int width) {
  asm volatile (
   "sub        %1,%2                            \n"
 "1:                                            \n"
   "movdqa    (%0),%%xmm0                       \n"
   "lea       0x10(%0),%0                       \n"
   "movq      (%1),%%xmm2                       \n"
   "movq      (%1,%2,1),%%xmm3                  \n"
   "lea       0x8(%1),%1                        \n"
   "punpcklbw %%xmm3,%%xmm2                     \n"
   "movdqa    %%xmm0,%%xmm1                     \n"
   "punpcklbw %%xmm2,%%xmm0                     \n"
   "punpckhbw %%xmm2,%%xmm1                     \n"
   "movdqa    %%xmm0,(%3)                       \n"
   "movdqa    %%xmm1,0x10(%3)                   \n"
   "lea       0x20(%3),%3                       \n"
   "sub       $0x10,%4                          \n"
   "ja         1b                               \n"
   : "+r"(src_y),  // %0
     "+r"(src_u),  // %1
     "+r"(src_v),  // %2
     "+r"(dst_frame),  // %3
     "+rm"(width)  // %4
   :
   : "memory", "cc"
 #if defined(__SSE2__)
     , "xmm0", "xmm1", "xmm2", "xmm3"
 #endif
 );
 }
 #endif

 void I42xToYUY2Row_C(const uint8* src_y, const uint8* src_u, const uint8* src_v,
                      uint8* dst_frame, int width) {
     for (int x = 0; x < width - 1; x += 2) {
       dst_frame[0] = src_y[0];
       dst_frame[1] = src_u[0];
       dst_frame[2] = src_y[1];
       dst_frame[3] = src_v[0];
       dst_frame += 4;
       src_y += 2;
       src_u += 1;
       src_v += 1;
     }
     if (width & 1) {
       dst_frame[0] = src_y[0];
       dst_frame[1] = src_u[0];
       dst_frame[2] = src_y[0];  // duplicate last y
       dst_frame[3] = src_v[0];
     }
 }

 int I422ToYUY2(const uint8* src_y, int src_stride_y,
                const uint8* src_u, int src_stride_u,
                const uint8* src_v, int src_stride_v,
                uint8* dst_frame, int dst_stride_frame,
                int width, int height) {
   if (src_y == NULL || src_u == NULL || src_v == NULL || dst_frame == NULL) {
     return -1;
   }
   // Negative height means invert the image.
   if (height < 0) {
     height = -height;
     dst_frame = dst_frame + (height - 1) * dst_stride_frame;
     dst_stride_frame = -dst_stride_frame;
   }
   void (*I42xToYUY2Row)(const uint8* src_y, const uint8* src_u,
                         const uint8* src_v, uint8* dst_frame, int width);
 #if defined(HAS_I42XTOYUY2ROW_SSE2)
   if (TestCpuFlag(kCpuHasSSE2) &&
       IS_ALIGNED(width, 16) &&
       IS_ALIGNED(src_y, 16) && IS_ALIGNED(src_stride_y, 16) &&
       IS_ALIGNED(dst_frame, 16) && IS_ALIGNED(dst_stride_frame, 16)) {
     I42xToYUY2Row = I42xToYUY2Row_SSE2;
   } else
 #endif
   {
     I42xToYUY2Row = I42xToYUY2Row_C;
   }
   for (int y = 0; y < height; ++y) {
     I42xToYUY2Row(src_y, src_u, src_y, dst_frame, width);
     src_y += src_stride_y;
     src_u += src_stride_u;
     src_v += src_stride_v;
     dst_frame += dst_stride_frame;
   }
   return 0;
 }

 int I420ToYUY2(const uint8* src_y, int src_stride_y,
                const uint8* src_u, int src_stride_u,
                const uint8* src_v, int src_stride_v,
                uint8* dst_frame, int dst_stride_frame,
                int width, int height) {
   if (src_y == NULL || src_u == NULL || src_v == NULL || dst_frame == NULL) {
     return -1;
   }
   // Negative height means invert the image.
   if (height < 0) {
     height = -height;
     dst_frame = dst_frame + (height - 1) * dst_stride_frame;
     dst_stride_frame = -dst_stride_frame;
   }
   void (*I42xToYUY2Row)(const uint8* src_y, const uint8* src_u,
                         const uint8* src_v, uint8* dst_frame, int width);
 #if defined(HAS_I42XTOYUY2ROW_SSE2)
   if (TestCpuFlag(kCpuHasSSE2) &&
       IS_ALIGNED(width, 16) &&
       IS_ALIGNED(src_y, 16) && IS_ALIGNED(src_stride_y, 16) &&
       IS_ALIGNED(dst_frame, 16) && IS_ALIGNED(dst_stride_frame, 16)) {
     I42xToYUY2Row = I42xToYUY2Row_SSE2;
   } else
 #endif
   {
     I42xToYUY2Row = I42xToYUY2Row_C;
   }
   for (int y = 0; y < height - 1; y += 2) {
     I42xToYUY2Row(src_y, src_u, src_v, dst_frame, width);
     I42xToYUY2Row(src_y + src_stride_y, src_u, src_v,
                   dst_frame + dst_stride_frame, width);
     src_y += src_stride_y * 2;
     src_u += src_stride_u;
     src_v += src_stride_v;
     dst_frame += dst_stride_frame * 2;
   }
   if (height & 1) {
     I42xToYUY2Row(src_y, src_u, src_v, dst_frame, width);
   }
   return 0;
 }

 int I420ToUYVY(const uint8* src_y, int src_stride_y,
                const uint8* src_u, int src_stride_u,
                const uint8* src_v, int src_stride_v,
                uint8* dst_frame, int dst_stride_frame,
                int width, int height) {
   if (src_y == NULL || src_u == NULL || src_v == NULL || dst_frame == NULL) {
     return -1;
   }

   int i = 0;
   const uint8* y1 = src_y;
   const uint8* y2 = y1 + src_stride_y;
   const uint8* u = src_u;
   const uint8* v = src_v;

   uint8* out1 = dst_frame;
   uint8* out2 = dst_frame + dst_stride_frame;

   // Macro-pixel = 2 image pixels
   // U0Y0V0Y1....U2Y2V2Y3...U4Y4V4Y5.....

 #ifndef SCALEOPT
   for (; i < ((height + 1) >> 1); i++) {
     for (int j = 0; j < ((width + 1) >> 1); j++) {
       out1[0] = *u;
       out1[1] = y1[0];
       out1[2] = *v;
       out1[3] = y1[1];

       out2[0] = *u;
       out2[1] = y2[0];
       out2[2] = *v;
       out2[3] = y2[1];
       out1 += 4;
       out2 += 4;
       u++;
       v++;
       y1 += 2;
       y2 += 2;
     }
     y1 += 2 * src_stride_y - width;
     y2 += 2 * src_stride_y - width;
     u += src_stride_u - ((width + 1) >> 1);
     v += src_stride_v - ((width + 1) >> 1);
     out1 += 2 * (dst_stride_frame - width);
     out2 += 2 * (dst_stride_frame - width);
   }
 #else
   for (; i < (height >> 1);i++) {
     int32 width__ = (width >> 4);
     _asm
     {
       ;pusha
       mov       eax, DWORD PTR [in1]                       ;1939.33
       mov       ecx, DWORD PTR [in2]                       ;1939.33
       mov       ebx, DWORD PTR [src_u]                       ;1939.33
       mov       edx, DWORD PTR [src_v]                       ;1939.33
 loop0:
       movq      xmm6, QWORD PTR [ebx]          ;src_u
       movq      xmm0, QWORD PTR [edx]          ;src_v
       punpcklbw xmm6, xmm0                     ;src_u, src_v mix
       movdqa    xmm1, xmm6
       movdqa    xmm2, xmm6
       movdqa    xmm4, xmm6

       movdqu    xmm3, XMMWORD PTR [eax]        ;in1
       punpcklbw xmm1, xmm3                     ;src_u, in1, src_v
       mov       esi, DWORD PTR [out1]
       movdqu    XMMWORD PTR [esi], xmm1        ;write to out1

       movdqu    xmm5, XMMWORD PTR [ecx]        ;in2
       punpcklbw xmm2, xmm5                     ;src_u, in2, src_v
       mov       edi, DWORD PTR [out2]
       movdqu    XMMWORD PTR [edi], xmm2        ;write to out2

       punpckhbw xmm4, xmm3                     ;src_u, in1, src_v again
       movdqu    XMMWORD PTR [esi+16], xmm4     ;write to out1 again
       add       esi, 32
       mov       DWORD PTR [out1], esi

       punpckhbw xmm6, xmm5                     ;src_u, in2, src_v again
       movdqu    XMMWORD PTR [edi+16], xmm6     ;write to out2 again
       add       edi, 32
       mov       DWORD PTR [out2], edi

       add       ebx, 8
       add       edx, 8
       add       eax, 16
       add       ecx, 16

       mov       esi, DWORD PTR [width__]
       sub       esi, 1
       mov       DWORD PTR [width__], esi
       jg        loop0

       mov       DWORD PTR [in1], eax                       ;1939.33
       mov       DWORD PTR [in2], ecx                       ;1939.33
       mov       DWORD PTR [src_u], ebx                       ;1939.33
       mov       DWORD PTR [src_v], edx                       ;1939.33

       ;popa
       emms
     }
     in1 += width;
     in2 += width;
     out1 += 2 * (dst_stride_frame - width);
     out2 += 2 * (dst_stride_frame - width);
   }
 #endif
   return 0;
 }


 int NV12ToRGB565(const uint8* src_y, int src_stride_y,
                  const uint8* src_uv, int src_stride_uv,
                  uint8* dst_frame, int dst_stride_frame,
                  int width, int height) {
   if (src_y == NULL || src_uv == NULL || dst_frame == NULL) {
     return -1;
   }

   // Bi-Planar: Y plane followed by an interlaced U and V plane
   const uint8* interlacedSrc = src_uv;
   uint16* out = (uint16*)(src_y) + dst_stride_frame * (height - 1);
   uint16* out2 = out - dst_stride_frame;
   int32 tmp_r, tmp_g, tmp_b;
   const uint8 *y1,*y2;
   y1 = src_y;
   y2 = y1 + src_stride_y;
   int h, w;

   for (h = ((height + 1) >> 1); h > 0; h--) {
     // 2 rows at a time, 2 y's at a time
     for (w = 0; w < ((width + 1) >> 1); w++) {
       // Vertical and horizontal sub-sampling
       // 1. Convert to RGB888
       // 2. Shift to adequate location (in the 16 bit word) - RGB 565

       tmp_r = (int32)((mapYc[y1[0]] + mapVcr[interlacedSrc[1]] + 128) >> 8);
       tmp_g = (int32)((mapYc[y1[0]] + mapUcg[interlacedSrc[0]]
                       + mapVcg[interlacedSrc[1]] + 128) >> 8);
       tmp_b = (int32)((mapYc[y1[0]] + mapUcb[interlacedSrc[0]] + 128) >> 8);
       out[0]  = (uint16)((Clip(tmp_r) & 0xf8) << 8) + ((Clip(tmp_g)
                           & 0xfc) << 3) + (Clip(tmp_b) >> 3);

       tmp_r = (int32)((mapYc[y1[1]] + mapVcr[interlacedSrc[1]] + 128) >> 8);
       tmp_g = (int32)((mapYc[y1[1]] + mapUcg[interlacedSrc[0]]
                       + mapVcg[interlacedSrc[1]] + 128) >> 8);
       tmp_b = (int32)((mapYc[y1[1]] + mapUcb[interlacedSrc[0]] + 128) >> 8);
       out[1] = (uint16)((Clip(tmp_r) & 0xf8) << 8) + ((Clip(tmp_g)
                          & 0xfc) << 3) + (Clip(tmp_b ) >> 3);

       tmp_r = (int32)((mapYc[y2[0]] + mapVcr[interlacedSrc[1]] + 128) >> 8);
       tmp_g = (int32)((mapYc[y2[0]] + mapUcg[interlacedSrc[0]]
                       + mapVcg[interlacedSrc[1]] + 128) >> 8);
       tmp_b = (int32)((mapYc[y2[0]] + mapUcb[interlacedSrc[0]] + 128) >> 8);
       out2[0] = (uint16)((Clip(tmp_r) & 0xf8) << 8) + ((Clip(tmp_g)
                           & 0xfc) << 3) + (Clip(tmp_b) >> 3);

       tmp_r = (int32)((mapYc[y2[1]] + mapVcr[interlacedSrc[1]]
                       + 128) >> 8);
       tmp_g = (int32)((mapYc[y2[1]] + mapUcg[interlacedSrc[0]]
                       + mapVcg[interlacedSrc[1]] + 128) >> 8);
       tmp_b = (int32)((mapYc[y2[1]] + mapUcb[interlacedSrc[0]] + 128) >> 8);
       out2[1] = (uint16)((Clip(tmp_r) & 0xf8) << 8) + ((Clip(tmp_g)
                           & 0xfc) << 3) + (Clip(tmp_b) >> 3);

       y1 += 2;
       y2 += 2;
       out += 2;
       out2 += 2;
       interlacedSrc += 2;
     }
     y1 += 2 * src_stride_y - width;
     y2 += 2 * src_stride_y - width;
     interlacedSrc += src_stride_uv - ((width + 1) >> 1);
     out -= 3 * dst_stride_frame + dst_stride_frame - width;
     out2 -= 3 * dst_stride_frame + dst_stride_frame - width;
   }
   return 0;
 }

 // TODO(fbarchard): Deprecated - this is same as BG24ToARGB with -height
 int RGB24ToARGB(const uint8* src_frame, int src_stride_frame,
                 uint8* dst_frame, int dst_stride_frame,
                 int width, int height) {
   if (src_frame == NULL || dst_frame == NULL) {
     return -1;
   }

   int i, j, offset;
   uint8* outFrame = dst_frame;
   const uint8* inFrame = src_frame;

   outFrame += dst_stride_frame * (height - 1) * 4;
   for (i = 0; i < height; i++) {
     for (j = 0; j < width; j++) {
       offset = j * 4;
       outFrame[0 + offset] = inFrame[0];
       outFrame[1 + offset] = inFrame[1];
       outFrame[2 + offset] = inFrame[2];
       outFrame[3 + offset] = 0xff;
       inFrame += 3;
     }
     outFrame -= 4 * (dst_stride_frame - width);
     inFrame += src_stride_frame - width;
   }
   return 0;
 }

 int ARGBToI420(const uint8* src_frame, int src_stride_frame,
                uint8* dst_y, int dst_stride_y,
                uint8* dst_u, int dst_stride_u,
                uint8* dst_v, int dst_stride_v,
                int width, int height) {
   if (height < 0) {
     height = -height;
     src_frame = src_frame + (height - 1) * src_stride_frame;
     src_stride_frame = -src_stride_frame;
   }
   void (*ARGBToYRow)(const uint8* src_argb, uint8* dst_y, int pix);
   void (*ARGBToUVRow)(const uint8* src_argb0, int src_stride_argb,
                       uint8* dst_u, uint8* dst_v, int width);
 #if defined(HAS_ARGBTOYROW_SSSE3)
   if (TestCpuFlag(kCpuHasSSSE3) &&
       IS_ALIGNED(width, 16) &&
       IS_ALIGNED(src_frame, 16) && IS_ALIGNED(src_stride_frame, 16) &&
       IS_ALIGNED(dst_y, 16) && IS_ALIGNED(dst_stride_y, 16)) {
     ARGBToYRow = ARGBToYRow_SSSE3;
   } else
 #endif
   {
     ARGBToYRow = ARGBToYRow_C;
   }
 #if defined(HAS_ARGBTOUVROW_SSSE3)
   if (TestCpuFlag(kCpuHasSSSE3) &&
       IS_ALIGNED(width, 16) &&
       IS_ALIGNED(src_frame, 16) && IS_ALIGNED(src_stride_frame, 16) &&
       IS_ALIGNED(dst_u, 8) && IS_ALIGNED(dst_stride_u, 8) &&
       IS_ALIGNED(dst_v, 8) && IS_ALIGNED(dst_stride_v, 8)) {
     ARGBToUVRow = ARGBToUVRow_SSSE3;
   } else
 #endif
   {
     ARGBToUVRow = ARGBToUVRow_C;
   }

   for (int y = 0; y < (height - 1); y += 2) {
     ARGBToUVRow(src_frame, src_stride_frame, dst_u, dst_v, width);
     ARGBToYRow(src_frame, dst_y, width);
     ARGBToYRow(src_frame + src_stride_frame, dst_y + dst_stride_y, width);
     src_frame += src_stride_frame * 2;
     dst_y += dst_stride_y * 2;
     dst_u += dst_stride_u;
     dst_v += dst_stride_v;
   }
   if (height & 1) {
     ARGBToUVRow(src_frame, 0, dst_u, dst_v, width);
     ARGBToYRow(src_frame, dst_y, width);
   }
   return 0;
 }

 int BGRAToI420(const uint8* src_frame, int src_stride_frame,
                uint8* dst_y, int dst_stride_y,
                uint8* dst_u, int dst_stride_u,
                uint8* dst_v, int dst_stride_v,
                int width, int height) {
   if (height < 0) {
     height = -height;
     src_frame = src_frame + (height - 1) * src_stride_frame;
     src_stride_frame = -src_stride_frame;
   }
   void (*ARGBToYRow)(const uint8* src_argb, uint8* dst_y, int pix);
   void (*ARGBToUVRow)(const uint8* src_argb0, int src_stride_argb,
                       uint8* dst_u, uint8* dst_v, int width);
 #if defined(HAS_BGRATOYROW_SSSE3)
   if (TestCpuFlag(kCpuHasSSSE3) &&
       IS_ALIGNED(width, 16) &&
       IS_ALIGNED(src_frame, 16) && IS_ALIGNED(src_stride_frame, 16) &&
       IS_ALIGNED(dst_y, 16) && IS_ALIGNED(dst_stride_y, 16)) {
     ARGBToYRow = BGRAToYRow_SSSE3;
   } else
 #endif
   {
     ARGBToYRow = BGRAToYRow_C;
   }
 #if defined(HAS_BGRATOUVROW_SSSE3)
   if (TestCpuFlag(kCpuHasSSSE3) &&
       IS_ALIGNED(width, 16) &&
       IS_ALIGNED(src_frame, 16) && IS_ALIGNED(src_stride_frame, 16) &&
       IS_ALIGNED(dst_u, 8) && IS_ALIGNED(dst_stride_u, 8) &&
       IS_ALIGNED(dst_v, 8) && IS_ALIGNED(dst_stride_v, 8)) {
     ARGBToUVRow = BGRAToUVRow_SSSE3;
   } else
 #endif
   {
     ARGBToUVRow = BGRAToUVRow_C;
   }

   for (int y = 0; y < (height - 1); y += 2) {
     ARGBToUVRow(src_frame, src_stride_frame, dst_u, dst_v, width);
     ARGBToYRow(src_frame, dst_y, width);
     ARGBToYRow(src_frame + src_stride_frame, dst_y + dst_stride_y, width);
     src_frame += src_stride_frame * 2;
     dst_y += dst_stride_y * 2;
     dst_u += dst_stride_u;
     dst_v += dst_stride_v;
   }
   if (height & 1) {
     ARGBToUVRow(src_frame, 0, dst_u, dst_v, width);
     ARGBToYRow(src_frame, dst_y, width);
   }
   return 0;
 }

 int ABGRToI420(const uint8* src_frame, int src_stride_frame,
                uint8* dst_y, int dst_stride_y,
                uint8* dst_u, int dst_stride_u,
                uint8* dst_v, int dst_stride_v,
                int width, int height) {
   if (height < 0) {
     height = -height;
     src_frame = src_frame + (height - 1) * src_stride_frame;
     src_stride_frame = -src_stride_frame;
   }
   void (*ARGBToYRow)(const uint8* src_argb, uint8* dst_y, int pix);
   void (*ARGBToUVRow)(const uint8* src_argb0, int src_stride_argb,
                       uint8* dst_u, uint8* dst_v, int width);
 #if defined(HAS_ABGRTOYROW_SSSE3)
   if (TestCpuFlag(kCpuHasSSSE3) &&
       IS_ALIGNED(width, 16) &&
       IS_ALIGNED(src_frame, 16) && IS_ALIGNED(src_stride_frame, 16) &&
       IS_ALIGNED(dst_y, 16) && IS_ALIGNED(dst_stride_y, 16)) {
     ARGBToYRow = ABGRToYRow_SSSE3;
   } else
 #endif
   {
     ARGBToYRow = ABGRToYRow_C;
   }
 #if defined(HAS_ABGRTOUVROW_SSSE3)
   if (TestCpuFlag(kCpuHasSSSE3) &&
       IS_ALIGNED(width, 16) &&
       IS_ALIGNED(src_frame, 16) && IS_ALIGNED(src_stride_frame, 16) &&
       IS_ALIGNED(dst_u, 8) && IS_ALIGNED(dst_stride_u, 8) &&
       IS_ALIGNED(dst_v, 8) && IS_ALIGNED(dst_stride_v, 8)) {
     ARGBToUVRow = ABGRToUVRow_SSSE3;
   } else
 #endif
   {
     ARGBToUVRow = ABGRToUVRow_C;
   }

   for (int y = 0; y < (height - 1); y += 2) {
     ARGBToUVRow(src_frame, src_stride_frame, dst_u, dst_v, width);
     ARGBToYRow(src_frame, dst_y, width);
     ARGBToYRow(src_frame + src_stride_frame, dst_y + dst_stride_y, width);
     src_frame += src_stride_frame * 2;
     dst_y += dst_stride_y * 2;
     dst_u += dst_stride_u;
     dst_v += dst_stride_v;
   }
   if (height & 1) {
     ARGBToUVRow(src_frame, 0, dst_u, dst_v, width);
     ARGBToYRow(src_frame, dst_y, width);
   }
   return 0;
 }

 int RGB24ToI420(const uint8* src_frame, int src_stride_frame,
                 uint8* dst_y, int dst_stride_y,
                 uint8* dst_u, int dst_stride_u,
                 uint8* dst_v, int dst_stride_v,
                 int width, int height) {
   if (height < 0) {
     height = -height;
     src_frame = src_frame + (height - 1) * src_stride_frame;
     src_stride_frame = -src_stride_frame;
   }
   void (*ARGBToYRow)(const uint8* src_argb, uint8* dst_y, int pix);
   void (*ARGBToUVRow)(const uint8* src_argb0, int src_stride_argb,
                       uint8* dst_u, uint8* dst_v, int width);
 #if defined(HAS_RGB24TOYROW_SSSE3)
   if (TestCpuFlag(kCpuHasSSSE3) &&
       IS_ALIGNED(width, 16) &&
       IS_ALIGNED(src_frame, 16) && IS_ALIGNED(src_stride_frame, 16) &&
       IS_ALIGNED(dst_y, 16) && IS_ALIGNED(dst_stride_y, 16)) {
     ARGBToYRow = RGB24ToYRow_SSSE3;
   } else
 #endif
   {
     ARGBToYRow = RGB24ToYRow_C;
   }
 #if defined(HAS_RGB24TOUVROW_SSSE3)
   if (TestCpuFlag(kCpuHasSSSE3) &&
       IS_ALIGNED(width, 16) &&
       IS_ALIGNED(src_frame, 16) && IS_ALIGNED(src_stride_frame, 16) &&
       IS_ALIGNED(dst_u, 8) && IS_ALIGNED(dst_stride_u, 8) &&
       IS_ALIGNED(dst_v, 8) && IS_ALIGNED(dst_stride_v, 8)) {
     ARGBToUVRow = RGB24ToUVRow_SSSE3;
   } else
 #endif
   {
     ARGBToUVRow = RGB24ToUVRow_C;
   }

   for (int y = 0; y < (height - 1); y += 2) {
     ARGBToUVRow(src_frame, src_stride_frame, dst_u, dst_v, width);
     ARGBToYRow(src_frame, dst_y, width);
     ARGBToYRow(src_frame + src_stride_frame, dst_y + dst_stride_y, width);
     src_frame += src_stride_frame * 2;
     dst_y += dst_stride_y * 2;
     dst_u += dst_stride_u;
     dst_v += dst_stride_v;
   }
   if (height & 1) {
     ARGBToUVRow(src_frame, 0, dst_u, dst_v, width);
     ARGBToYRow(src_frame, dst_y, width);
   }
   return 0;
 }

 int RAWToI420(const uint8* src_frame, int src_stride_frame,
               uint8* dst_y, int dst_stride_y,
               uint8* dst_u, int dst_stride_u,
               uint8* dst_v, int dst_stride_v,
               int width, int height) {
   if (height < 0) {
     height = -height;
     src_frame = src_frame + (height - 1) * src_stride_frame;
     src_stride_frame = -src_stride_frame;
   }
   void (*ARGBToYRow)(const uint8* src_argb, uint8* dst_y, int pix);
   void (*ARGBToUVRow)(const uint8* src_argb0, int src_stride_argb,
                       uint8* dst_u, uint8* dst_v, int width);
 #if defined(HAS_RAWTOYROW_SSSE3)
   if (TestCpuFlag(kCpuHasSSSE3) &&
       IS_ALIGNED(width, 16) &&
       IS_ALIGNED(src_frame, 16) && IS_ALIGNED(src_stride_frame, 16) &&
       IS_ALIGNED(dst_y, 16) && IS_ALIGNED(dst_stride_y, 16)) {
     ARGBToYRow = RAWToYRow_SSSE3;
   } else
 #endif
   {
     ARGBToYRow = RAWToYRow_C;
   }
 #if defined(HAS_RAWTOUVROW_SSSE3)
   if (TestCpuFlag(kCpuHasSSSE3) &&
       IS_ALIGNED(width, 16) &&
       IS_ALIGNED(src_frame, 16) && IS_ALIGNED(src_stride_frame, 16) &&
       IS_ALIGNED(dst_u, 8) && IS_ALIGNED(dst_stride_u, 8) &&
       IS_ALIGNED(dst_v, 8) && IS_ALIGNED(dst_stride_v, 8)) {
     ARGBToUVRow = RAWToUVRow_SSSE3;
   } else
 #endif
   {
     ARGBToUVRow = RAWToUVRow_C;
   }

   for (int y = 0; y < (height - 1); y += 2) {
     ARGBToUVRow(src_frame, src_stride_frame, dst_u, dst_v, width);
     ARGBToYRow(src_frame, dst_y, width);
     ARGBToYRow(src_frame + src_stride_frame, dst_y + dst_stride_y, width);
     src_frame += src_stride_frame * 2;
     dst_y += dst_stride_y * 2;
     dst_u += dst_stride_u;
     dst_v += dst_stride_v;
   }
   if (height & 1) {
     ARGBToUVRow(src_frame, 0, dst_u, dst_v, width);
     ARGBToYRow(src_frame, dst_y, width);
   }
   return 0;
 }

 // Convert camera sample to I420 with cropping, rotation and vertical flip.
 // src_width is used for source stride computation
 // src_height is used to compute location of planes, and indicate inversion
 // TODO(fbarchard): sample_size should be used to ensure the low levels do
 // not read outside the buffer provided.  It is measured in bytes and is the
 // size of the frame.  With MJPEG it is the compressed size of the frame.
 int ConvertToI420(const uint8* sample, size_t sample_size,
                   uint8* y, int y_stride,
                   uint8* u, int u_stride,
                   uint8* v, int v_stride,
                   int crop_x, int crop_y,
                   int src_width, int src_height,
                   int dst_width, int dst_height,
                   RotationMode rotation,
                   uint32 format) {
   if (y == NULL || u == NULL || v == NULL || sample == NULL) {
     return -1;
   }
   int aligned_src_width = (src_width + 1) & ~1;
   const uint8* src;
   const uint8* src_uv;
   int abs_src_height = (src_height < 0) ? -src_height : src_height;
   int inv_dst_height = (dst_height < 0) ? -dst_height : dst_height;
   if (src_height < 0) {
     inv_dst_height = -inv_dst_height;
   }

   switch (format) {
     // Single plane formats
     case FOURCC_YUY2:
       src = sample + (aligned_src_width * crop_y + crop_x) * 2 ;
       YUY2ToI420(src, aligned_src_width * 2,
                  y, y_stride,
                  u, u_stride,
                  v, v_stride,
                  dst_width, inv_dst_height);
       break;
     case FOURCC_UYVY:
       src = sample + (aligned_src_width * crop_y + crop_x) * 2;
       UYVYToI420(src, aligned_src_width * 2,
                  y, y_stride,
                  u, u_stride,
                  v, v_stride,
                  dst_width, inv_dst_height);
       break;
     case FOURCC_24BG:
       src = sample + (src_width * crop_y + crop_x) * 3;
       RGB24ToI420(src, src_width * 3,
                   y, y_stride,
                   u, u_stride,
                   v, v_stride,
                   dst_width, inv_dst_height);
       break;
     case FOURCC_RAW:
       src = sample + (src_width * crop_y + crop_x) * 3;
       RAWToI420(src, src_width * 3,
                 y, y_stride,
                 u, u_stride,
                 v, v_stride,
                 dst_width, inv_dst_height);
       break;
     case FOURCC_ARGB:
       src = sample + (src_width * crop_y + crop_x) * 4;
       ARGBToI420(src, src_width * 4,
                  y, y_stride,
                  u, u_stride,
                  v, v_stride,
                  dst_width, inv_dst_height);
       break;
     case FOURCC_BGRA:
       src = sample + (src_width * crop_y + crop_x) * 4;
       BGRAToI420(src, src_width * 4,
                  y, y_stride,
                  u, u_stride,
                  v, v_stride,
                  dst_width, inv_dst_height);
       break;
     case FOURCC_ABGR:
       src = sample + (src_width * crop_y + crop_x) * 4;
       ABGRToI420(src, src_width * 4,
                  y, y_stride,
                  u, u_stride,
                  v, v_stride,
                  dst_width, inv_dst_height);
       break;
     case FOURCC_BGGR:
     case FOURCC_RGGB:
     case FOURCC_GRBG:
     case FOURCC_GBRG:
       // TODO(fbarchard): Support cropping by odd numbers by adjusting fourcc.
       src = sample + (src_width * crop_y + crop_x);
       BayerRGBToI420(src, src_width, format,
                      y, y_stride, u, u_stride, v, v_stride,
                      dst_width, inv_dst_height);
       break;
     case FOURCC_I400:
       src = sample + src_width * crop_y + crop_x;
       I400ToI420(src, src_width,
                  y, y_stride,
                  u, u_stride,
                  v, v_stride,
                  dst_width, inv_dst_height);
       break;

     // Biplanar formats
     case FOURCC_NV12:
       src = sample + (src_width * crop_y + crop_x);
       src_uv = sample + aligned_src_width * (src_height + crop_y / 2) + crop_x;
       NV12ToI420Rotate(src, src_width,
                        src_uv, aligned_src_width,
                        y, y_stride,
                        u, u_stride,
                        v, v_stride,
                        dst_width, inv_dst_height, rotation);
       break;
     case FOURCC_NV21:
       src = sample + (src_width * crop_y + crop_x);
       src_uv = sample + aligned_src_width * (src_height + crop_y / 2) + crop_x;
       // Call NV12 but with u and v parameters swapped.
       NV12ToI420Rotate(src, src_width,
                        src_uv, aligned_src_width,
                        y, y_stride,
                        u, u_stride,
                        v, v_stride,
                        dst_width, inv_dst_height, rotation);
       break;
     case FOURCC_M420:
       src = sample + (src_width * crop_y) * 12 / 8 + crop_x;
       M420ToI420(src, src_width,
                  y, y_stride,
                  u, u_stride,
                  v, v_stride,
                  dst_width, inv_dst_height);
       break;
     case FOURCC_Q420:
       src = sample + (src_width + aligned_src_width * 2) * crop_y + crop_x;
       src_uv = sample + (src_width + aligned_src_width * 2) * crop_y +
                src_width + crop_x * 2;
       Q420ToI420(src, src_width * 3,
                  src_uv, src_width * 3,
                  y, y_stride,
                  u, u_stride,
                  v, v_stride,
                  dst_width, inv_dst_height);
       break;
     // Triplanar formats
     case FOURCC_I420:
     case FOURCC_YV12: {
       const uint8* src_y = sample + (src_width * crop_y + crop_x);
       const uint8* src_u;
       const uint8* src_v;
       int halfwidth = (src_width + 1) / 2;
       int halfheight = (abs_src_height + 1) / 2;
       if (format == FOURCC_I420) {
         src_u = sample + src_width * abs_src_height +
             (halfwidth * crop_y + crop_x) / 2;
         src_v = sample + src_width * abs_src_height +
             halfwidth * (halfheight + crop_y / 2) + crop_x / 2;
       } else {
         src_v = sample + src_width * abs_src_height +
             (halfwidth * crop_y + crop_x) / 2;
         src_u = sample + src_width * abs_src_height +
             halfwidth * (halfheight + crop_y / 2) + crop_x / 2;
       }
       I420Rotate(src_y, src_width,
                  src_u, halfwidth,
                  src_v, halfwidth,
                  y, y_stride,
                  u, u_stride,
                  v, v_stride,
                  dst_width, inv_dst_height, rotation);
       break;
     }
     case FOURCC_I422:
     case FOURCC_YV16: {
       const uint8* src_y = sample + src_width * crop_y + crop_x;
       const uint8* src_u;
       const uint8* src_v;
       int halfwidth = (src_width + 1) / 2;
       if (format == FOURCC_I422) {
         src_u = sample + src_width * abs_src_height +
             halfwidth * crop_y + crop_x / 2;
         src_v = sample + src_width * abs_src_height +
             halfwidth * (abs_src_height + crop_y) + crop_x / 2;
       } else {
         src_v = sample + src_width * abs_src_height +
             halfwidth * crop_y + crop_x / 2;
         src_u = sample + src_width * abs_src_height +
             halfwidth * (abs_src_height + crop_y) + crop_x / 2;
       }
       I422ToI420(src_y, src_width,
                  src_u, halfwidth,
                  src_v, halfwidth,
                  y, y_stride,
                  u, u_stride,
                  v, v_stride,
                  dst_width, inv_dst_height);
       break;
     }
     case FOURCC_I444:
     case FOURCC_YV24: {
       const uint8* src_y = sample + src_width * crop_y + crop_x;
       const uint8* src_u;
       const uint8* src_v;
       if (format == FOURCC_I444) {
         src_u = sample + src_width * (abs_src_height + crop_y) + crop_x;
         src_v = sample + src_width * (abs_src_height * 2 + crop_y) + crop_x;
       } else {
         src_v = sample + src_width * (abs_src_height + crop_y) + crop_x;
         src_u = sample + src_width * (abs_src_height * 2 + crop_y) + crop_x;
       }
       I444ToI420(src_y, src_width,
                  src_u, src_width,
                  src_v, src_width,
                  y, y_stride,
                  u, u_stride,
                  v, v_stride,
                  dst_width, inv_dst_height);
       break;
     }
     // Formats not supported
     case FOURCC_MJPG:
     default:
       return -1;  // unknown fourcc - return failure code.
   }
   return 0;
 }

 #ifdef __cplusplus
 }  // extern "C"
 }  // namespace libyuv
 #endif