| /* | 
 |  * Copyright (c) 2021, Alliance for Open Media. All rights reserved | 
 |  * | 
 |  * This source code is subject to the terms of the BSD 3-Clause Clear License and the | 
 |  * Alliance for Open Media Patent License 1.0. If the BSD 3-Clause Clear License was | 
 |  * not distributed with this source code in the LICENSE file, you can obtain it | 
 |  * at aomedia.org/license/software-license/bsd-3-c-c/.  If the Alliance for Open Media Patent | 
 |  * License 1.0 was not distributed with this source code in the PATENTS file, you | 
 |  * can obtain it at aomedia.org/license/patent-license/. | 
 |  */ | 
 |  | 
 | #ifndef INCLUDE_LIBYUV_ROW_H_  // NOLINT | 
 | #define INCLUDE_LIBYUV_ROW_H_ | 
 |  | 
 | #include <stdlib.h>  // For malloc. | 
 |  | 
 | #include "libyuv/basic_types.h" | 
 |  | 
 | #ifdef __cplusplus | 
 | namespace libyuv { | 
 | extern "C" { | 
 | #endif | 
 |  | 
 | #define IS_ALIGNED(p, a) (!((uintptr_t)(p) & ((a) - 1))) | 
 |  | 
 | #ifdef __cplusplus | 
 | #define align_buffer_64(var, size)                                             \ | 
 |   uint8* var##_mem = reinterpret_cast<uint8*>(malloc((size) + 63));            \ | 
 |   uint8* var = reinterpret_cast<uint8*>                                        \ | 
 |       ((reinterpret_cast<intptr_t>(var##_mem) + 63) & ~63) | 
 | #else | 
 | #define align_buffer_64(var, size)                                             \ | 
 |   uint8* var##_mem = (uint8*)(malloc((size) + 63));               /* NOLINT */ \ | 
 |   uint8* var = (uint8*)(((intptr_t)(var##_mem) + 63) & ~63)       /* NOLINT */ | 
 | #endif | 
 |  | 
 | #define free_aligned_buffer_64(var) \ | 
 |   free(var##_mem);  \ | 
 |   var = 0 | 
 |  | 
 | #if defined(__pnacl__) || defined(__CLR_VER) || \ | 
 |     (defined(__i386__) && !defined(__SSE2__)) | 
 | #define LIBYUV_DISABLE_X86 | 
 | #endif | 
 | // True if compiling for SSSE3 as a requirement. | 
 | #if defined(__SSSE3__) || (defined(_M_IX86_FP) && (_M_IX86_FP >= 3)) | 
 | #define LIBYUV_SSSE3_ONLY | 
 | #endif | 
 |  | 
 | #if defined(__native_client__) | 
 | #define LIBYUV_DISABLE_NEON | 
 | #endif | 
 | // clang >= 3.5.0 required for Arm64. | 
 | #if defined(__clang__) && defined(__aarch64__) && !defined(LIBYUV_DISABLE_NEON) | 
 | #if (__clang_major__ < 3) || (__clang_major__ == 3 && (__clang_minor__ < 5)) | 
 | #define LIBYUV_DISABLE_NEON | 
 | #endif  // clang >= 3.5 | 
 | #endif  // __clang__ | 
 |  | 
 | // The following are available on all x86 platforms: | 
 | #if !defined(LIBYUV_DISABLE_X86) && \ | 
 |     (defined(_M_IX86) || defined(__x86_64__) || defined(__i386__)) | 
 | // Conversions: | 
 | #define HAS_ABGRTOUVROW_SSSE3 | 
 | #define HAS_ABGRTOYROW_SSSE3 | 
 | #define HAS_ARGB1555TOARGBROW_SSE2 | 
 | #define HAS_ARGB4444TOARGBROW_SSE2 | 
 | #define HAS_ARGBSETROW_X86 | 
 | #define HAS_ARGBSHUFFLEROW_SSE2 | 
 | #define HAS_ARGBSHUFFLEROW_SSSE3 | 
 | #define HAS_ARGBTOARGB1555ROW_SSE2 | 
 | #define HAS_ARGBTOARGB4444ROW_SSE2 | 
 | #define HAS_ARGBTORAWROW_SSSE3 | 
 | #define HAS_ARGBTORGB24ROW_SSSE3 | 
 | #define HAS_ARGBTORGB565ROW_SSE2 | 
 | #define HAS_ARGBTOUV422ROW_SSSE3 | 
 | #define HAS_ARGBTOUV444ROW_SSSE3 | 
 | #define HAS_ARGBTOUVJROW_SSSE3 | 
 | #define HAS_ARGBTOUVROW_SSSE3 | 
 | #define HAS_ARGBTOYJROW_SSSE3 | 
 | #define HAS_ARGBTOYROW_SSSE3 | 
 | #define HAS_BGRATOUVROW_SSSE3 | 
 | #define HAS_BGRATOYROW_SSSE3 | 
 | #define HAS_COPYROW_ERMS | 
 | #define HAS_COPYROW_SSE2 | 
 | #define HAS_I400TOARGBROW_SSE2 | 
 | #define HAS_I411TOARGBROW_SSSE3 | 
 | #define HAS_I422TOABGRROW_SSSE3 | 
 | #define HAS_I422TOARGB1555ROW_SSSE3 | 
 | #define HAS_I422TOARGB4444ROW_SSSE3 | 
 | #define HAS_I422TOARGBROW_SSSE3 | 
 | #define HAS_I422TOBGRAROW_SSSE3 | 
 | #define HAS_I422TORAWROW_SSSE3 | 
 | #define HAS_I422TORGB24ROW_SSSE3 | 
 | #define HAS_I422TORGB565ROW_SSSE3 | 
 | #define HAS_I422TORGBAROW_SSSE3 | 
 | #define HAS_I422TOUYVYROW_SSE2 | 
 | #define HAS_I422TOYUY2ROW_SSE2 | 
 | #define HAS_I444TOARGBROW_SSSE3 | 
 | #define HAS_J400TOARGBROW_SSE2 | 
 | #define HAS_J422TOARGBROW_SSSE3 | 
 | #define HAS_MERGEUVROW_SSE2 | 
 | #define HAS_MIRRORROW_SSE2 | 
 | #define HAS_MIRRORROW_SSSE3 | 
 | #define HAS_MIRRORROW_UV_SSSE3 | 
 | #define HAS_MIRRORUVROW_SSSE3 | 
 | #define HAS_NV12TOARGBROW_SSSE3 | 
 | #define HAS_NV12TORGB565ROW_SSSE3 | 
 | #define HAS_NV21TOARGBROW_SSSE3 | 
 | #define HAS_NV21TORGB565ROW_SSSE3 | 
 | #define HAS_RAWTOARGBROW_SSSE3 | 
 | #define HAS_RAWTOYROW_SSSE3 | 
 | #define HAS_RGB24TOARGBROW_SSSE3 | 
 | #define HAS_RGB24TOYROW_SSSE3 | 
 | #define HAS_RGB565TOARGBROW_SSE2 | 
 | #define HAS_RGBATOUVROW_SSSE3 | 
 | #define HAS_RGBATOYROW_SSSE3 | 
 | #define HAS_SETROW_ERMS | 
 | #define HAS_SETROW_X86 | 
 | #define HAS_SPLITUVROW_SSE2 | 
 | #define HAS_UYVYTOARGBROW_SSSE3 | 
 | #define HAS_UYVYTOUV422ROW_SSE2 | 
 | #define HAS_UYVYTOUVROW_SSE2 | 
 | #define HAS_UYVYTOYROW_SSE2 | 
 | #define HAS_YUY2TOARGBROW_SSSE3 | 
 | #define HAS_YUY2TOUV422ROW_SSE2 | 
 | #define HAS_YUY2TOUVROW_SSE2 | 
 | #define HAS_YUY2TOYROW_SSE2 | 
 |  | 
 | // Effects: | 
 | #define HAS_ARGBADDROW_SSE2 | 
 | #define HAS_ARGBAFFINEROW_SSE2 | 
 | #define HAS_ARGBATTENUATEROW_SSSE3 | 
 | #define HAS_ARGBBLENDROW_SSSE3 | 
 | #define HAS_ARGBCOLORMATRIXROW_SSSE3 | 
 | #define HAS_ARGBCOLORTABLEROW_X86 | 
 | #define HAS_ARGBCOPYALPHAROW_SSE2 | 
 | #define HAS_ARGBCOPYYTOALPHAROW_SSE2 | 
 | #define HAS_ARGBGRAYROW_SSSE3 | 
 | #define HAS_ARGBLUMACOLORTABLEROW_SSSE3 | 
 | #define HAS_ARGBMIRRORROW_SSE2 | 
 | #define HAS_ARGBMULTIPLYROW_SSE2 | 
 | #define HAS_ARGBPOLYNOMIALROW_SSE2 | 
 | #define HAS_ARGBQUANTIZEROW_SSE2 | 
 | #define HAS_ARGBSEPIAROW_SSSE3 | 
 | #define HAS_ARGBSHADEROW_SSE2 | 
 | #define HAS_ARGBSUBTRACTROW_SSE2 | 
 | #define HAS_ARGBUNATTENUATEROW_SSE2 | 
 | #define HAS_COMPUTECUMULATIVESUMROW_SSE2 | 
 | #define HAS_CUMULATIVESUMTOAVERAGEROW_SSE2 | 
 | #define HAS_INTERPOLATEROW_SSE2 | 
 | #define HAS_INTERPOLATEROW_SSSE3 | 
 | #define HAS_RGBCOLORTABLEROW_X86 | 
 | #define HAS_SOBELROW_SSE2 | 
 | #define HAS_SOBELTOPLANEROW_SSE2 | 
 | #define HAS_SOBELXROW_SSE2 | 
 | #define HAS_SOBELXYROW_SSE2 | 
 | #define HAS_SOBELYROW_SSE2 | 
 | #endif | 
 |  | 
 | // The following are available on x64 Visual C and clangcl. | 
 | #if !defined(LIBYUV_DISABLE_X86) && defined (_M_X64) && \ | 
 |     (!defined(__clang__) || defined(__SSSE3__)) | 
 | #define HAS_I422TOARGBROW_SSSE3 | 
 | #endif | 
 |  | 
 | // GCC >= 4.7.0 required for AVX2. | 
 | #if defined(__GNUC__) && (defined(__x86_64__) || defined(__i386__)) | 
 | #if (__GNUC__ > 4) || (__GNUC__ == 4 && (__GNUC_MINOR__ >= 7)) | 
 | #define GCC_HAS_AVX2 1 | 
 | #endif  // GNUC >= 4.7 | 
 | #endif  // __GNUC__ | 
 |  | 
 | // clang >= 3.4.0 required for AVX2. | 
 | #if defined(__clang__) && (defined(__x86_64__) || defined(__i386__)) | 
 | #if (__clang_major__ > 3) || (__clang_major__ == 3 && (__clang_minor__ >= 4)) | 
 | #define CLANG_HAS_AVX2 1 | 
 | #endif  // clang >= 3.4 | 
 | #endif  // __clang__ | 
 |  | 
 | // Visual C 2012 required for AVX2. | 
 | #if defined(_M_IX86) && !defined(__clang__) && \ | 
 |     defined(_MSC_VER) && _MSC_VER >= 1700 | 
 | #define VISUALC_HAS_AVX2 1 | 
 | #endif  // VisualStudio >= 2012 | 
 |  | 
 | // The following are available require VS2012.  Port to GCC. | 
 | #if !defined(LIBYUV_DISABLE_X86) && defined(VISUALC_HAS_AVX2) | 
 | #define HAS_ARGB1555TOARGBROW_AVX2 | 
 | #define HAS_ARGB4444TOARGBROW_AVX2 | 
 | #define HAS_ARGBTOARGB1555ROW_AVX2 | 
 | #define HAS_ARGBTOARGB4444ROW_AVX2 | 
 | #define HAS_ARGBTORGB565DITHERROW_AVX2 | 
 | #define HAS_ARGBTORGB565DITHERROW_SSE2 | 
 | #define HAS_ARGBTORGB565ROW_AVX2 | 
 | #define HAS_I411TOARGBROW_AVX2 | 
 | #define HAS_I422TOARGB1555ROW_AVX2 | 
 | #define HAS_I422TOARGB4444ROW_AVX2 | 
 | #define HAS_I422TORGB565ROW_AVX2 | 
 | #define HAS_I444TOARGBROW_AVX2 | 
 | #define HAS_J400TOARGBROW_AVX2 | 
 | #define HAS_NV12TOARGBROW_AVX2 | 
 | #define HAS_NV12TORGB565ROW_AVX2 | 
 | #define HAS_NV21TOARGBROW_AVX2 | 
 | #define HAS_NV21TORGB565ROW_AVX2 | 
 | #define HAS_RGB565TOARGBROW_AVX2 | 
 | #endif | 
 |  | 
 | // The following are available on all x86 platforms, but | 
 | // require VS2012, clang 3.4 or gcc 4.7. | 
 | // The code supports NaCL but requires a new compiler and validator. | 
 | #if !defined(LIBYUV_DISABLE_X86) && (defined(VISUALC_HAS_AVX2) || \ | 
 |     defined(CLANG_HAS_AVX2) || defined(GCC_HAS_AVX2)) | 
 | #define HAS_ARGBCOPYALPHAROW_AVX2 | 
 | #define HAS_ARGBCOPYYTOALPHAROW_AVX2 | 
 | #define HAS_ARGBMIRRORROW_AVX2 | 
 | #define HAS_ARGBPOLYNOMIALROW_AVX2 | 
 | #define HAS_ARGBSHUFFLEROW_AVX2 | 
 | #define HAS_ARGBTOUVROW_AVX2 | 
 | #define HAS_ARGBTOYJROW_AVX2 | 
 | #define HAS_ARGBTOYROW_AVX2 | 
 | #define HAS_COPYROW_AVX | 
 | #define HAS_I400TOARGBROW_AVX2 | 
 | #define HAS_I422TOABGRROW_AVX2 | 
 | #define HAS_I422TOARGBROW_AVX2 | 
 | #define HAS_I422TOBGRAROW_AVX2 | 
 | #define HAS_I422TORAWROW_AVX2 | 
 | #define HAS_I422TORGB24ROW_AVX2 | 
 | #define HAS_I422TORGBAROW_AVX2 | 
 | #define HAS_INTERPOLATEROW_AVX2 | 
 | #define HAS_J422TOARGBROW_AVX2 | 
 | #define HAS_MERGEUVROW_AVX2 | 
 | #define HAS_MIRRORROW_AVX2 | 
 | #define HAS_SPLITUVROW_AVX2 | 
 | #define HAS_UYVYTOARGBROW_AVX2 | 
 | #define HAS_UYVYTOUV422ROW_AVX2 | 
 | #define HAS_UYVYTOUVROW_AVX2 | 
 | #define HAS_UYVYTOYROW_AVX2 | 
 | #define HAS_YUY2TOARGBROW_AVX2 | 
 | #define HAS_YUY2TOUV422ROW_AVX2 | 
 | #define HAS_YUY2TOUVROW_AVX2 | 
 | #define HAS_YUY2TOYROW_AVX2 | 
 |  | 
 | // Effects: | 
 | #define HAS_ARGBADDROW_AVX2 | 
 | #define HAS_ARGBATTENUATEROW_AVX2 | 
 | #define HAS_ARGBMULTIPLYROW_AVX2 | 
 | #define HAS_ARGBSUBTRACTROW_AVX2 | 
 | #define HAS_ARGBUNATTENUATEROW_AVX2 | 
 | #endif | 
 |  | 
 | // The following are disabled when SSSE3 is available: | 
 | #if !defined(LIBYUV_DISABLE_X86) && \ | 
 |     (defined(_M_IX86) || defined(__x86_64__) || defined(__i386__)) && \ | 
 |     !defined(LIBYUV_SSSE3_ONLY) | 
 | #define HAS_ARGBATTENUATEROW_SSE2 | 
 | #define HAS_ARGBBLENDROW_SSE2 | 
 | #define HAS_MIRRORROW_SSE2 | 
 | #endif | 
 |  | 
 | // The following are available on Neon platforms: | 
 | #if !defined(LIBYUV_DISABLE_NEON) && \ | 
 |     (defined(__aarch64__) || defined(__ARM_NEON__) || defined(LIBYUV_NEON)) | 
 | #define HAS_ABGRTOUVROW_NEON | 
 | #define HAS_ABGRTOYROW_NEON | 
 | #define HAS_ARGB1555TOARGBROW_NEON | 
 | #define HAS_ARGB1555TOUVROW_NEON | 
 | #define HAS_ARGB1555TOYROW_NEON | 
 | #define HAS_ARGB4444TOARGBROW_NEON | 
 | #define HAS_ARGB4444TOUVROW_NEON | 
 | #define HAS_ARGB4444TOYROW_NEON | 
 | #define HAS_ARGBTOARGB1555ROW_NEON | 
 | #define HAS_ARGBTOARGB4444ROW_NEON | 
 | #define HAS_ARGBTORAWROW_NEON | 
 | #define HAS_ARGBTORGB24ROW_NEON | 
 | #define HAS_ARGBTORGB565ROW_NEON | 
 | #define HAS_ARGBTOUV411ROW_NEON | 
 | #define HAS_ARGBTOUV422ROW_NEON | 
 | #define HAS_ARGBTOUV444ROW_NEON | 
 | #define HAS_ARGBTOUVJROW_NEON | 
 | #define HAS_ARGBTOUVROW_NEON | 
 | #define HAS_ARGBTOYJROW_NEON | 
 | #define HAS_ARGBTOYROW_NEON | 
 | #define HAS_BGRATOUVROW_NEON | 
 | #define HAS_BGRATOYROW_NEON | 
 | #define HAS_COPYROW_NEON | 
 | #define HAS_J400TOARGBROW_NEON | 
 | #define HAS_I411TOARGBROW_NEON | 
 | #define HAS_I422TOABGRROW_NEON | 
 | #define HAS_I422TOARGB1555ROW_NEON | 
 | #define HAS_I422TOARGB4444ROW_NEON | 
 | #define HAS_I422TOARGBROW_NEON | 
 | #define HAS_I422TOBGRAROW_NEON | 
 | #define HAS_I422TORAWROW_NEON | 
 | #define HAS_I422TORGB24ROW_NEON | 
 | #define HAS_I422TORGB565ROW_NEON | 
 | #define HAS_I422TORGBAROW_NEON | 
 | #define HAS_I422TOUYVYROW_NEON | 
 | #define HAS_I422TOYUY2ROW_NEON | 
 | #define HAS_I444TOARGBROW_NEON | 
 | #define HAS_MERGEUVROW_NEON | 
 | #define HAS_MIRRORROW_NEON | 
 | #define HAS_MIRRORUVROW_NEON | 
 | #define HAS_NV12TOARGBROW_NEON | 
 | #define HAS_NV12TORGB565ROW_NEON | 
 | #define HAS_NV21TOARGBROW_NEON | 
 | #define HAS_NV21TORGB565ROW_NEON | 
 | #define HAS_RAWTOARGBROW_NEON | 
 | #define HAS_RAWTOUVROW_NEON | 
 | #define HAS_RAWTOYROW_NEON | 
 | #define HAS_RGB24TOARGBROW_NEON | 
 | #define HAS_RGB24TOUVROW_NEON | 
 | #define HAS_RGB24TOYROW_NEON | 
 | #define HAS_RGB565TOARGBROW_NEON | 
 | #define HAS_RGB565TOUVROW_NEON | 
 | #define HAS_RGB565TOYROW_NEON | 
 | #define HAS_RGBATOUVROW_NEON | 
 | #define HAS_RGBATOYROW_NEON | 
 | #define HAS_SETROW_NEON | 
 | #define HAS_ARGBSETROW_NEON | 
 | #define HAS_SPLITUVROW_NEON | 
 | #define HAS_UYVYTOARGBROW_NEON | 
 | #define HAS_UYVYTOUV422ROW_NEON | 
 | #define HAS_UYVYTOUVROW_NEON | 
 | #define HAS_UYVYTOYROW_NEON | 
 | #define HAS_I400TOARGBROW_NEON | 
 | #define HAS_YUY2TOARGBROW_NEON | 
 | #define HAS_YUY2TOUV422ROW_NEON | 
 | #define HAS_YUY2TOUVROW_NEON | 
 | #define HAS_YUY2TOYROW_NEON | 
 | #define HAS_ARGBTORGB565DITHERROW_NEON | 
 |  | 
 | // Effects: | 
 | #define HAS_ARGBADDROW_NEON | 
 | #define HAS_ARGBATTENUATEROW_NEON | 
 | #define HAS_ARGBBLENDROW_NEON | 
 | #define HAS_ARGBGRAYROW_NEON | 
 | #define HAS_ARGBMIRRORROW_NEON | 
 | #define HAS_ARGBMULTIPLYROW_NEON | 
 | #define HAS_ARGBQUANTIZEROW_NEON | 
 | #define HAS_ARGBSEPIAROW_NEON | 
 | #define HAS_ARGBSHADEROW_NEON | 
 | #define HAS_ARGBSUBTRACTROW_NEON | 
 | #define HAS_INTERPOLATEROW_NEON | 
 | #define HAS_SOBELROW_NEON | 
 | #define HAS_SOBELTOPLANEROW_NEON | 
 | #define HAS_SOBELXROW_NEON | 
 | #define HAS_SOBELXYROW_NEON | 
 | #define HAS_SOBELYROW_NEON | 
 | #define HAS_ARGBCOLORMATRIXROW_NEON | 
 | #define HAS_ARGBSHUFFLEROW_NEON | 
 | #endif | 
 |  | 
 | // The following are available on Mips platforms: | 
 | #if !defined(LIBYUV_DISABLE_MIPS) && defined(__mips__) && \ | 
 |     (_MIPS_SIM == _MIPS_SIM_ABI32) && (__mips_isa_rev < 6) | 
 | #define HAS_COPYROW_MIPS | 
 | #if defined(__mips_dsp) && (__mips_dsp_rev >= 2) | 
 | #define HAS_I422TOABGRROW_MIPS_DSPR2 | 
 | #define HAS_I422TOARGBROW_MIPS_DSPR2 | 
 | #define HAS_I422TOBGRAROW_MIPS_DSPR2 | 
 | #define HAS_INTERPOLATEROW_MIPS_DSPR2 | 
 | #define HAS_MIRRORROW_MIPS_DSPR2 | 
 | #define HAS_MIRRORUVROW_MIPS_DSPR2 | 
 | #define HAS_SPLITUVROW_MIPS_DSPR2 | 
 | #endif | 
 | #endif | 
 |  | 
 | #if defined(_MSC_VER) && !defined(__CLR_VER) | 
 | #define SIMD_ALIGNED(var) __declspec(align(16)) var | 
 | #define SIMD_ALIGNED32(var) __declspec(align(64)) var | 
 | typedef __declspec(align(16)) int16 vec16[8]; | 
 | typedef __declspec(align(16)) int32 vec32[4]; | 
 | typedef __declspec(align(16)) int8 vec8[16]; | 
 | typedef __declspec(align(16)) uint16 uvec16[8]; | 
 | typedef __declspec(align(16)) uint32 uvec32[4]; | 
 | typedef __declspec(align(16)) uint8 uvec8[16]; | 
 | typedef __declspec(align(32)) int16 lvec16[16]; | 
 | typedef __declspec(align(32)) int32 lvec32[8]; | 
 | typedef __declspec(align(32)) int8 lvec8[32]; | 
 | typedef __declspec(align(32)) uint16 ulvec16[16]; | 
 | typedef __declspec(align(32)) uint32 ulvec32[8]; | 
 | typedef __declspec(align(32)) uint8 ulvec8[32]; | 
 | #elif defined(__GNUC__) | 
 | // Caveat GCC 4.2 to 4.7 have a known issue using vectors with const. | 
 | #define SIMD_ALIGNED(var) var __attribute__((aligned(16))) | 
 | #define SIMD_ALIGNED32(var) var __attribute__((aligned(64))) | 
 | typedef int16 __attribute__((vector_size(16))) vec16; | 
 | typedef int32 __attribute__((vector_size(16))) vec32; | 
 | typedef int8 __attribute__((vector_size(16))) vec8; | 
 | typedef uint16 __attribute__((vector_size(16))) uvec16; | 
 | typedef uint32 __attribute__((vector_size(16))) uvec32; | 
 | typedef uint8 __attribute__((vector_size(16))) uvec8; | 
 | typedef int16 __attribute__((vector_size(32))) lvec16; | 
 | typedef int32 __attribute__((vector_size(32))) lvec32; | 
 | typedef int8 __attribute__((vector_size(32))) lvec8; | 
 | typedef uint16 __attribute__((vector_size(32))) ulvec16; | 
 | typedef uint32 __attribute__((vector_size(32))) ulvec32; | 
 | typedef uint8 __attribute__((vector_size(32))) ulvec8; | 
 | #else | 
 | #define SIMD_ALIGNED(var) var | 
 | #define SIMD_ALIGNED32(var) var | 
 | typedef int16 vec16[8]; | 
 | typedef int32 vec32[4]; | 
 | typedef int8 vec8[16]; | 
 | typedef uint16 uvec16[8]; | 
 | typedef uint32 uvec32[4]; | 
 | typedef uint8 uvec8[16]; | 
 | typedef int16 lvec16[16]; | 
 | typedef int32 lvec32[8]; | 
 | typedef int8 lvec8[32]; | 
 | typedef uint16 ulvec16[16]; | 
 | typedef uint32 ulvec32[8]; | 
 | typedef uint8 ulvec8[32]; | 
 | #endif | 
 |  | 
 | #if defined(__APPLE__) || defined(__x86_64__) || defined(__llvm__) | 
 | #define OMITFP | 
 | #else | 
 | #define OMITFP __attribute__((optimize("omit-frame-pointer"))) | 
 | #endif | 
 |  | 
 | // NaCL macros for GCC x86 and x64. | 
 | #if defined(__native_client__) | 
 | #define LABELALIGN ".p2align 5\n" | 
 | #else | 
 | #define LABELALIGN | 
 | #endif | 
 | #if defined(__native_client__) && defined(__x86_64__) | 
 | // r14 is used for MEMOP macros. | 
 | #define NACL_R14 "r14", | 
 | #define BUNDLELOCK ".bundle_lock\n" | 
 | #define BUNDLEUNLOCK ".bundle_unlock\n" | 
 | #define MEMACCESS(base) "%%nacl:(%%r15,%q" #base ")" | 
 | #define MEMACCESS2(offset, base) "%%nacl:" #offset "(%%r15,%q" #base ")" | 
 | #define MEMLEA(offset, base) #offset "(%q" #base ")" | 
 | #define MEMLEA3(offset, index, scale) \ | 
 |     #offset "(,%q" #index "," #scale ")" | 
 | #define MEMLEA4(offset, base, index, scale) \ | 
 |     #offset "(%q" #base ",%q" #index "," #scale ")" | 
 | #define MEMMOVESTRING(s, d) "%%nacl:(%q" #s "),%%nacl:(%q" #d "), %%r15" | 
 | #define MEMSTORESTRING(reg, d) "%%" #reg ",%%nacl:(%q" #d "), %%r15" | 
 | #define MEMOPREG(opcode, offset, base, index, scale, reg) \ | 
 |     BUNDLELOCK \ | 
 |     "lea " #offset "(%q" #base ",%q" #index "," #scale "),%%r14d\n" \ | 
 |     #opcode " (%%r15,%%r14),%%" #reg "\n" \ | 
 |     BUNDLEUNLOCK | 
 | #define MEMOPMEM(opcode, reg, offset, base, index, scale) \ | 
 |     BUNDLELOCK \ | 
 |     "lea " #offset "(%q" #base ",%q" #index "," #scale "),%%r14d\n" \ | 
 |     #opcode " %%" #reg ",(%%r15,%%r14)\n" \ | 
 |     BUNDLEUNLOCK | 
 | #define MEMOPARG(opcode, offset, base, index, scale, arg) \ | 
 |     BUNDLELOCK \ | 
 |     "lea " #offset "(%q" #base ",%q" #index "," #scale "),%%r14d\n" \ | 
 |     #opcode " (%%r15,%%r14),%" #arg "\n" \ | 
 |     BUNDLEUNLOCK | 
 | #define VMEMOPREG(opcode, offset, base, index, scale, reg1, reg2) \ | 
 |     BUNDLELOCK \ | 
 |     "lea " #offset "(%q" #base ",%q" #index "," #scale "),%%r14d\n" \ | 
 |     #opcode " (%%r15,%%r14),%%" #reg1 ",%%" #reg2 "\n" \ | 
 |     BUNDLEUNLOCK | 
 | #define VEXTOPMEM(op, sel, reg, offset, base, index, scale) \ | 
 |     BUNDLELOCK \ | 
 |     "lea " #offset "(%q" #base ",%q" #index "," #scale "),%%r14d\n" \ | 
 |     #op " $" #sel ",%%" #reg ",(%%r15,%%r14)\n" \ | 
 |     BUNDLEUNLOCK | 
 | #else  // defined(__native_client__) && defined(__x86_64__) | 
 | #define NACL_R14 | 
 | #define BUNDLEALIGN | 
 | #define MEMACCESS(base) "(%" #base ")" | 
 | #define MEMACCESS2(offset, base) #offset "(%" #base ")" | 
 | #define MEMLEA(offset, base) #offset "(%" #base ")" | 
 | #define MEMLEA3(offset, index, scale) \ | 
 |     #offset "(,%" #index "," #scale ")" | 
 | #define MEMLEA4(offset, base, index, scale) \ | 
 |     #offset "(%" #base ",%" #index "," #scale ")" | 
 | #define MEMMOVESTRING(s, d) | 
 | #define MEMSTORESTRING(reg, d) | 
 | #define MEMOPREG(opcode, offset, base, index, scale, reg) \ | 
 |     #opcode " " #offset "(%" #base ",%" #index "," #scale "),%%" #reg "\n" | 
 | #define MEMOPMEM(opcode, reg, offset, base, index, scale) \ | 
 |     #opcode " %%" #reg ","#offset "(%" #base ",%" #index "," #scale ")\n" | 
 | #define MEMOPARG(opcode, offset, base, index, scale, arg) \ | 
 |     #opcode " " #offset "(%" #base ",%" #index "," #scale "),%" #arg "\n" | 
 | #define VMEMOPREG(opcode, offset, base, index, scale, reg1, reg2) \ | 
 |     #opcode " " #offset "(%" #base ",%" #index "," #scale "),%%" #reg1 ",%%" \ | 
 |     #reg2 "\n" | 
 | #define VEXTOPMEM(op, sel, reg, offset, base, index, scale) \ | 
 |     #op " $" #sel ",%%" #reg ","#offset "(%" #base ",%" #index "," #scale ")\n" | 
 | #endif  // defined(__native_client__) && defined(__x86_64__) | 
 |  | 
 | #if defined(__arm__) || defined(__aarch64__) | 
 | #undef MEMACCESS | 
 | #if defined(__native_client__) | 
 | #define MEMACCESS(base) ".p2align 3\nbic %" #base ", #0xc0000000\n" | 
 | #else | 
 | #define MEMACCESS(base) | 
 | #endif | 
 | #endif | 
 |  | 
 | void I444ToARGBRow_NEON(const uint8* src_y, | 
 |                         const uint8* src_u, | 
 |                         const uint8* src_v, | 
 |                         uint8* dst_argb, | 
 |                         int width); | 
 | void I422ToARGBRow_NEON(const uint8* src_y, | 
 |                         const uint8* src_u, | 
 |                         const uint8* src_v, | 
 |                         uint8* dst_argb, | 
 |                         int width); | 
 | void I411ToARGBRow_NEON(const uint8* src_y, | 
 |                         const uint8* src_u, | 
 |                         const uint8* src_v, | 
 |                         uint8* dst_argb, | 
 |                         int width); | 
 | void I422ToBGRARow_NEON(const uint8* src_y, | 
 |                         const uint8* src_u, | 
 |                         const uint8* src_v, | 
 |                         uint8* dst_bgra, | 
 |                         int width); | 
 | void I422ToABGRRow_NEON(const uint8* src_y, | 
 |                         const uint8* src_u, | 
 |                         const uint8* src_v, | 
 |                         uint8* dst_abgr, | 
 |                         int width); | 
 | void I422ToRGBARow_NEON(const uint8* src_y, | 
 |                         const uint8* src_u, | 
 |                         const uint8* src_v, | 
 |                         uint8* dst_rgba, | 
 |                         int width); | 
 | void I422ToRGB24Row_NEON(const uint8* src_y, | 
 |                          const uint8* src_u, | 
 |                          const uint8* src_v, | 
 |                          uint8* dst_rgb24, | 
 |                          int width); | 
 | void I422ToRAWRow_NEON(const uint8* src_y, | 
 |                        const uint8* src_u, | 
 |                        const uint8* src_v, | 
 |                        uint8* dst_raw, | 
 |                        int width); | 
 | void I422ToRGB565Row_NEON(const uint8* src_y, | 
 |                           const uint8* src_u, | 
 |                           const uint8* src_v, | 
 |                           uint8* dst_rgb565, | 
 |                           int width); | 
 | void I422ToARGB1555Row_NEON(const uint8* src_y, | 
 |                             const uint8* src_u, | 
 |                             const uint8* src_v, | 
 |                             uint8* dst_argb1555, | 
 |                             int width); | 
 | void I422ToARGB4444Row_NEON(const uint8* src_y, | 
 |                             const uint8* src_u, | 
 |                             const uint8* src_v, | 
 |                             uint8* dst_argb4444, | 
 |                             int width); | 
 | void NV12ToARGBRow_NEON(const uint8* src_y, | 
 |                         const uint8* src_uv, | 
 |                         uint8* dst_argb, | 
 |                         int width); | 
 | void NV21ToARGBRow_NEON(const uint8* src_y, | 
 |                         const uint8* src_vu, | 
 |                         uint8* dst_argb, | 
 |                         int width); | 
 | void NV12ToRGB565Row_NEON(const uint8* src_y, | 
 |                           const uint8* src_uv, | 
 |                           uint8* dst_rgb565, | 
 |                           int width); | 
 | void NV21ToRGB565Row_NEON(const uint8* src_y, | 
 |                           const uint8* src_vu, | 
 |                           uint8* dst_rgb565, | 
 |                           int width); | 
 | void YUY2ToARGBRow_NEON(const uint8* src_yuy2, | 
 |                         uint8* dst_argb, | 
 |                         int width); | 
 | void UYVYToARGBRow_NEON(const uint8* src_uyvy, | 
 |                         uint8* dst_argb, | 
 |                         int width); | 
 |  | 
 | void ARGBToYRow_AVX2(const uint8* src_argb, uint8* dst_y, int pix); | 
 | void ARGBToYRow_Any_AVX2(const uint8* src_argb, uint8* dst_y, int pix); | 
 | void ARGBToYRow_SSSE3(const uint8* src_argb, uint8* dst_y, int pix); | 
 | void ARGBToYJRow_AVX2(const uint8* src_argb, uint8* dst_y, int pix); | 
 | void ARGBToYJRow_Any_AVX2(const uint8* src_argb, uint8* dst_y, int pix); | 
 | void ARGBToYJRow_SSSE3(const uint8* src_argb, uint8* dst_y, int pix); | 
 | void BGRAToYRow_SSSE3(const uint8* src_bgra, uint8* dst_y, int pix); | 
 | void ABGRToYRow_SSSE3(const uint8* src_abgr, uint8* dst_y, int pix); | 
 | void RGBAToYRow_SSSE3(const uint8* src_rgba, uint8* dst_y, int pix); | 
 | void RGB24ToYRow_SSSE3(const uint8* src_rgb24, uint8* dst_y, int pix); | 
 | void RAWToYRow_SSSE3(const uint8* src_raw, uint8* dst_y, int pix); | 
 | void ARGBToYRow_NEON(const uint8* src_argb, uint8* dst_y, int pix); | 
 | void ARGBToYJRow_NEON(const uint8* src_argb, uint8* dst_y, int pix); | 
 | void ARGBToUV444Row_NEON(const uint8* src_argb, uint8* dst_u, uint8* dst_v, | 
 |                          int pix); | 
 | void ARGBToUV422Row_NEON(const uint8* src_argb, uint8* dst_u, uint8* dst_v, | 
 |                          int pix); | 
 | void ARGBToUV411Row_NEON(const uint8* src_argb, uint8* dst_u, uint8* dst_v, | 
 |                          int pix); | 
 | void ARGBToUVRow_NEON(const uint8* src_argb, int src_stride_argb, | 
 |                       uint8* dst_u, uint8* dst_v, int pix); | 
 | void ARGBToUVJRow_NEON(const uint8* src_argb, int src_stride_argb, | 
 |                        uint8* dst_u, uint8* dst_v, int pix); | 
 | void BGRAToUVRow_NEON(const uint8* src_bgra, int src_stride_bgra, | 
 |                       uint8* dst_u, uint8* dst_v, int pix); | 
 | void ABGRToUVRow_NEON(const uint8* src_abgr, int src_stride_abgr, | 
 |                       uint8* dst_u, uint8* dst_v, int pix); | 
 | void RGBAToUVRow_NEON(const uint8* src_rgba, int src_stride_rgba, | 
 |                       uint8* dst_u, uint8* dst_v, int pix); | 
 | void RGB24ToUVRow_NEON(const uint8* src_rgb24, int src_stride_rgb24, | 
 |                        uint8* dst_u, uint8* dst_v, int pix); | 
 | void RAWToUVRow_NEON(const uint8* src_raw, int src_stride_raw, | 
 |                      uint8* dst_u, uint8* dst_v, int pix); | 
 | void RGB565ToUVRow_NEON(const uint8* src_rgb565, int src_stride_rgb565, | 
 |                         uint8* dst_u, uint8* dst_v, int pix); | 
 | void ARGB1555ToUVRow_NEON(const uint8* src_argb1555, int src_stride_argb1555, | 
 |                           uint8* dst_u, uint8* dst_v, int pix); | 
 | void ARGB4444ToUVRow_NEON(const uint8* src_argb4444, int src_stride_argb4444, | 
 |                           uint8* dst_u, uint8* dst_v, int pix); | 
 | void BGRAToYRow_NEON(const uint8* src_bgra, uint8* dst_y, int pix); | 
 | void ABGRToYRow_NEON(const uint8* src_abgr, uint8* dst_y, int pix); | 
 | void RGBAToYRow_NEON(const uint8* src_rgba, uint8* dst_y, int pix); | 
 | void RGB24ToYRow_NEON(const uint8* src_rgb24, uint8* dst_y, int pix); | 
 | void RAWToYRow_NEON(const uint8* src_raw, uint8* dst_y, int pix); | 
 | void RGB565ToYRow_NEON(const uint8* src_rgb565, uint8* dst_y, int pix); | 
 | void ARGB1555ToYRow_NEON(const uint8* src_argb1555, uint8* dst_y, int pix); | 
 | void ARGB4444ToYRow_NEON(const uint8* src_argb4444, uint8* dst_y, int pix); | 
 | void ARGBToYRow_C(const uint8* src_argb, uint8* dst_y, int pix); | 
 | void ARGBToYJRow_C(const uint8* src_argb, uint8* dst_y, int pix); | 
 | void BGRAToYRow_C(const uint8* src_bgra, uint8* dst_y, int pix); | 
 | void ABGRToYRow_C(const uint8* src_abgr, uint8* dst_y, int pix); | 
 | void RGBAToYRow_C(const uint8* src_rgba, uint8* dst_y, int pix); | 
 | void RGB24ToYRow_C(const uint8* src_rgb24, uint8* dst_y, int pix); | 
 | void RAWToYRow_C(const uint8* src_raw, uint8* dst_y, int pix); | 
 | void RGB565ToYRow_C(const uint8* src_rgb565, uint8* dst_y, int pix); | 
 | void ARGB1555ToYRow_C(const uint8* src_argb1555, uint8* dst_y, int pix); | 
 | void ARGB4444ToYRow_C(const uint8* src_argb4444, uint8* dst_y, int pix); | 
 | void ARGBToYRow_Any_SSSE3(const uint8* src_argb, uint8* dst_y, int pix); | 
 | void ARGBToYJRow_Any_SSSE3(const uint8* src_argb, uint8* dst_y, int pix); | 
 | void BGRAToYRow_Any_SSSE3(const uint8* src_bgra, uint8* dst_y, int pix); | 
 | void ABGRToYRow_Any_SSSE3(const uint8* src_abgr, uint8* dst_y, int pix); | 
 | void RGBAToYRow_Any_SSSE3(const uint8* src_rgba, uint8* dst_y, int pix); | 
 | void RGB24ToYRow_Any_SSSE3(const uint8* src_rgb24, uint8* dst_y, int pix); | 
 | void RAWToYRow_Any_SSSE3(const uint8* src_raw, uint8* dst_y, int pix); | 
 | void ARGBToYRow_Any_NEON(const uint8* src_argb, uint8* dst_y, int pix); | 
 | void ARGBToYJRow_Any_NEON(const uint8* src_argb, uint8* dst_y, int pix); | 
 | void BGRAToYRow_Any_NEON(const uint8* src_bgra, uint8* dst_y, int pix); | 
 | void ABGRToYRow_Any_NEON(const uint8* src_abgr, uint8* dst_y, int pix); | 
 | void RGBAToYRow_Any_NEON(const uint8* src_rgba, uint8* dst_y, int pix); | 
 | void RGB24ToYRow_Any_NEON(const uint8* src_rgb24, uint8* dst_y, int pix); | 
 | void RAWToYRow_Any_NEON(const uint8* src_raw, uint8* dst_y, int pix); | 
 | void RGB565ToYRow_Any_NEON(const uint8* src_rgb565, uint8* dst_y, int pix); | 
 | void ARGB1555ToYRow_Any_NEON(const uint8* src_argb1555, uint8* dst_y, int pix); | 
 | void ARGB4444ToYRow_Any_NEON(const uint8* src_argb4444, uint8* dst_y, int pix); | 
 |  | 
 | void ARGBToUVRow_AVX2(const uint8* src_argb, int src_stride_argb, | 
 |                       uint8* dst_u, uint8* dst_v, int width); | 
 | void ARGBToUVRow_Any_AVX2(const uint8* src_argb, int src_stride_argb, | 
 |                           uint8* dst_u, uint8* dst_v, int width); | 
 | void ARGBToUVRow_SSSE3(const uint8* src_argb, int src_stride_argb, | 
 |                        uint8* dst_u, uint8* dst_v, int width); | 
 | void ARGBToUVJRow_SSSE3(const uint8* src_argb, int src_stride_argb, | 
 |                         uint8* dst_u, uint8* dst_v, int width); | 
 | void BGRAToUVRow_SSSE3(const uint8* src_bgra, int src_stride_bgra, | 
 |                        uint8* dst_u, uint8* dst_v, int width); | 
 | void ABGRToUVRow_SSSE3(const uint8* src_abgr, int src_stride_abgr, | 
 |                        uint8* dst_u, uint8* dst_v, int width); | 
 | void RGBAToUVRow_SSSE3(const uint8* src_rgba, int src_stride_rgba, | 
 |                        uint8* dst_u, uint8* dst_v, int width); | 
 | void ARGBToUVRow_Any_SSSE3(const uint8* src_argb, int src_stride_argb, | 
 |                            uint8* dst_u, uint8* dst_v, int width); | 
 | void ARGBToUVJRow_Any_SSSE3(const uint8* src_argb, int src_stride_argb, | 
 |                             uint8* dst_u, uint8* dst_v, int width); | 
 | void BGRAToUVRow_Any_SSSE3(const uint8* src_bgra, int src_stride_bgra, | 
 |                            uint8* dst_u, uint8* dst_v, int width); | 
 | void ABGRToUVRow_Any_SSSE3(const uint8* src_abgr, int src_stride_abgr, | 
 |                            uint8* dst_u, uint8* dst_v, int width); | 
 | void RGBAToUVRow_Any_SSSE3(const uint8* src_rgba, int src_stride_rgba, | 
 |                            uint8* dst_u, uint8* dst_v, int width); | 
 | void ARGBToUV444Row_Any_NEON(const uint8* src_argb, uint8* dst_u, uint8* dst_v, | 
 |                              int pix); | 
 | void ARGBToUV422Row_Any_NEON(const uint8* src_argb, uint8* dst_u, uint8* dst_v, | 
 |                              int pix); | 
 | void ARGBToUV411Row_Any_NEON(const uint8* src_argb, uint8* dst_u, uint8* dst_v, | 
 |                              int pix); | 
 | void ARGBToUVRow_Any_NEON(const uint8* src_argb, int src_stride_argb, | 
 |                           uint8* dst_u, uint8* dst_v, int pix); | 
 | void ARGBToUVJRow_Any_NEON(const uint8* src_argb, int src_stride_argb, | 
 |                            uint8* dst_u, uint8* dst_v, int pix); | 
 | void BGRAToUVRow_Any_NEON(const uint8* src_bgra, int src_stride_bgra, | 
 |                           uint8* dst_u, uint8* dst_v, int pix); | 
 | void ABGRToUVRow_Any_NEON(const uint8* src_abgr, int src_stride_abgr, | 
 |                           uint8* dst_u, uint8* dst_v, int pix); | 
 | void RGBAToUVRow_Any_NEON(const uint8* src_rgba, int src_stride_rgba, | 
 |                           uint8* dst_u, uint8* dst_v, int pix); | 
 | void RGB24ToUVRow_Any_NEON(const uint8* src_rgb24, int src_stride_rgb24, | 
 |                            uint8* dst_u, uint8* dst_v, int pix); | 
 | void RAWToUVRow_Any_NEON(const uint8* src_raw, int src_stride_raw, | 
 |                          uint8* dst_u, uint8* dst_v, int pix); | 
 | void RGB565ToUVRow_Any_NEON(const uint8* src_rgb565, int src_stride_rgb565, | 
 |                             uint8* dst_u, uint8* dst_v, int pix); | 
 | void ARGB1555ToUVRow_Any_NEON(const uint8* src_argb1555, | 
 |                               int src_stride_argb1555, | 
 |                               uint8* dst_u, uint8* dst_v, int pix); | 
 | void ARGB4444ToUVRow_Any_NEON(const uint8* src_argb4444, | 
 |                               int src_stride_argb4444, | 
 |                               uint8* dst_u, uint8* dst_v, int pix); | 
 | void ARGBToUVRow_C(const uint8* src_argb, int src_stride_argb, | 
 |                    uint8* dst_u, uint8* dst_v, int width); | 
 | void ARGBToUVJRow_C(const uint8* src_argb, int src_stride_argb, | 
 |                     uint8* dst_u, uint8* dst_v, int width); | 
 | void BGRAToUVRow_C(const uint8* src_bgra, int src_stride_bgra, | 
 |                    uint8* dst_u, uint8* dst_v, int width); | 
 | void ABGRToUVRow_C(const uint8* src_abgr, int src_stride_abgr, | 
 |                    uint8* dst_u, uint8* dst_v, int width); | 
 | void RGBAToUVRow_C(const uint8* src_rgba, int src_stride_rgba, | 
 |                    uint8* dst_u, uint8* dst_v, int width); | 
 | void RGB24ToUVRow_C(const uint8* src_rgb24, int src_stride_rgb24, | 
 |                     uint8* dst_u, uint8* dst_v, int width); | 
 | void RAWToUVRow_C(const uint8* src_raw, int src_stride_raw, | 
 |                   uint8* dst_u, uint8* dst_v, int width); | 
 | void RGB565ToUVRow_C(const uint8* src_rgb565, int src_stride_rgb565, | 
 |                      uint8* dst_u, uint8* dst_v, int width); | 
 | void ARGB1555ToUVRow_C(const uint8* src_argb1555, int src_stride_argb1555, | 
 |                        uint8* dst_u, uint8* dst_v, int width); | 
 | void ARGB4444ToUVRow_C(const uint8* src_argb4444, int src_stride_argb4444, | 
 |                        uint8* dst_u, uint8* dst_v, int width); | 
 |  | 
 | void ARGBToUV444Row_SSSE3(const uint8* src_argb, | 
 |                           uint8* dst_u, uint8* dst_v, int width); | 
 | void ARGBToUV444Row_Any_SSSE3(const uint8* src_argb, | 
 |                               uint8* dst_u, uint8* dst_v, int width); | 
 |  | 
 | void ARGBToUV422Row_SSSE3(const uint8* src_argb, | 
 |                           uint8* dst_u, uint8* dst_v, int width); | 
 | void ARGBToUV422Row_Any_SSSE3(const uint8* src_argb, | 
 |                               uint8* dst_u, uint8* dst_v, int width); | 
 |  | 
 | void ARGBToUV444Row_C(const uint8* src_argb, | 
 |                       uint8* dst_u, uint8* dst_v, int width); | 
 | void ARGBToUV422Row_C(const uint8* src_argb, | 
 |                       uint8* dst_u, uint8* dst_v, int width); | 
 | void ARGBToUV411Row_C(const uint8* src_argb, | 
 |                       uint8* dst_u, uint8* dst_v, int width); | 
 | void ARGBToUVJ422Row_C(const uint8* src_argb, | 
 |                        uint8* dst_u, uint8* dst_v, int width); | 
 |  | 
 | void MirrorRow_AVX2(const uint8* src, uint8* dst, int width); | 
 | void MirrorRow_SSSE3(const uint8* src, uint8* dst, int width); | 
 | void MirrorRow_SSE2(const uint8* src, uint8* dst, int width); | 
 | void MirrorRow_NEON(const uint8* src, uint8* dst, int width); | 
 | void MirrorRow_MIPS_DSPR2(const uint8* src, uint8* dst, int width); | 
 | void MirrorRow_C(const uint8* src, uint8* dst, int width); | 
 | void MirrorRow_Any_AVX2(const uint8* src, uint8* dst, int width); | 
 | void MirrorRow_Any_SSSE3(const uint8* src, uint8* dst, int width); | 
 | void MirrorRow_Any_SSE2(const uint8* src, uint8* dst, int width); | 
 | void MirrorRow_Any_NEON(const uint8* src, uint8* dst, int width); | 
 |  | 
 | void MirrorUVRow_SSSE3(const uint8* src_uv, uint8* dst_u, uint8* dst_v, | 
 |                        int width); | 
 | void MirrorUVRow_NEON(const uint8* src_uv, uint8* dst_u, uint8* dst_v, | 
 |                       int width); | 
 | void MirrorUVRow_MIPS_DSPR2(const uint8* src_uv, uint8* dst_u, uint8* dst_v, | 
 |                             int width); | 
 | void MirrorUVRow_C(const uint8* src_uv, uint8* dst_u, uint8* dst_v, | 
 |                    int width); | 
 |  | 
 | void ARGBMirrorRow_AVX2(const uint8* src, uint8* dst, int width); | 
 | void ARGBMirrorRow_SSE2(const uint8* src, uint8* dst, int width); | 
 | void ARGBMirrorRow_NEON(const uint8* src, uint8* dst, int width); | 
 | void ARGBMirrorRow_C(const uint8* src, uint8* dst, int width); | 
 | void ARGBMirrorRow_Any_AVX2(const uint8* src, uint8* dst, int width); | 
 | void ARGBMirrorRow_Any_SSE2(const uint8* src, uint8* dst, int width); | 
 | void ARGBMirrorRow_Any_NEON(const uint8* src, uint8* dst, int width); | 
 |  | 
 | void SplitUVRow_C(const uint8* src_uv, uint8* dst_u, uint8* dst_v, int pix); | 
 | void SplitUVRow_SSE2(const uint8* src_uv, uint8* dst_u, uint8* dst_v, int pix); | 
 | void SplitUVRow_AVX2(const uint8* src_uv, uint8* dst_u, uint8* dst_v, int pix); | 
 | void SplitUVRow_NEON(const uint8* src_uv, uint8* dst_u, uint8* dst_v, int pix); | 
 | void SplitUVRow_MIPS_DSPR2(const uint8* src_uv, uint8* dst_u, uint8* dst_v, | 
 |                            int pix); | 
 | void SplitUVRow_Any_SSE2(const uint8* src_uv, uint8* dst_u, uint8* dst_v, | 
 |                          int pix); | 
 | void SplitUVRow_Any_AVX2(const uint8* src_uv, uint8* dst_u, uint8* dst_v, | 
 |                          int pix); | 
 | void SplitUVRow_Any_NEON(const uint8* src_uv, uint8* dst_u, uint8* dst_v, | 
 |                          int pix); | 
 | void SplitUVRow_Any_MIPS_DSPR2(const uint8* src_uv, uint8* dst_u, uint8* dst_v, | 
 |                                int pix); | 
 |  | 
 | void MergeUVRow_C(const uint8* src_u, const uint8* src_v, uint8* dst_uv, | 
 |                   int width); | 
 | void MergeUVRow_SSE2(const uint8* src_u, const uint8* src_v, uint8* dst_uv, | 
 |                      int width); | 
 | void MergeUVRow_AVX2(const uint8* src_u, const uint8* src_v, uint8* dst_uv, | 
 |                      int width); | 
 | void MergeUVRow_NEON(const uint8* src_u, const uint8* src_v, uint8* dst_uv, | 
 |                      int width); | 
 | void MergeUVRow_Any_SSE2(const uint8* src_u, const uint8* src_v, uint8* dst_uv, | 
 |                          int width); | 
 | void MergeUVRow_Any_AVX2(const uint8* src_u, const uint8* src_v, uint8* dst_uv, | 
 |                          int width); | 
 | void MergeUVRow_Any_NEON(const uint8* src_u, const uint8* src_v, uint8* dst_uv, | 
 |                          int width); | 
 |  | 
 | void CopyRow_SSE2(const uint8* src, uint8* dst, int count); | 
 | void CopyRow_AVX(const uint8* src, uint8* dst, int count); | 
 | void CopyRow_ERMS(const uint8* src, uint8* dst, int count); | 
 | void CopyRow_NEON(const uint8* src, uint8* dst, int count); | 
 | void CopyRow_MIPS(const uint8* src, uint8* dst, int count); | 
 | void CopyRow_C(const uint8* src, uint8* dst, int count); | 
 | void CopyRow_Any_SSE2(const uint8* src, uint8* dst, int count); | 
 | void CopyRow_Any_AVX(const uint8* src, uint8* dst, int count); | 
 | void CopyRow_Any_NEON(const uint8* src, uint8* dst, int count); | 
 |  | 
 | void CopyRow_16_C(const uint16* src, uint16* dst, int count); | 
 |  | 
 | void ARGBCopyAlphaRow_C(const uint8* src_argb, uint8* dst_argb, int width); | 
 | void ARGBCopyAlphaRow_SSE2(const uint8* src_argb, uint8* dst_argb, int width); | 
 | void ARGBCopyAlphaRow_AVX2(const uint8* src_argb, uint8* dst_argb, int width); | 
 |  | 
 | void ARGBCopyYToAlphaRow_C(const uint8* src_y, uint8* dst_argb, int width); | 
 | void ARGBCopyYToAlphaRow_SSE2(const uint8* src_y, uint8* dst_argb, int width); | 
 | void ARGBCopyYToAlphaRow_AVX2(const uint8* src_y, uint8* dst_argb, int width); | 
 |  | 
 | void SetRow_C(uint8* dst, uint8 v8, int count); | 
 | void SetRow_X86(uint8* dst, uint8 v8, int count); | 
 | void SetRow_ERMS(uint8* dst, uint8 v8, int count); | 
 | void SetRow_NEON(uint8* dst, uint8 v8, int count); | 
 | void SetRow_Any_X86(uint8* dst, uint8 v8, int count); | 
 | void SetRow_Any_NEON(uint8* dst, uint8 v8, int count); | 
 |  | 
 | void ARGBSetRow_C(uint8* dst_argb, uint32 v32, int count); | 
 | void ARGBSetRow_X86(uint8* dst_argb, uint32 v32, int count); | 
 | void ARGBSetRow_NEON(uint8* dst_argb, uint32 v32, int count); | 
 | void ARGBSetRow_Any_NEON(uint8* dst_argb, uint32 v32, int count); | 
 |  | 
 | // ARGBShufflers for BGRAToARGB etc. | 
 | void ARGBShuffleRow_C(const uint8* src_argb, uint8* dst_argb, | 
 |                       const uint8* shuffler, int pix); | 
 | void ARGBShuffleRow_SSE2(const uint8* src_argb, uint8* dst_argb, | 
 |                          const uint8* shuffler, int pix); | 
 | void ARGBShuffleRow_SSSE3(const uint8* src_argb, uint8* dst_argb, | 
 |                           const uint8* shuffler, int pix); | 
 | void ARGBShuffleRow_AVX2(const uint8* src_argb, uint8* dst_argb, | 
 |                          const uint8* shuffler, int pix); | 
 | void ARGBShuffleRow_NEON(const uint8* src_argb, uint8* dst_argb, | 
 |                          const uint8* shuffler, int pix); | 
 | void ARGBShuffleRow_Any_SSE2(const uint8* src_argb, uint8* dst_argb, | 
 |                              const uint8* shuffler, int pix); | 
 | void ARGBShuffleRow_Any_SSSE3(const uint8* src_argb, uint8* dst_argb, | 
 |                               const uint8* shuffler, int pix); | 
 | void ARGBShuffleRow_Any_AVX2(const uint8* src_argb, uint8* dst_argb, | 
 |                              const uint8* shuffler, int pix); | 
 | void ARGBShuffleRow_Any_NEON(const uint8* src_argb, uint8* dst_argb, | 
 |                              const uint8* shuffler, int pix); | 
 |  | 
 | void RGB24ToARGBRow_SSSE3(const uint8* src_rgb24, uint8* dst_argb, int pix); | 
 | void RAWToARGBRow_SSSE3(const uint8* src_raw, uint8* dst_argb, int pix); | 
 | void RGB565ToARGBRow_SSE2(const uint8* src_rgb565, uint8* dst_argb, int pix); | 
 | void ARGB1555ToARGBRow_SSE2(const uint8* src_argb1555, uint8* dst_argb, | 
 |                             int pix); | 
 | void ARGB4444ToARGBRow_SSE2(const uint8* src_argb4444, uint8* dst_argb, | 
 |                             int pix); | 
 | void RGB565ToARGBRow_AVX2(const uint8* src_rgb565, uint8* dst_argb, int pix); | 
 | void ARGB1555ToARGBRow_AVX2(const uint8* src_argb1555, uint8* dst_argb, | 
 |                             int pix); | 
 | void ARGB4444ToARGBRow_AVX2(const uint8* src_argb4444, uint8* dst_argb, | 
 |                             int pix); | 
 |  | 
 | void RGB24ToARGBRow_NEON(const uint8* src_rgb24, uint8* dst_argb, int pix); | 
 | void RAWToARGBRow_NEON(const uint8* src_raw, uint8* dst_argb, int pix); | 
 | void RGB565ToARGBRow_NEON(const uint8* src_rgb565, uint8* dst_argb, int pix); | 
 | void ARGB1555ToARGBRow_NEON(const uint8* src_argb1555, uint8* dst_argb, | 
 |                             int pix); | 
 | void ARGB4444ToARGBRow_NEON(const uint8* src_argb4444, uint8* dst_argb, | 
 |                             int pix); | 
 | void RGB24ToARGBRow_C(const uint8* src_rgb24, uint8* dst_argb, int pix); | 
 | void RAWToARGBRow_C(const uint8* src_raw, uint8* dst_argb, int pix); | 
 | void RGB565ToARGBRow_C(const uint8* src_rgb, uint8* dst_argb, int pix); | 
 | void ARGB1555ToARGBRow_C(const uint8* src_argb, uint8* dst_argb, int pix); | 
 | void ARGB4444ToARGBRow_C(const uint8* src_argb, uint8* dst_argb, int pix); | 
 | void RGB24ToARGBRow_Any_SSSE3(const uint8* src_rgb24, uint8* dst_argb, int pix); | 
 | void RAWToARGBRow_Any_SSSE3(const uint8* src_raw, uint8* dst_argb, int pix); | 
 |  | 
 | void RGB565ToARGBRow_Any_SSE2(const uint8* src_rgb565, uint8* dst_argb, | 
 |                               int pix); | 
 | void ARGB1555ToARGBRow_Any_SSE2(const uint8* src_argb1555, uint8* dst_argb, | 
 |                                 int pix); | 
 | void ARGB4444ToARGBRow_Any_SSE2(const uint8* src_argb4444, uint8* dst_argb, | 
 |                                 int pix); | 
 | void RGB565ToARGBRow_Any_AVX2(const uint8* src_rgb565, uint8* dst_argb, | 
 |                               int pix); | 
 | void ARGB1555ToARGBRow_Any_AVX2(const uint8* src_argb1555, uint8* dst_argb, | 
 |                                 int pix); | 
 | void ARGB4444ToARGBRow_Any_AVX2(const uint8* src_argb4444, uint8* dst_argb, | 
 |                                 int pix); | 
 |  | 
 | void RGB24ToARGBRow_Any_NEON(const uint8* src_rgb24, uint8* dst_argb, int pix); | 
 | void RAWToARGBRow_Any_NEON(const uint8* src_raw, uint8* dst_argb, int pix); | 
 | void RGB565ToARGBRow_Any_NEON(const uint8* src_rgb565, uint8* dst_argb, | 
 |                               int pix); | 
 | void ARGB1555ToARGBRow_Any_NEON(const uint8* src_argb1555, uint8* dst_argb, | 
 |                                 int pix); | 
 | void ARGB4444ToARGBRow_Any_NEON(const uint8* src_argb4444, uint8* dst_argb, | 
 |                                 int pix); | 
 |  | 
 | void ARGBToRGB24Row_SSSE3(const uint8* src_argb, uint8* dst_rgb, int pix); | 
 | void ARGBToRAWRow_SSSE3(const uint8* src_argb, uint8* dst_rgb, int pix); | 
 | void ARGBToRGB565Row_SSE2(const uint8* src_argb, uint8* dst_rgb, int pix); | 
 | void ARGBToARGB1555Row_SSE2(const uint8* src_argb, uint8* dst_rgb, int pix); | 
 | void ARGBToARGB4444Row_SSE2(const uint8* src_argb, uint8* dst_rgb, int pix); | 
 |  | 
 | void ARGBToRGB565DitherRow_C(const uint8* src_argb, uint8* dst_rgb, | 
 |                              const uint32 dither4, int pix); | 
 | void ARGBToRGB565DitherRow_SSE2(const uint8* src_argb, uint8* dst_rgb, | 
 |                                 const uint32 dither4, int pix); | 
 | void ARGBToRGB565DitherRow_AVX2(const uint8* src_argb, uint8* dst_rgb, | 
 |                                 const uint32 dither4, int pix); | 
 |  | 
 | void ARGBToRGB565Row_AVX2(const uint8* src_argb, uint8* dst_rgb, int pix); | 
 | void ARGBToARGB1555Row_AVX2(const uint8* src_argb, uint8* dst_rgb, int pix); | 
 | void ARGBToARGB4444Row_AVX2(const uint8* src_argb, uint8* dst_rgb, int pix); | 
 |  | 
 | void ARGBToRGB24Row_NEON(const uint8* src_argb, uint8* dst_rgb, int pix); | 
 | void ARGBToRAWRow_NEON(const uint8* src_argb, uint8* dst_rgb, int pix); | 
 | void ARGBToRGB565Row_NEON(const uint8* src_argb, uint8* dst_rgb, int pix); | 
 | void ARGBToARGB1555Row_NEON(const uint8* src_argb, uint8* dst_rgb, int pix); | 
 | void ARGBToARGB4444Row_NEON(const uint8* src_argb, uint8* dst_rgb, int pix); | 
 | void ARGBToRGB565DitherRow_NEON(const uint8* src_argb, uint8* dst_rgb, | 
 |                                 const uint32 dither4, int width); | 
 |  | 
 | void ARGBToRGBARow_C(const uint8* src_argb, uint8* dst_rgb, int pix); | 
 | void ARGBToRGB24Row_C(const uint8* src_argb, uint8* dst_rgb, int pix); | 
 | void ARGBToRAWRow_C(const uint8* src_argb, uint8* dst_rgb, int pix); | 
 | void ARGBToRGB565Row_C(const uint8* src_argb, uint8* dst_rgb, int pix); | 
 | void ARGBToARGB1555Row_C(const uint8* src_argb, uint8* dst_rgb, int pix); | 
 | void ARGBToARGB4444Row_C(const uint8* src_argb, uint8* dst_rgb, int pix); | 
 |  | 
 | void J400ToARGBRow_SSE2(const uint8* src_y, uint8* dst_argb, int pix); | 
 | void J400ToARGBRow_AVX2(const uint8* src_y, uint8* dst_argb, int pix); | 
 | void J400ToARGBRow_NEON(const uint8* src_y, uint8* dst_argb, int pix); | 
 | void J400ToARGBRow_C(const uint8* src_y, uint8* dst_argb, int pix); | 
 | void J400ToARGBRow_Any_SSE2(const uint8* src_y, uint8* dst_argb, int pix); | 
 | void J400ToARGBRow_Any_AVX2(const uint8* src_y, uint8* dst_argb, int pix); | 
 | void J400ToARGBRow_Any_NEON(const uint8* src_y, uint8* dst_argb, int pix); | 
 |  | 
 | void I444ToARGBRow_C(const uint8* src_y, | 
 |                      const uint8* src_u, | 
 |                      const uint8* src_v, | 
 |                      uint8* dst_argb, | 
 |                      int width); | 
 | void I422ToARGBRow_C(const uint8* src_y, | 
 |                      const uint8* src_u, | 
 |                      const uint8* src_v, | 
 |                      uint8* dst_argb, | 
 |                      int width); | 
 | void I411ToARGBRow_C(const uint8* src_y, | 
 |                      const uint8* src_u, | 
 |                      const uint8* src_v, | 
 |                      uint8* dst_argb, | 
 |                      int width); | 
 | void NV12ToARGBRow_C(const uint8* src_y, | 
 |                      const uint8* src_uv, | 
 |                      uint8* dst_argb, | 
 |                      int width); | 
 | void NV21ToRGB565Row_C(const uint8* src_y, | 
 |                        const uint8* src_vu, | 
 |                        uint8* dst_argb, | 
 |                        int width); | 
 | void NV12ToRGB565Row_C(const uint8* src_y, | 
 |                        const uint8* src_uv, | 
 |                        uint8* dst_argb, | 
 |                        int width); | 
 | void NV21ToARGBRow_C(const uint8* src_y, | 
 |                      const uint8* src_vu, | 
 |                      uint8* dst_argb, | 
 |                      int width); | 
 | void YUY2ToARGBRow_C(const uint8* src_yuy2, | 
 |                      uint8* dst_argb, | 
 |                      int width); | 
 | void UYVYToARGBRow_C(const uint8* src_uyvy, | 
 |                      uint8* dst_argb, | 
 |                      int width); | 
 | void J422ToARGBRow_C(const uint8* src_y, | 
 |                      const uint8* src_u, | 
 |                      const uint8* src_v, | 
 |                      uint8* dst_argb, | 
 |                      int width); | 
 | void I422ToBGRARow_C(const uint8* src_y, | 
 |                      const uint8* src_u, | 
 |                      const uint8* src_v, | 
 |                      uint8* dst_bgra, | 
 |                      int width); | 
 | void I422ToABGRRow_C(const uint8* src_y, | 
 |                      const uint8* src_u, | 
 |                      const uint8* src_v, | 
 |                      uint8* dst_abgr, | 
 |                      int width); | 
 | void I422ToRGBARow_C(const uint8* src_y, | 
 |                      const uint8* src_u, | 
 |                      const uint8* src_v, | 
 |                      uint8* dst_rgba, | 
 |                      int width); | 
 | void I422ToRGB24Row_C(const uint8* src_y, | 
 |                       const uint8* src_u, | 
 |                       const uint8* src_v, | 
 |                       uint8* dst_rgb24, | 
 |                       int width); | 
 | void I422ToRAWRow_C(const uint8* src_y, | 
 |                     const uint8* src_u, | 
 |                     const uint8* src_v, | 
 |                     uint8* dst_raw, | 
 |                     int width); | 
 | void I422ToARGB4444Row_C(const uint8* src_y, | 
 |                          const uint8* src_u, | 
 |                          const uint8* src_v, | 
 |                          uint8* dst_argb4444, | 
 |                          int width); | 
 | void I422ToARGB1555Row_C(const uint8* src_y, | 
 |                          const uint8* src_u, | 
 |                          const uint8* src_v, | 
 |                          uint8* dst_argb4444, | 
 |                          int width); | 
 | void I422ToRGB565Row_C(const uint8* src_y, | 
 |                        const uint8* src_u, | 
 |                        const uint8* src_v, | 
 |                        uint8* dst_rgb565, | 
 |                        int width); | 
 | void I422ToARGBRow_AVX2(const uint8* src_y, | 
 |                         const uint8* src_u, | 
 |                         const uint8* src_v, | 
 |                         uint8* dst_argb, | 
 |                         int width); | 
 | void I422ToBGRARow_AVX2(const uint8* src_y, | 
 |                         const uint8* src_u, | 
 |                         const uint8* src_v, | 
 |                         uint8* dst_argb, | 
 |                         int width); | 
 | void I422ToRGBARow_AVX2(const uint8* src_y, | 
 |                         const uint8* src_u, | 
 |                         const uint8* src_v, | 
 |                         uint8* dst_argb, | 
 |                         int width); | 
 | void I422ToABGRRow_AVX2(const uint8* src_y, | 
 |                         const uint8* src_u, | 
 |                         const uint8* src_v, | 
 |                         uint8* dst_argb, | 
 |                         int width); | 
 | void I444ToARGBRow_SSSE3(const uint8* src_y, | 
 |                          const uint8* src_u, | 
 |                          const uint8* src_v, | 
 |                          uint8* dst_argb, | 
 |                          int width); | 
 | void I444ToARGBRow_AVX2(const uint8* src_y, | 
 |                         const uint8* src_u, | 
 |                         const uint8* src_v, | 
 |                         uint8* dst_argb, | 
 |                         int width); | 
 | void I422ToARGBRow_SSSE3(const uint8* src_y, | 
 |                          const uint8* src_u, | 
 |                          const uint8* src_v, | 
 |                          uint8* dst_argb, | 
 |                          int width); | 
 | void I411ToARGBRow_SSSE3(const uint8* src_y, | 
 |                          const uint8* src_u, | 
 |                          const uint8* src_v, | 
 |                          uint8* dst_argb, | 
 |                          int width); | 
 | void I411ToARGBRow_AVX2(const uint8* src_y, | 
 |                         const uint8* src_u, | 
 |                         const uint8* src_v, | 
 |                         uint8* dst_argb, | 
 |                         int width); | 
 | void NV12ToARGBRow_SSSE3(const uint8* src_y, | 
 |                          const uint8* src_uv, | 
 |                          uint8* dst_argb, | 
 |                          int width); | 
 | void NV21ToARGBRow_SSSE3(const uint8* src_y, | 
 |                          const uint8* src_vu, | 
 |                          uint8* dst_argb, | 
 |                          int width); | 
 | void NV12ToARGBRow_AVX2(const uint8* src_y, | 
 |                         const uint8* src_uv, | 
 |                         uint8* dst_argb, | 
 |                         int width); | 
 | void NV21ToARGBRow_AVX2(const uint8* src_y, | 
 |                         const uint8* src_vu, | 
 |                         uint8* dst_argb, | 
 |                         int width); | 
 | void NV12ToRGB565Row_SSSE3(const uint8* src_y, | 
 |                            const uint8* src_uv, | 
 |                            uint8* dst_argb, | 
 |                            int width); | 
 | void NV21ToRGB565Row_SSSE3(const uint8* src_y, | 
 |                            const uint8* src_vu, | 
 |                            uint8* dst_argb, | 
 |                            int width); | 
 | void NV12ToRGB565Row_AVX2(const uint8* src_y, | 
 |                           const uint8* src_uv, | 
 |                           uint8* dst_argb, | 
 |                           int width); | 
 | void NV21ToRGB565Row_AVX2(const uint8* src_y, | 
 |                           const uint8* src_vu, | 
 |                           uint8* dst_argb, | 
 |                           int width); | 
 | void YUY2ToARGBRow_SSSE3(const uint8* src_yuy2, | 
 |                          uint8* dst_argb, | 
 |                          int width); | 
 | void UYVYToARGBRow_SSSE3(const uint8* src_uyvy, | 
 |                          uint8* dst_argb, | 
 |                          int width); | 
 | void YUY2ToARGBRow_AVX2(const uint8* src_yuy2, | 
 |                         uint8* dst_argb, | 
 |                         int width); | 
 | void UYVYToARGBRow_AVX2(const uint8* src_uyvy, | 
 |                         uint8* dst_argb, | 
 |                         int width); | 
 | void J422ToARGBRow_SSSE3(const uint8* src_y, | 
 |                          const uint8* src_u, | 
 |                          const uint8* src_v, | 
 |                          uint8* dst_argb, | 
 |                          int width); | 
 | void J422ToARGBRow_AVX2(const uint8* src_y, | 
 |                         const uint8* src_u, | 
 |                         const uint8* src_v, | 
 |                         uint8* dst_argb, | 
 |                         int width); | 
 | void I422ToBGRARow_SSSE3(const uint8* src_y, | 
 |                          const uint8* src_u, | 
 |                          const uint8* src_v, | 
 |                          uint8* dst_bgra, | 
 |                          int width); | 
 | void I422ToABGRRow_SSSE3(const uint8* src_y, | 
 |                          const uint8* src_u, | 
 |                          const uint8* src_v, | 
 |                          uint8* dst_abgr, | 
 |                          int width); | 
 | void I422ToRGBARow_SSSE3(const uint8* src_y, | 
 |                          const uint8* src_u, | 
 |                          const uint8* src_v, | 
 |                          uint8* dst_rgba, | 
 |                          int width); | 
 | void I422ToARGB4444Row_SSSE3(const uint8* src_y, | 
 |                              const uint8* src_u, | 
 |                              const uint8* src_v, | 
 |                              uint8* dst_argb, | 
 |                              int width); | 
 | void I422ToARGB4444Row_AVX2(const uint8* src_y, | 
 |                             const uint8* src_u, | 
 |                             const uint8* src_v, | 
 |                             uint8* dst_argb, | 
 |                             int width); | 
 | void I422ToARGB1555Row_SSSE3(const uint8* src_y, | 
 |                              const uint8* src_u, | 
 |                              const uint8* src_v, | 
 |                              uint8* dst_argb, | 
 |                              int width); | 
 | void I422ToARGB1555Row_AVX2(const uint8* src_y, | 
 |                             const uint8* src_u, | 
 |                             const uint8* src_v, | 
 |                             uint8* dst_argb, | 
 |                             int width); | 
 | void I422ToRGB565Row_SSSE3(const uint8* src_y, | 
 |                            const uint8* src_u, | 
 |                            const uint8* src_v, | 
 |                            uint8* dst_argb, | 
 |                            int width); | 
 | void I422ToRGB565Row_AVX2(const uint8* src_y, | 
 |                           const uint8* src_u, | 
 |                           const uint8* src_v, | 
 |                           uint8* dst_argb, | 
 |                           int width); | 
 | void I422ToRGB24Row_SSSE3(const uint8* src_y, | 
 |                           const uint8* src_u, | 
 |                           const uint8* src_v, | 
 |                           uint8* dst_rgb24, | 
 |                           int width); | 
 | void I422ToRGB24Row_AVX2(const uint8* src_y, | 
 |                          const uint8* src_u, | 
 |                          const uint8* src_v, | 
 |                          uint8* dst_rgb24, | 
 |                          int width); | 
 | void I422ToRAWRow_SSSE3(const uint8* src_y, | 
 |                         const uint8* src_u, | 
 |                         const uint8* src_v, | 
 |                         uint8* dst_raw, | 
 |                         int width); | 
 | void I422ToRAWRow_AVX2(const uint8* src_y, | 
 |                        const uint8* src_u, | 
 |                        const uint8* src_v, | 
 |                        uint8* dst_raw, | 
 |                        int width); | 
 | void I422ToARGBRow_Any_AVX2(const uint8* src_y, | 
 |                             const uint8* src_u, | 
 |                             const uint8* src_v, | 
 |                             uint8* dst_argb, | 
 |                             int width); | 
 | void I422ToBGRARow_Any_AVX2(const uint8* src_y, | 
 |                             const uint8* src_u, | 
 |                             const uint8* src_v, | 
 |                             uint8* dst_argb, | 
 |                             int width); | 
 | void I422ToRGBARow_Any_AVX2(const uint8* src_y, | 
 |                             const uint8* src_u, | 
 |                             const uint8* src_v, | 
 |                             uint8* dst_argb, | 
 |                             int width); | 
 | void I422ToABGRRow_Any_AVX2(const uint8* src_y, | 
 |                             const uint8* src_u, | 
 |                             const uint8* src_v, | 
 |                             uint8* dst_argb, | 
 |                             int width); | 
 | void I444ToARGBRow_Any_SSSE3(const uint8* src_y, | 
 |                              const uint8* src_u, | 
 |                              const uint8* src_v, | 
 |                              uint8* dst_argb, | 
 |                              int width); | 
 | void I444ToARGBRow_Any_AVX2(const uint8* src_y, | 
 |                             const uint8* src_u, | 
 |                             const uint8* src_v, | 
 |                             uint8* dst_argb, | 
 |                             int width); | 
 | void I422ToARGBRow_Any_SSSE3(const uint8* src_y, | 
 |                              const uint8* src_u, | 
 |                              const uint8* src_v, | 
 |                              uint8* dst_argb, | 
 |                              int width); | 
 | void I411ToARGBRow_Any_SSSE3(const uint8* src_y, | 
 |                              const uint8* src_u, | 
 |                              const uint8* src_v, | 
 |                              uint8* dst_argb, | 
 |                              int width); | 
 | void I411ToARGBRow_Any_AVX2(const uint8* src_y, | 
 |                             const uint8* src_u, | 
 |                             const uint8* src_v, | 
 |                             uint8* dst_argb, | 
 |                             int width); | 
 | void NV12ToARGBRow_Any_SSSE3(const uint8* src_y, | 
 |                              const uint8* src_uv, | 
 |                              uint8* dst_argb, | 
 |                              int width); | 
 | void NV21ToARGBRow_Any_SSSE3(const uint8* src_y, | 
 |                              const uint8* src_vu, | 
 |                              uint8* dst_argb, | 
 |                              int width); | 
 | void NV12ToARGBRow_Any_AVX2(const uint8* src_y, | 
 |                             const uint8* src_uv, | 
 |                             uint8* dst_argb, | 
 |                             int width); | 
 | void NV21ToARGBRow_Any_AVX2(const uint8* src_y, | 
 |                             const uint8* src_vu, | 
 |                             uint8* dst_argb, | 
 |                             int width); | 
 | void NV12ToRGB565Row_Any_SSSE3(const uint8* src_y, | 
 |                                const uint8* src_uv, | 
 |                                uint8* dst_argb, | 
 |                                int width); | 
 | void NV21ToRGB565Row_Any_SSSE3(const uint8* src_y, | 
 |                                const uint8* src_vu, | 
 |                                uint8* dst_argb, | 
 |                                int width); | 
 | void NV12ToRGB565Row_Any_AVX2(const uint8* src_y, | 
 |                               const uint8* src_uv, | 
 |                               uint8* dst_argb, | 
 |                               int width); | 
 | void NV21ToRGB565Row_Any_AVX2(const uint8* src_y, | 
 |                               const uint8* src_vu, | 
 |                               uint8* dst_argb, | 
 |                               int width); | 
 | void YUY2ToARGBRow_Any_SSSE3(const uint8* src_yuy2, | 
 |                              uint8* dst_argb, | 
 |                              int width); | 
 | void UYVYToARGBRow_Any_SSSE3(const uint8* src_uyvy, | 
 |                              uint8* dst_argb, | 
 |                              int width); | 
 | void YUY2ToARGBRow_Any_AVX2(const uint8* src_yuy2, | 
 |                             uint8* dst_argb, | 
 |                             int width); | 
 | void UYVYToARGBRow_Any_AVX2(const uint8* src_uyvy, | 
 |                             uint8* dst_argb, | 
 |                             int width); | 
 | void J422ToARGBRow_Any_SSSE3(const uint8* src_y, | 
 |                              const uint8* src_u, | 
 |                              const uint8* src_v, | 
 |                              uint8* dst_argb, | 
 |                              int width); | 
 | void J422ToARGBRow_Any_AVX2(const uint8* src_y, | 
 |                             const uint8* src_u, | 
 |                             const uint8* src_v, | 
 |                             uint8* dst_argb, | 
 |                             int width); | 
 | void I422ToBGRARow_Any_SSSE3(const uint8* src_y, | 
 |                              const uint8* src_u, | 
 |                              const uint8* src_v, | 
 |                              uint8* dst_bgra, | 
 |                              int width); | 
 | void I422ToABGRRow_Any_SSSE3(const uint8* src_y, | 
 |                              const uint8* src_u, | 
 |                              const uint8* src_v, | 
 |                              uint8* dst_abgr, | 
 |                              int width); | 
 | void I422ToRGBARow_Any_SSSE3(const uint8* src_y, | 
 |                              const uint8* src_u, | 
 |                              const uint8* src_v, | 
 |                              uint8* dst_rgba, | 
 |                              int width); | 
 | void I422ToARGB4444Row_Any_SSSE3(const uint8* src_y, | 
 |                                  const uint8* src_u, | 
 |                                  const uint8* src_v, | 
 |                                  uint8* dst_rgba, | 
 |                                  int width); | 
 | void I422ToARGB4444Row_Any_AVX2(const uint8* src_y, | 
 |                                 const uint8* src_u, | 
 |                                 const uint8* src_v, | 
 |                                 uint8* dst_rgba, | 
 |                                 int width); | 
 | void I422ToARGB1555Row_Any_SSSE3(const uint8* src_y, | 
 |                                  const uint8* src_u, | 
 |                                  const uint8* src_v, | 
 |                                  uint8* dst_rgba, | 
 |                                  int width); | 
 | void I422ToARGB1555Row_Any_AVX2(const uint8* src_y, | 
 |                                 const uint8* src_u, | 
 |                                 const uint8* src_v, | 
 |                                 uint8* dst_rgba, | 
 |                                 int width); | 
 | void I422ToRGB565Row_Any_SSSE3(const uint8* src_y, | 
 |                                const uint8* src_u, | 
 |                                const uint8* src_v, | 
 |                                uint8* dst_rgba, | 
 |                                int width); | 
 | void I422ToRGB565Row_Any_AVX2(const uint8* src_y, | 
 |                               const uint8* src_u, | 
 |                               const uint8* src_v, | 
 |                               uint8* dst_rgba, | 
 |                               int width); | 
 | void I422ToRGB24Row_Any_SSSE3(const uint8* src_y, | 
 |                               const uint8* src_u, | 
 |                               const uint8* src_v, | 
 |                               uint8* dst_argb, | 
 |                               int width); | 
 | void I422ToRGB24Row_Any_AVX2(const uint8* src_y, | 
 |                              const uint8* src_u, | 
 |                              const uint8* src_v, | 
 |                              uint8* dst_argb, | 
 |                              int width); | 
 | void I422ToRAWRow_Any_SSSE3(const uint8* src_y, | 
 |                             const uint8* src_u, | 
 |                             const uint8* src_v, | 
 |                             uint8* dst_argb, | 
 |                             int width); | 
 | void I422ToRAWRow_Any_AVX2(const uint8* src_y, | 
 |                            const uint8* src_u, | 
 |                            const uint8* src_v, | 
 |                            uint8* dst_argb, | 
 |                            int width); | 
 |  | 
 | void I400ToARGBRow_C(const uint8* src_y, uint8* dst_argb, int width); | 
 | void I400ToARGBRow_SSE2(const uint8* src_y, uint8* dst_argb, int width); | 
 | void I400ToARGBRow_AVX2(const uint8* src_y, uint8* dst_argb, int width); | 
 | void I400ToARGBRow_NEON(const uint8* src_y, uint8* dst_argb, int width); | 
 | void I400ToARGBRow_Any_SSE2(const uint8* src_y, uint8* dst_argb, int width); | 
 | void I400ToARGBRow_Any_AVX2(const uint8* src_y, uint8* dst_argb, int width); | 
 | void I400ToARGBRow_Any_NEON(const uint8* src_y, uint8* dst_argb, int width); | 
 |  | 
 | // ARGB preattenuated alpha blend. | 
 | void ARGBBlendRow_SSSE3(const uint8* src_argb, const uint8* src_argb1, | 
 |                         uint8* dst_argb, int width); | 
 | void ARGBBlendRow_SSE2(const uint8* src_argb, const uint8* src_argb1, | 
 |                        uint8* dst_argb, int width); | 
 | void ARGBBlendRow_NEON(const uint8* src_argb, const uint8* src_argb1, | 
 |                        uint8* dst_argb, int width); | 
 | void ARGBBlendRow_C(const uint8* src_argb, const uint8* src_argb1, | 
 |                     uint8* dst_argb, int width); | 
 |  | 
 | // ARGB multiply images. Same API as Blend, but these require | 
 | // pointer and width alignment for SSE2. | 
 | void ARGBMultiplyRow_C(const uint8* src_argb, const uint8* src_argb1, | 
 |                        uint8* dst_argb, int width); | 
 | void ARGBMultiplyRow_SSE2(const uint8* src_argb, const uint8* src_argb1, | 
 |                           uint8* dst_argb, int width); | 
 | void ARGBMultiplyRow_Any_SSE2(const uint8* src_argb, const uint8* src_argb1, | 
 |                               uint8* dst_argb, int width); | 
 | void ARGBMultiplyRow_AVX2(const uint8* src_argb, const uint8* src_argb1, | 
 |                           uint8* dst_argb, int width); | 
 | void ARGBMultiplyRow_Any_AVX2(const uint8* src_argb, const uint8* src_argb1, | 
 |                               uint8* dst_argb, int width); | 
 | void ARGBMultiplyRow_NEON(const uint8* src_argb, const uint8* src_argb1, | 
 |                           uint8* dst_argb, int width); | 
 | void ARGBMultiplyRow_Any_NEON(const uint8* src_argb, const uint8* src_argb1, | 
 |                               uint8* dst_argb, int width); | 
 |  | 
 | // ARGB add images. | 
 | void ARGBAddRow_C(const uint8* src_argb, const uint8* src_argb1, | 
 |                   uint8* dst_argb, int width); | 
 | void ARGBAddRow_SSE2(const uint8* src_argb, const uint8* src_argb1, | 
 |                      uint8* dst_argb, int width); | 
 | void ARGBAddRow_Any_SSE2(const uint8* src_argb, const uint8* src_argb1, | 
 |                          uint8* dst_argb, int width); | 
 | void ARGBAddRow_AVX2(const uint8* src_argb, const uint8* src_argb1, | 
 |                      uint8* dst_argb, int width); | 
 | void ARGBAddRow_Any_AVX2(const uint8* src_argb, const uint8* src_argb1, | 
 |                          uint8* dst_argb, int width); | 
 | void ARGBAddRow_NEON(const uint8* src_argb, const uint8* src_argb1, | 
 |                      uint8* dst_argb, int width); | 
 | void ARGBAddRow_Any_NEON(const uint8* src_argb, const uint8* src_argb1, | 
 |                          uint8* dst_argb, int width); | 
 |  | 
 | // ARGB subtract images. Same API as Blend, but these require | 
 | // pointer and width alignment for SSE2. | 
 | void ARGBSubtractRow_C(const uint8* src_argb, const uint8* src_argb1, | 
 |                        uint8* dst_argb, int width); | 
 | void ARGBSubtractRow_SSE2(const uint8* src_argb, const uint8* src_argb1, | 
 |                           uint8* dst_argb, int width); | 
 | void ARGBSubtractRow_Any_SSE2(const uint8* src_argb, const uint8* src_argb1, | 
 |                               uint8* dst_argb, int width); | 
 | void ARGBSubtractRow_AVX2(const uint8* src_argb, const uint8* src_argb1, | 
 |                           uint8* dst_argb, int width); | 
 | void ARGBSubtractRow_Any_AVX2(const uint8* src_argb, const uint8* src_argb1, | 
 |                               uint8* dst_argb, int width); | 
 | void ARGBSubtractRow_NEON(const uint8* src_argb, const uint8* src_argb1, | 
 |                           uint8* dst_argb, int width); | 
 | void ARGBSubtractRow_Any_NEON(const uint8* src_argb, const uint8* src_argb1, | 
 |                               uint8* dst_argb, int width); | 
 |  | 
 | void ARGBToRGB24Row_Any_SSSE3(const uint8* src_argb, uint8* dst_rgb, int pix); | 
 | void ARGBToRAWRow_Any_SSSE3(const uint8* src_argb, uint8* dst_rgb, int pix); | 
 | void ARGBToRGB565Row_Any_SSE2(const uint8* src_argb, uint8* dst_rgb, int pix); | 
 | void ARGBToARGB1555Row_Any_SSE2(const uint8* src_argb, uint8* dst_rgb, int pix); | 
 | void ARGBToARGB4444Row_Any_SSE2(const uint8* src_argb, uint8* dst_rgb, int pix); | 
 |  | 
 | void ARGBToRGB565DitherRow_Any_SSE2(const uint8* src_argb, uint8* dst_rgb, | 
 |                                     const uint32 dither4, int pix); | 
 | void ARGBToRGB565DitherRow_Any_AVX2(const uint8* src_argb, uint8* dst_rgb, | 
 |                                     const uint32 dither4, int pix); | 
 |  | 
 | void ARGBToRGB565Row_Any_AVX2(const uint8* src_argb, uint8* dst_rgb, int pix); | 
 | void ARGBToARGB1555Row_Any_AVX2(const uint8* src_argb, uint8* dst_rgb, int pix); | 
 | void ARGBToARGB4444Row_Any_AVX2(const uint8* src_argb, uint8* dst_rgb, int pix); | 
 |  | 
 | void ARGBToRGB24Row_Any_NEON(const uint8* src_argb, uint8* dst_rgb, int pix); | 
 | void ARGBToRAWRow_Any_NEON(const uint8* src_argb, uint8* dst_rgb, int pix); | 
 | void ARGBToRGB565Row_Any_NEON(const uint8* src_argb, uint8* dst_rgb, int pix); | 
 | void ARGBToARGB1555Row_Any_NEON(const uint8* src_argb, uint8* dst_rgb, int pix); | 
 | void ARGBToARGB4444Row_Any_NEON(const uint8* src_argb, uint8* dst_rgb, int pix); | 
 | void ARGBToRGB565DitherRow_Any_NEON(const uint8* src_argb, uint8* dst_rgb, | 
 |                                     const uint32 dither4, int width); | 
 |  | 
 | void I444ToARGBRow_Any_NEON(const uint8* src_y, | 
 |                             const uint8* src_u, | 
 |                             const uint8* src_v, | 
 |                             uint8* dst_argb, | 
 |                             int width); | 
 | void I422ToARGBRow_Any_NEON(const uint8* src_y, | 
 |                             const uint8* src_u, | 
 |                             const uint8* src_v, | 
 |                             uint8* dst_argb, | 
 |                             int width); | 
 | void I411ToARGBRow_Any_NEON(const uint8* src_y, | 
 |                             const uint8* src_u, | 
 |                             const uint8* src_v, | 
 |                             uint8* dst_argb, | 
 |                             int width); | 
 | void I422ToBGRARow_Any_NEON(const uint8* src_y, | 
 |                             const uint8* src_u, | 
 |                             const uint8* src_v, | 
 |                             uint8* dst_argb, | 
 |                             int width); | 
 | void I422ToABGRRow_Any_NEON(const uint8* src_y, | 
 |                             const uint8* src_u, | 
 |                             const uint8* src_v, | 
 |                             uint8* dst_argb, | 
 |                             int width); | 
 | void I422ToRGBARow_Any_NEON(const uint8* src_y, | 
 |                             const uint8* src_u, | 
 |                             const uint8* src_v, | 
 |                             uint8* dst_argb, | 
 |                             int width); | 
 | void I422ToRGB24Row_Any_NEON(const uint8* src_y, | 
 |                              const uint8* src_u, | 
 |                              const uint8* src_v, | 
 |                              uint8* dst_argb, | 
 |                              int width); | 
 | void I422ToRAWRow_Any_NEON(const uint8* src_y, | 
 |                            const uint8* src_u, | 
 |                            const uint8* src_v, | 
 |                            uint8* dst_argb, | 
 |                            int width); | 
 | void I422ToARGB4444Row_Any_NEON(const uint8* src_y, | 
 |                                 const uint8* src_u, | 
 |                                 const uint8* src_v, | 
 |                                 uint8* dst_argb, | 
 |                                 int width); | 
 | void I422ToARGB1555Row_Any_NEON(const uint8* src_y, | 
 |                                 const uint8* src_u, | 
 |                                 const uint8* src_v, | 
 |                                 uint8* dst_argb, | 
 |                                 int width); | 
 | void I422ToRGB565Row_Any_NEON(const uint8* src_y, | 
 |                               const uint8* src_u, | 
 |                               const uint8* src_v, | 
 |                               uint8* dst_argb, | 
 |                               int width); | 
 | void NV12ToARGBRow_Any_NEON(const uint8* src_y, | 
 |                             const uint8* src_uv, | 
 |                             uint8* dst_argb, | 
 |                             int width); | 
 | void NV21ToARGBRow_Any_NEON(const uint8* src_y, | 
 |                             const uint8* src_uv, | 
 |                             uint8* dst_argb, | 
 |                             int width); | 
 | void NV12ToRGB565Row_Any_NEON(const uint8* src_y, | 
 |                               const uint8* src_uv, | 
 |                               uint8* dst_argb, | 
 |                               int width); | 
 | void NV21ToRGB565Row_Any_NEON(const uint8* src_y, | 
 |                               const uint8* src_uv, | 
 |                               uint8* dst_argb, | 
 |                               int width); | 
 | void YUY2ToARGBRow_Any_NEON(const uint8* src_yuy2, | 
 |                             uint8* dst_argb, | 
 |                             int width); | 
 | void UYVYToARGBRow_Any_NEON(const uint8* src_uyvy, | 
 |                             uint8* dst_argb, | 
 |                             int width); | 
 | void I422ToARGBRow_MIPS_DSPR2(const uint8* src_y, | 
 |                               const uint8* src_u, | 
 |                               const uint8* src_v, | 
 |                               uint8* dst_argb, | 
 |                               int width); | 
 | void I422ToBGRARow_MIPS_DSPR2(const uint8* src_y, | 
 |                               const uint8* src_u, | 
 |                               const uint8* src_v, | 
 |                               uint8* dst_argb, | 
 |                               int width); | 
 | void I422ToABGRRow_MIPS_DSPR2(const uint8* src_y, | 
 |                               const uint8* src_u, | 
 |                               const uint8* src_v, | 
 |                               uint8* dst_argb, | 
 |                               int width); | 
 | void I422ToARGBRow_MIPS_DSPR2(const uint8* src_y, | 
 |                               const uint8* src_u, | 
 |                               const uint8* src_v, | 
 |                               uint8* dst_argb, | 
 |                               int width); | 
 | void I422ToBGRARow_MIPS_DSPR2(const uint8* src_y, | 
 |                               const uint8* src_u, | 
 |                               const uint8* src_v, | 
 |                               uint8* dst_argb, | 
 |                               int width); | 
 | void I422ToABGRRow_MIPS_DSPR2(const uint8* src_y, | 
 |                               const uint8* src_u, | 
 |                               const uint8* src_v, | 
 |                               uint8* dst_argb, | 
 |                               int width); | 
 |  | 
 | void YUY2ToYRow_AVX2(const uint8* src_yuy2, uint8* dst_y, int pix); | 
 | void YUY2ToUVRow_AVX2(const uint8* src_yuy2, int stride_yuy2, | 
 |                       uint8* dst_u, uint8* dst_v, int pix); | 
 | void YUY2ToUV422Row_AVX2(const uint8* src_yuy2, | 
 |                          uint8* dst_u, uint8* dst_v, int pix); | 
 | void YUY2ToYRow_SSE2(const uint8* src_yuy2, uint8* dst_y, int pix); | 
 | void YUY2ToUVRow_SSE2(const uint8* src_yuy2, int stride_yuy2, | 
 |                       uint8* dst_u, uint8* dst_v, int pix); | 
 | void YUY2ToUV422Row_SSE2(const uint8* src_yuy2, | 
 |                          uint8* dst_u, uint8* dst_v, int pix); | 
 | void YUY2ToYRow_NEON(const uint8* src_yuy2, uint8* dst_y, int pix); | 
 | void YUY2ToUVRow_NEON(const uint8* src_yuy2, int stride_yuy2, | 
 |                       uint8* dst_u, uint8* dst_v, int pix); | 
 | void YUY2ToUV422Row_NEON(const uint8* src_yuy2, | 
 |                          uint8* dst_u, uint8* dst_v, int pix); | 
 | void YUY2ToYRow_C(const uint8* src_yuy2, uint8* dst_y, int pix); | 
 | void YUY2ToUVRow_C(const uint8* src_yuy2, int stride_yuy2, | 
 |                    uint8* dst_u, uint8* dst_v, int pix); | 
 | void YUY2ToUV422Row_C(const uint8* src_yuy2, | 
 |                       uint8* dst_u, uint8* dst_v, int pix); | 
 | void YUY2ToYRow_Any_AVX2(const uint8* src_yuy2, uint8* dst_y, int pix); | 
 | void YUY2ToUVRow_Any_AVX2(const uint8* src_yuy2, int stride_yuy2, | 
 |                           uint8* dst_u, uint8* dst_v, int pix); | 
 | void YUY2ToUV422Row_Any_AVX2(const uint8* src_yuy2, | 
 |                              uint8* dst_u, uint8* dst_v, int pix); | 
 | void YUY2ToYRow_Any_SSE2(const uint8* src_yuy2, uint8* dst_y, int pix); | 
 | void YUY2ToUVRow_Any_SSE2(const uint8* src_yuy2, int stride_yuy2, | 
 |                           uint8* dst_u, uint8* dst_v, int pix); | 
 | void YUY2ToUV422Row_Any_SSE2(const uint8* src_yuy2, | 
 |                              uint8* dst_u, uint8* dst_v, int pix); | 
 | void YUY2ToYRow_Any_NEON(const uint8* src_yuy2, uint8* dst_y, int pix); | 
 | void YUY2ToUVRow_Any_NEON(const uint8* src_yuy2, int stride_yuy2, | 
 |                           uint8* dst_u, uint8* dst_v, int pix); | 
 | void YUY2ToUV422Row_Any_NEON(const uint8* src_yuy2, | 
 |                              uint8* dst_u, uint8* dst_v, int pix); | 
 | void UYVYToYRow_AVX2(const uint8* src_uyvy, uint8* dst_y, int pix); | 
 | void UYVYToUVRow_AVX2(const uint8* src_uyvy, int stride_uyvy, | 
 |                       uint8* dst_u, uint8* dst_v, int pix); | 
 | void UYVYToUV422Row_AVX2(const uint8* src_uyvy, | 
 |                          uint8* dst_u, uint8* dst_v, int pix); | 
 | void UYVYToYRow_SSE2(const uint8* src_uyvy, uint8* dst_y, int pix); | 
 | void UYVYToUVRow_SSE2(const uint8* src_uyvy, int stride_uyvy, | 
 |                       uint8* dst_u, uint8* dst_v, int pix); | 
 | void UYVYToUV422Row_SSE2(const uint8* src_uyvy, | 
 |                          uint8* dst_u, uint8* dst_v, int pix); | 
 | void UYVYToYRow_AVX2(const uint8* src_uyvy, uint8* dst_y, int pix); | 
 | void UYVYToUVRow_AVX2(const uint8* src_uyvy, int stride_uyvy, | 
 |                       uint8* dst_u, uint8* dst_v, int pix); | 
 | void UYVYToUV422Row_AVX2(const uint8* src_uyvy, | 
 |                          uint8* dst_u, uint8* dst_v, int pix); | 
 | void UYVYToYRow_NEON(const uint8* src_uyvy, uint8* dst_y, int pix); | 
 | void UYVYToUVRow_NEON(const uint8* src_uyvy, int stride_uyvy, | 
 |                       uint8* dst_u, uint8* dst_v, int pix); | 
 | void UYVYToUV422Row_NEON(const uint8* src_uyvy, | 
 |                          uint8* dst_u, uint8* dst_v, int pix); | 
 |  | 
 | void UYVYToYRow_C(const uint8* src_uyvy, uint8* dst_y, int pix); | 
 | void UYVYToUVRow_C(const uint8* src_uyvy, int stride_uyvy, | 
 |                    uint8* dst_u, uint8* dst_v, int pix); | 
 | void UYVYToUV422Row_C(const uint8* src_uyvy, | 
 |                       uint8* dst_u, uint8* dst_v, int pix); | 
 | void UYVYToYRow_Any_AVX2(const uint8* src_uyvy, uint8* dst_y, int pix); | 
 | void UYVYToUVRow_Any_AVX2(const uint8* src_uyvy, int stride_uyvy, | 
 |                           uint8* dst_u, uint8* dst_v, int pix); | 
 | void UYVYToUV422Row_Any_AVX2(const uint8* src_uyvy, | 
 |                              uint8* dst_u, uint8* dst_v, int pix); | 
 | void UYVYToYRow_Any_SSE2(const uint8* src_uyvy, uint8* dst_y, int pix); | 
 | void UYVYToUVRow_Any_SSE2(const uint8* src_uyvy, int stride_uyvy, | 
 |                           uint8* dst_u, uint8* dst_v, int pix); | 
 | void UYVYToUV422Row_Any_SSE2(const uint8* src_uyvy, | 
 |                              uint8* dst_u, uint8* dst_v, int pix); | 
 | void UYVYToYRow_Any_NEON(const uint8* src_uyvy, uint8* dst_y, int pix); | 
 | void UYVYToUVRow_Any_NEON(const uint8* src_uyvy, int stride_uyvy, | 
 |                           uint8* dst_u, uint8* dst_v, int pix); | 
 | void UYVYToUV422Row_Any_NEON(const uint8* src_uyvy, | 
 |                              uint8* dst_u, uint8* dst_v, int pix); | 
 |  | 
 | void I422ToYUY2Row_C(const uint8* src_y, | 
 |                      const uint8* src_u, | 
 |                      const uint8* src_v, | 
 |                      uint8* dst_yuy2, int width); | 
 | void I422ToUYVYRow_C(const uint8* src_y, | 
 |                      const uint8* src_u, | 
 |                      const uint8* src_v, | 
 |                      uint8* dst_uyvy, int width); | 
 | void I422ToYUY2Row_SSE2(const uint8* src_y, | 
 |                         const uint8* src_u, | 
 |                         const uint8* src_v, | 
 |                         uint8* dst_yuy2, int width); | 
 | void I422ToUYVYRow_SSE2(const uint8* src_y, | 
 |                         const uint8* src_u, | 
 |                         const uint8* src_v, | 
 |                         uint8* dst_uyvy, int width); | 
 | void I422ToYUY2Row_Any_SSE2(const uint8* src_y, | 
 |                             const uint8* src_u, | 
 |                             const uint8* src_v, | 
 |                             uint8* dst_yuy2, int width); | 
 | void I422ToUYVYRow_Any_SSE2(const uint8* src_y, | 
 |                             const uint8* src_u, | 
 |                             const uint8* src_v, | 
 |                             uint8* dst_uyvy, int width); | 
 | void I422ToYUY2Row_NEON(const uint8* src_y, | 
 |                         const uint8* src_u, | 
 |                         const uint8* src_v, | 
 |                         uint8* dst_yuy2, int width); | 
 | void I422ToUYVYRow_NEON(const uint8* src_y, | 
 |                         const uint8* src_u, | 
 |                         const uint8* src_v, | 
 |                         uint8* dst_uyvy, int width); | 
 | void I422ToYUY2Row_Any_NEON(const uint8* src_y, | 
 |                             const uint8* src_u, | 
 |                             const uint8* src_v, | 
 |                             uint8* dst_yuy2, int width); | 
 | void I422ToUYVYRow_Any_NEON(const uint8* src_y, | 
 |                             const uint8* src_u, | 
 |                             const uint8* src_v, | 
 |                             uint8* dst_uyvy, int width); | 
 |  | 
 | // Effects related row functions. | 
 | void ARGBAttenuateRow_C(const uint8* src_argb, uint8* dst_argb, int width); | 
 | void ARGBAttenuateRow_SSE2(const uint8* src_argb, uint8* dst_argb, int width); | 
 | void ARGBAttenuateRow_SSSE3(const uint8* src_argb, uint8* dst_argb, int width); | 
 | void ARGBAttenuateRow_AVX2(const uint8* src_argb, uint8* dst_argb, int width); | 
 | void ARGBAttenuateRow_NEON(const uint8* src_argb, uint8* dst_argb, int width); | 
 | void ARGBAttenuateRow_Any_SSE2(const uint8* src_argb, uint8* dst_argb, | 
 |                                int width); | 
 | void ARGBAttenuateRow_Any_SSSE3(const uint8* src_argb, uint8* dst_argb, | 
 |                                 int width); | 
 | void ARGBAttenuateRow_Any_AVX2(const uint8* src_argb, uint8* dst_argb, | 
 |                                int width); | 
 | void ARGBAttenuateRow_Any_NEON(const uint8* src_argb, uint8* dst_argb, | 
 |                                int width); | 
 |  | 
 | // Inverse table for unattenuate, shared by C and SSE2. | 
 | extern const uint32 fixed_invtbl8[256]; | 
 | void ARGBUnattenuateRow_C(const uint8* src_argb, uint8* dst_argb, int width); | 
 | void ARGBUnattenuateRow_SSE2(const uint8* src_argb, uint8* dst_argb, int width); | 
 | void ARGBUnattenuateRow_AVX2(const uint8* src_argb, uint8* dst_argb, int width); | 
 | void ARGBUnattenuateRow_Any_SSE2(const uint8* src_argb, uint8* dst_argb, | 
 |                                  int width); | 
 | void ARGBUnattenuateRow_Any_AVX2(const uint8* src_argb, uint8* dst_argb, | 
 |                                  int width); | 
 |  | 
 | void ARGBGrayRow_C(const uint8* src_argb, uint8* dst_argb, int width); | 
 | void ARGBGrayRow_SSSE3(const uint8* src_argb, uint8* dst_argb, int width); | 
 | void ARGBGrayRow_NEON(const uint8* src_argb, uint8* dst_argb, int width); | 
 |  | 
 | void ARGBSepiaRow_C(uint8* dst_argb, int width); | 
 | void ARGBSepiaRow_SSSE3(uint8* dst_argb, int width); | 
 | void ARGBSepiaRow_NEON(uint8* dst_argb, int width); | 
 |  | 
 | void ARGBColorMatrixRow_C(const uint8* src_argb, uint8* dst_argb, | 
 |                           const int8* matrix_argb, int width); | 
 | void ARGBColorMatrixRow_SSSE3(const uint8* src_argb, uint8* dst_argb, | 
 |                               const int8* matrix_argb, int width); | 
 | void ARGBColorMatrixRow_NEON(const uint8* src_argb, uint8* dst_argb, | 
 |                              const int8* matrix_argb, int width); | 
 |  | 
 | void ARGBColorTableRow_C(uint8* dst_argb, const uint8* table_argb, int width); | 
 | void ARGBColorTableRow_X86(uint8* dst_argb, const uint8* table_argb, int width); | 
 |  | 
 | void RGBColorTableRow_C(uint8* dst_argb, const uint8* table_argb, int width); | 
 | void RGBColorTableRow_X86(uint8* dst_argb, const uint8* table_argb, int width); | 
 |  | 
 | void ARGBQuantizeRow_C(uint8* dst_argb, int scale, int interval_size, | 
 |                        int interval_offset, int width); | 
 | void ARGBQuantizeRow_SSE2(uint8* dst_argb, int scale, int interval_size, | 
 |                           int interval_offset, int width); | 
 | void ARGBQuantizeRow_NEON(uint8* dst_argb, int scale, int interval_size, | 
 |                           int interval_offset, int width); | 
 |  | 
 | void ARGBShadeRow_C(const uint8* src_argb, uint8* dst_argb, int width, | 
 |                     uint32 value); | 
 | void ARGBShadeRow_SSE2(const uint8* src_argb, uint8* dst_argb, int width, | 
 |                        uint32 value); | 
 | void ARGBShadeRow_NEON(const uint8* src_argb, uint8* dst_argb, int width, | 
 |                        uint32 value); | 
 |  | 
 | // Used for blur. | 
 | void CumulativeSumToAverageRow_SSE2(const int32* topleft, const int32* botleft, | 
 |                                     int width, int area, uint8* dst, int count); | 
 | void ComputeCumulativeSumRow_SSE2(const uint8* row, int32* cumsum, | 
 |                                   const int32* previous_cumsum, int width); | 
 |  | 
 | void CumulativeSumToAverageRow_C(const int32* topleft, const int32* botleft, | 
 |                                  int width, int area, uint8* dst, int count); | 
 | void ComputeCumulativeSumRow_C(const uint8* row, int32* cumsum, | 
 |                                const int32* previous_cumsum, int width); | 
 |  | 
 | LIBYUV_API | 
 | void ARGBAffineRow_C(const uint8* src_argb, int src_argb_stride, | 
 |                      uint8* dst_argb, const float* uv_dudv, int width); | 
 | LIBYUV_API | 
 | void ARGBAffineRow_SSE2(const uint8* src_argb, int src_argb_stride, | 
 |                         uint8* dst_argb, const float* uv_dudv, int width); | 
 |  | 
 | // Used for I420Scale, ARGBScale, and ARGBInterpolate. | 
 | void InterpolateRow_C(uint8* dst_ptr, const uint8* src_ptr, | 
 |                       ptrdiff_t src_stride_ptr, | 
 |                       int width, int source_y_fraction); | 
 | void InterpolateRow_SSE2(uint8* dst_ptr, const uint8* src_ptr, | 
 |                          ptrdiff_t src_stride_ptr, int width, | 
 |                          int source_y_fraction); | 
 | void InterpolateRow_SSSE3(uint8* dst_ptr, const uint8* src_ptr, | 
 |                           ptrdiff_t src_stride_ptr, int width, | 
 |                           int source_y_fraction); | 
 | void InterpolateRow_AVX2(uint8* dst_ptr, const uint8* src_ptr, | 
 |                          ptrdiff_t src_stride_ptr, int width, | 
 |                          int source_y_fraction); | 
 | void InterpolateRow_NEON(uint8* dst_ptr, const uint8* src_ptr, | 
 |                          ptrdiff_t src_stride_ptr, int width, | 
 |                          int source_y_fraction); | 
 | void InterpolateRow_MIPS_DSPR2(uint8* dst_ptr, const uint8* src_ptr, | 
 |                                ptrdiff_t src_stride_ptr, int width, | 
 |                                int source_y_fraction); | 
 | void InterpolateRow_Any_NEON(uint8* dst_ptr, const uint8* src_ptr, | 
 |                              ptrdiff_t src_stride_ptr, int width, | 
 |                              int source_y_fraction); | 
 | void InterpolateRow_Any_SSE2(uint8* dst_ptr, const uint8* src_ptr, | 
 |                              ptrdiff_t src_stride_ptr, int width, | 
 |                              int source_y_fraction); | 
 | void InterpolateRow_Any_SSSE3(uint8* dst_ptr, const uint8* src_ptr, | 
 |                               ptrdiff_t src_stride_ptr, int width, | 
 |                               int source_y_fraction); | 
 | void InterpolateRow_Any_AVX2(uint8* dst_ptr, const uint8* src_ptr, | 
 |                              ptrdiff_t src_stride_ptr, int width, | 
 |                              int source_y_fraction); | 
 | void InterpolateRow_Any_MIPS_DSPR2(uint8* dst_ptr, const uint8* src_ptr, | 
 |                                    ptrdiff_t src_stride_ptr, int width, | 
 |                                    int source_y_fraction); | 
 |  | 
 | void InterpolateRow_16_C(uint16* dst_ptr, const uint16* src_ptr, | 
 |                          ptrdiff_t src_stride_ptr, | 
 |                          int width, int source_y_fraction); | 
 |  | 
 | // Sobel images. | 
 | void SobelXRow_C(const uint8* src_y0, const uint8* src_y1, const uint8* src_y2, | 
 |                  uint8* dst_sobelx, int width); | 
 | void SobelXRow_SSE2(const uint8* src_y0, const uint8* src_y1, | 
 |                     const uint8* src_y2, uint8* dst_sobelx, int width); | 
 | void SobelXRow_NEON(const uint8* src_y0, const uint8* src_y1, | 
 |                     const uint8* src_y2, uint8* dst_sobelx, int width); | 
 | void SobelYRow_C(const uint8* src_y0, const uint8* src_y1, | 
 |                  uint8* dst_sobely, int width); | 
 | void SobelYRow_SSE2(const uint8* src_y0, const uint8* src_y1, | 
 |                     uint8* dst_sobely, int width); | 
 | void SobelYRow_NEON(const uint8* src_y0, const uint8* src_y1, | 
 |                     uint8* dst_sobely, int width); | 
 | void SobelRow_C(const uint8* src_sobelx, const uint8* src_sobely, | 
 |                 uint8* dst_argb, int width); | 
 | void SobelRow_SSE2(const uint8* src_sobelx, const uint8* src_sobely, | 
 |                    uint8* dst_argb, int width); | 
 | void SobelRow_NEON(const uint8* src_sobelx, const uint8* src_sobely, | 
 |                    uint8* dst_argb, int width); | 
 | void SobelToPlaneRow_C(const uint8* src_sobelx, const uint8* src_sobely, | 
 |                        uint8* dst_y, int width); | 
 | void SobelToPlaneRow_SSE2(const uint8* src_sobelx, const uint8* src_sobely, | 
 |                           uint8* dst_y, int width); | 
 | void SobelToPlaneRow_NEON(const uint8* src_sobelx, const uint8* src_sobely, | 
 |                           uint8* dst_y, int width); | 
 | void SobelXYRow_C(const uint8* src_sobelx, const uint8* src_sobely, | 
 |                   uint8* dst_argb, int width); | 
 | void SobelXYRow_SSE2(const uint8* src_sobelx, const uint8* src_sobely, | 
 |                      uint8* dst_argb, int width); | 
 | void SobelXYRow_NEON(const uint8* src_sobelx, const uint8* src_sobely, | 
 |                      uint8* dst_argb, int width); | 
 | void SobelRow_Any_SSE2(const uint8* src_sobelx, const uint8* src_sobely, | 
 |                        uint8* dst_argb, int width); | 
 | void SobelRow_Any_NEON(const uint8* src_sobelx, const uint8* src_sobely, | 
 |                        uint8* dst_argb, int width); | 
 | void SobelToPlaneRow_Any_SSE2(const uint8* src_sobelx, const uint8* src_sobely, | 
 |                               uint8* dst_y, int width); | 
 | void SobelToPlaneRow_Any_NEON(const uint8* src_sobelx, const uint8* src_sobely, | 
 |                               uint8* dst_y, int width); | 
 | void SobelXYRow_Any_SSE2(const uint8* src_sobelx, const uint8* src_sobely, | 
 |                          uint8* dst_argb, int width); | 
 | void SobelXYRow_Any_NEON(const uint8* src_sobelx, const uint8* src_sobely, | 
 |                          uint8* dst_argb, int width); | 
 |  | 
 | void ARGBPolynomialRow_C(const uint8* src_argb, | 
 |                          uint8* dst_argb, const float* poly, | 
 |                          int width); | 
 | void ARGBPolynomialRow_SSE2(const uint8* src_argb, | 
 |                             uint8* dst_argb, const float* poly, | 
 |                             int width); | 
 | void ARGBPolynomialRow_AVX2(const uint8* src_argb, | 
 |                             uint8* dst_argb, const float* poly, | 
 |                             int width); | 
 |  | 
 | void ARGBLumaColorTableRow_C(const uint8* src_argb, uint8* dst_argb, int width, | 
 |                              const uint8* luma, uint32 lumacoeff); | 
 | void ARGBLumaColorTableRow_SSSE3(const uint8* src_argb, uint8* dst_argb, | 
 |                                  int width, | 
 |                                  const uint8* luma, uint32 lumacoeff); | 
 |  | 
 | #ifdef __cplusplus | 
 | }  // extern "C" | 
 | }  // namespace libyuv | 
 | #endif | 
 |  | 
 | #endif  // INCLUDE_LIBYUV_ROW_H_  NOLINT |