Commit 3c11d4bf authored by fbarchard@google.com's avatar fbarchard@google.com

align avx2 buffers to 32 bytes

BUG=403
TESTED=untested
R=harryjin@google.com

Review URL: https://webrtc-codereview.appspot.com/40929004

git-svn-id: http://libyuv.googlecode.com/svn/trunk@1294 16f28f9a-4ce2-e073-06de-1de4eb20be90
parent 446fa955
Name: libyuv Name: libyuv
URL: http://code.google.com/p/libyuv/ URL: http://code.google.com/p/libyuv/
Version: 1293 Version: 1294
License: BSD License: BSD
License File: LICENSE License File: LICENSE
......
...@@ -219,6 +219,7 @@ extern "C" { ...@@ -219,6 +219,7 @@ extern "C" {
#if defined(HAS_I422TOARGBROW_AVX2) #if defined(HAS_I422TOARGBROW_AVX2)
#define HAS_YUY2TOARGBROW_AVX2 #define HAS_YUY2TOARGBROW_AVX2
#define HAS_UYVYTOARGBROW_AVX2 #define HAS_UYVYTOARGBROW_AVX2
// TODO(fbarchard): Enable once low levels are ported to AVX2
#define HAS_NV12TORGB565ROW_AVX2 #define HAS_NV12TORGB565ROW_AVX2
#define HAS_NV21TORGB565ROW_AVX2 #define HAS_NV21TORGB565ROW_AVX2
#define HAS_I422TORGB565ROW_AVX2 #define HAS_I422TORGB565ROW_AVX2
......
...@@ -11,6 +11,6 @@ ...@@ -11,6 +11,6 @@
#ifndef INCLUDE_LIBYUV_VERSION_H_ // NOLINT #ifndef INCLUDE_LIBYUV_VERSION_H_ // NOLINT
#define INCLUDE_LIBYUV_VERSION_H_ #define INCLUDE_LIBYUV_VERSION_H_
#define LIBYUV_VERSION 1293 #define LIBYUV_VERSION 1294
#endif // INCLUDE_LIBYUV_VERSION_H_ NOLINT #endif // INCLUDE_LIBYUV_VERSION_H_ NOLINT
...@@ -2265,7 +2265,7 @@ void I422ToRGB565Row_AVX2(const uint8* src_y, ...@@ -2265,7 +2265,7 @@ void I422ToRGB565Row_AVX2(const uint8* src_y,
const uint8* src_v, const uint8* src_v,
uint8* dst_rgb565, uint8* dst_rgb565,
int width) { int width) {
SIMD_ALIGNED(uint8 row[MAXTWIDTH * 4]); SIMD_ALIGNED32(uint8 row[MAXTWIDTH * 4]);
while (width > 0) { while (width > 0) {
int twidth = width > MAXTWIDTH ? MAXTWIDTH : width; int twidth = width > MAXTWIDTH ? MAXTWIDTH : width;
I422ToARGBRow_AVX2(src_y, src_u, src_v, row, twidth); I422ToARGBRow_AVX2(src_y, src_u, src_v, row, twidth);
...@@ -2286,7 +2286,7 @@ void I422ToARGB1555Row_AVX2(const uint8* src_y, ...@@ -2286,7 +2286,7 @@ void I422ToARGB1555Row_AVX2(const uint8* src_y,
uint8* dst_argb1555, uint8* dst_argb1555,
int width) { int width) {
// Row buffer for intermediate ARGB pixels. // Row buffer for intermediate ARGB pixels.
SIMD_ALIGNED(uint8 row[MAXTWIDTH * 4]); SIMD_ALIGNED32(uint8 row[MAXTWIDTH * 4]);
while (width > 0) { while (width > 0) {
int twidth = width > MAXTWIDTH ? MAXTWIDTH : width; int twidth = width > MAXTWIDTH ? MAXTWIDTH : width;
I422ToARGBRow_AVX2(src_y, src_u, src_v, row, twidth); I422ToARGBRow_AVX2(src_y, src_u, src_v, row, twidth);
...@@ -2307,7 +2307,7 @@ void I422ToARGB4444Row_AVX2(const uint8* src_y, ...@@ -2307,7 +2307,7 @@ void I422ToARGB4444Row_AVX2(const uint8* src_y,
uint8* dst_argb4444, uint8* dst_argb4444,
int width) { int width) {
// Row buffer for intermediate ARGB pixels. // Row buffer for intermediate ARGB pixels.
SIMD_ALIGNED(uint8 row[MAXTWIDTH * 4]); SIMD_ALIGNED32(uint8 row[MAXTWIDTH * 4]);
while (width > 0) { while (width > 0) {
int twidth = width > MAXTWIDTH ? MAXTWIDTH : width; int twidth = width > MAXTWIDTH ? MAXTWIDTH : width;
I422ToARGBRow_AVX2(src_y, src_u, src_v, row, twidth); I422ToARGBRow_AVX2(src_y, src_u, src_v, row, twidth);
...@@ -2325,7 +2325,7 @@ void I422ToARGB4444Row_AVX2(const uint8* src_y, ...@@ -2325,7 +2325,7 @@ void I422ToARGB4444Row_AVX2(const uint8* src_y,
void NV12ToRGB565Row_AVX2(const uint8* src_y, const uint8* src_uv, void NV12ToRGB565Row_AVX2(const uint8* src_y, const uint8* src_uv,
uint8* dst_rgb565, int width) { uint8* dst_rgb565, int width) {
// Row buffer for intermediate ARGB pixels. // Row buffer for intermediate ARGB pixels.
SIMD_ALIGNED(uint8 row[MAXTWIDTH * 4]); SIMD_ALIGNED32(uint8 row[MAXTWIDTH * 4]);
while (width > 0) { while (width > 0) {
int twidth = width > MAXTWIDTH ? MAXTWIDTH : width; int twidth = width > MAXTWIDTH ? MAXTWIDTH : width;
NV12ToARGBRow_AVX2(src_y, src_uv, row, twidth); NV12ToARGBRow_AVX2(src_y, src_uv, row, twidth);
...@@ -2342,7 +2342,7 @@ void NV12ToRGB565Row_AVX2(const uint8* src_y, const uint8* src_uv, ...@@ -2342,7 +2342,7 @@ void NV12ToRGB565Row_AVX2(const uint8* src_y, const uint8* src_uv,
void NV21ToRGB565Row_AVX2(const uint8* src_y, const uint8* src_vu, void NV21ToRGB565Row_AVX2(const uint8* src_y, const uint8* src_vu,
uint8* dst_rgb565, int width) { uint8* dst_rgb565, int width) {
// Row buffer for intermediate ARGB pixels. // Row buffer for intermediate ARGB pixels.
SIMD_ALIGNED(uint8 row[MAXTWIDTH * 4]); SIMD_ALIGNED32(uint8 row[MAXTWIDTH * 4]);
while (width > 0) { while (width > 0) {
int twidth = width > MAXTWIDTH ? MAXTWIDTH : width; int twidth = width > MAXTWIDTH ? MAXTWIDTH : width;
NV21ToARGBRow_AVX2(src_y, src_vu, row, twidth); NV21ToARGBRow_AVX2(src_y, src_vu, row, twidth);
...@@ -2358,9 +2358,9 @@ void NV21ToRGB565Row_AVX2(const uint8* src_y, const uint8* src_vu, ...@@ -2358,9 +2358,9 @@ void NV21ToRGB565Row_AVX2(const uint8* src_y, const uint8* src_vu,
#if defined(HAS_YUY2TOARGBROW_AVX2) #if defined(HAS_YUY2TOARGBROW_AVX2)
void YUY2ToARGBRow_AVX2(const uint8* src_yuy2, uint8* dst_argb, int width) { void YUY2ToARGBRow_AVX2(const uint8* src_yuy2, uint8* dst_argb, int width) {
// Row buffers for intermediate YUV pixels. // Row buffers for intermediate YUV pixels.
SIMD_ALIGNED(uint8 row_y[MAXTWIDTH]); SIMD_ALIGNED32(uint8 row_y[MAXTWIDTH]);
SIMD_ALIGNED(uint8 row_u[MAXTWIDTH / 2]); SIMD_ALIGNED32(uint8 row_u[MAXTWIDTH / 2]);
SIMD_ALIGNED(uint8 row_v[MAXTWIDTH / 2]); SIMD_ALIGNED32(uint8 row_v[MAXTWIDTH / 2]);
while (width > 0) { while (width > 0) {
int twidth = width > MAXTWIDTH ? MAXTWIDTH : width; int twidth = width > MAXTWIDTH ? MAXTWIDTH : width;
YUY2ToUV422Row_AVX2(src_yuy2, row_u, row_v, twidth); YUY2ToUV422Row_AVX2(src_yuy2, row_u, row_v, twidth);
...@@ -2376,9 +2376,9 @@ void YUY2ToARGBRow_AVX2(const uint8* src_yuy2, uint8* dst_argb, int width) { ...@@ -2376,9 +2376,9 @@ void YUY2ToARGBRow_AVX2(const uint8* src_yuy2, uint8* dst_argb, int width) {
#if defined(HAS_UYVYTOARGBROW_AVX2) #if defined(HAS_UYVYTOARGBROW_AVX2)
void UYVYToARGBRow_AVX2(const uint8* src_uyvy, uint8* dst_argb, int width) { void UYVYToARGBRow_AVX2(const uint8* src_uyvy, uint8* dst_argb, int width) {
// Row buffers for intermediate YUV pixels. // Row buffers for intermediate YUV pixels.
SIMD_ALIGNED(uint8 row_y[MAXTWIDTH]); SIMD_ALIGNED32(uint8 row_y[MAXTWIDTH]);
SIMD_ALIGNED(uint8 row_u[MAXTWIDTH / 2]); SIMD_ALIGNED32(uint8 row_u[MAXTWIDTH / 2]);
SIMD_ALIGNED(uint8 row_v[MAXTWIDTH / 2]); SIMD_ALIGNED32(uint8 row_v[MAXTWIDTH / 2]);
while (width > 0) { while (width > 0) {
int twidth = width > MAXTWIDTH ? MAXTWIDTH : width; int twidth = width > MAXTWIDTH ? MAXTWIDTH : width;
UYVYToUV422Row_AVX2(src_uyvy, row_u, row_v, twidth); UYVYToUV422Row_AVX2(src_uyvy, row_u, row_v, twidth);
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment