Commit 18c9ab10 authored by Frank Barchard's avatar Frank Barchard Committed by Frank Barchard

Rotate ARGB using scale_row.h header

ARGB rotation using scaling code.  Previously it had forward
declarations of the low level row functions used.  This CL
uses the header and hooks up Any and MSA versions of the code.

Bug: libyuv:779
Test: perf record out/Release/libyuv_unittest --gtest_filter=*ARGBRotate90_Opt --libyuv_width=640 --libyuv_height=359 --libyuv_repeat=999
Change-Id: Ifacd58b26bb17a236181a404fad589fd2543b911
Reviewed-on: https://chromium-review.googlesource.com/927530Reviewed-by: 's avatarWeiyong Yao <braveyao@chromium.org>
parent 29ba52ed
Name: libyuv Name: libyuv
URL: http://code.google.com/p/libyuv/ URL: http://code.google.com/p/libyuv/
Version: 1699 Version: 1700
License: BSD License: BSD
License File: LICENSE License File: LICENSE
......
...@@ -11,6 +11,6 @@ ...@@ -11,6 +11,6 @@
#ifndef INCLUDE_LIBYUV_VERSION_H_ #ifndef INCLUDE_LIBYUV_VERSION_H_
#define INCLUDE_LIBYUV_VERSION_H_ #define INCLUDE_LIBYUV_VERSION_H_
#define LIBYUV_VERSION 1699 #define LIBYUV_VERSION 1700
#endif // INCLUDE_LIBYUV_VERSION_H_ #endif // INCLUDE_LIBYUV_VERSION_H_
...@@ -14,111 +14,99 @@ ...@@ -14,111 +14,99 @@
#include "libyuv/cpu_id.h" #include "libyuv/cpu_id.h"
#include "libyuv/planar_functions.h" #include "libyuv/planar_functions.h"
#include "libyuv/row.h" #include "libyuv/row.h"
#include "libyuv/scale_row.h" /* for ScaleARGBRowDownEven_ */
#ifdef __cplusplus #ifdef __cplusplus
namespace libyuv { namespace libyuv {
extern "C" { extern "C" {
#endif #endif
// ARGBScale has a function to copy pixels to a row, striding each source static void ARGBTranspose(const uint8_t* src_argb,
// pixel by a constant. int src_stride_argb,
#if !defined(LIBYUV_DISABLE_X86) && \ uint8_t* dst_argb,
(defined(_M_IX86) || defined(__x86_64__) || defined(__i386__)) int dst_stride_argb,
#define HAS_SCALEARGBROWDOWNEVEN_SSE2
void ScaleARGBRowDownEven_SSE2(const uint8_t* src_ptr,
int src_stride,
int src_stepx,
uint8_t* dst_ptr,
int dst_width);
#endif
#if !defined(LIBYUV_DISABLE_NEON) && \
(defined(__ARM_NEON__) || defined(LIBYUV_NEON) || defined(__aarch64__))
#define HAS_SCALEARGBROWDOWNEVEN_NEON
void ScaleARGBRowDownEven_NEON(const uint8_t* src_ptr,
int src_stride,
int src_stepx,
uint8_t* dst_ptr,
int dst_width);
#endif
void ScaleARGBRowDownEven_C(const uint8_t* src_ptr,
int,
int src_stepx,
uint8_t* dst_ptr,
int dst_width);
static void ARGBTranspose(const uint8_t* src,
int src_stride,
uint8_t* dst,
int dst_stride,
int width, int width,
int height) { int height) {
int i; int i;
int src_pixel_step = src_stride >> 2; int src_pixel_step = src_stride_argb >> 2;
void (*ScaleARGBRowDownEven)(const uint8_t* src_ptr, int src_stride, void (*ScaleARGBRowDownEven)(const uint8_t* src_argb, ptrdiff_t src_stride_argb,
int src_step, uint8_t* dst_ptr, int dst_width) = int src_step, uint8_t* dst_argb, int dst_width) =
ScaleARGBRowDownEven_C; ScaleARGBRowDownEven_C;
#if defined(HAS_SCALEARGBROWDOWNEVEN_SSE2) #if defined(HAS_SCALEARGBROWDOWNEVEN_SSE2)
if (TestCpuFlag(kCpuHasSSE2) && IS_ALIGNED(height, 4)) { // Width of dest. if (TestCpuFlag(kCpuHasSSE2)) {
ScaleARGBRowDownEven = ScaleARGBRowDownEven_SSE2; ScaleARGBRowDownEven = ScaleARGBRowDownEven_Any_SSE2;
if (IS_ALIGNED(height, 4)) { // Width of dest.
ScaleARGBRowDownEven = ScaleARGBRowDownEven_SSE2;
}
} }
#endif #endif
#if defined(HAS_SCALEARGBROWDOWNEVEN_NEON) #if defined(HAS_SCALEARGBROWDOWNEVEN_NEON)
if (TestCpuFlag(kCpuHasNEON) && IS_ALIGNED(height, 4)) { // Width of dest. if (TestCpuFlag(kCpuHasNEON)) {
ScaleARGBRowDownEven = ScaleARGBRowDownEven_NEON; ScaleARGBRowDownEven = ScaleARGBRowDownEven_Any_NEON;
if (IS_ALIGNED(height, 4)) { // Width of dest.
ScaleARGBRowDownEven = ScaleARGBRowDownEven_NEON;
}
}
#endif
#if defined(HAS_SCALEARGBROWDOWNEVEN_MSA)
if (TestCpuFlag(kCpuHasMSA)) {
ScaleARGBRowDownEven = ScaleARGBRowDownEven_Any_MSA;
if (IS_ALIGNED(height, 4)) { // Width of dest.
ScaleARGBRowDownEven = ScaleARGBRowDownEven_MSA;
}
} }
#endif #endif
for (i = 0; i < width; ++i) { // column of source to row of dest. for (i = 0; i < width; ++i) { // column of source to row of dest.
ScaleARGBRowDownEven(src, 0, src_pixel_step, dst, height); ScaleARGBRowDownEven(src_argb, 0, src_pixel_step, dst_argb, height);
dst += dst_stride; dst_argb += dst_stride_argb;
src += 4; src_argb += 4;
} }
} }
void ARGBRotate90(const uint8_t* src, void ARGBRotate90(const uint8_t* src_argb,
int src_stride, int src_stride_argb,
uint8_t* dst, uint8_t* dst_argb,
int dst_stride, int dst_stride_argb,
int width, int width,
int height) { int height) {
// Rotate by 90 is a ARGBTranspose with the source read // Rotate by 90 is a ARGBTranspose with the source read
// from bottom to top. So set the source pointer to the end // from bottom to top. So set the source pointer to the end
// of the buffer and flip the sign of the source stride. // of the buffer and flip the sign of the source stride.
src += src_stride * (height - 1); src_argb += src_stride_argb * (height - 1);
src_stride = -src_stride; src_stride_argb = -src_stride_argb;
ARGBTranspose(src, src_stride, dst, dst_stride, width, height); ARGBTranspose(src_argb, src_stride_argb, dst_argb, dst_stride_argb, width, height);
} }
void ARGBRotate270(const uint8_t* src, void ARGBRotate270(const uint8_t* src_argb,
int src_stride, int src_stride_argb,
uint8_t* dst, uint8_t* dst_argb,
int dst_stride, int dst_stride_argb,
int width, int width,
int height) { int height) {
// Rotate by 270 is a ARGBTranspose with the destination written // Rotate by 270 is a ARGBTranspose with the destination written
// from bottom to top. So set the destination pointer to the end // from bottom to top. So set the destination pointer to the end
// of the buffer and flip the sign of the destination stride. // of the buffer and flip the sign of the destination stride.
dst += dst_stride * (width - 1); dst_argb += dst_stride_argb * (width - 1);
dst_stride = -dst_stride; dst_stride_argb = -dst_stride_argb;
ARGBTranspose(src, src_stride, dst, dst_stride, width, height); ARGBTranspose(src_argb, src_stride_argb, dst_argb, dst_stride_argb, width, height);
} }
void ARGBRotate180(const uint8_t* src, void ARGBRotate180(const uint8_t* src_argb,
int src_stride, int src_stride_argb,
uint8_t* dst, uint8_t* dst_argb,
int dst_stride, int dst_stride_argb,
int width, int width,
int height) { int height) {
// Swap first and last row and mirror the content. Uses a temporary row. // Swap first and last row and mirror the content. Uses a temporary row.
align_buffer_64(row, width * 4); align_buffer_64(row, width * 4);
const uint8_t* src_bot = src + src_stride * (height - 1); const uint8_t* src_bot = src_argb + src_stride_argb * (height - 1);
uint8_t* dst_bot = dst + dst_stride * (height - 1); uint8_t* dst_bot = dst_argb + dst_stride_argb * (height - 1);
int half_height = (height + 1) >> 1; int half_height = (height + 1) >> 1;
int y; int y;
void (*ARGBMirrorRow)(const uint8_t* src, uint8_t* dst, int width) = void (*ARGBMirrorRow)(const uint8_t* src_argb, uint8_t* dst_argb, int width) =
ARGBMirrorRow_C; ARGBMirrorRow_C;
void (*CopyRow)(const uint8_t* src, uint8_t* dst, int width) = CopyRow_C; void (*CopyRow)(const uint8_t* src_argb, uint8_t* dst_argb, int width) = CopyRow_C;
#if defined(HAS_ARGBMIRRORROW_NEON) #if defined(HAS_ARGBMIRRORROW_NEON)
if (TestCpuFlag(kCpuHasNEON)) { if (TestCpuFlag(kCpuHasNEON)) {
ARGBMirrorRow = ARGBMirrorRow_Any_NEON; ARGBMirrorRow = ARGBMirrorRow_Any_NEON;
...@@ -174,13 +162,13 @@ void ARGBRotate180(const uint8_t* src, ...@@ -174,13 +162,13 @@ void ARGBRotate180(const uint8_t* src,
// Odd height will harmlessly mirror the middle row twice. // Odd height will harmlessly mirror the middle row twice.
for (y = 0; y < half_height; ++y) { for (y = 0; y < half_height; ++y) {
ARGBMirrorRow(src, row, width); // Mirror first row into a buffer ARGBMirrorRow(src_argb, row, width); // Mirror first row into a buffer
ARGBMirrorRow(src_bot, dst, width); // Mirror last row into first row ARGBMirrorRow(src_bot, dst_argb, width); // Mirror last row into first row
CopyRow(row, dst_bot, width * 4); // Copy first mirrored row into last CopyRow(row, dst_bot, width * 4); // Copy first mirrored row into last
src += src_stride; src_argb += src_stride_argb;
dst += dst_stride; dst_argb += dst_stride_argb;
src_bot -= src_stride; src_bot -= src_stride_argb;
dst_bot -= dst_stride; dst_bot -= dst_stride_argb;
} }
free_aligned_buffer_64(row); free_aligned_buffer_64(row);
} }
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment