blob: 4a3eb1c4ea2a3fb7ec129a4d910bb4d51f80ea60 [file] [log] [blame]
/*
 *  Copyright 2012 The LibYuv Project Authors. All rights reserved.
 *
 *  Use of this source code is governed by a BSD-style license
 *  that can be found in the LICENSE file in the root of the source
 *  tree. An additional intellectual property rights grant can be found
 *  in the file PATENTS. All contributing project authors may
 *  be found in the AUTHORS file in the root of the source tree.
 */
10
11#include "libyuv/rotate.h"
12
13#include "libyuv/cpu_id.h"
14#include "libyuv/convert.h"
15#include "libyuv/planar_functions.h"
fbarchard@google.com142f6c42012-09-18 20:56:51 +000016#include "libyuv/row.h"
fbarchard@google.comd51c3422012-06-26 23:46:25 +000017
18#ifdef __cplusplus
19namespace libyuv {
20extern "C" {
21#endif
22
23// ARGBScale has a function to copy pixels to a row, striding each source
24// pixel by a constant.
fbarchard@google.com83a63e62013-02-27 00:20:29 +000025#if !defined(LIBYUV_DISABLE_X86) && (defined(_M_IX86) || \
fbarchard@google.comd51c3422012-06-26 23:46:25 +000026 defined(__x86_64__) || defined(__i386__))
27#define HAS_SCALEARGBROWDOWNEVEN_SSE2
28void ScaleARGBRowDownEven_SSE2(const uint8* src_ptr, int src_stride,
29 int src_stepx,
30 uint8* dst_ptr, int dst_width);
31#endif
fbarchard@google.com83a63e62013-02-27 00:20:29 +000032#if !defined(LIBYUV_DISABLE_NEON) && \
33 (defined(__ARM_NEON__) || defined(LIBYUV_NEON))
fbarchard@google.comcb5262d2012-11-16 01:41:35 +000034#define HAS_SCALEARGBROWDOWNEVEN_NEON
35void ScaleARGBRowDownEven_NEON(const uint8* src_ptr, int src_stride,
36 int src_stepx,
37 uint8* dst_ptr, int dst_width);
38#endif
39
fbarchard@google.comd51c3422012-06-26 23:46:25 +000040void ScaleARGBRowDownEven_C(const uint8* src_ptr, int,
41 int src_stepx,
42 uint8* dst_ptr, int dst_width);
43
44static void ARGBTranspose(const uint8* src, int src_stride,
45 uint8* dst, int dst_stride,
46 int width, int height) {
fbarchard@google.comcb5262d2012-11-16 01:41:35 +000047 int src_pixel_step = src_stride >> 2;
fbarchard@google.comd51c3422012-06-26 23:46:25 +000048 void (*ScaleARGBRowDownEven)(const uint8* src_ptr, int src_stride,
49 int src_step, uint8* dst_ptr, int dst_width) = ScaleARGBRowDownEven_C;
50#if defined(HAS_SCALEARGBROWDOWNEVEN_SSE2)
fbarchard@google.com3e464442012-11-14 02:03:49 +000051 if (TestCpuFlag(kCpuHasSSE2) && IS_ALIGNED(height, 4) && // Width of dest.
fbarchard@google.comd51c3422012-06-26 23:46:25 +000052 IS_ALIGNED(dst, 16) && IS_ALIGNED(dst_stride, 16)) {
53 ScaleARGBRowDownEven = ScaleARGBRowDownEven_SSE2;
54 }
fbarchard@google.comcb5262d2012-11-16 01:41:35 +000055#elif defined(HAS_SCALEARGBROWDOWNEVEN_NEON)
56 if (TestCpuFlag(kCpuHasNEON) && IS_ALIGNED(height, 4) && // Width of dest.
57 IS_ALIGNED(src, 4)) {
58 ScaleARGBRowDownEven = ScaleARGBRowDownEven_NEON;
59 }
fbarchard@google.comd51c3422012-06-26 23:46:25 +000060#endif
61
fbarchard@google.comd51c3422012-06-26 23:46:25 +000062 for (int i = 0; i < width; ++i) { // column of source to row of dest.
63 ScaleARGBRowDownEven(src, 0, src_pixel_step, dst, height);
64 dst += dst_stride;
65 src += 4;
66 }
67}
68
69void ARGBRotate90(const uint8* src, int src_stride,
70 uint8* dst, int dst_stride,
71 int width, int height) {
72 // Rotate by 90 is a ARGBTranspose with the source read
fbarchard@google.com64ce0ab2012-10-09 00:05:29 +000073 // from bottom to top. So set the source pointer to the end
fbarchard@google.comd51c3422012-06-26 23:46:25 +000074 // of the buffer and flip the sign of the source stride.
75 src += src_stride * (height - 1);
76 src_stride = -src_stride;
77 ARGBTranspose(src, src_stride, dst, dst_stride, width, height);
78}
79
80void ARGBRotate270(const uint8* src, int src_stride,
81 uint8* dst, int dst_stride,
82 int width, int height) {
83 // Rotate by 270 is a ARGBTranspose with the destination written
fbarchard@google.com64ce0ab2012-10-09 00:05:29 +000084 // from bottom to top. So set the destination pointer to the end
fbarchard@google.comd51c3422012-06-26 23:46:25 +000085 // of the buffer and flip the sign of the destination stride.
86 dst += dst_stride * (width - 1);
87 dst_stride = -dst_stride;
88 ARGBTranspose(src, src_stride, dst, dst_stride, width, height);
89}
90
91void ARGBRotate180(const uint8* src, int src_stride,
92 uint8* dst, int dst_stride,
93 int width, int height) {
94 void (*ARGBMirrorRow)(const uint8* src, uint8* dst, int width) =
95 ARGBMirrorRow_C;
96#if defined(HAS_ARGBMIRRORROW_SSSE3)
97 if (TestCpuFlag(kCpuHasSSSE3) && IS_ALIGNED(width, 4) &&
98 IS_ALIGNED(src, 16) && IS_ALIGNED(src_stride, 16) &&
99 IS_ALIGNED(dst, 16) && IS_ALIGNED(dst_stride, 16)) {
100 ARGBMirrorRow = ARGBMirrorRow_SSSE3;
101 }
fbarchard@google.com3e464442012-11-14 02:03:49 +0000102#elif defined(HAS_ARGBMIRRORROW_NEON)
103 if (TestCpuFlag(kCpuHasNEON) && IS_ALIGNED(width, 4)) {
104 ARGBMirrorRow = ARGBMirrorRow_NEON;
105 }
fbarchard@google.comd51c3422012-06-26 23:46:25 +0000106#endif
107 void (*CopyRow)(const uint8* src, uint8* dst, int width) = CopyRow_C;
108#if defined(HAS_COPYROW_NEON)
fbarchard@google.com62a961b2012-10-22 17:24:50 +0000109 if (TestCpuFlag(kCpuHasNEON) && IS_ALIGNED(width * 4, 32)) {
fbarchard@google.comd51c3422012-06-26 23:46:25 +0000110 CopyRow = CopyRow_NEON;
111 }
112#endif
113#if defined(HAS_COPYROW_X86)
114 if (TestCpuFlag(kCpuHasX86)) {
115 CopyRow = CopyRow_X86;
116 }
117#endif
118#if defined(HAS_COPYROW_SSE2)
119 if (TestCpuFlag(kCpuHasSSE2) && IS_ALIGNED(width * 4, 32) &&
120 IS_ALIGNED(src, 16) && IS_ALIGNED(src_stride, 16) &&
121 IS_ALIGNED(dst, 16) && IS_ALIGNED(dst_stride, 16)) {
122 CopyRow = CopyRow_SSE2;
123 }
124#endif
fbarchard@google.com92352b72013-01-28 19:43:29 +0000125#if defined(HAS_COPYROW_MIPS)
126 if (TestCpuFlag(kCpuHasMIPS)) {
127 CopyRow = CopyRow_MIPS;
128 }
129#endif
fbarchard@google.comd51c3422012-06-26 23:46:25 +0000130 if (width * 4 > kMaxStride) {
131 return;
132 }
fbarchard@google.com64ce0ab2012-10-09 00:05:29 +0000133 // Swap first and last row and mirror the content. Uses a temporary row.
fbarchard@google.comd51c3422012-06-26 23:46:25 +0000134 SIMD_ALIGNED(uint8 row[kMaxStride]);
135 const uint8* src_bot = src + src_stride * (height - 1);
136 uint8* dst_bot = dst + dst_stride * (height - 1);
137 int half_height = (height + 1) >> 1;
138 // Odd height will harmlessly mirror the middle row twice.
139 for (int y = 0; y < half_height; ++y) {
140 ARGBMirrorRow(src, row, width); // Mirror first row into a buffer
141 src += src_stride;
142 ARGBMirrorRow(src_bot, dst, width); // Mirror last row into first row
143 dst += dst_stride;
144 CopyRow(row, dst_bot, width * 4); // Copy first mirrored row into last
145 src_bot -= src_stride;
146 dst_bot -= dst_stride;
147 }
148}
149
fbarchard@google.comfc7314e2012-09-27 02:17:51 +0000150LIBYUV_API
fbarchard@google.comd51c3422012-06-26 23:46:25 +0000151int ARGBRotate(const uint8* src_argb, int src_stride_argb,
152 uint8* dst_argb, int dst_stride_argb,
153 int width, int height,
154 RotationMode mode) {
155 if (!src_argb || width <= 0 || height == 0 || !dst_argb) {
156 return -1;
157 }
158
159 // Negative height means invert the image.
160 if (height < 0) {
161 height = -height;
162 src_argb = src_argb + (height - 1) * src_stride_argb;
163 src_stride_argb = -src_stride_argb;
164 }
165
166 switch (mode) {
167 case kRotate0:
168 // copy frame
169 return ARGBCopy(src_argb, src_stride_argb,
170 dst_argb, dst_stride_argb,
171 width, height);
172 case kRotate90:
173 ARGBRotate90(src_argb, src_stride_argb,
174 dst_argb, dst_stride_argb,
175 width, height);
176 return 0;
177 case kRotate270:
178 ARGBRotate270(src_argb, src_stride_argb,
179 dst_argb, dst_stride_argb,
180 width, height);
181 return 0;
182 case kRotate180:
183 ARGBRotate180(src_argb, src_stride_argb,
184 dst_argb, dst_stride_argb,
185 width, height);
186 return 0;
187 default:
188 break;
189 }
190 return -1;
191}
192
193#ifdef __cplusplus
194} // extern "C"
195} // namespace libyuv
196#endif