blob: 852129eed34099a26c41ff38e1c7d01045b7b77e [file] [log] [blame]
J. Duke319a3b92007-12-01 00:00:00 +00001/*
2 * Copyright 2003 Sun Microsystems, Inc. All Rights Reserved.
3 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
4 *
5 * This code is free software; you can redistribute it and/or modify it
6 * under the terms of the GNU General Public License version 2 only, as
7 * published by the Free Software Foundation. Sun designates this
8 * particular file as subject to the "Classpath" exception as provided
9 * by Sun in the LICENSE file that accompanied this code.
10 *
11 * This code is distributed in the hope that it will be useful, but WITHOUT
12 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
13 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
14 * version 2 for more details (a copy is included in the LICENSE file that
15 * accompanied this code).
16 *
17 * You should have received a copy of the GNU General Public License version
18 * 2 along with this work; if not, write to the Free Software Foundation,
19 * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
20 *
21 * Please contact Sun Microsystems, Inc., 4150 Network Circle, Santa Clara,
22 * CA 95054 USA or visit www.sun.com if you need additional information or
23 * have any questions.
24 */
25
26
27/*
28 * FUNCTION
29 * Image affine transformation with Bicubic filtering
30 * SYNOPSIS
31 * mlib_status mlib_ImageAffine_[s32|f32|d64]_?ch_bc
32 * (mlib_s32 *leftEdges,
33 * mlib_s32 *rightEdges,
34 * mlib_s32 *xStarts,
35 * mlib_s32 *yStarts,
36 * mlib_s32 *sides,
37 * mlib_u8 *dstData,
38 * mlib_u8 **lineAddr,
39 * mlib_s32 dstYStride,
40 * mlib_s32 is_affine,
41 * mlib_s32 srcYStride,
42 * mlib_filter filter)
43 *
44 * ARGUMENTS
45 * leftEdges array[dstHeight] of xLeft coordinates
46 * RightEdges array[dstHeight] of xRight coordinates
47 * xStarts array[dstHeight] of xStart * 65536 coordinates
48 * yStarts array[dstHeight] of yStart * 65536 coordinates
49 * sides output array[4]. sides[0] is yStart, sides[1] is yFinish,
50 * sides[2] is dx * 65536, sides[3] is dy * 65536
51 * dstData pointer to the first pixel on (yStart - 1) line
52 * lineAddr array[srcHeight] of pointers to the first pixel on
53 * the corresponding lines
54 * dstYStride stride of destination image
55 * is_affine indicator (Affine - GridWarp)
56 * srcYStride stride of source image
57 * filter type of resampling filter
58 *
59 * DESCRIPTION
60 * The functions step along the lines from xLeft to xRight and apply
61 * the Bicubic and Bicubic2 filtering.
62 *
63 */
64
65#include "mlib_ImageAffine.h"
66
67#define IMG_TYPE 3
68
69/***************************************************************/
70#if IMG_TYPE == 3
71
72#define DTYPE mlib_s32
73#define FTYPE mlib_d64
74
75#define FUN_NAME(CHAN) mlib_ImageAffine_s32_##CHAN##_bc
76
77#define STORE(res, x) SAT32(res)
78
79#elif IMG_TYPE == 4
80
81#define DTYPE mlib_f32
82#define FTYPE DTYPE
83
84#define FUN_NAME(CHAN) mlib_ImageAffine_f32_##CHAN##_bc
85
86#define STORE(res, x) res = (x)
87
88#elif IMG_TYPE == 5
89
90#define DTYPE mlib_d64
91#define FTYPE DTYPE
92
93#define FUN_NAME(CHAN) mlib_ImageAffine_d64_##CHAN##_bc
94
95#define STORE(res, x) res = (x)
96
97#endif
98
99/***************************************************************/
100#define CREATE_COEF_BICUBIC( X, Y, OPERATOR ) \
101 dx = (X & MLIB_MASK) * scale; \
102 dy = (Y & MLIB_MASK) * scale; \
103 dx_2 = ((FTYPE)0.5) * dx; \
104 dy_2 = ((FTYPE)0.5) * dy; \
105 dx2 = dx * dx; dy2 = dy * dy; \
106 dx3_2 = dx_2 * dx2; dy3_2 = dy_2 * dy2; \
107 dx3_3 = ((FTYPE)3.0) * dx3_2; \
108 dy3_3 = ((FTYPE)3.0) * dy3_2; \
109 \
110 xf0 = dx2 - dx3_2 - dx_2; \
111 xf1 = dx3_3 - ((FTYPE)2.5) * dx2 + ((FTYPE)1.0); \
112 xf2 = ((FTYPE)2.0) * dx2 - dx3_3 + dx_2; \
113 xf3 = dx3_2 - ((FTYPE)0.5) * dx2; \
114 \
115 OPERATOR; \
116 \
117 yf0 = dy2 - dy3_2 - dy_2; \
118 yf1 = dy3_3 - ((FTYPE)2.5) * dy2 + ((FTYPE)1.0); \
119 yf2 = ((FTYPE)2.0) * dy2 - dy3_3 + dy_2; \
120 yf3 = dy3_2 - ((FTYPE)0.5) * dy2
121
122/***************************************************************/
123#define CREATE_COEF_BICUBIC_2( X, Y, OPERATOR ) \
124 dx = (X & MLIB_MASK) * scale; \
125 dy = (Y & MLIB_MASK) * scale; \
126 dx2 = dx * dx; dy2 = dy * dy; \
127 dx3_2 = dx * dx2; dy3_2 = dy * dy2; \
128 dx3_3 = ((FTYPE)2.0) * dx2; \
129 dy3_3 = ((FTYPE)2.0) * dy2; \
130 \
131 xf0 = dx3_3 - dx3_2 - dx; \
132 xf1 = dx3_2 - dx3_3 + ((FTYPE)1.0); \
133 xf2 = dx2 - dx3_2 + dx; \
134 xf3 = dx3_2 - dx2; \
135 \
136 OPERATOR; \
137 \
138 yf0 = dy3_3 - dy3_2 - dy; \
139 yf1 = dy3_2 - dy3_3 + ((FTYPE)1.0); \
140 yf2 = dy2 - dy3_2 + dy; \
141 yf3 = dy3_2 - dy2
142
143/***************************************************************/
144mlib_status FUN_NAME(1ch)(mlib_affine_param *param)
145{
146 DECLAREVAR_BC();
147 DTYPE *dstLineEnd;
148
149 for (j = yStart; j <= yFinish; j++) {
150 FTYPE xf0, xf1, xf2, xf3;
151 FTYPE yf0, yf1, yf2, yf3;
152 FTYPE dx, dx_2, dx2, dx3_2, dx3_3;
153 FTYPE dy, dy_2, dy2, dy3_2, dy3_3;
154 FTYPE c0, c1, c2, c3, val0;
155 FTYPE scale = 1 / 65536.f;
156 FTYPE s0, s1, s2, s3;
157 FTYPE s4, s5, s6, s7;
158
159 CLIP(1);
160 dstLineEnd = (DTYPE *) dstData + xRight;
161
162 if (filter == MLIB_BICUBIC) {
163 CREATE_COEF_BICUBIC(X, Y,;
164 );
165 }
166 else {
167 CREATE_COEF_BICUBIC_2(X, Y,;
168 );
169 }
170
171 xSrc = (X >> MLIB_SHIFT) - 1;
172 ySrc = (Y >> MLIB_SHIFT) - 1;
173
174 srcPixelPtr = ((DTYPE **) lineAddr)[ySrc] + xSrc;
175 s0 = srcPixelPtr[0];
176 s1 = srcPixelPtr[1];
177 s2 = srcPixelPtr[2];
178 s3 = srcPixelPtr[3];
179
180 srcPixelPtr = (DTYPE *) ((mlib_u8 *) srcPixelPtr + srcYStride);
181 s4 = srcPixelPtr[0];
182 s5 = srcPixelPtr[1];
183 s6 = srcPixelPtr[2];
184 s7 = srcPixelPtr[3];
185
186 if (filter == MLIB_BICUBIC) {
187 for (; dstPixelPtr <= (dstLineEnd - 1); dstPixelPtr++) {
188 X += dX;
189 Y += dY;
190
191 c0 = (s0 * xf0 + s1 * xf1 + s2 * xf2 + s3 * xf3);
192 c1 = (s4 * xf0 + s5 * xf1 + s6 * xf2 + s7 * xf3);
193 srcPixelPtr = (DTYPE *) ((mlib_u8 *) srcPixelPtr + srcYStride);
194 c2 = (srcPixelPtr[0] * xf0 + srcPixelPtr[1] * xf1 +
195 srcPixelPtr[2] * xf2 + srcPixelPtr[3] * xf3);
196 srcPixelPtr = (DTYPE *) ((mlib_u8 *) srcPixelPtr + srcYStride);
197 c3 = (srcPixelPtr[0] * xf0 + srcPixelPtr[1] * xf1 +
198 srcPixelPtr[2] * xf2 + srcPixelPtr[3] * xf3);
199
200 CREATE_COEF_BICUBIC(X, Y, val0 = (c0 * yf0 + c1 * yf1 + c2 * yf2 + c3 * yf3));
201
202 STORE(dstPixelPtr[0], val0);
203
204 xSrc = (X >> MLIB_SHIFT) - 1;
205 ySrc = (Y >> MLIB_SHIFT) - 1;
206
207 srcPixelPtr = ((DTYPE **) lineAddr)[ySrc] + xSrc;
208 s0 = srcPixelPtr[0];
209 s1 = srcPixelPtr[1];
210 s2 = srcPixelPtr[2];
211 s3 = srcPixelPtr[3];
212
213 srcPixelPtr = (DTYPE *) ((mlib_u8 *) srcPixelPtr + srcYStride);
214 s4 = srcPixelPtr[0];
215 s5 = srcPixelPtr[1];
216 s6 = srcPixelPtr[2];
217 s7 = srcPixelPtr[3];
218 }
219
220 }
221 else {
222 for (; dstPixelPtr <= (dstLineEnd - 1); dstPixelPtr++) {
223 X += dX;
224 Y += dY;
225
226 c0 = (s0 * xf0 + s1 * xf1 + s2 * xf2 + s3 * xf3);
227 c1 = (s4 * xf0 + s5 * xf1 + s6 * xf2 + s7 * xf3);
228 srcPixelPtr = (DTYPE *) ((mlib_u8 *) srcPixelPtr + srcYStride);
229 c2 = (srcPixelPtr[0] * xf0 + srcPixelPtr[1] * xf1 +
230 srcPixelPtr[2] * xf2 + srcPixelPtr[3] * xf3);
231 srcPixelPtr = (DTYPE *) ((mlib_u8 *) srcPixelPtr + srcYStride);
232 c3 = (srcPixelPtr[0] * xf0 + srcPixelPtr[1] * xf1 +
233 srcPixelPtr[2] * xf2 + srcPixelPtr[3] * xf3);
234
235 CREATE_COEF_BICUBIC_2(X, Y, val0 = (c0 * yf0 + c1 * yf1 + c2 * yf2 + c3 * yf3));
236
237 STORE(dstPixelPtr[0], val0);
238
239 xSrc = (X >> MLIB_SHIFT) - 1;
240 ySrc = (Y >> MLIB_SHIFT) - 1;
241
242 srcPixelPtr = ((DTYPE **) lineAddr)[ySrc] + xSrc;
243 s0 = srcPixelPtr[0];
244 s1 = srcPixelPtr[1];
245 s2 = srcPixelPtr[2];
246 s3 = srcPixelPtr[3];
247
248 srcPixelPtr = (DTYPE *) ((mlib_u8 *) srcPixelPtr + srcYStride);
249 s4 = srcPixelPtr[0];
250 s5 = srcPixelPtr[1];
251 s6 = srcPixelPtr[2];
252 s7 = srcPixelPtr[3];
253 }
254 }
255
256 c0 = (s0 * xf0 + s1 * xf1 + s2 * xf2 + s3 * xf3);
257 c1 = (s4 * xf0 + s5 * xf1 + s6 * xf2 + s7 * xf3);
258 srcPixelPtr = (DTYPE *) ((mlib_u8 *) srcPixelPtr + srcYStride);
259 c2 = (srcPixelPtr[0] * xf0 + srcPixelPtr[1] * xf1 +
260 srcPixelPtr[2] * xf2 + srcPixelPtr[3] * xf3);
261 srcPixelPtr = (DTYPE *) ((mlib_u8 *) srcPixelPtr + srcYStride);
262 c3 = (srcPixelPtr[0] * xf0 + srcPixelPtr[1] * xf1 +
263 srcPixelPtr[2] * xf2 + srcPixelPtr[3] * xf3);
264
265 val0 = (c0 * yf0 + c1 * yf1 + c2 * yf2 + c3 * yf3);
266 STORE(dstPixelPtr[0], val0);
267 }
268
269 return MLIB_SUCCESS;
270}
271
272/***************************************************************/
273mlib_status FUN_NAME(2ch)(mlib_affine_param *param)
274{
275 DECLAREVAR_BC();
276 DTYPE *dstLineEnd;
277
278 for (j = yStart; j <= yFinish; j++) {
279 FTYPE xf0, xf1, xf2, xf3;
280 FTYPE yf0, yf1, yf2, yf3;
281 FTYPE dx, dx_2, dx2, dx3_2, dx3_3;
282 FTYPE dy, dy_2, dy2, dy3_2, dy3_3;
283 FTYPE c0, c1, c2, c3, val0;
284 FTYPE scale = 1 / 65536.f;
285 FTYPE s0, s1, s2, s3;
286 FTYPE s4, s5, s6, s7;
287 mlib_s32 k;
288
289 CLIP(2);
290 dstLineEnd = (DTYPE *) dstData + 2 * xRight;
291
292 for (k = 0; k < 2; k++) {
293 mlib_s32 X1 = X;
294 mlib_s32 Y1 = Y;
295 DTYPE *dPtr = dstPixelPtr + k;
296
297 if (filter == MLIB_BICUBIC) {
298 CREATE_COEF_BICUBIC(X1, Y1,;
299 );
300 }
301 else {
302 CREATE_COEF_BICUBIC_2(X1, Y1,;
303 );
304 }
305
306 xSrc = (X1 >> MLIB_SHIFT) - 1;
307 ySrc = (Y1 >> MLIB_SHIFT) - 1;
308
309 srcPixelPtr = ((DTYPE **) lineAddr)[ySrc] + 2 * xSrc + k;
310 s0 = srcPixelPtr[0];
311 s1 = srcPixelPtr[2];
312 s2 = srcPixelPtr[4];
313 s3 = srcPixelPtr[6];
314
315 srcPixelPtr = (DTYPE *) ((mlib_u8 *) srcPixelPtr + srcYStride);
316 s4 = srcPixelPtr[0];
317 s5 = srcPixelPtr[2];
318 s6 = srcPixelPtr[4];
319 s7 = srcPixelPtr[6];
320
321 if (filter == MLIB_BICUBIC) {
322 for (; dPtr <= (dstLineEnd - 1); dPtr += 2) {
323 X1 += dX;
324 Y1 += dY;
325
326 c0 = (s0 * xf0 + s1 * xf1 + s2 * xf2 + s3 * xf3);
327 c1 = (s4 * xf0 + s5 * xf1 + s6 * xf2 + s7 * xf3);
328 srcPixelPtr = (DTYPE *) ((mlib_u8 *) srcPixelPtr + srcYStride);
329 c2 = (srcPixelPtr[0] * xf0 + srcPixelPtr[2] * xf1 +
330 srcPixelPtr[4] * xf2 + srcPixelPtr[6] * xf3);
331 srcPixelPtr = (DTYPE *) ((mlib_u8 *) srcPixelPtr + srcYStride);
332 c3 = (srcPixelPtr[0] * xf0 + srcPixelPtr[2] * xf1 +
333 srcPixelPtr[4] * xf2 + srcPixelPtr[6] * xf3);
334
335 CREATE_COEF_BICUBIC(X1, Y1, val0 = (c0 * yf0 + c1 * yf1 + c2 * yf2 + c3 * yf3));
336
337 STORE(dPtr[0], val0);
338
339 xSrc = (X1 >> MLIB_SHIFT) - 1;
340 ySrc = (Y1 >> MLIB_SHIFT) - 1;
341
342 srcPixelPtr = ((DTYPE **) lineAddr)[ySrc] + 2 * xSrc + k;
343 s0 = srcPixelPtr[0];
344 s1 = srcPixelPtr[2];
345 s2 = srcPixelPtr[4];
346 s3 = srcPixelPtr[6];
347
348 srcPixelPtr = (DTYPE *) ((mlib_u8 *) srcPixelPtr + srcYStride);
349 s4 = srcPixelPtr[0];
350 s5 = srcPixelPtr[2];
351 s6 = srcPixelPtr[4];
352 s7 = srcPixelPtr[6];
353 }
354
355 }
356 else {
357 for (; dPtr <= (dstLineEnd - 1); dPtr += 2) {
358 X1 += dX;
359 Y1 += dY;
360
361 c0 = (s0 * xf0 + s1 * xf1 + s2 * xf2 + s3 * xf3);
362 c1 = (s4 * xf0 + s5 * xf1 + s6 * xf2 + s7 * xf3);
363 srcPixelPtr = (DTYPE *) ((mlib_u8 *) srcPixelPtr + srcYStride);
364 c2 = (srcPixelPtr[0] * xf0 + srcPixelPtr[2] * xf1 +
365 srcPixelPtr[4] * xf2 + srcPixelPtr[6] * xf3);
366 srcPixelPtr = (DTYPE *) ((mlib_u8 *) srcPixelPtr + srcYStride);
367 c3 = (srcPixelPtr[0] * xf0 + srcPixelPtr[2] * xf1 +
368 srcPixelPtr[4] * xf2 + srcPixelPtr[6] * xf3);
369
370 CREATE_COEF_BICUBIC_2(X1, Y1, val0 =
371 (c0 * yf0 + c1 * yf1 + c2 * yf2 + c3 * yf3));
372
373 STORE(dPtr[0], val0);
374
375 xSrc = (X1 >> MLIB_SHIFT) - 1;
376 ySrc = (Y1 >> MLIB_SHIFT) - 1;
377
378 srcPixelPtr = ((DTYPE **) lineAddr)[ySrc] + 2 * xSrc + k;
379 s0 = srcPixelPtr[0];
380 s1 = srcPixelPtr[2];
381 s2 = srcPixelPtr[4];
382 s3 = srcPixelPtr[6];
383
384 srcPixelPtr = (DTYPE *) ((mlib_u8 *) srcPixelPtr + srcYStride);
385 s4 = srcPixelPtr[0];
386 s5 = srcPixelPtr[2];
387 s6 = srcPixelPtr[4];
388 s7 = srcPixelPtr[6];
389 }
390 }
391
392 c0 = (s0 * xf0 + s1 * xf1 + s2 * xf2 + s3 * xf3);
393 c1 = (s4 * xf0 + s5 * xf1 + s6 * xf2 + s7 * xf3);
394 srcPixelPtr = (DTYPE *) ((mlib_u8 *) srcPixelPtr + srcYStride);
395 c2 = (srcPixelPtr[0] * xf0 + srcPixelPtr[2] * xf1 +
396 srcPixelPtr[4] * xf2 + srcPixelPtr[6] * xf3);
397 srcPixelPtr = (DTYPE *) ((mlib_u8 *) srcPixelPtr + srcYStride);
398 c3 = (srcPixelPtr[0] * xf0 + srcPixelPtr[2] * xf1 +
399 srcPixelPtr[4] * xf2 + srcPixelPtr[6] * xf3);
400
401 val0 = (c0 * yf0 + c1 * yf1 + c2 * yf2 + c3 * yf3);
402 STORE(dPtr[0], val0);
403 }
404 }
405
406 return MLIB_SUCCESS;
407}
408
409/***************************************************************/
410mlib_status FUN_NAME(3ch)(mlib_affine_param *param)
411{
412 DECLAREVAR_BC();
413 DTYPE *dstLineEnd;
414
415 for (j = yStart; j <= yFinish; j++) {
416 FTYPE xf0, xf1, xf2, xf3;
417 FTYPE yf0, yf1, yf2, yf3;
418 FTYPE dx, dx_2, dx2, dx3_2, dx3_3;
419 FTYPE dy, dy_2, dy2, dy3_2, dy3_3;
420 FTYPE c0, c1, c2, c3, val0;
421 FTYPE scale = 1 / 65536.f;
422 FTYPE s0, s1, s2, s3;
423 FTYPE s4, s5, s6, s7;
424 mlib_s32 k;
425
426 CLIP(3);
427 dstLineEnd = (DTYPE *) dstData + 3 * xRight;
428
429 for (k = 0; k < 3; k++) {
430 mlib_s32 X1 = X;
431 mlib_s32 Y1 = Y;
432 DTYPE *dPtr = dstPixelPtr + k;
433
434 if (filter == MLIB_BICUBIC) {
435 CREATE_COEF_BICUBIC(X1, Y1,;
436 );
437 }
438 else {
439 CREATE_COEF_BICUBIC_2(X1, Y1,;
440 );
441 }
442
443 xSrc = (X1 >> MLIB_SHIFT) - 1;
444 ySrc = (Y1 >> MLIB_SHIFT) - 1;
445
446 srcPixelPtr = ((DTYPE **) lineAddr)[ySrc] + 3 * xSrc + k;
447 s0 = srcPixelPtr[0];
448 s1 = srcPixelPtr[3];
449 s2 = srcPixelPtr[6];
450 s3 = srcPixelPtr[9];
451
452 srcPixelPtr = (DTYPE *) ((mlib_u8 *) srcPixelPtr + srcYStride);
453 s4 = srcPixelPtr[0];
454 s5 = srcPixelPtr[3];
455 s6 = srcPixelPtr[6];
456 s7 = srcPixelPtr[9];
457
458 if (filter == MLIB_BICUBIC) {
459 for (; dPtr <= (dstLineEnd - 1); dPtr += 3) {
460 X1 += dX;
461 Y1 += dY;
462
463 c0 = (s0 * xf0 + s1 * xf1 + s2 * xf2 + s3 * xf3);
464 c1 = (s4 * xf0 + s5 * xf1 + s6 * xf2 + s7 * xf3);
465 srcPixelPtr = (DTYPE *) ((mlib_u8 *) srcPixelPtr + srcYStride);
466 c2 = (srcPixelPtr[0] * xf0 + srcPixelPtr[3] * xf1 +
467 srcPixelPtr[6] * xf2 + srcPixelPtr[9] * xf3);
468 srcPixelPtr = (DTYPE *) ((mlib_u8 *) srcPixelPtr + srcYStride);
469 c3 = (srcPixelPtr[0] * xf0 + srcPixelPtr[3] * xf1 +
470 srcPixelPtr[6] * xf2 + srcPixelPtr[9] * xf3);
471
472 CREATE_COEF_BICUBIC(X1, Y1, val0 = (c0 * yf0 + c1 * yf1 + c2 * yf2 + c3 * yf3));
473
474 STORE(dPtr[0], val0);
475
476 xSrc = (X1 >> MLIB_SHIFT) - 1;
477 ySrc = (Y1 >> MLIB_SHIFT) - 1;
478
479 srcPixelPtr = ((DTYPE **) lineAddr)[ySrc] + 3 * xSrc + k;
480 s0 = srcPixelPtr[0];
481 s1 = srcPixelPtr[3];
482 s2 = srcPixelPtr[6];
483 s3 = srcPixelPtr[9];
484
485 srcPixelPtr = (DTYPE *) ((mlib_u8 *) srcPixelPtr + srcYStride);
486 s4 = srcPixelPtr[0];
487 s5 = srcPixelPtr[3];
488 s6 = srcPixelPtr[6];
489 s7 = srcPixelPtr[9];
490 }
491
492 }
493 else {
494 for (; dPtr <= (dstLineEnd - 1); dPtr += 3) {
495 X1 += dX;
496 Y1 += dY;
497
498 c0 = (s0 * xf0 + s1 * xf1 + s2 * xf2 + s3 * xf3);
499 c1 = (s4 * xf0 + s5 * xf1 + s6 * xf2 + s7 * xf3);
500 srcPixelPtr = (DTYPE *) ((mlib_u8 *) srcPixelPtr + srcYStride);
501 c2 = (srcPixelPtr[0] * xf0 + srcPixelPtr[3] * xf1 +
502 srcPixelPtr[6] * xf2 + srcPixelPtr[9] * xf3);
503 srcPixelPtr = (DTYPE *) ((mlib_u8 *) srcPixelPtr + srcYStride);
504 c3 = (srcPixelPtr[0] * xf0 + srcPixelPtr[3] * xf1 +
505 srcPixelPtr[6] * xf2 + srcPixelPtr[9] * xf3);
506
507 CREATE_COEF_BICUBIC_2(X1, Y1, val0 =
508 (c0 * yf0 + c1 * yf1 + c2 * yf2 + c3 * yf3));
509
510 STORE(dPtr[0], val0);
511
512 xSrc = (X1 >> MLIB_SHIFT) - 1;
513 ySrc = (Y1 >> MLIB_SHIFT) - 1;
514
515 srcPixelPtr = ((DTYPE **) lineAddr)[ySrc] + 3 * xSrc + k;
516 s0 = srcPixelPtr[0];
517 s1 = srcPixelPtr[3];
518 s2 = srcPixelPtr[6];
519 s3 = srcPixelPtr[9];
520
521 srcPixelPtr = (DTYPE *) ((mlib_u8 *) srcPixelPtr + srcYStride);
522 s4 = srcPixelPtr[0];
523 s5 = srcPixelPtr[3];
524 s6 = srcPixelPtr[6];
525 s7 = srcPixelPtr[9];
526 }
527 }
528
529 c0 = (s0 * xf0 + s1 * xf1 + s2 * xf2 + s3 * xf3);
530 c1 = (s4 * xf0 + s5 * xf1 + s6 * xf2 + s7 * xf3);
531 srcPixelPtr = (DTYPE *) ((mlib_u8 *) srcPixelPtr + srcYStride);
532 c2 = (srcPixelPtr[0] * xf0 + srcPixelPtr[3] * xf1 +
533 srcPixelPtr[6] * xf2 + srcPixelPtr[9] * xf3);
534 srcPixelPtr = (DTYPE *) ((mlib_u8 *) srcPixelPtr + srcYStride);
535 c3 = (srcPixelPtr[0] * xf0 + srcPixelPtr[3] * xf1 +
536 srcPixelPtr[6] * xf2 + srcPixelPtr[9] * xf3);
537
538 val0 = (c0 * yf0 + c1 * yf1 + c2 * yf2 + c3 * yf3);
539 STORE(dPtr[0], val0);
540 }
541 }
542
543 return MLIB_SUCCESS;
544}
545
546/***************************************************************/
547mlib_status FUN_NAME(4ch)(mlib_affine_param *param)
548{
549 DECLAREVAR_BC();
550 DTYPE *dstLineEnd;
551
552 for (j = yStart; j <= yFinish; j++) {
553 FTYPE xf0, xf1, xf2, xf3;
554 FTYPE yf0, yf1, yf2, yf3;
555 FTYPE dx, dx_2, dx2, dx3_2, dx3_3;
556 FTYPE dy, dy_2, dy2, dy3_2, dy3_3;
557 FTYPE c0, c1, c2, c3, val0;
558 FTYPE scale = 1 / 65536.f;
559 FTYPE s0, s1, s2, s3;
560 FTYPE s4, s5, s6, s7;
561 mlib_s32 k;
562
563 CLIP(4);
564 dstLineEnd = (DTYPE *) dstData + 4 * xRight;
565
566 for (k = 0; k < 4; k++) {
567 mlib_s32 X1 = X;
568 mlib_s32 Y1 = Y;
569 DTYPE *dPtr = dstPixelPtr + k;
570
571 if (filter == MLIB_BICUBIC) {
572 CREATE_COEF_BICUBIC(X1, Y1,;
573 );
574 }
575 else {
576 CREATE_COEF_BICUBIC_2(X1, Y1,;
577 );
578 }
579
580 xSrc = (X1 >> MLIB_SHIFT) - 1;
581 ySrc = (Y1 >> MLIB_SHIFT) - 1;
582
583 srcPixelPtr = ((DTYPE **) lineAddr)[ySrc] + 4 * xSrc + k;
584 s0 = srcPixelPtr[0];
585 s1 = srcPixelPtr[4];
586 s2 = srcPixelPtr[8];
587 s3 = srcPixelPtr[12];
588
589 srcPixelPtr = (DTYPE *) ((mlib_u8 *) srcPixelPtr + srcYStride);
590 s4 = srcPixelPtr[0];
591 s5 = srcPixelPtr[4];
592 s6 = srcPixelPtr[8];
593 s7 = srcPixelPtr[12];
594
595 if (filter == MLIB_BICUBIC) {
596 for (; dPtr <= (dstLineEnd - 1); dPtr += 4) {
597
598 X1 += dX;
599 Y1 += dY;
600
601 c0 = (s0 * xf0 + s1 * xf1 + s2 * xf2 + s3 * xf3);
602 c1 = (s4 * xf0 + s5 * xf1 + s6 * xf2 + s7 * xf3);
603 srcPixelPtr = (DTYPE *) ((mlib_u8 *) srcPixelPtr + srcYStride);
604 c2 = (srcPixelPtr[0] * xf0 + srcPixelPtr[4] * xf1 +
605 srcPixelPtr[8] * xf2 + srcPixelPtr[12] * xf3);
606 srcPixelPtr = (DTYPE *) ((mlib_u8 *) srcPixelPtr + srcYStride);
607 c3 = (srcPixelPtr[0] * xf0 + srcPixelPtr[4] * xf1 +
608 srcPixelPtr[8] * xf2 + srcPixelPtr[12] * xf3);
609
610 CREATE_COEF_BICUBIC(X1, Y1, val0 = (c0 * yf0 + c1 * yf1 + c2 * yf2 + c3 * yf3));
611
612 STORE(dPtr[0], val0);
613
614 xSrc = (X1 >> MLIB_SHIFT) - 1;
615 ySrc = (Y1 >> MLIB_SHIFT) - 1;
616
617 srcPixelPtr = ((DTYPE **) lineAddr)[ySrc] + 4 * xSrc + k;
618 s0 = srcPixelPtr[0];
619 s1 = srcPixelPtr[4];
620 s2 = srcPixelPtr[8];
621 s3 = srcPixelPtr[12];
622
623 srcPixelPtr = (DTYPE *) ((mlib_u8 *) srcPixelPtr + srcYStride);
624 s4 = srcPixelPtr[0];
625 s5 = srcPixelPtr[4];
626 s6 = srcPixelPtr[8];
627 s7 = srcPixelPtr[12];
628 }
629
630 }
631 else {
632 for (; dPtr <= (dstLineEnd - 1); dPtr += 4) {
633
634 X1 += dX;
635 Y1 += dY;
636
637 c0 = (s0 * xf0 + s1 * xf1 + s2 * xf2 + s3 * xf3);
638 c1 = (s4 * xf0 + s5 * xf1 + s6 * xf2 + s7 * xf3);
639 srcPixelPtr = (DTYPE *) ((mlib_u8 *) srcPixelPtr + srcYStride);
640 c2 = (srcPixelPtr[0] * xf0 + srcPixelPtr[4] * xf1 +
641 srcPixelPtr[8] * xf2 + srcPixelPtr[12] * xf3);
642 srcPixelPtr = (DTYPE *) ((mlib_u8 *) srcPixelPtr + srcYStride);
643 c3 = (srcPixelPtr[0] * xf0 + srcPixelPtr[4] * xf1 +
644 srcPixelPtr[8] * xf2 + srcPixelPtr[12] * xf3);
645
646 CREATE_COEF_BICUBIC_2(X1, Y1, val0 = (c0 * yf0 + c1 * yf1 + c2 * yf2 + c3 * yf3));
647
648 STORE(dPtr[0], val0);
649
650 xSrc = (X1 >> MLIB_SHIFT) - 1;
651 ySrc = (Y1 >> MLIB_SHIFT) - 1;
652
653 srcPixelPtr = ((DTYPE **) lineAddr)[ySrc] + 4 * xSrc + k;
654 s0 = srcPixelPtr[0];
655 s1 = srcPixelPtr[4];
656 s2 = srcPixelPtr[8];
657 s3 = srcPixelPtr[12];
658
659 srcPixelPtr = (DTYPE *) ((mlib_u8 *) srcPixelPtr + srcYStride);
660 s4 = srcPixelPtr[0];
661 s5 = srcPixelPtr[4];
662 s6 = srcPixelPtr[8];
663 s7 = srcPixelPtr[12];
664 }
665 }
666
667 c0 = (s0 * xf0 + s1 * xf1 + s2 * xf2 + s3 * xf3);
668 c1 = (s4 * xf0 + s5 * xf1 + s6 * xf2 + s7 * xf3);
669 srcPixelPtr = (DTYPE *) ((mlib_u8 *) srcPixelPtr + srcYStride);
670 c2 = (srcPixelPtr[0] * xf0 + srcPixelPtr[4] * xf1 +
671 srcPixelPtr[8] * xf2 + srcPixelPtr[12] * xf3);
672 srcPixelPtr = (DTYPE *) ((mlib_u8 *) srcPixelPtr + srcYStride);
673 c3 = (srcPixelPtr[0] * xf0 + srcPixelPtr[4] * xf1 +
674 srcPixelPtr[8] * xf2 + srcPixelPtr[12] * xf3);
675
676 val0 = (c0 * yf0 + c1 * yf1 + c2 * yf2 + c3 * yf3);
677 STORE(dPtr[0], val0);
678 }
679 }
680
681 return MLIB_SUCCESS;
682}
683
684/***************************************************************/