1 /*
   2  * Copyright (c) 2003, Oracle and/or its affiliates. All rights reserved.
   3  * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
   4  *
   5  * This code is free software; you can redistribute it and/or modify it
   6  * under the terms of the GNU General Public License version 2 only, as
   7  * published by the Free Software Foundation.  Oracle designates this
   8  * particular file as subject to the "Classpath" exception as provided
   9  * by Oracle in the LICENSE file that accompanied this code.
  10  *
  11  * This code is distributed in the hope that it will be useful, but WITHOUT
  12  * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
  13  * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
  14  * version 2 for more details (a copy is included in the LICENSE file that
  15  * accompanied this code).
  16  *
  17  * You should have received a copy of the GNU General Public License version
  18  * 2 along with this work; if not, write to the Free Software Foundation,
  19  * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
  20  *
  21  * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
  22  * or visit www.oracle.com if you need additional information or have any
  23  * questions.
  24  */
  25 
  26 
  27 /*
  28  * FUNCTION
  29  *      mlib_ImageAffine_u16_1ch_bl
  30  *      mlib_ImageAffine_u16_2ch_bl
  31  *      mlib_ImageAffine_u16_3ch_bl
  32  *      mlib_ImageAffine_u16_4ch_bl
  33  *        - image affine transformation with Bilinear filtering
  34  * SYNOPSIS
  35  *      mlib_status mlib_ImageAffine_u16_?ch_bl(mlib_s32 *leftEdges,
  36  *                                              mlib_s32 *rightEdges,
  37  *                                              mlib_s32 *xStarts,
  38  *                                              mlib_s32 *yStarts,
  39  *                                              mlib_s32 *sides,
  40  *                                              mlib_u8  *dstData,
  41  *                                              mlib_u8  **lineAddr,
  42  *                                              mlib_s32 dstYStride,
  43  *                                              mlib_s32 is_affine,
  44  *                                              mlib_s32 srcYStride)
  45  *
  46  * ARGUMENTS
  47  *      leftEdges  array[dstHeight] of xLeft coordinates
  48  *      rightEdges array[dstHeight] of xRight coordinates
  49  *      xStarts    array[dstHeight] of xStart * 65536 coordinates
  50  *      yStarts    array[dstHeight] of yStart * 65536 coordinates
  51  *      sides      output array[4]. sides[0] is yStart, sides[1] is yFinish,
  52  *                 sides[2] is dx * 65536, sides[3] is dy * 65536
  53  *      dstData    pointer to the first pixel on (yStart - 1) line
  54  *      lineAddr   array[srcHeight] of pointers to the first pixel on
  55  *                 the corresponding lines
  56  *      dstYStride stride of destination image
  57  *      is_affine  indicator (Affine - GridWarp)
  58  *      srcYStride stride of source image
  59  *
  60  * DESCRIPTION
  61  *      The functions step along the lines from xLeft to xRight and apply
  62  *      the bilinear filtering.
  63  *
  64  */
  65 
  66 #include "mlib_ImageAffine.h"
  67 
  68 /***************************************************************/
  69 #define DTYPE  mlib_u16
  70 #define FTYPE  mlib_d64
  71 
  72 /***************************************************************/
  73 #define TTYPE    mlib_s32
  74 #define I2F(x)   (x)
  75 #define ROUND(x) (x)
  76 
  77 #define FUN_NAME(CHAN) mlib_ImageAffine_u16_##CHAN##_bl
  78 
  79 /***************************************************************/
  80 #ifdef __sparc /* for SPARC, using floating-point multiplies is faster */
  81 
  82 /***************************************************************/
  83 #define GET_POINTERS(ind)                                       \
  84   fdx = (FTYPE)(X & MLIB_MASK) * scale;                         \
  85   fdy = (FTYPE)(Y & MLIB_MASK) * scale;                         \
  86   ySrc = MLIB_POINTER_SHIFT(Y);  Y += dY;                       \
  87   xSrc = X >> MLIB_SHIFT;  X += dX;                             \
  88   srcPixelPtr = MLIB_POINTER_GET(lineAddr, ySrc) + ind * xSrc;  \
  89   srcPixelPtr2 = (DTYPE *)((mlib_u8 *)srcPixelPtr + srcYStride)
  90 
  91 /***************************************************************/
  92 #define COUNT(ind)                                              \
  93   pix0_##ind = a00_##ind + fdy * (a10_##ind - a00_##ind);       \
  94   pix1_##ind = a01_##ind + fdy * (a11_##ind - a01_##ind);       \
  95   res##ind = ROUND(pix0_##ind + fdx * (pix1_##ind - pix0_##ind))
  96 
  97 /***************************************************************/
  98 #define LOAD(ind, ind1, ind2)                                   \
  99   a00_##ind = I2F(srcPixelPtr[ind1]);                           \
 100   a01_##ind = I2F(srcPixelPtr[ind2]);                           \
 101   a10_##ind = I2F(srcPixelPtr2[ind1]);                          \
 102   a11_##ind = I2F(srcPixelPtr2[ind2])
 103 
 104 /***************************************************************/
 105 mlib_status FUN_NAME(1ch)(mlib_affine_param *param)
 106 {
 107   DECLAREVAR_BL();
 108   DTYPE *dstLineEnd;
 109   DTYPE *srcPixelPtr2;
 110   FTYPE scale = (FTYPE) 1.0 / MLIB_PREC;
 111 
 112   for (j = yStart; j <= yFinish; j++) {
 113     FTYPE fdx, fdy;
 114     TTYPE a00_0, a01_0, a10_0, a11_0;
 115     FTYPE pix0_0, pix1_0, res0;
 116 
 117     CLIP(1);
 118     dstLineEnd = (DTYPE *) dstData + xRight;
 119 
 120     GET_POINTERS(1);
 121     LOAD(0, 0, 1);
 122 
 123 #ifdef __SUNPRO_C
 124 #pragma pipeloop(0)
 125 #endif /* __SUNPRO_C */
 126     for (; dstPixelPtr < dstLineEnd; dstPixelPtr++) {
 127       COUNT(0);
 128       GET_POINTERS(1);
 129       LOAD(0, 0, 1);
 130       dstPixelPtr[0] = (DTYPE) res0;
 131     }
 132 
 133     COUNT(0);
 134     dstPixelPtr[0] = (DTYPE) res0;
 135   }
 136 
 137   return MLIB_SUCCESS;
 138 }
 139 
 140 /***************************************************************/
 141 mlib_status FUN_NAME(2ch)(mlib_affine_param *param)
 142 {
 143   DECLAREVAR_BL();
 144   DTYPE *dstLineEnd;
 145   DTYPE *srcPixelPtr2;
 146   FTYPE scale = (FTYPE) 1.0 / MLIB_PREC;
 147 
 148   for (j = yStart; j <= yFinish; j++) {
 149     FTYPE fdx, fdy;
 150     TTYPE a00_0, a01_0, a10_0, a11_0;
 151     TTYPE a00_1, a01_1, a10_1, a11_1;
 152     FTYPE pix0_0, pix1_0, res0;
 153     FTYPE pix0_1, pix1_1, res1;
 154 
 155     CLIP(2);
 156     dstLineEnd = (DTYPE *) dstData + 2 * xRight;
 157 
 158     GET_POINTERS(2);
 159     LOAD(0, 0, 2);
 160     LOAD(1, 1, 3);
 161 
 162 #ifdef __SUNPRO_C
 163 #pragma pipeloop(0)
 164 #endif /* __SUNPRO_C */
 165     for (; dstPixelPtr < dstLineEnd; dstPixelPtr += 2) {
 166       COUNT(0);
 167       COUNT(1);
 168       GET_POINTERS(2);
 169       LOAD(0, 0, 2);
 170       LOAD(1, 1, 3);
 171       dstPixelPtr[0] = (DTYPE) res0;
 172       dstPixelPtr[1] = (DTYPE) res1;
 173     }
 174 
 175     COUNT(0);
 176     COUNT(1);
 177     dstPixelPtr[0] = (DTYPE) res0;
 178     dstPixelPtr[1] = (DTYPE) res1;
 179   }
 180 
 181   return MLIB_SUCCESS;
 182 }
 183 
 184 /***************************************************************/
 185 mlib_status FUN_NAME(3ch)(mlib_affine_param *param)
 186 {
 187   DECLAREVAR_BL();
 188   DTYPE *dstLineEnd;
 189   DTYPE *srcPixelPtr2;
 190   FTYPE scale = (FTYPE) 1.0 / MLIB_PREC;
 191 
 192   for (j = yStart; j <= yFinish; j++) {
 193     FTYPE fdx, fdy;
 194     FTYPE a00_0, a01_0, a10_0, a11_0;
 195     FTYPE a00_1, a01_1, a10_1, a11_1;
 196     FTYPE a00_2, a01_2, a10_2, a11_2;
 197     FTYPE pix0_0, pix1_0, res0;
 198     FTYPE pix0_1, pix1_1, res1;
 199     FTYPE pix0_2, pix1_2, res2;
 200 
 201     CLIP(3);
 202     dstLineEnd = (DTYPE *) dstData + 3 * xRight;
 203 
 204     GET_POINTERS(3);
 205     LOAD(0, 0, 3);
 206     LOAD(1, 1, 4);
 207     LOAD(2, 2, 5);
 208 
 209 #ifdef __SUNPRO_C
 210 #pragma pipeloop(0)
 211 #endif /* __SUNPRO_C */
 212     for (; dstPixelPtr < dstLineEnd; dstPixelPtr += 3) {
 213       COUNT(0);
 214       COUNT(1);
 215       COUNT(2);
 216       GET_POINTERS(3);
 217       LOAD(0, 0, 3);
 218       LOAD(1, 1, 4);
 219       LOAD(2, 2, 5);
 220       dstPixelPtr[0] = (DTYPE) res0;
 221       dstPixelPtr[1] = (DTYPE) res1;
 222       dstPixelPtr[2] = (DTYPE) res2;
 223     }
 224 
 225     COUNT(0);
 226     COUNT(1);
 227     COUNT(2);
 228     dstPixelPtr[0] = (DTYPE) res0;
 229     dstPixelPtr[1] = (DTYPE) res1;
 230     dstPixelPtr[2] = (DTYPE) res2;
 231   }
 232 
 233   return MLIB_SUCCESS;
 234 }
 235 
 236 /***************************************************************/
 237 mlib_status FUN_NAME(4ch)(mlib_affine_param *param)
 238 {
 239   DECLAREVAR_BL();
 240   DTYPE *dstLineEnd;
 241   DTYPE *srcPixelPtr2;
 242   FTYPE scale = (FTYPE) 1.0 / MLIB_PREC;
 243 
 244   for (j = yStart; j <= yFinish; j++) {
 245     FTYPE fdx, fdy;
 246     TTYPE a00_0, a01_0, a10_0, a11_0;
 247     TTYPE a00_1, a01_1, a10_1, a11_1;
 248     TTYPE a00_2, a01_2, a10_2, a11_2;
 249     TTYPE a00_3, a01_3, a10_3, a11_3;
 250     FTYPE pix0_0, pix1_0, res0;
 251     FTYPE pix0_1, pix1_1, res1;
 252     FTYPE pix0_2, pix1_2, res2;
 253     FTYPE pix0_3, pix1_3, res3;
 254 
 255     CLIP(4);
 256     dstLineEnd = (DTYPE *) dstData + 4 * xRight;
 257 
 258     GET_POINTERS(4);
 259     LOAD(0, 0, 4);
 260     LOAD(1, 1, 5);
 261     LOAD(2, 2, 6);
 262     LOAD(3, 3, 7);
 263 
 264 #ifdef __SUNPRO_C
 265 #pragma pipeloop(0)
 266 #endif /* __SUNPRO_C */
 267     for (; dstPixelPtr < dstLineEnd; dstPixelPtr += 4) {
 268       COUNT(0);
 269       COUNT(1);
 270       COUNT(2);
 271       COUNT(3);
 272       GET_POINTERS(4);
 273       LOAD(0, 0, 4);
 274       LOAD(1, 1, 5);
 275       LOAD(2, 2, 6);
 276       LOAD(3, 3, 7);
 277       dstPixelPtr[0] = (DTYPE) res0;
 278       dstPixelPtr[1] = (DTYPE) res1;
 279       dstPixelPtr[2] = (DTYPE) res2;
 280       dstPixelPtr[3] = (DTYPE) res3;
 281     }
 282 
 283     COUNT(0);
 284     COUNT(1);
 285     COUNT(2);
 286     COUNT(3);
 287     dstPixelPtr[0] = (DTYPE) res0;
 288     dstPixelPtr[1] = (DTYPE) res1;
 289     dstPixelPtr[2] = (DTYPE) res2;
 290     dstPixelPtr[3] = (DTYPE) res3;
 291   }
 292 
 293   return MLIB_SUCCESS;
 294 }
 295 
 296 /***************************************************************/
 297 #else       /* for x86, using integer multiplies is faster */
 298 
 299 /***************************************************************/
 300 /* for SHORT/USHORT decrease MLIB_SHIFT due to overflow in multiplies like fdy * (a10 - a00) */
 301 #undef  MLIB_SHIFT
 302 #define MLIB_SHIFT  15
 303 
 304 #define MLIB_ROUND   (1 << (MLIB_SHIFT - 1))
 305 
 306 /***************************************************************/
 307 #define GET_POINTERS(ind)                                        \
 308   fdx = X & MLIB_MASK;                                           \
 309   fdy = Y & MLIB_MASK;                                           \
 310   ySrc = MLIB_POINTER_SHIFT(Y);                                  \
 311   xSrc = X >> MLIB_SHIFT;                                        \
 312   srcPixelPtr = MLIB_POINTER_GET(lineAddr, ySrc) + ind * xSrc;   \
 313   srcPixelPtr2 = (DTYPE *)((mlib_u8 *)srcPixelPtr + srcYStride); \
 314   X += dX;                                                       \
 315   Y += dY
 316 
 317 /***************************************************************/
 318 #define COUNT(ind)                                                                       \
 319   pix0_##ind = a00_##ind + ((fdy * (a10_##ind - a00_##ind) + MLIB_ROUND) >> MLIB_SHIFT); \
 320   pix1_##ind = a01_##ind + ((fdy * (a11_##ind - a01_##ind) + MLIB_ROUND) >> MLIB_SHIFT); \
 321   res##ind = pix0_##ind + ((fdx * (pix1_##ind - pix0_##ind) + MLIB_ROUND) >> MLIB_SHIFT)
 322 
 323 /***************************************************************/
 324 #define LOAD(ind, ind1, ind2)                                   \
 325   a00_##ind = srcPixelPtr[ind1];                                \
 326   a01_##ind = srcPixelPtr[ind2];                                \
 327   a10_##ind = srcPixelPtr2[ind1];                               \
 328   a11_##ind = srcPixelPtr2[ind2]
 329 
 330 /***************************************************************/
 331 mlib_status FUN_NAME(1ch)(mlib_affine_param *param)
 332 {
 333   DECLAREVAR_BL();
 334   DTYPE *dstLineEnd;
 335   DTYPE *srcPixelPtr2;
 336 
 337 #if MLIB_SHIFT == 15
 338   dX = (dX + 1) >> 1;
 339   dY = (dY + 1) >> 1;
 340 #endif
 341 
 342   for (j = yStart; j <= yFinish; j++) {
 343     mlib_s32 fdx, fdy;
 344     mlib_s32 a00_0, a01_0, a10_0, a11_0;
 345     mlib_s32 pix0_0, pix1_0, res0;
 346 
 347     CLIP(1);
 348     dstLineEnd = (DTYPE *) dstData + xRight;
 349 #if MLIB_SHIFT == 15
 350     X = X >> 1;
 351     Y = Y >> 1;
 352 
 353     if (warp_tbl != NULL) {
 354       dX = (dX + 1) >> 1;
 355       dY = (dY + 1) >> 1;
 356     }
 357 
 358 #endif
 359 
 360     GET_POINTERS(1);
 361     LOAD(0, 0, 1);
 362 
 363 #ifdef __SUNPRO_C
 364 #pragma pipeloop(0)
 365 #endif /* __SUNPRO_C */
 366     for (; dstPixelPtr < dstLineEnd; dstPixelPtr++) {
 367       COUNT(0);
 368       GET_POINTERS(1);
 369       LOAD(0, 0, 1);
 370       dstPixelPtr[0] = (DTYPE) res0;
 371     }
 372 
 373     COUNT(0);
 374     dstPixelPtr[0] = (DTYPE) res0;
 375   }
 376 
 377   return MLIB_SUCCESS;
 378 }
 379 
 380 /***************************************************************/
 381 mlib_status FUN_NAME(2ch)(mlib_affine_param *param)
 382 {
 383   DECLAREVAR_BL();
 384   DTYPE *dstLineEnd;
 385   DTYPE *srcPixelPtr2;
 386 
 387 #if MLIB_SHIFT == 15
 388   dX = (dX + 1) >> 1;
 389   dY = (dY + 1) >> 1;
 390 #endif
 391 
 392   for (j = yStart; j <= yFinish; j++) {
 393     mlib_s32 fdx, fdy;
 394     mlib_s32 a00_0, a01_0, a10_0, a11_0;
 395     mlib_s32 a00_1, a01_1, a10_1, a11_1;
 396     mlib_s32 pix0_0, pix1_0, res0;
 397     mlib_s32 pix0_1, pix1_1, res1;
 398 
 399     CLIP(2);
 400     dstLineEnd = (DTYPE *) dstData + 2 * xRight;
 401 #if MLIB_SHIFT == 15
 402     X = X >> 1;
 403     Y = Y >> 1;
 404 
 405     if (warp_tbl != NULL) {
 406       dX = (dX + 1) >> 1;
 407       dY = (dY + 1) >> 1;
 408     }
 409 
 410 #endif
 411 
 412     GET_POINTERS(2);
 413     LOAD(0, 0, 2);
 414     LOAD(1, 1, 3);
 415 
 416 #ifdef __SUNPRO_C
 417 #pragma pipeloop(0)
 418 #endif /* __SUNPRO_C */
 419     for (; dstPixelPtr < dstLineEnd; dstPixelPtr += 2) {
 420       COUNT(0);
 421       COUNT(1);
 422       GET_POINTERS(2);
 423       LOAD(0, 0, 2);
 424       LOAD(1, 1, 3);
 425       dstPixelPtr[0] = (DTYPE) res0;
 426       dstPixelPtr[1] = (DTYPE) res1;
 427     }
 428 
 429     COUNT(0);
 430     COUNT(1);
 431     dstPixelPtr[0] = (DTYPE) res0;
 432     dstPixelPtr[1] = (DTYPE) res1;
 433   }
 434 
 435   return MLIB_SUCCESS;
 436 }
 437 
 438 /***************************************************************/
 439 mlib_status FUN_NAME(3ch)(mlib_affine_param *param)
 440 {
 441   DECLAREVAR_BL();
 442   DTYPE *dstLineEnd;
 443   DTYPE *srcPixelPtr2;
 444 
 445 #if MLIB_SHIFT == 15
 446   dX = (dX + 1) >> 1;
 447   dY = (dY + 1) >> 1;
 448 #endif
 449 
 450   for (j = yStart; j <= yFinish; j++) {
 451     mlib_s32 fdx, fdy;
 452     mlib_s32 a00_0, a01_0, a10_0, a11_0;
 453     mlib_s32 a00_1, a01_1, a10_1, a11_1;
 454     mlib_s32 a00_2, a01_2, a10_2, a11_2;
 455     mlib_s32 pix0_0, pix1_0, res0;
 456     mlib_s32 pix0_1, pix1_1, res1;
 457     mlib_s32 pix0_2, pix1_2, res2;
 458 
 459     CLIP(3);
 460     dstLineEnd = (DTYPE *) dstData + 3 * xRight;
 461 #if MLIB_SHIFT == 15
 462     X = X >> 1;
 463     Y = Y >> 1;
 464 
 465     if (warp_tbl != NULL) {
 466       dX = (dX + 1) >> 1;
 467       dY = (dY + 1) >> 1;
 468     }
 469 
 470 #endif
 471 
 472     GET_POINTERS(3);
 473     LOAD(0, 0, 3);
 474     LOAD(1, 1, 4);
 475     LOAD(2, 2, 5);
 476 
 477 #ifdef __SUNPRO_C
 478 #pragma pipeloop(0)
 479 #endif /* __SUNPRO_C */
 480     for (; dstPixelPtr < dstLineEnd; dstPixelPtr += 3) {
 481       COUNT(0);
 482       COUNT(1);
 483       COUNT(2);
 484       GET_POINTERS(3);
 485       LOAD(0, 0, 3);
 486       LOAD(1, 1, 4);
 487       LOAD(2, 2, 5);
 488       dstPixelPtr[0] = (DTYPE) res0;
 489       dstPixelPtr[1] = (DTYPE) res1;
 490       dstPixelPtr[2] = (DTYPE) res2;
 491     }
 492 
 493     COUNT(0);
 494     COUNT(1);
 495     COUNT(2);
 496     dstPixelPtr[0] = (DTYPE) res0;
 497     dstPixelPtr[1] = (DTYPE) res1;
 498     dstPixelPtr[2] = (DTYPE) res2;
 499   }
 500 
 501   return MLIB_SUCCESS;
 502 }
 503 
 504 /***************************************************************/
 505 mlib_status FUN_NAME(4ch)(mlib_affine_param *param)
 506 {
 507   DECLAREVAR_BL();
 508   DTYPE *dstLineEnd;
 509   DTYPE *srcPixelPtr2;
 510 
 511 #if MLIB_SHIFT == 15
 512   dX = (dX + 1) >> 1;
 513   dY = (dY + 1) >> 1;
 514 #endif
 515 
 516   for (j = yStart; j <= yFinish; j++) {
 517     mlib_s32 fdx, fdy;
 518     mlib_s32 a00_0, a01_0, a10_0, a11_0;
 519     mlib_s32 a00_1, a01_1, a10_1, a11_1;
 520     mlib_s32 a00_2, a01_2, a10_2, a11_2;
 521     mlib_s32 a00_3, a01_3, a10_3, a11_3;
 522     mlib_s32 pix0_0, pix1_0, res0;
 523     mlib_s32 pix0_1, pix1_1, res1;
 524     mlib_s32 pix0_2, pix1_2, res2;
 525     mlib_s32 pix0_3, pix1_3, res3;
 526 
 527     CLIP(4);
 528     dstLineEnd = (DTYPE *) dstData + 4 * xRight;
 529 #if MLIB_SHIFT == 15
 530     X = X >> 1;
 531     Y = Y >> 1;
 532 
 533     if (warp_tbl != NULL) {
 534       dX = (dX + 1) >> 1;
 535       dY = (dY + 1) >> 1;
 536     }
 537 
 538 #endif
 539 
 540     GET_POINTERS(4);
 541     LOAD(0, 0, 4);
 542     LOAD(1, 1, 5);
 543     LOAD(2, 2, 6);
 544     LOAD(3, 3, 7);
 545 
 546 #ifdef __SUNPRO_C
 547 #pragma pipeloop(0)
 548 #endif /* __SUNPRO_C */
 549     for (; dstPixelPtr < dstLineEnd; dstPixelPtr += 4) {
 550       COUNT(0);
 551       COUNT(1);
 552       COUNT(2);
 553       COUNT(3);
 554       GET_POINTERS(4);
 555       LOAD(0, 0, 4);
 556       LOAD(1, 1, 5);
 557       LOAD(2, 2, 6);
 558       LOAD(3, 3, 7);
 559       dstPixelPtr[0] = (DTYPE) res0;
 560       dstPixelPtr[1] = (DTYPE) res1;
 561       dstPixelPtr[2] = (DTYPE) res2;
 562       dstPixelPtr[3] = (DTYPE) res3;
 563     }
 564 
 565     COUNT(0);
 566     COUNT(1);
 567     COUNT(2);
 568     COUNT(3);
 569     dstPixelPtr[0] = (DTYPE) res0;
 570     dstPixelPtr[1] = (DTYPE) res1;
 571     dstPixelPtr[2] = (DTYPE) res2;
 572     dstPixelPtr[3] = (DTYPE) res3;
 573   }
 574 
 575   return MLIB_SUCCESS;
 576 }
 577 
 578 #endif /* #ifdef __sparc */
 579 
 580 /***************************************************************/