;
; jdmerge.asm - merged upsampling/color conversion (64-bit SSE2)
;
; Copyright 2009 Pierre Ossman <ossman@cendio.se> for Cendio AB
; Copyright 2009 D. R. Commander
;
; Based on
; x86 SIMD extension for IJG JPEG library
; Copyright (C) 1999-2006, MIYASAKA Masaru.
; For conditions of distribution and use, see copyright notice in jsimdext.inc
;
; This file should be assembled with NASM (Netwide Assembler),
; can *not* be assembled with Microsoft's MASM or any compatible
; assembler (including Borland's Turbo Assembler).
; NASM is available from http://nasm.sourceforge.net/ or
; http://sourceforge.net/project/showfiles.php?group_id=6208
;
; [TAB8]

%include "jsimdext.inc"

; --------------------------------------------------------------------------

; Number of fractional bits used by the fixed-point constants below.
%define SCALEBITS       16

; Fixed-point coefficients.  FIX(x) is x scaled by 2^SCALEBITS (65536) and
; rounded to the nearest integer, e.g. 0.34414 * 65536 ~= 22554.
;
; F_0_402, F_0_285 and F_0_228 are expressed as offsets from FIX(1) or
; FIX(2).  The resulting values (26345, 18734 and 14942) lie inside the
; signed 16-bit range, unlike F_1_402 and F_1_772 themselves, which matters
; because the constant table in this file emits them with `dw`.
F_0_344 equ      22554                  ; FIX(0.34414)
F_0_714 equ      46802                  ; FIX(0.71414)
F_1_402 equ      91881                  ; FIX(1.40200)
F_1_772 equ     116130                  ; FIX(1.77200)
F_0_402 equ     (F_1_402 - 65536)       ; FIX(1.40200) - FIX(1)
F_0_285 equ     ( 65536 - F_0_714)      ; FIX(1) - FIX(0.71414)
F_0_228 equ     (131072 - F_1_772)      ; FIX(2) - FIX(1.77200)

; --------------------------------------------------------------------------
; Read-only constant table for the merged upsampling routines.
;
; SEG_CONST, alignz and EXTN() are not defined in this file; presumably they
; come from jsimdext.inc (section name, zero-padded alignment, and symbol
; name decoration respectively) -- confirm there.
;
; Every entry below is exactly 16 bytes, i.e. one XMM-register-wide vector.
        SECTION SEG_CONST

        alignz  16
        global  EXTN(jconst_merged_upsample_sse2)

EXTN(jconst_merged_upsample_sse2):

PW_F0402        times 8 dw  F_0_402             ; 8 words:  FIX(0.40200)
PW_MF0228       times 8 dw -F_0_228             ; 8 words: -FIX(0.22800)
PW_MF0344_F0285 times 4 dw -F_0_344, F_0_285    ; 4 interleaved word pairs:
                                                ;  (-FIX(0.34414), FIX(0.28586))
PW_ONE          times 8 dw  1                   ; 8 words:  1
PD_ONEHALF      times 4 dd  1 << (SCALEBITS-1)  ; 4 dwords: 2^(SCALEBITS-1),
                                                ;  i.e. one half in fixed point

        alignz  16

; --------------------------------------------------------------------------
; Code section.  The routine bodies live in jdmrgext-sse2-64.asm, which is
; included once per output pixel layout.
;
; This first inclusion happens before any RGB_* macro is redefined in this
; file, so it uses whatever RGB_RED / RGB_GREEN / RGB_BLUE / RGB_PIXELSIZE
; values are already in scope (presumably the defaults from jsimdext.inc --
; confirm there) and the unrenamed jsimd_h2v1/h2v2_merged_upsample_sse2
; names.
        SECTION SEG_TEXT
        BITS    64

%include "jdmrgext-sse2-64.asm"

; EXT_RGB variant: rebind the component-layout macros to the EXT_RGB_*
; values (defined outside this file), map the generic routine names onto the
; extrgb-specific ones, and include the shared implementation again.
%undef RGB_RED
%undef RGB_GREEN
%undef RGB_BLUE
%undef RGB_PIXELSIZE
%define RGB_RED EXT_RGB_RED
%define RGB_GREEN EXT_RGB_GREEN
%define RGB_BLUE EXT_RGB_BLUE
%define RGB_PIXELSIZE EXT_RGB_PIXELSIZE
%define jsimd_h2v1_merged_upsample_sse2 jsimd_h2v1_extrgb_merged_upsample_sse2
%define jsimd_h2v2_merged_upsample_sse2 jsimd_h2v2_extrgb_merged_upsample_sse2
%include "jdmrgext-sse2-64.asm"

; EXT_RGBX variant: rebind the component-layout macros to the EXT_RGBX_*
; values (defined outside this file), map the generic routine names onto the
; extrgbx-specific ones, and include the shared implementation again.
%undef RGB_RED
%undef RGB_GREEN
%undef RGB_BLUE
%undef RGB_PIXELSIZE
%define RGB_RED EXT_RGBX_RED
%define RGB_GREEN EXT_RGBX_GREEN
%define RGB_BLUE EXT_RGBX_BLUE
%define RGB_PIXELSIZE EXT_RGBX_PIXELSIZE
%define jsimd_h2v1_merged_upsample_sse2 jsimd_h2v1_extrgbx_merged_upsample_sse2
%define jsimd_h2v2_merged_upsample_sse2 jsimd_h2v2_extrgbx_merged_upsample_sse2
%include "jdmrgext-sse2-64.asm"

; EXT_BGR variant: rebind the component-layout macros to the EXT_BGR_*
; values (defined outside this file), map the generic routine names onto the
; extbgr-specific ones, and include the shared implementation again.
%undef RGB_RED
%undef RGB_GREEN
%undef RGB_BLUE
%undef RGB_PIXELSIZE
%define RGB_RED EXT_BGR_RED
%define RGB_GREEN EXT_BGR_GREEN
%define RGB_BLUE EXT_BGR_BLUE
%define RGB_PIXELSIZE EXT_BGR_PIXELSIZE
%define jsimd_h2v1_merged_upsample_sse2 jsimd_h2v1_extbgr_merged_upsample_sse2
%define jsimd_h2v2_merged_upsample_sse2 jsimd_h2v2_extbgr_merged_upsample_sse2
%include "jdmrgext-sse2-64.asm"

; EXT_BGRX variant: rebind the component-layout macros to the EXT_BGRX_*
; values (defined outside this file), map the generic routine names onto the
; extbgrx-specific ones, and include the shared implementation again.
%undef RGB_RED
%undef RGB_GREEN
%undef RGB_BLUE
%undef RGB_PIXELSIZE
%define RGB_RED EXT_BGRX_RED
%define RGB_GREEN EXT_BGRX_GREEN
%define RGB_BLUE EXT_BGRX_BLUE
%define RGB_PIXELSIZE EXT_BGRX_PIXELSIZE
%define jsimd_h2v1_merged_upsample_sse2 jsimd_h2v1_extbgrx_merged_upsample_sse2
%define jsimd_h2v2_merged_upsample_sse2 jsimd_h2v2_extbgrx_merged_upsample_sse2
%include "jdmrgext-sse2-64.asm"

; EXT_XBGR variant: rebind the component-layout macros to the EXT_XBGR_*
; values (defined outside this file), map the generic routine names onto the
; extxbgr-specific ones, and include the shared implementation again.
%undef RGB_RED
%undef RGB_GREEN
%undef RGB_BLUE
%undef RGB_PIXELSIZE
%define RGB_RED EXT_XBGR_RED
%define RGB_GREEN EXT_XBGR_GREEN
%define RGB_BLUE EXT_XBGR_BLUE
%define RGB_PIXELSIZE EXT_XBGR_PIXELSIZE
%define jsimd_h2v1_merged_upsample_sse2 jsimd_h2v1_extxbgr_merged_upsample_sse2
%define jsimd_h2v2_merged_upsample_sse2 jsimd_h2v2_extxbgr_merged_upsample_sse2
%include "jdmrgext-sse2-64.asm"

; EXT_XRGB variant: rebind the component-layout macros to the EXT_XRGB_*
; values (defined outside this file), map the generic routine names onto the
; extxrgb-specific ones, and include the shared implementation again.
%undef RGB_RED
%undef RGB_GREEN
%undef RGB_BLUE
%undef RGB_PIXELSIZE
%define RGB_RED EXT_XRGB_RED
%define RGB_GREEN EXT_XRGB_GREEN
%define RGB_BLUE EXT_XRGB_BLUE
%define RGB_PIXELSIZE EXT_XRGB_PIXELSIZE
%define jsimd_h2v1_merged_upsample_sse2 jsimd_h2v1_extxrgb_merged_upsample_sse2
%define jsimd_h2v2_merged_upsample_sse2 jsimd_h2v2_extxrgb_merged_upsample_sse2
%include "jdmrgext-sse2-64.asm"