Imported Upstream version 1.5.3
[platform/upstream/libjpeg-turbo.git] / simd / jdcolor-sse2.asm
1 ;
2 ; jdcolor.asm - colorspace conversion (SSE2)
3 ;
4 ; Copyright 2009 Pierre Ossman <ossman@cendio.se> for Cendio AB
5 ; Copyright (C) 2009, D. R. Commander.
6 ;
7 ; Based on the x86 SIMD extension for IJG JPEG library
8 ; Copyright (C) 1999-2006, MIYASAKA Masaru.
9 ; For conditions of distribution and use, see copyright notice in jsimdext.inc
10 ;
11 ; This file should be assembled with NASM (Netwide Assembler),
12 ; can *not* be assembled with Microsoft's MASM or any compatible
13 ; assembler (including Borland's Turbo Assembler).
14 ; NASM is available from http://nasm.sourceforge.net/ or
15 ; http://sourceforge.net/project/showfiles.php?group_id=6208
16 ;
17 ; [TAB8]
18
19 %include "jsimdext.inc"
20
21 ; --------------------------------------------------------------------------
22
23 %define SCALEBITS       16
24
25 F_0_344 equ      22554                  ; FIX(0.34414)
26 F_0_714 equ      46802                  ; FIX(0.71414)
27 F_1_402 equ      91881                  ; FIX(1.40200)
28 F_1_772 equ     116130                  ; FIX(1.77200)
29 F_0_402 equ     (F_1_402 - 65536)       ; FIX(1.40200) - FIX(1)
30 F_0_285 equ     ( 65536 - F_0_714)      ; FIX(1) - FIX(0.71414)
31 F_0_228 equ     (131072 - F_1_772)      ; FIX(2) - FIX(1.77200)
32
33 ; --------------------------------------------------------------------------
34         SECTION SEG_CONST
35
36         alignz  16
37         global  EXTN(jconst_ycc_rgb_convert_sse2)
38
39 EXTN(jconst_ycc_rgb_convert_sse2):
40
41 PW_F0402        times 8 dw  F_0_402
42 PW_MF0228       times 8 dw -F_0_228
43 PW_MF0344_F0285 times 4 dw -F_0_344, F_0_285
44 PW_ONE          times 8 dw  1
45 PD_ONEHALF      times 4 dd  1 << (SCALEBITS-1)
46
47         alignz  16
48
49 ; --------------------------------------------------------------------------
50         SECTION SEG_TEXT
51         BITS    32
52
53 %include "jdcolext-sse2.asm"
54
55 %undef RGB_RED
56 %undef RGB_GREEN
57 %undef RGB_BLUE
58 %undef RGB_PIXELSIZE
59 %define RGB_RED EXT_RGB_RED
60 %define RGB_GREEN EXT_RGB_GREEN
61 %define RGB_BLUE EXT_RGB_BLUE
62 %define RGB_PIXELSIZE EXT_RGB_PIXELSIZE
63 %define jsimd_ycc_rgb_convert_sse2 jsimd_ycc_extrgb_convert_sse2
64 %include "jdcolext-sse2.asm"
65
66 %undef RGB_RED
67 %undef RGB_GREEN
68 %undef RGB_BLUE
69 %undef RGB_PIXELSIZE
70 %define RGB_RED EXT_RGBX_RED
71 %define RGB_GREEN EXT_RGBX_GREEN
72 %define RGB_BLUE EXT_RGBX_BLUE
73 %define RGB_PIXELSIZE EXT_RGBX_PIXELSIZE
74 %define jsimd_ycc_rgb_convert_sse2 jsimd_ycc_extrgbx_convert_sse2
75 %include "jdcolext-sse2.asm"
76
77 %undef RGB_RED
78 %undef RGB_GREEN
79 %undef RGB_BLUE
80 %undef RGB_PIXELSIZE
81 %define RGB_RED EXT_BGR_RED
82 %define RGB_GREEN EXT_BGR_GREEN
83 %define RGB_BLUE EXT_BGR_BLUE
84 %define RGB_PIXELSIZE EXT_BGR_PIXELSIZE
85 %define jsimd_ycc_rgb_convert_sse2 jsimd_ycc_extbgr_convert_sse2
86 %include "jdcolext-sse2.asm"
87
88 %undef RGB_RED
89 %undef RGB_GREEN
90 %undef RGB_BLUE
91 %undef RGB_PIXELSIZE
92 %define RGB_RED EXT_BGRX_RED
93 %define RGB_GREEN EXT_BGRX_GREEN
94 %define RGB_BLUE EXT_BGRX_BLUE
95 %define RGB_PIXELSIZE EXT_BGRX_PIXELSIZE
96 %define jsimd_ycc_rgb_convert_sse2 jsimd_ycc_extbgrx_convert_sse2
97 %include "jdcolext-sse2.asm"
98
99 %undef RGB_RED
100 %undef RGB_GREEN
101 %undef RGB_BLUE
102 %undef RGB_PIXELSIZE
103 %define RGB_RED EXT_XBGR_RED
104 %define RGB_GREEN EXT_XBGR_GREEN
105 %define RGB_BLUE EXT_XBGR_BLUE
106 %define RGB_PIXELSIZE EXT_XBGR_PIXELSIZE
107 %define jsimd_ycc_rgb_convert_sse2 jsimd_ycc_extxbgr_convert_sse2
108 %include "jdcolext-sse2.asm"
109
110 %undef RGB_RED
111 %undef RGB_GREEN
112 %undef RGB_BLUE
113 %undef RGB_PIXELSIZE
114 %define RGB_RED EXT_XRGB_RED
115 %define RGB_GREEN EXT_XRGB_GREEN
116 %define RGB_BLUE EXT_XRGB_BLUE
117 %define RGB_PIXELSIZE EXT_XRGB_PIXELSIZE
118 %define jsimd_ycc_rgb_convert_sse2 jsimd_ycc_extxrgb_convert_sse2
119 %include "jdcolext-sse2.asm"