|
1 /* |
|
2 * simd/jsimd.h |
|
3 * |
|
4 * Copyright 2009 Pierre Ossman <ossman@cendio.se> for Cendio AB |
|
5 * Copyright 2011 D. R. Commander |
|
6 * |
|
7 * Based on the x86 SIMD extension for IJG JPEG library, |
|
8 * Copyright (C) 1999-2006, MIYASAKA Masaru. |
|
9 * For conditions of distribution and use, see copyright notice in jsimdext.inc |
|
10 * |
|
11 */ |
|
12 |
|
13 /* Bitmask for supported acceleration methods */ |
|
14 |
|
15 #define JSIMD_NONE 0x00 |
|
16 #define JSIMD_MMX 0x01 |
|
17 #define JSIMD_3DNOW 0x02 |
|
18 #define JSIMD_SSE 0x04 |
|
19 #define JSIMD_SSE2 0x08 |
|
20 #define JSIMD_ARM_NEON 0x10 |
|
21 |
|
22 /* Short forms of external names for systems with brain-damaged linkers. */ |
|
23 |
|
24 #ifdef NEED_SHORT_EXTERNAL_NAMES |
|
25 #define jpeg_simd_cpu_support jSiCpuSupport |
|
26 #define jsimd_rgb_ycc_convert_mmx jSRGBYCCM |
|
27 #define jsimd_extrgb_ycc_convert_mmx jSEXTRGBYCCM |
|
28 #define jsimd_extrgbx_ycc_convert_mmx jSEXTRGBXYCCM |
|
29 #define jsimd_extbgr_ycc_convert_mmx jSEXTBGRYCCM |
|
30 #define jsimd_extbgrx_ycc_convert_mmx jSEXTBGRXYCCM |
|
31 #define jsimd_extxbgr_ycc_convert_mmx jSEXTXBGRYCCM |
|
32 #define jsimd_extxrgb_ycc_convert_mmx jSEXTXRGBYCCM |
|
33 #define jsimd_rgb_gray_convert_mmx jSRGBGRYM |
|
34 #define jsimd_extrgb_gray_convert_mmx jSEXTRGBGRYM |
|
35 #define jsimd_extrgbx_gray_convert_mmx jSEXTRGBXGRYM |
|
36 #define jsimd_extbgr_gray_convert_mmx jSEXTBGRGRYM |
|
37 #define jsimd_extbgrx_gray_convert_mmx jSEXTBGRXGRYM |
|
38 #define jsimd_extxbgr_gray_convert_mmx jSEXTXBGRGRYM |
|
39 #define jsimd_extxrgb_gray_convert_mmx jSEXTXRGBGRYM |
|
40 #define jsimd_ycc_rgb_convert_mmx jSYCCRGBM |
|
41 #define jsimd_ycc_extrgb_convert_mmx jSYCCEXTRGBM |
|
42 #define jsimd_ycc_extrgbx_convert_mmx jSYCCEXTRGBXM |
|
43 #define jsimd_ycc_extbgr_convert_mmx jSYCCEXTBGRM |
|
44 #define jsimd_ycc_extbgrx_convert_mmx jSYCCEXTBGRXM |
|
45 #define jsimd_ycc_extxbgr_convert_mmx jSYCCEXTXBGRM |
|
46 #define jsimd_ycc_extxrgb_convert_mmx jSYCCEXTXRGBM |
|
47 #define jconst_rgb_ycc_convert_sse2 jSCRGBYCCS2 |
|
48 #define jsimd_rgb_ycc_convert_sse2 jSRGBYCCS2 |
|
49 #define jsimd_extrgb_ycc_convert_sse2 jSEXTRGBYCCS2 |
|
50 #define jsimd_extrgbx_ycc_convert_sse2 jSEXTRGBXYCCS2 |
|
51 #define jsimd_extbgr_ycc_convert_sse2 jSEXTBGRYCCS2 |
|
52 #define jsimd_extbgrx_ycc_convert_sse2 jSEXTBGRXYCCS2 |
|
53 #define jsimd_extxbgr_ycc_convert_sse2 jSEXTXBGRYCCS2 |
|
54 #define jsimd_extxrgb_ycc_convert_sse2 jSEXTXRGBYCCS2 |
|
55 #define jconst_rgb_gray_convert_sse2 jSCRGBGRYS2 |
|
56 #define jsimd_rgb_gray_convert_sse2 jSRGBGRYS2 |
|
57 #define jsimd_extrgb_gray_convert_sse2 jSEXTRGBGRYS2 |
|
58 #define jsimd_extrgbx_gray_convert_sse2 jSEXTRGBXGRYS2 |
|
59 #define jsimd_extbgr_gray_convert_sse2 jSEXTBGRGRYS2 |
|
60 #define jsimd_extbgrx_gray_convert_sse2 jSEXTBGRXGRYS2 |
|
61 #define jsimd_extxbgr_gray_convert_sse2 jSEXTXBGRGRYS2 |
|
62 #define jsimd_extxrgb_gray_convert_sse2 jSEXTXRGBGRYS2 |
|
63 #define jconst_ycc_rgb_convert_sse2 jSCYCCRGBS2 |
|
64 #define jsimd_ycc_rgb_convert_sse2 jSYCCRGBS2 |
|
65 #define jsimd_ycc_extrgb_convert_sse2 jSYCCEXTRGBS2 |
|
66 #define jsimd_ycc_extrgbx_convert_sse2 jSYCCEXTRGBXS2 |
|
67 #define jsimd_ycc_extbgr_convert_sse2 jSYCCEXTBGRS2 |
|
68 #define jsimd_ycc_extbgrx_convert_sse2 jSYCCEXTBGRXS2 |
|
69 #define jsimd_ycc_extxbgr_convert_sse2 jSYCCEXTXBGRS2 |
|
70 #define jsimd_ycc_extxrgb_convert_sse2 jSYCCEXTXRGBS2 |
|
71 #define jsimd_h2v2_downsample_mmx jSDnH2V2M |
|
72 #define jsimd_h2v1_downsample_mmx jSDnH2V1M |
|
73 #define jsimd_h2v2_downsample_sse2 jSDnH2V2S2 |
|
74 #define jsimd_h2v1_downsample_sse2 jSDnH2V1S2 |
|
75 #define jsimd_h2v2_upsample_mmx jSUpH2V2M |
|
76 #define jsimd_h2v1_upsample_mmx jSUpH2V1M |
|
77 #define jsimd_h2v2_fancy_upsample_mmx jSFUpH2V2M |
|
78 #define jsimd_h2v1_fancy_upsample_mmx jSFUpH2V1M |
|
79 #define jsimd_h2v2_merged_upsample_mmx jSMUpH2V2M |
|
80 #define jsimd_h2v2_extrgb_merged_upsample_mmx jSMUpH2V2EXTRGBM |
|
81 #define jsimd_h2v2_extrgbx_merged_upsample_mmx jSMUpH2V2EXTRGBXM |
|
82 #define jsimd_h2v2_extbgr_merged_upsample_mmx jSMUpH2V2EXTBGRM |
|
83 #define jsimd_h2v2_extbgrx_merged_upsample_mmx jSMUpH2V2EXTBGRXM |
|
84 #define jsimd_h2v2_extxbgr_merged_upsample_mmx jSMUpH2V2EXTXBGRM |
|
85 #define jsimd_h2v2_extxrgb_merged_upsample_mmx jSMUpH2V2EXTXRGBM |
|
86 #define jsimd_h2v1_merged_upsample_mmx jSMUpH2V1M |
|
87 #define jsimd_h2v1_extrgb_merged_upsample_mmx jSMUpH2V1EXTRGBM |
|
88 #define jsimd_h2v1_extrgbx_merged_upsample_mmx jSMUpH2V1EXTRGBXM |
|
89 #define jsimd_h2v1_extbgr_merged_upsample_mmx jSMUpH2V1EXTBGRM |
|
90 #define jsimd_h2v1_extbgrx_merged_upsample_mmx jSMUpH2V1EXTBGRXM |
|
91 #define jsimd_h2v1_extxbgr_merged_upsample_mmx jSMUpH2V1EXTXBGRM |
|
92 #define jsimd_h2v1_extxrgb_merged_upsample_mmx jSMUpH2V1EXTXRGBM |
|
93 #define jsimd_h2v2_upsample_sse2 jSUpH2V2S2 |
|
94 #define jsimd_h2v1_upsample_sse2 jSUpH2V1S2 |
|
95 #define jconst_fancy_upsample_sse2 jSCFUpS2 |
|
96 #define jsimd_h2v2_fancy_upsample_sse2 jSFUpH2V2S2 |
|
97 #define jsimd_h2v1_fancy_upsample_sse2 jSFUpH2V1S2 |
|
98 #define jconst_merged_upsample_sse2 jSCMUpS2 |
|
99 #define jsimd_h2v2_merged_upsample_sse2 jSMUpH2V2S2 |
|
100 #define jsimd_h2v2_extrgb_merged_upsample_sse2 jSMUpH2V2EXTRGBS2 |
|
101 #define jsimd_h2v2_extrgbx_merged_upsample_sse2 jSMUpH2V2EXTRGBXS2 |
|
102 #define jsimd_h2v2_extbgr_merged_upsample_sse2 jSMUpH2V2EXTBGRS2 |
|
103 #define jsimd_h2v2_extbgrx_merged_upsample_sse2 jSMUpH2V2EXTBGRXS2 |
|
104 #define jsimd_h2v2_extxbgr_merged_upsample_sse2 jSMUpH2V2EXTXBGRS2 |
|
105 #define jsimd_h2v2_extxrgb_merged_upsample_sse2 jSMUpH2V2EXTXRGBS2 |
|
106 #define jsimd_h2v1_merged_upsample_sse2 jSMUpH2V1S2 |
|
107 #define jsimd_h2v1_extrgb_merged_upsample_sse2 jSMUpH2V1EXTRGBS2 |
|
108 #define jsimd_h2v1_extrgbx_merged_upsample_sse2 jSMUpH2V1EXTRGBXS2 |
|
109 #define jsimd_h2v1_extbgr_merged_upsample_sse2 jSMUpH2V1EXTBGRS2 |
|
110 #define jsimd_h2v1_extbgrx_merged_upsample_sse2 jSMUpH2V1EXTBGRXS2 |
|
111 #define jsimd_h2v1_extxbgr_merged_upsample_sse2 jSMUpH2V1EXTXBGRS2 |
|
112 #define jsimd_h2v1_extxrgb_merged_upsample_sse2 jSMUpH2V1EXTXRGBS2 |
|
113 #define jsimd_convsamp_mmx jSConvM |
|
114 #define jsimd_convsamp_sse2 jSConvS2 |
|
115 #define jsimd_convsamp_float_3dnow jSConvF3D |
|
116 #define jsimd_convsamp_float_sse jSConvFS |
|
117 #define jsimd_convsamp_float_sse2 jSConvFS2 |
|
118 #define jsimd_fdct_islow_mmx jSFDMIS |
|
119 #define jsimd_fdct_ifast_mmx jSFDMIF |
|
120 #define jconst_fdct_islow_sse2 jSCFDS2IS |
|
121 #define jsimd_fdct_islow_sse2 jSFDS2IS |
|
122 #define jconst_fdct_ifast_sse2 jSCFDS2IF |
|
123 #define jsimd_fdct_ifast_sse2 jSFDS2IF |
|
124 #define jsimd_fdct_float_3dnow jSFD3DF |
|
125 #define jconst_fdct_float_sse jSCFDSF |
|
126 #define jsimd_fdct_float_sse jSFDSF |
|
127 #define jsimd_quantize_mmx jSQuantM |
|
128 #define jsimd_quantize_sse2 jSQuantS2 |
|
129 #define jsimd_quantize_float_3dnow jSQuantF3D |
|
130 #define jsimd_quantize_float_sse jSQuantFS |
|
131 #define jsimd_quantize_float_sse2 jSQuantFS2 |
|
132 #define jsimd_idct_2x2_mmx jSIDM22 |
|
133 #define jsimd_idct_4x4_mmx jSIDM44 |
|
134 #define jconst_idct_red_sse2 jSCIDS2R |
|
135 #define jsimd_idct_2x2_sse2 jSIDS222 |
|
136 #define jsimd_idct_4x4_sse2 jSIDS244 |
|
137 #define jsimd_idct_islow_mmx jSIDMIS |
|
138 #define jsimd_idct_ifast_mmx jSIDMIF |
|
139 #define jconst_idct_islow_sse2 jSCIDS2IS |
|
140 #define jsimd_idct_islow_sse2 jSIDS2IS |
|
141 #define jconst_idct_ifast_sse2 jSCIDS2IF |
|
142 #define jsimd_idct_ifast_sse2 jSIDS2IF |
|
143 #define jsimd_idct_float_3dnow jSID3DF |
|
144 #define jconst_fdct_float_sse jSCIDSF |
|
145 #define jsimd_idct_float_sse jSIDSF |
|
146 #define jconst_fdct_float_sse2 jSCIDS2F |
|
147 #define jsimd_idct_float_sse2 jSIDS2F |
|
148 #endif /* NEED_SHORT_EXTERNAL_NAMES */ |
|
149 |
|
150 /* SIMD Ext: retrieve SIMD/CPU information */ |
|
151 EXTERN(unsigned int) jpeg_simd_cpu_support JPP((void)); |
|
152 |
|
153 /* SIMD Color Space Conversion */ |
|
154 EXTERN(void) jsimd_rgb_ycc_convert_mmx |
|
155 JPP((JDIMENSION img_width, |
|
156 JSAMPARRAY input_buf, JSAMPIMAGE output_buf, |
|
157 JDIMENSION output_row, int num_rows)); |
|
158 EXTERN(void) jsimd_extrgb_ycc_convert_mmx |
|
159 JPP((JDIMENSION img_width, |
|
160 JSAMPARRAY input_buf, JSAMPIMAGE output_buf, |
|
161 JDIMENSION output_row, int num_rows)); |
|
162 EXTERN(void) jsimd_extrgbx_ycc_convert_mmx |
|
163 JPP((JDIMENSION img_width, |
|
164 JSAMPARRAY input_buf, JSAMPIMAGE output_buf, |
|
165 JDIMENSION output_row, int num_rows)); |
|
166 EXTERN(void) jsimd_extbgr_ycc_convert_mmx |
|
167 JPP((JDIMENSION img_width, |
|
168 JSAMPARRAY input_buf, JSAMPIMAGE output_buf, |
|
169 JDIMENSION output_row, int num_rows)); |
|
170 EXTERN(void) jsimd_extbgrx_ycc_convert_mmx |
|
171 JPP((JDIMENSION img_width, |
|
172 JSAMPARRAY input_buf, JSAMPIMAGE output_buf, |
|
173 JDIMENSION output_row, int num_rows)); |
|
174 EXTERN(void) jsimd_extxbgr_ycc_convert_mmx |
|
175 JPP((JDIMENSION img_width, |
|
176 JSAMPARRAY input_buf, JSAMPIMAGE output_buf, |
|
177 JDIMENSION output_row, int num_rows)); |
|
178 EXTERN(void) jsimd_extxrgb_ycc_convert_mmx |
|
179 JPP((JDIMENSION img_width, |
|
180 JSAMPARRAY input_buf, JSAMPIMAGE output_buf, |
|
181 JDIMENSION output_row, int num_rows)); |
|
182 |
|
183 EXTERN(void) jsimd_rgb_gray_convert_mmx |
|
184 JPP((JDIMENSION img_width, |
|
185 JSAMPARRAY input_buf, JSAMPIMAGE output_buf, |
|
186 JDIMENSION output_row, int num_rows)); |
|
187 EXTERN(void) jsimd_extrgb_gray_convert_mmx |
|
188 JPP((JDIMENSION img_width, |
|
189 JSAMPARRAY input_buf, JSAMPIMAGE output_buf, |
|
190 JDIMENSION output_row, int num_rows)); |
|
191 EXTERN(void) jsimd_extrgbx_gray_convert_mmx |
|
192 JPP((JDIMENSION img_width, |
|
193 JSAMPARRAY input_buf, JSAMPIMAGE output_buf, |
|
194 JDIMENSION output_row, int num_rows)); |
|
195 EXTERN(void) jsimd_extbgr_gray_convert_mmx |
|
196 JPP((JDIMENSION img_width, |
|
197 JSAMPARRAY input_buf, JSAMPIMAGE output_buf, |
|
198 JDIMENSION output_row, int num_rows)); |
|
199 EXTERN(void) jsimd_extbgrx_gray_convert_mmx |
|
200 JPP((JDIMENSION img_width, |
|
201 JSAMPARRAY input_buf, JSAMPIMAGE output_buf, |
|
202 JDIMENSION output_row, int num_rows)); |
|
203 EXTERN(void) jsimd_extxbgr_gray_convert_mmx |
|
204 JPP((JDIMENSION img_width, |
|
205 JSAMPARRAY input_buf, JSAMPIMAGE output_buf, |
|
206 JDIMENSION output_row, int num_rows)); |
|
207 EXTERN(void) jsimd_extxrgb_gray_convert_mmx |
|
208 JPP((JDIMENSION img_width, |
|
209 JSAMPARRAY input_buf, JSAMPIMAGE output_buf, |
|
210 JDIMENSION output_row, int num_rows)); |
|
211 |
|
212 EXTERN(void) jsimd_ycc_rgb_convert_mmx |
|
213 JPP((JDIMENSION out_width, |
|
214 JSAMPIMAGE input_buf, JDIMENSION input_row, |
|
215 JSAMPARRAY output_buf, int num_rows)); |
|
216 EXTERN(void) jsimd_ycc_extrgb_convert_mmx |
|
217 JPP((JDIMENSION out_width, |
|
218 JSAMPIMAGE input_buf, JDIMENSION input_row, |
|
219 JSAMPARRAY output_buf, int num_rows)); |
|
220 EXTERN(void) jsimd_ycc_extrgbx_convert_mmx |
|
221 JPP((JDIMENSION out_width, |
|
222 JSAMPIMAGE input_buf, JDIMENSION input_row, |
|
223 JSAMPARRAY output_buf, int num_rows)); |
|
224 EXTERN(void) jsimd_ycc_extbgr_convert_mmx |
|
225 JPP((JDIMENSION out_width, |
|
226 JSAMPIMAGE input_buf, JDIMENSION input_row, |
|
227 JSAMPARRAY output_buf, int num_rows)); |
|
228 EXTERN(void) jsimd_ycc_extbgrx_convert_mmx |
|
229 JPP((JDIMENSION out_width, |
|
230 JSAMPIMAGE input_buf, JDIMENSION input_row, |
|
231 JSAMPARRAY output_buf, int num_rows)); |
|
232 EXTERN(void) jsimd_ycc_extxbgr_convert_mmx |
|
233 JPP((JDIMENSION out_width, |
|
234 JSAMPIMAGE input_buf, JDIMENSION input_row, |
|
235 JSAMPARRAY output_buf, int num_rows)); |
|
236 EXTERN(void) jsimd_ycc_extxrgb_convert_mmx |
|
237 JPP((JDIMENSION out_width, |
|
238 JSAMPIMAGE input_buf, JDIMENSION input_row, |
|
239 JSAMPARRAY output_buf, int num_rows)); |
|
240 |
|
241 extern const int jconst_rgb_ycc_convert_sse2[]; |
|
242 EXTERN(void) jsimd_rgb_ycc_convert_sse2 |
|
243 JPP((JDIMENSION img_width, |
|
244 JSAMPARRAY input_buf, JSAMPIMAGE output_buf, |
|
245 JDIMENSION output_row, int num_rows)); |
|
246 EXTERN(void) jsimd_extrgb_ycc_convert_sse2 |
|
247 JPP((JDIMENSION img_width, |
|
248 JSAMPARRAY input_buf, JSAMPIMAGE output_buf, |
|
249 JDIMENSION output_row, int num_rows)); |
|
250 EXTERN(void) jsimd_extrgbx_ycc_convert_sse2 |
|
251 JPP((JDIMENSION img_width, |
|
252 JSAMPARRAY input_buf, JSAMPIMAGE output_buf, |
|
253 JDIMENSION output_row, int num_rows)); |
|
254 EXTERN(void) jsimd_extbgr_ycc_convert_sse2 |
|
255 JPP((JDIMENSION img_width, |
|
256 JSAMPARRAY input_buf, JSAMPIMAGE output_buf, |
|
257 JDIMENSION output_row, int num_rows)); |
|
258 EXTERN(void) jsimd_extbgrx_ycc_convert_sse2 |
|
259 JPP((JDIMENSION img_width, |
|
260 JSAMPARRAY input_buf, JSAMPIMAGE output_buf, |
|
261 JDIMENSION output_row, int num_rows)); |
|
262 EXTERN(void) jsimd_extxbgr_ycc_convert_sse2 |
|
263 JPP((JDIMENSION img_width, |
|
264 JSAMPARRAY input_buf, JSAMPIMAGE output_buf, |
|
265 JDIMENSION output_row, int num_rows)); |
|
266 EXTERN(void) jsimd_extxrgb_ycc_convert_sse2 |
|
267 JPP((JDIMENSION img_width, |
|
268 JSAMPARRAY input_buf, JSAMPIMAGE output_buf, |
|
269 JDIMENSION output_row, int num_rows)); |
|
270 |
|
271 extern const int jconst_rgb_gray_convert_sse2[]; |
|
272 EXTERN(void) jsimd_rgb_gray_convert_sse2 |
|
273 JPP((JDIMENSION img_width, |
|
274 JSAMPARRAY input_buf, JSAMPIMAGE output_buf, |
|
275 JDIMENSION output_row, int num_rows)); |
|
276 EXTERN(void) jsimd_extrgb_gray_convert_sse2 |
|
277 JPP((JDIMENSION img_width, |
|
278 JSAMPARRAY input_buf, JSAMPIMAGE output_buf, |
|
279 JDIMENSION output_row, int num_rows)); |
|
280 EXTERN(void) jsimd_extrgbx_gray_convert_sse2 |
|
281 JPP((JDIMENSION img_width, |
|
282 JSAMPARRAY input_buf, JSAMPIMAGE output_buf, |
|
283 JDIMENSION output_row, int num_rows)); |
|
284 EXTERN(void) jsimd_extbgr_gray_convert_sse2 |
|
285 JPP((JDIMENSION img_width, |
|
286 JSAMPARRAY input_buf, JSAMPIMAGE output_buf, |
|
287 JDIMENSION output_row, int num_rows)); |
|
288 EXTERN(void) jsimd_extbgrx_gray_convert_sse2 |
|
289 JPP((JDIMENSION img_width, |
|
290 JSAMPARRAY input_buf, JSAMPIMAGE output_buf, |
|
291 JDIMENSION output_row, int num_rows)); |
|
292 EXTERN(void) jsimd_extxbgr_gray_convert_sse2 |
|
293 JPP((JDIMENSION img_width, |
|
294 JSAMPARRAY input_buf, JSAMPIMAGE output_buf, |
|
295 JDIMENSION output_row, int num_rows)); |
|
296 EXTERN(void) jsimd_extxrgb_gray_convert_sse2 |
|
297 JPP((JDIMENSION img_width, |
|
298 JSAMPARRAY input_buf, JSAMPIMAGE output_buf, |
|
299 JDIMENSION output_row, int num_rows)); |
|
300 |
|
301 extern const int jconst_ycc_rgb_convert_sse2[]; |
|
302 EXTERN(void) jsimd_ycc_rgb_convert_sse2 |
|
303 JPP((JDIMENSION out_width, |
|
304 JSAMPIMAGE input_buf, JDIMENSION input_row, |
|
305 JSAMPARRAY output_buf, int num_rows)); |
|
306 EXTERN(void) jsimd_ycc_extrgb_convert_sse2 |
|
307 JPP((JDIMENSION out_width, |
|
308 JSAMPIMAGE input_buf, JDIMENSION input_row, |
|
309 JSAMPARRAY output_buf, int num_rows)); |
|
310 EXTERN(void) jsimd_ycc_extrgbx_convert_sse2 |
|
311 JPP((JDIMENSION out_width, |
|
312 JSAMPIMAGE input_buf, JDIMENSION input_row, |
|
313 JSAMPARRAY output_buf, int num_rows)); |
|
314 EXTERN(void) jsimd_ycc_extbgr_convert_sse2 |
|
315 JPP((JDIMENSION out_width, |
|
316 JSAMPIMAGE input_buf, JDIMENSION input_row, |
|
317 JSAMPARRAY output_buf, int num_rows)); |
|
318 EXTERN(void) jsimd_ycc_extbgrx_convert_sse2 |
|
319 JPP((JDIMENSION out_width, |
|
320 JSAMPIMAGE input_buf, JDIMENSION input_row, |
|
321 JSAMPARRAY output_buf, int num_rows)); |
|
322 EXTERN(void) jsimd_ycc_extxbgr_convert_sse2 |
|
323 JPP((JDIMENSION out_width, |
|
324 JSAMPIMAGE input_buf, JDIMENSION input_row, |
|
325 JSAMPARRAY output_buf, int num_rows)); |
|
326 EXTERN(void) jsimd_ycc_extxrgb_convert_sse2 |
|
327 JPP((JDIMENSION out_width, |
|
328 JSAMPIMAGE input_buf, JDIMENSION input_row, |
|
329 JSAMPARRAY output_buf, int num_rows)); |
|
330 |
|
331 EXTERN(void) jsimd_rgb_ycc_convert_neon |
|
332 JPP((JDIMENSION img_width, |
|
333 JSAMPARRAY input_buf, JSAMPIMAGE output_buf, |
|
334 JDIMENSION output_row, int num_rows)); |
|
335 EXTERN(void) jsimd_extrgb_ycc_convert_neon |
|
336 JPP((JDIMENSION img_width, |
|
337 JSAMPARRAY input_buf, JSAMPIMAGE output_buf, |
|
338 JDIMENSION output_row, int num_rows)); |
|
339 EXTERN(void) jsimd_extrgbx_ycc_convert_neon |
|
340 JPP((JDIMENSION img_width, |
|
341 JSAMPARRAY input_buf, JSAMPIMAGE output_buf, |
|
342 JDIMENSION output_row, int num_rows)); |
|
343 EXTERN(void) jsimd_extbgr_ycc_convert_neon |
|
344 JPP((JDIMENSION img_width, |
|
345 JSAMPARRAY input_buf, JSAMPIMAGE output_buf, |
|
346 JDIMENSION output_row, int num_rows)); |
|
347 EXTERN(void) jsimd_extbgrx_ycc_convert_neon |
|
348 JPP((JDIMENSION img_width, |
|
349 JSAMPARRAY input_buf, JSAMPIMAGE output_buf, |
|
350 JDIMENSION output_row, int num_rows)); |
|
351 EXTERN(void) jsimd_extxbgr_ycc_convert_neon |
|
352 JPP((JDIMENSION img_width, |
|
353 JSAMPARRAY input_buf, JSAMPIMAGE output_buf, |
|
354 JDIMENSION output_row, int num_rows)); |
|
355 EXTERN(void) jsimd_extxrgb_ycc_convert_neon |
|
356 JPP((JDIMENSION img_width, |
|
357 JSAMPARRAY input_buf, JSAMPIMAGE output_buf, |
|
358 JDIMENSION output_row, int num_rows)); |
|
359 |
|
360 EXTERN(void) jsimd_ycc_rgb_convert_neon |
|
361 JPP((JDIMENSION out_width, |
|
362 JSAMPIMAGE input_buf, JDIMENSION input_row, |
|
363 JSAMPARRAY output_buf, int num_rows)); |
|
364 EXTERN(void) jsimd_ycc_extrgb_convert_neon |
|
365 JPP((JDIMENSION out_width, |
|
366 JSAMPIMAGE input_buf, JDIMENSION input_row, |
|
367 JSAMPARRAY output_buf, int num_rows)); |
|
368 EXTERN(void) jsimd_ycc_extrgbx_convert_neon |
|
369 JPP((JDIMENSION out_width, |
|
370 JSAMPIMAGE input_buf, JDIMENSION input_row, |
|
371 JSAMPARRAY output_buf, int num_rows)); |
|
372 EXTERN(void) jsimd_ycc_extbgr_convert_neon |
|
373 JPP((JDIMENSION out_width, |
|
374 JSAMPIMAGE input_buf, JDIMENSION input_row, |
|
375 JSAMPARRAY output_buf, int num_rows)); |
|
376 EXTERN(void) jsimd_ycc_extbgrx_convert_neon |
|
377 JPP((JDIMENSION out_width, |
|
378 JSAMPIMAGE input_buf, JDIMENSION input_row, |
|
379 JSAMPARRAY output_buf, int num_rows)); |
|
380 EXTERN(void) jsimd_ycc_extxbgr_convert_neon |
|
381 JPP((JDIMENSION out_width, |
|
382 JSAMPIMAGE input_buf, JDIMENSION input_row, |
|
383 JSAMPARRAY output_buf, int num_rows)); |
|
384 EXTERN(void) jsimd_ycc_extxrgb_convert_neon |
|
385 JPP((JDIMENSION out_width, |
|
386 JSAMPIMAGE input_buf, JDIMENSION input_row, |
|
387 JSAMPARRAY output_buf, int num_rows)); |
|
388 |
|
389 /* SIMD Downsample */ |
|
390 EXTERN(void) jsimd_h2v2_downsample_mmx |
|
391 JPP((JDIMENSION image_width, int max_v_samp_factor, |
|
392 JDIMENSION v_samp_factor, JDIMENSION width_blocks, |
|
393 JSAMPARRAY input_data, JSAMPARRAY output_data)); |
|
394 EXTERN(void) jsimd_h2v1_downsample_mmx |
|
395 JPP((JDIMENSION image_width, int max_v_samp_factor, |
|
396 JDIMENSION v_samp_factor, JDIMENSION width_blocks, |
|
397 JSAMPARRAY input_data, JSAMPARRAY output_data)); |
|
398 |
|
399 EXTERN(void) jsimd_h2v2_downsample_sse2 |
|
400 JPP((JDIMENSION image_width, int max_v_samp_factor, |
|
401 JDIMENSION v_samp_factor, JDIMENSION width_blocks, |
|
402 JSAMPARRAY input_data, JSAMPARRAY output_data)); |
|
403 EXTERN(void) jsimd_h2v1_downsample_sse2 |
|
404 JPP((JDIMENSION image_width, int max_v_samp_factor, |
|
405 JDIMENSION v_samp_factor, JDIMENSION width_blocks, |
|
406 JSAMPARRAY input_data, JSAMPARRAY output_data)); |
|
407 |
|
408 /* SIMD Upsample */ |
|
409 EXTERN(void) jsimd_h2v2_upsample_mmx |
|
410 JPP((int max_v_samp_factor, JDIMENSION output_width, |
|
411 JSAMPARRAY input_data, JSAMPARRAY * output_data_ptr)); |
|
412 EXTERN(void) jsimd_h2v1_upsample_mmx |
|
413 JPP((int max_v_samp_factor, JDIMENSION output_width, |
|
414 JSAMPARRAY input_data, JSAMPARRAY * output_data_ptr)); |
|
415 |
|
416 EXTERN(void) jsimd_h2v2_fancy_upsample_mmx |
|
417 JPP((int max_v_samp_factor, JDIMENSION downsampled_width, |
|
418 JSAMPARRAY input_data, JSAMPARRAY * output_data_ptr)); |
|
419 EXTERN(void) jsimd_h2v1_fancy_upsample_mmx |
|
420 JPP((int max_v_samp_factor, JDIMENSION downsampled_width, |
|
421 JSAMPARRAY input_data, JSAMPARRAY * output_data_ptr)); |
|
422 |
|
423 EXTERN(void) jsimd_h2v2_merged_upsample_mmx |
|
424 JPP((JDIMENSION output_width, JSAMPIMAGE input_buf, |
|
425 JDIMENSION in_row_group_ctr, JSAMPARRAY output_buf)); |
|
426 EXTERN(void) jsimd_h2v2_extrgb_merged_upsample_mmx |
|
427 JPP((JDIMENSION output_width, JSAMPIMAGE input_buf, |
|
428 JDIMENSION in_row_group_ctr, JSAMPARRAY output_buf)); |
|
429 EXTERN(void) jsimd_h2v2_extrgbx_merged_upsample_mmx |
|
430 JPP((JDIMENSION output_width, JSAMPIMAGE input_buf, |
|
431 JDIMENSION in_row_group_ctr, JSAMPARRAY output_buf)); |
|
432 EXTERN(void) jsimd_h2v2_extbgr_merged_upsample_mmx |
|
433 JPP((JDIMENSION output_width, JSAMPIMAGE input_buf, |
|
434 JDIMENSION in_row_group_ctr, JSAMPARRAY output_buf)); |
|
435 EXTERN(void) jsimd_h2v2_extbgrx_merged_upsample_mmx |
|
436 JPP((JDIMENSION output_width, JSAMPIMAGE input_buf, |
|
437 JDIMENSION in_row_group_ctr, JSAMPARRAY output_buf)); |
|
438 EXTERN(void) jsimd_h2v2_extxbgr_merged_upsample_mmx |
|
439 JPP((JDIMENSION output_width, JSAMPIMAGE input_buf, |
|
440 JDIMENSION in_row_group_ctr, JSAMPARRAY output_buf)); |
|
441 EXTERN(void) jsimd_h2v2_extxrgb_merged_upsample_mmx |
|
442 JPP((JDIMENSION output_width, JSAMPIMAGE input_buf, |
|
443 JDIMENSION in_row_group_ctr, JSAMPARRAY output_buf)); |
|
444 EXTERN(void) jsimd_h2v1_merged_upsample_mmx |
|
445 JPP((JDIMENSION output_width, JSAMPIMAGE input_buf, |
|
446 JDIMENSION in_row_group_ctr, JSAMPARRAY output_buf)); |
|
447 EXTERN(void) jsimd_h2v1_extrgb_merged_upsample_mmx |
|
448 JPP((JDIMENSION output_width, JSAMPIMAGE input_buf, |
|
449 JDIMENSION in_row_group_ctr, JSAMPARRAY output_buf)); |
|
450 EXTERN(void) jsimd_h2v1_extrgbx_merged_upsample_mmx |
|
451 JPP((JDIMENSION output_width, JSAMPIMAGE input_buf, |
|
452 JDIMENSION in_row_group_ctr, JSAMPARRAY output_buf)); |
|
453 EXTERN(void) jsimd_h2v1_extbgr_merged_upsample_mmx |
|
454 JPP((JDIMENSION output_width, JSAMPIMAGE input_buf, |
|
455 JDIMENSION in_row_group_ctr, JSAMPARRAY output_buf)); |
|
456 EXTERN(void) jsimd_h2v1_extbgrx_merged_upsample_mmx |
|
457 JPP((JDIMENSION output_width, JSAMPIMAGE input_buf, |
|
458 JDIMENSION in_row_group_ctr, JSAMPARRAY output_buf)); |
|
459 EXTERN(void) jsimd_h2v1_extxbgr_merged_upsample_mmx |
|
460 JPP((JDIMENSION output_width, JSAMPIMAGE input_buf, |
|
461 JDIMENSION in_row_group_ctr, JSAMPARRAY output_buf)); |
|
462 EXTERN(void) jsimd_h2v1_extxrgb_merged_upsample_mmx |
|
463 JPP((JDIMENSION output_width, JSAMPIMAGE input_buf, |
|
464 JDIMENSION in_row_group_ctr, JSAMPARRAY output_buf)); |
|
465 |
|
466 EXTERN(void) jsimd_h2v2_upsample_sse2 |
|
467 JPP((int max_v_samp_factor, JDIMENSION output_width, |
|
468 JSAMPARRAY input_data, JSAMPARRAY * output_data_ptr)); |
|
469 EXTERN(void) jsimd_h2v1_upsample_sse2 |
|
470 JPP((int max_v_samp_factor, JDIMENSION output_width, |
|
471 JSAMPARRAY input_data, JSAMPARRAY * output_data_ptr)); |
|
472 |
|
473 extern const int jconst_fancy_upsample_sse2[]; |
|
474 EXTERN(void) jsimd_h2v2_fancy_upsample_sse2 |
|
475 JPP((int max_v_samp_factor, JDIMENSION downsampled_width, |
|
476 JSAMPARRAY input_data, JSAMPARRAY * output_data_ptr)); |
|
477 EXTERN(void) jsimd_h2v1_fancy_upsample_sse2 |
|
478 JPP((int max_v_samp_factor, JDIMENSION downsampled_width, |
|
479 JSAMPARRAY input_data, JSAMPARRAY * output_data_ptr)); |
|
480 |
|
481 extern const int jconst_merged_upsample_sse2[]; |
|
482 EXTERN(void) jsimd_h2v2_merged_upsample_sse2 |
|
483 JPP((JDIMENSION output_width, JSAMPIMAGE input_buf, |
|
484 JDIMENSION in_row_group_ctr, JSAMPARRAY output_buf)); |
|
485 EXTERN(void) jsimd_h2v2_extrgb_merged_upsample_sse2 |
|
486 JPP((JDIMENSION output_width, JSAMPIMAGE input_buf, |
|
487 JDIMENSION in_row_group_ctr, JSAMPARRAY output_buf)); |
|
488 EXTERN(void) jsimd_h2v2_extrgbx_merged_upsample_sse2 |
|
489 JPP((JDIMENSION output_width, JSAMPIMAGE input_buf, |
|
490 JDIMENSION in_row_group_ctr, JSAMPARRAY output_buf)); |
|
491 EXTERN(void) jsimd_h2v2_extbgr_merged_upsample_sse2 |
|
492 JPP((JDIMENSION output_width, JSAMPIMAGE input_buf, |
|
493 JDIMENSION in_row_group_ctr, JSAMPARRAY output_buf)); |
|
494 EXTERN(void) jsimd_h2v2_extbgrx_merged_upsample_sse2 |
|
495 JPP((JDIMENSION output_width, JSAMPIMAGE input_buf, |
|
496 JDIMENSION in_row_group_ctr, JSAMPARRAY output_buf)); |
|
497 EXTERN(void) jsimd_h2v2_extxbgr_merged_upsample_sse2 |
|
498 JPP((JDIMENSION output_width, JSAMPIMAGE input_buf, |
|
499 JDIMENSION in_row_group_ctr, JSAMPARRAY output_buf)); |
|
500 EXTERN(void) jsimd_h2v2_extxrgb_merged_upsample_sse2 |
|
501 JPP((JDIMENSION output_width, JSAMPIMAGE input_buf, |
|
502 JDIMENSION in_row_group_ctr, JSAMPARRAY output_buf)); |
|
503 EXTERN(void) jsimd_h2v1_merged_upsample_sse2 |
|
504 JPP((JDIMENSION output_width, JSAMPIMAGE input_buf, |
|
505 JDIMENSION in_row_group_ctr, JSAMPARRAY output_buf)); |
|
506 EXTERN(void) jsimd_h2v1_extrgb_merged_upsample_sse2 |
|
507 JPP((JDIMENSION output_width, JSAMPIMAGE input_buf, |
|
508 JDIMENSION in_row_group_ctr, JSAMPARRAY output_buf)); |
|
509 EXTERN(void) jsimd_h2v1_extrgbx_merged_upsample_sse2 |
|
510 JPP((JDIMENSION output_width, JSAMPIMAGE input_buf, |
|
511 JDIMENSION in_row_group_ctr, JSAMPARRAY output_buf)); |
|
512 EXTERN(void) jsimd_h2v1_extbgr_merged_upsample_sse2 |
|
513 JPP((JDIMENSION output_width, JSAMPIMAGE input_buf, |
|
514 JDIMENSION in_row_group_ctr, JSAMPARRAY output_buf)); |
|
515 EXTERN(void) jsimd_h2v1_extbgrx_merged_upsample_sse2 |
|
516 JPP((JDIMENSION output_width, JSAMPIMAGE input_buf, |
|
517 JDIMENSION in_row_group_ctr, JSAMPARRAY output_buf)); |
|
518 EXTERN(void) jsimd_h2v1_extxbgr_merged_upsample_sse2 |
|
519 JPP((JDIMENSION output_width, JSAMPIMAGE input_buf, |
|
520 JDIMENSION in_row_group_ctr, JSAMPARRAY output_buf)); |
|
521 EXTERN(void) jsimd_h2v1_extxrgb_merged_upsample_sse2 |
|
522 JPP((JDIMENSION output_width, JSAMPIMAGE input_buf, |
|
523 JDIMENSION in_row_group_ctr, JSAMPARRAY output_buf)); |
|
524 |
|
525 EXTERN(void) jsimd_h2v1_fancy_upsample_neon |
|
526 JPP((int max_v_samp_factor, JDIMENSION downsampled_width, |
|
527 JSAMPARRAY input_data, JSAMPARRAY * output_data_ptr)); |
|
528 |
|
529 /* SIMD Sample Conversion */ |
|
530 EXTERN(void) jsimd_convsamp_mmx JPP((JSAMPARRAY sample_data, |
|
531 JDIMENSION start_col, |
|
532 DCTELEM * workspace)); |
|
533 |
|
534 EXTERN(void) jsimd_convsamp_sse2 JPP((JSAMPARRAY sample_data, |
|
535 JDIMENSION start_col, |
|
536 DCTELEM * workspace)); |
|
537 |
|
538 EXTERN(void) jsimd_convsamp_neon JPP((JSAMPARRAY sample_data, |
|
539 JDIMENSION start_col, |
|
540 DCTELEM * workspace)); |
|
541 |
|
542 EXTERN(void) jsimd_convsamp_float_3dnow JPP((JSAMPARRAY sample_data, |
|
543 JDIMENSION start_col, |
|
544 FAST_FLOAT * workspace)); |
|
545 |
|
546 EXTERN(void) jsimd_convsamp_float_sse JPP((JSAMPARRAY sample_data, |
|
547 JDIMENSION start_col, |
|
548 FAST_FLOAT * workspace)); |
|
549 |
|
550 EXTERN(void) jsimd_convsamp_float_sse2 JPP((JSAMPARRAY sample_data, |
|
551 JDIMENSION start_col, |
|
552 FAST_FLOAT * workspace)); |
|
553 |
|
554 /* SIMD Forward DCT */ |
|
555 EXTERN(void) jsimd_fdct_islow_mmx JPP((DCTELEM * data)); |
|
556 EXTERN(void) jsimd_fdct_ifast_mmx JPP((DCTELEM * data)); |
|
557 |
|
558 extern const int jconst_fdct_ifast_sse2[]; |
|
559 EXTERN(void) jsimd_fdct_islow_sse2 JPP((DCTELEM * data)); |
|
560 extern const int jconst_fdct_islow_sse2[]; |
|
561 EXTERN(void) jsimd_fdct_ifast_sse2 JPP((DCTELEM * data)); |
|
562 |
|
563 EXTERN(void) jsimd_fdct_ifast_neon JPP((DCTELEM * data)); |
|
564 |
|
565 EXTERN(void) jsimd_fdct_float_3dnow JPP((FAST_FLOAT * data)); |
|
566 |
|
567 extern const int jconst_fdct_float_sse[]; |
|
568 EXTERN(void) jsimd_fdct_float_sse JPP((FAST_FLOAT * data)); |
|
569 |
|
570 /* SIMD Quantization */ |
|
571 EXTERN(void) jsimd_quantize_mmx JPP((JCOEFPTR coef_block, |
|
572 DCTELEM * divisors, |
|
573 DCTELEM * workspace)); |
|
574 |
|
575 EXTERN(void) jsimd_quantize_sse2 JPP((JCOEFPTR coef_block, |
|
576 DCTELEM * divisors, |
|
577 DCTELEM * workspace)); |
|
578 |
|
579 EXTERN(void) jsimd_quantize_neon JPP((JCOEFPTR coef_block, |
|
580 DCTELEM * divisors, |
|
581 DCTELEM * workspace)); |
|
582 |
|
583 EXTERN(void) jsimd_quantize_float_3dnow JPP((JCOEFPTR coef_block, |
|
584 FAST_FLOAT * divisors, |
|
585 FAST_FLOAT * workspace)); |
|
586 |
|
587 EXTERN(void) jsimd_quantize_float_sse JPP((JCOEFPTR coef_block, |
|
588 FAST_FLOAT * divisors, |
|
589 FAST_FLOAT * workspace)); |
|
590 |
|
591 EXTERN(void) jsimd_quantize_float_sse2 JPP((JCOEFPTR coef_block, |
|
592 FAST_FLOAT * divisors, |
|
593 FAST_FLOAT * workspace)); |
|
594 |
|
595 /* SIMD Reduced Inverse DCT */ |
|
596 EXTERN(void) jsimd_idct_2x2_mmx JPP((void * dct_table, |
|
597 JCOEFPTR coef_block, |
|
598 JSAMPARRAY output_buf, |
|
599 JDIMENSION output_col)); |
|
600 EXTERN(void) jsimd_idct_4x4_mmx JPP((void * dct_table, |
|
601 JCOEFPTR coef_block, |
|
602 JSAMPARRAY output_buf, |
|
603 JDIMENSION output_col)); |
|
604 |
|
605 extern const int jconst_idct_red_sse2[]; |
|
606 EXTERN(void) jsimd_idct_2x2_sse2 JPP((void * dct_table, |
|
607 JCOEFPTR coef_block, |
|
608 JSAMPARRAY output_buf, |
|
609 JDIMENSION output_col)); |
|
610 EXTERN(void) jsimd_idct_4x4_sse2 JPP((void * dct_table, |
|
611 JCOEFPTR coef_block, |
|
612 JSAMPARRAY output_buf, |
|
613 JDIMENSION output_col)); |
|
614 |
|
615 EXTERN(void) jsimd_idct_2x2_neon JPP((void * dct_table, |
|
616 JCOEFPTR coef_block, |
|
617 JSAMPARRAY output_buf, |
|
618 JDIMENSION output_col)); |
|
619 EXTERN(void) jsimd_idct_4x4_neon JPP((void * dct_table, |
|
620 JCOEFPTR coef_block, |
|
621 JSAMPARRAY output_buf, |
|
622 JDIMENSION output_col)); |
|
623 |
|
624 /* SIMD Inverse DCT */ |
|
625 EXTERN(void) jsimd_idct_islow_mmx JPP((void * dct_table, |
|
626 JCOEFPTR coef_block, |
|
627 JSAMPARRAY output_buf, |
|
628 JDIMENSION output_col)); |
|
629 EXTERN(void) jsimd_idct_ifast_mmx JPP((void * dct_table, |
|
630 JCOEFPTR coef_block, |
|
631 JSAMPARRAY output_buf, |
|
632 JDIMENSION output_col)); |
|
633 |
|
634 extern const int jconst_idct_islow_sse2[]; |
|
635 EXTERN(void) jsimd_idct_islow_sse2 JPP((void * dct_table, |
|
636 JCOEFPTR coef_block, |
|
637 JSAMPARRAY output_buf, |
|
638 JDIMENSION output_col)); |
|
639 extern const int jconst_idct_ifast_sse2[]; |
|
640 EXTERN(void) jsimd_idct_ifast_sse2 JPP((void * dct_table, |
|
641 JCOEFPTR coef_block, |
|
642 JSAMPARRAY output_buf, |
|
643 JDIMENSION output_col)); |
|
644 |
|
645 EXTERN(void) jsimd_idct_islow_neon JPP((void * dct_table, |
|
646 JCOEFPTR coef_block, |
|
647 JSAMPARRAY output_buf, |
|
648 JDIMENSION output_col)); |
|
649 EXTERN(void) jsimd_idct_ifast_neon JPP((void * dct_table, |
|
650 JCOEFPTR coef_block, |
|
651 JSAMPARRAY output_buf, |
|
652 JDIMENSION output_col)); |
|
653 |
|
654 EXTERN(void) jsimd_idct_float_3dnow JPP((void * dct_table, |
|
655 JCOEFPTR coef_block, |
|
656 JSAMPARRAY output_buf, |
|
657 JDIMENSION output_col)); |
|
658 |
|
659 extern const int jconst_idct_float_sse[]; |
|
660 EXTERN(void) jsimd_idct_float_sse JPP((void * dct_table, |
|
661 JCOEFPTR coef_block, |
|
662 JSAMPARRAY output_buf, |
|
663 JDIMENSION output_col)); |
|
664 |
|
665 extern const int jconst_idct_float_sse2[]; |
|
666 EXTERN(void) jsimd_idct_float_sse2 JPP((void * dct_table, |
|
667 JCOEFPTR coef_block, |
|
668 JSAMPARRAY output_buf, |
|
669 JDIMENSION output_col)); |
|
670 |