michael@0: /* michael@0: * simd/jsimd.h michael@0: * michael@0: * Copyright 2009 Pierre Ossman for Cendio AB michael@0: * Copyright 2011 D. R. Commander michael@0: * michael@0: * Based on the x86 SIMD extension for IJG JPEG library, michael@0: * Copyright (C) 1999-2006, MIYASAKA Masaru. michael@0: * For conditions of distribution and use, see copyright notice in jsimdext.inc michael@0: * michael@0: */ michael@0: michael@0: /* Bitmask for supported acceleration methods */ michael@0: michael@0: #define JSIMD_NONE 0x00 michael@0: #define JSIMD_MMX 0x01 michael@0: #define JSIMD_3DNOW 0x02 michael@0: #define JSIMD_SSE 0x04 michael@0: #define JSIMD_SSE2 0x08 michael@0: #define JSIMD_ARM_NEON 0x10 michael@0: michael@0: /* Short forms of external names for systems with brain-damaged linkers. */ michael@0: michael@0: #ifdef NEED_SHORT_EXTERNAL_NAMES michael@0: #define jpeg_simd_cpu_support jSiCpuSupport michael@0: #define jsimd_rgb_ycc_convert_mmx jSRGBYCCM michael@0: #define jsimd_extrgb_ycc_convert_mmx jSEXTRGBYCCM michael@0: #define jsimd_extrgbx_ycc_convert_mmx jSEXTRGBXYCCM michael@0: #define jsimd_extbgr_ycc_convert_mmx jSEXTBGRYCCM michael@0: #define jsimd_extbgrx_ycc_convert_mmx jSEXTBGRXYCCM michael@0: #define jsimd_extxbgr_ycc_convert_mmx jSEXTXBGRYCCM michael@0: #define jsimd_extxrgb_ycc_convert_mmx jSEXTXRGBYCCM michael@0: #define jsimd_rgb_gray_convert_mmx jSRGBGRYM michael@0: #define jsimd_extrgb_gray_convert_mmx jSEXTRGBGRYM michael@0: #define jsimd_extrgbx_gray_convert_mmx jSEXTRGBXGRYM michael@0: #define jsimd_extbgr_gray_convert_mmx jSEXTBGRGRYM michael@0: #define jsimd_extbgrx_gray_convert_mmx jSEXTBGRXGRYM michael@0: #define jsimd_extxbgr_gray_convert_mmx jSEXTXBGRGRYM michael@0: #define jsimd_extxrgb_gray_convert_mmx jSEXTXRGBGRYM michael@0: #define jsimd_ycc_rgb_convert_mmx jSYCCRGBM michael@0: #define jsimd_ycc_extrgb_convert_mmx jSYCCEXTRGBM michael@0: #define jsimd_ycc_extrgbx_convert_mmx jSYCCEXTRGBXM michael@0: #define jsimd_ycc_extbgr_convert_mmx jSYCCEXTBGRM michael@0: #define jsimd_ycc_extbgrx_convert_mmx jSYCCEXTBGRXM michael@0: #define jsimd_ycc_extxbgr_convert_mmx jSYCCEXTXBGRM michael@0: #define jsimd_ycc_extxrgb_convert_mmx jSYCCEXTXRGBM michael@0: #define jconst_rgb_ycc_convert_sse2 jSCRGBYCCS2 michael@0: #define jsimd_rgb_ycc_convert_sse2 jSRGBYCCS2 michael@0: #define jsimd_extrgb_ycc_convert_sse2 jSEXTRGBYCCS2 michael@0: #define jsimd_extrgbx_ycc_convert_sse2 jSEXTRGBXYCCS2 michael@0: #define jsimd_extbgr_ycc_convert_sse2 jSEXTBGRYCCS2 michael@0: #define jsimd_extbgrx_ycc_convert_sse2 jSEXTBGRXYCCS2 michael@0: #define jsimd_extxbgr_ycc_convert_sse2 jSEXTXBGRYCCS2 michael@0: #define jsimd_extxrgb_ycc_convert_sse2 jSEXTXRGBYCCS2 michael@0: #define jconst_rgb_gray_convert_sse2 jSCRGBGRYS2 michael@0: #define jsimd_rgb_gray_convert_sse2 jSRGBGRYS2 michael@0: #define jsimd_extrgb_gray_convert_sse2 jSEXTRGBGRYS2 michael@0: #define jsimd_extrgbx_gray_convert_sse2 jSEXTRGBXGRYS2 michael@0: #define jsimd_extbgr_gray_convert_sse2 jSEXTBGRGRYS2 michael@0: #define jsimd_extbgrx_gray_convert_sse2 jSEXTBGRXGRYS2 michael@0: #define jsimd_extxbgr_gray_convert_sse2 jSEXTXBGRGRYS2 michael@0: #define jsimd_extxrgb_gray_convert_sse2 jSEXTXRGBGRYS2 michael@0: #define jconst_ycc_rgb_convert_sse2 jSCYCCRGBS2 michael@0: #define jsimd_ycc_rgb_convert_sse2 jSYCCRGBS2 michael@0: #define jsimd_ycc_extrgb_convert_sse2 jSYCCEXTRGBS2 michael@0: #define jsimd_ycc_extrgbx_convert_sse2 jSYCCEXTRGBXS2 michael@0: #define jsimd_ycc_extbgr_convert_sse2 jSYCCEXTBGRS2 michael@0: #define jsimd_ycc_extbgrx_convert_sse2 jSYCCEXTBGRXS2 michael@0: #define jsimd_ycc_extxbgr_convert_sse2 jSYCCEXTXBGRS2 michael@0: #define jsimd_ycc_extxrgb_convert_sse2 jSYCCEXTXRGBS2 michael@0: #define jsimd_h2v2_downsample_mmx jSDnH2V2M michael@0: #define jsimd_h2v1_downsample_mmx jSDnH2V1M michael@0: #define jsimd_h2v2_downsample_sse2 jSDnH2V2S2 michael@0: #define jsimd_h2v1_downsample_sse2 jSDnH2V1S2 michael@0: #define jsimd_h2v2_upsample_mmx jSUpH2V2M michael@0: #define jsimd_h2v1_upsample_mmx jSUpH2V1M michael@0: #define jsimd_h2v2_fancy_upsample_mmx jSFUpH2V2M michael@0: #define jsimd_h2v1_fancy_upsample_mmx jSFUpH2V1M michael@0: #define jsimd_h2v2_merged_upsample_mmx jSMUpH2V2M michael@0: #define jsimd_h2v2_extrgb_merged_upsample_mmx jSMUpH2V2EXTRGBM michael@0: #define jsimd_h2v2_extrgbx_merged_upsample_mmx jSMUpH2V2EXTRGBXM michael@0: #define jsimd_h2v2_extbgr_merged_upsample_mmx jSMUpH2V2EXTBGRM michael@0: #define jsimd_h2v2_extbgrx_merged_upsample_mmx jSMUpH2V2EXTBGRXM michael@0: #define jsimd_h2v2_extxbgr_merged_upsample_mmx jSMUpH2V2EXTXBGRM michael@0: #define jsimd_h2v2_extxrgb_merged_upsample_mmx jSMUpH2V2EXTXRGBM michael@0: #define jsimd_h2v1_merged_upsample_mmx jSMUpH2V1M michael@0: #define jsimd_h2v1_extrgb_merged_upsample_mmx jSMUpH2V1EXTRGBM michael@0: #define jsimd_h2v1_extrgbx_merged_upsample_mmx jSMUpH2V1EXTRGBXM michael@0: #define jsimd_h2v1_extbgr_merged_upsample_mmx jSMUpH2V1EXTBGRM michael@0: #define jsimd_h2v1_extbgrx_merged_upsample_mmx jSMUpH2V1EXTBGRXM michael@0: #define jsimd_h2v1_extxbgr_merged_upsample_mmx jSMUpH2V1EXTXBGRM michael@0: #define jsimd_h2v1_extxrgb_merged_upsample_mmx jSMUpH2V1EXTXRGBM michael@0: #define jsimd_h2v2_upsample_sse2 jSUpH2V2S2 michael@0: #define jsimd_h2v1_upsample_sse2 jSUpH2V1S2 michael@0: #define jconst_fancy_upsample_sse2 jSCFUpS2 michael@0: #define jsimd_h2v2_fancy_upsample_sse2 jSFUpH2V2S2 michael@0: #define jsimd_h2v1_fancy_upsample_sse2 jSFUpH2V1S2 michael@0: #define jconst_merged_upsample_sse2 jSCMUpS2 michael@0: #define jsimd_h2v2_merged_upsample_sse2 jSMUpH2V2S2 michael@0: #define jsimd_h2v2_extrgb_merged_upsample_sse2 jSMUpH2V2EXTRGBS2 michael@0: #define jsimd_h2v2_extrgbx_merged_upsample_sse2 jSMUpH2V2EXTRGBXS2 michael@0: #define jsimd_h2v2_extbgr_merged_upsample_sse2 jSMUpH2V2EXTBGRS2 michael@0: #define jsimd_h2v2_extbgrx_merged_upsample_sse2 jSMUpH2V2EXTBGRXS2 michael@0: #define jsimd_h2v2_extxbgr_merged_upsample_sse2 jSMUpH2V2EXTXBGRS2 michael@0: #define jsimd_h2v2_extxrgb_merged_upsample_sse2 jSMUpH2V2EXTXRGBS2 michael@0: #define jsimd_h2v1_merged_upsample_sse2 jSMUpH2V1S2 michael@0: #define jsimd_h2v1_extrgb_merged_upsample_sse2 jSMUpH2V1EXTRGBS2 michael@0: #define jsimd_h2v1_extrgbx_merged_upsample_sse2 jSMUpH2V1EXTRGBXS2 michael@0: #define jsimd_h2v1_extbgr_merged_upsample_sse2 jSMUpH2V1EXTBGRS2 michael@0: #define jsimd_h2v1_extbgrx_merged_upsample_sse2 jSMUpH2V1EXTBGRXS2 michael@0: #define jsimd_h2v1_extxbgr_merged_upsample_sse2 jSMUpH2V1EXTXBGRS2 michael@0: #define jsimd_h2v1_extxrgb_merged_upsample_sse2 jSMUpH2V1EXTXRGBS2 michael@0: #define jsimd_convsamp_mmx jSConvM michael@0: #define jsimd_convsamp_sse2 jSConvS2 michael@0: #define jsimd_convsamp_float_3dnow jSConvF3D michael@0: #define jsimd_convsamp_float_sse jSConvFS michael@0: #define jsimd_convsamp_float_sse2 jSConvFS2 michael@0: #define jsimd_fdct_islow_mmx jSFDMIS michael@0: #define jsimd_fdct_ifast_mmx jSFDMIF michael@0: #define jconst_fdct_islow_sse2 jSCFDS2IS michael@0: #define jsimd_fdct_islow_sse2 jSFDS2IS michael@0: #define jconst_fdct_ifast_sse2 jSCFDS2IF michael@0: #define jsimd_fdct_ifast_sse2 jSFDS2IF michael@0: #define jsimd_fdct_float_3dnow jSFD3DF michael@0: #define jconst_fdct_float_sse jSCFDSF michael@0: #define jsimd_fdct_float_sse jSFDSF michael@0: #define jsimd_quantize_mmx jSQuantM michael@0: #define jsimd_quantize_sse2 jSQuantS2 michael@0: #define jsimd_quantize_float_3dnow jSQuantF3D michael@0: #define jsimd_quantize_float_sse jSQuantFS michael@0: #define jsimd_quantize_float_sse2 jSQuantFS2 michael@0: #define jsimd_idct_2x2_mmx jSIDM22 michael@0: #define jsimd_idct_4x4_mmx jSIDM44 michael@0: #define jconst_idct_red_sse2 jSCIDS2R michael@0: #define jsimd_idct_2x2_sse2 jSIDS222 michael@0: #define jsimd_idct_4x4_sse2 jSIDS244 michael@0: #define jsimd_idct_islow_mmx jSIDMIS michael@0: #define jsimd_idct_ifast_mmx jSIDMIF michael@0: #define jconst_idct_islow_sse2 jSCIDS2IS michael@0: #define jsimd_idct_islow_sse2 jSIDS2IS michael@0: #define jconst_idct_ifast_sse2 jSCIDS2IF michael@0: #define jsimd_idct_ifast_sse2 jSIDS2IF michael@0: #define jsimd_idct_float_3dnow jSID3DF michael@0: #define jconst_fdct_float_sse jSCIDSF michael@0: #define jsimd_idct_float_sse jSIDSF michael@0: #define jconst_fdct_float_sse2 jSCIDS2F michael@0: #define jsimd_idct_float_sse2 jSIDS2F michael@0: #endif /* NEED_SHORT_EXTERNAL_NAMES */ michael@0: michael@0: /* SIMD Ext: retrieve SIMD/CPU information */ michael@0: EXTERN(unsigned int) jpeg_simd_cpu_support JPP((void)); michael@0: michael@0: /* SIMD Color Space Conversion */ michael@0: EXTERN(void) jsimd_rgb_ycc_convert_mmx michael@0: JPP((JDIMENSION img_width, michael@0: JSAMPARRAY input_buf, JSAMPIMAGE output_buf, michael@0: JDIMENSION output_row, int num_rows)); michael@0: EXTERN(void) jsimd_extrgb_ycc_convert_mmx michael@0: JPP((JDIMENSION img_width, michael@0: JSAMPARRAY input_buf, JSAMPIMAGE output_buf, michael@0: JDIMENSION output_row, int num_rows)); michael@0: EXTERN(void) jsimd_extrgbx_ycc_convert_mmx michael@0: JPP((JDIMENSION img_width, michael@0: JSAMPARRAY input_buf, JSAMPIMAGE output_buf, michael@0: JDIMENSION output_row, int num_rows)); michael@0: EXTERN(void) jsimd_extbgr_ycc_convert_mmx michael@0: JPP((JDIMENSION img_width, michael@0: JSAMPARRAY input_buf, JSAMPIMAGE output_buf, michael@0: JDIMENSION output_row, int num_rows)); michael@0: EXTERN(void) jsimd_extbgrx_ycc_convert_mmx michael@0: JPP((JDIMENSION img_width, michael@0: JSAMPARRAY input_buf, JSAMPIMAGE output_buf, michael@0: JDIMENSION output_row, int num_rows)); michael@0: EXTERN(void) jsimd_extxbgr_ycc_convert_mmx michael@0: JPP((JDIMENSION img_width, michael@0: JSAMPARRAY input_buf, JSAMPIMAGE output_buf, michael@0: JDIMENSION output_row, int num_rows)); michael@0: EXTERN(void) jsimd_extxrgb_ycc_convert_mmx michael@0: JPP((JDIMENSION img_width, michael@0: JSAMPARRAY input_buf, JSAMPIMAGE output_buf, michael@0: JDIMENSION output_row, int num_rows)); michael@0: michael@0: EXTERN(void) jsimd_rgb_gray_convert_mmx michael@0: JPP((JDIMENSION img_width, michael@0: JSAMPARRAY input_buf, JSAMPIMAGE output_buf, michael@0: JDIMENSION output_row, int num_rows)); michael@0: EXTERN(void) jsimd_extrgb_gray_convert_mmx michael@0: JPP((JDIMENSION img_width, michael@0: JSAMPARRAY input_buf, JSAMPIMAGE output_buf, michael@0: JDIMENSION output_row, int num_rows)); michael@0: EXTERN(void) jsimd_extrgbx_gray_convert_mmx michael@0: JPP((JDIMENSION img_width, michael@0: JSAMPARRAY input_buf, JSAMPIMAGE output_buf, michael@0: JDIMENSION output_row, int num_rows)); michael@0: EXTERN(void) jsimd_extbgr_gray_convert_mmx michael@0: JPP((JDIMENSION img_width, michael@0: JSAMPARRAY input_buf, JSAMPIMAGE output_buf, michael@0: JDIMENSION output_row, int num_rows)); michael@0: EXTERN(void) jsimd_extbgrx_gray_convert_mmx michael@0: JPP((JDIMENSION img_width, michael@0: JSAMPARRAY input_buf, JSAMPIMAGE output_buf, michael@0: JDIMENSION output_row, int num_rows)); michael@0: EXTERN(void) jsimd_extxbgr_gray_convert_mmx michael@0: JPP((JDIMENSION img_width, michael@0: JSAMPARRAY input_buf, JSAMPIMAGE output_buf, michael@0: JDIMENSION output_row, int num_rows)); michael@0: EXTERN(void) jsimd_extxrgb_gray_convert_mmx michael@0: JPP((JDIMENSION img_width, michael@0: JSAMPARRAY input_buf, JSAMPIMAGE output_buf, michael@0: JDIMENSION output_row, int num_rows)); michael@0: michael@0: EXTERN(void) jsimd_ycc_rgb_convert_mmx michael@0: JPP((JDIMENSION out_width, michael@0: JSAMPIMAGE input_buf, JDIMENSION input_row, michael@0: JSAMPARRAY output_buf, int num_rows)); michael@0: EXTERN(void) jsimd_ycc_extrgb_convert_mmx michael@0: JPP((JDIMENSION out_width, michael@0: JSAMPIMAGE input_buf, JDIMENSION input_row, michael@0: JSAMPARRAY output_buf, int num_rows)); michael@0: EXTERN(void) jsimd_ycc_extrgbx_convert_mmx michael@0: JPP((JDIMENSION out_width, michael@0: JSAMPIMAGE input_buf, JDIMENSION input_row, michael@0: JSAMPARRAY output_buf, int num_rows)); michael@0: EXTERN(void) jsimd_ycc_extbgr_convert_mmx michael@0: JPP((JDIMENSION out_width, michael@0: JSAMPIMAGE input_buf, JDIMENSION input_row, michael@0: JSAMPARRAY output_buf, int num_rows)); michael@0: EXTERN(void) jsimd_ycc_extbgrx_convert_mmx michael@0: JPP((JDIMENSION out_width, michael@0: JSAMPIMAGE input_buf, JDIMENSION input_row, michael@0: JSAMPARRAY output_buf, int num_rows)); michael@0: EXTERN(void) jsimd_ycc_extxbgr_convert_mmx michael@0: JPP((JDIMENSION out_width, michael@0: JSAMPIMAGE input_buf, JDIMENSION input_row, michael@0: JSAMPARRAY output_buf, int num_rows)); michael@0: EXTERN(void) jsimd_ycc_extxrgb_convert_mmx michael@0: JPP((JDIMENSION out_width, michael@0: JSAMPIMAGE input_buf, JDIMENSION input_row, michael@0: JSAMPARRAY output_buf, int num_rows)); michael@0: michael@0: extern const int jconst_rgb_ycc_convert_sse2[]; michael@0: EXTERN(void) jsimd_rgb_ycc_convert_sse2 michael@0: JPP((JDIMENSION img_width, michael@0: JSAMPARRAY input_buf, JSAMPIMAGE output_buf, michael@0: JDIMENSION output_row, int num_rows)); michael@0: EXTERN(void) jsimd_extrgb_ycc_convert_sse2 michael@0: JPP((JDIMENSION img_width, michael@0: JSAMPARRAY input_buf, JSAMPIMAGE output_buf, michael@0: JDIMENSION output_row, int num_rows)); michael@0: EXTERN(void) jsimd_extrgbx_ycc_convert_sse2 michael@0: JPP((JDIMENSION img_width, michael@0: JSAMPARRAY input_buf, JSAMPIMAGE output_buf, michael@0: JDIMENSION output_row, int num_rows)); michael@0: EXTERN(void) jsimd_extbgr_ycc_convert_sse2 michael@0: JPP((JDIMENSION img_width, michael@0: JSAMPARRAY input_buf, JSAMPIMAGE output_buf, michael@0: JDIMENSION output_row, int num_rows)); michael@0: EXTERN(void) jsimd_extbgrx_ycc_convert_sse2 michael@0: JPP((JDIMENSION img_width, michael@0: JSAMPARRAY input_buf, JSAMPIMAGE output_buf, michael@0: JDIMENSION output_row, int num_rows)); michael@0: EXTERN(void) jsimd_extxbgr_ycc_convert_sse2 michael@0: JPP((JDIMENSION img_width, michael@0: JSAMPARRAY input_buf, JSAMPIMAGE output_buf, michael@0: JDIMENSION output_row, int num_rows)); michael@0: EXTERN(void) jsimd_extxrgb_ycc_convert_sse2 michael@0: JPP((JDIMENSION img_width, michael@0: JSAMPARRAY input_buf, JSAMPIMAGE output_buf, michael@0: JDIMENSION output_row, int num_rows)); michael@0: michael@0: extern const int jconst_rgb_gray_convert_sse2[]; michael@0: EXTERN(void) jsimd_rgb_gray_convert_sse2 michael@0: JPP((JDIMENSION img_width, michael@0: JSAMPARRAY input_buf, JSAMPIMAGE output_buf, michael@0: JDIMENSION output_row, int num_rows)); michael@0: EXTERN(void) jsimd_extrgb_gray_convert_sse2 michael@0: JPP((JDIMENSION img_width, michael@0: JSAMPARRAY input_buf, JSAMPIMAGE output_buf, michael@0: JDIMENSION output_row, int num_rows)); michael@0: EXTERN(void) jsimd_extrgbx_gray_convert_sse2 michael@0: JPP((JDIMENSION img_width, michael@0: JSAMPARRAY input_buf, JSAMPIMAGE output_buf, michael@0: JDIMENSION output_row, int num_rows)); michael@0: EXTERN(void) jsimd_extbgr_gray_convert_sse2 michael@0: JPP((JDIMENSION img_width, michael@0: JSAMPARRAY input_buf, JSAMPIMAGE output_buf, michael@0: JDIMENSION output_row, int num_rows)); michael@0: EXTERN(void) jsimd_extbgrx_gray_convert_sse2 michael@0: JPP((JDIMENSION img_width, michael@0: JSAMPARRAY input_buf, JSAMPIMAGE output_buf, michael@0: JDIMENSION output_row, int num_rows)); michael@0: EXTERN(void) jsimd_extxbgr_gray_convert_sse2 michael@0: JPP((JDIMENSION img_width, michael@0: JSAMPARRAY input_buf, JSAMPIMAGE output_buf, michael@0: JDIMENSION output_row, int num_rows)); michael@0: EXTERN(void) jsimd_extxrgb_gray_convert_sse2 michael@0: JPP((JDIMENSION img_width, michael@0: JSAMPARRAY input_buf, JSAMPIMAGE output_buf, michael@0: JDIMENSION output_row, int num_rows)); michael@0: michael@0: extern const int jconst_ycc_rgb_convert_sse2[]; michael@0: EXTERN(void) jsimd_ycc_rgb_convert_sse2 michael@0: JPP((JDIMENSION out_width, michael@0: JSAMPIMAGE input_buf, JDIMENSION input_row, michael@0: JSAMPARRAY output_buf, int num_rows)); michael@0: EXTERN(void) jsimd_ycc_extrgb_convert_sse2 michael@0: JPP((JDIMENSION out_width, michael@0: JSAMPIMAGE input_buf, JDIMENSION input_row, michael@0: JSAMPARRAY output_buf, int num_rows)); michael@0: EXTERN(void) jsimd_ycc_extrgbx_convert_sse2 michael@0: JPP((JDIMENSION out_width, michael@0: JSAMPIMAGE input_buf, JDIMENSION input_row, michael@0: JSAMPARRAY output_buf, int num_rows)); michael@0: EXTERN(void) jsimd_ycc_extbgr_convert_sse2 michael@0: JPP((JDIMENSION out_width, michael@0: JSAMPIMAGE input_buf, JDIMENSION input_row, michael@0: JSAMPARRAY output_buf, int num_rows)); michael@0: EXTERN(void) jsimd_ycc_extbgrx_convert_sse2 michael@0: JPP((JDIMENSION out_width, michael@0: JSAMPIMAGE input_buf, JDIMENSION input_row, michael@0: JSAMPARRAY output_buf, int num_rows)); michael@0: EXTERN(void) jsimd_ycc_extxbgr_convert_sse2 michael@0: JPP((JDIMENSION out_width, michael@0: JSAMPIMAGE input_buf, JDIMENSION input_row, michael@0: JSAMPARRAY output_buf, int num_rows)); michael@0: EXTERN(void) jsimd_ycc_extxrgb_convert_sse2 michael@0: JPP((JDIMENSION out_width, michael@0: JSAMPIMAGE input_buf, JDIMENSION input_row, michael@0: JSAMPARRAY output_buf, int num_rows)); michael@0: michael@0: EXTERN(void) jsimd_rgb_ycc_convert_neon michael@0: JPP((JDIMENSION img_width, michael@0: JSAMPARRAY input_buf, JSAMPIMAGE output_buf, michael@0: JDIMENSION output_row, int num_rows)); michael@0: EXTERN(void) jsimd_extrgb_ycc_convert_neon michael@0: JPP((JDIMENSION img_width, michael@0: JSAMPARRAY input_buf, JSAMPIMAGE output_buf, michael@0: JDIMENSION output_row, int num_rows)); michael@0: EXTERN(void) jsimd_extrgbx_ycc_convert_neon michael@0: JPP((JDIMENSION img_width, michael@0: JSAMPARRAY input_buf, JSAMPIMAGE output_buf, michael@0: JDIMENSION output_row, int num_rows)); michael@0: EXTERN(void) jsimd_extbgr_ycc_convert_neon michael@0: JPP((JDIMENSION img_width, michael@0: JSAMPARRAY input_buf, JSAMPIMAGE output_buf, michael@0: JDIMENSION output_row, int num_rows)); michael@0: EXTERN(void) jsimd_extbgrx_ycc_convert_neon michael@0: JPP((JDIMENSION img_width, michael@0: JSAMPARRAY input_buf, JSAMPIMAGE output_buf, michael@0: JDIMENSION output_row, int num_rows)); michael@0: EXTERN(void) jsimd_extxbgr_ycc_convert_neon michael@0: JPP((JDIMENSION img_width, michael@0: JSAMPARRAY input_buf, JSAMPIMAGE output_buf, michael@0: JDIMENSION output_row, int num_rows)); michael@0: EXTERN(void) jsimd_extxrgb_ycc_convert_neon michael@0: JPP((JDIMENSION img_width, michael@0: JSAMPARRAY input_buf, JSAMPIMAGE output_buf, michael@0: JDIMENSION output_row, int num_rows)); michael@0: michael@0: EXTERN(void) jsimd_ycc_rgb_convert_neon michael@0: JPP((JDIMENSION out_width, michael@0: JSAMPIMAGE input_buf, JDIMENSION input_row, michael@0: JSAMPARRAY output_buf, int num_rows)); michael@0: EXTERN(void) jsimd_ycc_extrgb_convert_neon michael@0: JPP((JDIMENSION out_width, michael@0: JSAMPIMAGE input_buf, JDIMENSION input_row, michael@0: JSAMPARRAY output_buf, int num_rows)); michael@0: EXTERN(void) jsimd_ycc_extrgbx_convert_neon michael@0: JPP((JDIMENSION out_width, michael@0: JSAMPIMAGE input_buf, JDIMENSION input_row, michael@0: JSAMPARRAY output_buf, int num_rows)); michael@0: EXTERN(void) jsimd_ycc_extbgr_convert_neon michael@0: JPP((JDIMENSION out_width, michael@0: JSAMPIMAGE input_buf, JDIMENSION input_row, michael@0: JSAMPARRAY output_buf, int num_rows)); michael@0: EXTERN(void) jsimd_ycc_extbgrx_convert_neon michael@0: JPP((JDIMENSION out_width, michael@0: JSAMPIMAGE input_buf, JDIMENSION input_row, michael@0: JSAMPARRAY output_buf, int num_rows)); michael@0: EXTERN(void) jsimd_ycc_extxbgr_convert_neon michael@0: JPP((JDIMENSION out_width, michael@0: JSAMPIMAGE input_buf, JDIMENSION input_row, michael@0: JSAMPARRAY output_buf, int num_rows)); michael@0: EXTERN(void) jsimd_ycc_extxrgb_convert_neon michael@0: JPP((JDIMENSION out_width, michael@0: JSAMPIMAGE input_buf, JDIMENSION input_row, michael@0: JSAMPARRAY output_buf, int num_rows)); michael@0: michael@0: /* SIMD Downsample */ michael@0: EXTERN(void) jsimd_h2v2_downsample_mmx michael@0: JPP((JDIMENSION image_width, int max_v_samp_factor, michael@0: JDIMENSION v_samp_factor, JDIMENSION width_blocks, michael@0: JSAMPARRAY input_data, JSAMPARRAY output_data)); michael@0: EXTERN(void) jsimd_h2v1_downsample_mmx michael@0: JPP((JDIMENSION image_width, int max_v_samp_factor, michael@0: JDIMENSION v_samp_factor, JDIMENSION width_blocks, michael@0: JSAMPARRAY input_data, JSAMPARRAY output_data)); michael@0: michael@0: EXTERN(void) jsimd_h2v2_downsample_sse2 michael@0: JPP((JDIMENSION image_width, int max_v_samp_factor, michael@0: JDIMENSION v_samp_factor, JDIMENSION width_blocks, michael@0: JSAMPARRAY input_data, JSAMPARRAY output_data)); michael@0: EXTERN(void) jsimd_h2v1_downsample_sse2 michael@0: JPP((JDIMENSION image_width, int max_v_samp_factor, michael@0: JDIMENSION v_samp_factor, JDIMENSION width_blocks, michael@0: JSAMPARRAY input_data, JSAMPARRAY output_data)); michael@0: michael@0: /* SIMD Upsample */ michael@0: EXTERN(void) jsimd_h2v2_upsample_mmx michael@0: JPP((int max_v_samp_factor, JDIMENSION output_width, michael@0: JSAMPARRAY input_data, JSAMPARRAY * output_data_ptr)); michael@0: EXTERN(void) jsimd_h2v1_upsample_mmx michael@0: JPP((int max_v_samp_factor, JDIMENSION output_width, michael@0: JSAMPARRAY input_data, JSAMPARRAY * output_data_ptr)); michael@0: michael@0: EXTERN(void) jsimd_h2v2_fancy_upsample_mmx michael@0: JPP((int max_v_samp_factor, JDIMENSION downsampled_width, michael@0: JSAMPARRAY input_data, JSAMPARRAY * output_data_ptr)); michael@0: EXTERN(void) jsimd_h2v1_fancy_upsample_mmx michael@0: JPP((int max_v_samp_factor, JDIMENSION downsampled_width, michael@0: JSAMPARRAY input_data, JSAMPARRAY * output_data_ptr)); michael@0: michael@0: EXTERN(void) jsimd_h2v2_merged_upsample_mmx michael@0: JPP((JDIMENSION output_width, JSAMPIMAGE input_buf, michael@0: JDIMENSION in_row_group_ctr, JSAMPARRAY output_buf)); michael@0: EXTERN(void) jsimd_h2v2_extrgb_merged_upsample_mmx michael@0: JPP((JDIMENSION output_width, JSAMPIMAGE input_buf, michael@0: JDIMENSION in_row_group_ctr, JSAMPARRAY output_buf)); michael@0: EXTERN(void) jsimd_h2v2_extrgbx_merged_upsample_mmx michael@0: JPP((JDIMENSION output_width, JSAMPIMAGE input_buf, michael@0: JDIMENSION in_row_group_ctr, JSAMPARRAY output_buf)); michael@0: EXTERN(void) jsimd_h2v2_extbgr_merged_upsample_mmx michael@0: JPP((JDIMENSION output_width, JSAMPIMAGE input_buf, michael@0: JDIMENSION in_row_group_ctr, JSAMPARRAY output_buf)); michael@0: EXTERN(void) jsimd_h2v2_extbgrx_merged_upsample_mmx michael@0: JPP((JDIMENSION output_width, JSAMPIMAGE input_buf, michael@0: JDIMENSION in_row_group_ctr, JSAMPARRAY output_buf)); michael@0: EXTERN(void) jsimd_h2v2_extxbgr_merged_upsample_mmx michael@0: JPP((JDIMENSION output_width, JSAMPIMAGE input_buf, michael@0: JDIMENSION in_row_group_ctr, JSAMPARRAY output_buf)); michael@0: EXTERN(void) jsimd_h2v2_extxrgb_merged_upsample_mmx michael@0: JPP((JDIMENSION output_width, JSAMPIMAGE input_buf, michael@0: JDIMENSION in_row_group_ctr, JSAMPARRAY output_buf)); michael@0: EXTERN(void) jsimd_h2v1_merged_upsample_mmx michael@0: JPP((JDIMENSION output_width, JSAMPIMAGE input_buf, michael@0: JDIMENSION in_row_group_ctr, JSAMPARRAY output_buf)); michael@0: EXTERN(void) jsimd_h2v1_extrgb_merged_upsample_mmx michael@0: JPP((JDIMENSION output_width, JSAMPIMAGE input_buf, michael@0: JDIMENSION in_row_group_ctr, JSAMPARRAY output_buf)); michael@0: EXTERN(void) jsimd_h2v1_extrgbx_merged_upsample_mmx michael@0: JPP((JDIMENSION output_width, JSAMPIMAGE input_buf, michael@0: JDIMENSION in_row_group_ctr, JSAMPARRAY output_buf)); michael@0: EXTERN(void) jsimd_h2v1_extbgr_merged_upsample_mmx michael@0: JPP((JDIMENSION output_width, JSAMPIMAGE input_buf, michael@0: JDIMENSION in_row_group_ctr, JSAMPARRAY output_buf)); michael@0: EXTERN(void) jsimd_h2v1_extbgrx_merged_upsample_mmx michael@0: JPP((JDIMENSION output_width, JSAMPIMAGE input_buf, michael@0: JDIMENSION in_row_group_ctr, JSAMPARRAY output_buf)); michael@0: EXTERN(void) jsimd_h2v1_extxbgr_merged_upsample_mmx michael@0: JPP((JDIMENSION output_width, JSAMPIMAGE input_buf, michael@0: JDIMENSION in_row_group_ctr, JSAMPARRAY output_buf)); michael@0: EXTERN(void) jsimd_h2v1_extxrgb_merged_upsample_mmx michael@0: JPP((JDIMENSION output_width, JSAMPIMAGE input_buf, michael@0: JDIMENSION in_row_group_ctr, JSAMPARRAY output_buf)); michael@0: michael@0: EXTERN(void) jsimd_h2v2_upsample_sse2 michael@0: JPP((int max_v_samp_factor, JDIMENSION output_width, michael@0: JSAMPARRAY input_data, JSAMPARRAY * output_data_ptr)); michael@0: EXTERN(void) jsimd_h2v1_upsample_sse2 michael@0: JPP((int max_v_samp_factor, JDIMENSION output_width, michael@0: JSAMPARRAY input_data, JSAMPARRAY * output_data_ptr)); michael@0: michael@0: extern const int jconst_fancy_upsample_sse2[]; michael@0: EXTERN(void) jsimd_h2v2_fancy_upsample_sse2 michael@0: JPP((int max_v_samp_factor, JDIMENSION downsampled_width, michael@0: JSAMPARRAY input_data, JSAMPARRAY * output_data_ptr)); michael@0: EXTERN(void) jsimd_h2v1_fancy_upsample_sse2 michael@0: JPP((int max_v_samp_factor, JDIMENSION downsampled_width, michael@0: JSAMPARRAY input_data, JSAMPARRAY * output_data_ptr)); michael@0: michael@0: extern const int jconst_merged_upsample_sse2[]; michael@0: EXTERN(void) jsimd_h2v2_merged_upsample_sse2 michael@0: JPP((JDIMENSION output_width, JSAMPIMAGE input_buf, michael@0: JDIMENSION in_row_group_ctr, JSAMPARRAY output_buf)); michael@0: EXTERN(void) jsimd_h2v2_extrgb_merged_upsample_sse2 michael@0: JPP((JDIMENSION output_width, JSAMPIMAGE input_buf, michael@0: JDIMENSION in_row_group_ctr, JSAMPARRAY output_buf)); michael@0: EXTERN(void) jsimd_h2v2_extrgbx_merged_upsample_sse2 michael@0: JPP((JDIMENSION output_width, JSAMPIMAGE input_buf, michael@0: JDIMENSION in_row_group_ctr, JSAMPARRAY output_buf)); michael@0: EXTERN(void) jsimd_h2v2_extbgr_merged_upsample_sse2 michael@0: JPP((JDIMENSION output_width, JSAMPIMAGE input_buf, michael@0: JDIMENSION in_row_group_ctr, JSAMPARRAY output_buf)); michael@0: EXTERN(void) jsimd_h2v2_extbgrx_merged_upsample_sse2 michael@0: JPP((JDIMENSION output_width, JSAMPIMAGE input_buf, michael@0: JDIMENSION in_row_group_ctr, JSAMPARRAY output_buf)); michael@0: EXTERN(void) jsimd_h2v2_extxbgr_merged_upsample_sse2 michael@0: JPP((JDIMENSION output_width, JSAMPIMAGE input_buf, michael@0: JDIMENSION in_row_group_ctr, JSAMPARRAY output_buf)); michael@0: EXTERN(void) jsimd_h2v2_extxrgb_merged_upsample_sse2 michael@0: JPP((JDIMENSION output_width, JSAMPIMAGE input_buf, michael@0: JDIMENSION in_row_group_ctr, JSAMPARRAY output_buf)); michael@0: EXTERN(void) jsimd_h2v1_merged_upsample_sse2 michael@0: JPP((JDIMENSION output_width, JSAMPIMAGE input_buf, michael@0: JDIMENSION in_row_group_ctr, JSAMPARRAY output_buf)); michael@0: EXTERN(void) jsimd_h2v1_extrgb_merged_upsample_sse2 michael@0: JPP((JDIMENSION output_width, JSAMPIMAGE input_buf, michael@0: JDIMENSION in_row_group_ctr, JSAMPARRAY output_buf)); michael@0: EXTERN(void) jsimd_h2v1_extrgbx_merged_upsample_sse2 michael@0: JPP((JDIMENSION output_width, JSAMPIMAGE input_buf, michael@0: JDIMENSION in_row_group_ctr, JSAMPARRAY output_buf)); michael@0: EXTERN(void) jsimd_h2v1_extbgr_merged_upsample_sse2 michael@0: JPP((JDIMENSION output_width, JSAMPIMAGE input_buf, michael@0: JDIMENSION in_row_group_ctr, JSAMPARRAY output_buf)); michael@0: EXTERN(void) jsimd_h2v1_extbgrx_merged_upsample_sse2 michael@0: JPP((JDIMENSION output_width, JSAMPIMAGE input_buf, michael@0: JDIMENSION in_row_group_ctr, JSAMPARRAY output_buf)); michael@0: EXTERN(void) jsimd_h2v1_extxbgr_merged_upsample_sse2 michael@0: JPP((JDIMENSION output_width, JSAMPIMAGE input_buf, michael@0: JDIMENSION in_row_group_ctr, JSAMPARRAY output_buf)); michael@0: EXTERN(void) jsimd_h2v1_extxrgb_merged_upsample_sse2 michael@0: JPP((JDIMENSION output_width, JSAMPIMAGE input_buf, michael@0: JDIMENSION in_row_group_ctr, JSAMPARRAY output_buf)); michael@0: michael@0: EXTERN(void) jsimd_h2v1_fancy_upsample_neon michael@0: JPP((int max_v_samp_factor, JDIMENSION downsampled_width, michael@0: JSAMPARRAY input_data, JSAMPARRAY * output_data_ptr)); michael@0: michael@0: /* SIMD Sample Conversion */ michael@0: EXTERN(void) jsimd_convsamp_mmx JPP((JSAMPARRAY sample_data, michael@0: JDIMENSION start_col, michael@0: DCTELEM * workspace)); michael@0: michael@0: EXTERN(void) jsimd_convsamp_sse2 JPP((JSAMPARRAY sample_data, michael@0: JDIMENSION start_col, michael@0: DCTELEM * workspace)); michael@0: michael@0: EXTERN(void) jsimd_convsamp_neon JPP((JSAMPARRAY sample_data, michael@0: JDIMENSION start_col, michael@0: DCTELEM * workspace)); michael@0: michael@0: EXTERN(void) jsimd_convsamp_float_3dnow JPP((JSAMPARRAY sample_data, michael@0: JDIMENSION start_col, michael@0: FAST_FLOAT * workspace)); michael@0: michael@0: EXTERN(void) jsimd_convsamp_float_sse JPP((JSAMPARRAY sample_data, michael@0: JDIMENSION start_col, michael@0: FAST_FLOAT * workspace)); michael@0: michael@0: EXTERN(void) jsimd_convsamp_float_sse2 JPP((JSAMPARRAY sample_data, michael@0: JDIMENSION start_col, michael@0: FAST_FLOAT * workspace)); michael@0: michael@0: /* SIMD Forward DCT */ michael@0: EXTERN(void) jsimd_fdct_islow_mmx JPP((DCTELEM * data)); michael@0: EXTERN(void) jsimd_fdct_ifast_mmx JPP((DCTELEM * data)); michael@0: michael@0: extern const int jconst_fdct_ifast_sse2[]; michael@0: EXTERN(void) jsimd_fdct_islow_sse2 JPP((DCTELEM * data)); michael@0: extern const int jconst_fdct_islow_sse2[]; michael@0: EXTERN(void) jsimd_fdct_ifast_sse2 JPP((DCTELEM * data)); michael@0: michael@0: EXTERN(void) jsimd_fdct_ifast_neon JPP((DCTELEM * data)); michael@0: michael@0: EXTERN(void) jsimd_fdct_float_3dnow JPP((FAST_FLOAT * data)); michael@0: michael@0: extern const int jconst_fdct_float_sse[]; michael@0: EXTERN(void) jsimd_fdct_float_sse JPP((FAST_FLOAT * data)); michael@0: michael@0: /* SIMD Quantization */ michael@0: EXTERN(void) jsimd_quantize_mmx JPP((JCOEFPTR coef_block, michael@0: DCTELEM * divisors, michael@0: DCTELEM * workspace)); michael@0: michael@0: EXTERN(void) jsimd_quantize_sse2 JPP((JCOEFPTR coef_block, michael@0: DCTELEM * divisors, michael@0: DCTELEM * workspace)); michael@0: michael@0: EXTERN(void) jsimd_quantize_neon JPP((JCOEFPTR coef_block, michael@0: DCTELEM * divisors, michael@0: DCTELEM * workspace)); michael@0: michael@0: EXTERN(void) jsimd_quantize_float_3dnow JPP((JCOEFPTR coef_block, michael@0: FAST_FLOAT * divisors, michael@0: FAST_FLOAT * workspace)); michael@0: michael@0: EXTERN(void) jsimd_quantize_float_sse JPP((JCOEFPTR coef_block, michael@0: FAST_FLOAT * divisors, michael@0: FAST_FLOAT * workspace)); michael@0: michael@0: EXTERN(void) jsimd_quantize_float_sse2 JPP((JCOEFPTR coef_block, michael@0: FAST_FLOAT * divisors, michael@0: FAST_FLOAT * workspace)); michael@0: michael@0: /* SIMD Reduced Inverse DCT */ michael@0: EXTERN(void) jsimd_idct_2x2_mmx JPP((void * dct_table, michael@0: JCOEFPTR coef_block, michael@0: JSAMPARRAY output_buf, michael@0: JDIMENSION output_col)); michael@0: EXTERN(void) jsimd_idct_4x4_mmx JPP((void * dct_table, michael@0: JCOEFPTR coef_block, michael@0: JSAMPARRAY output_buf, michael@0: JDIMENSION output_col)); michael@0: michael@0: extern const int jconst_idct_red_sse2[]; michael@0: EXTERN(void) jsimd_idct_2x2_sse2 JPP((void * dct_table, michael@0: JCOEFPTR coef_block, michael@0: JSAMPARRAY output_buf, michael@0: JDIMENSION output_col)); michael@0: EXTERN(void) jsimd_idct_4x4_sse2 JPP((void * dct_table, michael@0: JCOEFPTR coef_block, michael@0: JSAMPARRAY output_buf, michael@0: JDIMENSION output_col)); michael@0: michael@0: EXTERN(void) jsimd_idct_2x2_neon JPP((void * dct_table, michael@0: JCOEFPTR coef_block, michael@0: JSAMPARRAY output_buf, michael@0: JDIMENSION output_col)); michael@0: EXTERN(void) jsimd_idct_4x4_neon JPP((void * dct_table, michael@0: JCOEFPTR coef_block, michael@0: JSAMPARRAY output_buf, michael@0: JDIMENSION output_col)); michael@0: michael@0: /* SIMD Inverse DCT */ michael@0: EXTERN(void) jsimd_idct_islow_mmx JPP((void * dct_table, michael@0: JCOEFPTR coef_block, michael@0: JSAMPARRAY output_buf, michael@0: JDIMENSION output_col)); michael@0: EXTERN(void) jsimd_idct_ifast_mmx JPP((void * dct_table, michael@0: JCOEFPTR coef_block, michael@0: JSAMPARRAY output_buf, michael@0: JDIMENSION output_col)); michael@0: michael@0: extern const int jconst_idct_islow_sse2[]; michael@0: EXTERN(void) jsimd_idct_islow_sse2 JPP((void * dct_table, michael@0: JCOEFPTR coef_block, michael@0: JSAMPARRAY output_buf, michael@0: JDIMENSION output_col)); michael@0: extern const int jconst_idct_ifast_sse2[]; michael@0: EXTERN(void) jsimd_idct_ifast_sse2 JPP((void * dct_table, michael@0: JCOEFPTR coef_block, michael@0: JSAMPARRAY output_buf, michael@0: JDIMENSION output_col)); michael@0: michael@0: EXTERN(void) jsimd_idct_islow_neon JPP((void * dct_table, michael@0: JCOEFPTR coef_block, michael@0: JSAMPARRAY output_buf, michael@0: JDIMENSION output_col)); michael@0: EXTERN(void) jsimd_idct_ifast_neon JPP((void * dct_table, michael@0: JCOEFPTR coef_block, michael@0: JSAMPARRAY output_buf, michael@0: JDIMENSION output_col)); michael@0: michael@0: EXTERN(void) jsimd_idct_float_3dnow JPP((void * dct_table, michael@0: JCOEFPTR coef_block, michael@0: JSAMPARRAY output_buf, michael@0: JDIMENSION output_col)); michael@0: michael@0: extern const int jconst_idct_float_sse[]; michael@0: EXTERN(void) jsimd_idct_float_sse JPP((void * dct_table, michael@0: JCOEFPTR coef_block, michael@0: JSAMPARRAY output_buf, michael@0: JDIMENSION output_col)); michael@0: michael@0: extern const int jconst_idct_float_sse2[]; michael@0: EXTERN(void) jsimd_idct_float_sse2 JPP((void * dct_table, michael@0: JCOEFPTR coef_block, michael@0: JSAMPARRAY output_buf, michael@0: JDIMENSION output_col)); michael@0: