163 lines
7.1 KiB
C
163 lines
7.1 KiB
C
/*
|
|
* simd/jsimd.h
|
|
*
|
|
* Copyright 2009 Pierre Ossman <ossman@cendio.se> for Cendio AB
|
|
*
|
|
* Based on the x86 SIMD extension for IJG JPEG library,
|
|
* Copyright (C) 1999-2006, MIYASAKA Masaru.
|
|
*
|
|
*/
|
|
|
|
/* Bitmask for supported acceleration methods */
|
|
|
|
#define JSIMD_NONE 0x00
|
|
#define JSIMD_MMX 0x01
|
|
#define JSIMD_3DNOW 0x02
|
|
#define JSIMD_SSE 0x04
|
|
|
|
/* Short forms of external names for systems with brain-damaged linkers. */
|
|
|
|
#ifdef NEED_SHORT_EXTERNAL_NAMES
|
|
#define jpeg_simd_cpu_support jSiCpuSupport
|
|
#define jsimd_rgb_ycc_convert_mmx jSRGBYCCM
|
|
#define jsimd_ycc_rgb_convert_mmx jSYCCRGBM
|
|
#define jsimd_h2v2_downsample_mmx jSDnH2V2M
|
|
#define jsimd_h2v1_downsample_mmx jSDnH2V1M
|
|
#define jsimd_h2v2_upsample_mmx jSUpH2V2M
|
|
#define jsimd_h2v1_upsample_mmx jSUpH2V1M
|
|
#define jsimd_h2v2_fancy_upsample_mmx jSFUpH2V2M
|
|
#define jsimd_h2v1_fancy_upsample_mmx jSFUpH2V1M
|
|
#define jsimd_h2v2_merged_upsample_mmx jSMUpH2V2M
|
|
#define jsimd_h2v1_merged_upsample_mmx jSMUpH2V1M
|
|
#define jsimd_convsamp_mmx jSConvM
|
|
#define jsimd_convsamp_float_3dnow jSConvF3D
|
|
#define jsimd_convsamp_float_sse jSConvFS
|
|
#define jsimd_fdct_islow_mmx jSFDMIS
|
|
#define jsimd_fdct_ifast_mmx jSFDMIF
|
|
#define jsimd_fdct_float_3dnow jSFD3DF
|
|
#define jconst_fdct_float_sse jSCFDSF
|
|
#define jsimd_fdct_float_sse jSFDSF
|
|
#define jsimd_quantize_mmx jSQuantM
|
|
#define jsimd_quantize_float_3dnow jSQuantF3D
|
|
#define jsimd_quantize_float_sse jSQuantFS
|
|
#define jsimd_idct_2x2_mmx jSIDM22
|
|
#define jsimd_idct_4x4_mmx jSIDM44
|
|
#define jsimd_idct_islow_mmx jSIDMIS
|
|
#define jsimd_idct_ifast_mmx jSIDMIF
|
|
#define jsimd_idct_float_3dnow jSID3DF
|
|
#define jconst_fdct_float_sse jSCIDSF
|
|
#define jsimd_idct_float_sse jSIDSF
|
|
#endif /* NEED_SHORT_EXTERNAL_NAMES */
|
|
|
|
/* SIMD Ext: retrieve SIMD/CPU information */
|
|
EXTERN(unsigned int) jpeg_simd_cpu_support JPP((void));
|
|
|
|
/* SIMD Color Space Conversion */
|
|
EXTERN(void) jsimd_rgb_ycc_convert_mmx
|
|
JPP((JDIMENSION img_width,
|
|
JSAMPARRAY input_buf, JSAMPIMAGE output_buf,
|
|
JDIMENSION output_row, int num_rows));
|
|
EXTERN(void) jsimd_ycc_rgb_convert_mmx
|
|
JPP((JDIMENSION out_width,
|
|
JSAMPIMAGE input_buf, JDIMENSION input_row,
|
|
JSAMPARRAY output_buf, int num_rows));
|
|
|
|
/* SIMD Downsample */
|
|
EXTERN(void) jsimd_h2v2_downsample_mmx
|
|
JPP((JDIMENSION image_width, int max_v_samp_factor,
|
|
JDIMENSION v_samp_factor, JDIMENSION width_blocks,
|
|
JSAMPARRAY input_data, JSAMPARRAY output_data));
|
|
EXTERN(void) jsimd_h2v1_downsample_mmx
|
|
JPP((JDIMENSION image_width, int max_v_samp_factor,
|
|
JDIMENSION v_samp_factor, JDIMENSION width_blocks,
|
|
JSAMPARRAY input_data, JSAMPARRAY output_data));
|
|
|
|
/* SIMD Upsample */
|
|
EXTERN(void) jsimd_h2v2_upsample_mmx
|
|
JPP((int max_v_samp_factor, JDIMENSION output_width,
|
|
JSAMPARRAY input_data, JSAMPARRAY * output_data_ptr));
|
|
EXTERN(void) jsimd_h2v1_upsample_mmx
|
|
JPP((int max_v_samp_factor, JDIMENSION output_width,
|
|
JSAMPARRAY input_data, JSAMPARRAY * output_data_ptr));
|
|
|
|
EXTERN(void) jsimd_h2v2_fancy_upsample_mmx
|
|
JPP((int max_v_samp_factor, JDIMENSION downsampled_width,
|
|
JSAMPARRAY input_data, JSAMPARRAY * output_data_ptr));
|
|
EXTERN(void) jsimd_h2v1_fancy_upsample_mmx
|
|
JPP((int max_v_samp_factor, JDIMENSION downsampled_width,
|
|
JSAMPARRAY input_data, JSAMPARRAY * output_data_ptr));
|
|
|
|
EXTERN(void) jsimd_h2v2_merged_upsample_mmx
|
|
JPP((JDIMENSION output_width, JSAMPIMAGE input_buf,
|
|
JDIMENSION in_row_group_ctr, JSAMPARRAY output_buf));
|
|
EXTERN(void) jsimd_h2v1_merged_upsample_mmx
|
|
JPP((JDIMENSION output_width, JSAMPIMAGE input_buf,
|
|
JDIMENSION in_row_group_ctr, JSAMPARRAY output_buf));
|
|
|
|
/* SIMD Sample Conversion */
|
|
EXTERN(void) jsimd_convsamp_mmx JPP((JSAMPARRAY sample_data,
|
|
JDIMENSION start_col,
|
|
DCTELEM * workspace));
|
|
|
|
EXTERN(void) jsimd_convsamp_float_3dnow JPP((JSAMPARRAY sample_data,
|
|
JDIMENSION start_col,
|
|
FAST_FLOAT * workspace));
|
|
|
|
EXTERN(void) jsimd_convsamp_float_sse JPP((JSAMPARRAY sample_data,
|
|
JDIMENSION start_col,
|
|
FAST_FLOAT * workspace));
|
|
|
|
/* SIMD Forward DCT */
|
|
EXTERN(void) jsimd_fdct_islow_mmx JPP((DCTELEM * data));
|
|
EXTERN(void) jsimd_fdct_ifast_mmx JPP((DCTELEM * data));
|
|
|
|
EXTERN(void) jsimd_fdct_float_3dnow JPP((FAST_FLOAT * data));
|
|
|
|
extern const int jconst_fdct_float_sse[];
|
|
EXTERN(void) jsimd_fdct_float_sse JPP((FAST_FLOAT * data));
|
|
|
|
/* SIMD Quantization */
|
|
EXTERN(void) jsimd_quantize_mmx JPP((JCOEFPTR coef_block,
|
|
DCTELEM * divisors,
|
|
DCTELEM * workspace));
|
|
|
|
EXTERN(void) jsimd_quantize_float_3dnow JPP((JCOEFPTR coef_block,
|
|
FAST_FLOAT * divisors,
|
|
FAST_FLOAT * workspace));
|
|
|
|
EXTERN(void) jsimd_quantize_float_sse JPP((JCOEFPTR coef_block,
|
|
FAST_FLOAT * divisors,
|
|
FAST_FLOAT * workspace));
|
|
|
|
/* SIMD Reduced Inverse DCT */
|
|
EXTERN(void) jsimd_idct_2x2_mmx JPP((void * dct_table,
|
|
JCOEFPTR coef_block,
|
|
JSAMPARRAY output_buf,
|
|
JDIMENSION output_col));
|
|
EXTERN(void) jsimd_idct_4x4_mmx JPP((void * dct_table,
|
|
JCOEFPTR coef_block,
|
|
JSAMPARRAY output_buf,
|
|
JDIMENSION output_col));
|
|
|
|
/* SIMD Inverse DCT */
|
|
EXTERN(void) jsimd_idct_islow_mmx JPP((void * dct_table,
|
|
JCOEFPTR coef_block,
|
|
JSAMPARRAY output_buf,
|
|
JDIMENSION output_col));
|
|
EXTERN(void) jsimd_idct_ifast_mmx JPP((void * dct_table,
|
|
JCOEFPTR coef_block,
|
|
JSAMPARRAY output_buf,
|
|
JDIMENSION output_col));
|
|
|
|
EXTERN(void) jsimd_idct_float_3dnow JPP((void * dct_table,
|
|
JCOEFPTR coef_block,
|
|
JSAMPARRAY output_buf,
|
|
JDIMENSION output_col));
|
|
|
|
extern const int jconst_idct_float_sse[];
|
|
EXTERN(void) jsimd_idct_float_sse JPP((void * dct_table,
|
|
JCOEFPTR coef_block,
|
|
JSAMPARRAY output_buf,
|
|
JDIMENSION output_col));
|
|
|