Lay the groundwork for 32-bit AVX2 SIMD support
This commit is contained in:
@@ -2,6 +2,7 @@
|
||||
; jidctflt.asm - floating-point IDCT (SSE & SSE2)
|
||||
;
|
||||
; Copyright 2009 Pierre Ossman <ossman@cendio.se> for Cendio AB
|
||||
; Copyright (C) 2016, D. R. Commander.
|
||||
;
|
||||
; Based on the x86 SIMD extension for IJG JPEG library
|
||||
; Copyright (C) 1999-2006, MIYASAKA Masaru.
|
||||
@@ -35,7 +36,7 @@
|
||||
; --------------------------------------------------------------------------
|
||||
SECTION SEG_CONST
|
||||
|
||||
alignz 16
|
||||
alignz 32
|
||||
global EXTN(jconst_idct_float_sse2)
|
||||
|
||||
EXTN(jconst_idct_float_sse2):
|
||||
@@ -47,7 +48,7 @@ PD_M2_613 times 4 dd -2.613125929752753055713286
|
||||
PD_RNDINT_MAGIC times 4 dd 100663296.0 ; (float)(0x00C00000 << 3)
|
||||
PB_CENTERJSAMP times 16 db CENTERJSAMPLE
|
||||
|
||||
alignz 16
|
||||
alignz 32
|
||||
|
||||
; --------------------------------------------------------------------------
|
||||
SECTION SEG_TEXT
|
||||
@@ -71,7 +72,7 @@ PB_CENTERJSAMP times 16 db CENTERJSAMPLE
|
||||
%define workspace wk(0)-DCTSIZE2*SIZEOF_FAST_FLOAT
|
||||
; FAST_FLOAT workspace[DCTSIZE2]
|
||||
|
||||
align 16
|
||||
align 32
|
||||
global EXTN(jsimd_idct_float_sse2)
|
||||
|
||||
EXTN(jsimd_idct_float_sse2):
|
||||
@@ -494,4 +495,4 @@ EXTN(jsimd_idct_float_sse2):
|
||||
|
||||
; For some reason, the OS X linker does not honor the request to align the
|
||||
; segment unless we do this.
|
||||
align 16
|
||||
align 32
|
||||
|
||||
Reference in New Issue
Block a user