Lay the groundwork for 32-bit AVX2 SIMD support

This commit is contained in:
DRC
2016-07-05 16:19:26 -05:00
parent b5426c52c0
commit 7ee3ce9ada
45 changed files with 196 additions and 164 deletions

View File

@@ -2,6 +2,7 @@
; jfdctfst.asm - fast integer FDCT (MMX)
;
; Copyright 2009 Pierre Ossman <ossman@cendio.se> for Cendio AB
; Copyright (C) 2016, D. R. Commander.
;
; Based on the x86 SIMD extension for IJG JPEG library
; Copyright (C) 1999-2006, MIYASAKA Masaru.
@@ -50,7 +51,7 @@ F_1_306 equ DESCALE(1402911301,30-CONST_BITS) ; FIX(1.306562965)
%define PRE_MULTIPLY_SCALE_BITS 2
%define CONST_SHIFT (16 - PRE_MULTIPLY_SCALE_BITS - CONST_BITS)
alignz 16
alignz 32
global EXTN(jconst_fdct_ifast_mmx)
EXTN(jconst_fdct_ifast_mmx):
@@ -60,7 +61,7 @@ PW_F0382 times 4 dw F_0_382 << CONST_SHIFT
PW_F0541 times 4 dw F_0_541 << CONST_SHIFT
PW_F1306 times 4 dw F_1_306 << CONST_SHIFT
alignz 16
alignz 32
; --------------------------------------------------------------------------
SECTION SEG_TEXT
@@ -78,7 +79,7 @@ PW_F1306 times 4 dw F_1_306 << CONST_SHIFT
%define wk(i) ebp-(WK_NUM-(i))*SIZEOF_MMWORD ; mmword wk[WK_NUM]
%define WK_NUM 2
align 16
align 32
global EXTN(jsimd_fdct_ifast_mmx)
EXTN(jsimd_fdct_ifast_mmx):
@@ -393,4 +394,4 @@ EXTN(jsimd_fdct_ifast_mmx):
; For some reason, the OS X linker does not honor the request to align the
; segment unless we do this.
align 16
align 32