xref: /aosp_15_r20/external/libjpeg-turbo/simd/i386/jdmerge-avx2.asm (revision dfc6aa5c1cfd4bc4e2018dc74aa96e29ee49c6da)
1*dfc6aa5cSAndroid Build Coastguard Worker;
2*dfc6aa5cSAndroid Build Coastguard Worker; jdmerge.asm - merged upsampling/color conversion (AVX2)
3*dfc6aa5cSAndroid Build Coastguard Worker;
4*dfc6aa5cSAndroid Build Coastguard Worker; Copyright 2009 Pierre Ossman <ossman@cendio.se> for Cendio AB
5*dfc6aa5cSAndroid Build Coastguard Worker; Copyright (C) 2009, 2016, D. R. Commander.
6*dfc6aa5cSAndroid Build Coastguard Worker; Copyright (C) 2015, Intel Corporation.
7*dfc6aa5cSAndroid Build Coastguard Worker;
8*dfc6aa5cSAndroid Build Coastguard Worker; Based on the x86 SIMD extension for IJG JPEG library
9*dfc6aa5cSAndroid Build Coastguard Worker; Copyright (C) 1999-2006, MIYASAKA Masaru.
10*dfc6aa5cSAndroid Build Coastguard Worker; For conditions of distribution and use, see copyright notice in jsimdext.inc
11*dfc6aa5cSAndroid Build Coastguard Worker;
12*dfc6aa5cSAndroid Build Coastguard Worker; This file should be assembled with NASM (Netwide Assembler),
13*dfc6aa5cSAndroid Build Coastguard Worker; can *not* be assembled with Microsoft's MASM or any compatible
14*dfc6aa5cSAndroid Build Coastguard Worker; assembler (including Borland's Turbo Assembler).
15*dfc6aa5cSAndroid Build Coastguard Worker; NASM is available from http://nasm.sourceforge.net/ or
16*dfc6aa5cSAndroid Build Coastguard Worker; http://sourceforge.net/project/showfiles.php?group_id=6208
17*dfc6aa5cSAndroid Build Coastguard Worker
18*dfc6aa5cSAndroid Build Coastguard Worker%include "jsimdext.inc"
19*dfc6aa5cSAndroid Build Coastguard Worker
20*dfc6aa5cSAndroid Build Coastguard Worker; --------------------------------------------------------------------------
21*dfc6aa5cSAndroid Build Coastguard Worker
22*dfc6aa5cSAndroid Build Coastguard Worker%define SCALEBITS  16
23*dfc6aa5cSAndroid Build Coastguard Worker
24*dfc6aa5cSAndroid Build Coastguard WorkerF_0_344 equ  22554              ; FIX(0.34414)
25*dfc6aa5cSAndroid Build Coastguard WorkerF_0_714 equ  46802              ; FIX(0.71414)
26*dfc6aa5cSAndroid Build Coastguard WorkerF_1_402 equ  91881              ; FIX(1.40200)
27*dfc6aa5cSAndroid Build Coastguard WorkerF_1_772 equ 116130              ; FIX(1.77200)
28*dfc6aa5cSAndroid Build Coastguard WorkerF_0_402 equ (F_1_402 - 65536)   ; FIX(1.40200) - FIX(1)
29*dfc6aa5cSAndroid Build Coastguard WorkerF_0_285 equ ( 65536 - F_0_714)  ; FIX(1) - FIX(0.71414)
30*dfc6aa5cSAndroid Build Coastguard WorkerF_0_228 equ (131072 - F_1_772)  ; FIX(2) - FIX(1.77200)
31*dfc6aa5cSAndroid Build Coastguard Worker
32*dfc6aa5cSAndroid Build Coastguard Worker; --------------------------------------------------------------------------
33*dfc6aa5cSAndroid Build Coastguard Worker    SECTION     SEG_CONST
34*dfc6aa5cSAndroid Build Coastguard Worker
35*dfc6aa5cSAndroid Build Coastguard Worker    alignz      32
36*dfc6aa5cSAndroid Build Coastguard Worker    GLOBAL_DATA(jconst_merged_upsample_avx2)
37*dfc6aa5cSAndroid Build Coastguard Worker
38*dfc6aa5cSAndroid Build Coastguard WorkerEXTN(jconst_merged_upsample_avx2):
39*dfc6aa5cSAndroid Build Coastguard Worker
40*dfc6aa5cSAndroid Build Coastguard WorkerPW_F0402        times 16 dw  F_0_402
41*dfc6aa5cSAndroid Build Coastguard WorkerPW_MF0228       times 16 dw -F_0_228
42*dfc6aa5cSAndroid Build Coastguard WorkerPW_MF0344_F0285 times 8  dw -F_0_344, F_0_285
43*dfc6aa5cSAndroid Build Coastguard WorkerPW_ONE          times 16 dw  1
44*dfc6aa5cSAndroid Build Coastguard WorkerPD_ONEHALF      times 8  dd  1 << (SCALEBITS - 1)
45*dfc6aa5cSAndroid Build Coastguard Worker
46*dfc6aa5cSAndroid Build Coastguard Worker    alignz      32
47*dfc6aa5cSAndroid Build Coastguard Worker
48*dfc6aa5cSAndroid Build Coastguard Worker; --------------------------------------------------------------------------
49*dfc6aa5cSAndroid Build Coastguard Worker    SECTION     SEG_TEXT
50*dfc6aa5cSAndroid Build Coastguard Worker    BITS        32
51*dfc6aa5cSAndroid Build Coastguard Worker
52*dfc6aa5cSAndroid Build Coastguard Worker%include "jdmrgext-avx2.asm"
53*dfc6aa5cSAndroid Build Coastguard Worker
54*dfc6aa5cSAndroid Build Coastguard Worker%undef RGB_RED
55*dfc6aa5cSAndroid Build Coastguard Worker%undef RGB_GREEN
56*dfc6aa5cSAndroid Build Coastguard Worker%undef RGB_BLUE
57*dfc6aa5cSAndroid Build Coastguard Worker%undef RGB_PIXELSIZE
58*dfc6aa5cSAndroid Build Coastguard Worker%define RGB_RED  EXT_RGB_RED
59*dfc6aa5cSAndroid Build Coastguard Worker%define RGB_GREEN  EXT_RGB_GREEN
60*dfc6aa5cSAndroid Build Coastguard Worker%define RGB_BLUE  EXT_RGB_BLUE
61*dfc6aa5cSAndroid Build Coastguard Worker%define RGB_PIXELSIZE  EXT_RGB_PIXELSIZE
62*dfc6aa5cSAndroid Build Coastguard Worker%define jsimd_h2v1_merged_upsample_avx2 \
63*dfc6aa5cSAndroid Build Coastguard Worker  jsimd_h2v1_extrgb_merged_upsample_avx2
64*dfc6aa5cSAndroid Build Coastguard Worker%define jsimd_h2v2_merged_upsample_avx2 \
65*dfc6aa5cSAndroid Build Coastguard Worker  jsimd_h2v2_extrgb_merged_upsample_avx2
66*dfc6aa5cSAndroid Build Coastguard Worker%include "jdmrgext-avx2.asm"
67*dfc6aa5cSAndroid Build Coastguard Worker
68*dfc6aa5cSAndroid Build Coastguard Worker%undef RGB_RED
69*dfc6aa5cSAndroid Build Coastguard Worker%undef RGB_GREEN
70*dfc6aa5cSAndroid Build Coastguard Worker%undef RGB_BLUE
71*dfc6aa5cSAndroid Build Coastguard Worker%undef RGB_PIXELSIZE
72*dfc6aa5cSAndroid Build Coastguard Worker%define RGB_RED  EXT_RGBX_RED
73*dfc6aa5cSAndroid Build Coastguard Worker%define RGB_GREEN  EXT_RGBX_GREEN
74*dfc6aa5cSAndroid Build Coastguard Worker%define RGB_BLUE  EXT_RGBX_BLUE
75*dfc6aa5cSAndroid Build Coastguard Worker%define RGB_PIXELSIZE  EXT_RGBX_PIXELSIZE
76*dfc6aa5cSAndroid Build Coastguard Worker%define jsimd_h2v1_merged_upsample_avx2 \
77*dfc6aa5cSAndroid Build Coastguard Worker  jsimd_h2v1_extrgbx_merged_upsample_avx2
78*dfc6aa5cSAndroid Build Coastguard Worker%define jsimd_h2v2_merged_upsample_avx2 \
79*dfc6aa5cSAndroid Build Coastguard Worker  jsimd_h2v2_extrgbx_merged_upsample_avx2
80*dfc6aa5cSAndroid Build Coastguard Worker%include "jdmrgext-avx2.asm"
81*dfc6aa5cSAndroid Build Coastguard Worker
82*dfc6aa5cSAndroid Build Coastguard Worker%undef RGB_RED
83*dfc6aa5cSAndroid Build Coastguard Worker%undef RGB_GREEN
84*dfc6aa5cSAndroid Build Coastguard Worker%undef RGB_BLUE
85*dfc6aa5cSAndroid Build Coastguard Worker%undef RGB_PIXELSIZE
86*dfc6aa5cSAndroid Build Coastguard Worker%define RGB_RED  EXT_BGR_RED
87*dfc6aa5cSAndroid Build Coastguard Worker%define RGB_GREEN  EXT_BGR_GREEN
88*dfc6aa5cSAndroid Build Coastguard Worker%define RGB_BLUE  EXT_BGR_BLUE
89*dfc6aa5cSAndroid Build Coastguard Worker%define RGB_PIXELSIZE  EXT_BGR_PIXELSIZE
90*dfc6aa5cSAndroid Build Coastguard Worker%define jsimd_h2v1_merged_upsample_avx2 \
91*dfc6aa5cSAndroid Build Coastguard Worker  jsimd_h2v1_extbgr_merged_upsample_avx2
92*dfc6aa5cSAndroid Build Coastguard Worker%define jsimd_h2v2_merged_upsample_avx2 \
93*dfc6aa5cSAndroid Build Coastguard Worker  jsimd_h2v2_extbgr_merged_upsample_avx2
94*dfc6aa5cSAndroid Build Coastguard Worker%include "jdmrgext-avx2.asm"
95*dfc6aa5cSAndroid Build Coastguard Worker
96*dfc6aa5cSAndroid Build Coastguard Worker%undef RGB_RED
97*dfc6aa5cSAndroid Build Coastguard Worker%undef RGB_GREEN
98*dfc6aa5cSAndroid Build Coastguard Worker%undef RGB_BLUE
99*dfc6aa5cSAndroid Build Coastguard Worker%undef RGB_PIXELSIZE
100*dfc6aa5cSAndroid Build Coastguard Worker%define RGB_RED  EXT_BGRX_RED
101*dfc6aa5cSAndroid Build Coastguard Worker%define RGB_GREEN  EXT_BGRX_GREEN
102*dfc6aa5cSAndroid Build Coastguard Worker%define RGB_BLUE  EXT_BGRX_BLUE
103*dfc6aa5cSAndroid Build Coastguard Worker%define RGB_PIXELSIZE  EXT_BGRX_PIXELSIZE
104*dfc6aa5cSAndroid Build Coastguard Worker%define jsimd_h2v1_merged_upsample_avx2 \
105*dfc6aa5cSAndroid Build Coastguard Worker  jsimd_h2v1_extbgrx_merged_upsample_avx2
106*dfc6aa5cSAndroid Build Coastguard Worker%define jsimd_h2v2_merged_upsample_avx2 \
107*dfc6aa5cSAndroid Build Coastguard Worker  jsimd_h2v2_extbgrx_merged_upsample_avx2
108*dfc6aa5cSAndroid Build Coastguard Worker%include "jdmrgext-avx2.asm"
109*dfc6aa5cSAndroid Build Coastguard Worker
110*dfc6aa5cSAndroid Build Coastguard Worker%undef RGB_RED
111*dfc6aa5cSAndroid Build Coastguard Worker%undef RGB_GREEN
112*dfc6aa5cSAndroid Build Coastguard Worker%undef RGB_BLUE
113*dfc6aa5cSAndroid Build Coastguard Worker%undef RGB_PIXELSIZE
114*dfc6aa5cSAndroid Build Coastguard Worker%define RGB_RED  EXT_XBGR_RED
115*dfc6aa5cSAndroid Build Coastguard Worker%define RGB_GREEN  EXT_XBGR_GREEN
116*dfc6aa5cSAndroid Build Coastguard Worker%define RGB_BLUE  EXT_XBGR_BLUE
117*dfc6aa5cSAndroid Build Coastguard Worker%define RGB_PIXELSIZE  EXT_XBGR_PIXELSIZE
118*dfc6aa5cSAndroid Build Coastguard Worker%define jsimd_h2v1_merged_upsample_avx2 \
119*dfc6aa5cSAndroid Build Coastguard Worker  jsimd_h2v1_extxbgr_merged_upsample_avx2
120*dfc6aa5cSAndroid Build Coastguard Worker%define jsimd_h2v2_merged_upsample_avx2 \
121*dfc6aa5cSAndroid Build Coastguard Worker  jsimd_h2v2_extxbgr_merged_upsample_avx2
122*dfc6aa5cSAndroid Build Coastguard Worker%include "jdmrgext-avx2.asm"
123*dfc6aa5cSAndroid Build Coastguard Worker
124*dfc6aa5cSAndroid Build Coastguard Worker%undef RGB_RED
125*dfc6aa5cSAndroid Build Coastguard Worker%undef RGB_GREEN
126*dfc6aa5cSAndroid Build Coastguard Worker%undef RGB_BLUE
127*dfc6aa5cSAndroid Build Coastguard Worker%undef RGB_PIXELSIZE
128*dfc6aa5cSAndroid Build Coastguard Worker%define RGB_RED  EXT_XRGB_RED
129*dfc6aa5cSAndroid Build Coastguard Worker%define RGB_GREEN  EXT_XRGB_GREEN
130*dfc6aa5cSAndroid Build Coastguard Worker%define RGB_BLUE  EXT_XRGB_BLUE
131*dfc6aa5cSAndroid Build Coastguard Worker%define RGB_PIXELSIZE  EXT_XRGB_PIXELSIZE
132*dfc6aa5cSAndroid Build Coastguard Worker%define jsimd_h2v1_merged_upsample_avx2 \
133*dfc6aa5cSAndroid Build Coastguard Worker  jsimd_h2v1_extxrgb_merged_upsample_avx2
134*dfc6aa5cSAndroid Build Coastguard Worker%define jsimd_h2v2_merged_upsample_avx2 \
135*dfc6aa5cSAndroid Build Coastguard Worker  jsimd_h2v2_extxrgb_merged_upsample_avx2
136*dfc6aa5cSAndroid Build Coastguard Worker%include "jdmrgext-avx2.asm"
137