1*1fd5a2e1SPrashanth Swaminathan# =========================================================================== 2*1fd5a2e1SPrashanth Swaminathan# https://www.gnu.org/software/autoconf-archive/ax_cc_maxopt.html 3*1fd5a2e1SPrashanth Swaminathan# =========================================================================== 4*1fd5a2e1SPrashanth Swaminathan# 5*1fd5a2e1SPrashanth Swaminathan# SYNOPSIS 6*1fd5a2e1SPrashanth Swaminathan# 7*1fd5a2e1SPrashanth Swaminathan# AX_CC_MAXOPT 8*1fd5a2e1SPrashanth Swaminathan# 9*1fd5a2e1SPrashanth Swaminathan# DESCRIPTION 10*1fd5a2e1SPrashanth Swaminathan# 11*1fd5a2e1SPrashanth Swaminathan# Try to turn on "good" C optimization flags for various compilers and 12*1fd5a2e1SPrashanth Swaminathan# architectures, for some definition of "good". (In our case, good for 13*1fd5a2e1SPrashanth Swaminathan# FFTW and hopefully for other scientific codes. Modify as needed.) 14*1fd5a2e1SPrashanth Swaminathan# 15*1fd5a2e1SPrashanth Swaminathan# The user can override the flags by setting the CFLAGS environment 16*1fd5a2e1SPrashanth Swaminathan# variable. The user can also specify --enable-portable-binary in order to 17*1fd5a2e1SPrashanth Swaminathan# disable any optimization flags that might result in a binary that only 18*1fd5a2e1SPrashanth Swaminathan# runs on the host architecture. 19*1fd5a2e1SPrashanth Swaminathan# 20*1fd5a2e1SPrashanth Swaminathan# Note also that the flags assume that ANSI C aliasing rules are followed 21*1fd5a2e1SPrashanth Swaminathan# by the code (e.g. for gcc's -fstrict-aliasing), and that floating-point 22*1fd5a2e1SPrashanth Swaminathan# computations can be re-ordered as needed. 23*1fd5a2e1SPrashanth Swaminathan# 24*1fd5a2e1SPrashanth Swaminathan# Requires macros: AX_CHECK_COMPILE_FLAG, AX_COMPILER_VENDOR, 25*1fd5a2e1SPrashanth Swaminathan# AX_GCC_ARCHFLAG, AX_GCC_X86_CPUID. 26*1fd5a2e1SPrashanth Swaminathan# 27*1fd5a2e1SPrashanth Swaminathan# LICENSE 28*1fd5a2e1SPrashanth Swaminathan# 29*1fd5a2e1SPrashanth Swaminathan# Copyright (c) 2008 Steven G. Johnson <[email protected]> 30*1fd5a2e1SPrashanth Swaminathan# Copyright (c) 2008 Matteo Frigo 31*1fd5a2e1SPrashanth Swaminathan# 32*1fd5a2e1SPrashanth Swaminathan# This program is free software: you can redistribute it and/or modify it 33*1fd5a2e1SPrashanth Swaminathan# under the terms of the GNU General Public License as published by the 34*1fd5a2e1SPrashanth Swaminathan# Free Software Foundation, either version 3 of the License, or (at your 35*1fd5a2e1SPrashanth Swaminathan# option) any later version. 36*1fd5a2e1SPrashanth Swaminathan# 37*1fd5a2e1SPrashanth Swaminathan# This program is distributed in the hope that it will be useful, but 38*1fd5a2e1SPrashanth Swaminathan# WITHOUT ANY WARRANTY; without even the implied warranty of 39*1fd5a2e1SPrashanth Swaminathan# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General 40*1fd5a2e1SPrashanth Swaminathan# Public License for more details. 41*1fd5a2e1SPrashanth Swaminathan# 42*1fd5a2e1SPrashanth Swaminathan# You should have received a copy of the GNU General Public License along 43*1fd5a2e1SPrashanth Swaminathan# with this program. If not, see <https://www.gnu.org/licenses/>. 44*1fd5a2e1SPrashanth Swaminathan# 45*1fd5a2e1SPrashanth Swaminathan# As a special exception, the respective Autoconf Macro's copyright owner 46*1fd5a2e1SPrashanth Swaminathan# gives unlimited permission to copy, distribute and modify the configure 47*1fd5a2e1SPrashanth Swaminathan# scripts that are the output of Autoconf when processing the Macro. You 48*1fd5a2e1SPrashanth Swaminathan# need not follow the terms of the GNU General Public License when using 49*1fd5a2e1SPrashanth Swaminathan# or distributing such scripts, even though portions of the text of the 50*1fd5a2e1SPrashanth Swaminathan# Macro appear in them. The GNU General Public License (GPL) does govern 51*1fd5a2e1SPrashanth Swaminathan# all other use of the material that constitutes the Autoconf Macro. 52*1fd5a2e1SPrashanth Swaminathan# 53*1fd5a2e1SPrashanth Swaminathan# This special exception to the GPL applies to versions of the Autoconf 54*1fd5a2e1SPrashanth Swaminathan# Macro released by the Autoconf Archive. When you make and distribute a 55*1fd5a2e1SPrashanth Swaminathan# modified version of the Autoconf Macro, you may extend this special 56*1fd5a2e1SPrashanth Swaminathan# exception to the GPL to apply to your modified version as well. 57*1fd5a2e1SPrashanth Swaminathan 58*1fd5a2e1SPrashanth Swaminathan#serial 17 59*1fd5a2e1SPrashanth Swaminathan 60*1fd5a2e1SPrashanth SwaminathanAC_DEFUN([AX_CC_MAXOPT], 61*1fd5a2e1SPrashanth Swaminathan[ 62*1fd5a2e1SPrashanth SwaminathanAC_REQUIRE([AC_PROG_CC]) 63*1fd5a2e1SPrashanth SwaminathanAC_REQUIRE([AX_COMPILER_VENDOR]) 64*1fd5a2e1SPrashanth SwaminathanAC_REQUIRE([AC_CANONICAL_HOST]) 65*1fd5a2e1SPrashanth Swaminathan 66*1fd5a2e1SPrashanth SwaminathanAC_ARG_ENABLE(portable-binary, [AS_HELP_STRING([--enable-portable-binary], [disable compiler optimizations that would produce unportable binaries])], 67*1fd5a2e1SPrashanth Swaminathan acx_maxopt_portable=$enableval, acx_maxopt_portable=no) 68*1fd5a2e1SPrashanth Swaminathan 69*1fd5a2e1SPrashanth Swaminathan# Try to determine "good" native compiler flags if none specified via CFLAGS 70*1fd5a2e1SPrashanth Swaminathanif test "$ac_test_CFLAGS" != "set"; then 71*1fd5a2e1SPrashanth Swaminathan CFLAGS="" 72*1fd5a2e1SPrashanth Swaminathan case $ax_cv_c_compiler_vendor in 73*1fd5a2e1SPrashanth Swaminathan dec) CFLAGS="-newc -w0 -O5 -ansi_alias -ansi_args -fp_reorder -tune host" 74*1fd5a2e1SPrashanth Swaminathan if test "x$acx_maxopt_portable" = xno; then 75*1fd5a2e1SPrashanth Swaminathan CFLAGS="$CFLAGS -arch host" 76*1fd5a2e1SPrashanth Swaminathan fi;; 77*1fd5a2e1SPrashanth Swaminathan 78*1fd5a2e1SPrashanth Swaminathan sun) CFLAGS="-native -fast -xO5 -dalign" 79*1fd5a2e1SPrashanth Swaminathan if test "x$acx_maxopt_portable" = xyes; then 80*1fd5a2e1SPrashanth Swaminathan CFLAGS="$CFLAGS -xarch=generic" 81*1fd5a2e1SPrashanth Swaminathan fi;; 82*1fd5a2e1SPrashanth Swaminathan 83*1fd5a2e1SPrashanth Swaminathan hp) CFLAGS="+Oall +Optrs_ansi +DSnative" 84*1fd5a2e1SPrashanth Swaminathan if test "x$acx_maxopt_portable" = xyes; then 85*1fd5a2e1SPrashanth Swaminathan CFLAGS="$CFLAGS +DAportable" 86*1fd5a2e1SPrashanth Swaminathan fi;; 87*1fd5a2e1SPrashanth Swaminathan 88*1fd5a2e1SPrashanth Swaminathan ibm) if test "x$acx_maxopt_portable" = xno; then 89*1fd5a2e1SPrashanth Swaminathan xlc_opt="-qarch=auto -qtune=auto" 90*1fd5a2e1SPrashanth Swaminathan else 91*1fd5a2e1SPrashanth Swaminathan xlc_opt="-qtune=auto" 92*1fd5a2e1SPrashanth Swaminathan fi 93*1fd5a2e1SPrashanth Swaminathan AX_CHECK_COMPILE_FLAG($xlc_opt, 94*1fd5a2e1SPrashanth Swaminathan CFLAGS="-O3 -qansialias -w $xlc_opt", 95*1fd5a2e1SPrashanth Swaminathan [CFLAGS="-O3 -qansialias -w" 96*1fd5a2e1SPrashanth Swaminathan echo "******************************************************" 97*1fd5a2e1SPrashanth Swaminathan echo "* You seem to have the IBM C compiler. It is *" 98*1fd5a2e1SPrashanth Swaminathan echo "* recommended for best performance that you use: *" 99*1fd5a2e1SPrashanth Swaminathan echo "* *" 100*1fd5a2e1SPrashanth Swaminathan echo "* CFLAGS=-O3 -qarch=xxx -qtune=xxx -qansialias -w *" 101*1fd5a2e1SPrashanth Swaminathan echo "* ^^^ ^^^ *" 102*1fd5a2e1SPrashanth Swaminathan echo "* where xxx is pwr2, pwr3, 604, or whatever kind of *" 103*1fd5a2e1SPrashanth Swaminathan echo "* CPU you have. (Set the CFLAGS environment var. *" 104*1fd5a2e1SPrashanth Swaminathan echo "* and re-run configure.) For more info, man cc. *" 105*1fd5a2e1SPrashanth Swaminathan echo "******************************************************"]) 106*1fd5a2e1SPrashanth Swaminathan ;; 107*1fd5a2e1SPrashanth Swaminathan 108*1fd5a2e1SPrashanth Swaminathan intel) CFLAGS="-O3 -ansi_alias" 109*1fd5a2e1SPrashanth Swaminathan if test "x$acx_maxopt_portable" = xno; then 110*1fd5a2e1SPrashanth Swaminathan icc_archflag=unknown 111*1fd5a2e1SPrashanth Swaminathan icc_flags="" 112*1fd5a2e1SPrashanth Swaminathan case $host_cpu in 113*1fd5a2e1SPrashanth Swaminathan i686*|x86_64*) 114*1fd5a2e1SPrashanth Swaminathan # icc accepts gcc assembly syntax, so these should work: 115*1fd5a2e1SPrashanth Swaminathan AX_GCC_X86_CPUID(0) 116*1fd5a2e1SPrashanth Swaminathan AX_GCC_X86_CPUID(1) 117*1fd5a2e1SPrashanth Swaminathan case $ax_cv_gcc_x86_cpuid_0 in # see AX_GCC_ARCHFLAG 118*1fd5a2e1SPrashanth Swaminathan *:756e6547:6c65746e:49656e69) # Intel 119*1fd5a2e1SPrashanth Swaminathan case $ax_cv_gcc_x86_cpuid_1 in 120*1fd5a2e1SPrashanth Swaminathan *0?6[[78ab]]?:*:*:*|?6[[78ab]]?:*:*:*|6[[78ab]]?:*:*:*) icc_flags="-xK" ;; 121*1fd5a2e1SPrashanth Swaminathan *0?6[[9d]]?:*:*:*|?6[[9d]]?:*:*:*|6[[9d]]?:*:*:*|*1?65?:*:*:*) icc_flags="-xSSE2 -xB -xK" ;; 122*1fd5a2e1SPrashanth Swaminathan *0?6e?:*:*:*|?6e?:*:*:*|6e?:*:*:*) icc_flags="-xSSE3 -xP -xO -xB -xK" ;; 123*1fd5a2e1SPrashanth Swaminathan *0?6f?:*:*:*|?6f?:*:*:*|6f?:*:*:*|*1?66?:*:*:*) icc_flags="-xSSSE3 -xT -xB -xK" ;; 124*1fd5a2e1SPrashanth Swaminathan *1?6[[7d]]?:*:*:*) icc_flags="-xSSE4.1 -xS -xT -xB -xK" ;; 125*1fd5a2e1SPrashanth Swaminathan *1?6[[aef]]?:*:*:*|*2?6[[5cef]]?:*:*:*) icc_flags="-xSSE4.2 -xS -xT -xB -xK" ;; 126*1fd5a2e1SPrashanth Swaminathan *2?6[[ad]]?:*:*:*) icc_flags="-xAVX -SSE4.2 -xS -xT -xB -xK" ;; 127*1fd5a2e1SPrashanth Swaminathan *3?6[[ae]]?:*:*:*) icc_flags="-xCORE-AVX-I -xAVX -SSE4.2 -xS -xT -xB -xK" ;; 128*1fd5a2e1SPrashanth Swaminathan *3?6[[cf]]?:*:*:*|*4?6[[56]]?:*:*:*) icc_flags="-xCORE-AVX2 -xCORE-AVX-I -xAVX -SSE4.2 -xS -xT -xB -xK" ;; 129*1fd5a2e1SPrashanth Swaminathan *000?f[[346]]?:*:*:*|?f[[346]]?:*:*:*|f[[346]]?:*:*:*) icc_flags="-xSSE3 -xP -xO -xN -xW -xK" ;; 130*1fd5a2e1SPrashanth Swaminathan *00??f??:*:*:*|??f??:*:*:*|?f??:*:*:*|f??:*:*:*) icc_flags="-xSSE2 -xN -xW -xK" ;; 131*1fd5a2e1SPrashanth Swaminathan esac ;; 132*1fd5a2e1SPrashanth Swaminathan esac ;; 133*1fd5a2e1SPrashanth Swaminathan esac 134*1fd5a2e1SPrashanth Swaminathan if test "x$icc_flags" != x; then 135*1fd5a2e1SPrashanth Swaminathan for flag in $icc_flags; do 136*1fd5a2e1SPrashanth Swaminathan AX_CHECK_COMPILE_FLAG($flag, [icc_archflag=$flag; break]) 137*1fd5a2e1SPrashanth Swaminathan done 138*1fd5a2e1SPrashanth Swaminathan fi 139*1fd5a2e1SPrashanth Swaminathan AC_MSG_CHECKING([for icc architecture flag]) 140*1fd5a2e1SPrashanth Swaminathan AC_MSG_RESULT($icc_archflag) 141*1fd5a2e1SPrashanth Swaminathan if test "x$icc_archflag" != xunknown; then 142*1fd5a2e1SPrashanth Swaminathan CFLAGS="$CFLAGS $icc_archflag" 143*1fd5a2e1SPrashanth Swaminathan fi 144*1fd5a2e1SPrashanth Swaminathan fi 145*1fd5a2e1SPrashanth Swaminathan ;; 146*1fd5a2e1SPrashanth Swaminathan 147*1fd5a2e1SPrashanth Swaminathan gnu) 148*1fd5a2e1SPrashanth Swaminathan # default optimization flags for gcc on all systems 149*1fd5a2e1SPrashanth Swaminathan CFLAGS="-O3 -fomit-frame-pointer" 150*1fd5a2e1SPrashanth Swaminathan 151*1fd5a2e1SPrashanth Swaminathan # -malign-double for x86 systems 152*1fd5a2e1SPrashanth Swaminathan # libffi local change -- don't align double, as it changes the ABI 153*1fd5a2e1SPrashanth Swaminathan # AX_CHECK_COMPILE_FLAG(-malign-double, CFLAGS="$CFLAGS -malign-double") 154*1fd5a2e1SPrashanth Swaminathan 155*1fd5a2e1SPrashanth Swaminathan # -fstrict-aliasing for gcc-2.95+ 156*1fd5a2e1SPrashanth Swaminathan AX_CHECK_COMPILE_FLAG(-fstrict-aliasing, 157*1fd5a2e1SPrashanth Swaminathan CFLAGS="$CFLAGS -fstrict-aliasing") 158*1fd5a2e1SPrashanth Swaminathan 159*1fd5a2e1SPrashanth Swaminathan # note that we enable "unsafe" fp optimization with other compilers, too 160*1fd5a2e1SPrashanth Swaminathan AX_CHECK_COMPILE_FLAG(-ffast-math, CFLAGS="$CFLAGS -ffast-math") 161*1fd5a2e1SPrashanth Swaminathan 162*1fd5a2e1SPrashanth Swaminathan AX_GCC_ARCHFLAG($acx_maxopt_portable) 163*1fd5a2e1SPrashanth Swaminathan ;; 164*1fd5a2e1SPrashanth Swaminathan 165*1fd5a2e1SPrashanth Swaminathan microsoft) 166*1fd5a2e1SPrashanth Swaminathan # default optimization flags for MSVC opt builds 167*1fd5a2e1SPrashanth Swaminathan CFLAGS="-O2" 168*1fd5a2e1SPrashanth Swaminathan ;; 169*1fd5a2e1SPrashanth Swaminathan esac 170*1fd5a2e1SPrashanth Swaminathan 171*1fd5a2e1SPrashanth Swaminathan if test -z "$CFLAGS"; then 172*1fd5a2e1SPrashanth Swaminathan echo "" 173*1fd5a2e1SPrashanth Swaminathan echo "********************************************************" 174*1fd5a2e1SPrashanth Swaminathan echo "* WARNING: Don't know the best CFLAGS for this system *" 175*1fd5a2e1SPrashanth Swaminathan echo "* Use ./configure CFLAGS=... to specify your own flags *" 176*1fd5a2e1SPrashanth Swaminathan echo "* (otherwise, a default of CFLAGS=-O3 will be used) *" 177*1fd5a2e1SPrashanth Swaminathan echo "********************************************************" 178*1fd5a2e1SPrashanth Swaminathan echo "" 179*1fd5a2e1SPrashanth Swaminathan CFLAGS="-O3" 180*1fd5a2e1SPrashanth Swaminathan fi 181*1fd5a2e1SPrashanth Swaminathan 182*1fd5a2e1SPrashanth Swaminathan AX_CHECK_COMPILE_FLAG($CFLAGS, [], [ 183*1fd5a2e1SPrashanth Swaminathan echo "" 184*1fd5a2e1SPrashanth Swaminathan echo "********************************************************" 185*1fd5a2e1SPrashanth Swaminathan echo "* WARNING: The guessed CFLAGS don't seem to work with *" 186*1fd5a2e1SPrashanth Swaminathan echo "* your compiler. *" 187*1fd5a2e1SPrashanth Swaminathan echo "* Use ./configure CFLAGS=... to specify your own flags *" 188*1fd5a2e1SPrashanth Swaminathan echo "********************************************************" 189*1fd5a2e1SPrashanth Swaminathan echo "" 190*1fd5a2e1SPrashanth Swaminathan CFLAGS="" 191*1fd5a2e1SPrashanth Swaminathan ]) 192*1fd5a2e1SPrashanth Swaminathan 193*1fd5a2e1SPrashanth Swaminathanfi 194*1fd5a2e1SPrashanth Swaminathan]) 195