1# =========================================================================== 2# https://www.gnu.org/software/autoconf-archive/ax_gcc_archflag.html 3# =========================================================================== 4# 5# SYNOPSIS 6# 7# AX_GCC_ARCHFLAG([PORTABLE?], [ACTION-SUCCESS], [ACTION-FAILURE]) 8# 9# DESCRIPTION 10# 11# This macro tries to guess the "native" arch corresponding to the target 12# architecture for use with gcc's -march=arch or -mtune=arch flags. If 13# found, the cache variable $ax_cv_gcc_archflag is set to this flag and 14# ACTION-SUCCESS is executed; otherwise $ax_cv_gcc_archflag is set to 15# "unknown" and ACTION-FAILURE is executed. The default ACTION-SUCCESS is 16# to add $ax_cv_gcc_archflag to the end of $CFLAGS. 17# 18# PORTABLE? should be either [yes] (default) or [no]. In the former case, 19# the flag is set to -mtune (or equivalent) so that the architecture is 20# only used for tuning, but the instruction set used is still portable. In 21# the latter case, the flag is set to -march (or equivalent) so that 22# architecture-specific instructions are enabled. 23# 24# The user can specify --with-gcc-arch=<arch> in order to override the 25# macro's choice of architecture, or --without-gcc-arch to disable this. 26# 27# When cross-compiling, or if $CC is not gcc, then ACTION-FAILURE is 28# called unless the user specified --with-gcc-arch manually. 29# 30# Requires macros: AX_CHECK_COMPILE_FLAG, AX_GCC_X86_CPUID 31# 32# (The main emphasis here is on recent CPUs, on the principle that doing 33# high-performance computing on old hardware is uncommon.) 34# 35# LICENSE 36# 37# Copyright (c) 2008 Steven G. 
Johnson <stevenj@alum.mit.edu> 38# Copyright (c) 2008 Matteo Frigo 39# Copyright (c) 2014 Tsukasa Oi 40# Copyright (c) 2017-2018 Alexey Kopytov 41# 42# This program is free software: you can redistribute it and/or modify it 43# under the terms of the GNU General Public License as published by the 44# Free Software Foundation, either version 3 of the License, or (at your 45# option) any later version. 46# 47# This program is distributed in the hope that it will be useful, but 48# WITHOUT ANY WARRANTY; without even the implied warranty of 49# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General 50# Public License for more details. 51# 52# You should have received a copy of the GNU General Public License along 53# with this program. If not, see <https://www.gnu.org/licenses/>. 54# 55# As a special exception, the respective Autoconf Macro's copyright owner 56# gives unlimited permission to copy, distribute and modify the configure 57# scripts that are the output of Autoconf when processing the Macro. You 58# need not follow the terms of the GNU General Public License when using 59# or distributing such scripts, even though portions of the text of the 60# Macro appear in them. The GNU General Public License (GPL) does govern 61# all other use of the material that constitutes the Autoconf Macro. 62# 63# This special exception to the GPL applies to versions of the Autoconf 64# Macro released by the Autoconf Archive. When you make and distribute a 65# modified version of the Autoconf Macro, you may extend this special 66# exception to the GPL to apply to your modified version as well. 
#serial 22

# AX_GCC_ARCHFLAG([PORTABLE?], [ACTION-SUCCESS], [ACTION-FAILURE])
# -----------------------------------------------------------------
# Pick a gcc architecture flag for the host CPU and store it in the cache
# variable ax_cv_gcc_archflag ("unknown" when nothing was found).
#
# Outline of the generated shell code:
#   1. --with-gcc-arch=<arch> sets ax_gcc_arch; without the option it is
#      "yes", which means "guess".
#   2. Nothing is probed unless $GCC is "yes".  Guessing additionally
#      requires a native (non cross-compiling) build; it fills ax_gcc_arch
#      with a space-separated candidate list, best candidate first.
#   3. Every candidate is combined with every flag prefix and handed to
#      AX_CHECK_COMPILE_FLAG; the first accepted combination wins.
#      PORTABLE? (default "yes") selects the prefix list: tuning-only
#      prefixes when "yes", "-march= -mcpu= -m" otherwise.
#   4. ACTION-FAILURE (default: no-op) runs when the result is "unknown";
#      otherwise ACTION-SUCCESS (default: append the flag to CFLAGS) runs.
AC_DEFUN([AX_GCC_ARCHFLAG],
[AC_REQUIRE([AC_PROG_CC])
AC_REQUIRE([AC_CANONICAL_HOST])
AC_REQUIRE([AC_PROG_SED])
AC_REQUIRE([AX_COMPILER_VENDOR])

AC_ARG_WITH([gcc-arch],
  [AS_HELP_STRING([--with-gcc-arch=<arch>], [use architecture <arch> for gcc -march/-mtune, instead of guessing])],
  [ax_gcc_arch=$withval],
  [ax_gcc_arch=yes])

# The checking line is closed with an empty result right away and repeated
# after the cache block; presumably because the nested checks below print
# messages of their own.
AC_MSG_CHECKING([for gcc architecture flag])
AC_MSG_RESULT([])
AC_CACHE_VAL([ax_cv_gcc_archflag],
[
ax_cv_gcc_archflag="unknown"

if test "$GCC" = yes; then

  if test "x$ax_gcc_arch" = xyes; then
    # No architecture given by the user: build the candidate list ourselves.
    ax_gcc_arch=""
    if test "$cross_compiling" = no; then
      case $host_cpu in
        i[[3456]]86*|x86_64*|amd64*) # use cpuid codes
          AX_GCC_X86_CPUID([0])
          AX_GCC_X86_CPUID([1])
          # Leaf 0 is matched against the vendor string, leaf 1 against the
          # family/model/stepping digits that precede the first colon.
          case $ax_cv_gcc_x86_cpuid_0 in
            *:756e6547:6c65746e:49656e69) # Intel
              case $ax_cv_gcc_x86_cpuid_1 in
                *5[[4578]]?:*:*:*) ax_gcc_arch="pentium-mmx pentium" ;;
                *5[[123]]?:*:*:*) ax_gcc_arch=pentium ;;
                *0?61?:*:*:*|?61?:*:*:*|61?:*:*:*) ax_gcc_arch=pentiumpro ;;
                *0?6[[356]]?:*:*:*|?6[[356]]?:*:*:*|6[[356]]?:*:*:*) ax_gcc_arch="pentium2 pentiumpro" ;;
                *0?6[[78ab]]?:*:*:*|?6[[78ab]]?:*:*:*|6[[78ab]]?:*:*:*) ax_gcc_arch="pentium3 pentiumpro" ;;
                *0?6[[9d]]?:*:*:*|?6[[9d]]?:*:*:*|6[[9d]]?:*:*:*|*1?65?:*:*:*) ax_gcc_arch="pentium-m pentium3 pentiumpro" ;;
                *0?6e?:*:*:*|?6e?:*:*:*|6e?:*:*:*) ax_gcc_arch="yonah pentium-m pentium3 pentiumpro" ;;
                *0?6f?:*:*:*|?6f?:*:*:*|6f?:*:*:*|*1?66?:*:*:*) ax_gcc_arch="core2 pentium-m pentium3 pentiumpro" ;;
                *1?6[[7d]]?:*:*:*) ax_gcc_arch="penryn core2 pentium-m pentium3 pentiumpro" ;;
                *1?6[[aef]]?:*:*:*|*2?6e?:*:*:*) ax_gcc_arch="nehalem corei7 core2 pentium-m pentium3 pentiumpro" ;;
                *2?6[[5cf]]?:*:*:*) ax_gcc_arch="westmere corei7 core2 pentium-m pentium3 pentiumpro" ;;
                *2?6[[ad]]?:*:*:*) ax_gcc_arch="sandybridge corei7-avx corei7 core2 pentium-m pentium3 pentiumpro" ;;
                *3?6[[ae]]?:*:*:*) ax_gcc_arch="ivybridge core-avx-i corei7-avx corei7 core2 pentium-m pentium3 pentiumpro" ;;
                *3?6[[cf]]?:*:*:*|*4?6[[56]]?:*:*:*) ax_gcc_arch="haswell core-avx2 core-avx-i corei7-avx corei7 core2 pentium-m pentium3 pentiumpro" ;;
                *3?6d?:*:*:*|*4?6[[7f]]?:*:*:*|*5?66?:*:*:*) ax_gcc_arch="broadwell core-avx2 core-avx-i corei7-avx corei7 core2 pentium-m pentium3 pentiumpro" ;;
                *1?6c?:*:*:*|*2?6[[67]]?:*:*:*|*3?6[[56]]?:*:*:*) ax_gcc_arch="bonnell atom core2 pentium-m pentium3 pentiumpro" ;;
                *3?67?:*:*:*|*[[45]]?6[[ad]]?:*:*:*) ax_gcc_arch="silvermont atom core2 pentium-m pentium3 pentiumpro" ;;
                *000?f[[012]]?:*:*:*|?f[[012]]?:*:*:*|f[[012]]?:*:*:*) ax_gcc_arch="pentium4 pentiumpro" ;;
                *000?f[[346]]?:*:*:*|?f[[346]]?:*:*:*|f[[346]]?:*:*:*) ax_gcc_arch="nocona prescott pentium4 pentiumpro" ;;
                # fallback
                *5??:*:*:*) ax_gcc_arch=pentium ;;
                *??6??:*:*:*) ax_gcc_arch="core2 pentiumpro" ;;
                *6??:*:*:*) ax_gcc_arch=pentiumpro ;;
                *00??f??:*:*:*|??f??:*:*:*|?f??:*:*:*|f??:*:*:*) ax_gcc_arch="pentium4 pentiumpro" ;;
              esac ;;
            *:68747541:444d4163:69746e65) # AMD
              case $ax_cv_gcc_x86_cpuid_1 in
                *5[[67]]?:*:*:*) ax_gcc_arch=k6 ;;
                *5[[8]]?:*:*:*) ax_gcc_arch="k6-2 k6" ;;
                *5[[9d]]?:*:*:*) ax_gcc_arch="k6-3 k6" ;;
                *6[[12]]?:*:*:*) ax_gcc_arch="athlon k7" ;;
                *6[[34]]?:*:*:*) ax_gcc_arch="athlon-tbird k7" ;;
                *6[[678a]]?:*:*:*) ax_gcc_arch="athlon-xp athlon-4 athlon k7" ;;
                *000?f[[4578bcef]]?:*:*:*|?f[[4578bcef]]?:*:*:*|f[[4578bcef]]?:*:*:*|*001?f[[4578bcf]]?:*:*:*|1?f[[4578bcf]]?:*:*:*) ax_gcc_arch="athlon64 k8" ;;
                *002?f[[13457bcf]]?:*:*:*|2?f[[13457bcf]]?:*:*:*|*004?f[[138bcf]]?:*:*:*|4?f[[138bcf]]?:*:*:*|*005?f[[df]]?:*:*:*|5?f[[df]]?:*:*:*|*006?f[[8bcf]]?:*:*:*|6?f[[8bcf]]?:*:*:*|*007?f[[cf]]?:*:*:*|7?f[[cf]]?:*:*:*|*00c?f1?:*:*:*|c?f1?:*:*:*|*020?f3?:*:*:*|20?f3?:*:*:*) ax_gcc_arch="athlon64-sse3 k8-sse3 athlon64 k8" ;;
                *010?f[[245689a]]?:*:*:*|10?f[[245689a]]?:*:*:*|*030?f1?:*:*:*|30?f1?:*:*:*) ax_gcc_arch="barcelona amdfam10 k8" ;;
                *050?f[[12]]?:*:*:*|50?f[[12]]?:*:*:*) ax_gcc_arch="btver1 amdfam10 k8" ;;
                *060?f1?:*:*:*|60?f1?:*:*:*) ax_gcc_arch="bdver1 amdfam10 k8" ;;
                *060?f2?:*:*:*|60?f2?:*:*:*|*061?f[[03]]?:*:*:*|61?f[[03]]?:*:*:*) ax_gcc_arch="bdver2 bdver1 amdfam10 k8" ;;
                *063?f0?:*:*:*|63?f0?:*:*:*) ax_gcc_arch="bdver3 bdver2 bdver1 amdfam10 k8" ;;
                *07[[03]]?f0?:*:*:*|7[[03]]?f0?:*:*:*) ax_gcc_arch="btver2 btver1 amdfam10 k8" ;;
                # fallback
                *0[[13]]??f??:*:*:*|[[13]]??f??:*:*:*) ax_gcc_arch="barcelona amdfam10 k8" ;;
                *020?f??:*:*:*|20?f??:*:*:*) ax_gcc_arch="athlon64-sse3 k8-sse3 athlon64 k8" ;;
                *05??f??:*:*:*|5??f??:*:*:*) ax_gcc_arch="btver1 amdfam10 k8" ;;
                *060?f??:*:*:*|60?f??:*:*:*) ax_gcc_arch="bdver1 amdfam10 k8" ;;
                *061?f??:*:*:*|61?f??:*:*:*) ax_gcc_arch="bdver2 bdver1 amdfam10 k8" ;;
                *06??f??:*:*:*|6??f??:*:*:*) ax_gcc_arch="bdver3 bdver2 bdver1 amdfam10 k8" ;;
                *070?f??:*:*:*|70?f??:*:*:*) ax_gcc_arch="btver2 btver1 amdfam10 k8" ;;
                *???f??:*:*:*) ax_gcc_arch="amdfam10 k8" ;;
              esac ;;
            *:746e6543:736c7561:48727561) # IDT / VIA (Centaur)
              case $ax_cv_gcc_x86_cpuid_1 in
                *54?:*:*:*) ax_gcc_arch=winchip-c6 ;;
                *5[[89]]?:*:*:*) ax_gcc_arch=winchip2 ;;
                *66?:*:*:*) ax_gcc_arch=winchip2 ;;
                *6[[78]]?:*:*:*) ax_gcc_arch=c3 ;;
                *6[[9adf]]?:*:*:*) ax_gcc_arch="c3-2 c3" ;;
              esac ;;
          esac
          if test x"$ax_gcc_arch" = x; then # fallback
            # cpuid gave no match: derive a baseline from the host triplet.
            case $host_cpu in
              i586*) ax_gcc_arch=pentium ;;
              i686*) ax_gcc_arch=pentiumpro ;;
            esac
          fi
          ;;

        sparc*)
          AC_PATH_PROG([PRTDIAG], [prtdiag], [prtdiag], [$PATH:/usr/platform/`uname -i`/sbin/:/usr/platform/`uname -m`/sbin/])
          # First line produced by any of: /proc/cpuinfo, prtdiag, dmesg.boot.
          cputype=`(((grep cpu /proc/cpuinfo | cut -d: -f2) ; ($PRTDIAG -v |grep -i sparc) ; grep -i cpu /var/run/dmesg.boot ) | head -n 1) 2> /dev/null`
          # Drop blanks and hyphens, fold SPARCIIi into SPARCII, lowercase.
          cputype=`echo "$cputype" | tr -d ' -' | $SED 's/SPARCIIi/SPARCII/' |tr $as_cr_LETTERS $as_cr_letters`
          case $cputype in
            *ultrasparciv*) ax_gcc_arch="ultrasparc4 ultrasparc3 ultrasparc v9" ;;
            *ultrasparciii*) ax_gcc_arch="ultrasparc3 ultrasparc v9" ;;
            *ultrasparc*) ax_gcc_arch="ultrasparc v9" ;;
            *supersparc*|*tms390z5[[05]]*) ax_gcc_arch="supersparc v8" ;;
            *hypersparc*|*rt62[[056]]*) ax_gcc_arch="hypersparc v8" ;;
            *cypress*) ax_gcc_arch=cypress ;;
          esac ;;

        alphaev5) ax_gcc_arch=ev5 ;;
        alphaev56) ax_gcc_arch=ev56 ;;
        alphapca56) ax_gcc_arch="pca56 ev56" ;;
        alphapca57) ax_gcc_arch="pca57 pca56 ev56" ;;
        alphaev6) ax_gcc_arch=ev6 ;;
        alphaev67) ax_gcc_arch=ev67 ;;
        alphaev68) ax_gcc_arch="ev68 ev67" ;;
        alphaev69) ax_gcc_arch="ev69 ev68 ev67" ;;
        alphaev7) ax_gcc_arch="ev7 ev69 ev68 ev67" ;;
        alphaev79) ax_gcc_arch="ev79 ev7 ev69 ev68 ev67" ;;

        powerpc*)
          cputype=`((grep cpu /proc/cpuinfo | head -n 1 | cut -d: -f2 | cut -d, -f1 | $SED 's/ //g') ; /usr/bin/machine ; /bin/machine; grep CPU /var/run/dmesg.boot | head -n 1 | cut -d" " -f2) 2> /dev/null`
          # The expansion is left unquoted on purpose: word splitting joins the
          # output of the probes above with blanks, which sed then removes.
          cputype=`echo $cputype | $SED -e 's/ppc//g;s/ *//g'`
          case $cputype in
            *750*) ax_gcc_arch="750 G3" ;;
            *740[[0-9]]*) ax_gcc_arch="$cputype 7400 G4" ;;
            *74[[4-5]][[0-9]]*) ax_gcc_arch="$cputype 7450 G4" ;;
            *74[[0-9]][[0-9]]*) ax_gcc_arch="$cputype G4" ;;
            *970*) ax_gcc_arch="970 G5 power4";;
            *POWER4*|*power4*|*gq*) ax_gcc_arch="power4 970";;
            *POWER5*|*power5*|*gr*|*gs*) ax_gcc_arch="power5 power4 970";;
            603ev|8240) ax_gcc_arch="$cputype 603e 603";;
            *POWER7*) ax_gcc_arch="power7";;
            *POWER8*) ax_gcc_arch="power8";;
            *POWER9*) ax_gcc_arch="power9";;
            *POWER10*) ax_gcc_arch="power10";;
            *) ax_gcc_arch=$cputype ;;
          esac
          # Generic last-resort candidate for every PowerPC host.
          ax_gcc_arch="$ax_gcc_arch powerpc"
          ;;

        aarch64)
          # Implementer, architecture and variant fields of the first CPU
          # entry listed in /proc/cpuinfo.
          cpuimpl=`grep 'CPU implementer' /proc/cpuinfo 2> /dev/null | cut -d: -f2 | tr -d " " | head -n 1`
          cpuarch=`grep 'CPU architecture' /proc/cpuinfo 2> /dev/null | cut -d: -f2 | tr -d " " | head -n 1`
          cpuvar=`grep 'CPU variant' /proc/cpuinfo 2> /dev/null | cut -d: -f2 | tr -d " " | head -n 1`
          case $cpuimpl in
            0x42)
              case $cpuarch in
                8)
                  case $cpuvar in
                    0x0) ax_gcc_arch="thunderx2t99 vulcan armv8.1-a armv8-a+lse armv8-a native" ;;
                  esac
                  ;;
              esac
              ;;
            0x43)
              case $cpuarch in
                8)
                  case $cpuvar in
                    0x0) ax_gcc_arch="thunderx armv8-a native" ;;
                    0x1) ax_gcc_arch="thunderx+lse armv8.1-a armv8-a+lse armv8-a native" ;;
                  esac
                  ;;
              esac
              ;;
          esac
          ;;
      esac
    fi # not cross-compiling
  fi # guess arch

  # Two separate test commands joined by && are used instead of the
  # non-portable "test ... -a ..." form.
  if test "x$ax_gcc_arch" != x && test "x$ax_gcc_arch" != xno; then
    if test "x[]m4_default([$1],[yes])" = xyes; then # if we require portable code
      flag_prefixes="-mtune="
      # For clang the candidate is probed with -march= here; an accepted
      # -march=<arch> is turned back into -mtune=<arch> in the loop below.
      if test "x$ax_cv_[]_AC_LANG_ABBREV[]_compiler_vendor" = xclang; then flag_prefixes="-march="; fi
      # -mcpu=$arch and m$arch generate nonportable code on every arch except
      # x86.  And some other arches (e.g. Alpha) don't accept -mtune.  Grrr.
      case $host_cpu in i*86|x86_64*|amd64*) flag_prefixes="$flag_prefixes -mcpu= -m";; esac
    else
      flag_prefixes="-march= -mcpu= -m"
    fi
    # Prefixes form the outer loop, candidates the inner one.  The first
    # flag the compiler accepts is recorded and ends both loops.
    for flag_prefix in $flag_prefixes; do
      for arch in $ax_gcc_arch; do
        flag="$flag_prefix$arch"
        AX_CHECK_COMPILE_FLAG([$flag], [if test "x$ax_cv_[]_AC_LANG_ABBREV[]_compiler_vendor" = xclang; then
          if test "x[]m4_default([$1],[yes])" = xyes; then
            if test "x$flag" = "x-march=$arch"; then flag=-mtune=$arch; fi
          fi
        fi; ax_cv_gcc_archflag=$flag; break])
      done
      test "x$ax_cv_gcc_archflag" = xunknown || break
    done
  fi

fi # $GCC=yes
])
AC_MSG_CHECKING([for gcc architecture flag])
AC_MSG_RESULT([$ax_cv_gcc_archflag])
if test "x$ax_cv_gcc_archflag" = xunknown; then
  m4_default([$3],[:])
else
  m4_default([$2], [CFLAGS="$CFLAGS $ax_cv_gcc_archflag"])
fi
])