Home | History | Annotate | Download | only in m4
      1 # ===========================================================================
      2 #      http://www.gnu.org/software/autoconf-archive/ax_gcc_archflag.html
      3 # ===========================================================================
      4 #
      5 # SYNOPSIS
      6 #
      7 #   AX_GCC_ARCHFLAG([PORTABLE?], [ACTION-SUCCESS], [ACTION-FAILURE])
      8 #
      9 # DESCRIPTION
     10 #
     11 #   This macro tries to guess the "native" arch corresponding to the target
     12 #   architecture for use with gcc's -march=arch or -mtune=arch flags. If
     13 #   found, the cache variable $ax_cv_gcc_archflag is set to this flag and
     14 #   ACTION-SUCCESS is executed; otherwise $ax_cv_gcc_archflag is set to
     15 #   "unknown" and ACTION-FAILURE is executed. The default ACTION-SUCCESS is
     16 #   to add $ax_cv_gcc_archflag to the end of $CFLAGS.
     17 #
     18 #   PORTABLE? should be either [yes] (default) or [no]. In the former case,
     19 #   the flag is set to -mtune (or equivalent) so that the architecture is
     20 #   only used for tuning, but the instruction set used is still portable. In
     21 #   the latter case, the flag is set to -march (or equivalent) so that
     22 #   architecture-specific instructions are enabled.
     23 #
     24 #   The user can specify --with-gcc-arch=<arch> in order to override the
     25 #   macro's choice of architecture, or --without-gcc-arch to disable this.
     26 #
     27 #   When cross-compiling, or if $CC is not gcc, then ACTION-FAILURE is
     28 #   called unless the user specified --with-gcc-arch manually.
     29 #
     30 #   Requires macros: AX_CHECK_COMPILE_FLAG, AX_GCC_X86_CPUID,
     30 #   AX_COMPILER_VENDOR
     31 #
     32 #   (The main emphasis here is on recent CPUs, on the principle that doing
     33 #   high-performance computing on old hardware is uncommon.)
     34 #
     35 # LICENSE
     36 #
     37 #   Copyright (c) 2008 Steven G. Johnson <stevenj@alum.mit.edu>
     38 #   Copyright (c) 2008 Matteo Frigo
     39 #   Copyright (c) 2014 Tsukasa Oi
     40 #
     41 #   This program is free software: you can redistribute it and/or modify it
     42 #   under the terms of the GNU General Public License as published by the
     43 #   Free Software Foundation, either version 3 of the License, or (at your
     44 #   option) any later version.
     45 #
     46 #   This program is distributed in the hope that it will be useful, but
     47 #   WITHOUT ANY WARRANTY; without even the implied warranty of
     48 #   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General
     49 #   Public License for more details.
     50 #
     51 #   You should have received a copy of the GNU General Public License along
     52 #   with this program. If not, see <http://www.gnu.org/licenses/>.
     53 #
     54 #   As a special exception, the respective Autoconf Macro's copyright owner
     55 #   gives unlimited permission to copy, distribute and modify the configure
     56 #   scripts that are the output of Autoconf when processing the Macro. You
     57 #   need not follow the terms of the GNU General Public License when using
     58 #   or distributing such scripts, even though portions of the text of the
     59 #   Macro appear in them. The GNU General Public License (GPL) does govern
     60 #   all other use of the material that constitutes the Autoconf Macro.
     61 #
     62 #   This special exception to the GPL applies to versions of the Autoconf
     63 #   Macro released by the Autoconf Archive. When you make and distribute a
     64 #   modified version of the Autoconf Macro, you may extend this special
     65 #   exception to the GPL to apply to your modified version as well.
     66 
     67 #serial 17
     68 
     69 AC_DEFUN([AX_GCC_ARCHFLAG],
     70 [AC_REQUIRE([AC_PROG_CC])
     71 AC_REQUIRE([AC_CANONICAL_HOST])
     72 AC_REQUIRE([AC_PROG_SED])
     73 AC_REQUIRE([AX_COMPILER_VENDOR])
     74 
     75 AC_ARG_WITH(gcc-arch, [AS_HELP_STRING([--with-gcc-arch=<arch>], [use architecture <arch> for gcc -march/-mtune, instead of guessing])],
     76 	ax_gcc_arch=$withval, ax_gcc_arch=yes)
     77 
     78 AC_MSG_CHECKING([for gcc architecture flag])
     79 AC_MSG_RESULT([])
     80 AC_CACHE_VAL(ax_cv_gcc_archflag,
     81 [
     82 ax_cv_gcc_archflag="unknown"
     83 
     84 if test "$GCC" = yes; then
     85 
     86 if test "x$ax_gcc_arch" = xyes; then
     87 ax_gcc_arch=""
     88 if test "$cross_compiling" = no; then
     89 case $host_cpu in
     90   i[[3456]]86*|x86_64*|amd64*) # use cpuid codes
     91      AX_GCC_X86_CPUID(0)
     92      AX_GCC_X86_CPUID(1)
     93      case $ax_cv_gcc_x86_cpuid_0 in
     94        *:756e6547:6c65746e:49656e69) # Intel
     95           case $ax_cv_gcc_x86_cpuid_1 in
     96 	    *5[[4578]]?:*:*:*) ax_gcc_arch="pentium-mmx pentium" ;;
     97 	    *5[[123]]?:*:*:*) ax_gcc_arch=pentium ;;
     98 	    *0?61?:*:*:*|?61?:*:*:*|61?:*:*:*) ax_gcc_arch=pentiumpro ;;
     99 	    *0?6[[356]]?:*:*:*|?6[[356]]?:*:*:*|6[[356]]?:*:*:*) ax_gcc_arch="pentium2 pentiumpro" ;;
    100 	    *0?6[[78ab]]?:*:*:*|?6[[78ab]]?:*:*:*|6[[78ab]]?:*:*:*) ax_gcc_arch="pentium3 pentiumpro" ;;
    101 	    *0?6[[9d]]?:*:*:*|?6[[9d]]?:*:*:*|6[[9d]]?:*:*:*|*1?65?:*:*:*) ax_gcc_arch="pentium-m pentium3 pentiumpro" ;;
    102 	    *0?6e?:*:*:*|?6e?:*:*:*|6e?:*:*:*) ax_gcc_arch="yonah pentium-m pentium3 pentiumpro" ;;
    103 	    *0?6f?:*:*:*|?6f?:*:*:*|6f?:*:*:*|*1?66?:*:*:*) ax_gcc_arch="core2 pentium-m pentium3 pentiumpro" ;;
    104 	    *1?6[[7d]]?:*:*:*) ax_gcc_arch="penryn core2 pentium-m pentium3 pentiumpro" ;;
    105 	    *1?6[[aef]]?:*:*:*|*2?6e?:*:*:*) ax_gcc_arch="nehalem corei7 core2 pentium-m pentium3 pentiumpro" ;;
    106 	    *2?6[[5cf]]?:*:*:*) ax_gcc_arch="westmere corei7 core2 pentium-m pentium3 pentiumpro" ;;
    107 	    *2?6[[ad]]?:*:*:*) ax_gcc_arch="sandybridge corei7-avx corei7 core2 pentium-m pentium3 pentiumpro" ;;
    108 	    *3?6[[ae]]?:*:*:*) ax_gcc_arch="ivybridge core-avx-i corei7-avx corei7 core2 pentium-m pentium3 pentiumpro" ;;
    109 	    *3?6[[cf]]?:*:*:*|*4?6[[56]]?:*:*:*) ax_gcc_arch="haswell core-avx2 core-avx-i corei7-avx corei7 core2 pentium-m pentium3 pentiumpro" ;;
    110 	    *3?6d?:*:*:*) ax_gcc_arch="broadwell core-avx2 core-avx-i corei7-avx corei7 core2 pentium-m pentium3 pentiumpro" ;;
    111 	    *1?6c?:*:*:*|*2?6[[67]]?:*:*:*|*3?6[[56]]?:*:*:*) ax_gcc_arch="bonnell atom core2 pentium-m pentium3 pentiumpro" ;;
    112 	    *3?67?:*:*:*|*[[45]]?6[[ad]]?:*:*:*) ax_gcc_arch="silvermont atom core2 pentium-m pentium3 pentiumpro" ;;
    113 	    *000?f[[012]]?:*:*:*|?f[[012]]?:*:*:*|f[[012]]?:*:*:*) ax_gcc_arch="pentium4 pentiumpro" ;;
    114 	    *000?f[[346]]?:*:*:*|?f[[346]]?:*:*:*|f[[346]]?:*:*:*) ax_gcc_arch="nocona prescott pentium4 pentiumpro" ;;
    115 	    # fallback
    116 	    *5??:*:*:*) ax_gcc_arch=pentium ;;
    117 	    *??6??:*:*:*) ax_gcc_arch="core2 pentiumpro" ;;
    118 	    *6??:*:*:*) ax_gcc_arch=pentiumpro ;;
    119 	    *00??f??:*:*:*|??f??:*:*:*|?f??:*:*:*|f??:*:*:*) ax_gcc_arch="pentium4 pentiumpro" ;;
    120           esac ;;
    121        *:68747541:444d4163:69746e65) # AMD
    122           case $ax_cv_gcc_x86_cpuid_1 in
    123 	    *5[[67]]?:*:*:*) ax_gcc_arch=k6 ;;
    124 	    *5[[8]]?:*:*:*) ax_gcc_arch="k6-2 k6" ;;
    125 	    *5[[9d]]?:*:*:*) ax_gcc_arch="k6-3 k6" ;;
    126 	    *6[[12]]?:*:*:*) ax_gcc_arch="athlon k7" ;;
    127 	    *6[[34]]?:*:*:*) ax_gcc_arch="athlon-tbird k7" ;;
    128 	    *6[[678a]]?:*:*:*) ax_gcc_arch="athlon-xp athlon-4 athlon k7" ;;
    129 	    *000?f[[4578bcef]]?:*:*:*|?f[[4578bcef]]?:*:*:*|f[[4578bcef]]?:*:*:*|*001?f[[4578bcf]]?:*:*:*|1?f[[4578bcf]]?:*:*:*) ax_gcc_arch="athlon64 k8" ;;
    130 	    *002?f[[13457bcf]]?:*:*:*|2?f[[13457bcf]]?:*:*:*|*004?f[[138bcf]]?:*:*:*|4?f[[138bcf]]?:*:*:*|*005?f[[df]]?:*:*:*|5?f[[df]]?:*:*:*|*006?f[[8bcf]]?:*:*:*|6?f[[8bcf]]?:*:*:*|*007?f[[cf]]?:*:*:*|7?f[[cf]]?:*:*:*|*00c?f1?:*:*:*|c?f1?:*:*:*|*020?f3?:*:*:*|20?f3?:*:*:*) ax_gcc_arch="athlon64-sse3 k8-sse3 athlon64 k8" ;;
    131 	    *010?f[[245689a]]?:*:*:*|10?f[[245689a]]?:*:*:*|*030?f1?:*:*:*|30?f1?:*:*:*) ax_gcc_arch="barcelona amdfam10 k8" ;;
    132 	    *050?f[[12]]?:*:*:*|50?f[[12]]?:*:*:*) ax_gcc_arch="btver1 amdfam10 k8" ;;
    133 	    *060?f1?:*:*:*|60?f1?:*:*:*) ax_gcc_arch="bdver1 amdfam10 k8" ;;
    134 	    *060?f2?:*:*:*|60?f2?:*:*:*|*061?f[[03]]?:*:*:*|61?f[[03]]?:*:*:*) ax_gcc_arch="bdver2 bdver1 amdfam10 k8" ;;
    135 	    *063?f0?:*:*:*|63?f0?:*:*:*) ax_gcc_arch="bdver3 bdver2 bdver1 amdfam10 k8" ;;
    136 	    *07[[03]]?f0?:*:*:*|7[[03]]?f0?:*:*:*) ax_gcc_arch="btver2 btver1 amdfam10 k8" ;;
    137 	    # fallback
    138 	    *0[[13]]??f??:*:*:*|[[13]]??f??:*:*:*) ax_gcc_arch="barcelona amdfam10 k8" ;;
    139 	    *020?f??:*:*:*|20?f??:*:*:*) ax_gcc_arch="athlon64-sse3 k8-sse3 athlon64 k8" ;;
    140 	    *05??f??:*:*:*|5??f??:*:*:*) ax_gcc_arch="btver1 amdfam10 k8" ;;
    141 	    *060?f??:*:*:*|60?f??:*:*:*) ax_gcc_arch="bdver1 amdfam10 k8" ;;
    142 	    *061?f??:*:*:*|61?f??:*:*:*) ax_gcc_arch="bdver2 bdver1 amdfam10 k8" ;;
    143 	    *06??f??:*:*:*|6??f??:*:*:*) ax_gcc_arch="bdver3 bdver2 bdver1 amdfam10 k8" ;;
    144 	    *070?f??:*:*:*|70?f??:*:*:*) ax_gcc_arch="btver2 btver1 amdfam10 k8" ;;
    145 	    *???f??:*:*:*) ax_gcc_arch="amdfam10 k8" ;;
    146           esac ;;
    147 	*:746e6543:736c7561:48727561) # IDT / VIA (Centaur)
    148 	   case $ax_cv_gcc_x86_cpuid_1 in
    149 	     *54?:*:*:*) ax_gcc_arch=winchip-c6 ;;
    150 	     *5[[89]]?:*:*:*) ax_gcc_arch=winchip2 ;;
    151 	     *66?:*:*:*) ax_gcc_arch=winchip2 ;;
    152 	     *6[[78]]?:*:*:*) ax_gcc_arch=c3 ;;
    153 	     *6[[9adf]]?:*:*:*) ax_gcc_arch="c3-2 c3" ;;
    154 	   esac ;;
    155      esac
    156      if test x"$ax_gcc_arch" = x; then # fallback
    157 	case $host_cpu in
    158 	  i586*) ax_gcc_arch=pentium ;;
    159 	  i686*) ax_gcc_arch=pentiumpro ;;
    160         esac
    161      fi
    162      ;;
    163 
    164   sparc*)
    165      AC_PATH_PROG([PRTDIAG], [prtdiag], [prtdiag], [$PATH:/usr/platform/`uname -i`/sbin/:/usr/platform/`uname -m`/sbin/])
    166      cputype=`(((grep cpu /proc/cpuinfo | cut -d: -f2) ; ($PRTDIAG -v |grep -i sparc) ; grep -i cpu /var/run/dmesg.boot ) | head -n 1) 2> /dev/null`
    167      cputype=`echo "$cputype" | tr -d ' -' | $SED 's/SPARCIIi/SPARCII/' |tr $as_cr_LETTERS $as_cr_letters`
    168      case $cputype in
    169          *ultrasparciv*) ax_gcc_arch="ultrasparc4 ultrasparc3 ultrasparc v9" ;;
    170          *ultrasparciii*) ax_gcc_arch="ultrasparc3 ultrasparc v9" ;;
    171          *ultrasparc*) ax_gcc_arch="ultrasparc v9" ;;
    172          *supersparc*|*tms390z5[[05]]*) ax_gcc_arch="supersparc v8" ;;
    173          *hypersparc*|*rt62[[056]]*) ax_gcc_arch="hypersparc v8" ;;
    174          *cypress*) ax_gcc_arch=cypress ;;
    175      esac ;;
    176 
    177   alphaev5) ax_gcc_arch=ev5 ;;
    178   alphaev56) ax_gcc_arch=ev56 ;;
    179   alphapca56) ax_gcc_arch="pca56 ev56" ;;
    180   alphapca57) ax_gcc_arch="pca57 pca56 ev56" ;;
    181   alphaev6) ax_gcc_arch=ev6 ;;
    182   alphaev67) ax_gcc_arch=ev67 ;;
    183   alphaev68) ax_gcc_arch="ev68 ev67" ;;
    184   alphaev69) ax_gcc_arch="ev69 ev68 ev67" ;;
    185   alphaev7) ax_gcc_arch="ev7 ev69 ev68 ev67" ;;
    186   alphaev79) ax_gcc_arch="ev79 ev7 ev69 ev68 ev67" ;;
    187 
    188   powerpc*)
    189      cputype=`((grep cpu /proc/cpuinfo | head -n 1 | cut -d: -f2 | cut -d, -f1 | $SED 's/ //g') ; /usr/bin/machine ; /bin/machine; grep CPU /var/run/dmesg.boot | head -n 1 | cut -d" " -f2) 2> /dev/null`
    190      cputype=`echo $cputype | $SED -e 's/ppc//g;s/ *//g'`
    191      case $cputype in
    192        *750*) ax_gcc_arch="750 G3" ;;
    193        *740[[0-9]]*) ax_gcc_arch="$cputype 7400 G4" ;;
    194        *74[[4-5]][[0-9]]*) ax_gcc_arch="$cputype 7450 G4" ;;
    195        *74[[0-9]][[0-9]]*) ax_gcc_arch="$cputype G4" ;;
    196        *970*) ax_gcc_arch="970 G5 power4";;
    197        *POWER4*|*power4*|*gq*) ax_gcc_arch="power4 970";;
    198        *POWER5*|*power5*|*gr*|*gs*) ax_gcc_arch="power5 power4 970";;
    199        603ev|8240) ax_gcc_arch="$cputype 603e 603";;
    200        *) ax_gcc_arch=$cputype ;;
    201      esac
    202      ax_gcc_arch="$ax_gcc_arch powerpc"
    203      ;;
    204 esac
    205 fi # not cross-compiling
    206 fi # guess arch
    207 
    208 if test "x$ax_gcc_arch" != x -a "x$ax_gcc_arch" != xno; then
    209 if test "x[]m4_default([$1],yes)" = xyes; then # if we require portable code
    210   flag_prefixes="-mtune="
    211   if test "x$ax_cv_[]_AC_LANG_ABBREV[]_compiler_vendor" = xclang; then flag_prefixes="-march="; fi
    212   # -mcpu=$arch and m$arch generate nonportable code on every arch except
    213   # x86.  And some other arches (e.g. Alpha) don't accept -mtune.  Grrr.
    214   case $host_cpu in i*86|x86_64*|amd64*) flag_prefixes="$flag_prefixes -mcpu= -m";; esac
    215 else
    216   flag_prefixes="-march= -mcpu= -m"
    217 fi
    218 for flag_prefix in $flag_prefixes; do
    219   for arch in $ax_gcc_arch; do
    220     flag="$flag_prefix$arch"
    221     AX_CHECK_COMPILE_FLAG($flag, [if test "x$ax_cv_[]_AC_LANG_ABBREV[]_compiler_vendor" = xclang; then
    222       if test "x[]m4_default([$1],yes)" = xyes; then
    223 	if test "x$flag" = "x-march=$arch"; then flag=-mtune=$arch; fi
    224       fi
    225     fi; ax_cv_gcc_archflag=$flag; break])
    226   done
    227   test "x$ax_cv_gcc_archflag" = xunknown || break
    228 done
    229 fi
    230 
    231 fi # $GCC=yes
    232 ])
    233 AC_MSG_CHECKING([for gcc architecture flag])
    234 AC_MSG_RESULT($ax_cv_gcc_archflag)
    235 if test "x$ax_cv_gcc_archflag" = xunknown; then
    236   m4_default([$3],:)
    237 else
    238   m4_default([$2], [CFLAGS="$CFLAGS $ax_cv_gcc_archflag"])
    239 fi
    240 ])
    241