From 6c20021826b181e4f98de9937f2f6886e4c6d64e Mon Sep 17 00:00:00 2001 From: Miguel Freitas Date: Sat, 22 Oct 2005 22:02:40 +0000 Subject: commit Flameeyes' optimizations.m4 patch CVS patchset: 7764 CVS date: 2005/10/22 22:02:40 --- m4/Makefile.am | 1 + m4/optimizations.m4 | 262 ++++++++++++++++++++++++++++++++++++++++++++++++++++ 2 files changed, 263 insertions(+) create mode 100644 m4/optimizations.m4 (limited to 'm4') diff --git a/m4/Makefile.am b/m4/Makefile.am index c553cddc7..54bce8516 100644 --- a/m4/Makefile.am +++ b/m4/Makefile.am @@ -31,6 +31,7 @@ EXTRA_DIST = \ libfame.m4 \ ogg.m4 \ opengl.m4 \ + optimizations.m4 \ pkg.m4 \ progtest.m4 \ sdl.m4 \ diff --git a/m4/optimizations.m4 b/m4/optimizations.m4 new file mode 100644 index 000000000..9b45563ea --- /dev/null +++ b/m4/optimizations.m4 @@ -0,0 +1,262 @@ +dnl +dnl M4 macro to add support for extra optimizations +dnl +dnl It understand --enable/--disable-optimizations . +dnl when optimizations are disabled, it does not touch cflags +dnl +dnl Note: always disable while crosscompiling +dnl + +AC_DEFUN([AC_OPTIMIZATIONS], [ + AC_ARG_ENABLE([optimizations], + AC_HELP_STRING([--disable-optimizations], [Don't try to guess what optimization to enable])) + + if test "x$enable_optimizations" != "xno"; then + INLINE_FUNCTIONS=-finline-functions + + if test "$GCC" = yes; then + dnl + dnl check cflags not supported by all gcc versions + dnl eg: -mpreferred-stack-boundary=2 and 2.91.66, + dnl and gcc-2.7.2.3 support a bit less options + dnl + AC_TRY_CFLAGS("-mpreferred-stack-boundary=2", + m_psb="-mpreferred-stack-boundary=2", m_psb="") + AC_TRY_CFLAGS("-fno-strict-aliasing", f_nsa="-fno-strict-aliasing", f_nsa="") + AC_TRY_CFLAGS("-fschedule-insns2", f_si="-fschedule-insns2", f_si="") + AC_TRY_CFLAGS("-mwide-multiply", m_wm="-mwide-multiply", m_wm="") + dnl + dnl gcc 3.1 uses the -f version + dnl + AC_TRY_CFLAGS("-falign-functions=4", f_af="-falign-functions=4", + f_af="-malign-functions=4") + AC_TRY_CFLAGS("-falign-loops=4", f_al="-falign-loops=4", + f_al="-malign-loops=4") + AC_TRY_CFLAGS("-falign-jumps=4", f_aj="-falign-jumps=4", + f_aj="-malign-jumps=4") + dnl + dnl Check for some optimization disabling + dnl needed for win32 code + dnl + AC_TRY_CFLAGS("-fno-omit-frame-pointer", W32_NO_OPTIMIZE="$W32_NO_OPTIMIZE -fno-omit-frame-pointer",) + AC_TRY_CFLAGS("-fno-inline-functions", W32_NO_OPTIMIZE="$W32_NO_OPTIMIZE -fno-inline-functions",) + AC_TRY_CFLAGS("-fno-rename-registers", W32_NO_OPTIMIZE="$W32_NO_OPTIMIZE -fno-rename-registers",) + AC_SUBST(W32_NO_OPTIMIZE) + dnl + dnl Multipass compilation + dnl + AC_TRY_CFLAGS("-fprofile-arcs", PASS1_CFLAGS="-fprofile_arcs $PASS1_CFLAGS",) + AC_TRY_CFLAGS("-fbranch-probabilities", PASS2_CFLAGS="-fbranch-probabilities $PASS2_CFLAGS",) + AC_SUBST(PASS1_CFLAGS) + AC_SUBST(PASS2_CFLAGS) + dnl + dnl Warnings + dnl + CFLAGS="-Wchar-subscripts -Wmissing-declarations -Wmissing-prototypes $CFLAGS" + CFLAGS="-Wnested-externs -Wcast-align $CFLAGS" + dnl some combinations of gcc+glibc produce useless warnings on memset + dnl when compiling with -Wpointer-arith, so we check for this first + AC_MSG_CHECKING(for sane -Wpointer-arith) + SAVE_CFLAGS="$CFLAGS" + CFLAGS="-O2 -Wpointer-arith -Werror $CFLAGS" + AC_TRY_COMPILE([#include ],[int a; memset(&a, 0, sizeof(int));], + [AC_MSG_RESULT(yes); CFLAGS="-Wpointer-arith $SAVE_CFLAGS"], + [AC_MSG_RESULT(no); CFLAGS="$SAVE_CFLAGS"]); + + dnl gcc 3.3.5 (at least) is known to be buggy wrt optimisation and + dnl -finline-functions. Use -fno-inline-functions for gcc < 3.4.0. + + AC_MSG_CHECKING(for gcc 3.4.0 or later) + ARG1="$1" + ARG2="$2" + ARG3="$3" + newGCC="`"$CC" -dumpversion | + awk 'BEGIN { FS = "." }; + 1 { if (($ARG1 * 10000 + $ARG2 * 100 + $ARG3) >= 30400) { print "yes" } }' + `" + AC_MSG_RESULT(${newGCC:-no - assuming bugginess in -finline-functions}) + test "$newGCC" = yes || INLINE_FUNCTIONS=-fno-inline-functions + fi + + dnl Flags not supported by all *cc* variants + AC_TRY_CFLAGS("-Wall", wall="-Wall", wall="") + + CFLAGS="$wall ${CFLAGS}" + DEBUG_CFLAGS="$wall ${CFLAGS}" + + case "$host_or_hostalias" in + i?86-* | k?-* | athlon-* | pentium*) + if test "$GCC" = yes -o "${CC##*/}x" = "iccx" ; then + + if test "$GCC" = yes; then + dnl Check for gcc cpu optimization support + AC_TRY_CFLAGS("-mtune=i386", + sarchopt="-mtune", + AC_TRY_CFLAGS("-mcpu=i386", + sarchopt="-mcpu", + AC_TRY_CFLAGS("-march=i386", + sarchopt="-march", + [ AC_MSG_RESULT(** no cpu optimization supports **) + sarchopt=no + ] + ) + ) + ) + + dnl special check for k7 cpu CC support + AC_TRY_CFLAGS("$sarchopt=athlon", k7cpu="athlon", k7cpu="i686") + + dnl add x86 specific gcc CFLAGS + CFLAGS="-O3 -fomit-frame-pointer $f_af $f_al $f_aj $m_wm $m_psb -fexpensive-optimizations $f_si $f_nsa -ffast-math -funroll-loops $INLINE_FUNCTIONS $CFLAGS" + + DEBUG_CFLAGS="-O $DEBUG_CFLAGS" + + if test x"$sarchopt" != "xno"; then + archopt_val= + + case "$host_or_hostalias" in + i386-*) + archopt_val="i386" ;; + i486-*) + archopt_val="i486" ;; + i586-*) + archopt_val="pentium" + ;; + pentium-mmx-*) + archopt_val="pentium-mmx" + ;; + pentiumpro-* | pentium2-* | i686-*) + archopt_val="pentiumpro" + if test x"$check_athlon" = "xyes"; then + if test -f /proc/cpuinfo; then + modelname=`cat /proc/cpuinfo | grep "model\ name\ :" | sed -e 's/ //g' | cut -d':' -f2` + case "$modelname" in + *Athlon* | *Duron* | *K7*) + archopt_val="$k7cpu" + ;; + VIAEzra) + archopt_val="c3" + ;; + esac + fi + fi + ;; + k6-2-* | k6-3-*) + archopt_val="k6-2" + ;; + k6-*) + archopt_val="k6" + ;; + pentium3-*) + archopt_val="pentium3" + ;; + pentium4-*) + archopt_val="pentium4" + ;; + athlon-4-* | athlon-xp-* | athlon-mp-*) + archopt_val="athlon-4" + ;; + k7-* | athlon-tbird-* | athlon-*) + archopt_val="athlon" + ;; + + esac + if test x"$archopt_val" != x; then + CFLAGS="$sarchopt=$archopt_val $CFLAGS" + DEBUG_CFLAGS="$sarchopt=$archopt_val $DEBUG_CFLAGS" + fi + fi + else + dnl we have the Intel compiler + CFLAGS="-unroll -ipo -ipo_obj -O3 $CFLAGS" + PASS1_CFLAGS="-prof_genx -prof_dir \$(PWD)/\$(top_builddir)/ $PASS1_CFLAGS" + PASS2_CFLAGS="-prof_use -prof_dir \$(PWD)/\$(top_builddir)/ $PASS2_CFLAGS" + AC_SUBST(PASS1_CFLAGS) + AC_SUBST(PASS2_CFLAGS) + fi + + else + dnl add x86 specific cc CFLAGS + CFLAGS="-O $CFLAGS" + DEBUG_CFLAGS="-O $DEBUG_CFLAGS" + AC_DEFINE_UNQUOTED(FPM_64BIT,,[Define to select libmad fixed point arithmetic implementation]) + fi + ;; + alphaev56-*) + CFLAGS="-O3 -mcpu=ev56 -mieee $CFLAGS" + DEBUG_CFLAGS="-O3 -mcpu=ev56 -mieee $DEBUG_CFLAGS" + ;; + alpha*) + CFLAGS="-O3 -mieee $CFLAGS" + DEBUG_CFLAGS="-O3 -mieee $DEBUG_CFLAGS" + ;; + *darwin*) + CFLAGS="-O3 -pipe -fomit-frame-pointer $m_wm $m_psb -fexpensive-optimizations $f_si $f_nsa -ffast-math -funroll-loops $INLINE_FUNCTIONS -no-cpp-precomp -D_INTL_REDIRECT_MACROS $CFLAGS" + DEBUG_CFLAGS="-O3 $DEBUG_CFLAGS" + ;; + ppc-*-linux* | powerpc-*) + CFLAGS="-O3 -pipe -fomit-frame-pointer $m_wm $m_psb -fexpensive-optimizations $f_si $f_nsa -ffast-math -funroll-loops $INLINE_FUNCTIONS $CFLAGS" + DEBUG_CFLAGS="-O3 $DEBUG_CFLAGS" + ;; + sparc*-*-linux*) + CFLAGS="-O3 $cpu_cflags -funroll-loops $INLINE_FUNCTIONS $CFLAGS" + DEBUG_CFLAGS="-O $cpu_cflags -funroll-loops $INLINE_FUNCTIONS $DEBUG_CFLAGS" + + case `uname -m` in + sparc) + cpu_cflags="-mcpu=supersparc -mtune=supersparc" ;; + sparc64) + cpu_cflags="-mcpu=ultrasparc -mtune=ultrasparc" ;; + esac + ;; + sparc-*-solaris*) + if test "$GCC" = yes; then + case `uname -m` in + sun4c) cpu_cflags="-mcpu=v7 -mtune=supersparc" ;; + sun4m) cpu_cflags="-mcpu=v8 -mtune=supersparc" ;; + sun4u) + case `$CC --version 2>/dev/null` in + 1.*|2.*) + # -mcpu=ultrasparc triggers a GCC 2.95.x compiler bug when + # compiling video_out.c: + # gcc: Internal compiler error: program cc1 got fatal signal 11 + # avoid -mcpu=ultrasparc with gcc 2.* + cpu_cflags="-mcpu=v8 -mtune=ultrasparc" + ;; + *) + # GCC 3 or newer should have no problem with -mcpu=ultrasparc + cpu_cflags="-mcpu=ultrasparc -mtune=ultrasparc" + ;; + esac + ;; + esac + cc_optimize_cflags="-O3 $cpu_cflags -funroll-loops $INLINE_FUNCTIONS" + cc_debug_cflags="-O $cpu_cflags -funroll-loops $INLINE_FUNCTIONS" + else + case `uname -m` in + sun4c) cpu_cflags="-xarch=v7" ;; + sun4m) cpu_cflags="-xarch=v8" ;; + sun4u) cpu_cflags="-xarch=v8plusa" ;; + esac + cc_optimize_cflags="-fast $cpu_cflags -xCC" + cc_debug_cflags="-O" + fi + + CFLAGS="$cc_optimize_cflags $CFLAGS" + DEBUG_CFLAGS="$cc_debug_cflags $DEBUG_CFLAGS" + ;; + x86_64-*) + CFLAGS="-O3 -fomit-frame-pointer $m_wm $m_psb -fexpensive-optimizations $f_si $f_nsa -ffast-math -funroll-loops $INLINE_FUNCTIONS $CFLAGS" + DEBUG_CFLAGS="-g $DEBUG_CFLAGS" + ;; + armv4l-*-linux*) + CFLAGS="-O2 -fsigned-char -ffast-math -mcpu=strongarm1100 -fomit-frame-pointer -fthread-jumps -fregmove $CFLAGS" + dnl CFLAGS="-O1 -fforce-mem -fforce-addr -fthread-jumps -fcse-follow-jumps -fcse-skip-blocks -fexpensive-optimizations -fregmove -fschedule-insns2 $INLINE_FUNCTIONS -fsigned-char -fomit-frame-pointer -march=armv4 -mtune=strongarm $CFLAGS" + DEBUG_CFLAGS="-O2 $DEBUG_CFLAGS" + ;; + esac + fi +]) + +dnl Kate modeline: leave at the end +dnl kate: indent-width 2; replace-trailing-space-save 1; space-indent 1; backspace-indents 1; -- cgit v1.2.3