summaryrefslogtreecommitdiff
path: root/m4
diff options
context:
space:
mode:
Diffstat (limited to 'm4')
-rw-r--r--m4/Makefile.am1
-rw-r--r--m4/optimizations.m4262
2 files changed, 263 insertions, 0 deletions
diff --git a/m4/Makefile.am b/m4/Makefile.am
index c553cddc7..54bce8516 100644
--- a/m4/Makefile.am
+++ b/m4/Makefile.am
@@ -31,6 +31,7 @@ EXTRA_DIST = \
libfame.m4 \
ogg.m4 \
opengl.m4 \
+ optimizations.m4 \
pkg.m4 \
progtest.m4 \
sdl.m4 \
diff --git a/m4/optimizations.m4 b/m4/optimizations.m4
new file mode 100644
index 000000000..9b45563ea
--- /dev/null
+++ b/m4/optimizations.m4
@@ -0,0 +1,262 @@
+dnl
+dnl M4 macro to add support for extra optimizations
+dnl
+dnl It understand --enable/--disable-optimizations .
+dnl when optimizations are disabled, it does not touch cflags
+dnl
+dnl Note: always disable while crosscompiling
+dnl
+
+AC_DEFUN([AC_OPTIMIZATIONS], [
+ AC_ARG_ENABLE([optimizations],
+ AC_HELP_STRING([--disable-optimizations], [Don't try to guess what optimization to enable]))
+
+ if test "x$enable_optimizations" != "xno"; then
+ INLINE_FUNCTIONS=-finline-functions
+
+ if test "$GCC" = yes; then
+ dnl
+ dnl check cflags not supported by all gcc versions
+ dnl eg: -mpreferred-stack-boundary=2 and 2.91.66,
+ dnl and gcc-2.7.2.3 support a bit less options
+ dnl
+ AC_TRY_CFLAGS("-mpreferred-stack-boundary=2",
+ m_psb="-mpreferred-stack-boundary=2", m_psb="")
+ AC_TRY_CFLAGS("-fno-strict-aliasing", f_nsa="-fno-strict-aliasing", f_nsa="")
+ AC_TRY_CFLAGS("-fschedule-insns2", f_si="-fschedule-insns2", f_si="")
+ AC_TRY_CFLAGS("-mwide-multiply", m_wm="-mwide-multiply", m_wm="")
+ dnl
+ dnl gcc 3.1 uses the -f version
+ dnl
+ AC_TRY_CFLAGS("-falign-functions=4", f_af="-falign-functions=4",
+ f_af="-malign-functions=4")
+ AC_TRY_CFLAGS("-falign-loops=4", f_al="-falign-loops=4",
+ f_al="-malign-loops=4")
+ AC_TRY_CFLAGS("-falign-jumps=4", f_aj="-falign-jumps=4",
+ f_aj="-malign-jumps=4")
+ dnl
+ dnl Check for some optimization disabling
+ dnl needed for win32 code
+ dnl
+ AC_TRY_CFLAGS("-fno-omit-frame-pointer", W32_NO_OPTIMIZE="$W32_NO_OPTIMIZE -fno-omit-frame-pointer",)
+ AC_TRY_CFLAGS("-fno-inline-functions", W32_NO_OPTIMIZE="$W32_NO_OPTIMIZE -fno-inline-functions",)
+ AC_TRY_CFLAGS("-fno-rename-registers", W32_NO_OPTIMIZE="$W32_NO_OPTIMIZE -fno-rename-registers",)
+ AC_SUBST(W32_NO_OPTIMIZE)
+ dnl
+ dnl Multipass compilation
+ dnl
+ AC_TRY_CFLAGS("-fprofile-arcs", PASS1_CFLAGS="-fprofile_arcs $PASS1_CFLAGS",)
+ AC_TRY_CFLAGS("-fbranch-probabilities", PASS2_CFLAGS="-fbranch-probabilities $PASS2_CFLAGS",)
+ AC_SUBST(PASS1_CFLAGS)
+ AC_SUBST(PASS2_CFLAGS)
+ dnl
+ dnl Warnings
+ dnl
+ CFLAGS="-Wchar-subscripts -Wmissing-declarations -Wmissing-prototypes $CFLAGS"
+ CFLAGS="-Wnested-externs -Wcast-align $CFLAGS"
+ dnl some combinations of gcc+glibc produce useless warnings on memset
+ dnl when compiling with -Wpointer-arith, so we check for this first
+ AC_MSG_CHECKING(for sane -Wpointer-arith)
+ SAVE_CFLAGS="$CFLAGS"
+ CFLAGS="-O2 -Wpointer-arith -Werror $CFLAGS"
+ AC_TRY_COMPILE([#include <string.h>],[int a; memset(&a, 0, sizeof(int));],
+ [AC_MSG_RESULT(yes); CFLAGS="-Wpointer-arith $SAVE_CFLAGS"],
+ [AC_MSG_RESULT(no); CFLAGS="$SAVE_CFLAGS"]);
+
+ dnl gcc 3.3.5 (at least) is known to be buggy wrt optimisation and
+ dnl -finline-functions. Use -fno-inline-functions for gcc < 3.4.0.
+
+ AC_MSG_CHECKING(for gcc 3.4.0 or later)
+ ARG1="$1"
+ ARG2="$2"
+ ARG3="$3"
+ newGCC="`"$CC" -dumpversion |
+ awk 'BEGIN { FS = "." };
+ 1 { if (($ARG1 * 10000 + $ARG2 * 100 + $ARG3) >= 30400) { print "yes" } }'
+ `"
+ AC_MSG_RESULT(${newGCC:-no - assuming bugginess in -finline-functions})
+ test "$newGCC" = yes || INLINE_FUNCTIONS=-fno-inline-functions
+ fi
+
+ dnl Flags not supported by all *cc* variants
+ AC_TRY_CFLAGS("-Wall", wall="-Wall", wall="")
+
+ CFLAGS="$wall ${CFLAGS}"
+ DEBUG_CFLAGS="$wall ${CFLAGS}"
+
+ case "$host_or_hostalias" in
+ i?86-* | k?-* | athlon-* | pentium*)
+ if test "$GCC" = yes -o "${CC##*/}x" = "iccx" ; then
+
+ if test "$GCC" = yes; then
+ dnl Check for gcc cpu optimization support
+ AC_TRY_CFLAGS("-mtune=i386",
+ sarchopt="-mtune",
+ AC_TRY_CFLAGS("-mcpu=i386",
+ sarchopt="-mcpu",
+ AC_TRY_CFLAGS("-march=i386",
+ sarchopt="-march",
+ [ AC_MSG_RESULT(** no cpu optimization supports **)
+ sarchopt=no
+ ]
+ )
+ )
+ )
+
+ dnl special check for k7 cpu CC support
+ AC_TRY_CFLAGS("$sarchopt=athlon", k7cpu="athlon", k7cpu="i686")
+
+ dnl add x86 specific gcc CFLAGS
+ CFLAGS="-O3 -fomit-frame-pointer $f_af $f_al $f_aj $m_wm $m_psb -fexpensive-optimizations $f_si $f_nsa -ffast-math -funroll-loops $INLINE_FUNCTIONS $CFLAGS"
+
+ DEBUG_CFLAGS="-O $DEBUG_CFLAGS"
+
+ if test x"$sarchopt" != "xno"; then
+ archopt_val=
+
+ case "$host_or_hostalias" in
+ i386-*)
+ archopt_val="i386" ;;
+ i486-*)
+ archopt_val="i486" ;;
+ i586-*)
+ archopt_val="pentium"
+ ;;
+ pentium-mmx-*)
+ archopt_val="pentium-mmx"
+ ;;
+ pentiumpro-* | pentium2-* | i686-*)
+ archopt_val="pentiumpro"
+ if test x"$check_athlon" = "xyes"; then
+ if test -f /proc/cpuinfo; then
+ modelname=`cat /proc/cpuinfo | grep "model\ name\ :" | sed -e 's/ //g' | cut -d':' -f2`
+ case "$modelname" in
+ *Athlon* | *Duron* | *K7*)
+ archopt_val="$k7cpu"
+ ;;
+ VIAEzra)
+ archopt_val="c3"
+ ;;
+ esac
+ fi
+ fi
+ ;;
+ k6-2-* | k6-3-*)
+ archopt_val="k6-2"
+ ;;
+ k6-*)
+ archopt_val="k6"
+ ;;
+ pentium3-*)
+ archopt_val="pentium3"
+ ;;
+ pentium4-*)
+ archopt_val="pentium4"
+ ;;
+ athlon-4-* | athlon-xp-* | athlon-mp-*)
+ archopt_val="athlon-4"
+ ;;
+ k7-* | athlon-tbird-* | athlon-*)
+ archopt_val="athlon"
+ ;;
+
+ esac
+ if test x"$archopt_val" != x; then
+ CFLAGS="$sarchopt=$archopt_val $CFLAGS"
+ DEBUG_CFLAGS="$sarchopt=$archopt_val $DEBUG_CFLAGS"
+ fi
+ fi
+ else
+ dnl we have the Intel compiler
+ CFLAGS="-unroll -ipo -ipo_obj -O3 $CFLAGS"
+ PASS1_CFLAGS="-prof_genx -prof_dir \$(PWD)/\$(top_builddir)/ $PASS1_CFLAGS"
+ PASS2_CFLAGS="-prof_use -prof_dir \$(PWD)/\$(top_builddir)/ $PASS2_CFLAGS"
+ AC_SUBST(PASS1_CFLAGS)
+ AC_SUBST(PASS2_CFLAGS)
+ fi
+
+ else
+ dnl add x86 specific cc CFLAGS
+ CFLAGS="-O $CFLAGS"
+ DEBUG_CFLAGS="-O $DEBUG_CFLAGS"
+ AC_DEFINE_UNQUOTED(FPM_64BIT,,[Define to select libmad fixed point arithmetic implementation])
+ fi
+ ;;
+ alphaev56-*)
+ CFLAGS="-O3 -mcpu=ev56 -mieee $CFLAGS"
+ DEBUG_CFLAGS="-O3 -mcpu=ev56 -mieee $DEBUG_CFLAGS"
+ ;;
+ alpha*)
+ CFLAGS="-O3 -mieee $CFLAGS"
+ DEBUG_CFLAGS="-O3 -mieee $DEBUG_CFLAGS"
+ ;;
+ *darwin*)
+ CFLAGS="-O3 -pipe -fomit-frame-pointer $m_wm $m_psb -fexpensive-optimizations $f_si $f_nsa -ffast-math -funroll-loops $INLINE_FUNCTIONS -no-cpp-precomp -D_INTL_REDIRECT_MACROS $CFLAGS"
+ DEBUG_CFLAGS="-O3 $DEBUG_CFLAGS"
+ ;;
+ ppc-*-linux* | powerpc-*)
+ CFLAGS="-O3 -pipe -fomit-frame-pointer $m_wm $m_psb -fexpensive-optimizations $f_si $f_nsa -ffast-math -funroll-loops $INLINE_FUNCTIONS $CFLAGS"
+ DEBUG_CFLAGS="-O3 $DEBUG_CFLAGS"
+ ;;
+ sparc*-*-linux*)
+ CFLAGS="-O3 $cpu_cflags -funroll-loops $INLINE_FUNCTIONS $CFLAGS"
+ DEBUG_CFLAGS="-O $cpu_cflags -funroll-loops $INLINE_FUNCTIONS $DEBUG_CFLAGS"
+
+ case `uname -m` in
+ sparc)
+ cpu_cflags="-mcpu=supersparc -mtune=supersparc" ;;
+ sparc64)
+ cpu_cflags="-mcpu=ultrasparc -mtune=ultrasparc" ;;
+ esac
+ ;;
+ sparc-*-solaris*)
+ if test "$GCC" = yes; then
+ case `uname -m` in
+ sun4c) cpu_cflags="-mcpu=v7 -mtune=supersparc" ;;
+ sun4m) cpu_cflags="-mcpu=v8 -mtune=supersparc" ;;
+ sun4u)
+ case `$CC --version 2>/dev/null` in
+ 1.*|2.*)
+ # -mcpu=ultrasparc triggers a GCC 2.95.x compiler bug when
+ # compiling video_out.c:
+ # gcc: Internal compiler error: program cc1 got fatal signal 11
+ # avoid -mcpu=ultrasparc with gcc 2.*
+ cpu_cflags="-mcpu=v8 -mtune=ultrasparc"
+ ;;
+ *)
+ # GCC 3 or newer should have no problem with -mcpu=ultrasparc
+ cpu_cflags="-mcpu=ultrasparc -mtune=ultrasparc"
+ ;;
+ esac
+ ;;
+ esac
+ cc_optimize_cflags="-O3 $cpu_cflags -funroll-loops $INLINE_FUNCTIONS"
+ cc_debug_cflags="-O $cpu_cflags -funroll-loops $INLINE_FUNCTIONS"
+ else
+ case `uname -m` in
+ sun4c) cpu_cflags="-xarch=v7" ;;
+ sun4m) cpu_cflags="-xarch=v8" ;;
+ sun4u) cpu_cflags="-xarch=v8plusa" ;;
+ esac
+ cc_optimize_cflags="-fast $cpu_cflags -xCC"
+ cc_debug_cflags="-O"
+ fi
+
+ CFLAGS="$cc_optimize_cflags $CFLAGS"
+ DEBUG_CFLAGS="$cc_debug_cflags $DEBUG_CFLAGS"
+ ;;
+ x86_64-*)
+ CFLAGS="-O3 -fomit-frame-pointer $m_wm $m_psb -fexpensive-optimizations $f_si $f_nsa -ffast-math -funroll-loops $INLINE_FUNCTIONS $CFLAGS"
+ DEBUG_CFLAGS="-g $DEBUG_CFLAGS"
+ ;;
+ armv4l-*-linux*)
+ CFLAGS="-O2 -fsigned-char -ffast-math -mcpu=strongarm1100 -fomit-frame-pointer -fthread-jumps -fregmove $CFLAGS"
+ dnl CFLAGS="-O1 -fforce-mem -fforce-addr -fthread-jumps -fcse-follow-jumps -fcse-skip-blocks -fexpensive-optimizations -fregmove -fschedule-insns2 $INLINE_FUNCTIONS -fsigned-char -fomit-frame-pointer -march=armv4 -mtune=strongarm $CFLAGS"
+ DEBUG_CFLAGS="-O2 $DEBUG_CFLAGS"
+ ;;
+ esac
+ fi
+])
+
+dnl Kate modeline: leave at the end
+dnl kate: indent-width 2; replace-trailing-space-save 1; space-indent 1; backspace-indents 1;