xref: /netbsd-src/external/lgpl3/gmp/dist/tune/Makefile.am (revision 72c7faa4dbb41dbb0238d6b4a109da0d4b236dd4)
1## Process this file with automake to generate Makefile.in
2
3# Copyright 2000-2003, 2005-2011 Free Software Foundation, Inc.
4#
5#  This file is part of the GNU MP Library.
6#
7#  The GNU MP Library is free software; you can redistribute it and/or modify
8#  it under the terms of either:
9#
10#    * the GNU Lesser General Public License as published by the Free
11#      Software Foundation; either version 3 of the License, or (at your
12#      option) any later version.
13#
14#  or
15#
16#    * the GNU General Public License as published by the Free Software
17#      Foundation; either version 2 of the License, or (at your option) any
18#      later version.
19#
20#  or both in parallel, as here.
21#
22#  The GNU MP Library is distributed in the hope that it will be useful, but
23#  WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
24#  or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
25#  for more details.
26#
27#  You should have received copies of the GNU General Public License and the
28#  GNU Lesser General Public License along with the GNU MP Library.  If not,
29#  see https://www.gnu.org/licenses/.
30
31
32AM_CPPFLAGS = -I$(top_srcdir) -I$(top_srcdir)/tests
33AM_LDFLAGS = -no-install
34
35EXTRA_DIST = alpha.asm pentium.asm sparcv9.asm hppa.asm hppa2.asm hppa2w.asm \
36  ia64.asm powerpc.asm powerpc64.asm x86_64.asm many.pl
37noinst_HEADERS = speed.h
38
39# Prefer -static on the speed and tune programs, since that can avoid
40# overheads of shared library linkages on some systems.  Libtool tends to
41# botch -static if configured with --disable-static, perhaps reasonably
42# enough.  In any event under --disable-static the only choice is a dynamic
43# link so there's no point in -static.
44#
45if ENABLE_STATIC
46STATIC = -static
47else
48STATIC =
49endif
50
51
52EXTRA_LTLIBRARIES = libspeed.la
53
54libspeed_la_SOURCES =							\
55  common.c divrem1div.c divrem1inv.c divrem2div.c divrem2inv.c		\
56  div_qr_1n_pi1_1.c div_qr_1n_pi1_2.c div_qr_1_tune.c			\
57  freq.c								\
58  gcdext_single.c gcdext_double.c gcdextod.c gcdextos.c			\
59  hgcd_lehmer.c hgcd_appr_lehmer.c hgcd_reduce_1.c hgcd_reduce_2.c	\
60  jacbase1.c jacbase2.c jacbase3.c jacbase4.c				\
61  hgcd2-1.c hgcd2-2.c hgcd2-3.c hgcd2-4.c hgcd2-5.c			\
62  mod_1_div.c mod_1_inv.c mod_1_1-1.c mod_1_1-2.c modlinv.c		\
63  noop.c powm_mod.c powm_redc.c pre_divrem_1.c				\
64  set_strb.c set_strs.c set_strp.c time.c
65
66libspeed_la_DEPENDENCIES = $(SPEED_CYCLECOUNTER_OBJ) \
67  $(top_builddir)/tests/libtests.la $(top_builddir)/libgmp.la
68libspeed_la_LIBADD = $(libspeed_la_DEPENDENCIES) $(LIBM)
69libspeed_la_LDFLAGS = $(STATIC)
70
71$(top_builddir)/tests/libtests.la:
72	cd $(top_builddir)/tests; $(MAKE) $(AM_MAKEFLAGS) libtests.la
73
74
75# The library code is faster static than shared on some systems, so do
76# tuning and measuring with static, since users who care about maximizing
77# speed will be using that.  speed-dynamic exists to show the difference.
78#
79# On Solaris 8, gcc 2.95.2 -static is somehow broken (it creates executables
80# that immediately seg fault), so -all-static is not used.  The only thing
81# -all-static does is make libc static linked as well as libgmp, and that
82# makes a difference only when measuring malloc and friends in the speed
83# program.  This can always be forced with "make speed_LDFLAGS=-all-static
84# ..." if desired, see tune/README.
85
86EXTRA_PROGRAMS = speed speed-dynamic speed-ext tuneup tune-gcd-p
87
88DEPENDENCIES = libspeed.la
89LDADD = $(DEPENDENCIES) $(TUNE_LIBS)
90
91speed_SOURCES = speed.c
92speed_LDFLAGS = $(STATIC)
93
94speed_dynamic_SOURCES = speed.c
95
96speed_ext_SOURCES = speed-ext.c
97speed_ext_LDFLAGS = $(STATIC)
98
99tuneup_SOURCES = tuneup.c hgcd2.c
100nodist_tuneup_SOURCES = sqr_basecase.c fac_ui.c $(TUNE_MPN_SRCS)
101tuneup_DEPENDENCIES = $(TUNE_SQR_OBJ) libspeed.la
102tuneup_LDADD = $(tuneup_DEPENDENCIES) $(TUNE_LIBS)
103tuneup_LDFLAGS = $(STATIC)
104
105tune_gcd_p_SOURCES = tune-gcd-p.c
106tune_gcd_p_DEPENDENCIES = ../mpn/gcd.c
107tune_gcd_p_LDFLAGS = $(STATIC)
108
109
110tune:
111	$(MAKE) $(AM_MAKEFLAGS) tuneup$(EXEEXT)
112	./tuneup
113
114allprogs: $(EXTRA_PROGRAMS)
115
116# $(MANY_CLEAN) and $(MANY_DISTCLEAN) are hooks for many.pl
117CLEANFILES = $(EXTRA_PROGRAMS) $(EXTRA_LTLIBRARIES) \
118	$(TUNE_MPN_SRCS) fac_ui.c sqr_asm.asm \
119	stg.gnuplot stg.data \
120	mtg.gnuplot mtg.data \
121	fibg.gnuplot fibg.data \
122	graph.gnuplot graph.data \
123	$(MANY_CLEAN)
124DISTCLEANFILES = sqr_basecase.c  $(MANY_DISTCLEAN)
125
126
127# Generating these little files at build time seems better than including
128# them in the distribution, since the list can be changed more easily.
129#
130# mpn/generic/tdiv_qr.c uses mpn_divrem_1 and mpn_divrem_2, but only for 1
131# and 2 limb divisors, which are never used during tuning, so it doesn't
132# matter whether it picks up a tuned or untuned version of those.
133#
134# divrem_1 and mod_1 are recompiled renamed to "_tune" to avoid a linking
135# problem.  If a native divrem_1 provides an mpn_divrem_1c entrypoint then
136# common.c will want that, but the generic divrem_1 doesn't provide it,
137# likewise for mod_1.  The simplest way around this is to have the tune
138# build versions renamed suitably.
139#
140# FIXME: Would like say mul_n.c to depend on $(top_builddir)/mul_n.c so the
141# recompiled object will be rebuilt if that file changes.
142
143TUNE_MPN_SRCS = $(TUNE_MPN_SRCS_BASIC) divrem_1.c mod_1.c
144TUNE_MPN_SRCS_BASIC = div_qr_2.c bdiv_q.c bdiv_qr.c			\
145  dcpi1_div_qr.c dcpi1_divappr_q.c dcpi1_bdiv_qr.c dcpi1_bdiv_q.c	\
146  invertappr.c invert.c binvert.c divrem_2.c gcd.c gcdext.c		\
147  get_str.c set_str.c matrix22_mul.c					\
148  hgcd.c hgcd_appr.c hgcd_reduce.c					\
149  mul_n.c sqr.c sec_powm.c						\
150  mullo_n.c mul_fft.c mul.c tdiv_qr.c mulmod_bnm1.c sqrmod_bnm1.c	\
151  mulmid.c mulmid_n.c toom42_mulmid.c sqrlo.c sqrlo_basecase.c		\
152  nussbaumer_mul.c toom6h_mul.c toom8h_mul.c toom6_sqr.c toom8_sqr.c	\
153  toom22_mul.c toom2_sqr.c toom33_mul.c toom3_sqr.c toom44_mul.c toom4_sqr.c
154
155$(TUNE_MPN_SRCS_BASIC):
156	for i in $(TUNE_MPN_SRCS_BASIC); do \
157	  echo "#define TUNE_PROGRAM_BUILD 1" >$$i; \
158	  echo "#include \"mpn/generic/$$i\"" >>$$i; \
159	done
160
161divrem_1.c:
162	echo "#define TUNE_PROGRAM_BUILD 1"                >divrem_1.c
163	echo "#define __gmpn_divrem_1  mpn_divrem_1_tune" >>divrem_1.c
164	echo "#include \"mpn/generic/divrem_1.c\""        >>divrem_1.c
165
166mod_1.c:
167	echo "#define TUNE_PROGRAM_BUILD 1"          >mod_1.c
168	echo "#define __gmpn_mod_1  mpn_mod_1_tune" >>mod_1.c
169	echo "#include \"mpn/generic/mod_1.c\""     >>mod_1.c
170
171sqr_asm.asm: $(top_builddir)/mpn/sqr_basecase.asm
172	echo 'define(SQR_TOOM2_THRESHOLD_OVERRIDE,SQR_TOOM2_THRESHOLD_MAX)' >sqr_asm.asm
173	echo 'include(../mpn/sqr_basecase.asm)' >>sqr_asm.asm
174
175# FIXME: Should it depend on $(top_builddir)/fac_ui.h too?
176fac_ui.c: $(top_builddir)/mpz/fac_ui.c
177	echo "#define TUNE_PROGRAM_BUILD 1"          >fac_ui.c
178	echo "#define __gmpz_fac_ui mpz_fac_ui_tune" >>fac_ui.c
179	echo "#define __gmpz_oddfac_1 mpz_oddfac_1_tune" >>fac_ui.c
180	echo "#include \"mpz/oddfac_1.c\""           >>fac_ui.c
181	echo "#include \"mpz/fac_ui.c\""             >>fac_ui.c
182
183include ../mpn/Makeasm.am
184
185.NOTPARALLEL:
186
187