]>
Commit | Line | Data |
---|---|---|
04277e02 | 1 | # Copyright (C) 2013-2019 Free Software Foundation, Inc. |
8cfdb7e0 SP |
2 | # This file is part of the GNU C Library. |
3 | ||
4 | # The GNU C Library is free software; you can redistribute it and/or | |
5 | # modify it under the terms of the GNU Lesser General Public | |
6 | # License as published by the Free Software Foundation; either | |
7 | # version 2.1 of the License, or (at your option) any later version. | |
8 | ||
9 | # The GNU C Library is distributed in the hope that it will be useful, | |
10 | # but WITHOUT ANY WARRANTY; without even the implied warranty of | |
11 | # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU | |
12 | # Lesser General Public License for more details. | |
13 | ||
14 | # You should have received a copy of the GNU Lesser General Public | |
15 | # License along with the GNU C Library; if not, see | |
16 | # <http://www.gnu.org/licenses/>. | |
17 | ||
8cfdb7e0 | 18 | # Makefile for benchmark tests. The only useful target here is `bench`. |
3ce9e010 | 19 | # Add benchmark functions in alphabetical order. |
8cfdb7e0 | 20 | |
8cfdb7e0 | 21 | subdir := benchtests |
a5f891ac JM |
22 | |
23 | include ../Makeconfig | |
aad287f3 | 24 | bench-math := acos acosh asin asinh atan atanh cos cosh exp exp2 log log2 \ |
da16c9b5 | 25 | modf pow rint sin sincos sinh sqrt tan tanh fmin fmax fminf \ |
077ee129 RS |
26 | fmaxf powf trunc truncf expf exp2f logf log2f sincosf sinf \ |
27 | cosf | |
bb9c256f | 28 | |
0edbf123 | 29 | bench-pthread := pthread_once thread_create |
bb9c256f | 30 | |
aad287f3 SP |
31 | bench-string := ffs ffsll |
32 | ||
0422ed1e | 33 | ifeq (${BENCHSET},) |
aad287f3 | 34 | bench := $(bench-math) $(bench-pthread) $(bench-string) |
0422ed1e VR |
35 | else |
36 | bench := $(foreach B,$(filter bench-%,${BENCHSET}), ${${B}}) | |
37 | endif | |
3ce9e010 | 38 | |
c1f75dc3 | 39 | # String function benchmarks. |
16f87cfd | 40 | string-benchset := memccpy memchr memcmp memcpy memmem memmove \ |
aad287f3 SP |
41 | mempcpy memset rawmemchr stpcpy stpncpy strcasecmp strcasestr \ |
42 | strcat strchr strchrnul strcmp strcpy strcspn strlen \ | |
43 | strncasecmp strncat strncmp strncpy strnlen strpbrk strrchr \ | |
44 | strspn strstr strcpy_chk stpcpy_chk memrchr strsep strtok \ | |
9ec87fd2 | 45 | strcoll memcpy-large memcpy-random memmove-large memset-large \ |
5bfb0404 | 46 | memcpy-walk memset-walk memmove-walk |
2d304f3c SP |
47 | |
48 | # Build and run locale-dependent benchmarks only if we're building natively. | |
49 | ifeq (no,$(cross-compiling)) | |
aad287f3 SP |
50 | wcsmbs-benchset := wcslen wcsnlen wcscpy wcpcpy wcsncpy wcpncpy wcscat wcsncat \ |
51 | wcscmp wcsncmp wcschr wcschrnul wcsrchr wcsspn wcspbrk wcscspn \ | |
52 | wmemchr wmemset wmemcmp | |
2d304f3c SP |
53 | else |
54 | wcsmbs-benchset := | |
55 | endif | |
56 | ||
aad287f3 | 57 | string-benchset-all := $(string-benchset) ${wcsmbs-benchset} |
c1f75dc3 | 58 | |
2d304f3c | 59 | ifeq (no,$(cross-compiling)) |
60ccaf75 LH |
60 | # We have to generate locales |
61 | LOCALES := en_US.UTF-8 tr_TR.UTF-8 cs_CZ.UTF-8 fa_IR.UTF-8 fr_FR.UTF-8 \ | |
62 | ja_JP.UTF-8 si_LK.UTF-8 en_GB.UTF-8 vi_VN.UTF-8 ar_SA.UTF-8 \ | |
63 | da_DK.UTF-8 pl_PL.UTF-8 pt_PT.UTF-8 el_GR.UTF-8 ru_RU.UTF-8 \ | |
20003c49 | 64 | he_IL.UTF-8 is_IS.UTF-8 es_ES.UTF-8 hi_IN.UTF-8 sv_SE.UTF-8 \ |
60ccaf75 LH |
65 | hu_HU.UTF-8 it_IT.UTF-8 sr_RS.UTF-8 zh_CN.UTF-8 |
66 | include ../gen-locales.mk | |
2d304f3c | 67 | endif |
60ccaf75 | 68 | |
aad287f3 | 69 | stdlib-benchset := strtod |
450a2e2d | 70 | |
aad287f3 | 71 | stdio-common-benchset := sprintf |
608f8971 | 72 | |
cb2f668d WD |
73 | math-benchset := math-inlines |
74 | ||
0422ed1e | 75 | ifeq (${BENCHSET},) |
aad287f3 | 76 | benchset := $(string-benchset-all) $(stdlib-benchset) $(stdio-common-benchset) \ |
cb2f668d | 77 | $(math-benchset) |
0422ed1e VR |
78 | else |
79 | benchset := $(foreach B,$(filter %-benchset,${BENCHSET}), ${${B}}) | |
80 | endif | |
c1f75dc3 | 81 | |
f6c55796 WN |
82 | CFLAGS-bench-ffs.c += -fno-builtin |
83 | CFLAGS-bench-ffsll.c += -fno-builtin | |
7a8330c0 | 84 | CFLAGS-bench-sqrt.c += -fno-builtin |
5d1f604a | 85 | CFLAGS-bench-fmin.c += -fno-builtin |
da16c9b5 | 86 | CFLAGS-bench-fminf.c += -fno-builtin |
5d1f604a | 87 | CFLAGS-bench-fmax.c += -fno-builtin |
da16c9b5 | 88 | CFLAGS-bench-fmaxf.c += -fno-builtin |
eb375def JM |
89 | CFLAGS-bench-trunc.c += -fno-builtin |
90 | CFLAGS-bench-truncf.c += -fno-builtin | |
f6c55796 | 91 | |
0422ed1e | 92 | ifeq (${BENCHSET},) |
3904fd85 | 93 | bench-malloc := malloc-thread malloc-simple |
0422ed1e VR |
94 | else |
95 | bench-malloc := $(filter malloc-%,${BENCHSET}) | |
96 | endif | |
b01ee67c | 97 | |
79520f4b | 98 | $(addprefix $(objpfx)bench-,$(bench-math)): $(libm) |
cb2f668d | 99 | $(addprefix $(objpfx)bench-,$(math-benchset)): $(libm) |
79520f4b | 100 | $(addprefix $(objpfx)bench-,$(bench-pthread)): $(shared-thread-library) |
3904fd85 | 101 | $(addprefix $(objpfx)bench-,$(bench-malloc)): $(shared-thread-library) |
7849ff93 | 102 | |
8fc1bee5 SP |
103 | \f |
104 | ||
105 | # Rules to build and execute the benchmarks. Do not put any benchmark | |
106 | # parameters beyond this point. | |
107 | ||
c1f75dc3 SP |
108 | # We don't want the benchmark programs to run in parallel since that could |
109 | # affect their performance. | |
110 | .NOTPARALLEL: | |
111 | ||
4504783c FW |
112 | bench-extra-objs = json-lib.o |
113 | ||
114 | extra-objs += $(bench-extra-objs) | |
115 | others-extras = $(bench-extra-objs) | |
116 | ||
8cfdb7e0 | 117 | include ../Rules |
8fc1bee5 SP |
118 | |
119 | binaries-bench := $(addprefix $(objpfx)bench-,$(bench)) | |
c1f75dc3 | 120 | binaries-benchset := $(addprefix $(objpfx)bench-,$(benchset)) |
b01ee67c | 121 | binaries-bench-malloc := $(addprefix $(objpfx)bench-,$(bench-malloc)) |
8fc1bee5 | 122 | |
fe92a91f | 123 | # The default duration: 1 seconds. |
d569c6ee | 124 | ifndef BENCH_DURATION |
fe92a91f | 125 | BENCH_DURATION := 1 |
d569c6ee SP |
126 | endif |
127 | ||
f1c8185d | 128 | CPPFLAGS-nonlib += -DDURATION=$(BENCH_DURATION) -D_ISOMAC |
d569c6ee | 129 | |
7cc65773 L |
130 | # On x86 processors, use RDTSCP, instead of RDTSC, to measure performance |
131 | # of functions. All x86 processors since 2010 support RDTSCP instruction. | |
132 | ifdef USE_RDTSCP | |
133 | CPPFLAGS-nonlib += -DUSE_RDTSCP | |
134 | endif | |
43fe811b | 135 | |
56737508 SP |
136 | DETAILED_OPT := |
137 | ||
138 | ifdef DETAILED | |
139 | DETAILED_OPT := -d | |
140 | endif | |
141 | ||
4856bcd2 SP |
142 | # This makes sure CPPFLAGS-nonlib and CFLAGS-nonlib are passed |
143 | # for all these modules. | |
b01ee67c WN |
144 | cpp-srcs-left := $(binaries-benchset:=.c) $(binaries-bench:=.c) \ |
145 | $(binaries-bench-malloc:=.c) | |
4856bcd2 | 146 | lib := nonlib |
2bfdaedd | 147 | include $(patsubst %,$(..)libof-iterator.mk,$(cpp-srcs-left)) |
4856bcd2 | 148 | |
43fe811b | 149 | bench-deps := bench-skeleton.c bench-timing.h Makefile |
acb4325f | 150 | |
8fc1bee5 | 151 | run-bench = $(test-wrapper-env) \ |
8540f6d2 | 152 | $(run-program-env) \ |
87da630b | 153 | $($*-ENV) $(test-via-rtld-prefix) $${run} |
8fc1bee5 | 154 | |
cb5e4aad SP |
155 | timing-type := $(objpfx)bench-timing-type |
156 | ||
a2964074 SP |
157 | bench-clean: |
158 | rm -f $(binaries-bench) $(addsuffix .o,$(binaries-bench)) | |
c1f75dc3 | 159 | rm -f $(binaries-benchset) $(addsuffix .o,$(binaries-benchset)) |
b01ee67c | 160 | rm -f $(binaries-bench-malloc) $(addsuffix .o,$(binaries-bench-malloc)) |
cb5e4aad | 161 | rm -f $(timing-type) $(addsuffix .o,$(timing-type)) |
d7aea0cf | 162 | rm -f $(addprefix $(objpfx),$(bench-extra-objs)) |
c1f75dc3 | 163 | |
0422ed1e VR |
164 | # Validate the passed in BENCHSET |
165 | ifneq ($(strip ${BENCHSET}),) | |
166 | VALIDBENCHSETNAMES := bench-pthread bench-math bench-string string-benchset \ | |
167 | wcsmbs-benchset stdlib-benchset stdio-common-benchset math-benchset \ | |
3904fd85 | 168 | malloc-thread malloc-simple |
0422ed1e VR |
169 | INVALIDBENCHSETNAMES := $(filter-out ${VALIDBENCHSETNAMES},${BENCHSET}) |
170 | ifneq (${INVALIDBENCHSETNAMES},) | |
171 | $(info The following values in BENCHSET are invalid: ${INVALIDBENCHSETNAMES}) | |
172 | $(info The valid ones are: ${VALIDBENCHSETNAMES}) | |
173 | $(error Invalid BENCHSET value) | |
174 | endif | |
175 | endif | |
176 | ||
2d304f3c | 177 | bench: bench-build bench-set bench-func bench-malloc |
8ce8299f | 178 | |
2d304f3c SP |
179 | # Target to only build the benchmark without running it. We generate locales |
180 | # only if we're building natively. | |
181 | ifeq (no,$(cross-compiling)) | |
182 | bench-build: $(gen-locales) $(timing-type) $(binaries-bench) \ | |
183 | $(binaries-benchset) $(binaries-bench-malloc) | |
184 | else | |
185 | bench-build: $(timing-type) $(binaries-bench) $(binaries-benchset) \ | |
186 | $(binaries-bench-malloc) | |
187 | endif | |
c1f75dc3 SP |
188 | |
189 | bench-set: $(binaries-benchset) | |
190 | for run in $^; do \ | |
191 | echo "Running $${run}"; \ | |
192 | $(run-bench) > $${run}.out; \ | |
193 | done | |
a2964074 | 194 | |
b01ee67c | 195 | bench-malloc: $(binaries-bench-malloc) |
0422ed1e | 196 | for run in $^; do \ |
3904fd85 WD |
197 | echo "$${run}"; \ |
198 | if [ `basename $${run}` = "bench-malloc-thread" ]; then \ | |
0422ed1e VR |
199 | for thr in 1 8 16 32; do \ |
200 | echo "Running $${run} $${thr}"; \ | |
3904fd85 WD |
201 | $(run-bench) $${thr} > $${run}-$${thr}.out; \ |
202 | done;\ | |
203 | else \ | |
204 | for thr in 8 16 32 64 128 256 512 1024 2048 4096; do \ | |
205 | echo "Running $${run} $${thr}"; \ | |
206 | $(run-bench) $${thr} > $${run}-$${thr}.out; \ | |
207 | done;\ | |
208 | fi;\ | |
b01ee67c WN |
209 | done |
210 | ||
cb5e4aad SP |
211 | # Build and execute the benchmark functions. This target generates JSON |
212 | # formatted bench.out. Each of the programs produce independent JSON output, | |
213 | # so one could even execute them individually and process it using any JSON | |
214 | # capable language or tool. | |
c1f75dc3 | 215 | bench-func: $(binaries-bench) |
0422ed1e | 216 | if [ -n '$^' ] ; then \ |
970c602a | 217 | { timing_type=$$($(timing-type)); \ |
0422ed1e VR |
218 | echo "{\"timing_type\": \"$${timing_type}\","; \ |
219 | echo " \"functions\": {"; \ | |
220 | for run in $^; do \ | |
221 | if ! [ "x$${run}" = "x$<" ]; then \ | |
222 | echo ","; \ | |
223 | fi; \ | |
224 | echo "Running $${run}" >&2; \ | |
225 | $(run-bench) $(DETAILED_OPT); \ | |
226 | done; \ | |
227 | echo; \ | |
228 | echo " }"; \ | |
229 | echo "}"; \ | |
230 | } > $(objpfx)bench.out-tmp; \ | |
231 | if [ -f $(objpfx)bench.out ]; then \ | |
232 | mv -f $(objpfx)bench.out $(objpfx)bench.out.old; \ | |
cb5e4aad | 233 | fi; \ |
0422ed1e VR |
234 | mv -f $(objpfx)bench.out-tmp $(objpfx)bench.out; \ |
235 | $(PYTHON) scripts/validate_benchout.py $(objpfx)bench.out \ | |
236 | scripts/benchout.schema.json; \ | |
237 | fi | |
8fc1bee5 | 238 | |
b5ffdc48 FW |
239 | ifeq ($(bind-now),yes) |
240 | link-bench-bind-now = -Wl,-z,now | |
241 | endif | |
242 | ||
243 | bench-link-targets = $(timing-type) $(binaries-bench) $(binaries-benchset) \ | |
244 | $(binaries-bench-malloc) | |
245 | ||
246 | $(bench-link-targets): %: %.o $(objpfx)json-lib.o \ | |
009ba649 | 247 | $(link-extra-libs-tests) \ |
8fc1bee5 SP |
248 | $(sort $(filter $(common-objpfx)lib%,$(link-libc))) \ |
249 | $(addprefix $(csu-objpfx),start.o) $(+preinit) $(+postinit) | |
87da630b | 250 | $(+link-tests) |
8fc1bee5 | 251 | |
b5ffdc48 FW |
252 | $(bench-link-targets): LDFLAGS += $(link-bench-bind-now) |
253 | ||
acb4325f | 254 | $(objpfx)bench-%.c: %-inputs $(bench-deps) |
8fc1bee5 SP |
255 | { if [ -n "$($*-INCLUDE)" ]; then \ |
256 | cat $($*-INCLUDE); \ | |
257 | fi; \ | |
67fc5637 | 258 | $(PYTHON) scripts/bench.py $(patsubst %-inputs,%,$<); } > $@-tmp |
8fc1bee5 | 259 | mv -f $@-tmp $@ |