benchmarks/uftrace.sh

OILS / benchmarks / uftrace.sh View on Github | oilshell.org

349 lines, 176 significant

1	#!/usr/bin/env bash
2	#
3	# Usage:
4	# benchmarks/uftrace.sh <function name>
5	#
6	# Examples:
7	# benchmarks/uftrace.sh record-oils-cpp
8	# benchmarks/uftrace.sh replay-alloc
9	# benchmarks/uftrace.sh plugin-allocs
10	#
11	# TODO:
12	# - uftrace dump --chrome # time-based trace
13	# - uftrace dump --flame-graph # common stack traces, e.g. for allocation
14
15	set -o nounset
16	set -o pipefail
17	set -o errexit
18
19	source benchmarks/common.sh # cmark function. TODO: could use executable
20	source build/dev-shell.sh # put uftrace in $PATH, R_LIBS_USER
21	source devtools/common.sh # banner
22	source test/common.sh # escape-html
23
24	readonly BASE_DIR=_tmp/uftrace
25
26	download() {
27	wget --no-clobber --directory _cache \
28	https://github.com/namhyung/uftrace/archive/refs/tags/v0.13.tar.gz
29	#https://github.com/namhyung/uftrace/archive/v0.9.3.tar.gz
30
31	}
32
33	extract() {
34	pushd _cache
35	tar --extract -z < v0.13.tar.gz
36	popd
37	}
38
39	build() {
40	cd _cache/uftrace-0.13
41	./configure
42	make
43
44	# It can't find some files unless we do this
45	echo 'Run sudo make install'
46	}
47
48	ubuntu-hack() {
49	# Annoying: the plugin engine tries to look for the wrong file?
50	# What's 3.6m.so vs 3.6.so ???
51
52	cd /usr/lib/x86_64-linux-gnu
53	ln -s libpython3.6m.so.1.0 libpython3.6.so
54	}
55
56	# https://github.com/namhyung/uftrace/wiki/Tutorial
57	hello-demo() {
58	cat >_tmp/hello.c <<EOF
59	#include <stdio.h>
60
61	int main(void) {
62	printf("Hello world\n");
63	return 0;
64	}
65	EOF
66
67	gcc -o _tmp/hello -pg _tmp/hello.c
68
69	uftrace _tmp/hello
70	}
71
72	record-oils-cpp() {
73	### Record a trace, but limit to allocations functions, for size
74
75	local out_dir=$1
76	local unfiltered=${2:-}
77	shift 2
78
79	#local flags=(-F process::Process::RunWait -F process::Process::Process)
80
81	local -a flags
82
83	if test -n "$unfiltered"; then
84	out_dir=$out_dir.unfiltered
85
86	# Look for the pattern:
87	# Alloc() {
88	# MarkSweepHeap::Allocate(24)
89	# syntax_asdl::line_span::line_span()
90	# }
91	flags=(
92	-F 'Alloc'
93	-F 'MarkSweepHeap::Allocate' -A 'MarkSweepHeap::Allocate@arg2'
94	-D 2
95	)
96	# If we don't filter at all, then it's huge
97	# flags=()
98
99	else
100	# It's faster to filter just these function calls
101	# Need .* for --demangle full
102
103	flags=(
104	# low level allocation
105	-F 'MarkSweepHeap::Allocate.' -A 'MarkSweepHeap::Allocate.@arg2'
106
107	# typed allocation
108	-F 'Alloc<.*' # missing type info
109
110	# Flexible array allocation
111	# arg 1 is str_len
112	-F 'NewStr.' -A 'NewStr.@arg1'
113	-F 'OverAllocatedStr.' -A 'OverAllocatedStr.@arg1'
114
115	# This constructor doesn't matter. We care about the interface in in
116	# mycpp/gc_alloc.h
117	# -F 'Str::Str.*'
118
119	# arg1 is number of elements of type T
120	-F 'NewSlab<.' -A 'NewSlab<.@arg1'
121	# -F 'Slab<.>::Slab.'
122
123	# Fixed size header allocation
124	# arg2 is the number of items to reserve
125	# -F 'List<.>::List.'
126	-F 'List<.>::reserve.' -A 'List<.>::reserve.@arg2'
127	# -F 'Dict<.>::Dict.' # does not allocate
128	-F 'Dict<.>::reserve.' -A 'Dict<.>::reserve.@arg2'
129
130	# Common object
131	# -F 'syntax_asdl::Token::Token'
132
133	-D 1
134	)
135
136	# Problem: some of these aren't allocations
137	# -F 'Tuple2::Tuple2'
138	# -F 'Tuple3::Tuple3'
139	# -F 'Tuple4::Tuple4'
140
141	# StrFromC calls NewStr, so we don't need it
142	# -F 'StrFromC' -A 'StrFromC@arg1' -A 'StrFromC@arg2'
143	fi
144
145	soil/cpp-tarball.sh build-like-ninja uftrace
146	local bin=_bin/cxx-uftrace/osh
147
148	mkdir -p $out_dir
149	time uftrace record --demangle full -d $out_dir "${flags[@]}" $bin "$@"
150
151	ls -d $out_dir/
152	ls -l --si $out_dir/
153	}
154
155	run-tasks() {
156	while read task; do
157	banner "$task: utrace record"
158
159	# TODO: Could share with benchmarks/gc
160	case $task in
161	parse.configure-cpython)
162	data_file='Python-2.7.13/configure'
163	;;
164	parse.abuild)
165	data_file='benchmarks/testdata/abuild'
166	;;
167	esac
168
169	# Construct argv for each task
170	local -a argv
171	case $task in
172	parse.*)
173	argv=( --ast-format none -n $data_file )
174	;;
175
176	ex.compute-fib)
177	argv=( benchmarks/compute/fib.sh 10 44 )
178	;;
179
180	ex.bashcomp-excerpt)
181	# NOTE: benchmarks/gc.sh uses the larger clang.txt file
182	argv=( benchmarks/parse-help/pure-excerpt.sh parse_help_file
183	benchmarks/parse-help/mypy.txt )
184	;;
185
186	ex.bin-true)
187	argv=( testdata/osh-runtime/bin_true.sh )
188	;;
189
190	esac
191
192	local out_dir=$BASE_DIR/raw/$task
193
194	record-oils-cpp $out_dir '' "${argv[@]}"
195	done
196	}
197
198	print-tasks() {
199	# Same as benchmarks/gc
200	local -a tasks=(
201	# This one is a bit big
202	# parse.configure-cpython
203
204	parse.abuild
205	ex.bashcomp-excerpt
206	ex.compute-fib
207	ex.bin-true
208	)
209
210	for task in "${tasks[@]}"; do
211	echo $task
212	done
213	}
214
215	measure-all() {
216	print-tasks \| run-tasks
217	}
218
219	frequent-calls() {
220	### Histogram
221
222	local out_dir=$1
223	uftrace report -d $out_dir -s call --demangle full
224	}
225
226	call-graph() {
227	### Time-based trace
228
229	local out_dir=$1
230	uftrace graph -d $out_dir
231	}
232
233	tsv-plugin() {
234	local task=${1:-ex.compute-fib}
235
236	local dir=$BASE_DIR/raw/$task
237
238	# On the big configure-coreutils script, this takes 10 seconds. That's
239	# acceptable. Gives 2,402,003 allocations.
240
241	local out_dir=_tmp/uftrace/stage1/$task
242	mkdir -p $out_dir
243	time uftrace script --demangle full -d $dir -S benchmarks/uftrace_allocs.py $out_dir
244
245	wc -l $out_dir/*.tsv
246	}
247
248	report-all() {
249	print-tasks \| while read task; do
250	banner "$task: report"
251
252	frequent-calls $BASE_DIR/raw/$task
253
254	echo
255	done
256	}
257
258	export-all() {
259	if uftrace --version \| grep python3; then
260	echo 'uftrace has Python 3 plugin support'
261	else
262	die 'uftrace is MISSING Python 3 plugin support'
263	fi
264
265	# TODO: Join into a single TSV file
266	print-tasks \| while read task; do
267	banner "$task: export to TSV with Python3 plugin"
268	time tsv-plugin $task
269	done
270	}
271
272	html-index() {
273	echo '<body style="margin: 0 auto; width: 40em; font-size: large">'
274
275	cmark << 'EOF'
276	# uftrace reports
277
278	Workloads:
279	EOF
280
281	# Link to text files
282	print-tasks \| while read task; do
283	echo "<a href="stage2/$task.txt">$task</a> <br/>"
284	done
285
286	cmark <<< '## Summary'
287
288	echo '<pre>'
289
290	cat $BASE_DIR/stage2/summary.txt \| escape-html
291
292	echo '</pre>'
293	echo '</body>'
294	}
295
296	analyze-all() {
297	local in_dir=$BASE_DIR/stage1/
298	local out_dir=$BASE_DIR/stage2/
299
300	# prepare dirs for R to write to
301	print-tasks \| while read task; do
302	mkdir -v -p $out_dir/$task
303	done
304
305	# Writes stage2/summary.txt
306	benchmarks/report.R uftrace $in_dir $out_dir
307
308	html-index > $BASE_DIR/index.html
309	echo "Wrote $BASE_DIR/index.html"
310	}
311
312
313	# Hm this shows EVERY call stack that produces a list!
314
315	# uftrace graph usage shown here
316	# https://github.com/namhyung/uftrace/wiki/Tutorial
317
318	replay-alloc() {
319	local out_dir=$1
320
321	# call graph
322	#uftrace graph -C 'MarkSweepHeap::Allocate'
323
324	# shows what calls this function
325	#uftrace replay -C 'MarkSweepHeap::Allocate'
326
327	# shows what this function calls
328	#uftrace replay -F 'MarkSweepHeap::Allocate'
329
330	# filters may happen at record or replay time
331
332	# depth of 1
333	#uftrace replay -D 1 -F 'MarkSweepHeap::Allocate'
334
335	uftrace replay -D 1 -F 'MarkSweepHeap::Allocate'
336	}
337
338	plugin() {
339	# Note this one likes UNFILTERED data
340	uftrace script -S benchmarks/uftrace_plugin.py
341	}
342
343	soil-run() {
344	measure-all
345	export-all
346	analyze-all
347	}
348
349	"$@"