OILS / metrics / native-code.sh View on Github | oilshell.org

201 lines, 89 significant
1#!/usr/bin/env bash
2#
3# Usage:
4# metrics/native-code.sh <function name>
5
6set -o nounset
7set -o pipefail
8set -o errexit
9
10source build/dev-shell.sh # put bloaty in $PATH, R_LIBS_USER
11
12readonly OVM_BASE_DIR=_tmp/metrics/ovm
13readonly OIL_BASE_DIR=_tmp/metrics/oils-for-unix
14
15pylibc-symbols() {
16 symbols _devbuild/py-ext/x86_64/libc.so
17}
18
19fastlex-symbols() {
20 symbols _devbuild/py-ext/x86_64/fastlex.so
21}
22
23print-symbols() {
24 local obj=$1
25 ls -l $obj
26 echo
27
28 # Summary
29 bloaty $obj
30 echo
31
32 # Top symbols
33 # fastlex_MatchToken is 21.2 KiB. That doesn't seem to large compared to
34 # the 14K line output?
35 bloaty -d symbols $obj
36 echo
37
38 nm $obj
39 echo
40}
41
42# Big functions:
43# - PyEval_EvalFrameEx (38 KiB)
44# - fastlex_MatchOSHToken (22.5 KiB)
45# - convertitem() in args.py (9.04 KiB)
46# - PyString_Format() in args.py (6.84 KiB)
47#
48# Easy removals:
49# - marshal_dumps and marshal_dump! We never use those.
50# - Remove all docstrings!!! Like sys_doc.
51
52compileunits() {
53 # Hm there doesn't seem to be a way to do this without
54 local file=${1:-_build/oil/ovm-dbg}
55
56 #local file=_build/oil/ovm-opt
57 #local sym=_build/oil/ovm-opt.symbols
58
59 bloaty --tsv -n 0 -d compileunits $file
60}
61
62symbols() {
63 # NOTE: This is different than the release binary!
64 # ovm-opt.stripped doesn't show a report.
65 local file=${1:-_build/oil/ovm-opt}
66
67 # Full output
68 # 3,588 lines!
69 bloaty --tsv -n 0 -d symbols $file
70}
71
72R-report() {
73 metrics/native-code.R "$@"
74}
75
76build-ovm() {
77 # 2022-12: hack for ./configure, because line_input failed to compile without
78 # HAVE_READLINE See _build/oil/module_init.c
79 # TODO: This metric should either be DELETED, or automated in the CI, so it
80 # doesn't break
81
82 ./configure
83
84 make _build/oil/ovm-{dbg,opt}
85}
86
87collect-and-report() {
88 local base_dir=$1
89 local dbg=$2
90 local opt=$3
91
92 mkdir -p $base_dir
93
94 print-symbols $opt > $base_dir/symbols.txt
95
96 symbols $opt > $base_dir/symbols.tsv
97
98 # Really 'translation units', but bloaty gives it that name.
99 compileunits $dbg > $base_dir/compileunits.tsv
100
101 head $base_dir/symbols.tsv $base_dir/compileunits.tsv
102
103 # Hack for now
104 if Rscript -e 'print("hi from R")'; then
105 R-report metrics $base_dir $dbg $opt | tee $base_dir/overview.txt
106 else
107 echo 'R not detected' | tee $base_dir/overview.txt
108 fi
109
110 # For CI
111 cat >$base_dir/index.html <<'EOF'
112<a href="overview.txt">overview.txt</a> <br/>
113<a href="compileunits.tsv">compileunits.tsv</a> <br/>
114<a href="symbols.tsv">symbols.tsv</a> <br/>
115<a href="symbols.txt">symbols.txt</a> <br/>
116EOF
117}
118
119oils-for-unix() {
120 ### Report on the ones we just built
121
122 # TODO: could compare GCC and Clang once we have R on the CI images
123 local -a targets=(_bin/cxx-{dbg,opt}/oils-for-unix)
124 ninja "${targets[@]}"
125
126 collect-and-report $OIL_BASE_DIR "${targets[@]}"
127
128 ls -l $OIL_BASE_DIR
129}
130
131compare-gcc-clang() {
132 ### Run by Soil 'cpp-coverage' task, because it has clang
133
134 local -a targets=(
135 _bin/{clang,cxx}-dbg/oils-for-unix
136 _bin/{clang,cxx}-opt/oils-for-unix.stripped
137 _bin/cxx-{opt+bumpleak,opt+bumproot}/oils-for-unix.stripped
138 _bin/{clang,cxx}-opt/yaks/yaks_main.mycpp.stripped
139 _bin/cxx-{opt+bumpleak,opt+bumproot}/yaks/yaks_main.mycpp.stripped
140 )
141 ninja "${targets[@]}"
142
143 mkdir -p _tmp/metrics
144 ls -l --sort=none "${targets[@]}" | tee _tmp/metrics/compare-gcc-clang.txt
145}
146
147readonly OIL_VERSION=$(head -n 1 oil-version.txt)
148
149run-for-release() {
150 build-ovm
151
152 local dbg=_build/oil/ovm-dbg
153 local opt=_build/oil/ovm-opt
154
155 collect-and-report $OVM_BASE_DIR $dbg $opt
156
157 # TODO: consolidate with benchmarks/common.sh, OSH_CPP_BENCHMARK_DATA
158 # For some reason _bin/cxx-opt/ and _bin/cxx-opt-sh can differ by a few bytes
159 local bin_dir="../benchmark-data/src/oils-for-unix-$OIL_VERSION"
160 collect-and-report $OIL_BASE_DIR $bin_dir/_bin/cxx-{dbg,opt}-sh/oils-for-unix
161}
162
163dupe-strings() {
164 ### Check for NUL-terminated strings
165
166 python2 -c '
167import collections
168import re
169import sys
170
171with open(sys.argv[1]) as f:
172 contents = f.read()
173strs = re.split("\\0", contents)
174
175printable = re.compile("[ -~]+$")
176
177d = collections.Counter()
178for s in strs:
179 if len(s) > 1 and printable.match(s):
180 d[s] += 1
181
182for s, count in d.most_common()[:50]:
183 if count == 1:
184 break
185 print("%5d %r" % (count, s))
186
187' "$@"
188}
189
190# Results:
191# Found StrFromC() and len() duplication
192
193oil-dupe-strings() {
194 local bin=_bin/cxx-opt/oils-for-unix.stripped
195 #local bin=_bin/clang-opt/oils-for-unix.stripped
196 ninja $bin
197
198 dupe-strings $bin
199}
200
201"$@"