1 | #!/usr/bin/env bash
|
2 | #
|
3 | # Usage:
|
4 | # metrics/native-code.sh <function name>
|
5 |
|
6 | set -o nounset
|
7 | set -o pipefail
|
8 | set -o errexit
|
9 |
|
10 | source build/dev-shell.sh # put bloaty in $PATH, R_LIBS_USER
|
11 |
|
12 | readonly OVM_BASE_DIR=_tmp/metrics/ovm
|
13 | readonly OIL_BASE_DIR=_tmp/metrics/oils-for-unix
|
14 |
|
15 | pylibc-symbols() {
|
16 | symbols _devbuild/py-ext/x86_64/libc.so
|
17 | }
|
18 |
|
19 | fastlex-symbols() {
|
20 | symbols _devbuild/py-ext/x86_64/fastlex.so
|
21 | }
|
22 |
|
23 | print-symbols() {
|
24 | local obj=$1
|
25 | ls -l $obj
|
26 | echo
|
27 |
|
28 | # Summary
|
29 | bloaty $obj
|
30 | echo
|
31 |
|
32 | # Top symbols
|
33 | # fastlex_MatchToken is 21.2 KiB. That doesn't seem to large compared to
|
34 | # the 14K line output?
|
35 | bloaty -d symbols $obj
|
36 | echo
|
37 |
|
38 | nm $obj
|
39 | echo
|
40 | }
|
41 |
|
42 | # Big functions:
|
43 | # - PyEval_EvalFrameEx (38 KiB)
|
44 | # - fastlex_MatchOSHToken (22.5 KiB)
|
45 | # - convertitem() in args.py (9.04 KiB)
|
46 | # - PyString_Format() in args.py (6.84 KiB)
|
47 | #
|
48 | # Easy removals:
|
49 | # - marshal_dumps and marshal_dump! We never use those.
|
50 | # - Remove all docstrings!!! Like sys_doc.
|
51 |
|
52 | compileunits() {
|
53 | # Hm there doesn't seem to be a way to do this without
|
54 | local file=${1:-_build/oil/ovm-dbg}
|
55 |
|
56 | #local file=_build/oil/ovm-opt
|
57 | #local sym=_build/oil/ovm-opt.symbols
|
58 |
|
59 | bloaty --tsv -n 0 -d compileunits $file
|
60 | }
|
61 |
|
62 | symbols() {
|
63 | # NOTE: This is different than the release binary!
|
64 | # ovm-opt.stripped doesn't show a report.
|
65 | local file=${1:-_build/oil/ovm-opt}
|
66 |
|
67 | # Full output
|
68 | # 3,588 lines!
|
69 | bloaty --tsv -n 0 -d symbols $file
|
70 | }
|
71 |
|
72 | R-report() {
|
73 | metrics/native-code.R "$@"
|
74 | }
|
75 |
|
76 | build-ovm() {
|
77 | # 2022-12: hack for ./configure, because line_input failed to compile without
|
78 | # HAVE_READLINE See _build/oil/module_init.c
|
79 | # TODO: This metric should either be DELETED, or automated in the CI, so it
|
80 | # doesn't break
|
81 |
|
82 | ./configure
|
83 |
|
84 | make _build/oil/ovm-{dbg,opt}
|
85 | }
|
86 |
|
87 | collect-and-report() {
|
88 | local base_dir=$1
|
89 | local dbg=$2
|
90 | local opt=$3
|
91 |
|
92 | mkdir -p $base_dir
|
93 |
|
94 | print-symbols $opt > $base_dir/symbols.txt
|
95 |
|
96 | symbols $opt > $base_dir/symbols.tsv
|
97 |
|
98 | # Really 'translation units', but bloaty gives it that name.
|
99 | compileunits $dbg > $base_dir/compileunits.tsv
|
100 |
|
101 | head $base_dir/symbols.tsv $base_dir/compileunits.tsv
|
102 |
|
103 | # Hack for now
|
104 | if Rscript -e 'print("hi from R")'; then
|
105 | R-report metrics $base_dir $dbg $opt | tee $base_dir/overview.txt
|
106 | else
|
107 | echo 'R not detected' | tee $base_dir/overview.txt
|
108 | fi
|
109 |
|
110 | # For CI
|
111 | cat >$base_dir/index.html <<'EOF'
|
112 | <a href="overview.txt">overview.txt</a> <br/>
|
113 | <a href="compileunits.tsv">compileunits.tsv</a> <br/>
|
114 | <a href="symbols.tsv">symbols.tsv</a> <br/>
|
115 | <a href="symbols.txt">symbols.txt</a> <br/>
|
116 | EOF
|
117 | }
|
118 |
|
119 | oils-for-unix() {
|
120 | ### Report on the ones we just built
|
121 |
|
122 | # TODO: could compare GCC and Clang once we have R on the CI images
|
123 | local -a targets=(_bin/cxx-{dbg,opt}/oils-for-unix)
|
124 | ninja "${targets[@]}"
|
125 |
|
126 | collect-and-report $OIL_BASE_DIR "${targets[@]}"
|
127 |
|
128 | ls -l $OIL_BASE_DIR
|
129 | }
|
130 |
|
131 | compare-gcc-clang() {
|
132 | ### Run by Soil 'cpp-coverage' task, because it has clang
|
133 |
|
134 | local -a targets=(
|
135 | _bin/{clang,cxx}-dbg/oils-for-unix
|
136 | _bin/{clang,cxx}-opt/oils-for-unix.stripped
|
137 | _bin/cxx-{opt+bumpleak,opt+bumproot}/oils-for-unix.stripped
|
138 | _bin/{clang,cxx}-opt/yaks/yaks_main.mycpp.stripped
|
139 | _bin/cxx-{opt+bumpleak,opt+bumproot}/yaks/yaks_main.mycpp.stripped
|
140 | )
|
141 | ninja "${targets[@]}"
|
142 |
|
143 | mkdir -p _tmp/metrics
|
144 | ls -l --sort=none "${targets[@]}" | tee _tmp/metrics/compare-gcc-clang.txt
|
145 | }
|
146 |
|
147 | readonly OIL_VERSION=$(head -n 1 oil-version.txt)
|
148 |
|
149 | run-for-release() {
|
150 | build-ovm
|
151 |
|
152 | local dbg=_build/oil/ovm-dbg
|
153 | local opt=_build/oil/ovm-opt
|
154 |
|
155 | collect-and-report $OVM_BASE_DIR $dbg $opt
|
156 |
|
157 | # TODO: consolidate with benchmarks/common.sh, OSH_CPP_BENCHMARK_DATA
|
158 | # For some reason _bin/cxx-opt/ and _bin/cxx-opt-sh can differ by a few bytes
|
159 | local bin_dir="../benchmark-data/src/oils-for-unix-$OIL_VERSION"
|
160 | collect-and-report $OIL_BASE_DIR $bin_dir/_bin/cxx-{dbg,opt}-sh/oils-for-unix
|
161 | }
|
162 |
|
163 | dupe-strings() {
|
164 | ### Check for NUL-terminated strings
|
165 |
|
166 | python2 -c '
|
167 | import collections
|
168 | import re
|
169 | import sys
|
170 |
|
171 | with open(sys.argv[1]) as f:
|
172 | contents = f.read()
|
173 | strs = re.split("\\0", contents)
|
174 |
|
175 | printable = re.compile("[ -~]+$")
|
176 |
|
177 | d = collections.Counter()
|
178 | for s in strs:
|
179 | if len(s) > 1 and printable.match(s):
|
180 | d[s] += 1
|
181 |
|
182 | for s, count in d.most_common()[:50]:
|
183 | if count == 1:
|
184 | break
|
185 | print("%5d %r" % (count, s))
|
186 |
|
187 | ' "$@"
|
188 | }
|
189 |
|
190 | # Results:
|
191 | # Found StrFromC() and len() duplication
|
192 |
|
193 | oil-dupe-strings() {
|
194 | local bin=_bin/cxx-opt/oils-for-unix.stripped
|
195 | #local bin=_bin/clang-opt/oils-for-unix.stripped
|
196 | ninja $bin
|
197 |
|
198 | dupe-strings $bin
|
199 | }
|
200 |
|
201 | "$@"
|