| #!/usr/bin/env python |
| # -*- coding: utf-8 -*- |
| # |
| # Copyright (c) 2018 Free Software Foundation |
| # Contributed by Bernhard Reutner-Fischer <aldot@gcc.gnu.org> |
| # Inspired by bloat-o-meter from busybox. |
| |
| # This software may be used and distributed according to the terms and |
| # conditions of the GNU General Public License as published by the Free |
| # Software Foundation. |
| |
| # For a set of object-files, determine symbols that are |
| # - public but should be static |
| |
| # Examples: |
| # unused_functions.py ./gcc/fortran |
| # unused_functions.py gcc/c gcc/c-family/ gcc/*-c.o | grep -v "'gt_" |
| # unused_functions.py gcc/cp gcc/c-family/ gcc/*-c.o | grep -v "'gt_" |
| |
| import sys, os |
| from tempfile import mkdtemp |
| from subprocess import Popen, PIPE |
| |
def usage():
    """Write the command-line synopsis to stderr and exit with status 1."""
    synopsis = ("usage: %s [-v] [dirs | files] [-- <readelf options>]\n"
                % sys.argv[0])
    options = "\t-v\tVerbose output\n"
    for text in (synopsis, options):
        sys.stderr.write(text)
    sys.exit(1)
| |
# Command-line state shared by the rest of the script:
#   odir     - set of files and directories to scan
#   sym_args - extra options for readelf (everything after '--'), joined
#              with single blanks
#   tmpd     - scratch directory for extracting archives, None if unused
#   verbose  - True when -v was given
(odir, sym_args, tmpd, verbose) = (set(), "", None, False)

for i, f in enumerate(sys.argv[1:], 1):
    if f == '--': # sym_args
        sym_args = ' '.join(sys.argv[i + 1:])
        break
    if f == '-v':
        verbose = True
        continue
    if not os.path.exists(f):
        sys.stderr.write("Error: No such file or directory '%s'\n" % f)
        usage()
    else:
        odir.add(f)

# Create the scratch directory only after every argument has been
# validated.  Creating it inside the loop leaked the directory whenever a
# later argument did not exist and usage() terminated the script.
if any(f.endswith('.a') for f in odir):
    tmpd = mkdtemp(prefix='unused_fun')
| |
def dbg(args):
    """Print args to stdout, but only when the global verbose flag is set."""
    if verbose:
        print(args)
| |
def get_symbols(file):
    """Return the relevant symbols of one object file.

    Runs "readelf -W -s" on file (with the extra readelf options from the
    module-level sym_args), pipes the output through c++filt and parses
    the resulting symbol table.

    The result maps each symbol name to a dict of flags, each present (and
    True) only when it applies:
      'def' / 'use'      - defined in this file / undefined reference
      'global' / 'local' - binding is GLOBAL / anything else

    Left out are SECTION and FILE entries, symbols whose visibility is not
    DEFAULT and definitions whose binding is not GLOBAL.  Rows that do not
    split into exactly eight whitespace separated fields are skipped as
    well; that includes names that contain blanks after demangling.

    A warning is printed to stdout if readelf or c++filt exits with a
    non-zero status; whatever could be parsed is still returned.
    """
    syms = {}
    # Build an argument vector rather than splitting a formatted command
    # string, so a file name containing blanks stays one argument.
    rargs = ["readelf", "-W", "-s"]
    rargs.extend(a for a in sym_args.split(' ') if a.strip() != '')
    rargs.append(file)
    p0 = Popen(rargs, stdout=PIPE)
    p1 = Popen(["c++filt"], stdin=p0.stdout, stdout=PIPE,
               universal_newlines=True)
    # Drop our copy of the pipe so readelf gets SIGPIPE should c++filt
    # exit early, instead of blocking on a pipe nobody reads.
    p0.stdout.close()
    lines = p1.communicate()[0]
    # Reap readelf: without this its returncode stays None and a readelf
    # failure would never show up in the warning below.
    p0.wait()
    for l in lines.split('\n'):
        l = l.strip()
        if not l or not l[0].isdigit(): continue
        larr = l.split()
        if len(larr) != 8: continue
        # Fields: num, value, size, typ, bind, vis, ndx, name
        typ, bind, vis, ndx, name = larr[3:]
        if typ == 'SECTION' or typ == 'FILE': continue
        # I don't think we have many aliases in gcc, re-instate the addr
        # lut (keyed on the value and size fields) otherwise.
        if vis != 'DEFAULT': continue
        defined = ndx != 'UND'
        globl = bind == 'GLOBAL'
        # c++ RID_FUNCTION_NAME dance. FORNOW: Handled as local use
        # Is that correct?
        if name.endswith('::__FUNCTION__') and typ == 'OBJECT':
            name = name[:-len('::__FUNCTION__')]
            defined = False
        if defined and not globl: continue
        flags = syms.setdefault(name, {})
        flags['def' if defined else 'use'] = True
        flags['global' if globl else 'local'] = True
    # Note: we could filter out e.g. debug_* symbols by looking for
    # value in the debug_macro sections.
    if p0.returncode != 0 or p1.returncode != 0:
        print("Warning: Reading file '%s' exited with %r|%r"
              % (file, p0.returncode, p1.returncode))
    return syms
| |
# Module-level symbol tables, both starting out empty.  oprog is replaced
# by the result of walker() further down; nprog is not used in the code
# visible here.
oprog = {}
nprog = {}
| |
def walker(paths):
    """Collect the symbols of all object files reachable from paths.

    Each entry of paths is handled according to what it is:
      - a directory is scanned recursively;
      - an archive (*.a) is extracted with "ar x" into a mirror of its
        path below the scratch directory tmpd, to be picked up when tmpd
        itself is walked.  If "ar x" exits with a positive status the
        archive is assumed to be thin and the members listed by "ar t"
        are processed in place instead;
      - an object file (*.o) is read with get_symbols();
      - anything else is ignored.

    Returns a dict mapping the normalized path of every object file read
    to the symbol dict returned by get_symbols().
    """
    def ar_x(archive):
        """Extract archive below tmpd.

        Returns (archive, directory) on success and (archive, None) when
        "ar x" exited with a positive status.
        """
        global tmpd
        dbg("Archive %s" % archive)
        if tmpd is None:
            # The archive turned up while scanning a directory and no
            # archive was named on the command line, so no scratch
            # directory exists yet.
            tmpd = mkdtemp(prefix='unused_fun')
        f = os.path.abspath(archive)
        f = os.path.splitdrive(f)[1]
        # f is absolute, so plain concatenation is used: os.path.join()
        # would discard tmpd.
        d = os.path.normpath(tmpd + os.path.sep + f)
        owd = os.getcwd()
        try:
            if not os.path.isdir(d):
                os.makedirs(d)
            os.chdir(d)
            p0 = Popen(["ar", "x", os.path.join(owd, archive)],
                       stderr=PIPE, universal_newlines=True)
            p0.communicate()
            if p0.returncode > 0: d = None # assume thin archive
        except Exception:
            dbg("ar x: Error: %s: %s" % (archive, sys.exc_info()[0]))
            raise
        finally:
            # Always return to the original working directory.
            os.chdir(owd)
        if d: dbg("Extracted to %s" % (d))
        return (archive, d)

    def ar_t(archive):
        """Return the lines printed by "ar t" for archive."""
        dbg("Thin archive, using existing files:")
        try:
            p0 = Popen(["ar", "t", archive], stdout=PIPE,
                       universal_newlines=True)
            ret = p0.communicate()[0]
            return ret.split('\n')
        except Exception:
            dbg("ar t: Error: %s: %s" % (archive, sys.exc_info()[0]))
            raise

    prog = {}
    for path in paths:
        if os.path.isdir(path):
            # os.walk() already descends into every sub-directory, so only
            # the files of each visited directory are handed on.  Calling
            # walker() on dirs as well re-scanned nested directories again
            # and again and extracted archives found there a second time,
            # which made os.makedirs() fail.  followlinks=True keeps
            # symlinked directories covered, as that recursion used to.
            for r, dirs, files in os.walk(path, followlinks=True):
                if files: dbg("Files %s" % ", ".join(files))
                if dirs: dbg("Dirs %s" % ", ".join(dirs))
                prog.update(walker([os.path.join(r, f) for f in files]))
        elif path.endswith('.a'):
            # A successfully extracted archive is read later via tmpd.
            if ar_x(path)[1] is None:
                prog.update(walker(ar_t(path)))
        elif path.endswith('.o'):
            dbg("Reading symbols from %s" % (path))
            prog[os.path.normpath(path)] = get_symbols(path)
    return prog
| |
def resolve(prog):
    """Return the set of symbols that are referenced across files.

    prog maps a file name to its symbol dict (symbol name -> flag dict).
    A symbol counts as externally referenced when one file has it flagged
    'def' and a different file has it flagged 'use'.

    Side effect: every externally referenced symbol is deleted from all
    symbol dicts in prog, so only the remaining candidates are left.
    """
    # One pass over all symbols builds a per-symbol index.  This replaces
    # a scan over every ordered pair of files and gives the same result.
    holders = {}   # symbol -> files whose table contains it
    definers = {}  # symbol -> files flagging it 'def'
    users = {}     # symbol -> files flagging it 'use'
    for fname, syms in prog.items():
        for sym, flags in syms.items():
            holders.setdefault(sym, []).append(fname)
            if flags.get('def'):
                definers.setdefault(sym, set()).add(fname)
            if flags.get('use'):
                users.setdefault(sym, set()).add(fname)

    use = set()
    for sym, def_files in definers.items():
        use_files = users.get(sym)
        # With at least one definer and one user, a definer/user pair of
        # different files exists exactly when two or more distinct files
        # are involved overall.
        if use_files and len(def_files | use_files) > 1:
            use.add(sym)

    # Prune externally referenced symbols from every file that lists them.
    for sym in use:
        for fname in holders[sym]:
            del prog[fname][sym]
    return use
| |
# Read the symbols of everything named on the command line, plus the
# members of any archives extracted to the scratch directory, then work
# out which symbols are referenced across files.
try:
    oprog = walker(odir)
    if tmpd is not None:
        oprog.update(walker([tmpd]))
    oused = resolve(oprog)
finally:
    # Clean up only if a scratch directory exists.  With tmpd unset the
    # former "rm -r -f None" would have deleted an unrelated file or
    # directory named "None" in the current directory.
    if tmpd is not None:
        from shutil import rmtree
        rmtree(tmpd, ignore_errors=True)

# resolve() removed every symbol that is referenced from another file, so
# a definition still listed here has no user outside its own file.
for i, syms in oprog.items():
    for s, flags in syms.items():
        if flags.get('def') and not flags.get('use'):
            print("%s: Symbol '%s' declared extern but never referenced externally"
                  % (i, s))
| |
| |