xref: /optee_os/scripts/symbolize.py (revision d720431cdf0060bfd6c3e3d078e747f9491d880d)
1733a15f2SJerome Forissier#!/usr/bin/env python
2733a15f2SJerome Forissier#
3733a15f2SJerome Forissier# Copyright (c) 2017, Linaro Limited
4733a15f2SJerome Forissier# All rights reserved.
5733a15f2SJerome Forissier#
6733a15f2SJerome Forissier# Redistribution and use in source and binary forms, with or without
7733a15f2SJerome Forissier# modification, are permitted provided that the following conditions are met:
8733a15f2SJerome Forissier#
9733a15f2SJerome Forissier# 1. Redistributions of source code must retain the above copyright notice,
10733a15f2SJerome Forissier# this list of conditions and the following disclaimer.
11733a15f2SJerome Forissier#
12733a15f2SJerome Forissier# 2. Redistributions in binary form must reproduce the above copyright notice,
13733a15f2SJerome Forissier# this list of conditions and the following disclaimer in the documentation
14733a15f2SJerome Forissier# and/or other materials provided with the distribution.
15733a15f2SJerome Forissier#
16733a15f2SJerome Forissier# THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
17733a15f2SJerome Forissier# AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
18733a15f2SJerome Forissier# IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
19733a15f2SJerome Forissier# ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE
20733a15f2SJerome Forissier# LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
21733a15f2SJerome Forissier# CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
22733a15f2SJerome Forissier# SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
23733a15f2SJerome Forissier# INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
24733a15f2SJerome Forissier# CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
25733a15f2SJerome Forissier# ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
26733a15f2SJerome Forissier# POSSIBILITY OF SUCH DAMAGE.
27733a15f2SJerome Forissier#
28733a15f2SJerome Forissier
29733a15f2SJerome Forissier
30733a15f2SJerome Forissierimport argparse
31733a15f2SJerome Forissierimport glob
32157e6213SJerome Forissierimport os
33733a15f2SJerome Forissierimport re
34733a15f2SJerome Forissierimport subprocess
35733a15f2SJerome Forissierimport sys
36733a15f2SJerome Forissier
# Patterns used to recognise the interesting lines of an OP-TEE abort dump.
# All of them are raw strings so that regex escapes such as \w are never
# interpreted (or warned about) as Python string escapes.

# "Status of TA <uuid>": names the Trusted Application the dump refers to.
TA_UUID_RE = re.compile(r'Status of TA (?P<uuid>[0-9a-f\-]+)')
# ":  arch: <arch>  load address: 0x...": gives the TA load address.
TA_INFO_RE = re.compile(r':  arch: (?P<arch>\w+)  '
                        r'load address: (?P<load_addr>0x[0-9a-f]+)')
# Marks the beginning of the list of call stack addresses.
CALL_STACK_RE = re.compile(r'Call stack:')
# One call stack entry: a colon, two spaces and a hexadecimal address.
STACK_ADDR_RE = re.compile(r':  (?P<addr>0x[0-9a-f]+)')
# "<kind>-abort at address 0x...": the faulting address.
ABORT_ADDR_RE = re.compile(r'-abort at address (?P<addr>0x[0-9a-f]+)')

# Free-form text passed to argparse as the epilog of the --help output.
epilog = '''
This scripts reads an OP-TEE abort message from stdin and adds debug
information ('function at file:line') next to each address in the call stack.
It uses the paths provided on the command line to locate the appropriate ELF
binary (tee.elf or Trusted Application) and runs arm-linux-gnueabihf-addr2line
or aarch64-linux-gnu-addr2line to process the addresses.

OP-TEE abort messages are sent to the secure console. They look like the
following:

  ERROR:   TEE-CORE: User TA data-abort at address 0xffffdecd (alignment fault)
  ...
  ERROR:   TEE-CORE: Call stack:
  ERROR:   TEE-CORE:  0x4000549e
  ERROR:   TEE-CORE:  0x40001f4b
  ERROR:   TEE-CORE:  0x4000273f
  ERROR:   TEE-CORE:  0x40005da7

Inspired by a script of the same name by the Chromium project.

Sample usage:

  $ scripts/symbolize.py -d out/arm-plat-hikey/core -d ../optee_test/out/ta/*
  <paste whole dump here>
  ^D
'''
70733a15f2SJerome Forissier
def get_args(argv=None):
    """Parse the command line of the symbolizer.

    argv -- optional list of argument strings. When None (the default),
            argparse reads the arguments from sys.argv, exactly as before.

    Returns the argparse namespace. 'dir' is None when -d was not given,
    otherwise a list holding one list of paths per occurrence of -d.
    'strip_path' is the value given to -s, or None.
    """
    parser = argparse.ArgumentParser(
        formatter_class=argparse.RawDescriptionHelpFormatter,
        description='Symbolizes OP-TEE abort dumps',
        epilog=epilog)
    # action='append' combined with nargs='+' allows both "-d a b" and
    # "-d a -d b"; the caller is expected to flatten the nested list.
    parser.add_argument(
        '-d', '--dir', action='append', nargs='+',
        help='Search for ELF file in DIR. tee.elf is needed to decode '
             'a TEE Core or pseudo-TA abort, while <TA_uuid>.elf is required '
             'if a user-mode TA has crashed. For convenience, ELF files '
             'may also be given.')
    parser.add_argument(
        '-s', '--strip_path',
        help='Strip STRIP_PATH from file paths')

    return parser.parse_args(argv)
85733a15f2SJerome Forissier
class Symbolizer(object):
    """Line filter that annotates OP-TEE abort dumps with debug information.

    Lines are fed one at a time to write(). They are copied to the output
    object; addresses listed after a 'Call stack:' line are followed by the
    text returned by addr2line, and the abort line is repeated with the
    symbol and section that contain the faulting address.
    """

    def __init__(self, out, dirs, strip_path):
        """Create a symbolizer.

        out        -- object providing write() and flush(); gets the output
        dirs       -- list of directories (or paths to ELF files) to search
        strip_path -- prefix removed from the addr2line output, or None
        """
        self._out = out
        self._dirs = dirs
        self._strip_path = strip_path
        self._addr2line = None
        self.reset()

    @staticmethod
    def _reap(proc):
        """Stop the helper process 'proc' and release its pipes."""
        for pipe in (proc.stdin, proc.stdout):
            if pipe:
                try:
                    pipe.close()
                except IOError:
                    # Closing may try to flush data to a child that is
                    # already gone; there is nothing left to do about it.
                    pass
        try:
            proc.terminate()
        except OSError:
            # The process no longer exists
            pass
        # Collect the exit status so that no zombie is left behind
        proc.wait()

    @staticmethod
    def _match_symbol(lines, ireladdr):
        """Look up 'ireladdr' in 'nm --numeric-sort --print-size' output.

        lines    -- iterable of output lines, sorted by increasing address
        ireladdr -- address (int) relative to the start of the ELF image

        Returns 'name', 'name+<decimal offset>' or '' when nothing matches.
        """
        prev = None  # (address, size, name) of the previous symbol
        for line in lines:
            fields = line.split()
            if len(fields) == 4:
                saddr, ssize, _, name = fields
            elif len(fields) == 3:
                # Size is missing
                saddr, _, name = fields
                ssize = '0'
            else:
                # E.g., an undefined symbol, which has no address at all
                continue
            try:
                iaddr = int(saddr, 16)
                isize = int(ssize, 16)
            except ValueError:
                continue
            if iaddr == ireladdr:
                return name
            if iaddr < ireladdr < iaddr + isize:
                return name + '+' + str(ireladdr - iaddr)
            if iaddr > ireladdr:
                # The address lies between the previous symbol and this
                # one. Attribute it to the previous symbol only if that one
                # has no size information. The input is sorted, so no later
                # line can match either way.
                if prev is not None and prev[1] == 0:
                    return prev[2] + '+' + str(ireladdr - prev[0])
                return ''
            prev = (iaddr, isize, name)
        return ''

    @staticmethod
    def _match_section(lines, iaddr):
        """Look up 'iaddr' in 'objdump --section-headers' output.

        lines -- iterable of output lines
        iaddr -- address (int) relative to the start of the ELF image

        Returns 'name', 'name+<decimal offset>' or '' when nothing matches.
        """
        for line in lines:
            fields = line.split()
            # Section lines are: idx name size vma lma offs algn
            if len(fields) != 7:
                continue
            name, size, vma = fields[1:4]
            try:
                ivma = int(vma, 16)
                isize = int(size, 16)
            except ValueError:
                # Seven words, but not a section line (e.g., a flags line)
                continue
            if ivma == iaddr:
                return name
            if ivma < iaddr < ivma + isize:
                return name + '+' + str(iaddr - ivma)
        return ''

    def get_elf(self, elf_or_uuid):
        """Return the path to the ELF file for 'elf_or_uuid', or None.

        '.elf' is appended to the name when missing. Each entry of the search
        list is accepted as is when it is an existing file whose path ends
        with the name; otherwise it is treated as a directory to look into.
        """
        if not elf_or_uuid.endswith('.elf'):
            elf_or_uuid += '.elf'
        for d in self._dirs:
            if d.endswith(elf_or_uuid) and os.path.isfile(d):
                return d
            elf = glob.glob(d + '/' + elf_or_uuid)
            if elf:
                return elf[0]
        return None

    def set_arch(self):
        """Set the toolchain prefix from what 'file' reports about the ELF.

        Nothing is changed if the prefix is already known, if the ELF file
        cannot be found, or if the output of 'file' is not recognized.
        """
        if self._arch or not self._bin:
            return
        elf = self.get_elf(self._bin)
        if not elf:
            return
        # universal_newlines makes the pipe carry text rather than bytes
        p = subprocess.Popen(['file', elf], stdout=subprocess.PIPE,
                             universal_newlines=True)
        output = p.communicate()[0].splitlines()
        first = output[0] if output else ''
        if 'ARM aarch64,' in first:
            self._arch = 'aarch64-linux-gnu-'
        elif 'ARM,' in first:
            self._arch = 'arm-linux-gnueabihf-'

    def arch_prefix(self, cmd):
        """Return 'cmd' with the toolchain prefix, or '' if it is unknown."""
        self.set_arch()
        if not self._arch:
            return ''
        return self._arch + cmd

    def spawn_addr2line(self):
        """Start addr2line on the current ELF unless it is already running.

        self._addr2line is left unset when the ELF file or the toolchain
        prefix cannot be determined.
        """
        if self._addr2line:
            return
        elf = self.get_elf(self._bin)
        if not elf:
            return
        cmd = self.arch_prefix('addr2line')
        if not cmd:
            return
        self._addr2line = subprocess.Popen([cmd, '-f', '-p', '-e', elf],
                                           stdin=subprocess.PIPE,
                                           stdout=subprocess.PIPE,
                                           universal_newlines=True)

    def subtract_load_addr(self, addr):
        """Convert 'addr' (hex string) to an offset from the load address.

        Returns the offset as a '0x...' string, or '' if 'addr' is below the
        load address.
        """
        iaddr = int(addr, 16)
        ioffs = int(self._load_addr, 16)
        if ioffs > iaddr:
            return ''
        return '0x{:x}'.format(iaddr - ioffs)

    def resolve(self, addr):
        """Return the addr2line description of 'addr' (hex string).

        Returns '???' when the address cannot be looked up and '!!!' when
        talking to addr2line fails.
        """
        reladdr = self.subtract_load_addr(addr)
        if not reladdr:
            return '???'
        self.spawn_addr2line()
        if not self._addr2line:
            return '???'
        try:
            self._addr2line.stdin.write(reladdr + '\n')
            # The pipe may be buffered: make sure the request is sent before
            # waiting for the reply
            self._addr2line.stdin.flush()
            ret = self._addr2line.stdout.readline().rstrip('\n')
        except IOError:
            ret = '!!!'
        return ret

    def symbol_plus_offset(self, addr):
        """Return the symbol that contains 'addr' (hex string), using nm.

        The result is 'name', 'name+<decimal offset>', or '' when the address
        cannot be attributed to a symbol.
        """
        reladdr = self.subtract_load_addr(addr)
        elf = self.get_elf(self._bin)
        if not reladdr or not elf:
            return ''
        cmd = self.arch_prefix('nm')
        if not cmd:
            return ''
        nm = subprocess.Popen([cmd, '--numeric-sort', '--print-size', elf],
                              stdout=subprocess.PIPE,
                              universal_newlines=True)
        try:
            return self._match_symbol(iter(nm.stdout.readline, ''),
                                      int(reladdr, 16))
        finally:
            self._reap(nm)

    def section_plus_offset(self, addr):
        """Return the section that contains 'addr' (hex string), using objdump.

        The result is 'name', 'name+<decimal offset>', or '' when the address
        cannot be attributed to a section.
        """
        reladdr = self.subtract_load_addr(addr)
        elf = self.get_elf(self._bin)
        if not reladdr or not elf:
            return ''
        cmd = self.arch_prefix('objdump')
        if not cmd:
            return ''
        objdump = subprocess.Popen([cmd, '--section-headers', elf],
                                   stdout=subprocess.PIPE,
                                   universal_newlines=True)
        try:
            return self._match_section(iter(objdump.stdout.readline, ''),
                                       int(reladdr, 16))
        finally:
            self._reap(objdump)

    def process_abort(self, line):
        """Return a copy of the abort line with symbol/section appended.

        The symbol and section are inserted right after the abort address.
        Returns '' if the line has no abort address or if neither a symbol
        nor a section could be found.
        """
        match = ABORT_ADDR_RE.search(line)
        if not match:
            return ''
        addr = match.group('addr')
        sym = self.symbol_plus_offset(addr)
        sec = self.section_plus_offset(addr)
        if not sym and not sec:
            return ''
        ret = line[:match.start('addr')] + addr
        if sym:
            ret += ' ' + sym
        if sec:
            ret += ' ' + sec
        return ret + line[match.end('addr'):]

    def reset(self):
        """Forget everything learned from the dump processed so far."""
        self._call_stack_found = False
        self._load_addr = '0'
        # Unless a 'Status of TA' line says otherwise, the dump is assumed
        # to come from the TEE core. This has to be restored along with the
        # load address, or a dump that follows a TA dump would be resolved
        # against the ELF file of that TA.
        self._bin = 'tee.elf'
        if self._addr2line:
            self._reap(self._addr2line)
            self._addr2line = None
        self._arch = None
        self._saved_abort_line = ''

    def write(self, line):
        """Process one line of the dump and write the result to the output."""
        if self._call_stack_found:
            match = STACK_ADDR_RE.search(line)
            if match:
                addr = match.group('addr')
                self._out.write(line[:match.start('addr')])
                self._out.write(addr)
                res = self.resolve(addr)
                if self._strip_path:
                    res = re.sub(re.escape(self._strip_path) + '/*', '',
                                 res)
                self._out.write(' ' + res)
                self._out.write(line[match.end('addr'):])
                return
            # First line that is not an address: the call stack is over
            self.reset()
        if CALL_STACK_RE.search(line):
            self._call_stack_found = True
            # Here is a good place to resolve the abort address because we
            # have all the information we need
            if self._saved_abort_line:
                self._out.write(self.process_abort(self._saved_abort_line))
        match = TA_UUID_RE.search(line)
        if match:
            self._bin = match.group('uuid')
        match = TA_INFO_RE.search(line)
        if match:
            self._load_addr = match.group('load_addr')
        if ABORT_ADDR_RE.search(line):
            # At this point the arch and TA load address are unknown.
            # Save the line so we can translate the abort address later.
            self._saved_abort_line = line
        self._out.write(line)

    def flush(self):
        """Flush the output object."""
        self._out.flush()
284733a15f2SJerome Forissier
def main():
    """Symbolize the abort dump read from stdin and print it to stdout."""
    args = get_args()
    # -d may be used several times *and* with multiple arguments, in which
    # case argparse returns a list of lists (None if -d was never given).
    # Turn it into a plain list of paths.
    search_paths = []
    for group in args.dir or []:
        search_paths.extend(group)
    symbolizer = Symbolizer(sys.stdout, search_paths, args.strip_path)

    for line in sys.stdin:
        symbolizer.write(line)
    symbolizer.flush()


if __name__ == "__main__":
    main()
301