-
Notifications
You must be signed in to change notification settings - Fork 8
/
Copy pathsymbolize.py
138 lines (115 loc) · 4.87 KB
/
symbolize.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
import sys
import re
import subprocess
import tempfile
import collections
from trie import Trie
mapping = sys.argv[1]
base=sys.argv[2]
inp=sys.argv[3]
conv = dict()
ranges = dict()
pathrange=collections.defaultdict(list)
def multireplace(string, replacements, ignore_case=False):
"""
Given a string and a replacement map, it returns the replaced string.
:param str string: string to execute replacements on
:param dict replacements: replacement dictionary {value to find: value to replace}
:param bool ignore_case: whether the match should be case insensitive
:rtype: str
"""
if not replacements:
# Edge case that'd produce a funny regex and cause a KeyError
return string
# If case insensitive, we need to normalize the old string so that later a replacement
# can be found. For instance with {"HEY": "lol"} we should match and find a replacement for "hey",
# "HEY", "hEy", etc.
if ignore_case:
def normalize_old(s):
return s.lower()
re_mode = re.IGNORECASE
else:
def normalize_old(s):
return s
re_mode = 0
trie = Trie()
for r in replacements:
trie.add(r)
pattern = re.compile(r"(0x)?0*" + trie.pattern() + r"", re.IGNORECASE)
#replacements = {normalize_old(key): val for key, val in replacements.items()}
# Place longer ones first to keep shorter substrings from matching where the longer ones should take place
# For instance given the replacements {'ab': 'AB', 'abc': 'ABC'} against the string 'hey abc', it should produce
# 'hey ABC' and not 'hey ABc'
#rep_sorted = sorted(replacements, key=len, reverse=True)
#rep_escaped = map(re.escape, rep_sorted)
# Create a big OR regex that matches any of the substrings to replace
#pattern = re.compile("|".join(rep_escaped), re_mode)
#pattern = re.compile("|".join(["0?x?(" + a + ")" for a in rep_escaped]), re_mode)
#print(pattern)
# For each match, look up the new string in the replacements, being the key the normalized old string
return pattern.sub(lambda match: replacements[normalize_old("{:x}".format(int(match.group(0),16)))], string)
with open(mapping, 'r') as f:
lines = f.readlines()
for l in lines:
start = int(l.split()[2], 16)
end = int(l.split()[4], 16)
file = l.split()[8]
section_name = l.split()[10]
ranges[(start, end)] = (file, section_name)
# opening the text file
with open(inp,'r') as file:
contents = file.read()
nums = set(re.findall(r'0x[0-9A-Fa-f]+', contents, re.I))
nums.update(set(re.findall(r'[0-9A-Fa-f]+', contents, re.I)))
# print(set(nums))
for n in set(nums):
n = int(n, 16)
for r in ranges:
if(n >= r[0] and n <= r[1]):
path = base+"/"+ranges[r][0].split("/")[-1]
pathrange[(path,ranges[r][1], r[0])].append(n)
reps={}
for r in pathrange:
intemp = tempfile.TemporaryFile()
outtemp = tempfile.TemporaryFile()
for addr in pathrange[r]:
intemp.write("0x{:x}\n".format(addr-r[2]).encode("utf-8"))
intemp.seek(0)
#print(intemp.read().decode("utf-8"))
print(r)
if ".ko" in r[0]:
# print('eu-addr2line --demangle -af -e {} --section={} '.format(r[0],r[1]))
p = subprocess.Popen('eu-addr2line --demangle -af -e {} --section={} '.format(r[0],r[1]), shell=True, stdin=intemp, stdout=outtemp)
else :
a2lpath="addr2line"
binpath="debuginfod-find"
#binpath=elfpath+"./debuginfod/debuginfod-find"
# sopath = ":".join([elfpath+i for i in ["debuginfod/libdebuginfod.so.1", "/libdw/libdw.so.1"]])
# print('{} --demangle -a -f -e $({} debuginfo {} || echo {}) --section={}'.format(a2lpath, binpath, r[0], r[0], r[1]))
p = subprocess.Popen('{} --demangle -a -f -e $({} debuginfo {} || echo {}) --section={}'.format(a2lpath, binpath, r[0], r[0], r[1]), shell=True, stdin=intemp, stdout=outtemp)
ret_code = p.wait()
outtemp.flush()
outtemp.seek(0)
lines = [line.rstrip().decode("utf-8") for line in outtemp]
outtemp.seek(0)
i = 0
while i < len(lines):
addr = pathrange[r][int(i/3)]
func = lines[i+1]
file = lines[i+2]
i+=3
if file.startswith("/local"):
file = file[6:]
rep = "{}[{}](0x{:x})".format(func,file, addr)
# print("{:x} -> {}".format(addr, rep))
reps["{:x}".format(addr)] = rep
#reps["0x{:x}".format(addr)] = rep
#reg = re.compile(r'0?x?0*({:x}|{:X})'.format(addr, addr))
#contents = re.sub(reg, rep, contents)
#contents= contents.replace("0x{:x}".format(addr), rep)
#contents= contents.replace("0x{:X}".format(addr), rep)
#contents= contents.replace("{:x}".format(addr), rep)
#contents= contents.replace("{:X}".format(addr), rep)
contents = multireplace(contents, reps, True)
#print(reps)
print(contents)