-
Notifications
You must be signed in to change notification settings - Fork 23
/
Copy pathprogdb.py
184 lines (136 loc) · 4.48 KB
/
progdb.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
#
# This module deals with various "program databases" as required
# for analysis passes. Among them: function database (funcdb.yaml),
# databases of structures, etc.
#
import os.path
import copy
import logging
import yaml
import yamlutils
import utils
from utils import repr_stable
import core
from core import is_addr, is_value, is_expr, EXPR
# Logger for this module.
_log = logging.getLogger(__name__)

# Function property dicts indexed by function label (filled in by set_funcdb()).
FUNC_DB = {}
# Function property dicts indexed by function address (installed by
# set_funcdb(), extended by update_funcdb()).
FUNC_DB_BY_ADDR = {}

# Struct databases; replaced and read through the set_struct_*() and
# get_struct_*() accessors defined later in this module.
struct_types = {}
struct_instances = {}
def set_funcdb(db):
    """Install *db* as the current function database.

    *db* is keyed by function address and becomes FUNC_DB_BY_ADDR. Every
    property dict in it is additionally registered in FUNC_DB under the
    value of its "label" key.
    """
    global FUNC_DB, FUNC_DB_BY_ADDR
    # list() takes a snapshot, so inserting into FUNC_DB stays safe even if
    # db happens to be that very same dict.
    for func_props in list(db.values()):
        FUNC_DB[func_props["label"]] = func_props
    FUNC_DB_BY_ADDR = db
# Names of function properties that hold collections of registers:
# preprocess_funcdb() passes them through reglist2set(), and
# postprocess_funcdb() turns them back into sorted lists of register names.
REG_PROPS = [
    "callsites_live_out", "modifieds", "preserveds", "reach_exit", "reach_exit_maybe",
    "params", "estimated_params", "returns",
]
def reglist2set(regs):
    """Return a set containing core.REG(item) for every item of *regs*."""
    return {core.REG(reg) for reg in regs}
def preprocess_funcdb(FUNC_DB):
    """Convert a freshly loaded function DB to its in-memory form, in place.

    For every entry of *FUNC_DB*:

    * each property named in REG_PROPS is replaced by the result of
      reglist2set() applied to it;
    * each triple in "calls_live_out" gets its second element wrapped in
      core.ADDR and its third element converted with reglist2set(); the
      first element is kept as is.
    """
    for func_props in FUNC_DB.values():
        for reg_prop in REG_PROPS:
            if reg_prop not in func_props:
                continue
            func_props[reg_prop] = reglist2set(func_props[reg_prop])

        if "calls_live_out" in func_props:
            func_props["calls_live_out"] = [
                (head, core.ADDR(addr), reglist2set(regs))
                for head, addr, regs in func_props["calls_live_out"]
            ]
def postprocess_funcdb(FUNC_DB):
    """Convert a function DB back to plain lists of register names, in place.

    For every entry of *FUNC_DB*, each property named in REG_PROPS is
    replaced by the list of the `.name` attributes of its members, sorted
    with utils.natural_sort_key.
    """
    for func_props in FUNC_DB.values():
        for reg_prop in REG_PROPS:
            if reg_prop not in func_props:
                continue
            reg_names = [reg.name for reg in func_props[reg_prop]]
            reg_names.sort(key=utils.natural_sort_key)
            func_props[reg_prop] = reg_names
def load_funcdb(*fnames):
    """Load the function DB from one or more YAML files and make it current.

    The files are merged in the order given, so an entry from a later file
    replaces an entry with the same key from an earlier one. The merged
    database is then converted with preprocess_funcdb() and installed with
    set_funcdb().

    Empty files are accepted and contribute nothing.
    """
    merged = {}
    for fname in fnames:
        with open(fname) as f:
            db = yaml.safe_load(f)
        # safe_load() returns None for an empty document; treat that as an
        # empty database instead of failing inside dict.update().
        if db:
            merged.update(db)

    preprocess_funcdb(merged)
    set_funcdb(merged)
def save_funcdb(fname, backup=True):
    """Write the current function DB (FUNC_DB_BY_ADDR) to *fname* as YAML.

    A deep copy of the database is converted with postprocess_funcdb(), so
    the in-memory database itself is not modified. If *backup* is true and
    *fname* already exists, the existing file is first moved to
    fname + ".bak", replacing any previous backup.
    """
    db = copy.deepcopy(FUNC_DB_BY_ADDR)
    postprocess_funcdb(db)

    if backup and os.path.exists(fname):
        # os.replace() overwrites an existing backup on every platform;
        # os.rename() raises on Windows when the ".bak" file already exists.
        os.replace(fname, fname + ".bak")

    with open(fname, "w") as f:
        yaml.dump(db, f)
def check_invariants(cfg):
    """Assert that the properties of *cfg* are mutually consistent.

    One invariant is checked: when "reach_exit" is present, the
    "reach_exit_maybe" set (taken as empty when absent) must be a subset
    of it. An AssertionError naming the function is raised otherwise.
    """
    props = cfg.props
    if "reach_exit" not in props:
        return

    sure = props["reach_exit"]
    maybe = props.get("reach_exit_maybe", set())
    assert maybe.issubset(sure), "%s: maybe: %s, sure: %s" % (
        props["name"], repr_stable(maybe), repr_stable(sure))
def update_funcdb(cfg):
    """Merge the properties of one processed CFG into the function DB.

    A CFG without an "addr" property is ignored. Otherwise, after
    check_invariants(), the entry for that address in FUNC_DB_BY_ADDR is
    created if missing, its "label" is set to the CFG's name, a fixed set of
    properties is copied over unchanged, and the reference properties
    ("calls", "calls_indir", "func_refs", "mmio_refs") are stored as sorted
    lists of their external representations.
    """
    props = cfg.props
    if "addr" not in props:
        return

    check_invariants(cfg)

    entry = FUNC_DB_BY_ADDR.setdefault(props["addr"], {})
    entry["label"] = props["name"]

    # Properties copied into the DB entry unchanged.
    copied_as_is = (
        "params", "estimated_params", "params_why", "modifieds", "preserveds",
        "reach_exit", "reach_exit_maybe", "calls_live_out", "noreturn",
        "has_infloops"
    )
    for name in copied_as_is:
        if name in props:
            entry[name] = props[name]

    def ext_repr(x):
        # Addresses are stored by their .addr, values as hex strings and
        # anything else by its str().
        if is_addr(x):
            return x.addr
        if is_value(x):
            return hex(x.val)
        value_on_the_right = (
            is_expr(x) and x.op == "+" and len(x.args) == 2 and is_value(x.args[1])
        )
        if value_on_the_right:
            # Move the value operand of a two-argument sum to the front.
            x = EXPR("+", [x.args[1], x.args[0]])
        return str(x)

    for name in ("calls", "calls_indir", "func_refs", "mmio_refs"):
        if name in props:
            entry[name] = sorted(ext_repr(ref) for ref in props[name])
#
# Updated funcs tracking
#
# Everything passed to mark_updated() since the last clear_updated().
UPDATED_FUNCS = set()
def clear_updated():
    """Empty the UPDATED_FUNCS set."""
    UPDATED_FUNCS.clear()
def mark_updated(func):
    """Add *func* to the UPDATED_FUNCS set."""
    UPDATED_FUNCS.add(func)
def update_cfg_prop(cfg, prop, new_val):
    """Set property *prop* of *cfg* to *new_val*, tracking actual changes.

    If *new_val* differs from the current value (None when the property is
    absent), the CFG's name is passed to mark_updated() and the change is
    logged at INFO level. The property is assigned in either case.
    """
    old_val = cfg.props.get(prop)
    if old_val != new_val:
        func_name = cfg.props["name"]
        mark_updated(func_name)
        _log.info("%s: %s updated from %s to %s" % (
            func_name, prop, utils.repr_stable(old_val), utils.repr_stable(new_val)))
    cfg.props[prop] = new_val
#
# Symtab functions
#
# Maps a symbol name to its integer address; filled in by load_symtab().
SYMTAB = {}
def load_symtab(fname):
    """Load a symbol table from text file *fname* into SYMTAB.

    Each non-blank line must consist of exactly two whitespace-separated
    fields: a hexadecimal address followed by a symbol name. Blank lines
    are skipped.

    Raises ValueError if a non-blank line does not have exactly two fields
    or if its address field is not valid hexadecimal.
    """
    with open(fname) as f:
        for line in f:
            fields = line.split()
            if not fields:
                # Tolerate blank lines (e.g. a trailing one) instead of
                # failing on the two-field unpacking below.
                continue
            addr, sym = fields
            SYMTAB[sym] = int(addr, 16)
def lookup_sym(sym):
    """Return the real memory (not symbolic) address of symbol *sym*.

    Intended for the bindata module. Raises KeyError if *sym* is not in
    SYMTAB.
    """
    return SYMTAB[sym]
#
# Struct database functions
#
def set_struct_types(data):
    """Replace the module-level struct_types database with *data*."""
    global struct_types
    struct_types = data
def set_struct_instances(data):
    """Replace the module-level struct_instances database with *data*."""
    global struct_instances
    struct_instances = data
def get_struct_types():
    """Return the current module-level struct_types database."""
    # Reading a module global needs no `global` declaration.
    return struct_types
def get_struct_instances():
    """Return the current module-level struct_instances database."""
    # Reading a module global needs no `global` declaration.
    return struct_instances