1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
|
from graphlib import TopologicalSorter
from sploit.arch import arch, btoi, itob
from sploit.payload.gadhint import GadHint
from sploit.payload.payload import Payload
from sploit.payload.payload_entry import padalign, padlen
_POP_MAGIC = 0xdead
_SPM_MAGIC = b"\x69"
_ERROR_MAGIC = 0xbaadc0de
class ROP:
"""
ROP chain generation tool
This class contains methods for automating basic return-oriented programming
workloads, such as loading register values and calling into arbitrary
functions or syscalls. The tools are currently designed to work on x86
(32 or 64 bit) and ARM (32 bit only).
The main appeal of the ROP class is the ability to abstract away the manual
construction of ROP chain data, and instead make declarative statements
like "call this function with these arguments". The ROP class will also
utilize its supplied binary objects to automatically find and use trivial
gadgets.
The user is able to provide annotations for more complicated gadgets, which
help instruct the class how to incorporate them into a ROP chain. This is
done with the GadHint dataclass. GadHint objects are provided to a ROP
instance by including them in the Symtbl of one of the binary objects it is
constructed with. If applicable, a user-supplied gadget will take
precedence over automatic gadget searching. See the GadHint module to learn
more about the descriptive attributes that are supported.
objects (list[ELF]): The binary objects this ROP instance will consider for
gadget searching. If one of these is the target executable binary, it
should appear first in the list.
safe_syscalls (bool): If True, require that automatically found syscall
instructions are immediately followed by a return instruction.
align_calls (bool): If True, ensure that the stack return address into
function calls is aligned according to the architecture alignment property.
clean_stack (bool): If True, attempt to locate a cleaning gadget to "pop"
stack data that is leftover from a function call. Required if attempting
to make multiple calls that involve stack-based arguments.
"""
def __init__(self, *objects, safe_syscalls=True, align_calls=True,
clean_stack=True):
"""Construct new ROP builder."""
self.objects = objects
self.safe_syscalls = safe_syscalls
self.align_calls = align_calls
self.clean_stack = clean_stack
def search_gadgets(self, *regexes, cont=False):
"""Return a list of matching gadgets, considering all objects."""
results = []
for obj in self.objects:
results += obj.gadgets(*regexes, cont=cont)
return results
def search_gadget(self, *regexes):
"""Return the first matching gadget, considering all objects."""
for obj in self.objects:
try:
return obj.gadget(*regexes)
except:
pass
raise LookupError(
f"ROP: Need to define gadget symbol for {'; '.join(regexes)}")
def gadget(self, gadget):
"""
Return a generic ROP payload.
gadget (GadHint): Annotated gadget to prepare a chain from.
"""
return self.__build_chain(gadget, {})
def assign(self, **sets):
"""
Return a ROP payload to control given registers.
**sets (str:int): Keyword arguments specify register assignments to
perform with this ROP chain. Argument names correspond to register
names.
"""
return self.gadget(GadHint(requirements=sets))
def call(self, func, *params):
"""
Return a ROP payload to call function.
func (int): Entry address of function to call.
*params (int): Remaining positional args are passed to func.
"""
register_params = dict(zip(arch.funcargs, params))
stack_params = params[len(register_params):]
gadget = GadHint(func, requirements=register_params, stack=stack_params,
align=self.align_calls)
return self.gadget(gadget)
def syscall(self, *params):
"""
Return a ROP payload to call kernel.
*params (int): The first argument is the syscall number. Remaining
positional arguments are passed to the syscall.
"""
if len(params) > len(arch.kernargs):
raise TypeError("ROP: Too many arguments passed to syscall. "
f"Target architecture supports up to {len(arch.kernargs)-1}.")
register_params = dict(zip(arch.kernargs, params))
sc = self.__get_gadget("syscall", {})
return self.gadget(sc.with_requirements(register_params))
def memcpy(self, dst, src):
"""
Return a ROP payload to write data into memory.
dst (int): The destination memory address.
src (bytes): The content to write.
"""
data = Payload()
for idx in range(0, len(src), arch.wordsize):
word = btoi(src[idx:idx+arch.wordsize])
data(self.gadget(self.__get_write(dst+idx, word)))
return data
def __get_hints(self):
"""Return all user-supplied gadget hints."""
return [h for obj in self.objects for _,h in obj.sym if type(h) is GadHint]
def __discover_requirements(self, seen, graph, current):
"""
Populate gadget dependency graph.
This function recursively looks up gadgets to ensure all necessary
required gadgets can be found, and stores this information into the
given graph object. Established dependencies encode the order that the
chain builder should attempt to satisfy register requirements.
Dependency loops are detected by the TopologicalSorter.
seen (set): Set of (register,value) tuples we have already discovered.
graph (TopologicalSorter): Dependency graph model object.
current (GadHint): Current gadget we are processing.
"""
for r, v in current.requirements.items():
# We key on register name _and_ value because some gadgets may
# only be capable of storing specific values in a target register.
# Requiring a register to store different values may require the
# use of multiple gadgets.
if (r, v) not in seen:
gadget = self.__get_gadget(r, current.requirements)
# Add gadget's requirements to the dependency graph.
# We say that each requirement is a 'successor' to this
# current gadget 'r', so that the chain builder will satisfy
# 'r' first. This prevents the fulfillment of 'r' from
# clobbering targets it requires, as the builder will satisfy
# them afterward.
for x in gadget.requirements:
graph.add(x, r)
# Treat gadget's load immediates as pseudo-requirements for
# the sake of target ordering, following the same logic
# as above.
for x in gadget.imms:
graph.add(x, r)
# Mark node as visited
seen.add((r, v))
self.__discover_requirements(seen, graph, gadget)
def __get_gadget(self, target, sets):
"""
Get context-specific gadget.
target (str): Either "ret", "syscall", or the name of a register we
would like to modify.
sets (dict{str:int}): The set of other register requirements we are
trying to fulfill in parallel. Values may affect the gadget we decide
to use.
"""
# First, consider user-provided hints before automatically locating
# gadgets.
for hint in self.__get_hints():
# Setup additional requirements based on hint's register moves.
# If a mov target is in sets, require to set the src to the 'sets'
# value.
addl_reqs = { src:sets[dst] for dst, src in hint.movs.items() if dst in sets }
hint = hint.with_requirements(addl_reqs)
# Pops will be accounted for by the chain builder.
# Immediates will be handled by gadget ordering in chain builder.
# Writes are a non-issue here.
if hint.syscall:
# Only consider syscalls if the target is syscall.
if target == "syscall":
return hint
elif target in hint.imms:
if hint.imms[target] == sets[target]:
return hint
elif target in hint.pops:
return hint
elif target in hint.movs:
return hint
# Automatically locate simple gadgets
if target == "ret":
return GadHint(self.search_gadget(arch.ret))
if target == "syscall":
insns = [arch.syscall, arch.ret] if self.safe_syscalls else [arch.syscall]
return GadHint(self.search_gadget(*insns), syscall=True)
# target == register
insns = [ i.format(target) for i in arch.popgad ]
return GadHint(self.search_gadget(*insns), pops=[target])
def __get_clean(self, size):
"""
Get a stack cleaning gadget that moves sp by _at least_ size.
size (int): Minimum stack pointer move.
"""
# spm values of zero (the default) can't be trusted, as in this case
# the user likely hasn't annotated the GadHint properly. Returning a
# larger move than requested is fine, since the chain builder can insert
# junk to be popped.
for hint in self.__get_hints():
if hint.spm >= size and hint.spm > 0:
return hint
results = self.search_gadgets(*arch.cleangad)
table = { int(g.asm[0].group(1), 0): g for g in results }
sizes = sorted([ x for x in table.keys() if x >= size ])
if len(sizes) > 0:
return GadHint(table[sizes[0]], spm=sizes[0])
raise LookupError(
f"ROP: Need to define a stack move gadget of at least {size}")
def __get_write(self, dst, src):
"""
Get a memory write gadget, injected with requirements for user data.
dst (int): The intended memory write location.
src (int): The intended value to write.
"""
# If any exist, take the first write provided by user hints, assuming
# the user's intent to specifically use _this_ write. Follow-on gadgets
# to setup the dst and src registers must be findable.
for hint in self.__get_hints():
if hint.writes:
d, s = list(hint.writes.items())[0]
return hint.with_requirements({d:dst, s:src})
# Only take an automatic write gadget if we can prove up front that its
# requirements can be met, otherwise move on. A later search result may
# pass the test.
results = self.search_gadgets(*arch.writegad)
for gad in results:
d = gad.asm[0].group("dst")
s = gad.asm[0].group("src")
try:
# Assert requirements are met.
gadget = GadHint(gad, writes={d: s}, requirements={d:dst, s:src})
self.__discover_requirements(set(), TopologicalSorter(), gadget)
return gadget
except:
pass
raise LookupError("ROP: Need to define gadgets for memory write / deps")
def __build_chain(self, gadget, sets):
"""
Generate ROP chain data for a given gadget.
This function recursively builds a ROP chain for the given gadget and
its requirements, returning the result as a Payload.
gadget (GadHint): Current gadget to process.
sets (dict{str:int}): The set of other register requirements we are
trying to fulfill in parallel.
"""
# Form a to-do-list of registers from our immediate requirements,
# attempting to order them such that we avoid overwriting/conflicting
# values. This may not be possible, in which case graph.static_order()
# will raise an exception.
reqs = gadget.requirements
graph = TopologicalSorter({ r:set() for r in reqs })
self.__discover_requirements(set(), graph, gadget)
to_do_list = [ x for x in graph.static_order() if x in reqs ]
chain = Payload()
# Start chain by satisfying to-do-list requirements.
if len(to_do_list) > 0:
chain.requirements = Payload()
while len(to_do_list) > 0:
r = to_do_list[0]
g = self.__get_gadget(r, reqs)
c = self.__build_chain(g, reqs)
chain.requirements[f"{r}_{reqs[r]}"] = c
# This gadget may satisfy multiple items in the to-do-list.
# Specifically, all of its pop and mov targets, and any load
# immediates that match our requirements. Non-matching
# immediates will be handled by a later gadget.
imms = g.imms.keys() & reqs.keys()
imms = [ x for x in imms if g.imms[x] == reqs[x] ]
done = g.pops + list(g.movs) + imms
to_do_list = [ x for x in to_do_list if x not in done ]
# Append chain data to execute this gadget, but respect offset == 0
# as a way to disable this gadget (perform a NULL gadget).
if gadget.offset != 0:
# Stack alignment if required.
if gadget.align:
ret = self.__get_gadget("ret", {})
chain.alignment = padalign(0, itob(ret))
# "Return address" entry into this gadget.
chain.gadget = gadget.offset
# The gadget's "inner stack data" will be values to be popped and
# additional junk data to be deallocated by the gadget itself.
if gadget.pops or gadget.spm > 0:
chain.inner = Payload()
chain.inner(*[ sets.get(p, _POP_MAGIC) for p in gadget.pops ])
if gadget.spm > 0:
chain.inner.pad = padlen(gadget.spm, _SPM_MAGIC)
# The gadget's "outer stack data" will be the additional values
# explicitly specified by the gadget. Append a separate gadget
# to clean up these values.
if gadget.stack:
size = len(gadget.stack) * arch.wordsize
if self.clean_stack:
clean = self.__get_clean(size)
chain.cleanup = clean.offset
pad = padlen(clean.spm, _SPM_MAGIC)
else:
chain.cleanup = _ERROR_MAGIC
pad = None
chain.outer = Payload()
chain.outer(*gadget.stack)
if pad: chain.outer.pad = pad
return chain
|