Skip to content

Commit 1ce1ad0

Browse files
committed
refactor!: ql own mem as bytearray, ref passed to uc and r2
BREAKING CHANGE: mem is managed in Python instead of uc BREAKING CHANGE: MapInfoEntry now has 6 elements instead of 5 BREAKING CHANGE: r2 map io from ql.mem, no full binary, now missing symbols BREAKING CHANGE: del_mapinfo and change_mapinfo recreate and remap mem Add unit tests for ql mem operations Also fix potential bug in syscall_munmap
1 parent cb7ca60 commit 1ce1ad0

File tree

8 files changed

+282
-53
lines changed

8 files changed

+282
-53
lines changed

examples/extensions/r2/hello_r2.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -35,7 +35,7 @@ def my_sandbox(path, rootfs):
3535
ql.hook_address(func, r2.functions['main'].offset)
3636
# enable trace powered by r2 symsmap
3737
# r2.enable_trace()
38-
r2.bt(0x401906)
38+
r2.set_backtrace(0x401906)
3939
ql.run()
4040

4141
if __name__ == "__main__":

examples/extensions/r2/mem_r2.py

Lines changed: 88 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,88 @@
1+
import sys
2+
from types import FrameType
3+
sys.path.append('..')
4+
5+
from tests.test_elf import ELFTest
6+
from qiling import Qiling
7+
from qiling.const import QL_VERBOSE
8+
from qiling.extensions.r2 import R2
9+
10+
def test_elf_linux_arm():
11+
def my_puts(ql: Qiling):
12+
params = ql.os.resolve_fcall_params(ELFTest.PARAMS_PUTS)
13+
print(f'puts("{params["s"]}")')
14+
# all_mem = ql.mem.save()
15+
# for lbound, ubound, perm, _, _, _data in ql.mem.map_info:
16+
# print(f"{lbound:#x} - {ubound:#x} {ubound - lbound:#x} {len(_data):#x} {perm:#x}")
17+
# print()
18+
# ql.mem.restore(all_mem)
19+
20+
ql = Qiling(["../examples/rootfs/arm_linux/bin/arm_stat64"], "../examples/rootfs/arm_linux", verbose=QL_VERBOSE.DEBUG)
21+
ql.os.set_api('puts', my_puts)
22+
ql.run()
23+
del ql
24+
25+
def fn(frame: FrameType, msg, arg):
26+
if msg == 'return':
27+
print("Return: ", arg)
28+
return
29+
if msg != 'call': return
30+
# Filter as appropriate
31+
if 'memory' not in frame.f_code.co_filename: return
32+
if '<' in frame.f_code.co_name: return
33+
caller = frame.f_back.f_code.co_name
34+
print("Called ", frame.f_code.co_name, "from ", caller)
35+
for i in range(frame.f_code.co_argcount):
36+
name = frame.f_code.co_varnames[i]
37+
var = frame.f_locals[name]
38+
if isinstance(var, (bytes, bytearray)):
39+
var = f'{type(var)} len {len(var)}'
40+
print(" Argument", name, "is", var)
41+
42+
sys.settrace(fn)
43+
44+
def unmap_hook(ql: "Qiling", access: int, addr: int, size: int, value: int):
45+
print(f"Unmapped memory access at {addr:#x} - {addr + size:#x} with {value:#x} in type {access}")
46+
47+
def mem_cmp_hook(ql: "Qiling", addr: int, size: int):
48+
mapinfo = ql.mem.map_info
49+
for i, mem_region in enumerate(ql.uc.mem_regions()):
50+
assert (mapinfo[i][0], mapinfo[i][1] - 1, mapinfo[i][2]) == mem_region
51+
uc_mem = ql.mem.read(mem_region[0], mem_region[1] - mem_region[0] + 1)
52+
data = ql.mem.map_info[i][5]
53+
if uc_mem == data: continue
54+
print(f"Memory region {i} {mem_region[0]:#x} - {mem_region[1]:#x} not equal to map_info from {addr:#x}")
55+
for line in ql.mem.get_formatted_mapinfo():
56+
print(line)
57+
with open("mem.bin", "wb") as f:
58+
f.write(uc_mem)
59+
with open("map.bin", "wb") as f:
60+
f.write(data)
61+
assert False
62+
63+
def addr_hook(ql: "Qiling"):
64+
mapinfo = ql.mem.map_info
65+
for i, mem_region in enumerate(ql.uc.mem_regions()):
66+
if i != 8: continue
67+
uc_mem = ql.mem.read(mem_region[0], mem_region[1] - mem_region[0] + 1)
68+
with open('right.bin', 'wb') as f:
69+
f.write(uc_mem)
70+
71+
if __name__ == '__main__':
72+
# from tests.test_shellcode import X8664_LIN
73+
env = {'LD_DEBUG': 'all'}
74+
# ql = Qiling(rootfs="rootfs/x8664_linux", code=X8664_LIN, archtype="x8664", ostype="linux", verbose=QL_VERBOSE.DEBUG)
75+
# ql = Qiling(["rootfs/x86_windows/bin/x86_hello.exe"], "rootfs/x86_windows")
76+
# ql = Qiling(["rootfs/arm_linux/bin/arm_hello_static"], "rootfs/arm_linux", verbose=QL_VERBOSE.DISASM)
77+
# ql = Qiling(["rootfs/arm_linux/bin/arm_hello"], "rootfs/arm_linux", env=env, verbose=QL_VERBOSE.DEBUG)
78+
ql = Qiling(["rootfs/x86_linux/bin/x86_hello"], "rootfs/x86_linux", verbose=QL_VERBOSE.DEBUG)
79+
# ql.hook_mem_unmapped(unmap_hook)
80+
# ql.hook_code(mem_cmp_hook)
81+
# mprot_addr = 0x047d4824
82+
# ql.hook_address(addr_hook, mprot_addr)
83+
# ql.debugger = 'qdb'
84+
# ql = Qiling(["rootfs/x8664_linux/bin/testcwd"], "rootfs/x8664_linux", verbose=QL_VERBOSE.DEBUG)
85+
for line in ql.mem.get_formatted_mapinfo():
86+
print(line)
87+
ql.run()
88+
# test_elf_linux_arm()

qiling/arch/utils.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -27,7 +27,7 @@ def __init__(self, ql: Qiling):
2727

2828
@lru_cache(maxsize=64)
2929
def get_base_and_name(self, addr: int) -> Tuple[int, str]:
30-
for begin, end, _, name, _ in self.ql.mem.map_info:
30+
for begin, end, _, name, _, _ in self.ql.mem.map_info:
3131
if begin <= addr < end:
3232
return begin, basename(name)
3333

qiling/extensions/r2/r2.py

Lines changed: 16 additions & 17 deletions
Original file line numberDiff line numberDiff line change
@@ -142,10 +142,8 @@ def __init__(self, ql: "Qiling", baseaddr=(1 << 64) - 1, loadaddr=0):
142142
self.loadaddr = loadaddr # r2 -m [addr] map file at given address
143143
self.analyzed = False
144144
self._r2c = libr.r_core.r_core_new()
145-
if ql.code:
146-
self._setup_code(ql.code)
147-
else:
148-
self._setup_file(ql.path)
145+
self._r2i = ctypes.cast(self._r2c.contents.io, ctypes.POINTER(libr.r_io.struct_r_io_t))
146+
self._setup_mem(ql)
149147

150148
def _qlarch2r(self, archtype: QL_ARCH) -> str:
151149
return {
@@ -162,20 +160,21 @@ def _qlarch2r(self, archtype: QL_ARCH) -> str:
162160
QL_ARCH.PPC: "ppc",
163161
}[archtype]
164162

165-
def _setup_code(self, code: bytes):
166-
path = f'malloc://{len(code)}'.encode()
167-
fh = libr.r_core.r_core_file_open(self._r2c, path, UC_PROT_ALL, self.loadaddr)
168-
libr.r_core.r_core_bin_load(self._r2c, path, self.baseaddr)
169-
self._cmd(f'wx {code.hex()}')
163+
def _rbuf_map(self, buf: bytearray, perm: int = UC_PROT_ALL, addr: int = 0, delta: int = 0):
164+
rbuf = libr.r_buf_new_with_pointers(ctypes.c_ubyte.from_buffer(buf), len(buf), False)
165+
rbuf = ctypes.cast(rbuf, ctypes.POINTER(libr.r_io.struct_r_buf_t))
166+
desc = libr.r_io_open_buffer(self._r2i, rbuf, perm, 0) # last arg `mode` is always 0 in r2 code
167+
libr.r_io.r_io_map_add(self._r2i, desc.contents.fd, desc.contents.perm, delta, addr, len(buf))
168+
169+
def _setup_mem(self, ql: 'Qiling'):
170+
if not hasattr(ql, '_mem'):
171+
return
172+
for start, end, perms, _label, _mmio, buf in ql.mem.map_info:
173+
self._rbuf_map(buf, perms, start)
170174
# set architecture and bits for r2 asm
171-
arch = self._qlarch2r(self.ql.arch.type)
172-
self._cmd(f"e,asm.arch={arch},asm.bits={self.ql.arch.bits}")
173-
174-
def _setup_file(self, path: str):
175-
path = path.encode()
176-
fh = libr.r_core.r_core_file_open(self._r2c, path, UC_PROT_READ | UC_PROT_EXEC, self.loadaddr)
177-
libr.r_core.r_core_bin_load(self._r2c, path, self.baseaddr)
178-
175+
arch = self._qlarch2r(ql.arch.type)
176+
self._cmd(f"e,asm.arch={arch},asm.bits={ql.arch.bits}")
177+
179178
def _cmd(self, cmd: str) -> str:
180179
r = libr.r_core.r_core_cmd_str(
181180
self._r2c, ctypes.create_string_buffer(cmd.encode("utf-8")))

qiling/os/memory.py

Lines changed: 64 additions & 32 deletions
Original file line numberDiff line numberDiff line change
@@ -3,6 +3,7 @@
33
# Cross Platform and Multi Architecture Advanced Binary Emulation Framework
44
#
55

6+
import ctypes
67
import os, re
78
from typing import Any, Callable, Iterator, List, Mapping, MutableSequence, Optional, Pattern, Sequence, Tuple, Union
89

@@ -11,8 +12,8 @@
1112
from qiling import Qiling
1213
from qiling.exception import *
1314

14-
# tuple: range start, range end, permissions mask, range label, is mmio?
15-
MapInfoEntry = Tuple[int, int, int, str, bool]
15+
# tuple: range start, range end, permissions mask, range label, is mmio?, bytearray
16+
MapInfoEntry = Tuple[int, int, int, str, bool, bytearray]
1617

1718
MmioReadCallback = Callable[[Qiling, int, int], int]
1819
MmioWriteCallback = Callable[[Qiling, int, int, int], None]
@@ -48,6 +49,8 @@ def __init__(self, ql: Qiling):
4849
# make sure pagesize is a power of 2
4950
assert self.pagesize & (self.pagesize - 1) == 0, 'pagesize has to be a power of 2'
5051

52+
self.cmap = {} # mapping from start addr to cdata ptr
53+
5154
def __read_string(self, addr: int) -> str:
5255
ret = bytearray()
5356
c = self.read(addr, 1)
@@ -80,7 +83,7 @@ def string(self, addr: int, value=None, encoding='utf-8') -> Optional[str]:
8083

8184
self.__write_string(addr, value, encoding)
8285

83-
def add_mapinfo(self, mem_s: int, mem_e: int, mem_p: int, mem_info: str, is_mmio: bool = False):
86+
def add_mapinfo(self, mem_s: int, mem_e: int, mem_p: int, mem_info: str, is_mmio: bool = False, data : bytearray = None):
8487
"""Add a new memory range to map.
8588
8689
Args:
@@ -90,12 +93,11 @@ def add_mapinfo(self, mem_s: int, mem_e: int, mem_p: int, mem_info: str, is_mmio
9093
mem_info: map entry label
9194
is_mmio: memory range is mmio
9295
"""
93-
94-
self.map_info.append((mem_s, mem_e, mem_p, mem_info, is_mmio))
95-
self.map_info = sorted(self.map_info, key=lambda tp: tp[0])
96+
self.map_info.append((mem_s, mem_e, mem_p, mem_info, is_mmio, data))
97+
self.map_info.sort(key=lambda tp: tp[0])
9698

9799
def del_mapinfo(self, mem_s: int, mem_e: int):
98-
"""Subtract a memory range from map.
100+
"""Subtract a memory range from map, will destroy data and unmap uc mem in the range.
99101
100102
Args:
101103
mem_s: memory range start
@@ -104,30 +106,37 @@ def del_mapinfo(self, mem_s: int, mem_e: int):
104106

105107
tmp_map_info: MutableSequence[MapInfoEntry] = []
106108

107-
for s, e, p, info, mmio in self.map_info:
109+
for s, e, p, info, mmio, data in self.map_info:
108110
if e <= mem_s:
109-
tmp_map_info.append((s, e, p, info, mmio))
111+
tmp_map_info.append((s, e, p, info, mmio, data))
110112
continue
111113

112114
if s >= mem_e:
113-
tmp_map_info.append((s, e, p, info, mmio))
115+
tmp_map_info.append((s, e, p, info, mmio, data))
114116
continue
115117

118+
del self.cmap[s] # remove cdata reference starting at s
116119
if s < mem_s:
117-
tmp_map_info.append((s, mem_s, p, info, mmio))
120+
self.ql.uc.mem_unmap(s, mem_s - s)
121+
self.map_ptr(s, mem_s - s, p, data[:mem_s - s])
122+
tmp_map_info.append((s, mem_s, p, info, mmio, data[:mem_s - s]))
118123

119124
if s == mem_s:
120125
pass
121126

122127
if e > mem_e:
123-
tmp_map_info.append((mem_e, e, p, info, mmio))
128+
self.ql.uc.mem_unmap(mem_e, e - mem_e)
129+
self.map_ptr(mem_e, e - mem_e, p, data[mem_e - e:])
130+
tmp_map_info.append((mem_e, e, p, info, mmio, data[mem_e - e:]))
124131

125132
if e == mem_e:
126133
pass
127134

135+
del data[mem_s - s:mem_e - s]
136+
128137
self.map_info = tmp_map_info
129138

130-
def change_mapinfo(self, mem_s: int, mem_e: int, mem_p: Optional[int] = None, mem_info: Optional[str] = None):
139+
def change_mapinfo(self, mem_s: int, mem_e: int, mem_p: Optional[int] = None, mem_info: Optional[str] = None, data: Optional[bytearray] = None):
131140
tmp_map_info: Optional[MapInfoEntry] = None
132141
info_idx: int = None
133142

@@ -142,12 +151,15 @@ def change_mapinfo(self, mem_s: int, mem_e: int, mem_p: Optional[int] = None, me
142151
return
143152

144153
if mem_p is not None:
145-
self.del_mapinfo(mem_s, mem_e)
146-
self.add_mapinfo(mem_s, mem_e, mem_p, mem_info if mem_info else tmp_map_info[3])
154+
data = data or self.read(mem_s, mem_e - mem_s).copy()
155+
assert(len(data) == mem_e - mem_s)
156+
self.unmap(mem_s, mem_e - mem_s)
157+
self.map_ptr(mem_s, mem_e - mem_s, mem_p, data)
158+
self.add_mapinfo(mem_s, mem_e, mem_p, mem_info or tmp_map_info[3], tmp_map_info[4], data)
147159
return
148160

149161
if mem_info is not None:
150-
self.map_info[info_idx] = (tmp_map_info[0], tmp_map_info[1], tmp_map_info[2], mem_info, tmp_map_info[4])
162+
self.map_info[info_idx] = (tmp_map_info[0], tmp_map_info[1], tmp_map_info[2], mem_info, tmp_map_info[4], tmp_map_info[5])
151163

152164
def get_mapinfo(self) -> Sequence[Tuple[int, int, str, str, str]]:
153165
"""Get memory map info.
@@ -166,7 +178,7 @@ def __perms_mapping(ps: int) -> str:
166178

167179
return ''.join(val if idx & ps else '-' for idx, val in perms_d.items())
168180

169-
def __process(lbound: int, ubound: int, perms: int, label: str, is_mmio: bool) -> Tuple[int, int, str, str, str]:
181+
def __process(lbound: int, ubound: int, perms: int, label: str, is_mmio: bool, _data: bytearray) -> Tuple[int, int, str, str, str]:
170182
perms_str = __perms_mapping(perms)
171183

172184
if hasattr(self.ql, 'loader'):
@@ -211,7 +223,7 @@ def get_lib_base(self, filename: str) -> Optional[int]:
211223

212224
# some info labels may be prefixed by boxed label which breaks the search by basename.
213225
# iterate through all info labels and remove all boxed prefixes, if any
214-
stripped = ((lbound, p.sub('', info)) for lbound, _, _, info, _ in self.map_info)
226+
stripped = ((lbound, p.sub('', info)) for lbound, _, _, info, _, _ in self.map_info)
215227

216228
return next((lbound for lbound, info in stripped if os.path.basename(info) == filename), None)
217229

@@ -268,12 +280,11 @@ def save(self):
268280
"mmio" : []
269281
}
270282

271-
for lbound, ubound, perm, label, is_mmio in self.map_info:
283+
for lbound, ubound, perm, label, is_mmio, data in self.map_info:
272284
if is_mmio:
273285
mem_dict['mmio'].append((lbound, ubound, perm, label, *self.mmio_cbs[(lbound, ubound)]))
274286
else:
275-
data = self.read(lbound, ubound - lbound)
276-
mem_dict['ram'].append((lbound, ubound, perm, label, bytes(data)))
287+
mem_dict['ram'].append((lbound, ubound, perm, label, data))
277288

278289
return mem_dict
279290

@@ -287,10 +298,10 @@ def restore(self, mem_dict):
287298
size = ubound - lbound
288299
if self.is_available(lbound, size):
289300
self.ql.log.debug(f'mapping {lbound:#08x} {ubound:#08x}, mapsize = {size:#x}')
290-
self.map(lbound, size, perms, label)
301+
self.map(lbound, size, perms, label, data)
291302

292303
self.ql.log.debug(f'writing {len(data):#x} bytes at {lbound:#08x}')
293-
self.write(lbound, data)
304+
self.write(lbound, bytes(data))
294305

295306
for lbound, ubound, perms, label, read_cb, write_cb in mem_dict['mmio']:
296307
self.ql.log.debug(f"restoring mmio range: {lbound:#08x} {ubound:#08x} {label}")
@@ -393,7 +404,7 @@ def search(self, needle: Union[bytes, Pattern[bytes]], begin: Optional[int] = No
393404
assert begin < end, 'search arguments do not make sense'
394405

395406
# narrow the search down to relevant ranges; mmio ranges are excluded due to potential read size effects
396-
ranges = [(max(begin, lbound), min(ubound, end)) for lbound, ubound, _, _, is_mmio in self.map_info if not (end < lbound or ubound < begin or is_mmio)]
407+
ranges = [(max(begin, lbound), min(ubound, end)) for lbound, ubound, _, _, is_mmio, _data in self.map_info if not (end < lbound or ubound < begin or is_mmio)]
397408
results = []
398409

399410
# if needle is a bytes sequence use it verbatim, not as a pattern
@@ -439,10 +450,10 @@ def __mapped_regions(self) -> Iterator[Tuple[int, int]]:
439450

440451
iter_memmap = iter(self.map_info)
441452

442-
p_lbound, p_ubound, _, _, _ = next(iter_memmap)
453+
p_lbound, p_ubound, _, _, _, _ = next(iter_memmap)
443454

444455
# map_info is assumed to contain non-overlapping regions sorted by lbound
445-
for lbound, ubound, _, _, _ in iter_memmap:
456+
for lbound, ubound, _, _, _, _ in iter_memmap:
446457
if lbound == p_ubound:
447458
p_ubound = ubound
448459
else:
@@ -514,8 +525,8 @@ def find_free_space(self, size: int, minaddr: Optional[int] = None, maxaddr: Opt
514525
assert minaddr < maxaddr
515526

516527
# get gap ranges between mapped ones and memory bounds
517-
gaps_ubounds = tuple(lbound for lbound, _, _, _, _ in self.map_info) + (mem_ubound,)
518-
gaps_lbounds = (mem_lbound,) + tuple(ubound for _, ubound, _, _, _ in self.map_info)
528+
gaps_ubounds = tuple(lbound for lbound, _, _, _, _, _ in self.map_info) + (mem_ubound,)
529+
gaps_lbounds = (mem_lbound,) + tuple(ubound for _, ubound, _, _, _, _ in self.map_info)
519530
gaps = zip(gaps_lbounds, gaps_ubounds)
520531

521532
for lbound, ubound in gaps:
@@ -563,7 +574,7 @@ def protect(self, addr: int, size: int, perms):
563574
self.change_mapinfo(aligned_address, aligned_address + aligned_size, mem_p = perms)
564575

565576

566-
def map(self, addr: int, size: int, perms: int = UC_PROT_ALL, info: Optional[str] = None):
577+
def map(self, addr: int, size: int, perms: int = UC_PROT_ALL, info: Optional[str] = None, ptr: Optional[bytearray] = None):
567578
"""Map a new memory range.
568579
569580
Args:
@@ -580,10 +591,31 @@ def map(self, addr: int, size: int, perms: int = UC_PROT_ALL, info: Optional[str
580591
assert perms & ~UC_PROT_ALL == 0, f'unexpected permissions mask {perms}'
581592

582593
if not self.is_available(addr, size):
583-
raise QlMemoryMappedError('Requested memory is unavailable')
594+
for line in self.get_formatted_mapinfo():
595+
print(line)
596+
raise QlMemoryMappedError(f'Requested memory {addr:#x} + {size:#x} is unavailable')
584597

585-
self.ql.uc.mem_map(addr, size, perms)
586-
self.add_mapinfo(addr, addr + size, perms, info or '[mapped]', is_mmio=False)
598+
buf = self.map_ptr(addr, size, perms, ptr)
599+
self.add_mapinfo(addr, addr + size, perms, info or '[mapped]', is_mmio=False, data=buf)
600+
601+
def map_ptr(self, addr: int, size: int, perms: int = UC_PROT_ALL, buf: Optional[bytearray] = None) -> bytearray:
602+
"""Map a new memory range allocated as Python bytearray, will not affect map_info
603+
604+
Args:
605+
addr: memory range base address
606+
size: memory range size (in bytes)
607+
perms: requested permissions mask
608+
buf: bytearray already allocated (if any)
609+
610+
Returns:
611+
bytearray with size, should be added to map_info by caller
612+
"""
613+
buf = buf or bytearray(size)
614+
buf_type = ctypes.c_byte * size
615+
cdata = buf_type.from_buffer(buf)
616+
self.cmap[addr] = cdata
617+
self.ql.uc.mem_map_ptr(addr, size, perms, cdata)
618+
return buf
587619

588620
def map_mmio(self, addr: int, size: int, read_cb: Optional[MmioReadCallback], write_cb: Optional[MmioWriteCallback], info: str = '[mmio]'):
589621
# TODO: mmio memory overlap with ram? Is that possible?

0 commit comments

Comments
 (0)