]>
Commit | Line | Data |
---|---|---|
28fbf8f6 JF |
1 | """ |
2 | This python script adds a new gdb command, "dump-guest-memory". It | |
3 | should be loaded with "source dump-guest-memory.py" at the (gdb) | |
4 | prompt. | |
5 | ||
6 | Copyright (C) 2013, Red Hat, Inc. | |
7 | ||
8 | Authors: | |
9 | Laszlo Ersek <[email protected]> | |
10 | Janosch Frank <[email protected]> | |
11 | ||
12 | This work is licensed under the terms of the GNU GPL, version 2 or later. See | |
13 | the COPYING file in the top-level directory. | |
14 | """ | |
f03868bd | 15 | from __future__ import print_function |
3e16d14f | 16 | |
368e3adc | 17 | import ctypes |
d23bfa91 | 18 | import struct |
3e16d14f | 19 | |
4b17bc93 AJ |
20 | try: |
21 | UINTPTR_T = gdb.lookup_type("uintptr_t") | |
22 | except Exception as inst: | |
23 | raise gdb.GdbError("Symbols must be loaded prior to sourcing dump-guest-memory.\n" | |
24 | "Symbols may be loaded by 'attach'ing a QEMU process id or by " | |
25 | "'load'ing a QEMU binary.") | |
47890203 | 26 | |
ca81ce72 JF |
27 | TARGET_PAGE_SIZE = 0x1000 |
28 | TARGET_PAGE_MASK = 0xFFFFFFFFFFFFF000 | |
29 | ||
ca81ce72 JF |
30 | # Special value for e_phnum. This indicates that the real number of |
31 | # program headers is too large to fit into e_phnum. Instead the real | |
32 | # value is in the field sh_info of section 0. | |
33 | PN_XNUM = 0xFFFF | |
34 | ||
368e3adc JF |
35 | EV_CURRENT = 1 |
36 | ||
37 | ELFCLASS32 = 1 | |
38 | ELFCLASS64 = 2 | |
39 | ||
40 | ELFDATA2LSB = 1 | |
41 | ELFDATA2MSB = 2 | |
42 | ||
43 | ET_CORE = 4 | |
44 | ||
45 | PT_LOAD = 1 | |
46 | PT_NOTE = 4 | |
47 | ||
48 | EM_386 = 3 | |
49 | EM_PPC = 20 | |
50 | EM_PPC64 = 21 | |
51 | EM_S390 = 22 | |
52 | EM_AARCH = 183 | |
53 | EM_X86_64 = 62 | |
54 | ||
d23bfa91 MAL |
55 | VMCOREINFO_FORMAT_ELF = 1 |
56 | ||
57 | def le16_to_cpu(val): | |
58 | return struct.unpack("<H", struct.pack("=H", val))[0] | |
59 | ||
60 | def le32_to_cpu(val): | |
61 | return struct.unpack("<I", struct.pack("=I", val))[0] | |
62 | ||
63 | def le64_to_cpu(val): | |
64 | return struct.unpack("<Q", struct.pack("=Q", val))[0] | |
65 | ||
368e3adc JF |
66 | class ELF(object): |
67 | """Representation of a ELF file.""" | |
68 | ||
69 | def __init__(self, arch): | |
70 | self.ehdr = None | |
71 | self.notes = [] | |
72 | self.segments = [] | |
73 | self.notes_size = 0 | |
1d817db3 | 74 | self.endianness = None |
368e3adc JF |
75 | self.elfclass = ELFCLASS64 |
76 | ||
77 | if arch == 'aarch64-le': | |
1d817db3 | 78 | self.endianness = ELFDATA2LSB |
368e3adc | 79 | self.elfclass = ELFCLASS64 |
1d817db3 | 80 | self.ehdr = get_arch_ehdr(self.endianness, self.elfclass) |
368e3adc JF |
81 | self.ehdr.e_machine = EM_AARCH |
82 | ||
83 | elif arch == 'aarch64-be': | |
1d817db3 SW |
84 | self.endianness = ELFDATA2MSB |
85 | self.ehdr = get_arch_ehdr(self.endianness, self.elfclass) | |
368e3adc JF |
86 | self.ehdr.e_machine = EM_AARCH |
87 | ||
88 | elif arch == 'X86_64': | |
1d817db3 SW |
89 | self.endianness = ELFDATA2LSB |
90 | self.ehdr = get_arch_ehdr(self.endianness, self.elfclass) | |
368e3adc JF |
91 | self.ehdr.e_machine = EM_X86_64 |
92 | ||
93 | elif arch == '386': | |
1d817db3 | 94 | self.endianness = ELFDATA2LSB |
368e3adc | 95 | self.elfclass = ELFCLASS32 |
1d817db3 | 96 | self.ehdr = get_arch_ehdr(self.endianness, self.elfclass) |
368e3adc JF |
97 | self.ehdr.e_machine = EM_386 |
98 | ||
99 | elif arch == 's390': | |
1d817db3 SW |
100 | self.endianness = ELFDATA2MSB |
101 | self.ehdr = get_arch_ehdr(self.endianness, self.elfclass) | |
368e3adc JF |
102 | self.ehdr.e_machine = EM_S390 |
103 | ||
104 | elif arch == 'ppc64-le': | |
1d817db3 SW |
105 | self.endianness = ELFDATA2LSB |
106 | self.ehdr = get_arch_ehdr(self.endianness, self.elfclass) | |
368e3adc JF |
107 | self.ehdr.e_machine = EM_PPC64 |
108 | ||
109 | elif arch == 'ppc64-be': | |
1d817db3 SW |
110 | self.endianness = ELFDATA2MSB |
111 | self.ehdr = get_arch_ehdr(self.endianness, self.elfclass) | |
368e3adc JF |
112 | self.ehdr.e_machine = EM_PPC64 |
113 | ||
114 | else: | |
115 | raise gdb.GdbError("No valid arch type specified.\n" | |
116 | "Currently supported types:\n" | |
117 | "aarch64-be, aarch64-le, X86_64, 386, s390, " | |
118 | "ppc64-be, ppc64-le") | |
119 | ||
120 | self.add_segment(PT_NOTE, 0, 0) | |
121 | ||
122 | def add_note(self, n_name, n_desc, n_type): | |
123 | """Adds a note to the ELF.""" | |
124 | ||
1d817db3 | 125 | note = get_arch_note(self.endianness, len(n_name), len(n_desc)) |
368e3adc JF |
126 | note.n_namesz = len(n_name) + 1 |
127 | note.n_descsz = len(n_desc) | |
128 | note.n_name = n_name.encode() | |
129 | note.n_type = n_type | |
130 | ||
131 | # Desc needs to be 4 byte aligned (although the 64bit spec | |
132 | # specifies 8 byte). When defining n_desc as uint32 it will be | |
133 | # automatically aligned but we need the memmove to copy the | |
134 | # string into it. | |
135 | ctypes.memmove(note.n_desc, n_desc.encode(), len(n_desc)) | |
136 | ||
137 | self.notes.append(note) | |
138 | self.segments[0].p_filesz += ctypes.sizeof(note) | |
139 | self.segments[0].p_memsz += ctypes.sizeof(note) | |
140 | ||
d23bfa91 MAL |
141 | |
142 | def add_vmcoreinfo_note(self, vmcoreinfo): | |
143 | """Adds a vmcoreinfo note to the ELF dump.""" | |
144 | # compute the header size, and copy that many bytes from the note | |
145 | header = get_arch_note(self.endianness, 0, 0) | |
146 | ctypes.memmove(ctypes.pointer(header), | |
147 | vmcoreinfo, ctypes.sizeof(header)) | |
148 | if header.n_descsz > 1 << 20: | |
149 | print('warning: invalid vmcoreinfo size') | |
150 | return | |
151 | # now get the full note | |
152 | note = get_arch_note(self.endianness, | |
153 | header.n_namesz - 1, header.n_descsz) | |
154 | ctypes.memmove(ctypes.pointer(note), vmcoreinfo, ctypes.sizeof(note)) | |
155 | ||
156 | self.notes.append(note) | |
157 | self.segments[0].p_filesz += ctypes.sizeof(note) | |
158 | self.segments[0].p_memsz += ctypes.sizeof(note) | |
159 | ||
368e3adc JF |
160 | def add_segment(self, p_type, p_paddr, p_size): |
161 | """Adds a segment to the elf.""" | |
162 | ||
1d817db3 | 163 | phdr = get_arch_phdr(self.endianness, self.elfclass) |
368e3adc JF |
164 | phdr.p_type = p_type |
165 | phdr.p_paddr = p_paddr | |
166 | phdr.p_filesz = p_size | |
167 | phdr.p_memsz = p_size | |
168 | self.segments.append(phdr) | |
169 | self.ehdr.e_phnum += 1 | |
170 | ||
171 | def to_file(self, elf_file): | |
172 | """Writes all ELF structures to the the passed file. | |
173 | ||
174 | Structure: | |
175 | Ehdr | |
176 | Segment 0:PT_NOTE | |
177 | Segment 1:PT_LOAD | |
178 | Segment N:PT_LOAD | |
179 | Note 0..N | |
180 | Dump contents | |
181 | """ | |
182 | elf_file.write(self.ehdr) | |
183 | off = ctypes.sizeof(self.ehdr) + \ | |
184 | len(self.segments) * ctypes.sizeof(self.segments[0]) | |
185 | ||
186 | for phdr in self.segments: | |
187 | phdr.p_offset = off | |
188 | elf_file.write(phdr) | |
189 | off += phdr.p_filesz | |
190 | ||
191 | for note in self.notes: | |
192 | elf_file.write(note) | |
193 | ||
194 | ||
1d817db3 SW |
195 | def get_arch_note(endianness, len_name, len_desc): |
196 | """Returns a Note class with the specified endianness.""" | |
368e3adc | 197 | |
1d817db3 | 198 | if endianness == ELFDATA2LSB: |
368e3adc JF |
199 | superclass = ctypes.LittleEndianStructure |
200 | else: | |
201 | superclass = ctypes.BigEndianStructure | |
202 | ||
203 | len_name = len_name + 1 | |
204 | ||
205 | class Note(superclass): | |
206 | """Represents an ELF note, includes the content.""" | |
207 | ||
208 | _fields_ = [("n_namesz", ctypes.c_uint32), | |
209 | ("n_descsz", ctypes.c_uint32), | |
210 | ("n_type", ctypes.c_uint32), | |
211 | ("n_name", ctypes.c_char * len_name), | |
212 | ("n_desc", ctypes.c_uint32 * ((len_desc + 3) // 4))] | |
213 | return Note() | |
214 | ||
215 | ||
216 | class Ident(ctypes.Structure): | |
217 | """Represents the ELF ident array in the ehdr structure.""" | |
218 | ||
219 | _fields_ = [('ei_mag0', ctypes.c_ubyte), | |
220 | ('ei_mag1', ctypes.c_ubyte), | |
221 | ('ei_mag2', ctypes.c_ubyte), | |
222 | ('ei_mag3', ctypes.c_ubyte), | |
223 | ('ei_class', ctypes.c_ubyte), | |
224 | ('ei_data', ctypes.c_ubyte), | |
225 | ('ei_version', ctypes.c_ubyte), | |
226 | ('ei_osabi', ctypes.c_ubyte), | |
227 | ('ei_abiversion', ctypes.c_ubyte), | |
228 | ('ei_pad', ctypes.c_ubyte * 7)] | |
229 | ||
1d817db3 | 230 | def __init__(self, endianness, elfclass): |
368e3adc JF |
231 | self.ei_mag0 = 0x7F |
232 | self.ei_mag1 = ord('E') | |
233 | self.ei_mag2 = ord('L') | |
234 | self.ei_mag3 = ord('F') | |
235 | self.ei_class = elfclass | |
1d817db3 | 236 | self.ei_data = endianness |
368e3adc JF |
237 | self.ei_version = EV_CURRENT |
238 | ||
239 | ||
1d817db3 SW |
240 | def get_arch_ehdr(endianness, elfclass): |
241 | """Returns a EHDR64 class with the specified endianness.""" | |
368e3adc | 242 | |
1d817db3 | 243 | if endianness == ELFDATA2LSB: |
368e3adc JF |
244 | superclass = ctypes.LittleEndianStructure |
245 | else: | |
246 | superclass = ctypes.BigEndianStructure | |
247 | ||
248 | class EHDR64(superclass): | |
249 | """Represents the 64 bit ELF header struct.""" | |
250 | ||
251 | _fields_ = [('e_ident', Ident), | |
252 | ('e_type', ctypes.c_uint16), | |
253 | ('e_machine', ctypes.c_uint16), | |
254 | ('e_version', ctypes.c_uint32), | |
255 | ('e_entry', ctypes.c_uint64), | |
256 | ('e_phoff', ctypes.c_uint64), | |
257 | ('e_shoff', ctypes.c_uint64), | |
258 | ('e_flags', ctypes.c_uint32), | |
259 | ('e_ehsize', ctypes.c_uint16), | |
260 | ('e_phentsize', ctypes.c_uint16), | |
261 | ('e_phnum', ctypes.c_uint16), | |
262 | ('e_shentsize', ctypes.c_uint16), | |
263 | ('e_shnum', ctypes.c_uint16), | |
264 | ('e_shstrndx', ctypes.c_uint16)] | |
265 | ||
266 | def __init__(self): | |
267 | super(superclass, self).__init__() | |
1d817db3 | 268 | self.e_ident = Ident(endianness, elfclass) |
368e3adc JF |
269 | self.e_type = ET_CORE |
270 | self.e_version = EV_CURRENT | |
271 | self.e_ehsize = ctypes.sizeof(self) | |
272 | self.e_phoff = ctypes.sizeof(self) | |
1d817db3 | 273 | self.e_phentsize = ctypes.sizeof(get_arch_phdr(endianness, elfclass)) |
368e3adc JF |
274 | self.e_phnum = 0 |
275 | ||
276 | ||
277 | class EHDR32(superclass): | |
278 | """Represents the 32 bit ELF header struct.""" | |
279 | ||
280 | _fields_ = [('e_ident', Ident), | |
281 | ('e_type', ctypes.c_uint16), | |
282 | ('e_machine', ctypes.c_uint16), | |
283 | ('e_version', ctypes.c_uint32), | |
284 | ('e_entry', ctypes.c_uint32), | |
285 | ('e_phoff', ctypes.c_uint32), | |
286 | ('e_shoff', ctypes.c_uint32), | |
287 | ('e_flags', ctypes.c_uint32), | |
288 | ('e_ehsize', ctypes.c_uint16), | |
289 | ('e_phentsize', ctypes.c_uint16), | |
290 | ('e_phnum', ctypes.c_uint16), | |
291 | ('e_shentsize', ctypes.c_uint16), | |
292 | ('e_shnum', ctypes.c_uint16), | |
293 | ('e_shstrndx', ctypes.c_uint16)] | |
294 | ||
295 | def __init__(self): | |
296 | super(superclass, self).__init__() | |
1d817db3 | 297 | self.e_ident = Ident(endianness, elfclass) |
368e3adc JF |
298 | self.e_type = ET_CORE |
299 | self.e_version = EV_CURRENT | |
300 | self.e_ehsize = ctypes.sizeof(self) | |
301 | self.e_phoff = ctypes.sizeof(self) | |
1d817db3 | 302 | self.e_phentsize = ctypes.sizeof(get_arch_phdr(endianness, elfclass)) |
368e3adc JF |
303 | self.e_phnum = 0 |
304 | ||
305 | # End get_arch_ehdr | |
306 | if elfclass == ELFCLASS64: | |
307 | return EHDR64() | |
308 | else: | |
309 | return EHDR32() | |
310 | ||
311 | ||
1d817db3 SW |
312 | def get_arch_phdr(endianness, elfclass): |
313 | """Returns a 32 or 64 bit PHDR class with the specified endianness.""" | |
368e3adc | 314 | |
1d817db3 | 315 | if endianness == ELFDATA2LSB: |
368e3adc JF |
316 | superclass = ctypes.LittleEndianStructure |
317 | else: | |
318 | superclass = ctypes.BigEndianStructure | |
319 | ||
320 | class PHDR64(superclass): | |
321 | """Represents the 64 bit ELF program header struct.""" | |
322 | ||
323 | _fields_ = [('p_type', ctypes.c_uint32), | |
324 | ('p_flags', ctypes.c_uint32), | |
325 | ('p_offset', ctypes.c_uint64), | |
326 | ('p_vaddr', ctypes.c_uint64), | |
327 | ('p_paddr', ctypes.c_uint64), | |
328 | ('p_filesz', ctypes.c_uint64), | |
329 | ('p_memsz', ctypes.c_uint64), | |
330 | ('p_align', ctypes.c_uint64)] | |
331 | ||
332 | class PHDR32(superclass): | |
333 | """Represents the 32 bit ELF program header struct.""" | |
334 | ||
335 | _fields_ = [('p_type', ctypes.c_uint32), | |
336 | ('p_offset', ctypes.c_uint32), | |
337 | ('p_vaddr', ctypes.c_uint32), | |
338 | ('p_paddr', ctypes.c_uint32), | |
339 | ('p_filesz', ctypes.c_uint32), | |
340 | ('p_memsz', ctypes.c_uint32), | |
341 | ('p_flags', ctypes.c_uint32), | |
342 | ('p_align', ctypes.c_uint32)] | |
343 | ||
344 | # End get_arch_phdr | |
345 | if elfclass == ELFCLASS64: | |
346 | return PHDR64() | |
347 | else: | |
348 | return PHDR32() | |
349 | ||
ca81ce72 | 350 | |
47890203 | 351 | def int128_get64(val): |
6782c0e7 JF |
352 | """Returns low 64bit part of Int128 struct.""" |
353 | ||
9b4b157e MAL |
354 | try: |
355 | assert val["hi"] == 0 | |
356 | return val["lo"] | |
357 | except gdb.error: | |
358 | u64t = gdb.lookup_type('uint64_t').array(2) | |
359 | u64 = val.cast(u64t) | |
360 | if sys.byteorder == 'little': | |
361 | assert u64[1] == 0 | |
362 | return u64[0] | |
363 | else: | |
364 | assert u64[0] == 0 | |
365 | return u64[1] | |
47890203 | 366 | |
6782c0e7 | 367 | |
47890203 | 368 | def qlist_foreach(head, field_str): |
6782c0e7 JF |
369 | """Generator for qlists.""" |
370 | ||
47890203 | 371 | var_p = head["lh_first"] |
6782c0e7 | 372 | while var_p != 0: |
47890203 | 373 | var = var_p.dereference() |
47890203 | 374 | var_p = var[field_str]["le_next"] |
6782c0e7 JF |
375 | yield var |
376 | ||
47890203 | 377 | |
0878d0e1 | 378 | def qemu_map_ram_ptr(block, offset): |
6782c0e7 JF |
379 | """Returns qemu vaddr for given guest physical address.""" |
380 | ||
0878d0e1 | 381 | return block["host"] + offset |
47890203 | 382 | |
6782c0e7 JF |
383 | |
384 | def memory_region_get_ram_ptr(memory_region): | |
385 | if memory_region["alias"] != 0: | |
386 | return (memory_region_get_ram_ptr(memory_region["alias"].dereference()) | |
387 | + memory_region["alias_offset"]) | |
388 | ||
0878d0e1 | 389 | return qemu_map_ram_ptr(memory_region["ram_block"], 0) |
6782c0e7 | 390 | |
47890203 JF |
391 | |
392 | def get_guest_phys_blocks(): | |
6782c0e7 JF |
393 | """Returns a list of ram blocks. |
394 | ||
395 | Each block entry contains: | |
396 | 'target_start': guest block phys start address | |
397 | 'target_end': guest block phys end address | |
398 | 'host_addr': qemu vaddr of the block's start | |
399 | """ | |
400 | ||
47890203 | 401 | guest_phys_blocks = [] |
6782c0e7 | 402 | |
7cb1089d JF |
403 | print("guest RAM blocks:") |
404 | print("target_start target_end host_addr message " | |
405 | "count") | |
406 | print("---------------- ---------------- ---------------- ------- " | |
407 | "-----") | |
47890203 JF |
408 | |
409 | current_map_p = gdb.parse_and_eval("address_space_memory.current_map") | |
410 | current_map = current_map_p.dereference() | |
7cb1089d JF |
411 | |
412 | # Conversion to int is needed for python 3 | |
413 | # compatibility. Otherwise range doesn't cast the value itself and | |
414 | # breaks. | |
415 | for cur in range(int(current_map["nr"])): | |
6782c0e7 JF |
416 | flat_range = (current_map["ranges"] + cur).dereference() |
417 | memory_region = flat_range["mr"].dereference() | |
47890203 JF |
418 | |
419 | # we only care about RAM | |
6782c0e7 | 420 | if not memory_region["ram"]: |
47890203 JF |
421 | continue |
422 | ||
423 | section_size = int128_get64(flat_range["addr"]["size"]) | |
424 | target_start = int128_get64(flat_range["addr"]["start"]) | |
6782c0e7 JF |
425 | target_end = target_start + section_size |
426 | host_addr = (memory_region_get_ram_ptr(memory_region) | |
427 | + flat_range["offset_in_region"]) | |
47890203 JF |
428 | predecessor = None |
429 | ||
430 | # find continuity in guest physical address space | |
6782c0e7 | 431 | if len(guest_phys_blocks) > 0: |
47890203 JF |
432 | predecessor = guest_phys_blocks[-1] |
433 | predecessor_size = (predecessor["target_end"] - | |
434 | predecessor["target_start"]) | |
435 | ||
436 | # the memory API guarantees monotonically increasing | |
437 | # traversal | |
6782c0e7 | 438 | assert predecessor["target_end"] <= target_start |
47890203 JF |
439 | |
440 | # we want continuity in both guest-physical and | |
441 | # host-virtual memory | |
442 | if (predecessor["target_end"] < target_start or | |
443 | predecessor["host_addr"] + predecessor_size != host_addr): | |
444 | predecessor = None | |
445 | ||
6782c0e7 | 446 | if predecessor is None: |
47890203 JF |
447 | # isolated mapping, add it to the list |
448 | guest_phys_blocks.append({"target_start": target_start, | |
6782c0e7 JF |
449 | "target_end": target_end, |
450 | "host_addr": host_addr}) | |
47890203 JF |
451 | message = "added" |
452 | else: | |
453 | # expand predecessor until @target_end; predecessor's | |
454 | # start doesn't change | |
455 | predecessor["target_end"] = target_end | |
456 | message = "joined" | |
457 | ||
7cb1089d JF |
458 | print("%016x %016x %016x %-7s %5u" % |
459 | (target_start, target_end, host_addr.cast(UINTPTR_T), | |
460 | message, len(guest_phys_blocks))) | |
47890203 JF |
461 | |
462 | return guest_phys_blocks | |
463 | ||
464 | ||
28fbf8f6 JF |
465 | # The leading docstring doesn't have idiomatic Python formatting. It is |
466 | # printed by gdb's "help" command (the first line is printed in the | |
467 | # "help data" summary), and it should match how other help texts look in | |
468 | # gdb. | |
3e16d14f LE |
469 | class DumpGuestMemory(gdb.Command): |
470 | """Extract guest vmcore from qemu process coredump. | |
471 | ||
368e3adc JF |
472 | The two required arguments are FILE and ARCH: |
473 | FILE identifies the target file to write the guest vmcore to. | |
474 | ARCH specifies the architecture for which the core will be generated. | |
3e16d14f LE |
475 | |
476 | This GDB command reimplements the dump-guest-memory QMP command in | |
477 | python, using the representation of guest memory as captured in the qemu | |
478 | coredump. The qemu process that has been dumped must have had the | |
368e3adc | 479 | command line option "-machine dump-guest-core=on" which is the default. |
3e16d14f LE |
480 | |
481 | For simplicity, the "paging", "begin" and "end" parameters of the QMP | |
482 | command are not supported -- no attempt is made to get the guest's | |
483 | internal paging structures (ie. paging=false is hard-wired), and guest | |
484 | memory is always fully dumped. | |
485 | ||
368e3adc JF |
486 | Currently aarch64-be, aarch64-le, X86_64, 386, s390, ppc64-be, |
487 | ppc64-le guests are supported. | |
3e16d14f LE |
488 | |
489 | The CORE/NT_PRSTATUS and QEMU notes (that is, the VCPUs' statuses) are | |
490 | not written to the vmcore. Preparing these would require context that is | |
491 | only present in the KVM host kernel module when the guest is alive. A | |
492 | fake ELF note is written instead, only to keep the ELF parser of "crash" | |
493 | happy. | |
494 | ||
495 | Dependent on how busted the qemu process was at the time of the | |
496 | coredump, this command might produce unpredictable results. If qemu | |
497 | deliberately called abort(), or it was dumped in response to a signal at | |
498 | a halfway fortunate point, then its coredump should be in reasonable | |
499 | shape and this command should mostly work.""" | |
500 | ||
3e16d14f LE |
501 | def __init__(self): |
502 | super(DumpGuestMemory, self).__init__("dump-guest-memory", | |
503 | gdb.COMMAND_DATA, | |
504 | gdb.COMPLETE_FILENAME) | |
368e3adc | 505 | self.elf = None |
47890203 | 506 | self.guest_phys_blocks = None |
3e16d14f | 507 | |
368e3adc JF |
508 | def dump_init(self, vmcore): |
509 | """Prepares and writes ELF structures to core file.""" | |
510 | ||
511 | # Needed to make crash happy, data for more useful notes is | |
512 | # not available in a qemu core. | |
513 | self.elf.add_note("NONE", "EMPTY", 0) | |
514 | ||
515 | # We should never reach PN_XNUM for paging=false dumps, | |
516 | # there's just a handful of discontiguous ranges after | |
517 | # merging. | |
518 | # The constant is needed to account for the PT_NOTE segment. | |
519 | phdr_num = len(self.guest_phys_blocks) + 1 | |
520 | assert phdr_num < PN_XNUM | |
521 | ||
3e16d14f | 522 | for block in self.guest_phys_blocks: |
368e3adc JF |
523 | block_size = block["target_end"] - block["target_start"] |
524 | self.elf.add_segment(PT_LOAD, block["target_start"], block_size) | |
525 | ||
526 | self.elf.to_file(vmcore) | |
3e16d14f LE |
527 | |
528 | def dump_iterate(self, vmcore): | |
368e3adc JF |
529 | """Writes guest core to file.""" |
530 | ||
3e16d14f LE |
531 | qemu_core = gdb.inferiors()[0] |
532 | for block in self.guest_phys_blocks: | |
6782c0e7 | 533 | cur = block["host_addr"] |
3e16d14f | 534 | left = block["target_end"] - block["target_start"] |
7cb1089d JF |
535 | print("dumping range at %016x for length %016x" % |
536 | (cur.cast(UINTPTR_T), left)) | |
368e3adc | 537 | |
6782c0e7 | 538 | while left > 0: |
ca81ce72 | 539 | chunk_size = min(TARGET_PAGE_SIZE, left) |
3e16d14f LE |
540 | chunk = qemu_core.read_memory(cur, chunk_size) |
541 | vmcore.write(chunk) | |
6782c0e7 | 542 | cur += chunk_size |
3e16d14f LE |
543 | left -= chunk_size |
544 | ||
d23bfa91 MAL |
545 | def phys_memory_read(self, addr, size): |
546 | qemu_core = gdb.inferiors()[0] | |
547 | for block in self.guest_phys_blocks: | |
548 | if block["target_start"] <= addr \ | |
549 | and addr + size <= block["target_end"]: | |
550 | haddr = block["host_addr"] + (addr - block["target_start"]) | |
551 | return qemu_core.read_memory(haddr, size) | |
552 | return None | |
553 | ||
554 | def add_vmcoreinfo(self): | |
ce6b9e42 MAL |
555 | if gdb.lookup_symbol("vmcoreinfo_realize")[0] is None: |
556 | return | |
c3b1642b | 557 | vmci = 'vmcoreinfo_realize::vmcoreinfo_state' |
d36d0a9d MAL |
558 | if not gdb.parse_and_eval("%s" % vmci) \ |
559 | or not gdb.parse_and_eval("(%s)->has_vmcoreinfo" % vmci): | |
d23bfa91 MAL |
560 | return |
561 | ||
d36d0a9d MAL |
562 | fmt = gdb.parse_and_eval("(%s)->vmcoreinfo.guest_format" % vmci) |
563 | addr = gdb.parse_and_eval("(%s)->vmcoreinfo.paddr" % vmci) | |
564 | size = gdb.parse_and_eval("(%s)->vmcoreinfo.size" % vmci) | |
d23bfa91 MAL |
565 | |
566 | fmt = le16_to_cpu(fmt) | |
567 | addr = le64_to_cpu(addr) | |
568 | size = le32_to_cpu(size) | |
569 | ||
570 | if fmt != VMCOREINFO_FORMAT_ELF: | |
571 | return | |
572 | ||
573 | vmcoreinfo = self.phys_memory_read(addr, size) | |
574 | if vmcoreinfo: | |
6f49ec40 | 575 | self.elf.add_vmcoreinfo_note(bytes(vmcoreinfo)) |
d23bfa91 | 576 | |
3e16d14f | 577 | def invoke(self, args, from_tty): |
368e3adc JF |
578 | """Handles command invocation from gdb.""" |
579 | ||
3e16d14f LE |
580 | # Unwittingly pressing the Enter key after the command should |
581 | # not dump the same multi-gig coredump to the same file. | |
582 | self.dont_repeat() | |
583 | ||
584 | argv = gdb.string_to_argv(args) | |
368e3adc JF |
585 | if len(argv) != 2: |
586 | raise gdb.GdbError("usage: dump-guest-memory FILE ARCH") | |
587 | ||
588 | self.elf = ELF(argv[1]) | |
589 | self.guest_phys_blocks = get_guest_phys_blocks() | |
d23bfa91 | 590 | self.add_vmcoreinfo() |
3e16d14f | 591 | |
368e3adc JF |
592 | with open(argv[0], "wb") as vmcore: |
593 | self.dump_init(vmcore) | |
594 | self.dump_iterate(vmcore) | |
3e16d14f LE |
595 | |
596 | DumpGuestMemory() |