blob: 5a857cebcf64c9e2abcdaedb40e7ace092f22a25 [file] [log] [blame]
Janosch Frank28fbf8f2016-01-22 13:08:40 +01001"""
2This python script adds a new gdb command, "dump-guest-memory". It
3should be loaded with "source dump-guest-memory.py" at the (gdb)
4prompt.
5
6Copyright (C) 2013, Red Hat, Inc.
7
8Authors:
9 Laszlo Ersek <lersek@redhat.com>
10 Janosch Frank <frankja@linux.vnet.ibm.com>
11
12This work is licensed under the terms of the GNU GPL, version 2 or later. See
13the COPYING file in the top-level directory.
14"""
Eduardo Habkostf03868b2018-06-08 09:29:43 -030015from __future__ import print_function
Laszlo Ersek3e16d142013-12-17 01:37:06 +010016
Janosch Frank368e3ad2016-01-22 13:08:39 +010017import ctypes
Marc-André Lureaud23bfa92017-09-11 18:59:28 +020018import struct
Laszlo Ersek3e16d142013-12-17 01:37:06 +010019
Andrew Jones4b17bc92018-03-14 16:38:20 +010020try:
21 UINTPTR_T = gdb.lookup_type("uintptr_t")
22except Exception as inst:
23 raise gdb.GdbError("Symbols must be loaded prior to sourcing dump-guest-memory.\n"
24 "Symbols may be loaded by 'attach'ing a QEMU process id or by "
25 "'load'ing a QEMU binary.")
Janosch Frank47890202016-01-22 13:08:36 +010026
Janosch Frankca81ce72016-01-22 13:08:35 +010027TARGET_PAGE_SIZE = 0x1000
28TARGET_PAGE_MASK = 0xFFFFFFFFFFFFF000
29
Janosch Frankca81ce72016-01-22 13:08:35 +010030# Special value for e_phnum. This indicates that the real number of
31# program headers is too large to fit into e_phnum. Instead the real
32# value is in the field sh_info of section 0.
33PN_XNUM = 0xFFFF
34
Janosch Frank368e3ad2016-01-22 13:08:39 +010035EV_CURRENT = 1
36
37ELFCLASS32 = 1
38ELFCLASS64 = 2
39
40ELFDATA2LSB = 1
41ELFDATA2MSB = 2
42
43ET_CORE = 4
44
45PT_LOAD = 1
46PT_NOTE = 4
47
48EM_386 = 3
49EM_PPC = 20
50EM_PPC64 = 21
51EM_S390 = 22
52EM_AARCH = 183
53EM_X86_64 = 62
54
Marc-André Lureaud23bfa92017-09-11 18:59:28 +020055VMCOREINFO_FORMAT_ELF = 1
56
57def le16_to_cpu(val):
58 return struct.unpack("<H", struct.pack("=H", val))[0]
59
60def le32_to_cpu(val):
61 return struct.unpack("<I", struct.pack("=I", val))[0]
62
63def le64_to_cpu(val):
64 return struct.unpack("<Q", struct.pack("=Q", val))[0]
65
Janosch Frank368e3ad2016-01-22 13:08:39 +010066class ELF(object):
67 """Representation of a ELF file."""
68
69 def __init__(self, arch):
70 self.ehdr = None
71 self.notes = []
72 self.segments = []
73 self.notes_size = 0
Stefan Weil1d817db2016-03-21 19:21:26 +010074 self.endianness = None
Janosch Frank368e3ad2016-01-22 13:08:39 +010075 self.elfclass = ELFCLASS64
76
77 if arch == 'aarch64-le':
Stefan Weil1d817db2016-03-21 19:21:26 +010078 self.endianness = ELFDATA2LSB
Janosch Frank368e3ad2016-01-22 13:08:39 +010079 self.elfclass = ELFCLASS64
Stefan Weil1d817db2016-03-21 19:21:26 +010080 self.ehdr = get_arch_ehdr(self.endianness, self.elfclass)
Janosch Frank368e3ad2016-01-22 13:08:39 +010081 self.ehdr.e_machine = EM_AARCH
82
83 elif arch == 'aarch64-be':
Stefan Weil1d817db2016-03-21 19:21:26 +010084 self.endianness = ELFDATA2MSB
85 self.ehdr = get_arch_ehdr(self.endianness, self.elfclass)
Janosch Frank368e3ad2016-01-22 13:08:39 +010086 self.ehdr.e_machine = EM_AARCH
87
88 elif arch == 'X86_64':
Stefan Weil1d817db2016-03-21 19:21:26 +010089 self.endianness = ELFDATA2LSB
90 self.ehdr = get_arch_ehdr(self.endianness, self.elfclass)
Janosch Frank368e3ad2016-01-22 13:08:39 +010091 self.ehdr.e_machine = EM_X86_64
92
93 elif arch == '386':
Stefan Weil1d817db2016-03-21 19:21:26 +010094 self.endianness = ELFDATA2LSB
Janosch Frank368e3ad2016-01-22 13:08:39 +010095 self.elfclass = ELFCLASS32
Stefan Weil1d817db2016-03-21 19:21:26 +010096 self.ehdr = get_arch_ehdr(self.endianness, self.elfclass)
Janosch Frank368e3ad2016-01-22 13:08:39 +010097 self.ehdr.e_machine = EM_386
98
99 elif arch == 's390':
Stefan Weil1d817db2016-03-21 19:21:26 +0100100 self.endianness = ELFDATA2MSB
101 self.ehdr = get_arch_ehdr(self.endianness, self.elfclass)
Janosch Frank368e3ad2016-01-22 13:08:39 +0100102 self.ehdr.e_machine = EM_S390
103
104 elif arch == 'ppc64-le':
Stefan Weil1d817db2016-03-21 19:21:26 +0100105 self.endianness = ELFDATA2LSB
106 self.ehdr = get_arch_ehdr(self.endianness, self.elfclass)
Janosch Frank368e3ad2016-01-22 13:08:39 +0100107 self.ehdr.e_machine = EM_PPC64
108
109 elif arch == 'ppc64-be':
Stefan Weil1d817db2016-03-21 19:21:26 +0100110 self.endianness = ELFDATA2MSB
111 self.ehdr = get_arch_ehdr(self.endianness, self.elfclass)
Janosch Frank368e3ad2016-01-22 13:08:39 +0100112 self.ehdr.e_machine = EM_PPC64
113
114 else:
115 raise gdb.GdbError("No valid arch type specified.\n"
116 "Currently supported types:\n"
117 "aarch64-be, aarch64-le, X86_64, 386, s390, "
118 "ppc64-be, ppc64-le")
119
120 self.add_segment(PT_NOTE, 0, 0)
121
122 def add_note(self, n_name, n_desc, n_type):
123 """Adds a note to the ELF."""
124
Stefan Weil1d817db2016-03-21 19:21:26 +0100125 note = get_arch_note(self.endianness, len(n_name), len(n_desc))
Janosch Frank368e3ad2016-01-22 13:08:39 +0100126 note.n_namesz = len(n_name) + 1
127 note.n_descsz = len(n_desc)
128 note.n_name = n_name.encode()
129 note.n_type = n_type
130
131 # Desc needs to be 4 byte aligned (although the 64bit spec
132 # specifies 8 byte). When defining n_desc as uint32 it will be
133 # automatically aligned but we need the memmove to copy the
134 # string into it.
135 ctypes.memmove(note.n_desc, n_desc.encode(), len(n_desc))
136
137 self.notes.append(note)
138 self.segments[0].p_filesz += ctypes.sizeof(note)
139 self.segments[0].p_memsz += ctypes.sizeof(note)
140
Marc-André Lureaud23bfa92017-09-11 18:59:28 +0200141
142 def add_vmcoreinfo_note(self, vmcoreinfo):
143 """Adds a vmcoreinfo note to the ELF dump."""
144 # compute the header size, and copy that many bytes from the note
145 header = get_arch_note(self.endianness, 0, 0)
146 ctypes.memmove(ctypes.pointer(header),
147 vmcoreinfo, ctypes.sizeof(header))
148 if header.n_descsz > 1 << 20:
149 print('warning: invalid vmcoreinfo size')
150 return
151 # now get the full note
152 note = get_arch_note(self.endianness,
153 header.n_namesz - 1, header.n_descsz)
154 ctypes.memmove(ctypes.pointer(note), vmcoreinfo, ctypes.sizeof(note))
155
156 self.notes.append(note)
157 self.segments[0].p_filesz += ctypes.sizeof(note)
158 self.segments[0].p_memsz += ctypes.sizeof(note)
159
Janosch Frank368e3ad2016-01-22 13:08:39 +0100160 def add_segment(self, p_type, p_paddr, p_size):
161 """Adds a segment to the elf."""
162
Stefan Weil1d817db2016-03-21 19:21:26 +0100163 phdr = get_arch_phdr(self.endianness, self.elfclass)
Janosch Frank368e3ad2016-01-22 13:08:39 +0100164 phdr.p_type = p_type
165 phdr.p_paddr = p_paddr
166 phdr.p_filesz = p_size
167 phdr.p_memsz = p_size
168 self.segments.append(phdr)
169 self.ehdr.e_phnum += 1
170
171 def to_file(self, elf_file):
172 """Writes all ELF structures to the the passed file.
173
174 Structure:
175 Ehdr
176 Segment 0:PT_NOTE
177 Segment 1:PT_LOAD
178 Segment N:PT_LOAD
179 Note 0..N
180 Dump contents
181 """
182 elf_file.write(self.ehdr)
183 off = ctypes.sizeof(self.ehdr) + \
184 len(self.segments) * ctypes.sizeof(self.segments[0])
185
186 for phdr in self.segments:
187 phdr.p_offset = off
188 elf_file.write(phdr)
189 off += phdr.p_filesz
190
191 for note in self.notes:
192 elf_file.write(note)
193
194
Stefan Weil1d817db2016-03-21 19:21:26 +0100195def get_arch_note(endianness, len_name, len_desc):
196 """Returns a Note class with the specified endianness."""
Janosch Frank368e3ad2016-01-22 13:08:39 +0100197
Stefan Weil1d817db2016-03-21 19:21:26 +0100198 if endianness == ELFDATA2LSB:
Janosch Frank368e3ad2016-01-22 13:08:39 +0100199 superclass = ctypes.LittleEndianStructure
200 else:
201 superclass = ctypes.BigEndianStructure
202
203 len_name = len_name + 1
204
205 class Note(superclass):
206 """Represents an ELF note, includes the content."""
207
208 _fields_ = [("n_namesz", ctypes.c_uint32),
209 ("n_descsz", ctypes.c_uint32),
210 ("n_type", ctypes.c_uint32),
211 ("n_name", ctypes.c_char * len_name),
212 ("n_desc", ctypes.c_uint32 * ((len_desc + 3) // 4))]
213 return Note()
214
215
216class Ident(ctypes.Structure):
217 """Represents the ELF ident array in the ehdr structure."""
218
219 _fields_ = [('ei_mag0', ctypes.c_ubyte),
220 ('ei_mag1', ctypes.c_ubyte),
221 ('ei_mag2', ctypes.c_ubyte),
222 ('ei_mag3', ctypes.c_ubyte),
223 ('ei_class', ctypes.c_ubyte),
224 ('ei_data', ctypes.c_ubyte),
225 ('ei_version', ctypes.c_ubyte),
226 ('ei_osabi', ctypes.c_ubyte),
227 ('ei_abiversion', ctypes.c_ubyte),
228 ('ei_pad', ctypes.c_ubyte * 7)]
229
Stefan Weil1d817db2016-03-21 19:21:26 +0100230 def __init__(self, endianness, elfclass):
Janosch Frank368e3ad2016-01-22 13:08:39 +0100231 self.ei_mag0 = 0x7F
232 self.ei_mag1 = ord('E')
233 self.ei_mag2 = ord('L')
234 self.ei_mag3 = ord('F')
235 self.ei_class = elfclass
Stefan Weil1d817db2016-03-21 19:21:26 +0100236 self.ei_data = endianness
Janosch Frank368e3ad2016-01-22 13:08:39 +0100237 self.ei_version = EV_CURRENT
238
239
Stefan Weil1d817db2016-03-21 19:21:26 +0100240def get_arch_ehdr(endianness, elfclass):
241 """Returns a EHDR64 class with the specified endianness."""
Janosch Frank368e3ad2016-01-22 13:08:39 +0100242
Stefan Weil1d817db2016-03-21 19:21:26 +0100243 if endianness == ELFDATA2LSB:
Janosch Frank368e3ad2016-01-22 13:08:39 +0100244 superclass = ctypes.LittleEndianStructure
245 else:
246 superclass = ctypes.BigEndianStructure
247
248 class EHDR64(superclass):
249 """Represents the 64 bit ELF header struct."""
250
251 _fields_ = [('e_ident', Ident),
252 ('e_type', ctypes.c_uint16),
253 ('e_machine', ctypes.c_uint16),
254 ('e_version', ctypes.c_uint32),
255 ('e_entry', ctypes.c_uint64),
256 ('e_phoff', ctypes.c_uint64),
257 ('e_shoff', ctypes.c_uint64),
258 ('e_flags', ctypes.c_uint32),
259 ('e_ehsize', ctypes.c_uint16),
260 ('e_phentsize', ctypes.c_uint16),
261 ('e_phnum', ctypes.c_uint16),
262 ('e_shentsize', ctypes.c_uint16),
263 ('e_shnum', ctypes.c_uint16),
264 ('e_shstrndx', ctypes.c_uint16)]
265
266 def __init__(self):
267 super(superclass, self).__init__()
Stefan Weil1d817db2016-03-21 19:21:26 +0100268 self.e_ident = Ident(endianness, elfclass)
Janosch Frank368e3ad2016-01-22 13:08:39 +0100269 self.e_type = ET_CORE
270 self.e_version = EV_CURRENT
271 self.e_ehsize = ctypes.sizeof(self)
272 self.e_phoff = ctypes.sizeof(self)
Stefan Weil1d817db2016-03-21 19:21:26 +0100273 self.e_phentsize = ctypes.sizeof(get_arch_phdr(endianness, elfclass))
Janosch Frank368e3ad2016-01-22 13:08:39 +0100274 self.e_phnum = 0
275
276
277 class EHDR32(superclass):
278 """Represents the 32 bit ELF header struct."""
279
280 _fields_ = [('e_ident', Ident),
281 ('e_type', ctypes.c_uint16),
282 ('e_machine', ctypes.c_uint16),
283 ('e_version', ctypes.c_uint32),
284 ('e_entry', ctypes.c_uint32),
285 ('e_phoff', ctypes.c_uint32),
286 ('e_shoff', ctypes.c_uint32),
287 ('e_flags', ctypes.c_uint32),
288 ('e_ehsize', ctypes.c_uint16),
289 ('e_phentsize', ctypes.c_uint16),
290 ('e_phnum', ctypes.c_uint16),
291 ('e_shentsize', ctypes.c_uint16),
292 ('e_shnum', ctypes.c_uint16),
293 ('e_shstrndx', ctypes.c_uint16)]
294
295 def __init__(self):
296 super(superclass, self).__init__()
Stefan Weil1d817db2016-03-21 19:21:26 +0100297 self.e_ident = Ident(endianness, elfclass)
Janosch Frank368e3ad2016-01-22 13:08:39 +0100298 self.e_type = ET_CORE
299 self.e_version = EV_CURRENT
300 self.e_ehsize = ctypes.sizeof(self)
301 self.e_phoff = ctypes.sizeof(self)
Stefan Weil1d817db2016-03-21 19:21:26 +0100302 self.e_phentsize = ctypes.sizeof(get_arch_phdr(endianness, elfclass))
Janosch Frank368e3ad2016-01-22 13:08:39 +0100303 self.e_phnum = 0
304
305 # End get_arch_ehdr
306 if elfclass == ELFCLASS64:
307 return EHDR64()
308 else:
309 return EHDR32()
310
311
Stefan Weil1d817db2016-03-21 19:21:26 +0100312def get_arch_phdr(endianness, elfclass):
313 """Returns a 32 or 64 bit PHDR class with the specified endianness."""
Janosch Frank368e3ad2016-01-22 13:08:39 +0100314
Stefan Weil1d817db2016-03-21 19:21:26 +0100315 if endianness == ELFDATA2LSB:
Janosch Frank368e3ad2016-01-22 13:08:39 +0100316 superclass = ctypes.LittleEndianStructure
317 else:
318 superclass = ctypes.BigEndianStructure
319
320 class PHDR64(superclass):
321 """Represents the 64 bit ELF program header struct."""
322
323 _fields_ = [('p_type', ctypes.c_uint32),
324 ('p_flags', ctypes.c_uint32),
325 ('p_offset', ctypes.c_uint64),
326 ('p_vaddr', ctypes.c_uint64),
327 ('p_paddr', ctypes.c_uint64),
328 ('p_filesz', ctypes.c_uint64),
329 ('p_memsz', ctypes.c_uint64),
330 ('p_align', ctypes.c_uint64)]
331
332 class PHDR32(superclass):
333 """Represents the 32 bit ELF program header struct."""
334
335 _fields_ = [('p_type', ctypes.c_uint32),
336 ('p_offset', ctypes.c_uint32),
337 ('p_vaddr', ctypes.c_uint32),
338 ('p_paddr', ctypes.c_uint32),
339 ('p_filesz', ctypes.c_uint32),
340 ('p_memsz', ctypes.c_uint32),
341 ('p_flags', ctypes.c_uint32),
342 ('p_align', ctypes.c_uint32)]
343
344 # End get_arch_phdr
345 if elfclass == ELFCLASS64:
346 return PHDR64()
347 else:
348 return PHDR32()
349
Janosch Frankca81ce72016-01-22 13:08:35 +0100350
Janosch Frank47890202016-01-22 13:08:36 +0100351def int128_get64(val):
Janosch Frank6782c0e2016-01-22 13:08:38 +0100352 """Returns low 64bit part of Int128 struct."""
353
Marc-André Lureau9b4b1572017-03-10 15:28:19 +0400354 try:
355 assert val["hi"] == 0
356 return val["lo"]
357 except gdb.error:
358 u64t = gdb.lookup_type('uint64_t').array(2)
359 u64 = val.cast(u64t)
360 if sys.byteorder == 'little':
361 assert u64[1] == 0
362 return u64[0]
363 else:
364 assert u64[0] == 0
365 return u64[1]
Janosch Frank47890202016-01-22 13:08:36 +0100366
Janosch Frank6782c0e2016-01-22 13:08:38 +0100367
Janosch Frank47890202016-01-22 13:08:36 +0100368def qlist_foreach(head, field_str):
Janosch Frank6782c0e2016-01-22 13:08:38 +0100369 """Generator for qlists."""
370
Janosch Frank47890202016-01-22 13:08:36 +0100371 var_p = head["lh_first"]
Janosch Frank6782c0e2016-01-22 13:08:38 +0100372 while var_p != 0:
Janosch Frank47890202016-01-22 13:08:36 +0100373 var = var_p.dereference()
Janosch Frank47890202016-01-22 13:08:36 +0100374 var_p = var[field_str]["le_next"]
Janosch Frank6782c0e2016-01-22 13:08:38 +0100375 yield var
376
Janosch Frank47890202016-01-22 13:08:36 +0100377
Paolo Bonzini0878d0e2016-02-22 11:02:12 +0100378def qemu_map_ram_ptr(block, offset):
Janosch Frank6782c0e2016-01-22 13:08:38 +0100379 """Returns qemu vaddr for given guest physical address."""
380
Paolo Bonzini0878d0e2016-02-22 11:02:12 +0100381 return block["host"] + offset
Janosch Frank47890202016-01-22 13:08:36 +0100382
Janosch Frank6782c0e2016-01-22 13:08:38 +0100383
384def memory_region_get_ram_ptr(memory_region):
385 if memory_region["alias"] != 0:
386 return (memory_region_get_ram_ptr(memory_region["alias"].dereference())
387 + memory_region["alias_offset"])
388
Paolo Bonzini0878d0e2016-02-22 11:02:12 +0100389 return qemu_map_ram_ptr(memory_region["ram_block"], 0)
Janosch Frank6782c0e2016-01-22 13:08:38 +0100390
Janosch Frank47890202016-01-22 13:08:36 +0100391
392def get_guest_phys_blocks():
Janosch Frank6782c0e2016-01-22 13:08:38 +0100393 """Returns a list of ram blocks.
394
395 Each block entry contains:
396 'target_start': guest block phys start address
397 'target_end': guest block phys end address
398 'host_addr': qemu vaddr of the block's start
399 """
400
Janosch Frank47890202016-01-22 13:08:36 +0100401 guest_phys_blocks = []
Janosch Frank6782c0e2016-01-22 13:08:38 +0100402
Janosch Frank7cb10892016-01-22 13:08:37 +0100403 print("guest RAM blocks:")
404 print("target_start target_end host_addr message "
405 "count")
406 print("---------------- ---------------- ---------------- ------- "
407 "-----")
Janosch Frank47890202016-01-22 13:08:36 +0100408
409 current_map_p = gdb.parse_and_eval("address_space_memory.current_map")
410 current_map = current_map_p.dereference()
Janosch Frank7cb10892016-01-22 13:08:37 +0100411
412 # Conversion to int is needed for python 3
413 # compatibility. Otherwise range doesn't cast the value itself and
414 # breaks.
415 for cur in range(int(current_map["nr"])):
Janosch Frank6782c0e2016-01-22 13:08:38 +0100416 flat_range = (current_map["ranges"] + cur).dereference()
417 memory_region = flat_range["mr"].dereference()
Janosch Frank47890202016-01-22 13:08:36 +0100418
419 # we only care about RAM
Janosch Frank6782c0e2016-01-22 13:08:38 +0100420 if not memory_region["ram"]:
Janosch Frank47890202016-01-22 13:08:36 +0100421 continue
422
423 section_size = int128_get64(flat_range["addr"]["size"])
424 target_start = int128_get64(flat_range["addr"]["start"])
Janosch Frank6782c0e2016-01-22 13:08:38 +0100425 target_end = target_start + section_size
426 host_addr = (memory_region_get_ram_ptr(memory_region)
427 + flat_range["offset_in_region"])
Janosch Frank47890202016-01-22 13:08:36 +0100428 predecessor = None
429
430 # find continuity in guest physical address space
Janosch Frank6782c0e2016-01-22 13:08:38 +0100431 if len(guest_phys_blocks) > 0:
Janosch Frank47890202016-01-22 13:08:36 +0100432 predecessor = guest_phys_blocks[-1]
433 predecessor_size = (predecessor["target_end"] -
434 predecessor["target_start"])
435
436 # the memory API guarantees monotonically increasing
437 # traversal
Janosch Frank6782c0e2016-01-22 13:08:38 +0100438 assert predecessor["target_end"] <= target_start
Janosch Frank47890202016-01-22 13:08:36 +0100439
440 # we want continuity in both guest-physical and
441 # host-virtual memory
442 if (predecessor["target_end"] < target_start or
443 predecessor["host_addr"] + predecessor_size != host_addr):
444 predecessor = None
445
Janosch Frank6782c0e2016-01-22 13:08:38 +0100446 if predecessor is None:
Janosch Frank47890202016-01-22 13:08:36 +0100447 # isolated mapping, add it to the list
448 guest_phys_blocks.append({"target_start": target_start,
Janosch Frank6782c0e2016-01-22 13:08:38 +0100449 "target_end": target_end,
450 "host_addr": host_addr})
Janosch Frank47890202016-01-22 13:08:36 +0100451 message = "added"
452 else:
453 # expand predecessor until @target_end; predecessor's
454 # start doesn't change
455 predecessor["target_end"] = target_end
456 message = "joined"
457
Janosch Frank7cb10892016-01-22 13:08:37 +0100458 print("%016x %016x %016x %-7s %5u" %
459 (target_start, target_end, host_addr.cast(UINTPTR_T),
460 message, len(guest_phys_blocks)))
Janosch Frank47890202016-01-22 13:08:36 +0100461
462 return guest_phys_blocks
463
464
Janosch Frank28fbf8f2016-01-22 13:08:40 +0100465# The leading docstring doesn't have idiomatic Python formatting. It is
466# printed by gdb's "help" command (the first line is printed in the
467# "help data" summary), and it should match how other help texts look in
468# gdb.
Laszlo Ersek3e16d142013-12-17 01:37:06 +0100469class DumpGuestMemory(gdb.Command):
470 """Extract guest vmcore from qemu process coredump.
471
Janosch Frank368e3ad2016-01-22 13:08:39 +0100472The two required arguments are FILE and ARCH:
473FILE identifies the target file to write the guest vmcore to.
474ARCH specifies the architecture for which the core will be generated.
Laszlo Ersek3e16d142013-12-17 01:37:06 +0100475
476This GDB command reimplements the dump-guest-memory QMP command in
477python, using the representation of guest memory as captured in the qemu
478coredump. The qemu process that has been dumped must have had the
Janosch Frank368e3ad2016-01-22 13:08:39 +0100479command line option "-machine dump-guest-core=on" which is the default.
Laszlo Ersek3e16d142013-12-17 01:37:06 +0100480
481For simplicity, the "paging", "begin" and "end" parameters of the QMP
482command are not supported -- no attempt is made to get the guest's
483internal paging structures (ie. paging=false is hard-wired), and guest
484memory is always fully dumped.
485
Janosch Frank368e3ad2016-01-22 13:08:39 +0100486Currently aarch64-be, aarch64-le, X86_64, 386, s390, ppc64-be,
487ppc64-le guests are supported.
Laszlo Ersek3e16d142013-12-17 01:37:06 +0100488
489The CORE/NT_PRSTATUS and QEMU notes (that is, the VCPUs' statuses) are
490not written to the vmcore. Preparing these would require context that is
491only present in the KVM host kernel module when the guest is alive. A
492fake ELF note is written instead, only to keep the ELF parser of "crash"
493happy.
494
495Dependent on how busted the qemu process was at the time of the
496coredump, this command might produce unpredictable results. If qemu
497deliberately called abort(), or it was dumped in response to a signal at
498a halfway fortunate point, then its coredump should be in reasonable
499shape and this command should mostly work."""
500
Laszlo Ersek3e16d142013-12-17 01:37:06 +0100501 def __init__(self):
502 super(DumpGuestMemory, self).__init__("dump-guest-memory",
503 gdb.COMMAND_DATA,
504 gdb.COMPLETE_FILENAME)
Janosch Frank368e3ad2016-01-22 13:08:39 +0100505 self.elf = None
Janosch Frank47890202016-01-22 13:08:36 +0100506 self.guest_phys_blocks = None
Laszlo Ersek3e16d142013-12-17 01:37:06 +0100507
Janosch Frank368e3ad2016-01-22 13:08:39 +0100508 def dump_init(self, vmcore):
509 """Prepares and writes ELF structures to core file."""
Laszlo Ersek3e16d142013-12-17 01:37:06 +0100510
Janosch Frank368e3ad2016-01-22 13:08:39 +0100511 # Needed to make crash happy, data for more useful notes is
512 # not available in a qemu core.
513 self.elf.add_note("NONE", "EMPTY", 0)
Laszlo Ersek3e16d142013-12-17 01:37:06 +0100514
Janosch Frank368e3ad2016-01-22 13:08:39 +0100515 # We should never reach PN_XNUM for paging=false dumps,
516 # there's just a handful of discontiguous ranges after
517 # merging.
518 # The constant is needed to account for the PT_NOTE segment.
519 phdr_num = len(self.guest_phys_blocks) + 1
520 assert phdr_num < PN_XNUM
Laszlo Ersek3e16d142013-12-17 01:37:06 +0100521
Laszlo Ersek3e16d142013-12-17 01:37:06 +0100522 for block in self.guest_phys_blocks:
Janosch Frank368e3ad2016-01-22 13:08:39 +0100523 block_size = block["target_end"] - block["target_start"]
524 self.elf.add_segment(PT_LOAD, block["target_start"], block_size)
525
526 self.elf.to_file(vmcore)
Laszlo Ersek3e16d142013-12-17 01:37:06 +0100527
528 def dump_iterate(self, vmcore):
Janosch Frank368e3ad2016-01-22 13:08:39 +0100529 """Writes guest core to file."""
530
Laszlo Ersek3e16d142013-12-17 01:37:06 +0100531 qemu_core = gdb.inferiors()[0]
532 for block in self.guest_phys_blocks:
Janosch Frank6782c0e2016-01-22 13:08:38 +0100533 cur = block["host_addr"]
Laszlo Ersek3e16d142013-12-17 01:37:06 +0100534 left = block["target_end"] - block["target_start"]
Janosch Frank7cb10892016-01-22 13:08:37 +0100535 print("dumping range at %016x for length %016x" %
536 (cur.cast(UINTPTR_T), left))
Janosch Frank368e3ad2016-01-22 13:08:39 +0100537
Janosch Frank6782c0e2016-01-22 13:08:38 +0100538 while left > 0:
Janosch Frankca81ce72016-01-22 13:08:35 +0100539 chunk_size = min(TARGET_PAGE_SIZE, left)
Laszlo Ersek3e16d142013-12-17 01:37:06 +0100540 chunk = qemu_core.read_memory(cur, chunk_size)
541 vmcore.write(chunk)
Janosch Frank6782c0e2016-01-22 13:08:38 +0100542 cur += chunk_size
Laszlo Ersek3e16d142013-12-17 01:37:06 +0100543 left -= chunk_size
544
Marc-André Lureaud23bfa92017-09-11 18:59:28 +0200545 def phys_memory_read(self, addr, size):
546 qemu_core = gdb.inferiors()[0]
547 for block in self.guest_phys_blocks:
548 if block["target_start"] <= addr \
549 and addr + size <= block["target_end"]:
550 haddr = block["host_addr"] + (addr - block["target_start"])
551 return qemu_core.read_memory(haddr, size)
552 return None
553
554 def add_vmcoreinfo(self):
Marc-André Lureauce6b9e42018-01-31 11:37:24 +0100555 if gdb.lookup_symbol("vmcoreinfo_realize")[0] is None:
556 return
Marc-André Lureauc3b16422017-12-12 17:27:58 +0100557 vmci = 'vmcoreinfo_realize::vmcoreinfo_state'
Marc-André Lureaud36d0a92017-12-01 12:37:44 +0100558 if not gdb.parse_and_eval("%s" % vmci) \
559 or not gdb.parse_and_eval("(%s)->has_vmcoreinfo" % vmci):
Marc-André Lureaud23bfa92017-09-11 18:59:28 +0200560 return
561
Marc-André Lureaud36d0a92017-12-01 12:37:44 +0100562 fmt = gdb.parse_and_eval("(%s)->vmcoreinfo.guest_format" % vmci)
563 addr = gdb.parse_and_eval("(%s)->vmcoreinfo.paddr" % vmci)
564 size = gdb.parse_and_eval("(%s)->vmcoreinfo.size" % vmci)
Marc-André Lureaud23bfa92017-09-11 18:59:28 +0200565
566 fmt = le16_to_cpu(fmt)
567 addr = le64_to_cpu(addr)
568 size = le32_to_cpu(size)
569
570 if fmt != VMCOREINFO_FORMAT_ELF:
571 return
572
573 vmcoreinfo = self.phys_memory_read(addr, size)
574 if vmcoreinfo:
Marc-André Lureau6f49ec42018-01-17 12:13:00 +0100575 self.elf.add_vmcoreinfo_note(bytes(vmcoreinfo))
Marc-André Lureaud23bfa92017-09-11 18:59:28 +0200576
Laszlo Ersek3e16d142013-12-17 01:37:06 +0100577 def invoke(self, args, from_tty):
Janosch Frank368e3ad2016-01-22 13:08:39 +0100578 """Handles command invocation from gdb."""
579
Laszlo Ersek3e16d142013-12-17 01:37:06 +0100580 # Unwittingly pressing the Enter key after the command should
581 # not dump the same multi-gig coredump to the same file.
582 self.dont_repeat()
583
584 argv = gdb.string_to_argv(args)
Janosch Frank368e3ad2016-01-22 13:08:39 +0100585 if len(argv) != 2:
586 raise gdb.GdbError("usage: dump-guest-memory FILE ARCH")
Laszlo Ersek3e16d142013-12-17 01:37:06 +0100587
Janosch Frank368e3ad2016-01-22 13:08:39 +0100588 self.elf = ELF(argv[1])
589 self.guest_phys_blocks = get_guest_phys_blocks()
Marc-André Lureaud23bfa92017-09-11 18:59:28 +0200590 self.add_vmcoreinfo()
Janosch Frank368e3ad2016-01-22 13:08:39 +0100591
592 with open(argv[0], "wb") as vmcore:
593 self.dump_init(vmcore)
594 self.dump_iterate(vmcore)
Laszlo Ersek3e16d142013-12-17 01:37:06 +0100595
596DumpGuestMemory()