| #!/usr/bin/env python |
| # |
| # Copyright 2011 the V8 project authors. All rights reserved. |
| # Redistribution and use in source and binary forms, with or without |
| # modification, are permitted provided that the following conditions are |
| # met: |
| # |
| # * Redistributions of source code must retain the above copyright |
| # notice, this list of conditions and the following disclaimer. |
| # * Redistributions in binary form must reproduce the above |
| # copyright notice, this list of conditions and the following |
| # disclaimer in the documentation and/or other materials provided |
| # with the distribution. |
| # * Neither the name of Google Inc. nor the names of its |
| # contributors may be used to endorse or promote products derived |
| # from this software without specific prior written permission. |
| # |
| # THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS |
| # "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT |
| # LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR |
| # A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT |
| # OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, |
| # SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT |
| # LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, |
| # DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY |
| # THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT |
| # (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE |
| # OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. |
| |
| import ctypes |
| import mmap |
| import optparse |
| import os |
| import disasm |
| import sys |
| import types |
| import codecs |
| import re |
| |
| |
| USAGE="""usage: %prog [OPTION]... |
| |
| Minidump analyzer. |
| |
| Shows the processor state at the point of exception including the |
| stack of the active thread and the referenced objects in the V8 |
| heap. Code objects are disassembled and the addresses linked from the |
| stack (pushed return addresses) are marked with "=>". |
| |
| |
| Examples: |
| $ %prog 12345678-1234-1234-1234-123456789abcd-full.dmp |
| """ |
| |
| DEBUG=False |
| |
| |
| def DebugPrint(s): |
| if not DEBUG: return |
| print s |
| |
| |
| class Descriptor(object): |
| """Descriptor of a structure in a memory.""" |
| |
| def __init__(self, fields): |
| self.fields = fields |
| self.is_flexible = False |
| for _, type_or_func in fields: |
| if isinstance(type_or_func, types.FunctionType): |
| self.is_flexible = True |
| break |
| if not self.is_flexible: |
| self.ctype = Descriptor._GetCtype(fields) |
| self.size = ctypes.sizeof(self.ctype) |
| |
| def Read(self, memory, offset): |
| if self.is_flexible: |
| fields_copy = self.fields[:] |
| last = 0 |
| for name, type_or_func in fields_copy: |
| if isinstance(type_or_func, types.FunctionType): |
| partial_ctype = Descriptor._GetCtype(fields_copy[:last]) |
| partial_object = partial_ctype.from_buffer(memory, offset) |
| type = type_or_func(partial_object) |
| if type is not None: |
| fields_copy[last] = (name, type) |
| last += 1 |
| else: |
| last += 1 |
| complete_ctype = Descriptor._GetCtype(fields_copy[:last]) |
| else: |
| complete_ctype = self.ctype |
| return complete_ctype.from_buffer(memory, offset) |
| |
| @staticmethod |
| def _GetCtype(fields): |
| class Raw(ctypes.Structure): |
| _fields_ = fields |
| _pack_ = 1 |
| |
| def __str__(self): |
| return "{" + ", ".join("%s: %s" % (field, self.__getattribute__(field)) |
| for field, _ in Raw._fields_) + "}" |
| return Raw |
| |
| |
| # Set of structures and constants that describe the layout of minidump |
| # files. Based on MSDN and Google Breakpad. |
| |
| MINIDUMP_HEADER = Descriptor([ |
| ("signature", ctypes.c_uint32), |
| ("version", ctypes.c_uint32), |
| ("stream_count", ctypes.c_uint32), |
| ("stream_directories_rva", ctypes.c_uint32), |
| ("checksum", ctypes.c_uint32), |
| ("time_date_stampt", ctypes.c_uint32), |
| ("flags", ctypes.c_uint64) |
| ]) |
| |
| MINIDUMP_LOCATION_DESCRIPTOR = Descriptor([ |
| ("data_size", ctypes.c_uint32), |
| ("rva", ctypes.c_uint32) |
| ]) |
| |
| MINIDUMP_DIRECTORY = Descriptor([ |
| ("stream_type", ctypes.c_uint32), |
| ("location", MINIDUMP_LOCATION_DESCRIPTOR.ctype) |
| ]) |
| |
| MD_EXCEPTION_MAXIMUM_PARAMETERS = 15 |
| |
| MINIDUMP_EXCEPTION = Descriptor([ |
| ("code", ctypes.c_uint32), |
| ("flags", ctypes.c_uint32), |
| ("record", ctypes.c_uint64), |
| ("address", ctypes.c_uint64), |
| ("parameter_count", ctypes.c_uint32), |
| ("unused_alignment", ctypes.c_uint32), |
| ("information", ctypes.c_uint64 * MD_EXCEPTION_MAXIMUM_PARAMETERS) |
| ]) |
| |
| MINIDUMP_EXCEPTION_STREAM = Descriptor([ |
| ("thread_id", ctypes.c_uint32), |
| ("unused_alignment", ctypes.c_uint32), |
| ("exception", MINIDUMP_EXCEPTION.ctype), |
| ("thread_context", MINIDUMP_LOCATION_DESCRIPTOR.ctype) |
| ]) |
| |
| # Stream types. |
| MD_UNUSED_STREAM = 0 |
| MD_RESERVED_STREAM_0 = 1 |
| MD_RESERVED_STREAM_1 = 2 |
| MD_THREAD_LIST_STREAM = 3 |
| MD_MODULE_LIST_STREAM = 4 |
| MD_MEMORY_LIST_STREAM = 5 |
| MD_EXCEPTION_STREAM = 6 |
| MD_SYSTEM_INFO_STREAM = 7 |
| MD_THREAD_EX_LIST_STREAM = 8 |
| MD_MEMORY_64_LIST_STREAM = 9 |
| MD_COMMENT_STREAM_A = 10 |
| MD_COMMENT_STREAM_W = 11 |
| MD_HANDLE_DATA_STREAM = 12 |
| MD_FUNCTION_TABLE_STREAM = 13 |
| MD_UNLOADED_MODULE_LIST_STREAM = 14 |
| MD_MISC_INFO_STREAM = 15 |
| MD_MEMORY_INFO_LIST_STREAM = 16 |
| MD_THREAD_INFO_LIST_STREAM = 17 |
| MD_HANDLE_OPERATION_LIST_STREAM = 18 |
| |
| MD_FLOATINGSAVEAREA_X86_REGISTERAREA_SIZE = 80 |
| |
| MINIDUMP_FLOATING_SAVE_AREA_X86 = Descriptor([ |
| ("control_word", ctypes.c_uint32), |
| ("status_word", ctypes.c_uint32), |
| ("tag_word", ctypes.c_uint32), |
| ("error_offset", ctypes.c_uint32), |
| ("error_selector", ctypes.c_uint32), |
| ("data_offset", ctypes.c_uint32), |
| ("data_selector", ctypes.c_uint32), |
| ("register_area", ctypes.c_uint8 * MD_FLOATINGSAVEAREA_X86_REGISTERAREA_SIZE), |
| ("cr0_npx_state", ctypes.c_uint32) |
| ]) |
| |
| MD_CONTEXT_X86_EXTENDED_REGISTERS_SIZE = 512 |
| |
| # Context flags. |
| MD_CONTEXT_X86 = 0x00010000 |
| MD_CONTEXT_X86_CONTROL = (MD_CONTEXT_X86 | 0x00000001) |
| MD_CONTEXT_X86_INTEGER = (MD_CONTEXT_X86 | 0x00000002) |
| MD_CONTEXT_X86_SEGMENTS = (MD_CONTEXT_X86 | 0x00000004) |
| MD_CONTEXT_X86_FLOATING_POINT = (MD_CONTEXT_X86 | 0x00000008) |
| MD_CONTEXT_X86_DEBUG_REGISTERS = (MD_CONTEXT_X86 | 0x00000010) |
| MD_CONTEXT_X86_EXTENDED_REGISTERS = (MD_CONTEXT_X86 | 0x00000020) |
| |
| def EnableOnFlag(type, flag): |
| return lambda o: [None, type][int((o.context_flags & flag) != 0)] |
| |
| MINIDUMP_CONTEXT_X86 = Descriptor([ |
| ("context_flags", ctypes.c_uint32), |
| # MD_CONTEXT_X86_DEBUG_REGISTERS. |
| ("dr0", EnableOnFlag(ctypes.c_uint32, MD_CONTEXT_X86_DEBUG_REGISTERS)), |
| ("dr1", EnableOnFlag(ctypes.c_uint32, MD_CONTEXT_X86_DEBUG_REGISTERS)), |
| ("dr2", EnableOnFlag(ctypes.c_uint32, MD_CONTEXT_X86_DEBUG_REGISTERS)), |
| ("dr3", EnableOnFlag(ctypes.c_uint32, MD_CONTEXT_X86_DEBUG_REGISTERS)), |
| ("dr6", EnableOnFlag(ctypes.c_uint32, MD_CONTEXT_X86_DEBUG_REGISTERS)), |
| ("dr7", EnableOnFlag(ctypes.c_uint32, MD_CONTEXT_X86_DEBUG_REGISTERS)), |
| # MD_CONTEXT_X86_FLOATING_POINT. |
| ("float_save", EnableOnFlag(MINIDUMP_FLOATING_SAVE_AREA_X86.ctype, |
| MD_CONTEXT_X86_FLOATING_POINT)), |
| # MD_CONTEXT_X86_SEGMENTS. |
| ("gs", EnableOnFlag(ctypes.c_uint32, MD_CONTEXT_X86_SEGMENTS)), |
| ("fs", EnableOnFlag(ctypes.c_uint32, MD_CONTEXT_X86_SEGMENTS)), |
| ("es", EnableOnFlag(ctypes.c_uint32, MD_CONTEXT_X86_SEGMENTS)), |
| ("ds", EnableOnFlag(ctypes.c_uint32, MD_CONTEXT_X86_SEGMENTS)), |
| # MD_CONTEXT_X86_INTEGER. |
| ("edi", EnableOnFlag(ctypes.c_uint32, MD_CONTEXT_X86_INTEGER)), |
| ("esi", EnableOnFlag(ctypes.c_uint32, MD_CONTEXT_X86_INTEGER)), |
| ("ebx", EnableOnFlag(ctypes.c_uint32, MD_CONTEXT_X86_INTEGER)), |
| ("edx", EnableOnFlag(ctypes.c_uint32, MD_CONTEXT_X86_INTEGER)), |
| ("ecx", EnableOnFlag(ctypes.c_uint32, MD_CONTEXT_X86_INTEGER)), |
| ("eax", EnableOnFlag(ctypes.c_uint32, MD_CONTEXT_X86_INTEGER)), |
| # MD_CONTEXT_X86_CONTROL. |
| ("ebp", EnableOnFlag(ctypes.c_uint32, MD_CONTEXT_X86_CONTROL)), |
| ("eip", EnableOnFlag(ctypes.c_uint32, MD_CONTEXT_X86_CONTROL)), |
| ("cs", EnableOnFlag(ctypes.c_uint32, MD_CONTEXT_X86_CONTROL)), |
| ("eflags", EnableOnFlag(ctypes.c_uint32, MD_CONTEXT_X86_CONTROL)), |
| ("esp", EnableOnFlag(ctypes.c_uint32, MD_CONTEXT_X86_CONTROL)), |
| ("ss", EnableOnFlag(ctypes.c_uint32, MD_CONTEXT_X86_CONTROL)), |
| # MD_CONTEXT_X86_EXTENDED_REGISTERS. |
| ("extended_registers", |
| EnableOnFlag(ctypes.c_uint8 * MD_CONTEXT_X86_EXTENDED_REGISTERS_SIZE, |
| MD_CONTEXT_X86_EXTENDED_REGISTERS)) |
| ]) |
| |
| MINIDUMP_MEMORY_DESCRIPTOR = Descriptor([ |
| ("start", ctypes.c_uint64), |
| ("memory", MINIDUMP_LOCATION_DESCRIPTOR.ctype) |
| ]) |
| |
| MINIDUMP_MEMORY_DESCRIPTOR64 = Descriptor([ |
| ("start", ctypes.c_uint64), |
| ("size", ctypes.c_uint64) |
| ]) |
| |
| MINIDUMP_MEMORY_LIST = Descriptor([ |
| ("range_count", ctypes.c_uint32), |
| ("ranges", lambda m: MINIDUMP_MEMORY_DESCRIPTOR.ctype * m.range_count) |
| ]) |
| |
| MINIDUMP_MEMORY_LIST64 = Descriptor([ |
| ("range_count", ctypes.c_uint64), |
| ("base_rva", ctypes.c_uint64), |
| ("ranges", lambda m: MINIDUMP_MEMORY_DESCRIPTOR64.ctype * m.range_count) |
| ]) |
| |
| MINIDUMP_THREAD = Descriptor([ |
| ("id", ctypes.c_uint32), |
| ("suspend_count", ctypes.c_uint32), |
| ("priority_class", ctypes.c_uint32), |
| ("priority", ctypes.c_uint32), |
| ("ted", ctypes.c_uint64), |
| ("stack", MINIDUMP_MEMORY_DESCRIPTOR.ctype), |
| ("context", MINIDUMP_LOCATION_DESCRIPTOR.ctype) |
| ]) |
| |
| MINIDUMP_THREAD_LIST = Descriptor([ |
| ("thread_count", ctypes.c_uint32), |
| ("threads", lambda t: MINIDUMP_THREAD.ctype * t.thread_count) |
| ]) |
| |
| |
| class MinidumpReader(object): |
| """Minidump (.dmp) reader.""" |
| |
| _HEADER_MAGIC = 0x504d444d |
| |
| def __init__(self, options, minidump_name): |
| self.minidump_name = minidump_name |
| self.minidump_file = open(minidump_name, "r") |
| self.minidump = mmap.mmap(self.minidump_file.fileno(), 0, mmap.MAP_PRIVATE) |
| self.header = MINIDUMP_HEADER.Read(self.minidump, 0) |
| if self.header.signature != MinidumpReader._HEADER_MAGIC: |
| print >>sys.stderr, "Warning: unsupported minidump header magic" |
| DebugPrint(self.header) |
| directories = [] |
| offset = self.header.stream_directories_rva |
| for _ in xrange(self.header.stream_count): |
| directories.append(MINIDUMP_DIRECTORY.Read(self.minidump, offset)) |
| offset += MINIDUMP_DIRECTORY.size |
| self.exception = None |
| self.exception_context = None |
| self.memory_list = None |
| self.memory_list64 = None |
| self.thread_map = {} |
| for d in directories: |
| DebugPrint(d) |
| # TODO(vitalyr): extract system info including CPU features. |
| if d.stream_type == MD_EXCEPTION_STREAM: |
| self.exception = MINIDUMP_EXCEPTION_STREAM.Read( |
| self.minidump, d.location.rva) |
| DebugPrint(self.exception) |
| self.exception_context = MINIDUMP_CONTEXT_X86.Read( |
| self.minidump, self.exception.thread_context.rva) |
| DebugPrint(self.exception_context) |
| elif d.stream_type == MD_THREAD_LIST_STREAM: |
| thread_list = MINIDUMP_THREAD_LIST.Read(self.minidump, d.location.rva) |
| assert ctypes.sizeof(thread_list) == d.location.data_size |
| DebugPrint(thread_list) |
| for thread in thread_list.threads: |
| DebugPrint(thread) |
| self.thread_map[thread.id] = thread |
| elif d.stream_type == MD_MEMORY_LIST_STREAM: |
| print >>sys.stderr, "Warning: not a full minidump" |
| assert self.memory_list is None |
| self.memory_list = MINIDUMP_MEMORY_LIST.Read( |
| self.minidump, d.location.rva) |
| assert ctypes.sizeof(self.memory_list) == d.location.data_size |
| DebugPrint(self.memory_list) |
| elif d.stream_type == MD_MEMORY_64_LIST_STREAM: |
| assert self.memory_list64 is None |
| self.memory_list64 = MINIDUMP_MEMORY_LIST64.Read( |
| self.minidump, d.location.rva) |
| assert ctypes.sizeof(self.memory_list64) == d.location.data_size |
| DebugPrint(self.memory_list64) |
| |
| def IsValidAddress(self, address): |
| return self.FindLocation(address) is not None |
| |
| def ReadU8(self, address): |
| location = self.FindLocation(address) |
| return ctypes.c_uint8.from_buffer(self.minidump, location).value |
| |
| def ReadU32(self, address): |
| location = self.FindLocation(address) |
| return ctypes.c_uint32.from_buffer(self.minidump, location).value |
| |
| def ReadBytes(self, address, size): |
| location = self.FindLocation(address) |
| return self.minidump[location:location + size] |
| |
| def FindLocation(self, address): |
| offset = 0 |
| if self.memory_list64 is not None: |
| for r in self.memory_list64.ranges: |
| if r.start <= address < r.start + r.size: |
| return self.memory_list64.base_rva + offset + address - r.start |
| offset += r.size |
| if self.memory_list is not None: |
| for r in self.memory_list.ranges: |
| if r.start <= address < r.start + r.memory.data_size: |
| return r.memory.rva + address - r.start |
| return None |
| |
| def GetDisasmLines(self, address, size): |
| location = self.FindLocation(address) |
| if location is None: return [] |
| return disasm.GetDisasmLines(self.minidump_name, |
| location, |
| size, |
| "ia32", |
| False) |
| |
| |
| def Dispose(self): |
| self.minidump.close() |
| self.minidump_file.close() |
| |
| |
| # List of V8 instance types. Obtained by adding the code below to any .cc file. |
| # |
| # #define DUMP_TYPE(T) printf("%d: \"%s\",\n", T, #T); |
| # struct P { |
| # P() { |
| # printf("{\n"); |
| # INSTANCE_TYPE_LIST(DUMP_TYPE) |
| # printf("}\n"); |
| # } |
| # }; |
| # static P p; |
| INSTANCE_TYPES = { |
| 64: "SYMBOL_TYPE", |
| 68: "ASCII_SYMBOL_TYPE", |
| 65: "CONS_SYMBOL_TYPE", |
| 69: "CONS_ASCII_SYMBOL_TYPE", |
| 66: "EXTERNAL_SYMBOL_TYPE", |
| 74: "EXTERNAL_SYMBOL_WITH_ASCII_DATA_TYPE", |
| 70: "EXTERNAL_ASCII_SYMBOL_TYPE", |
| 0: "STRING_TYPE", |
| 4: "ASCII_STRING_TYPE", |
| 1: "CONS_STRING_TYPE", |
| 5: "CONS_ASCII_STRING_TYPE", |
| 2: "EXTERNAL_STRING_TYPE", |
| 10: "EXTERNAL_STRING_WITH_ASCII_DATA_TYPE", |
| 6: "EXTERNAL_ASCII_STRING_TYPE", |
| 6: "PRIVATE_EXTERNAL_ASCII_STRING_TYPE", |
| 128: "MAP_TYPE", |
| 129: "CODE_TYPE", |
| 130: "ODDBALL_TYPE", |
| 131: "JS_GLOBAL_PROPERTY_CELL_TYPE", |
| 132: "HEAP_NUMBER_TYPE", |
| 133: "FOREIGN_TYPE", |
| 134: "BYTE_ARRAY_TYPE", |
| 135: "EXTERNAL_BYTE_ARRAY_TYPE", |
| 136: "EXTERNAL_UNSIGNED_BYTE_ARRAY_TYPE", |
| 137: "EXTERNAL_SHORT_ARRAY_TYPE", |
| 138: "EXTERNAL_UNSIGNED_SHORT_ARRAY_TYPE", |
| 139: "EXTERNAL_INT_ARRAY_TYPE", |
| 140: "EXTERNAL_UNSIGNED_INT_ARRAY_TYPE", |
| 141: "EXTERNAL_FLOAT_ARRAY_TYPE", |
| 143: "EXTERNAL_PIXEL_ARRAY_TYPE", |
| 145: "FILLER_TYPE", |
| 146: "ACCESSOR_INFO_TYPE", |
| 147: "ACCESS_CHECK_INFO_TYPE", |
| 148: "INTERCEPTOR_INFO_TYPE", |
| 149: "CALL_HANDLER_INFO_TYPE", |
| 150: "FUNCTION_TEMPLATE_INFO_TYPE", |
| 151: "OBJECT_TEMPLATE_INFO_TYPE", |
| 152: "SIGNATURE_INFO_TYPE", |
| 153: "TYPE_SWITCH_INFO_TYPE", |
| 154: "SCRIPT_TYPE", |
| 155: "CODE_CACHE_TYPE", |
| 156: "POLYMORPHIC_CODE_CACHE_TYPE", |
| 159: "FIXED_ARRAY_TYPE", |
| 160: "SHARED_FUNCTION_INFO_TYPE", |
| 161: "JS_MESSAGE_OBJECT_TYPE", |
| 162: "JS_VALUE_TYPE", |
| 163: "JS_OBJECT_TYPE", |
| 164: "JS_CONTEXT_EXTENSION_OBJECT_TYPE", |
| 165: "JS_GLOBAL_OBJECT_TYPE", |
| 166: "JS_BUILTINS_OBJECT_TYPE", |
| 167: "JS_GLOBAL_PROXY_TYPE", |
| 168: "JS_ARRAY_TYPE", |
| 169: "JS_PROXY_TYPE", |
| 170: "JS_WEAK_MAP_TYPE", |
| 171: "JS_REGEXP_TYPE", |
| 172: "JS_FUNCTION_TYPE", |
| 173: "JS_FUNCTION_PROXY_TYPE", |
| 157: "DEBUG_INFO_TYPE", |
| 158: "BREAK_POINT_INFO_TYPE", |
| } |
| |
| |
| class Printer(object): |
| """Printer with indentation support.""" |
| |
| def __init__(self): |
| self.indent = 0 |
| |
| def Indent(self): |
| self.indent += 2 |
| |
| def Dedent(self): |
| self.indent -= 2 |
| |
| def Print(self, string): |
| print "%s%s" % (self._IndentString(), string) |
| |
| def PrintLines(self, lines): |
| indent = self._IndentString() |
| print "\n".join("%s%s" % (indent, line) for line in lines) |
| |
| def _IndentString(self): |
| return self.indent * " " |
| |
| |
| ADDRESS_RE = re.compile(r"0x[0-9a-fA-F]+") |
| |
| |
| def FormatDisasmLine(start, heap, line): |
| line_address = start + line[0] |
| stack_slot = heap.stack_map.get(line_address) |
| marker = " " |
| if stack_slot: |
| marker = "=>" |
| code = AnnotateAddresses(heap, line[1]) |
| return "%s%08x %08x: %s" % (marker, line_address, line[0], code) |
| |
| |
| def AnnotateAddresses(heap, line): |
| extra = [] |
| for m in ADDRESS_RE.finditer(line): |
| maybe_address = int(m.group(0), 16) |
| object = heap.FindObject(maybe_address) |
| if not object: continue |
| extra.append(str(object)) |
| if len(extra) == 0: return line |
| return "%s ;; %s" % (line, ", ".join(extra)) |
| |
| |
| class HeapObject(object): |
| def __init__(self, heap, map, address): |
| self.heap = heap |
| self.map = map |
| self.address = address |
| |
| def Is(self, cls): |
| return isinstance(self, cls) |
| |
| def Print(self, p): |
| p.Print(str(self)) |
| |
| def __str__(self): |
| return "HeapObject(%08x, %s)" % (self.address, |
| INSTANCE_TYPES[self.map.instance_type]) |
| |
| def ObjectField(self, offset): |
| field_value = self.heap.reader.ReadU32(self.address + offset) |
| return self.heap.FindObjectOrSmi(field_value) |
| |
| def SmiField(self, offset): |
| field_value = self.heap.reader.ReadU32(self.address + offset) |
| assert (field_value & 1) == 0 |
| return field_value / 2 |
| |
| |
| class Map(HeapObject): |
| INSTANCE_TYPE_OFFSET = 8 |
| |
| def __init__(self, heap, map, address): |
| HeapObject.__init__(self, heap, map, address) |
| self.instance_type = \ |
| heap.reader.ReadU8(self.address + Map.INSTANCE_TYPE_OFFSET) |
| |
| |
| class String(HeapObject): |
| LENGTH_OFFSET = 4 |
| |
| def __init__(self, heap, map, address): |
| HeapObject.__init__(self, heap, map, address) |
| self.length = self.SmiField(String.LENGTH_OFFSET) |
| |
| def GetChars(self): |
| return "?string?" |
| |
| def Print(self, p): |
| p.Print(str(self)) |
| |
| def __str__(self): |
| return "\"%s\"" % self.GetChars() |
| |
| |
| class SeqString(String): |
| CHARS_OFFSET = 12 |
| |
| def __init__(self, heap, map, address): |
| String.__init__(self, heap, map, address) |
| self.chars = heap.reader.ReadBytes(self.address + SeqString.CHARS_OFFSET, |
| self.length) |
| |
| def GetChars(self): |
| return self.chars |
| |
| |
| class ExternalString(String): |
| RESOURCE_OFFSET = 12 |
| |
| WEBKIT_RESOUCE_STRING_IMPL_OFFSET = 4 |
| WEBKIT_STRING_IMPL_CHARS_OFFSET = 8 |
| |
| def __init__(self, heap, map, address): |
| String.__init__(self, heap, map, address) |
| reader = heap.reader |
| self.resource = \ |
| reader.ReadU32(self.address + ExternalString.RESOURCE_OFFSET) |
| self.chars = "?external string?" |
| if not reader.IsValidAddress(self.resource): return |
| string_impl_address = self.resource + \ |
| ExternalString.WEBKIT_RESOUCE_STRING_IMPL_OFFSET |
| if not reader.IsValidAddress(string_impl_address): return |
| string_impl = reader.ReadU32(string_impl_address) |
| chars_ptr_address = string_impl + \ |
| ExternalString.WEBKIT_STRING_IMPL_CHARS_OFFSET |
| if not reader.IsValidAddress(chars_ptr_address): return |
| chars_ptr = reader.ReadU32(chars_ptr_address) |
| if not reader.IsValidAddress(chars_ptr): return |
| raw_chars = reader.ReadBytes(chars_ptr, 2 * self.length) |
| self.chars = codecs.getdecoder("utf16")(raw_chars)[0] |
| |
| def GetChars(self): |
| return self.chars |
| |
| |
| class ConsString(String): |
| LEFT_OFFSET = 12 |
| RIGHT_OFFSET = 16 |
| |
| def __init__(self, heap, map, address): |
| String.__init__(self, heap, map, address) |
| self.left = self.ObjectField(ConsString.LEFT_OFFSET) |
| self.right = self.ObjectField(ConsString.RIGHT_OFFSET) |
| |
| def GetChars(self): |
| return self.left.GetChars() + self.right.GetChars() |
| |
| |
| class Oddball(HeapObject): |
| TO_STRING_OFFSET = 4 |
| |
| def __init__(self, heap, map, address): |
| HeapObject.__init__(self, heap, map, address) |
| self.to_string = self.ObjectField(Oddball.TO_STRING_OFFSET) |
| |
| def Print(self, p): |
| p.Print(str(self)) |
| |
| def __str__(self): |
| return "<%s>" % self.to_string.GetChars() |
| |
| |
| class FixedArray(HeapObject): |
| LENGTH_OFFSET = 4 |
| ELEMENTS_OFFSET = 8 |
| |
| def __init__(self, heap, map, address): |
| HeapObject.__init__(self, heap, map, address) |
| self.length = self.SmiField(FixedArray.LENGTH_OFFSET) |
| |
| def Print(self, p): |
| p.Print("FixedArray(%08x) {" % self.address) |
| p.Indent() |
| p.Print("length: %d" % self.length) |
| for i in xrange(self.length): |
| offset = FixedArray.ELEMENTS_OFFSET + 4 * i |
| p.Print("[%08d] = %s" % (i, self.ObjectField(offset))) |
| p.Dedent() |
| p.Print("}") |
| |
| def __str__(self): |
| return "FixedArray(%08x, length=%d)" % (self.address, self.length) |
| |
| |
| class JSFunction(HeapObject): |
| CODE_ENTRY_OFFSET = 12 |
| SHARED_OFFSET = 20 |
| |
| def __init__(self, heap, map, address): |
| HeapObject.__init__(self, heap, map, address) |
| code_entry = \ |
| heap.reader.ReadU32(self.address + JSFunction.CODE_ENTRY_OFFSET) |
| self.code = heap.FindObject(code_entry - Code.ENTRY_OFFSET + 1) |
| self.shared = self.ObjectField(JSFunction.SHARED_OFFSET) |
| |
| def Print(self, p): |
| source = "\n".join(" %s" % line for line in self._GetSource().split("\n")) |
| p.Print("JSFunction(%08x) {" % self.address) |
| p.Indent() |
| p.Print("inferred name: %s" % self.shared.inferred_name) |
| if self.shared.script.Is(Script) and self.shared.script.name.Is(String): |
| p.Print("script name: %s" % self.shared.script.name) |
| p.Print("source:") |
| p.PrintLines(self._GetSource().split("\n")) |
| p.Print("code:") |
| self.code.Print(p) |
| if self.code != self.shared.code: |
| p.Print("unoptimized code:") |
| self.shared.code.Print(p) |
| p.Dedent() |
| p.Print("}") |
| |
| def __str__(self): |
| inferred_name = "" |
| if self.shared.Is(SharedFunctionInfo): |
| inferred_name = self.shared.inferred_name |
| return "JSFunction(%08x, %s)" % (self.address, inferred_name) |
| |
| def _GetSource(self): |
| source = "?source?" |
| start = self.shared.start_position |
| end = self.shared.end_position |
| if not self.shared.script.Is(Script): return source |
| script_source = self.shared.script.source |
| if not script_source.Is(String): return source |
| return script_source.GetChars()[start:end] |
| |
| |
| class SharedFunctionInfo(HeapObject): |
| CODE_OFFSET = 2 * 4 |
| SCRIPT_OFFSET = 7 * 4 |
| INFERRED_NAME_OFFSET = 9 * 4 |
| START_POSITION_AND_TYPE_OFFSET = 17 * 4 |
| END_POSITION_OFFSET = 18 * 4 |
| |
| def __init__(self, heap, map, address): |
| HeapObject.__init__(self, heap, map, address) |
| self.code = self.ObjectField(SharedFunctionInfo.CODE_OFFSET) |
| self.script = self.ObjectField(SharedFunctionInfo.SCRIPT_OFFSET) |
| self.inferred_name = \ |
| self.ObjectField(SharedFunctionInfo.INFERRED_NAME_OFFSET) |
| start_position_and_type = \ |
| self.SmiField(SharedFunctionInfo.START_POSITION_AND_TYPE_OFFSET) |
| self.start_position = start_position_and_type >> 2 |
| self.end_position = self.SmiField(SharedFunctionInfo.END_POSITION_OFFSET) |
| |
| |
| class Script(HeapObject): |
| SOURCE_OFFSET = 4 |
| NAME_OFFSET = 8 |
| |
| def __init__(self, heap, map, address): |
| HeapObject.__init__(self, heap, map, address) |
| self.source = self.ObjectField(Script.SOURCE_OFFSET) |
| self.name = self.ObjectField(Script.NAME_OFFSET) |
| |
| |
| class Code(HeapObject): |
| INSTRUCTION_SIZE_OFFSET = 4 |
| ENTRY_OFFSET = 32 |
| |
| def __init__(self, heap, map, address): |
| HeapObject.__init__(self, heap, map, address) |
| self.entry = self.address + Code.ENTRY_OFFSET |
| self.instruction_size = \ |
| heap.reader.ReadU32(self.address + Code.INSTRUCTION_SIZE_OFFSET) |
| |
| def Print(self, p): |
| lines = self.heap.reader.GetDisasmLines(self.entry, self.instruction_size) |
| p.Print("Code(%08x) {" % self.address) |
| p.Indent() |
| p.Print("instruction_size: %d" % self.instruction_size) |
| p.PrintLines(self._FormatLine(line) for line in lines) |
| p.Dedent() |
| p.Print("}") |
| |
| def _FormatLine(self, line): |
| return FormatDisasmLine(self.entry, self.heap, line) |
| |
| |
| class V8Heap(object): |
| CLASS_MAP = { |
| "SYMBOL_TYPE": SeqString, |
| "ASCII_SYMBOL_TYPE": SeqString, |
| "CONS_SYMBOL_TYPE": ConsString, |
| "CONS_ASCII_SYMBOL_TYPE": ConsString, |
| "EXTERNAL_SYMBOL_TYPE": ExternalString, |
| "EXTERNAL_SYMBOL_WITH_ASCII_DATA_TYPE": ExternalString, |
| "EXTERNAL_ASCII_SYMBOL_TYPE": ExternalString, |
| "STRING_TYPE": SeqString, |
| "ASCII_STRING_TYPE": SeqString, |
| "CONS_STRING_TYPE": ConsString, |
| "CONS_ASCII_STRING_TYPE": ConsString, |
| "EXTERNAL_STRING_TYPE": ExternalString, |
| "EXTERNAL_STRING_WITH_ASCII_DATA_TYPE": ExternalString, |
| "EXTERNAL_ASCII_STRING_TYPE": ExternalString, |
| |
| "MAP_TYPE": Map, |
| "ODDBALL_TYPE": Oddball, |
| "FIXED_ARRAY_TYPE": FixedArray, |
| "JS_FUNCTION_TYPE": JSFunction, |
| "SHARED_FUNCTION_INFO_TYPE": SharedFunctionInfo, |
| "SCRIPT_TYPE": Script, |
| "CODE_TYPE": Code |
| } |
| |
| def __init__(self, reader, stack_map): |
| self.reader = reader |
| self.stack_map = stack_map |
| self.objects = {} |
| |
| def FindObjectOrSmi(self, tagged_address): |
| if (tagged_address & 1) == 0: return tagged_address / 2 |
| return self.FindObject(tagged_address) |
| |
| def FindObject(self, tagged_address): |
| if tagged_address in self.objects: |
| return self.objects[tagged_address] |
| if (tagged_address & 1) != 1: return None |
| address = tagged_address - 1 |
| if not self.reader.IsValidAddress(address): return None |
| map_tagged_address = self.reader.ReadU32(address) |
| if tagged_address == map_tagged_address: |
| # Meta map? |
| meta_map = Map(self, None, address) |
| instance_type_name = INSTANCE_TYPES.get(meta_map.instance_type) |
| if instance_type_name != "MAP_TYPE": return None |
| meta_map.map = meta_map |
| object = meta_map |
| else: |
| map = self.FindObject(map_tagged_address) |
| if map is None: return None |
| instance_type_name = INSTANCE_TYPES.get(map.instance_type) |
| if instance_type_name is None: return None |
| cls = V8Heap.CLASS_MAP.get(instance_type_name, HeapObject) |
| object = cls(self, map, address) |
| self.objects[tagged_address] = object |
| return object |
| |
| |
| EIP_PROXIMITY = 64 |
| |
| |
| def AnalyzeMinidump(options, minidump_name): |
| reader = MinidumpReader(options, minidump_name) |
| DebugPrint("========================================") |
| if reader.exception is None: |
| print "Minidump has no exception info" |
| return |
| print "Exception info:" |
| exception_thread = reader.thread_map[reader.exception.thread_id] |
| print " thread id: %d" % exception_thread.id |
| print " code: %08X" % reader.exception.exception.code |
| print " context:" |
| print " eax: %08x" % reader.exception_context.eax |
| print " ebx: %08x" % reader.exception_context.ebx |
| print " ecx: %08x" % reader.exception_context.ecx |
| print " edx: %08x" % reader.exception_context.edx |
| print " edi: %08x" % reader.exception_context.edi |
| print " esi: %08x" % reader.exception_context.esi |
| print " ebp: %08x" % reader.exception_context.ebp |
| print " esp: %08x" % reader.exception_context.esp |
| print " eip: %08x" % reader.exception_context.eip |
| # TODO(vitalyr): decode eflags. |
| print " eflags: %s" % bin(reader.exception_context.eflags)[2:] |
| print |
| |
| stack_bottom = exception_thread.stack.start + \ |
| exception_thread.stack.memory.data_size |
| stack_map = {reader.exception_context.eip: -1} |
| for slot in xrange(reader.exception_context.esp, stack_bottom, 4): |
| maybe_address = reader.ReadU32(slot) |
| if not maybe_address in stack_map: |
| stack_map[maybe_address] = slot |
| heap = V8Heap(reader, stack_map) |
| |
| print "Disassembly around exception.eip:" |
| start = reader.exception_context.eip - EIP_PROXIMITY |
| lines = reader.GetDisasmLines(start, 2 * EIP_PROXIMITY) |
| for line in lines: |
| print FormatDisasmLine(start, heap, line) |
| print |
| |
| print "Annotated stack (from exception.esp to bottom):" |
| for slot in xrange(reader.exception_context.esp, stack_bottom, 4): |
| maybe_address = reader.ReadU32(slot) |
| heap_object = heap.FindObject(maybe_address) |
| print "%08x: %08x" % (slot, maybe_address) |
| if heap_object: |
| heap_object.Print(Printer()) |
| print |
| |
| reader.Dispose() |
| |
| |
| if __name__ == "__main__": |
| parser = optparse.OptionParser(USAGE) |
| options, args = parser.parse_args() |
| if len(args) != 1: |
| parser.print_help() |
| sys.exit(1) |
| AnalyzeMinidump(options, args[0]) |