{ This file is part of the Free Pascal run time library. Copyright (c) 2006 by Thomas Schatzl, member of the FreePascal Development team Parts (c) 2000 Peter Vreman (adapted from original dwarfs line reader) Dwarf LineInfo Retriever See the file COPYING.FPC, included in this distribution, for details about the copyright. This program is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. **********************************************************************} { This unit should not be compiled in objfpc mode, since this would make it dependent on objpas unit. } unit lnfodwrf; interface {$S-} {$IF FPC_VERSION<3} type CodePointer = Pointer; {$ENDIF} function GetLineInfo(addr:codeptruint;var func,source:string;var line:longint) : boolean; function DwarfBackTraceStr(addr: CodePointer): shortstring; procedure CloseDwarf; var // Allows more efficient operation by reusing previously loaded debug data // when the target module filename is the same. However, if an invalid memory // address is supplied then further calls may result in an undefined behaviour. // In summary: enable for speed, disable for resilience. AllowReuseOfLineInfoData: Boolean = True; implementation {$IFDEF FPC_DOTTEDUNITS} uses System.ExeInfo; {$ELSE FPC_DOTTEDUNITS} uses exeinfo; {$ENDIF FPC_DOTTEDUNITS} { Current issues: - ignores DW_LNS_SET_FILE } {$MACRO ON} { $DEFINE DEBUG_DWARF_PARSER} {$ifdef DEBUG_DWARF_PARSER} {$define DEBUG_WRITELN := WriteLn} {$define DEBUG_COMMENT := } {$else} {$define DEBUG_WRITELN := //} {$define DEBUG_COMMENT := //} {$endif} { some type definitions } type Bool8 = ByteBool; {$ifdef CPUI8086} TOffset = Word; {$else CPUI8086} TOffset = PtrUInt; {$endif CPUI8086} TSegment = Word; {$WARNING This code is not thread-safe, and needs improvement} var { the input file to read DWARF debug info from, i.e. 
paramstr(0) } e : TExeFile; { the offset and size of the DWARF debug_line section in the file } Dwarf_Debug_Line_Section_Offset, Dwarf_Debug_Line_Section_Size, { the offset and size of the DWARF debug_info section in the file } Dwarf_Debug_Info_Section_Offset, Dwarf_Debug_Info_Section_Size, { the offset and size of the DWARF debug_aranges section in the file } Dwarf_Debug_Aranges_Section_Offset, Dwarf_Debug_Aranges_Section_Size, { the offset and size of the DWARF debug_abbrev section in the file } Dwarf_Debug_Abbrev_Section_Offset, Dwarf_Debug_Abbrev_Section_Size : longint; { DWARF 2 default opcodes} const { Extended opcodes } DW_LNE_END_SEQUENCE = 1; DW_LNE_SET_ADDRESS = 2; DW_LNE_DEFINE_FILE = 3; {$ifdef CPUI8086} { non-standard Open Watcom extension; might conflict with future versions of the DWARF standard } DW_LNE_SET_SEGMENT = 4; {$endif CPUI8086} { Standard opcodes } DW_LNS_COPY = 1; DW_LNS_ADVANCE_PC = 2; DW_LNS_ADVANCE_LINE = 3; DW_LNS_SET_FILE = 4; DW_LNS_SET_COLUMN = 5; DW_LNS_NEGATE_STMT = 6; DW_LNS_SET_BASIC_BLOCK = 7; DW_LNS_CONST_ADD_PC = 8; DW_LNS_FIXED_ADVANCE_PC = 9; DW_LNS_SET_PROLOGUE_END = 10; DW_LNS_SET_EPILOGUE_BEGIN = 11; DW_LNS_SET_ISA = 12; DW_FORM_addr = $1; DW_FORM_block2 = $3; DW_FORM_block4 = $4; DW_FORM_data2 = $5; DW_FORM_data4 = $6; DW_FORM_data8 = $7; DW_FORM_string = $8; DW_FORM_block = $9; DW_FORM_block1 = $a; DW_FORM_data1 = $b; DW_FORM_flag = $c; DW_FORM_sdata = $d; DW_FORM_strp = $e; DW_FORM_udata = $f; DW_FORM_ref_addr = $10; DW_FORM_ref1 = $11; DW_FORM_ref2 = $12; DW_FORM_ref4 = $13; DW_FORM_ref8 = $14; DW_FORM_ref_udata = $15; DW_FORM_indirect = $16; DW_FORM_sec_offset = $17; DW_FORM_exprloc = $18; DW_FORM_flag_present = $19; type { state record for the line info state machine } TMachineState = record address : QWord; segment : TSegment; file_id : DWord; line : QWord; column : DWord; is_stmt : Boolean; basic_block : Boolean; end_sequence : Boolean; prolouge_end : Boolean; epilouge_begin : Boolean; isa : DWord; append_row : 
Boolean; end; { DWARF line number program header preceding the line number program, 64 bit version } TLineNumberProgramHeader64 = packed record magic : DWord; unit_length : QWord; version : Word; length : QWord; minimum_instruction_length : Byte; default_is_stmt : Bool8; line_base : ShortInt; line_range : Byte; opcode_base : Byte; end; { DWARF line number program header preceding the line number program, 32 bit version } TLineNumberProgramHeader32 = packed record unit_length : DWord; version : Word; length : DWord; minimum_instruction_length : Byte; default_is_stmt : Bool8; line_base : ShortInt; line_range : Byte; opcode_base : Byte; end; TDebugInfoProgramHeader64 = packed record magic : DWord; unit_length : QWord; version : Word; debug_abbrev_offset : QWord; address_size : Byte; end; TDebugInfoProgramHeader32= packed record unit_length : DWord; version : Word; debug_abbrev_offset : DWord; address_size : Byte; end; TDebugArangesHeader64 = packed record magic : DWord; unit_length : QWord; version : Word; debug_info_offset : QWord; address_size : Byte; segment_size : Byte; {$ifndef CPUI8086} padding : DWord; {$endif CPUI8086} end; TDebugArangesHeader32= packed record unit_length : DWord; version : Word; debug_info_offset : DWord; address_size : Byte; segment_size : Byte; {$ifndef CPUI8086} padding : DWord; {$endif CPUI8086} end; {--------------------------------------------------------------------------- I/O utility functions ---------------------------------------------------------------------------} type {$ifdef cpui8086} TFilePos = LongInt; {$else cpui8086} TFilePos = SizeInt; {$endif cpui8086} var lastfilename: string; { store last processed file } lastbaseaddr: {$ifdef cpui8086}farpointer{$else}pointer{$endif}; { store last base address } lastopendwarf: Boolean; { store last result of processing a file } {$ifdef cpui8086} function tofar(fp: FarPointer): FarPointer; inline; begin tofar:=fp; end; function tofar(cp: NearCsPointer): FarPointer; inline; begin 
tofar:=Ptr(CSeg,Word(cp)); end; function tofar(cp: NearPointer): FarPointer; inline; begin tofar:=Ptr(DSeg,Word(cp)); end; {$else cpui8086} type tofar=Pointer; {$endif cpui8086} function OpenDwarf(addr : codepointer) : boolean; var oldprocessaddress: TExeProcessAddress; baseaddr : {$ifdef cpui8086}farpointer{$else}pointer{$endif}; filename,dbgfn : ansistring; begin // False by default OpenDwarf:=false; // Empty so can test if GetModuleByAddr has worked filename := ''; // Get filename by address using GetModuleByAddr GetModuleByAddr(tofar(addr),baseaddr,filename); {$ifdef DEBUG_LINEINFO} writeln(stderr,filename,' Baseaddr: ',hexstr(baseaddr)); {$endif DEBUG_LINEINFO} // Check if GetModuleByAddr has worked if filename = '' then exit; // If target filename same as previous, then re-use previous result if AllowReuseOfLineInfoData and (filename = lastfilename) and (baseaddr = lastbaseaddr) then begin {$ifdef DEBUG_LINEINFO} writeln(stderr,'Reusing debug data'); {$endif DEBUG_LINEINFO} OpenDwarf:=lastopendwarf; exit; end; // Close previously opened Dwarf CloseDwarf; // Reset last open dwarf result lastopendwarf := false; // Save newly processed filename lastfilename := filename; // Save newly processed file's base address lastbaseaddr := baseaddr; // Open exe file or debug link if not OpenExeFile(e,filename) then exit; if ReadDebugLink(e,dbgfn) then begin oldprocessaddress:=e.processaddress; CloseExeFile(e); if not OpenExeFile(e,dbgfn) then exit; e.processaddress:=oldprocessaddress; end; // Find debug data section e.processaddress:=ptruint(baseaddr)-e.processaddress; if FindExeSection(e,'.debug_line',Dwarf_Debug_Line_Section_offset,dwarf_Debug_Line_Section_size) and FindExeSection(e,'.debug_info',Dwarf_Debug_Info_Section_offset,dwarf_Debug_Info_Section_size) and FindExeSection(e,'.debug_abbrev',Dwarf_Debug_Abbrev_Section_offset,dwarf_Debug_Abbrev_Section_size) and FindExeSection(e,'.debug_aranges',Dwarf_Debug_Aranges_Section_offset,dwarf_Debug_Aranges_Section_size) then 
begin lastopendwarf:=true; OpenDwarf:=true; DEBUG_WRITELN('.debug_line starts at offset $',hexstr(Dwarf_Debug_Line_Section_offset,8),' with a size of ',Dwarf_Debug_Line_Section_Size,' Bytes'); DEBUG_WRITELN('.debug_info starts at offset $',hexstr(Dwarf_Debug_Info_Section_offset,8),' with a size of ',Dwarf_Debug_Info_Section_Size,' Bytes'); DEBUG_WRITELN('.debug_abbrev starts at offset $',hexstr(Dwarf_Debug_Abbrev_Section_offset,8),' with a size of ',Dwarf_Debug_Abbrev_Section_Size,' Bytes'); DEBUG_WRITELN('.debug_aranges starts at offset $',hexstr(Dwarf_Debug_Aranges_Section_offset,8),' with a size of ',Dwarf_Debug_Aranges_Section_Size,' Bytes'); end else CloseExeFile(e); end; procedure CloseDwarf; begin if e.isopen then CloseExeFile(e); // Reset last processed filename lastfilename := ''; end; type TEReader = object bufstart, base, limit: Int64; { All of these are absolute. } bufp, bufe: pByte; { bufp = pointer into buf, bufe - bufp = available bytes. } buf: array[0 .. 1023] of byte; procedure Init; procedure SetRange(aBase, aSize : Int64); function Pos : TFilePos; { Relative to base. } procedure Seek(newIndex : Int64); { Relative to base. } function ReadNext : longint; inline; function ReadNext(var dest; size : SizeInt) : Boolean; function ReadULEB128 : QWord; function ReadLEB128 : Int64; function ReadAddress(addr_size: smallint) : PtrUInt; {$ifdef CPUI8086} function ReadSegment() : Word; {$endif CPUI8086} function ReadString : ShortString; function ReadUHalf : Word; private function ReadNextBuffer : longint; end; procedure TEReader.Init; begin bufstart := 0; base := 0; limit := 0; bufp := pByte(buf); bufe := bufp; end; procedure TEReader.SetRange(aBase, aSize : Int64); begin base := aBase; limit := base + aSize; Seek(0); if limit < bufstart + (bufe - pByte(buf)) then begin bufe := pByte(buf) + (limit - bufstart); { Respect the limit if the buffer was reused. Probably unreachable, but just in case... 
} System.Seek(e.f, limit); end; end; function TEReader.Pos() : TFilePos; begin Pos := (bufstart - base) + (bufp - pByte(buf)); end; procedure TEReader.Seek(newIndex : Int64); var gpos : Int64; begin gpos := base + newIndex; if (gpos >= bufstart) and (gpos <= bufstart + (bufe - pByte(buf))) then bufp := pByte(buf) + (gpos - bufstart) { Reuse the buffer. } else begin bufstart := gpos; System.Seek(e.f, gpos); bufp := pByte(buf); bufe := bufp; end; end; { Returns the next Byte from the input stream, or -1 if there has been an error } function TEReader.ReadNext() : Longint; begin if (bufp = bufe) and (ReadNextBuffer <= 0) then exit(-1); ReadNext := bufp^; inc(bufp); end; { Reads the next size bytes into dest. Returns true if successful, false otherwise. Note that dest may be partially overwritten after returning false. dest = nil^ — skip size bytes. } function TEReader.ReadNext(var dest; size : SizeInt) : Boolean; var bytesread : SizeInt; d: PByte; begin d := @dest; while (size > 0) and ((bufp < bufe) or (ReadNextBuffer > 0)) do begin bytesread := bufe - bufp; if bytesread > size then bytesread := size; if Assigned(d) then begin Move(bufp^, d^, bytesread); inc(d, bytesread); end; inc(bufp, bytesread); dec(size, bytesread); end; ReadNext := size = 0; end; { Reads an unsigned LEB encoded number from the input stream } function TEReader.ReadULEB128() : QWord; var shift : cardinal; begin shift := 0; ReadULEB128 := 0; repeat if (bufp = bufe) and (ReadNextBuffer <= 0) then break; ReadULEB128 := ReadULEB128 or (QWord(bufp^ and $7f) shl shift); inc(bufp); inc(shift, 7); until ((bufp[-1] and $80) = 0); end; { Reads a signed LEB encoded number from the input stream } function TEReader.ReadLEB128() : Int64; var shift : cardinal; begin shift := 0; ReadLEB128 := 0; repeat if (bufp = bufe) and (ReadNextBuffer <= 0) then break; ReadLEB128 := ReadLEB128 or (Int64(bufp^ and $7f) shl shift); inc(bufp); inc(shift, 7); until ((bufp[-1] and $80) = 0); { extend sign. 
Note that we can not use shl/shr since the latter does not translate to arithmetic shifting for signed types } ReadLEB128 := (not ((ReadLEB128 and (Int64(1) shl (shift-1)))-1)) or ReadLEB128; end; { Reads an address from the current input stream } function TEReader.ReadAddress(addr_size: smallint) : PtrUInt; begin {$ifdef CPUI8086} ReadAddress := 0; if (addr_size = 4) or (addr_size = 2) then {$endif} ReadNext(ReadAddress, sizeof(ReadAddress)); end; {$ifdef CPUI8086} { Reads a segment from the current input stream } function TEReader.ReadSegment() : Word; begin ReadNext(ReadSegment, sizeof(ReadSegment)); end; {$endif CPUI8086} { Reads a zero-terminated string from the current input stream. If the string is larger than 255 chars (maximum allowed number of elements in a ShortString, excess characters will be chopped off. } function TEReader.ReadString() : ShortString; var nbufpart,zp,nmove : SizeInt; begin ReadString[0] := #0; repeat if (bufp = bufe) and (ReadNextBuffer <= 0) then exit(''); { unexpected end of file occurred } nbufpart := bufe - bufp; zp := IndexByte(bufp^, nbufpart, 0); { Search #0 in the available buffer. } if zp >= 0 then nbufpart := zp; { #0 found, copy up to it (otherwise copy the entire available buffer, and don’t end). } nmove := 255 - length(ReadString); if nmove <> 0 then begin if nmove > nbufpart then nmove := nbufpart; Move(bufp^, ReadString[1 + length(ReadString)], nmove); inc(byte(ReadString[0]), nmove); end; inc(bufp, nbufpart); until zp >= 0; inc(bufp); { Null terminator. 
} end; { Reads an unsigned Half from the current input stream } function TEReader.ReadUHalf() : Word; begin ReadNext(ReadUHalf, sizeof(ReadUHalf)); end; function TEReader.ReadNextBuffer : longint; begin inc(bufstart, bufp - pByte(buf)); ReadNextBuffer := limit - bufstart; if ReadNextBuffer > 0 then begin if ReadNextBuffer > length(buf) then ReadNextBuffer := length(buf); BlockRead(e.f, buf, ReadNextBuffer, ReadNextBuffer); end; bufp := pByte(buf); bufe := pByte(buf) + ReadNextBuffer; end; {--------------------------------------------------------------------------- Generic Dwarf lineinfo reader The line info reader is based on the information contained in DWARF Debugging Information Format Version 3 Chapter 6.2 "Line Number Information" from the DWARF Debugging Information Format Workgroup. For more information on this document see also http://dwarf.freestandards.org/ ---------------------------------------------------------------------------} { initializes the line info state to the default values } procedure InitStateRegisters(var state : TMachineState; const aIs_Stmt : Bool8); begin with state do begin address := 0; segment := 0; file_id := 1; line := 1; column := 0; is_stmt := aIs_Stmt; basic_block := false; end_sequence := false; prolouge_end := false; epilouge_begin := false; isa := 0; append_row := false; end; end; { Skips all line info directory entries } procedure SkipDirectories(var er: TEReader); var s : ShortString; begin while (true) do begin s := er.ReadString(); if (s = '') then break; DEBUG_WRITELN('Skipping directory : ', s); end; end; { Skips an LEB128 } procedure SkipLEB128(var er: TEReader); {$ifdef DEBUG_DWARF_PARSER} var temp : QWord; {$endif} begin {$ifdef DEBUG_DWARF_PARSER}temp := {$endif}er.ReadLEB128(); DEBUG_WRITELN('Skipping LEB128 : ', temp); end; { Skips the filename section from the current file stream } procedure SkipFilenames(var er: TEReader); var s : ShortString; begin while (true) do begin s := er.ReadString(); if (s = '') then 
break;
    DEBUG_WRITELN('Skipping filename : ', s);
    SkipLEB128(er); { skip the directory index for the file }
    SkipLEB128(er); { skip last modification time for file }
    SkipLEB128(er); { skip length of file }
  end;
end;

{ Returns the address advance encoded by a special opcode (or by
  DW_LNS_CONST_ADD_PC, which passes opcode 255):
    (opcode - opcode_base) div line_range * minimum_instruction_length
  Returns 0 when header.line_range is 0, because such a header is malformed
  and the division cannot be carried out. }
function CalculateAddressIncrement(opcode : Byte; const header : TLineNumberProgramHeader64) : Int64;
begin
  if header.line_range = 0 then
    begin
      CalculateAddressIncrement := 0;
      exit;
    end;
  CalculateAddressIncrement := (Int64(opcode) - header.opcode_base) div header.line_range * header.minimum_instruction_length;
end;

{ Builds "directory/filename" for entry number file_id of the file name table.
  filenameStart and directoryStart are reader positions (relative to the
  reader base) of the file name table and of the include directory table.
  Returns '(Unknown file)' when the table ends before entry file_id. }
function GetFullFilename(var er: TEReader; const filenameStart, directoryStart : Int64; const file_id : DWord) : ShortString;
var
  i : DWord;
  filename, directory : ShortString;
  dirindex : Int64;
begin
  filename := '';
  directory := '';
  i := 1;
  er.Seek(filenameStart);
  while (i <= file_id) do begin
    filename := er.ReadString();
    DEBUG_WRITELN('Found "', filename, '"');
    if (filename = '') then
      break;
    dirindex := er.ReadLEB128(); { read the directory index for the file }
    SkipLEB128(er); { skip last modification time for file }
    SkipLEB128(er); { skip length of file }
    inc(i);
  end;
  { if we could not find the file index, exit }
  if (filename = '') then begin
    GetFullFilename := '(Unknown file)';
    exit;
  end;

  { walk the directory table up to the index stored with the file entry }
  er.Seek(directoryStart);
  i := 1;
  while (i <= dirindex) do begin
    directory := er.ReadString();
    if (directory = '') then
      break;
    inc(i);
  end;
  if (directory<>'') and (directory[length(directory)]<>'/') then
    directory:=directory+'/';
  GetFullFilename := directory + filename;
end;


{ Runs the line number program of the compilation unit that starts at
  file_offset and looks for the row covering addr (and segment).

  On success found is set and source/line receive the file name and line of
  the row preceding the first row whose address is at or beyond addr.
  The result is always the file offset of the next unit
  (file_offset + length of this unit), whether or not a row was found.

  NOTE(review): the header records used here carry no
  maximum_operations_per_instruction field; confirm whether units with a
  line table version above 3 can reach this code. }
function ParseCompilationUnit(var er : TEReader; const addr : TOffset; const segment : TSegment; const file_offset : QWord;
  var source : String; var line : longint; var found : Boolean) : QWord;
var
  state : TMachineState;
  { we need both headers on the stack, although we only use the 64 bit one internally }
  header64 : TLineNumberProgramHeader64;
  header32 : TLineNumberProgramHeader32;

  adjusted_opcode : Int64;

  opcode : PtrInt;
  extended_opcode : PtrInt;
  extended_opcode_length : PtrInt;
  i, addrIncrement, lineIncrement : PtrInt;

{$ifdef DEBUG_DWARF_PARSER}
  s : ShortString;
{$endif}

  numoptable : array[1..255] of Byte;
  { the offset into the file where the include directories are stored for this compilation unit }
  include_directories : QWord;
  { the offset into the file where the file names are stored for this compilation unit }
  file_names : Int64;

  temp_length : DWord;
  unit_length : QWord;
  header_length : SizeInt;

  first_row : Boolean;

  prev_line : QWord;
  prev_file : DWord;

begin
  prev_line := 0;
  prev_file := 0;
  first_row := true;

  found := false;

  { an initial length of $ffffffff announces the 64 bit DWARF format }
  er.ReadNext(temp_length, sizeof(temp_length));
  if (temp_length <> $ffffffff) then begin
    unit_length := temp_length + sizeof(temp_length)
  end else begin
    er.ReadNext(unit_length, sizeof(unit_length));
    inc(unit_length, 12);
  end;

  ParseCompilationUnit := file_offset + unit_length;

  { confine the reader to this unit; this also rewinds it to the unit start }
  er.SetRange(file_offset, unit_length);

  DEBUG_WRITELN('Unit length: ', unit_length);
  if (temp_length <> $ffffffff) then begin
    DEBUG_WRITELN('32 bit DWARF detected');
    er.ReadNext(header32, sizeof(header32));
    header64.magic := $ffffffff;
    header64.unit_length := header32.unit_length;
    header64.version := header32.version;
    header64.length := header32.length;
    header64.minimum_instruction_length := header32.minimum_instruction_length;
    header64.default_is_stmt := header32.default_is_stmt;
    header64.line_base := header32.line_base;
    header64.line_range := header32.line_range;
    header64.opcode_base := header32.opcode_base;
    header_length :=
      sizeof(header32.length) + sizeof(header32.version) +
      sizeof(header32.unit_length);
  end else begin
    DEBUG_WRITELN('64 bit DWARF detected');
    er.ReadNext(header64, sizeof(header64));
    header_length :=
      sizeof(header64.magic) + sizeof(header64.version) +
      sizeof(header64.length) + sizeof(header64.unit_length);
  end;

  { header_length becomes the position of the first opcode }
  inc(header_length, header64.length);

  fillchar(numoptable, sizeof(numoptable), #0);
  er.ReadNext(numoptable, header64.opcode_base-1);
  DEBUG_WRITELN('Opcode parameter count table');
  for i := 1 to header64.opcode_base-1 do begin
    DEBUG_WRITELN('Opcode[', i, '] - ', numoptable[i], ' parameters');
  end;

  DEBUG_WRITELN('Reading directories...');
  include_directories := er.Pos();
  SkipDirectories(er);
  DEBUG_WRITELN('Reading filenames...');
  file_names := er.Pos();
  SkipFilenames(er);

  er.Seek(header_length);

  with header64 do begin
    InitStateRegisters(state, default_is_stmt);
  end;
  opcode := er.ReadNext();
  while (opcode <> -1) and (not found) do begin
    DEBUG_WRITELN('Next opcode: ');
    case (opcode) of
      { extended opcode }
      0 : begin
        extended_opcode_length := er.ReadULEB128();
        extended_opcode := er.ReadNext();
        case (extended_opcode) of
          -1: begin
            exit;
          end;
          DW_LNE_END_SEQUENCE : begin
            state.end_sequence := true;
            state.append_row := true;
            DEBUG_WRITELN('DW_LNE_END_SEQUENCE');
          end;
          DW_LNE_SET_ADDRESS : begin
            state.address := er.ReadAddress(extended_opcode_length-1);
            DEBUG_WRITELN('DW_LNE_SET_ADDRESS (', hexstr(state.address, sizeof(state.address)*2), ')');
          end;
{$ifdef CPUI8086}
          DW_LNE_SET_SEGMENT : begin
            state.segment := er.ReadSegment();
            DEBUG_WRITELN('DW_LNE_SET_SEGMENT (', hexstr(state.segment, sizeof(state.segment)*2), ')');
          end;
{$endif CPUI8086}
          DW_LNE_DEFINE_FILE : begin
            {$ifdef DEBUG_DWARF_PARSER}s := {$endif}er.ReadString();
            SkipLEB128(er);
            SkipLEB128(er);
            SkipLEB128(er);
            DEBUG_WRITELN('DW_LNE_DEFINE_FILE (', s, ')');
          end;
          else begin
            DEBUG_WRITELN('Unknown extended opcode (opcode ', extended_opcode, ' length ', extended_opcode_length, ')');
            { skip the operand bytes of the opcode we do not understand }
            if (extended_opcode_length>1) and
              not er.ReadNext(nil^, extended_opcode_length-1) then
              exit;
          end;
        end;
      end;
      DW_LNS_COPY : begin
        state.basic_block := false;
        state.prolouge_end := false;
        state.epilouge_begin := false;
        state.append_row := true;
        DEBUG_WRITELN('DW_LNS_COPY');
      end;
      DW_LNS_ADVANCE_PC : begin
        inc(state.address, er.ReadULEB128() * header64.minimum_instruction_length);
        DEBUG_WRITELN('DW_LNS_ADVANCE_PC (', hexstr(state.address, sizeof(state.address)*2), ')');
      end;
      DW_LNS_ADVANCE_LINE : begin
        { not inc(state.line, ReadLEB128()): negative values are allowed
          but those may generate a range check error }
        state.line := state.line + er.ReadLEB128();
        DEBUG_WRITELN('DW_LNS_ADVANCE_LINE (', state.line, ')');
      end;
      DW_LNS_SET_FILE : begin
        state.file_id := er.ReadULEB128();
        DEBUG_WRITELN('DW_LNS_SET_FILE (', state.file_id, ')');
      end;
      DW_LNS_SET_COLUMN : begin
        state.column := er.ReadULEB128();
        DEBUG_WRITELN('DW_LNS_SET_COLUMN (', state.column, ')');
      end;
      DW_LNS_NEGATE_STMT : begin
        state.is_stmt := not state.is_stmt;
        DEBUG_WRITELN('DW_LNS_NEGATE_STMT (', state.is_stmt, ')');
      end;
      DW_LNS_SET_BASIC_BLOCK : begin
        state.basic_block := true;
        DEBUG_WRITELN('DW_LNS_SET_BASIC_BLOCK');
      end;
      DW_LNS_CONST_ADD_PC : begin
        inc(state.address, CalculateAddressIncrement(255, header64));
        DEBUG_WRITELN('DW_LNS_CONST_ADD_PC (', hexstr(state.address, sizeof(state.address)*2), ')');
      end;
      DW_LNS_FIXED_ADVANCE_PC : begin
        inc(state.address, er.ReadUHalf());
        DEBUG_WRITELN('DW_LNS_FIXED_ADVANCE_PC (', hexstr(state.address, sizeof(state.address)*2), ')');
      end;
      DW_LNS_SET_PROLOGUE_END : begin
        state.prolouge_end := true;
        DEBUG_WRITELN('DW_LNS_SET_PROLOGUE_END');
      end;
      DW_LNS_SET_EPILOGUE_BEGIN : begin
        state.epilouge_begin := true;
        DEBUG_WRITELN('DW_LNS_SET_EPILOGUE_BEGIN');
      end;
      DW_LNS_SET_ISA : begin
        state.isa := er.ReadULEB128();
        DEBUG_WRITELN('DW_LNS_SET_ISA (', state.isa, ')');
      end;
      else begin { special opcode }
        if (opcode < header64.opcode_base) then begin
          DEBUG_WRITELN('Unknown standard opcode $', hexstr(opcode, 2), '; skipping');
          for i := 1 to numoptable[opcode] do
            SkipLEB128(er);
        end else begin
          { decoding a special opcode divides by line_range; a header with
            line_range = 0 is malformed, so give up on this unit rather
            than run into a division by zero }
          if header64.line_range = 0 then
            exit;
          adjusted_opcode := opcode - header64.opcode_base;
          addrIncrement := CalculateAddressIncrement(opcode, header64);
          inc(state.address, addrIncrement);
          lineIncrement := header64.line_base + (adjusted_opcode mod header64.line_range);
          inc(state.line, lineIncrement);
          DEBUG_WRITELN('Special opcode $', hexstr(opcode, 2), ' address increment: ', addrIncrement, ' new line: ', lineIncrement);
          state.basic_block := false;
          state.prolouge_end := false;
          state.epilouge_begin := false;
          state.append_row := true;
        end;
      end;
    end;

    if (state.append_row) then begin
      DEBUG_WRITELN('Current state : address = ', hexstr(state.address, sizeof(state.address) * 2),
{$ifdef CPUI8086}
      DEBUG_COMMENT ' segment = ', hexstr(state.segment, sizeof(state.segment) * 2),
{$endif CPUI8086}
      DEBUG_COMMENT ' file_id = ', state.file_id, ' line = ', state.line, ' column = ', state.column,
      DEBUG_COMMENT ' is_stmt = ', state.is_stmt, ' basic_block = ', state.basic_block,
      DEBUG_COMMENT ' end_sequence = ', state.end_sequence, ' prolouge_end = ', state.prolouge_end,
      DEBUG_COMMENT ' epilouge_begin = ', state.epilouge_begin, ' isa = ', state.isa);

      { stop scanning this unit when the first row of a sequence already
        lies beyond the address we are looking for }
      if (first_row) then begin
        if (state.segment > segment) or
           ((state.segment = segment) and
            (state.address > addr)) then
          break;
        first_row := false;
      end;

      { when we have found the address we need to return the previous
        line because that contains the call instruction
        Note that there may not be any call instruction, because this may
        be the actual instruction that crashed, and it may be on the first
        line of the function }
      if (state.segment > segment) or
         ((state.segment = segment) and
          (state.address >= addr)) then
        found:=true
      else
        begin
          { save line information }
          prev_file := state.file_id;
          prev_line := state.line;
        end;

      state.append_row := false;
      if (state.end_sequence) then begin
        InitStateRegisters(state, header64.default_is_stmt);
        first_row := true;
      end;
    end;

    opcode := er.ReadNext();
  end;

  if (found) then
    begin
      { can happen if the crash happens on the first instruction with line info }
      if prev_line = 0 then
        begin
          prev_line := state.line;
          prev_file := state.file_id;
        end;
      line := prev_line;
      source := GetFullFilename(er, file_names, include_directories, prev_file);
    end;
end;


type
  { Abbreviation table of one compilation unit, indexed by abbreviation code }
  TAbbrevs = record
    Tags : array of QWord;
    Children : array of Byte;
    Attrs : array of array of record attr,form : QWord; end;
  end;

procedure ReadAbbrevTable(var er: TEReader; var abbrevs: TAbbrevs);
var
  i : PtrInt;
  tag, nr, attr, form : Int64;
begin
  DEBUG_WRITELN('Starting to read abbrev.
section at $',hexstr(Dwarf_Debug_Abbrev_Section_Offset+er.Pos,16));
  repeat
    nr:=er.ReadULEB128;
    { 0 ends the table. Codes of 2^63 and above wrap to negative values in
      the Int64 and can not be used as array indexes, so stop on those too. }
    if nr<=0 then
      break;

    { grow the tables with some headroom so they are not resized per entry }
    if nr>high(abbrevs.Tags) then
      begin
        SetLength(abbrevs.Tags,SizeUint(nr)+128+SizeUint(nr) div 4);
        SetLength(abbrevs.Attrs,length(abbrevs.Tags));
        SetLength(abbrevs.Children,length(abbrevs.Tags));
      end;

    { read tag }
    tag:=er.ReadULEB128;
    abbrevs.Tags[nr]:=tag;
    DEBUG_WRITELN('Abbrev ',nr,' at offset ',er.Pos,' has tag $',hexstr(tag,4));
    { read flag for children }
    abbrevs.Children[nr]:=er.ReadNext;
    i:=0;
    { ensure that length(Abbrev_Attrs)=0 if an entry is overwritten (not sure
      if this will ever happen) and the new entry has no attributes }
    abbrevs.Attrs[nr]:=nil;
    { attribute/form pairs follow until a pair with attribute 0 }
    repeat
      attr:=er.ReadULEB128;
      form:=er.ReadULEB128;
      if attr<>0 then
        begin
          SetLength(abbrevs.Attrs[nr],i+1);
          abbrevs.Attrs[nr][i].attr:=attr;
          abbrevs.Attrs[nr][i].form:=form;
        end;
      inc(i);
    until attr=0;
    DEBUG_WRITELN('Abbrev ',nr,' has ',Length(abbrevs.Attrs[nr]),' attributes');
  until false;
end;


{ Scans the .debug_aranges unit starting at file_offset for an address range
  that contains addr (and segment).

  When one is found, found is set and debug_info_offset receives the
  debug_info_offset field of the unit header. The result is always the file
  offset of the next unit (file_offset + length of this unit).

  The scan ends at the all-zero terminating tuple, or when the unit has no
  bytes left, so a table without terminator can not keep the loop running. }
function ParseCompilationUnitForDebugInfoOffset(var er: TEReader; const addr : TOffset; const segment : TSegment; const file_offset : QWord;
  var debug_info_offset : QWord; var found : Boolean) : QWord;
{$ifndef CPUI8086}
const
  arange_segment = 0;
{$endif CPUI8086}
var
  { we need both headers on the stack, although we only use the 64 bit one internally }
  header64 : TDebugArangesHeader64;
  header32 : TDebugArangesHeader32;

  temp_length : DWord;
  unit_length : QWord;
{$ifdef CPUI8086}
  arange_start, arange_size: DWord;
  arange_segment: Word;
{$else CPUI8086}
  arange_start, arange_size: PtrUInt;
{$endif CPUI8086}
begin
  found := false;

  { an initial length of $ffffffff announces the 64 bit DWARF format }
  er.ReadNext(temp_length, sizeof(temp_length));
  if (temp_length <> $ffffffff) then begin
    unit_length := temp_length + sizeof(temp_length)
  end else begin
    er.ReadNext(unit_length, sizeof(unit_length));
    inc(unit_length, 12);
  end;

  ParseCompilationUnitForDebugInfoOffset := file_offset + unit_length;

  { confine the reader to this unit; this also rewinds it to the unit start }
  er.SetRange(file_offset, unit_length);

  DEBUG_WRITELN('Unit length: ', unit_length);
  if (temp_length <> $ffffffff) then begin
    DEBUG_WRITELN('32 bit DWARF detected');
    er.ReadNext(header32, sizeof(header32));
    header64.magic := $ffffffff;
    header64.unit_length := header32.unit_length;
    header64.version := header32.version;
    header64.debug_info_offset := header32.debug_info_offset;
    header64.address_size := header32.address_size;
    header64.segment_size := header32.segment_size;
  end else begin
    DEBUG_WRITELN('64 bit DWARF detected');
    er.ReadNext(header64, sizeof(header64));
  end;

  DEBUG_WRITELN('debug_info_offset: ',header64.debug_info_offset);
  DEBUG_WRITELN('address_size: ', header64.address_size);
  DEBUG_WRITELN('segment_size: ', header64.segment_size);

  repeat
    { nothing left in this unit: the table is truncated or lacks its terminator }
    if er.Pos >= er.limit - er.base then
      break;

    arange_start:=er.ReadAddress(header64.address_size);
{$ifdef CPUI8086}
    arange_segment:=er.ReadSegment();
{$endif CPUI8086}
    arange_size:=er.ReadAddress(header64.address_size);

    { an all-zero tuple terminates the table }
    if (arange_start=0) and (arange_segment=0) and (arange_size=0) then
      break;

    if (segment=arange_segment) and (addr>=arange_start) and (addr<=arange_start+arange_size) then
      begin
        found:=true;
        debug_info_offset:=header64.debug_info_offset;
        DEBUG_WRITELN('Matching aranges entry $',hexStr(arange_start,header64.address_size*2),', $',hexStr(arange_size,header64.address_size*2));
      end;
  until found;
end;


function ParseCompilationUnitForFunctionName(var er: TEReader; const addr : TOffset; const segment : TSegment; const file_offset : QWord;
  var func : String; var found : Boolean) : QWord;
var
  { we need both headers on the stack, although we only use the 64 bit one internally }
  header64 : TDebugInfoProgramHeader64;
  header32 : TDebugInfoProgramHeader32;
  isdwarf64 : boolean;
  abbrev,
  high_pc,
  low_pc : QWord;
  temp_length : DWord;
  unit_length : QWord;
  name : String;
  level : Integer;

procedure SkipAttr(var er: TEReader; form : QWord);
  var
    dl,nskip : dword;
  begin
    nskip := 0;
    case form of
DW_FORM_addr: nskip := header64.address_size; DW_FORM_block2: nskip := er.ReadUHalf; DW_FORM_block4: begin er.ReadNext(dl,SizeOf(dl)); nskip := dl; end; DW_FORM_data2, DW_FORM_data4, DW_FORM_data8: nskip := 2 shl (form - DW_FORM_data2); DW_FORM_string: er.ReadString; DW_FORM_block, DW_FORM_exprloc: nskip := er.ReadULEB128; DW_FORM_block1: nskip := er.ReadNext; DW_FORM_data1, DW_FORM_flag: er.ReadNext; DW_FORM_sdata: er.ReadLEB128; DW_FORM_ref_addr: { the size of DW_FORM_ref_addr changed between DWAWRF2 and later versions: in DWARF2 it depends on the architecture address size, in later versions on the DWARF type (32 bit/64 bit) } if header64.version>2 then begin if isdwarf64 then nskip := 8 else nskip := 4; end else begin { address size for DW_FORM_ref_addr must be at least 32 bits } { this is compatible with Open Watcom on i8086 } if header64.address_size<4 then nskip := 4 else nskip := header64.address_size; end; DW_FORM_strp, DW_FORM_sec_offset: if isdwarf64 then nskip := 8 else nskip := 4; DW_FORM_udata: er.ReadULEB128; DW_FORM_ref1, DW_FORM_ref2, DW_FORM_ref4, DW_FORM_ref8: nskip := 1 shl (form - DW_FORM_ref1); DW_FORM_ref_udata: er.ReadULEB128; DW_FORM_indirect: SkipAttr(er, er.ReadULEB128); DW_FORM_flag_present: {none}; else begin writeln(stderr,'Internal error: unknown dwarf form: $',hexstr(form,2)); nskip := 1; end; end; er.ReadNext(nil^, nskip); end; var i : PtrInt; prev_base,prev_size,prev_pos : TFilePos; abbrevs : TAbbrevs; begin found := false; er.ReadNext(temp_length, sizeof(temp_length)); if (temp_length <> $ffffffff) then begin unit_length := temp_length + sizeof(temp_length) end else begin er.ReadNext(unit_length, sizeof(unit_length)); inc(unit_length, 12); end; ParseCompilationUnitForFunctionName := file_offset + unit_length; er.SetRange(file_offset, unit_length); DEBUG_WRITELN('Unit length: ', unit_length); if (temp_length <> $ffffffff) then begin DEBUG_WRITELN('32 bit DWARF detected'); er.ReadNext(header32, sizeof(header32)); header64.magic := 
$ffffffff; header64.unit_length := header32.unit_length; header64.version := header32.version; header64.debug_abbrev_offset := header32.debug_abbrev_offset; header64.address_size := header32.address_size; isdwarf64:=false; end else begin DEBUG_WRITELN('64 bit DWARF detected'); er.ReadNext(header64, sizeof(header64)); isdwarf64:=true; end; DEBUG_WRITELN('debug_abbrev_offset: ',header64.debug_abbrev_offset); DEBUG_WRITELN('address_size: ',header64.address_size); { not nice, but we have to read the abbrev section after the start of the debug_info section has been read } prev_size:=er.limit-er.base; prev_base:=er.base; prev_pos:=er.Pos; er.SetRange(Dwarf_Debug_Abbrev_Section_Offset+header64.debug_abbrev_offset,Dwarf_Debug_Abbrev_Section_Size); ReadAbbrevTable(er, abbrevs); { restore previous reading state and position } er.SetRange(prev_base,prev_size); er.Seek(prev_pos); abbrev:=er.ReadULEB128; level:=0; while (abbrev <> 0) and (not found) do begin DEBUG_WRITELN('Next abbrev: ',abbrev); if abbrevs.Children[abbrev]<>0 then inc(level); { DW_TAG_subprogram? 
} if abbrevs.Tags[abbrev]=$2e then begin low_pc:=1; high_pc:=0; name:=''; for i:=0 to high(abbrevs.Attrs[abbrev]) do begin { DW_AT_low_pc } if (abbrevs.Attrs[abbrev][i].attr=$11) and (abbrevs.Attrs[abbrev][i].form=DW_FORM_addr) then begin low_pc:=0; er.ReadNext(low_pc,header64.address_size); end { DW_AT_high_pc } else if (abbrevs.Attrs[abbrev][i].attr=$12) and (abbrevs.Attrs[abbrev][i].form=DW_FORM_addr) then begin high_pc:=0; er.ReadNext(high_pc,header64.address_size); end { DW_AT_name } else if (abbrevs.Attrs[abbrev][i].attr=$3) and { avoid that we accidently read an DW_FORM_strp entry accidently } (abbrevs.Attrs[abbrev][i].form=DW_FORM_string) then begin name:=er.ReadString; end else SkipAttr(er, abbrevs.Attrs[abbrev][i].form); end; DEBUG_WRITELN('Got DW_TAG_subprogram with low pc = $',hexStr(low_pc,header64.address_size*2),', high pc = $',hexStr(high_pc,header64.address_size*2),', name = ',name); if (addr>low_pc) and (addr0) and (abbrev=0) do begin dec(level); abbrev:=er.ReadULEB128; end; end; end;
{ NOTE(review): the line above is the tail of ParseCompilationUnitForFunctionName,
  kept exactly as it was found. Its address range test looks truncated by
  text extraction - verify it against the upstream source. }

const
  { Number of slots in the line info cache.
    64 bit and 32 bit CPUs tend to have more memory }
{$if defined(CPU64)}
  LineInfoCacheLength = 2039;
{$elseif defined(CPU32)}
  LineInfoCacheLength = 251;
{$else}
  LineInfoCacheLength = 1;
{$endif CPU64}

var
  { Cache of earlier GetLineInfo results. The slot is selected with
    "addr mod LineInfoCacheLength"; the addr field holds the address exactly
    as the caller passed it to GetLineInfo. }
  LineInfoCache : array[0..LineInfoCacheLength-1] of
    record
      addr : codeptruint;
      func,
      source : string;
      line : longint;
    end;


{ Looks up function name, source file name and line number for a code address.

  addr   : code address as seen by the running program
  func   : receives the function name, '' when none was found
  source : receives the source file name, '' when none was found
  line   : receives the line number; left untouched when nothing sets it

  Returns false only when OpenDwarf fails. In every other case the result is
  true, even when func and source stay empty, and the outcome is stored in
  LineInfoCache. }
function GetLineInfo(addr : codeptruint; var func, source : string; var line : longint) : boolean;
var
  current_offset,
  end_offset, debug_info_offset_from_aranges : QWord;
  segment : Word = 0;

  found, found_aranges : Boolean;
  CacheIndex: CodePtrUInt;
  { the address exactly as passed in; addr itself is relocated further down }
  CacheKey: CodePtrUInt;
  er: TEReader;

begin
  func := '';
  source := '';
  GetLineInfo:=false;

  { Remember the caller's address before it gets modified. The cache must be
    filled with the same value that is compared here, otherwise lookups never
    hit as soon as e.processaddress is not zero. }
  CacheKey:=addr;
  CacheIndex:=CacheKey mod LineInfoCacheLength;

  if LineInfoCache[CacheIndex].addr=CacheKey then
    begin
      func:=LineInfoCache[CacheIndex].func;
      source:=LineInfoCache[CacheIndex].source;
      line:=LineInfoCache[CacheIndex].line;
      GetLineInfo:=true;
      exit;
    end;

  if not OpenDwarf(codepointer(addr)) then
    exit;

{$ifdef CPUI8086}
{$if defined(FPC_MM_MEDIUM) or defined(FPC_MM_LARGE) or defined(FPC_MM_HUGE)}
  segment := (addr shr 16) - e.processsegment;
  addr := Word(addr);
{$else}
  segment := CSeg - e.processsegment;
{$endif}
{$endif CPUI8086}

  { from here on addr is relative to the load address of the module }
  addr := addr - e.processaddress;

  { pass 1: source file and line number from .debug_line }
  current_offset := Dwarf_Debug_Line_Section_Offset;
  end_offset := Dwarf_Debug_Line_Section_Offset + Dwarf_Debug_Line_Section_Size;

  er.Init;
  found := false;
  while (current_offset < end_offset) and (not found) do
    begin
      er.SetRange(current_offset, end_offset - current_offset);
      current_offset := ParseCompilationUnit(er, addr, segment, current_offset,
        source, line, found);
    end;

  { pass 2: ask .debug_aranges which .debug_info unit covers the address }
  current_offset := Dwarf_Debug_Aranges_Section_Offset;
  end_offset := Dwarf_Debug_Aranges_Section_Offset + Dwarf_Debug_Aranges_Section_Size;

  found_aranges := false;
  while (current_offset < end_offset) and (not found_aranges) do
    begin
      er.SetRange(current_offset, end_offset - current_offset);
      current_offset := ParseCompilationUnitForDebugInfoOffset(er, addr, segment, current_offset, debug_info_offset_from_aranges, found_aranges);
    end;

  { no function name found yet }
  found := false;

  { Every DEBUG_WRITELN below sits inside its own begin/end pair on purpose:
    in non-debug builds the macro expands to a line comment, and a bare
    "else DEBUG_WRITELN(...)" would make the else branch swallow the next
    statement. }
  if found_aranges then
    begin
      DEBUG_WRITELN('Found .debug_info offset $',hexstr(debug_info_offset_from_aranges,8),' from .debug_aranges');
      current_offset := Dwarf_Debug_Info_Section_Offset + debug_info_offset_from_aranges;
      { the readable range ends where the section ends, independent of the
        unit offset we start at }
      end_offset := Dwarf_Debug_Info_Section_Offset + Dwarf_Debug_Info_Section_Size;

      { ignore offsets that point outside of .debug_info }
      if current_offset < end_offset then
        begin
          DEBUG_WRITELN('Reading .debug_info at section offset $',hexStr(current_offset-Dwarf_Debug_Info_Section_Offset,16));

          er.SetRange(current_offset, end_offset - current_offset);
          current_offset := ParseCompilationUnitForFunctionName(er, addr, segment, current_offset, func, found);
          if found then
            begin
              DEBUG_WRITELN('Found .debug_info entry by using .debug_aranges information');
            end;
        end;
    end
  else
    begin
      DEBUG_WRITELN('No .debug_info offset found from .debug_aranges');
    end;

  { pass 3 (fallback): scan all of .debug_info from its start }
  current_offset := Dwarf_Debug_Info_Section_Offset;
  end_offset := Dwarf_Debug_Info_Section_Offset + Dwarf_Debug_Info_Section_Size;

  while (current_offset < end_offset) and (not found) do
    begin
      DEBUG_WRITELN('Reading .debug_info at section offset $',hexStr(current_offset-Dwarf_Debug_Info_Section_Offset,16));

      er.SetRange(current_offset, end_offset - current_offset);
      current_offset := ParseCompilationUnitForFunctionName(er, addr, segment, current_offset, func, found);
    end;

  if not AllowReuseOfLineInfoData then
    CloseDwarf;

  { store under the unmodified address so that the lookup above can hit }
  LineInfoCache[CacheIndex].addr:=CacheKey;
  LineInfoCache[CacheIndex].func:=func;
  LineInfoCache[CacheIndex].source:=source;
  LineInfoCache[CacheIndex].line:=line;

  GetLineInfo:=true;
end;


{ Backtrace formatter installed into BackTraceStrFunc by this unit.

  The result always starts with the address in hex. When GetLineInfo succeeds,
  the function name and/or "line N of <source>" are appended, depending on
  which of them are known. }
function DwarfBackTraceStr(addr: CodePointer): shortstring;
var
  func,
  source : string;
  hs     : string;
  line   : longint;
  Store  : TBackTraceStrFunc;
  Success : boolean;
begin
  {$ifdef DEBUG_LINEINFO}
  writeln(stderr,'DwarfBackTraceStr called');
  {$endif DEBUG_LINEINFO}
  { reset to prevent infinite recursion if problems inside the code }
  Store := BackTraceStrFunc;
  BackTraceStrFunc := @SysBackTraceStr;
  { GetLineInfo does not assign line on every path }
  line := 0;
  Success:=GetLineInfo(codeptruint(addr), func, source, line);
  { create string }
  DwarfBackTraceStr :='  $' + HexStr(addr);
  if Success then
  begin
    if func<>'' then
      DwarfBackTraceStr := DwarfBackTraceStr + '  ' + func;
    if source<>'' then
    begin
      if func<>'' then
        DwarfBackTraceStr := DwarfBackTraceStr + ', ';
      if line<>0 then
      begin
        str(line, hs);
        DwarfBackTraceStr := DwarfBackTraceStr + ' line ' + hs;
      end;
      DwarfBackTraceStr := DwarfBackTraceStr + ' of ' + source;
    end;
  end;
  { put the previously installed formatter back }
  BackTraceStrFunc := Store;
end;


initialization
  lastfilename := '';
  lastopendwarf := false;
  BackTraceStrFunc := @DwarfBacktraceStr;

finalization
  CloseDwarf;

end.