dwarf: fixup integer overflow in readEhPointer

debug: handle the possibility of eh_frame / debug_frame being mapped in memory or loaded from disk
This commit is contained in:
kcbanner 2023-07-16 02:00:17 -04:00
parent 5e399d97d7
commit 618b0eb3d3
3 changed files with 66 additions and 37 deletions

View File

@ -1253,14 +1253,12 @@ pub const Coff = struct {
return null; return null;
} }
pub fn getSectionData(self: *const Coff, comptime name: []const u8) ![]const u8 { pub fn getSectionData(self: *const Coff, sec: *align(1) const SectionHeader) []const u8 {
const sec = self.getSectionByName(name) orelse return error.MissingCoffSection;
return self.data[sec.pointer_to_raw_data..][0..sec.virtual_size]; return self.data[sec.pointer_to_raw_data..][0..sec.virtual_size];
} }
// Return an owned slice full of the section data pub fn getSectionDataAlloc(self: *const Coff, sec: *align(1) const SectionHeader, allocator: mem.Allocator) ![]u8 {
pub fn getSectionDataAlloc(self: *const Coff, comptime name: []const u8, allocator: mem.Allocator) ![]u8 { const section_data = self.getSectionData(sec);
const section_data = try self.getSectionData(name);
return allocator.dupe(u8, section_data); return allocator.dupe(u8, section_data);
} }
}; };

View File

@ -987,23 +987,19 @@ fn readCoffDebugInfo(allocator: mem.Allocator, coff_obj: *coff.Coff) !ModuleDebu
.debug_data = undefined, .debug_data = undefined,
}; };
if (coff_obj.getSectionByName(".debug_info")) |sec| { if (coff_obj.getSectionByName(".debug_info")) |_| {
// This coff file has embedded DWARF debug info // This coff file has embedded DWARF debug info
_ = sec;
var sections: DW.DwarfInfo.SectionArray = DW.DwarfInfo.null_section_array; var sections: DW.DwarfInfo.SectionArray = DW.DwarfInfo.null_section_array;
errdefer for (sections) |section| if (section) |s| if (s.owned) allocator.free(s.data); errdefer for (sections) |section| if (section) |s| if (s.owned) allocator.free(s.data);
inline for (@typeInfo(DW.DwarfSection).Enum.fields, 0..) |section, i| { inline for (@typeInfo(DW.DwarfSection).Enum.fields, 0..) |section, i| {
sections[i] = if (coff_obj.getSectionDataAlloc("." ++ section.name, allocator)) |data| blk: { sections[i] = if (coff_obj.getSectionByName("." ++ section.name)) |section_header| blk: {
break :blk .{ break :blk .{
.data = data, .data = try coff_obj.getSectionDataAlloc(section_header, allocator),
.virtual_address = section_header.virtual_address,
.owned = true, .owned = true,
}; };
} else |err| blk: { } else null;
if (err == error.MissingCoffSection) break :blk null;
return err;
};
} }
var dwarf = DW.DwarfInfo{ var dwarf = DW.DwarfInfo{
@ -1012,7 +1008,7 @@ fn readCoffDebugInfo(allocator: mem.Allocator, coff_obj: *coff.Coff) !ModuleDebu
.is_macho = false, .is_macho = false,
}; };
try DW.openDwarfDebugInfo(&dwarf, allocator, coff_obj.data); try DW.openDwarfDebugInfo(&dwarf, allocator);
di.debug_data = PdbOrDwarf{ .dwarf = dwarf }; di.debug_data = PdbOrDwarf{ .dwarf = dwarf };
return di; return di;
} }
@ -1049,6 +1045,10 @@ fn chopSlice(ptr: []const u8, offset: u64, size: u64) error{Overflow}![]const u8
return ptr[start..end]; return ptr[start..end];
} }
/// Reads debug info from an ELF file, or the current binary if none in specified.
/// If the required sections aren't present but a reference to external debug info is,
/// then this this function will recurse to attempt to load the debug sections from
/// an external file.
pub fn readElfDebugInfo( pub fn readElfDebugInfo(
allocator: mem.Allocator, allocator: mem.Allocator,
elf_filename: ?[]const u8, elf_filename: ?[]const u8,
@ -1146,10 +1146,12 @@ pub fn readElfDebugInfo(
break :blk .{ break :blk .{
.data = decompressed_section, .data = decompressed_section,
.virtual_address = shdr.sh_addr,
.owned = true, .owned = true,
}; };
} else .{ } else .{
.data = section_bytes, .data = section_bytes,
.virtual_address = shdr.sh_addr,
.owned = false, .owned = false,
}; };
} }
@ -1232,7 +1234,7 @@ pub fn readElfDebugInfo(
.is_macho = false, .is_macho = false,
}; };
try DW.openDwarfDebugInfo(&di, allocator, parent_mapped_mem orelse mapped_mem); try DW.openDwarfDebugInfo(&di, allocator);
return ModuleDebugInfo{ return ModuleDebugInfo{
.base_address = undefined, .base_address = undefined,
@ -1900,6 +1902,10 @@ pub const DebugInfo = struct {
obj_di.* = try readElfDebugInfo(self.allocator, if (ctx.name.len > 0) ctx.name else null, ctx.build_id, null, &sections, null); obj_di.* = try readElfDebugInfo(self.allocator, if (ctx.name.len > 0) ctx.name else null, ctx.build_id, null, &sections, null);
obj_di.base_address = ctx.base_address; obj_di.base_address = ctx.base_address;
// TODO: Don't actually scan everything, search on demand
// Missing unwind info isn't treated as a failure, as the unwinder will fall back to FP-based unwinding
obj_di.dwarf.scanAllUnwindInfo(self.allocator, ctx.base_address) catch {};
try self.address_map.putNoClobber(ctx.base_address, obj_di); try self.address_map.putNoClobber(ctx.base_address, obj_di);
return obj_di; return obj_di;
@ -2004,11 +2010,12 @@ pub const ModuleDebugInfo = switch (native_os) {
inline for (@typeInfo(DW.DwarfSection).Enum.fields, 0..) |section, i| { inline for (@typeInfo(DW.DwarfSection).Enum.fields, 0..) |section, i| {
if (mem.eql(u8, "__" ++ section.name, sect.sectName())) section_index = i; if (mem.eql(u8, "__" ++ section.name, sect.sectName())) section_index = i;
} }
if (section_index == null or sections[section_index.?] != null) continue; if (section_index == null) continue;
const section_bytes = try chopSlice(mapped_mem, sect.offset, sect.size); const section_bytes = try chopSlice(mapped_mem, sect.offset, sect.size);
sections[section_index.?] = .{ sections[section_index.?] = .{
.data = section_bytes, .data = section_bytes,
.virtual_address = sect.addr,
.owned = false, .owned = false,
}; };
} }
@ -2026,9 +2033,11 @@ pub const ModuleDebugInfo = switch (native_os) {
.is_macho = true, .is_macho = true,
}; };
// TODO: Don't actually need to scan unwind info in this case, since __unwind_info points us to the entries try DW.openDwarfDebugInfo(&di, allocator);
// TODO: Don't actually scan everything, search on demand
di.scanAllUnwindInfo(allocator, self.base_address) catch {};
try DW.openDwarfDebugInfo(&di, allocator, mapped_mem);
var info = OFileInfo{ var info = OFileInfo{
.di = di, .di = di,
.addr_table = addr_table, .addr_table = addr_table,

View File

@ -663,7 +663,22 @@ pub const DwarfSection = enum {
pub const DwarfInfo = struct { pub const DwarfInfo = struct {
pub const Section = struct { pub const Section = struct {
data: []const u8, data: []const u8,
// Module-relative virtual address.
// Only set if the section data was loaded from disk.
virtual_address: ?usize = null,
// If `data` is owned by this DwarfInfo.
owned: bool, owned: bool,
// For sections that are not memory mapped by the loader, this is an offset
// from `data.ptr` to where the section would have been mapped. Otherwise,
// `data` is directly backed by the section and the offset is zero.
pub fn virtualOffset(self: Section, base_address: usize) i64 {
return if (self.virtual_address) |va|
@as(i64, @intCast(base_address + va)) -
@as(i64, @intCast(@intFromPtr(self.data.ptr)))
else
0;
}
}; };
const num_sections = std.enums.directEnumArrayLen(DwarfSection, 0); const num_sections = std.enums.directEnumArrayLen(DwarfSection, 0);
@ -690,6 +705,10 @@ pub const DwarfInfo = struct {
return if (di.sections[@intFromEnum(dwarf_section)]) |s| s.data else null; return if (di.sections[@intFromEnum(dwarf_section)]) |s| s.data else null;
} }
pub fn sectionVirtualOffset(di: DwarfInfo, dwarf_section: DwarfSection, base_address: usize) ?i64 {
return if (di.sections[@intFromEnum(dwarf_section)]) |s| s.virtualOffset(base_address) else null;
}
pub fn deinit(di: *DwarfInfo, allocator: mem.Allocator) void { pub fn deinit(di: *DwarfInfo, allocator: mem.Allocator) void {
for (di.sections) |opt_section| { for (di.sections) |opt_section| {
if (opt_section) |s| if (s.owned) allocator.free(s.data); if (opt_section) |s| if (s.owned) allocator.free(s.data);
@ -1540,7 +1559,12 @@ pub const DwarfInfo = struct {
}; };
} }
pub fn scanAllUnwindInfo(di: *DwarfInfo, allocator: mem.Allocator, binary_mem: []const u8) !void { /// If .eh_frame_hdr is present, then only the header needs to be parsed.
///
/// Otherwise, .eh_frame and .debug_frame are scanned and a sorted list
/// of FDEs is built. In this case, the decoded PC ranges in the FDEs
/// are all normalized to be relative to the module's base.
pub fn scanAllUnwindInfo(di: *DwarfInfo, allocator: mem.Allocator, base_address: usize) !void {
if (di.section(.eh_frame_hdr)) |eh_frame_hdr| blk: { if (di.section(.eh_frame_hdr)) |eh_frame_hdr| blk: {
var stream = io.fixedBufferStream(eh_frame_hdr); var stream = io.fixedBufferStream(eh_frame_hdr);
const reader = stream.reader(); const reader = stream.reader();
@ -1582,15 +1606,15 @@ pub const DwarfInfo = struct {
const frame_sections = [2]DwarfSection{ .eh_frame, .debug_frame }; const frame_sections = [2]DwarfSection{ .eh_frame, .debug_frame };
for (frame_sections) |frame_section| { for (frame_sections) |frame_section| {
if (di.section(frame_section)) |eh_frame| { if (di.section(frame_section)) |section_data| {
var stream = io.fixedBufferStream(eh_frame); var stream = io.fixedBufferStream(section_data);
while (stream.pos < stream.buffer.len) { while (stream.pos < stream.buffer.len) {
const entry_header = try EntryHeader.read(&stream, frame_section, di.endian); const entry_header = try EntryHeader.read(&stream, frame_section, di.endian);
switch (entry_header.type) { switch (entry_header.type) {
.cie => { .cie => {
const cie = try CommonInformationEntry.parse( const cie = try CommonInformationEntry.parse(
entry_header.entry_bytes, entry_header.entry_bytes,
-@as(i64, @intCast(@intFromPtr(binary_mem.ptr))), di.sectionVirtualOffset(frame_section, base_address).?,
true, true,
entry_header.is_64, entry_header.is_64,
frame_section, frame_section,
@ -1604,7 +1628,7 @@ pub const DwarfInfo = struct {
const cie = di.cie_map.get(cie_offset) orelse return badDwarf(); const cie = di.cie_map.get(cie_offset) orelse return badDwarf();
const fde = try FrameDescriptionEntry.parse( const fde = try FrameDescriptionEntry.parse(
entry_header.entry_bytes, entry_header.entry_bytes,
-@as(i64, @intCast(@intFromPtr(binary_mem.ptr))), di.sectionVirtualOffset(frame_section, base_address).?,
true, true,
cie, cie,
@sizeOf(usize), @sizeOf(usize),
@ -1637,7 +1661,7 @@ pub const DwarfInfo = struct {
var fde: FrameDescriptionEntry = undefined; var fde: FrameDescriptionEntry = undefined;
// In order to support reading .eh_frame from the ELF file (vs using the already-mapped section), // In order to support reading .eh_frame from the ELF file (vs using the already-mapped section),
// scanAllUnwindInfo has already mapped any pc-relative offsets such that they we be relative to zero // scanAllUnwindInfo has already mapped any pc-relative offsets such that they will be relative to zero
// instead of the actual base address of the module. When using .eh_frame_hdr, PC can be used directly // instead of the actual base address of the module. When using .eh_frame_hdr, PC can be used directly
// as pointers will be decoded relative to the already-mapped .eh_frame. // as pointers will be decoded relative to the already-mapped .eh_frame.
var mapped_pc: usize = undefined; var mapped_pc: usize = undefined;
@ -1653,7 +1677,8 @@ pub const DwarfInfo = struct {
&fde, &fde,
); );
} else { } else {
mapped_pc = context.pc - module_base_address; //mapped_pc = context.pc - module_base_address;
mapped_pc = context.pc;
const index = std.sort.binarySearch(FrameDescriptionEntry, mapped_pc, di.fde_list.items, {}, struct { const index = std.sort.binarySearch(FrameDescriptionEntry, mapped_pc, di.fde_list.items, {}, struct {
pub fn compareFn(_: void, pc: usize, mid_item: FrameDescriptionEntry) std.math.Order { pub fn compareFn(_: void, pc: usize, mid_item: FrameDescriptionEntry) std.math.Order {
if (pc < mid_item.pc_begin) return .lt; if (pc < mid_item.pc_begin) return .lt;
@ -1819,12 +1844,9 @@ pub const UnwindContext = struct {
/// Initialize DWARF info. The caller has the responsibility to initialize most /// Initialize DWARF info. The caller has the responsibility to initialize most
/// the DwarfInfo fields before calling. `binary_mem` is the raw bytes of the /// the DwarfInfo fields before calling. `binary_mem` is the raw bytes of the
/// main binary file (not the secondary debug info file). /// main binary file (not the secondary debug info file).
pub fn openDwarfDebugInfo(di: *DwarfInfo, allocator: mem.Allocator, binary_mem: []const u8) !void { pub fn openDwarfDebugInfo(di: *DwarfInfo, allocator: mem.Allocator) !void {
try di.scanAllFunctions(allocator); try di.scanAllFunctions(allocator);
try di.scanAllCompileUnits(allocator); try di.scanAllCompileUnits(allocator);
// Unwind info is not required
di.scanAllUnwindInfo(allocator, binary_mem) catch {};
} }
/// This function is to make it handy to comment out the return and make it /// This function is to make it handy to comment out the return and make it
@ -1898,9 +1920,10 @@ fn readEhPointer(reader: anytype, enc: u8, addr_size_bytes: u8, ctx: EhPointerCo
else => null, else => null,
}; };
const ptr = if (base) |b| switch (value) { const ptr: u64 = if (base) |b| switch (value) {
.signed => |s| @as(u64, @intCast(s + @as(i64, @intCast(b)))), .signed => |s| @intCast(try math.add(i64, s, @as(i64, @intCast(b)))),
.unsigned => |u| u + b, // absptr can actually contain signed values in some cases (aarch64 MachO)
.unsigned => |u| u +% b,
} else switch (value) { } else switch (value) {
.signed => |s| @as(u64, @intCast(s)), .signed => |s| @as(u64, @intCast(s)),
.unsigned => |u| u, .unsigned => |u| u,
@ -2311,15 +2334,14 @@ pub const FrameDescriptionEntry = struct {
instructions: []const u8, instructions: []const u8,
/// This function expects to read the FDE starting at the PC Begin field. /// This function expects to read the FDE starting at the PC Begin field.
/// The returned struct references memory backed by fde_bytes. /// The returned struct references memory backed by `fde_bytes`.
/// ///
/// `pc_rel_offset` specifies an offset to be applied to pc_rel_base values /// `pc_rel_offset` specifies an offset to be applied to pc_rel_base values
/// used when decoding pointers. This should be set to zero if fde_bytes is /// used when decoding pointers. This should be set to zero if fde_bytes is
/// backed by the memory of the .eh_frame section in the running executable. /// backed by the memory of a .eh_frame / .debug_frame section in the running executable.
///
/// Otherwise, it should be the relative offset to translate addresses from /// Otherwise, it should be the relative offset to translate addresses from
/// where the section is currently stored in memory, to where it *would* be /// where the section is currently stored in memory, to where it *would* be
/// stored at runtime: section runtime offset - backing section data base ptr. /// stored at runtime: section base addr - backing data base ptr.
/// ///
/// Similarly, `is_runtime` specifies this function is being called on a runtime /// Similarly, `is_runtime` specifies this function is being called on a runtime
/// section, and so indirect pointers can be followed. /// section, and so indirect pointers can be followed.