/* radare - LGPL - Copyright 2012-2014 - pancake, Fedor Sakharov */ #define D0 if(1) #define D1 if(1) #include #define DWARF_DUMP 0 #if DWARF_DUMP #define DBGFD stdout #else #define DBGFD NULL #endif #include #include #include #define STANDARD_OPERAND_COUNT_DWARF2 9 #define STANDARD_OPERAND_COUNT_DWARF3 12 #define R_BIN_DWARF_INFO 1 #define READ(x,y) *((y*)x); x += sizeof (y) static const char *dwarf_tag_name_encodings[] = { [DW_TAG_array_type] = "DW_TAG_array_type", [DW_TAG_class_type] = "DW_TAG_class_type", [DW_TAG_entry_point] = "DW_TAG_entry_point", [DW_TAG_enumeration_type] = "DW_TAG_enumeration_type", [DW_TAG_formal_parameter] = "DW_TAG_formal_parameter", [DW_TAG_imported_declaration] = "DW_TAG_imported_declaration", [DW_TAG_label] = "DW_TAG_label", [DW_TAG_lexical_block] = "DW_TAG_lexical_block", [DW_TAG_member] = "DW_TAG_member", [DW_TAG_pointer_type] = "DW_TAG_pointer_type", [DW_TAG_reference_type] = "DW_TAG_reference_type", [DW_TAG_compile_unit] = "DW_TAG_compile_unit", [DW_TAG_string_type] = "DW_TAG_string_type", [DW_TAG_structure_type] = "DW_TAG_structure_type", [DW_TAG_subroutine_type] = "DW_TAG_subroutine_type", [DW_TAG_typedef] = "DW_TAG_typedef", [DW_TAG_union_type] = "DW_TAG_union_type", [DW_TAG_unspecified_parameters] = "DW_TAG_unspecified_parameters", [DW_TAG_variant] = "DW_TAG_variant", [DW_TAG_common_block] = "DW_TAG_common_block", [DW_TAG_common_inclusion] = "DW_TAG_common_inclusion", [DW_TAG_inheritance] = "DW_TAG_inheritance", [DW_TAG_inlined_subroutine] = "DW_TAG_inlined_subroutine", [DW_TAG_module] = "DW_TAG_module", [DW_TAG_ptr_to_member_type] = "DW_TAG_ptr_to_member_type", [DW_TAG_set_type] = "DW_TAG_set_type", [DW_TAG_subrange_type] = "DW_TAG_subrange_type", [DW_TAG_with_stmt] = "DW_TAG_with_stmt", [DW_TAG_access_declaration] = "DW_TAG_access_declaration", [DW_TAG_base_type] = "DW_TAG_base_type", [DW_TAG_catch_block] = "DW_TAG_catch_block", [DW_TAG_const_type] = "DW_TAG_const_type", [DW_TAG_constant] = "DW_TAG_constant", [DW_TAG_enumerator] = "DW_TAG_enumerator", [DW_TAG_file_type] = "DW_TAG_file_type", [DW_TAG_friend] = "DW_TAG_friend", [DW_TAG_namelist] = "DW_TAG_namelist", [DW_TAG_namelist_item] = "DW_TAG_namelist_item", [DW_TAG_packed_type] = "DW_TAG_packed_type", [DW_TAG_subprogram] = "DW_TAG_subprogram", [DW_TAG_template_type_param] = "DW_TAG_template_type_param", [DW_TAG_template_value_param] = "DW_TAG_template_value_param", [DW_TAG_thrown_type] = "DW_TAG_thrown_type", [DW_TAG_try_block] = "DW_TAG_try_block", [DW_TAG_variant_part] = "DW_TAG_variant_part", [DW_TAG_variable] = "DW_TAG_variable", [DW_TAG_volatile_type] = "DW_TAG_volatile_type" }; static const char *dwarf_attr_encodings[] = { [DW_AT_sibling] = "DW_AT_siblings", [DW_AT_location] = "DW_AT_location", [DW_AT_name] = "DW_AT_name", [DW_AT_ordering] = "DW_AT_ordering", [DW_AT_byte_size] = "DW_AT_byte_size", [DW_AT_bit_size] = "DW_AT_bit_size", [DW_AT_stmt_list] = "DW_AT_stmt_list", [DW_AT_low_pc] = "DW_AT_low_pc", [DW_AT_high_pc] = "DW_AT_high_pc", [DW_AT_language] = "DW_AT_language", [DW_AT_discr] = "DW_AT_discr", [DW_AT_discr_value] = "DW_AT_discr_value", [DW_AT_visibility] = "DW_AT_visibility", [DW_AT_import] = "DW_AT_import", [DW_AT_string_length] = "DW_AT_string_length", [DW_AT_common_reference] = "DW_AT_common_reference", [DW_AT_comp_dir] = "DW_AT_comp_dir", [DW_AT_const_value] = "DW_AT_const_value", [DW_AT_containing_type] = "DW_AT_containig_type", [DW_AT_default_value] = "DW_AT_default_value", [DW_AT_inline] = "DW_AT_inline", [DW_AT_is_optional] = "DW_AT_is_optional", [DW_AT_lower_bound] = "DW_AT_lower_bound", [DW_AT_producer] = "DW_AT_producer", [DW_AT_prototyped] = "DW_AT_prototyped", [DW_AT_return_addr] = "DW_AT_return_addr", [DW_AT_start_scope] = "DW_AT_start_scope", [DW_AT_stride_size] = "DW_AT_stride_size", [DW_AT_upper_bound] = "DW_AT_upper_bound", [DW_AT_abstract_origin] = "DW_AT_abstract_origin", [DW_AT_accessibility] = "DW_AT_accessibility", [DW_AT_address_class] = "DW_AT_address_class", [DW_AT_artificial] = "DW_AT_artificial", [DW_AT_base_types] = "DW_AT_base_types", [DW_AT_calling_convention] = "DW_AT_calling_convention", [DW_AT_count] = "DW_AT_count", [DW_AT_data_member_location] = "DW_AT_data_member_location", [DW_AT_decl_column] = "DW_AT_decl_column", [DW_AT_decl_file] = "DW_AT_decl_file", [DW_AT_decl_line] = "DW_AT_decl_line", [DW_AT_declaration] = "DW_AT_declaration", [DW_AT_discr_list] = "DW_AT_discr_list", [DW_AT_encoding] = "DW_AT_encoding", [DW_AT_external] = "DW_AT_external", [DW_AT_frame_base] = "DW_AT_frame_base", [DW_AT_friend] = "DW_AT_friend", [DW_AT_identifier_case] = "DW_AT_identifier_case", [DW_AT_macro_info] = "DW_AT_macro_info", [DW_AT_namelist_item] = "DW_AT_namelist_item", [DW_AT_priority] = "DW_AT_priority", [DW_AT_segment] = "DW_AT_segment", [DW_AT_specification] = "DW_AT_specification", [DW_AT_static_link] = "DW_AT_static_link", [DW_AT_type] = "DW_AT_type", [DW_AT_use_location] = "DW_AT_use_location", [DW_AT_variable_parameter] = "DW_AT_variable_parameter", [DW_AT_virtuality] = "DW_AT_virtuality", [DW_AT_vtable_elem_location] = "DW_AT_vtable_elem_location" }; static const char *dwarf_attr_form_encodings[] = { [DW_FORM_addr] = "DW_FORM_addr", [DW_FORM_block2] = "DW_FORM_block2", [DW_FORM_block4] = "DW_FORM_block4", [DW_FORM_data2] = "DW_FORM_data2", [DW_FORM_data4] = "DW_FORM_data4", [DW_FORM_data8] = "DW_FORM_data8", [DW_FORM_string] = "DW_FORM_string", [DW_FORM_block] = "DW_FORM_block", [DW_FORM_block1] = "DW_FORM_block1", [DW_FORM_data1] = "DW_FORM_data1", [DW_FORM_flag] = "DW_FORM_flag", [DW_FORM_sdata] = "DW_FORM_sdata", [DW_FORM_strp] = "DW_FORM_strp", [DW_FORM_udata] = "DW_FORM_udata", [DW_FORM_ref_addr] = "DW_FORM_ref_addr", [DW_FORM_ref1] = "DW_FORM_ref1", [DW_FORM_ref2] = "DW_FORM_ref2", [DW_FORM_ref4] = "DW_FORM_ref4", [DW_FORM_ref8] = "DW_FORM_ref8", [DW_FORM_ref_udata] = "DW_FORM_ref_udata", [DW_FORM_indirect] = "DW_FORM_indirect" }; static const char *dwarf_langs[] = { [DW_LANG_C89] = "C89", [DW_LANG_C] = "C", [DW_LANG_Ada83] = "Ada83", [DW_LANG_C_plus_plus] = "C++", [DW_LANG_Cobol74] = "Cobol74", [DW_LANG_Cobol85] = "Cobol85", [DW_LANG_Fortran77] = "Fortran77", [DW_LANG_Fortran90] = "Fortran90", [DW_LANG_Pascal83] = "Pascal83", [DW_LANG_Modula2] = "Modula2", [DW_LANG_Java] = "Java", [DW_LANG_C99] = "C99", [DW_LANG_Ada95] = "Ada95", [DW_LANG_Fortran95] = "Fortran95", [DW_LANG_PLI] = "PLI", [DW_LANG_ObjC] = "ObjC", [DW_LANG_ObjC_plus_plus] = "ObjC_plus_plus", [DW_LANG_UPC] = "UPC", [DW_LANG_D] = "D", [DW_LANG_Python] = "Python", }; static int add_sdb_include_dir(Sdb *s, const char *incl, int idx) { if (!s || !incl) return R_FALSE; return sdb_array_set (s, "includedirs", idx, incl, 0); } static const ut8 *r_bin_dwarf_parse_lnp_header( RBinFile *bf, const ut8 *buf, RBinDwarfLNPHeader *hdr, FILE *f) { int i; size_t count; const ut8 *tmp_buf = NULL; if (!hdr || !bf || !buf) return NULL; hdr->unit_length.part1 = READ (buf, ut32); if (hdr->unit_length.part1 == DWARF_INIT_LEN_64) { hdr->unit_length.part2 = READ (buf, ut32); } Sdb *s = sdb_new (NULL, NULL, 0); hdr->version = READ (buf, ut16); if (hdr->unit_length.part1 == DWARF_INIT_LEN_64) { hdr->header_length = READ (buf, ut64); } else { hdr->header_length = READ (buf, ut32); } hdr->min_inst_len = READ (buf, ut8); //hdr->max_ops_per_inst = READ (buf, ut8); hdr->default_is_stmt = READ (buf, ut8); hdr->line_base = READ (buf, char); hdr->line_range = READ (buf, ut8); hdr->opcode_base = READ (buf, ut8); if (f) { fprintf(f, "DWARF LINE HEADER\n"); fprintf(f, " total_length: %d\n", hdr->unit_length.part1); fprintf(f, " version: %d\n", hdr->version); fprintf(f, " header_length: : %lld\n", hdr->header_length); fprintf(f, " mininstlen: %d\n", hdr->min_inst_len); fprintf(f, " is_stmt: %d\n", hdr->default_is_stmt); fprintf(f, " line_base: %d\n", hdr->line_base); fprintf(f, " line_range: %d\n", hdr->line_range); fprintf(f, " opcode_base: %d\n", hdr->opcode_base); } hdr->std_opcode_lengths = calloc(sizeof(ut8), hdr->opcode_base); for (i = 1; i <= hdr->opcode_base - 1; i++) { hdr->std_opcode_lengths[i] = READ (buf, ut8); if (f) { fprintf(f, " op %d %d\n", i, hdr->std_opcode_lengths[i]); } } i = 0; while (1) { size_t len = strlen((const char*)buf); if (!len) { buf += 1; break; } if (f) { fprintf(f, "INCLUDEDIR (%s)\n", buf); } add_sdb_include_dir (s, (const char *)buf, i); i++; buf += len + 1; } tmp_buf = buf; count = 0; for (i = 0; i < 2; i++) { while (1) { const char *filename = (const char *)buf; ut64 id_idx, mod_time, file_len; size_t len = strlen(filename); if (!len) { buf++; break; } buf += len + 1; buf = r_uleb128 (buf, &id_idx); buf = r_uleb128 (buf, &mod_time); buf = r_uleb128 (buf, &file_len); if (i) { char *include_dir = NULL, *comp_dir = NULL; char *allocated_id = NULL; if (id_idx > 0) { include_dir = sdb_array_get (s, "includedirs", id_idx - 1, 0); if (include_dir && include_dir[0] != '/') { comp_dir = sdb_get (bf->sdb_addrinfo, "DW_AT_comp_dir", 0); if (comp_dir) { allocated_id = malloc(strlen(comp_dir) + strlen(include_dir) + 8); snprintf(allocated_id, strlen(comp_dir) + strlen(include_dir) + 8, "%s/%s/", comp_dir, include_dir); include_dir = allocated_id; } } } else { include_dir = sdb_get (bf->sdb_addrinfo, "DW_AT_comp_dir", 0); if (!include_dir) include_dir = "./"; } size_t namelen = len + (include_dir?strlen (include_dir):0) + 8; hdr->file_names[count].name = malloc (sizeof(char) * namelen); snprintf (hdr->file_names[count].name, namelen - 1, "%s/%s", include_dir, filename); hdr->file_names[count].name[namelen - 1] = '\0'; if (allocated_id) free (allocated_id); hdr->file_names[count].id_idx = id_idx; hdr->file_names[count].mod_time = mod_time; hdr->file_names[count].file_len = file_len; } count++; if (f && i) { fprintf(f, "FILE (%s)\n", filename); fprintf(f, "| dir idx %lld\n", id_idx); fprintf(f, "| lastmod %lld\n", mod_time); fprintf(f, "| filelen %lld\n", file_len); } } if (i == 0) { hdr->file_names = calloc(sizeof(file_entry), count); hdr->file_names_count = count; buf = tmp_buf; count = 0; } } sdb_free (s); return buf; } static inline void add_sdb_addrline(Sdb *s, ut64 addr, const char *file, ut64 line) { char fileline[128]; char offset[64]; char *offset_ptr; if (!s || !file) return; snprintf (fileline, sizeof(fileline) - 1, "%s|%lld", file, line); offset_ptr = sdb_itoa (addr, offset, 16); if (!sdb_add (s, offset_ptr, fileline, 0)) { sdb_set (s, offset_ptr, fileline, 0); } if (!sdb_add (s, fileline, offset_ptr, 0)) { sdb_set (s, fileline, offset_ptr, 0); } } static const ut8* r_bin_dwarf_parse_ext_opcode(const RBin *a, const ut8 *obuf, size_t len, const RBinDwarfLNPHeader *hdr, RBinDwarfSMRegisters *regs, FILE *f) { // XXX - list is an unused parameter. const ut8 *buf; ut8 opcode; ut64 addr; buf = obuf; st64 op_len; RBinFile *binfile = a ? a->cur : NULL; RBinObject *o = binfile ? binfile->o : NULL; ut32 addr_size = o && o->info && o->info->bits ? o->info->bits / 8 : 4; const char *filename; if (!binfile || !obuf || !hdr || !regs) return NULL; buf = r_leb128(buf, &op_len); opcode = *buf++; if (f) { fprintf(f, "Extended opcode %d: ", opcode); } switch (opcode) { case DW_LNE_end_sequence: regs->end_sequence = DWARF_TRUE; if (binfile && binfile->sdb_addrinfo) { add_sdb_addrline(binfile->sdb_addrinfo, regs->address, hdr->file_names[regs->file - 1].name, regs->line); } if (f) { fprintf(f, "End of Sequence\n"); } break; case DW_LNE_set_address: if (addr_size == 8) { addr = READ (buf, ut64); } else { addr = READ (buf, ut32); } regs->address = addr; if (f) { fprintf(f, "set Address to 0x%llx\n", addr); } break; case DW_LNE_define_file: filename = (const char*)buf; if (f) { fprintf(f, "define_file\n"); fprintf(f, "filename %s\n", filename); } buf += (strlen (filename) + 1); ut64 dir_idx; buf = r_uleb128 (buf, &dir_idx); break; case DW_LNE_set_discriminator: buf = r_uleb128(buf, &addr); if (f) { fprintf(f, "set Discriminator to %lld\n", addr); } regs->discriminator = addr; break; default: if (f) { fprintf(f, "Unexpeced opcode %d\n", opcode); } break; } return buf; } static const ut8* r_bin_dwarf_parse_spec_opcode( const RBin *a, const ut8 *obuf, size_t len, const RBinDwarfLNPHeader *hdr, RBinDwarfSMRegisters *regs, ut8 opcode, FILE *f) { // XXX - list is not used const ut8 *buf = obuf; ut8 adj_opcode = 0; ut64 advance_adr; RBinFile *binfile = a ? a->cur : NULL; if (!obuf || !hdr || !regs) return NULL; adj_opcode = opcode - hdr->opcode_base; if (!hdr->line_range) { eprintf ("Error r_bin_dwarf_parse_spec_opcode: hdr->line_range is 0\n"); return NULL; } advance_adr = adj_opcode / hdr->line_range; regs->address += advance_adr; regs->line += hdr->line_base + (adj_opcode % hdr->line_range); if (f) { fprintf(f, "Special opcode %d: ", adj_opcode); fprintf(f, "advance Address by %lld to %llx and Line by %d to %lld\n", advance_adr, regs->address, hdr->line_base + (adj_opcode % hdr->line_range), regs->line); } if (binfile && binfile->sdb_addrinfo) { add_sdb_addrline (binfile->sdb_addrinfo, regs->address, hdr->file_names[regs->file - 1].name, regs->line); } regs->basic_block = DWARF_FALSE; regs->prologue_end = DWARF_FALSE; regs->epilogue_begin = DWARF_FALSE; regs->discriminator = 0; return buf; } static const ut8* r_bin_dwarf_parse_std_opcode( const RBin *a, const ut8 *obuf, size_t len, const RBinDwarfLNPHeader *hdr, RBinDwarfSMRegisters *regs, ut8 opcode, FILE *f) { const ut8* buf = obuf; ut64 addr = 0LL; st64 sbuf; ut8 adj_opcode; ut64 op_advance; ut16 operand; RBinFile *binfile = a ? a->cur : NULL; if (!binfile || !hdr || !regs || !obuf) return NULL; switch (opcode) { case DW_LNS_copy: if (f) { fprintf(f, "Copy\n"); } if (binfile && binfile->sdb_addrinfo) { add_sdb_addrline(binfile->sdb_addrinfo, regs->address, hdr->file_names[regs->file - 1].name, regs->line); } regs->basic_block = DWARF_FALSE; break; case DW_LNS_advance_pc: buf = r_uleb128 (buf, &addr); regs->address += addr * hdr->min_inst_len; if (f) { fprintf(f, "Advance PC by %lld to 0x%llx\n", addr * hdr->min_inst_len, regs->address); } break; case DW_LNS_advance_line: buf = r_leb128(buf, &sbuf); regs->line += sbuf; if (f) { fprintf(f, "Advance line by %lld, to %lld\n", sbuf, regs->line); } break; case DW_LNS_set_file: buf = r_uleb128 (buf, &addr); if (f) { fprintf(f, "Set file to %lld\n", addr); } regs->file = addr; break; case DW_LNS_set_column: buf = r_uleb128(buf, &addr); if (f) { fprintf(f, "Set column to %lld\n", addr); } regs->column = addr; break; case DW_LNS_negate_stmt: regs->is_stmt = regs->is_stmt ? DWARF_FALSE : DWARF_TRUE; if (f) { fprintf(f, "Set is_stmt to %d\n", regs->is_stmt); } break; case DW_LNS_set_basic_block: if (f) { fprintf(f, "set_basic_block\n"); } regs->basic_block = DWARF_TRUE; break; case DW_LNS_const_add_pc: adj_opcode = 255 - hdr->opcode_base; op_advance = adj_opcode / hdr->line_range; regs->address += op_advance; if (f) { fprintf(f, "Advance PC by constant %lld to 0x%llx\n", op_advance, regs->address); } break; case DW_LNS_fixed_advance_pc: operand = READ (buf, ut16); regs->address += operand; if (f) { fprintf(f,"Fixed advance pc to %lld\n", regs->address); } break; case DW_LNS_set_prologue_end: regs->prologue_end = ~0; if (f) { fprintf(f, "set_prologue_end\n"); } break; case DW_LNS_set_epilogue_begin: regs->epilogue_begin = ~0; if (f) { fprintf(f, "set_epilogue_begin\n"); } break; case DW_LNS_set_isa: buf = r_uleb128(buf, &addr); regs->isa = addr; if (f) { fprintf(f, "set_isa\n"); } break; default: if (f) { fprintf(f, "Unexpected opcode\n"); } break; } return buf; } static const ut8* r_bin_dwarf_parse_opcodes (const RBin *a, const ut8 *obuf, size_t len, const RBinDwarfLNPHeader *hdr, RBinDwarfSMRegisters *regs, FILE *f) { const ut8 *buf, *buf_end; ut8 opcode, ext_opcode; if (!a || !obuf) return NULL; buf = obuf; buf_end = obuf + len; while (buf && buf < buf_end) { opcode = *buf++; len--; if (opcode == 0) { ext_opcode = *buf; buf = r_bin_dwarf_parse_ext_opcode (a, buf, len, hdr, regs, f ); if (ext_opcode == DW_LNE_end_sequence) break; } else if (opcode >= hdr->opcode_base) { buf = r_bin_dwarf_parse_spec_opcode (a, buf, len, hdr, regs, opcode, f); } else { buf = r_bin_dwarf_parse_std_opcode (a, buf, len, hdr, regs, opcode, f); } len = (int)(buf_end - buf); } return buf; } static void r_bin_dwarf_set_regs_default (const RBinDwarfLNPHeader *hdr, RBinDwarfSMRegisters *regs) { regs->address = 0; regs->file = 1; regs->line = 1; regs->column = 0; regs->is_stmt = hdr->default_is_stmt; regs->basic_block = DWARF_FALSE; regs->end_sequence = DWARF_FALSE; } R_API int r_bin_dwarf_parse_line_raw2(const RBin *a, const ut8 *obuf, size_t len, int mode) { RBinDwarfLNPHeader hdr; const ut8 *buf = NULL, *buf_tmp = NULL, *buf_end = NULL; RBinDwarfSMRegisters regs; int tmplen; FILE *f = NULL; RBinFile *binfile = a ? a->cur : NULL; if (!binfile || !obuf) return R_FALSE; if (mode == R_CORE_BIN_PRINT) { f = stdout; } buf = obuf; buf_end = obuf + len; while (buf < buf_end) { buf_tmp = buf; buf = r_bin_dwarf_parse_lnp_header (a->cur, buf, &hdr, f); if (!buf) return R_FALSE; r_bin_dwarf_set_regs_default (&hdr, ®s); tmplen = R_MIN (len, 4+hdr.unit_length.part1); r_bin_dwarf_parse_opcodes (a, buf, tmplen, &hdr, ®s, f); buf = buf_tmp + tmplen; len = (int)(buf_end - buf); } return R_TRUE; } R_API int r_bin_dwarf_parse_aranges_raw(const ut8 *obuf, int len, FILE *f) { ut32 length; ut16 version; ut32 debug_info_offset; ut8 address_size, segment_size; const ut8 *buf = obuf; int idx = 0; if (!obuf) return R_FALSE; length = *(ut32*)obuf; if (f) { printf("parse_aranges\n"); printf("length 0x%x\n", length); } if (length >= 0xfffffff0) { if (idx+12>=len) return R_FALSE; idx += 12; buf += 4; buf += 8; } else { if (idx+4>=len) return R_FALSE; idx+=4; buf += 4; } if (idx+2>=len) return R_FALSE; version = *(ut16*)buf; buf += 2; idx += 2; if (f) printf("Version %d\n", version); if (idx+4>=len) return R_FALSE; debug_info_offset = *(ut32*)buf; if (f) fprintf(f, "Debug info offset %d\n", debug_info_offset); buf += 4; idx += 4; // ??? address_size = *(ut8*)buf; if (f) fprintf(f, "address size %d\n", (int)address_size); buf += 1; segment_size = *(ut8*)buf; if (f) fprintf(f, "segment size %d\n", (int)segment_size); buf += 1; size_t offset = segment_size + address_size * 2; if (offset) { ut64 n = (((ut64) (size_t)buf / offset) + 1) * offset - ((ut64)(size_t)buf); if (idx+n>=len) return R_FALSE; buf += n; idx += n; } else { // buf += 1; } while ((buf - obuf) < len) { ut64 adr, length; if ((idx+8)>=len) break; adr = *(ut64*)buf; buf += 8; idx += 8; length = *(ut64*)buf; buf += 8; idx += 8; if (f) printf("length 0x%llx address 0x%llx\n", length, adr); } return 0; } static int r_bin_dwarf_init_debug_info(RBinDwarfDebugInfo *inf) { if (!inf) return -1; inf->comp_units = calloc (sizeof(RBinDwarfCompUnit), DEBUG_INFO_CAPACITY); // XXX - should we be using error codes? if (!inf->comp_units) return -ENOMEM; inf->capacity = DEBUG_INFO_CAPACITY; inf->length = 0; return R_TRUE; } static int r_bin_dwarf_init_die(RBinDwarfDIE *die) { if (!die) return -EINVAL; die->attr_values = calloc(sizeof(RBinDwarfAttrValue), 8); if (!die->attr_values) return -ENOMEM; die->capacity = 8; die->length = 0; return 0; } static int r_bin_dwarf_expand_die(RBinDwarfDIE* die) { RBinDwarfAttrValue *tmp = NULL; if (!die || die->capacity == 0) return -EINVAL; if (die->capacity != die->length) return -EINVAL; tmp = (RBinDwarfAttrValue*)realloc(die->attr_values, die->capacity * 2 * sizeof(RBinDwarfAttrValue)); if (!tmp) return -ENOMEM; die->attr_values = tmp; die->capacity *= 2; return 0; } static int r_bin_dwarf_init_comp_unit(RBinDwarfCompUnit *cu) { if (!cu) return -EINVAL; cu->dies = calloc(sizeof(RBinDwarfDIE), COMP_UNIT_CAPACITY); if (!cu->dies) return -ENOMEM; cu->capacity = COMP_UNIT_CAPACITY; cu->length = 0; return 0; } static int r_bin_dwarf_expand_cu(RBinDwarfCompUnit *cu) { RBinDwarfDIE *tmp; if (!cu || cu->capacity == 0 || cu->capacity != cu->length) return -EINVAL; tmp = (RBinDwarfDIE*)realloc(cu->dies, cu->capacity * 2 * sizeof(RBinDwarfDIE)); if (!tmp) return -ENOMEM; cu->dies = tmp; cu->capacity *= 2; return 0; } static int r_bin_dwarf_init_abbrev_decl(RBinDwarfAbbrevDecl *ad) { if (!ad) return -EINVAL; ad->specs = calloc(sizeof(RBinDwarfAttrSpec), ABBREV_DECL_CAP); if (!ad->specs) return -ENOMEM; ad->capacity = ABBREV_DECL_CAP; ad->length = 0; return 0; } static int r_bin_dwarf_expand_abbrev_decl(RBinDwarfAbbrevDecl *ad) { RBinDwarfAttrSpec *tmp; if (!ad || ad->capacity==0 || ad->capacity != ad->length) return -EINVAL; tmp = (RBinDwarfAttrSpec*)realloc(ad->specs, ad->capacity * 2 * sizeof(RBinDwarfAttrSpec)); if (!tmp) return -ENOMEM; ad->specs = tmp; ad->capacity *= 2; return 0; } static int r_bin_dwarf_init_debug_abbrev(RBinDwarfDebugAbbrev *da) { if (!da) return -EINVAL; da->decls = calloc(sizeof(RBinDwarfAbbrevDecl), DEBUG_ABBREV_CAP); if (!da->decls) return -ENOMEM; da->capacity = DEBUG_ABBREV_CAP; da->length = 0; return 0; } static int r_bin_dwarf_expand_debug_abbrev(RBinDwarfDebugAbbrev *da) { RBinDwarfAbbrevDecl *tmp; if (!da || da->capacity == 0 || da->capacity != da->length) return -EINVAL; tmp = (RBinDwarfAbbrevDecl*)realloc(da->decls, da->capacity * 2 * sizeof(RBinDwarfAbbrevDecl)); if (!tmp) return -ENOMEM; da->decls = tmp; da->capacity *= 2; return 0; } static void dump_r_bin_dwarf_debug_abbrev(FILE *f, RBinDwarfDebugAbbrev *da) { size_t i, j; ut64 attr_name, attr_form; if (!f || !da) return; for (i = 0; i < da->length; i++) { fprintf(f, "Abbreviation Code %lld ", da->decls[i].code); fprintf(f, "Tag %s ", dwarf_tag_name_encodings[da->decls[i].tag]); fprintf(f, "[%s]\n", da->decls[i].has_children ? "has children" : "no children"); fprintf(f, "Offset 0x%llx\n", da->decls[i].offset); for (j = 0; j < da->decls[i].length; j++) { attr_name = da->decls[i].specs[j].attr_name; attr_form = da->decls[i].specs[j].attr_form; if (attr_name && attr_form && attr_name <= DW_AT_vtable_elem_location && attr_form <= DW_FORM_indirect) { fprintf(f, " %s %s\n", dwarf_attr_encodings[attr_name], dwarf_attr_form_encodings[attr_form]); } } } } R_API void r_bin_dwarf_free_debug_abbrev(RBinDwarfDebugAbbrev *da) { size_t i; if (!da) return; for (i = 0; i < da->length; i++) free(da->decls[i].specs); free (da->decls); } static void r_bin_dwarf_free_attr_value (RBinDwarfAttrValue *val) { if (!val) return; switch (val->form) { case DW_FORM_strp: case DW_FORM_string: if (val->encoding.str_struct.string) { free (val->encoding.str_struct.string); } break; case DW_FORM_block: case DW_FORM_block1: case DW_FORM_block2: case DW_FORM_block4: if (val->encoding.block.data) { free (val->encoding.block.data); } break; default: break; }; } static void r_bin_dwarf_free_die (RBinDwarfDIE *die) { size_t i; if (!die) return; for (i = 0; i < die->length; i++) { r_bin_dwarf_free_attr_value (&die->attr_values[i]); } free (die->attr_values); } static void r_bin_dwarf_free_comp_unit (RBinDwarfCompUnit *cu) { size_t i; if (!cu) return; for (i = 0; i < cu->length; i++) { r_bin_dwarf_free_die (&cu->dies[i]); } free (cu->dies); } static void r_bin_dwarf_free_debug_info (RBinDwarfDebugInfo *inf) { size_t i; if (!inf) return; for (i = 0; i < inf->length; i++) { r_bin_dwarf_free_comp_unit (&inf->comp_units[i]); } free (inf->comp_units); } static void r_bin_dwarf_dump_attr_value(const RBinDwarfAttrValue *val, FILE *f) { size_t i; if (!val || !f) return; switch (val->form) { case DW_FORM_addr: fprintf(f, "0x%llx", val->encoding.address); break; case DW_FORM_block: case DW_FORM_block1: case DW_FORM_block2: case DW_FORM_block4: fprintf (f, "%llu byte block:", val->encoding.block.length); for (i = 0; i < val->encoding.block.length; i++) { fprintf (f, "%02x", val->encoding.block.data[i]); } break; case DW_FORM_data1: case DW_FORM_data2: case DW_FORM_data4: case DW_FORM_data8: fprintf (f, "%llu", val->encoding.data); if (val->name == DW_AT_language) { fprintf (f, " (%s)", dwarf_langs[val->encoding.data]); } break; case DW_FORM_strp: fprintf (f, "(indirect string, offset: 0x%llx): ", val->encoding.str_struct.offset); case DW_FORM_string: if (val->encoding.str_struct.string) { fprintf (f, "%s", val->encoding.str_struct.string); } else { fprintf (f, "No string found"); } break; case DW_FORM_flag: fprintf (f, "%u", val->encoding.flag); break; case DW_FORM_sdata: fprintf (f, "%lld", val->encoding.sdata); break; case DW_FORM_udata: fprintf (f, "%llu", val->encoding.data); break; case DW_FORM_ref_addr: fprintf (f, "<0x%llx>", val->encoding.reference); break; case DW_FORM_ref1: case DW_FORM_ref2: case DW_FORM_ref4: case DW_FORM_ref8: fprintf (f, "<0x%llx>", val->encoding.reference); break; default: fprintf (f, "Unknown attr value form %lld\n", val->form); }; } static void r_bin_dwarf_dump_debug_info (FILE *f, const RBinDwarfDebugInfo *inf) { size_t i, j, k; RBinDwarfDIE *dies; RBinDwarfAttrValue *values; if (!inf || !f) return; for (i = 0; i < inf->length; i++) { fprintf(f, " Compilation Unit @ offset 0x%llx:\n", inf->comp_units [i].offset); fprintf(f, " Length: 0x%x\n", inf->comp_units [i].hdr.length); fprintf(f, " Version: %d\n", inf->comp_units [i].hdr.version); fprintf(f, " Abbrev Offset: 0x%x\n", inf->comp_units [i].hdr.abbrev_offset); fprintf(f, " Pointer Size: %d\n", inf->comp_units [i].hdr.pointer_size); dies = inf->comp_units[i].dies; for (j = 0; j < inf->comp_units[i].length; j++) { fprintf(f, " Abbrev Number: %llu ", dies[j].abbrev_code); if (dies[j].tag && dies[j].tag <= DW_TAG_volatile_type && dwarf_tag_name_encodings[dies[j].tag]) { fprintf(f, "(%s)\n", dwarf_tag_name_encodings[dies[j].tag]); } else { fprintf(f, "(Unknown abbrev tag)\n"); } if (!dies[j].abbrev_code) continue; values = dies[j].attr_values; for (k = 0; k < dies[j].length; k++) { if (!values[k].name) continue; if (values[k].name < DW_AT_vtable_elem_location && dwarf_attr_encodings[values[k].name]) { fprintf(f, " %-18s : ", dwarf_attr_encodings[values[k].name]); } else { fprintf(f, " TODO\t"); } r_bin_dwarf_dump_attr_value (&values[k], f); fprintf(f, "\n"); } } } } static const ut8 *r_bin_dwarf_parse_attr_value (const ut8 *obuf, RBinDwarfAttrSpec *spec, RBinDwarfAttrValue *value, const RBinDwarfCompUnitHdr *hdr, const ut8 *debug_str, size_t debug_str_len) { const ut8 *buf = obuf; size_t j; if (!spec || !value || !hdr || !obuf) return NULL; value->form = spec->attr_form; value->name = spec->attr_name; switch (spec->attr_form) { case DW_FORM_addr: switch (hdr->pointer_size) { case 1: value->encoding.address = READ (buf, ut8); break; case 2: value->encoding.address = READ (buf, ut16); break; case 4: value->encoding.address = READ (buf, ut32); break; case 8: value->encoding.address = READ (buf, ut64); break; default: eprintf("DWARF: Unexpected pointer size: %u\n", (unsigned)hdr->pointer_size); return NULL; } break; case DW_FORM_block2: value->encoding.block.length = READ (buf, ut16); value->encoding.block.data = calloc(sizeof(ut8), value->encoding.block.length); for (j = 0; j < value->encoding.block.length; j++) { value->encoding.block.data[j] = READ (buf, ut8); } break; case DW_FORM_block4: value->encoding.block.length = READ (buf, ut32); value->encoding.block.data = calloc(sizeof(ut8), value->encoding.block.length); for (j = 0; j < value->encoding.block.length; j++) { value->encoding.block.data[j] = READ (buf, ut8); } break; case DW_FORM_data2: value->encoding.data = READ (buf, ut16); break; case DW_FORM_data4: value->encoding.data = READ (buf, ut32); break; case DW_FORM_data8: value->encoding.data = READ (buf, ut64); break; case DW_FORM_string: value->encoding.str_struct.string = strdup((const char*)buf); buf += (strlen((const char*)buf) + 1); break; case DW_FORM_block: buf = r_uleb128 (buf, &value->encoding.block.length); value->encoding.block.data = calloc(sizeof(ut8), value->encoding.block.length); for (j = 0; j < value->encoding.block.length; j++) { value->encoding.block.data[j] = READ (buf, ut8); } break; case DW_FORM_block1: value->encoding.block.length = READ (buf, ut8); value->encoding.block.data = calloc(sizeof(ut8), value->encoding.block.length); for (j = 0; j < value->encoding.block.length; j++) { value->encoding.block.data[j] = READ (buf, ut8); } break; case DW_FORM_flag: value->encoding.flag = READ (buf, ut8); break; case DW_FORM_sdata: buf = r_leb128 (buf, &value->encoding.sdata); break; case DW_FORM_strp: value->encoding.str_struct.offset = READ (buf, ut32); if (debug_str && value->encoding.str_struct.offset < debug_str_len) { value->encoding.str_struct.string = strdup ( (const char *)(debug_str + value->encoding.str_struct.offset)); } else { value->encoding.str_struct.string = NULL; } break; case DW_FORM_udata: buf = r_uleb128 (buf, &value->encoding.data); break; case DW_FORM_ref_addr: value->encoding.reference = READ (buf, ut64); // addr size of machine break; case DW_FORM_ref1: value->encoding.reference = READ (buf, ut8); break; case DW_FORM_ref2: value->encoding.reference = READ (buf, ut16); break; case DW_FORM_ref4: value->encoding.reference = READ (buf, ut32); break; case DW_FORM_ref8: value->encoding.reference = READ (buf, ut64); break; case DW_FORM_data1: value->encoding.data = READ (buf, ut8); break; default: return buf; } return buf; } static const ut8 *r_bin_dwarf_parse_comp_unit(Sdb *s, const ut8 *obuf, RBinDwarfCompUnit *cu, const RBinDwarfDebugAbbrev *da, size_t offset, const ut8 *debug_str, size_t debug_str_len) { const ut8 *buf = obuf, *buf_end = obuf + (cu->hdr.length - 7); ut64 abbr_code; size_t i; while (buf < buf_end) { if (cu->length && cu->capacity == cu->length) r_bin_dwarf_expand_cu (cu); buf = r_uleb128 (buf, &abbr_code); if (abbr_code > da->length) { return NULL; } r_bin_dwarf_init_die (&cu->dies[cu->length]); if (!abbr_code) { cu->dies[cu->length].abbrev_code = 0; cu->length++; continue; } cu->dies[cu->length].abbrev_code = abbr_code; cu->dies[cu->length].tag = da->decls[abbr_code - 1].tag; abbr_code += offset; for (i = 0; i < da->decls[abbr_code - 1].length; i++) { if (cu->dies[cu->length].length == cu->dies[cu->length].capacity) r_bin_dwarf_expand_die (&cu->dies[cu->length]); buf = r_bin_dwarf_parse_attr_value (buf, &da->decls[abbr_code - 1].specs[i], &cu->dies[cu->length].attr_values[i], &cu->hdr, debug_str, debug_str_len); if (cu->dies[cu->length].attr_values[i].name == DW_AT_comp_dir) { char *comp_dir = cu->dies[cu->length].attr_values[i].encoding.str_struct.string; if (s) sdb_add (s, "DW_AT_comp_dir", comp_dir, 0); } cu->dies[cu->length].length++; } cu->length++; } return buf; } R_API int r_bin_dwarf_parse_info_raw(Sdb *s, RBinDwarfDebugAbbrev *da, const ut8 *obuf, size_t len, const ut8 *debug_str, size_t debug_str_len, int mode) { const ut8 *buf = obuf, *buf_end = obuf + len; size_t curr_unit = 0, k, offset = 0; RBinDwarfDebugInfo *inf = NULL, di; inf = &di; r_bin_dwarf_init_debug_info (inf); if (!da || !s || !obuf) return R_FALSE; while (buf < buf_end) { if (inf->length >= inf->capacity) break; r_bin_dwarf_init_comp_unit (&inf->comp_units[curr_unit]); inf->comp_units[curr_unit].offset = buf - obuf; inf->comp_units[curr_unit].hdr.length = READ (buf, ut32); inf->comp_units[curr_unit].hdr.version = READ (buf, ut16); if (inf->comp_units[curr_unit].hdr.version != 2) { eprintf("DWARF: version %d is yet not supported\n", inf->comp_units[curr_unit].hdr.version); return -1; } inf->comp_units[curr_unit].hdr.abbrev_offset = READ (buf, ut32); inf->comp_units[curr_unit].hdr.pointer_size = READ (buf, ut8); inf->length++; /* Linear search FIXME */ for (k = 0; k < da->decls->length; k++) { if (da->decls[k].offset == inf->comp_units[curr_unit].hdr.abbrev_offset) { offset = k; break; } } buf = r_bin_dwarf_parse_comp_unit(s, buf, &inf->comp_units[curr_unit], da, offset, debug_str, debug_str_len); if (!buf) { r_bin_dwarf_free_debug_info (inf); return R_FALSE; } curr_unit++; } if (mode == R_CORE_BIN_PRINT) { r_bin_dwarf_dump_debug_info (NULL, inf); } r_bin_dwarf_free_debug_info (inf); return R_TRUE; } static RBinDwarfDebugAbbrev *r_bin_dwarf_parse_abbrev_raw(const ut8 *obuf, size_t len, int mode) { const ut8 *buf = obuf, *buf_end = obuf + len; ut64 tmp, spec1, spec2, offset; ut8 has_children; RBinDwarfAbbrevDecl *tmpdecl; RBinDwarfDebugAbbrev *da = NULL; // XXX - Set a suitable value here. if (!obuf || len < 3) return da; da = R_NEW0(RBinDwarfDebugAbbrev); r_bin_dwarf_init_debug_abbrev (da); while (buf < buf_end) { offset = buf - obuf; buf = r_uleb128(buf, &tmp); if (!tmp) continue; if (da->length == da->capacity) r_bin_dwarf_expand_debug_abbrev(da); tmpdecl = &da->decls[da->length]; r_bin_dwarf_init_abbrev_decl(tmpdecl); tmpdecl->code = tmp; buf = r_uleb128(buf, &tmp); tmpdecl->tag = tmp; tmpdecl->offset = offset; has_children = READ (buf, ut8); tmpdecl->has_children = has_children; do { if (tmpdecl->length == tmpdecl->capacity) r_bin_dwarf_expand_abbrev_decl(tmpdecl); buf = r_uleb128(buf, &spec1); buf = r_uleb128(buf, &spec2); tmpdecl->specs[tmpdecl->length].attr_name = spec1; tmpdecl->specs[tmpdecl->length].attr_form = spec2; tmpdecl->length++; } while (spec1 && spec2); da->length++; } if (mode == R_CORE_BIN_PRINT) dump_r_bin_dwarf_debug_abbrev(stdout, da); return da; } RBinSection *getsection(RBin *a, const char *sn) { RListIter *iter; RBinSection *section = NULL; RBinFile *binfile = a ? a->cur: NULL; RBinObject *o = binfile ? binfile->o : NULL; if ( o && o->sections) { r_list_foreach (o->sections, iter, section) { if (strstr (section->name, sn)) return section; } } return NULL; } R_API int r_bin_dwarf_parse_info(RBinDwarfDebugAbbrev *da, RBin *a, int mode) { ut8 *buf, *debug_str_buf = 0; int len, debug_str_len = 0, ret; RBinSection *debug_str; RBinSection *section = getsection (a, "debug_info"); RBinFile *binfile = a ? a->cur: NULL; if (binfile && section) { debug_str = getsection (a, "debug_str"); if (debug_str) { debug_str_len = debug_str->size; debug_str_buf = malloc (debug_str_len); r_buf_read_at (binfile->buf, debug_str->paddr, debug_str_buf, debug_str_len); } len = section->size; buf = malloc (len); r_buf_read_at (binfile->buf, section->paddr, buf, len); ret = r_bin_dwarf_parse_info_raw (binfile->sdb_addrinfo, da, buf, len, debug_str_buf, debug_str_len, mode); if (debug_str_buf) { free (debug_str_buf); } free (buf); return ret; } return R_FALSE; } R_API RList *r_bin_dwarf_parse_line(RBin *a, int mode) { ut8 *buf; int len; RBinSection *section = getsection (a, "debug_line"); RBinFile *binfile = a ? a->cur: NULL; if (binfile && section) { RList *list = r_list_new (); len = section->size; buf = malloc (len); r_buf_read_at (binfile->buf, section->paddr, buf, len); r_bin_dwarf_parse_line_raw2 (a, buf, len, mode); free (buf); return list; } return NULL; } R_API RList *r_bin_dwarf_parse_aranges(RBin *a, int mode) { ut8 *buf; size_t len; RBinSection *section = getsection (a, "debug_aranges"); RBinFile *binfile = a ? a->cur: NULL; if (binfile && section) { len = section->size; if (len==0) return NULL; buf = malloc (len); r_buf_read_at (binfile->buf, section->paddr, buf, len); if (mode == R_CORE_BIN_PRINT) { r_bin_dwarf_parse_aranges_raw (buf, len, stdout); } else { r_bin_dwarf_parse_aranges_raw (buf, len, DBGFD); } free (buf); } return NULL; } R_API RBinDwarfDebugAbbrev *r_bin_dwarf_parse_abbrev(RBin *a, int mode) { ut8 *buf; size_t len; RBinSection *section = getsection (a, "debug_abbrev"); RBinDwarfDebugAbbrev *da = NULL; RBinFile *binfile = a ? a->cur: NULL; if (binfile && section) { len = section->size; buf = malloc (len); r_buf_read_at (binfile->buf, section->paddr, buf, len); da = r_bin_dwarf_parse_abbrev_raw (buf, len, mode); free (buf); } return da; }