mirror of
https://github.com/varun-r-mallya/sysprof.git
synced 2025-12-31 20:36:25 +00:00
2006-08-20 Soren Sandmann <sandmann@daimi.au.dk> * elfparser.c (elf_parser_get_debug_link): New function * elfparser.c: Delete SymbolTable typedef * binparser.[ch] (bin_parser_get_data): New function (bin_parser_get_length): New function * elfparser.[ch] (elf_parser_get_crc32): New function * TODO: Updates * elfparser.c (elf_parser_lookup_symbol): Offset passed in addresses by the load address. * elfparser.c (elf_parser_get_load_address): New function to compute the load address of the beginning of the file.
564 lines
11 KiB
C
564 lines
11 KiB
C
#include <string.h>
|
|
#include <stdlib.h>
|
|
#include <glib.h>
|
|
#include <stdarg.h>
|
|
#include "binparser.h"
|
|
|
|
typedef struct ParserFrame ParserFrame;
|
|
|
|
struct ParserFrame
|
|
{
|
|
BinFormat * format;
|
|
int index;
|
|
gsize offset;
|
|
|
|
ParserFrame * next;
|
|
};
|
|
|
|
struct BinField
|
|
{
|
|
guint64 offset;
|
|
int width;
|
|
int align;
|
|
char * name;
|
|
};
|
|
|
|
struct BinFormat
|
|
{
|
|
gboolean big_endian;
|
|
|
|
int n_fields;
|
|
BinField * fields;
|
|
};
|
|
|
|
struct BinParser
|
|
{
|
|
ParserFrame * frame;
|
|
const guchar * data;
|
|
gsize length;
|
|
};
|
|
|
|
BinParser *
|
|
bin_parser_new (const guchar *data,
|
|
gsize length)
|
|
{
|
|
BinParser *parser = g_new0 (BinParser, 1);
|
|
|
|
parser->frame = NULL;
|
|
parser->data = data;
|
|
parser->length = length;
|
|
|
|
return parser;
|
|
}
|
|
|
|
static GQueue *
|
|
read_varargs (va_list args,
|
|
const char * name,
|
|
BinField * field)
|
|
{
|
|
GQueue *queue = g_queue_new ();
|
|
gpointer p;
|
|
|
|
if (name)
|
|
{
|
|
g_queue_push_tail (queue, (gpointer)name);
|
|
g_queue_push_tail (queue, field);
|
|
|
|
p = va_arg (args, gpointer);
|
|
while (p)
|
|
{
|
|
g_queue_push_tail (queue, p);
|
|
p = va_arg (args, gpointer);
|
|
}
|
|
}
|
|
|
|
return queue;
|
|
}
|
|
|
|
static guint64
|
|
align (guint64 offset, int alignment)
|
|
{
|
|
/* Note that we can speed this up by assuming alignment'
|
|
* is a power of two, since
|
|
*
|
|
* offset % alignment == offset & (alignemnt - 1)
|
|
*
|
|
*/
|
|
|
|
if (offset % alignment != 0)
|
|
offset += (alignment - (offset % alignment));
|
|
|
|
return offset;
|
|
}
|
|
|
|
gsize
|
|
bin_format_get_size (BinFormat *format)
|
|
{
|
|
BinField *last_field = &(format->fields[format->n_fields - 1]);
|
|
BinField *first_field = &(format->fields[0]);
|
|
|
|
return align (last_field->offset + last_field->width, first_field->width);
|
|
}
|
|
|
|
BinFormat *
|
|
bin_format_new (gboolean big_endian,
|
|
const char *name, BinField *field,
|
|
...)
|
|
{
|
|
GQueue *queue = g_queue_new ();
|
|
BinFormat *format = g_new0 (BinFormat, 1);
|
|
GList *list;
|
|
int i;
|
|
guint64 offset;
|
|
va_list args;
|
|
|
|
format->big_endian = big_endian;
|
|
|
|
/* Build queue of child types */
|
|
va_start (args, field);
|
|
queue = read_varargs (args, name, field);
|
|
va_end (args);
|
|
|
|
g_assert (queue->length % 2 == 0);
|
|
|
|
format->n_fields = queue->length / 2;
|
|
format->fields = g_new (BinField, format->n_fields);
|
|
|
|
i = 0;
|
|
offset = 0;
|
|
for (list = queue->head; list != NULL; list = list->next->next)
|
|
{
|
|
const char *name = list->data;
|
|
BinField *field = list->next->data;
|
|
|
|
offset = align (offset, field->align);
|
|
|
|
format->fields[i].name = g_strdup (name);
|
|
format->fields[i].width = field->width;
|
|
format->fields[i].offset = offset;
|
|
|
|
offset += field->width;
|
|
++i;
|
|
|
|
g_free (field);
|
|
}
|
|
|
|
g_queue_free (queue);
|
|
|
|
return format;
|
|
}
|
|
|
|
static const BinField *
|
|
get_field (BinFormat *format,
|
|
const gchar *name)
|
|
{
|
|
int i;
|
|
|
|
for (i = 0; i < format->n_fields; ++i)
|
|
{
|
|
BinField *field = &(format->fields[i]);
|
|
|
|
if (strcmp (field->name, name) == 0)
|
|
return field;
|
|
}
|
|
|
|
return NULL;
|
|
}
|
|
|
|
guint64
|
|
bin_parser_get_uint (BinParser *parser,
|
|
const gchar *name)
|
|
{
|
|
const BinField *field;
|
|
const guint8 *pos;
|
|
guint8 r8;
|
|
guint16 r16;
|
|
guint32 r32;
|
|
guint64 r64;
|
|
BinFormat *format;
|
|
const guchar *data;
|
|
|
|
g_return_val_if_fail (parser->frame != NULL, 0);
|
|
|
|
format = parser->frame->format;
|
|
data = parser->data + parser->frame->offset;
|
|
|
|
field = get_field (format, name);
|
|
|
|
g_return_val_if_fail (field != NULL, (guint64)-1);
|
|
|
|
pos = data + field->offset;
|
|
|
|
if (field->offset + field->width > parser->length)
|
|
{
|
|
/* FIXME: generate error */
|
|
return 0;
|
|
}
|
|
|
|
#if 0
|
|
g_print ("getting %s from offset: %llu\n", name, field->offset);
|
|
#endif
|
|
|
|
switch (field->width)
|
|
{
|
|
case 1:
|
|
r8 = *(guint8 *)pos;
|
|
return r8;
|
|
|
|
case 2:
|
|
r16 = *(guint16 *)pos;
|
|
|
|
if (format->big_endian)
|
|
r16 = GUINT16_FROM_BE (r16);
|
|
else
|
|
r16 = GUINT16_FROM_LE (r16);
|
|
|
|
return r16;
|
|
|
|
case 4:
|
|
r32 = *(guint32 *)pos;
|
|
|
|
if (format->big_endian)
|
|
r32 = GUINT32_FROM_BE (r32);
|
|
else
|
|
r32 = GUINT32_FROM_LE (r32);
|
|
|
|
return r32;
|
|
|
|
case 8:
|
|
r64 = *(guint64 *)pos;
|
|
|
|
if (format->big_endian)
|
|
r64 = GUINT64_FROM_BE (r64);
|
|
else
|
|
r64 = GUINT64_FROM_LE (r64);
|
|
|
|
return r64;
|
|
}
|
|
|
|
#if 0
|
|
g_print ("width: %d\n", field->width);
|
|
#endif
|
|
|
|
g_assert_not_reached();
|
|
return 0;
|
|
}
|
|
|
|
static BinField *
|
|
new_field_uint (int width)
|
|
{
|
|
BinField *field = g_new0 (BinField, 1);
|
|
|
|
field->width = width;
|
|
field->align = width;
|
|
|
|
return field;
|
|
}
|
|
|
|
BinField *
|
|
bin_field_new_uint8 (void)
|
|
{
|
|
return new_field_uint (1);
|
|
}
|
|
|
|
BinField *
|
|
bin_field_new_uint16 (void)
|
|
{
|
|
return new_field_uint (2);
|
|
}
|
|
|
|
BinField *
|
|
bin_field_new_uint32 (void)
|
|
{
|
|
return new_field_uint (4);
|
|
}
|
|
|
|
BinField *
|
|
bin_field_new_uint64 (void)
|
|
{
|
|
return new_field_uint (8);
|
|
}
|
|
|
|
const gchar *
|
|
bin_parser_get_string (BinParser *parser)
|
|
{
|
|
/* FIXME: check that the string is within the file */
|
|
return (gchar *)parser->data + parser->frame->offset;
|
|
}
|
|
|
|
void
|
|
bin_parser_begin (BinParser *parser,
|
|
BinFormat *format,
|
|
gsize offset)
|
|
{
|
|
ParserFrame *frame = g_new0 (ParserFrame, 1);
|
|
|
|
frame->format = format;
|
|
frame->offset = offset;
|
|
frame->index = 0;
|
|
|
|
frame->next = parser->frame;
|
|
parser->frame = frame;
|
|
}
|
|
|
|
void
|
|
bin_parser_end (BinParser *parser)
|
|
{
|
|
ParserFrame *frame;
|
|
|
|
frame = parser->frame;
|
|
parser->frame = frame->next;
|
|
|
|
g_free (frame);
|
|
}
|
|
|
|
void
|
|
bin_parser_index (BinParser *parser,
|
|
int index)
|
|
{
|
|
gsize format_size = bin_format_get_size (parser->frame->format);
|
|
|
|
parser->frame->offset -= parser->frame->index * format_size;
|
|
parser->frame->offset += index * format_size;
|
|
|
|
parser->frame->index = index;
|
|
}
|
|
|
|
gsize
|
|
bin_parser_get_offset (BinParser *parser)
|
|
{
|
|
g_return_val_if_fail (parser != NULL, 0);
|
|
g_return_val_if_fail (parser->frame != NULL, 0);
|
|
|
|
return parser->frame->offset;
|
|
}
|
|
|
|
const guchar *
|
|
bin_parser_get_data (BinParser *parser)
|
|
{
|
|
return parser->data;
|
|
}
|
|
|
|
gsize
|
|
bin_parser_get_length (BinParser *parser)
|
|
{
|
|
return parser->length;
|
|
}
|
|
|
|
BinField *
|
|
bin_field_new_fixed_array (int n_elements,
|
|
int element_size)
|
|
{
|
|
BinField *field = g_new0 (BinField, 1);
|
|
field->width = n_elements * element_size;
|
|
field->align = element_size;
|
|
return field;
|
|
}
|
|
|
|
#if 0
|
|
#include <elf.h>
|
|
|
|
static gboolean
|
|
find_elf_type (const guchar *data, gsize length,
|
|
gboolean *is_64, gboolean *is_be)
|
|
{
|
|
/* FIXME: this function should be able to return an error */
|
|
if (length < EI_NIDENT)
|
|
return FALSE;
|
|
|
|
/* 32 or 64? */
|
|
|
|
switch (data[EI_CLASS])
|
|
{
|
|
case ELFCLASS32:
|
|
*is_64 = FALSE;
|
|
break;
|
|
|
|
case ELFCLASS64:
|
|
*is_64 = TRUE;
|
|
break;
|
|
|
|
default:
|
|
/* return ERROR */
|
|
return FALSE;
|
|
break;
|
|
}
|
|
|
|
/* big or little endian? */
|
|
switch (data[EI_DATA])
|
|
{
|
|
case ELFDATA2LSB:
|
|
*is_be = FALSE;
|
|
break;
|
|
|
|
case ELFDATA2MSB:
|
|
*is_be = TRUE;
|
|
break;
|
|
|
|
default:
|
|
/* return Error */
|
|
return FALSE;
|
|
break;
|
|
}
|
|
|
|
g_print ("This elf file is %s %s\n",
|
|
*is_64? "64 bit" : "32 bit",
|
|
*is_be? "big endiann" : "little endian");
|
|
|
|
return TRUE;
|
|
}
|
|
|
|
void
|
|
parse_elf (const guchar *data,
|
|
gsize length)
|
|
{
|
|
gboolean is_64, is_big_endian;
|
|
BinFormat *elf_header;
|
|
BinFormat *shn_entry;
|
|
const guchar *section_header;
|
|
BinParser *parser;
|
|
BinParser *sh_parser;
|
|
BinFormat *sym;
|
|
int i;
|
|
|
|
find_elf_type (data, length, &is_64, &is_big_endian);
|
|
|
|
elf_header = bin_format_new (
|
|
is_big_endian,
|
|
"e_ident", bin_field_new_fixed_array (EI_NIDENT, 1),
|
|
|
|
"e_type", bin_field_new_uint16 (),
|
|
"e_machine", bin_field_new_uint16 (),
|
|
"e_version", bin_field_new_uint32 (),
|
|
|
|
"e_entry", make_word (is_64),
|
|
"e_phoff", make_word (is_64),
|
|
|
|
"e_shoff", make_word (is_64),
|
|
"e_flags", make_uint32 (),
|
|
"e_ehsize", make_uint16(),
|
|
"e_phentsize", make_uint16 (),
|
|
"e_phnum", make_uint16 (),
|
|
"e_shentsize", make_uint16 (),
|
|
"e_shnum", make_uint16 (),
|
|
"e_shstrndx", make_uint16 (),
|
|
NULL);
|
|
|
|
shn_entry = bin_format_new (
|
|
is_big_endian,
|
|
"sh_name", make_uint32(),
|
|
"sh_type", make_uint32(),
|
|
"sh_flags", make_word (is_64),
|
|
"sh_addr", make_word (is_64),
|
|
"sh_offset", make_word (is_64),
|
|
"sh_size", make_word (is_64),
|
|
"sh_link", make_uint32(),
|
|
"sh_info", make_uint32(),
|
|
"sh_addralign", make_word (is_64),
|
|
"sh_entsize", make_word (is_64),
|
|
NULL);
|
|
|
|
if (is_64)
|
|
{
|
|
sym = bin_format_new (
|
|
is_big_endian,
|
|
"st_name", make_uint32(),
|
|
"st_info", make_uint8 (),
|
|
"st_other", make_uint8 (),
|
|
"st_shndx", make_uint16 (),
|
|
"st_value", make_uint64 (),
|
|
"st_size", make_uint64 (),
|
|
NULL);
|
|
}
|
|
else
|
|
{
|
|
sym = bin_format_new (
|
|
is_big_endian,
|
|
"st_name", make_uint32 (),
|
|
"st_value", make_uint32 (),
|
|
"st_size", make_uint32 (),
|
|
"st_info", make_uint8 (),
|
|
"st_other", make_uint8 (),
|
|
"st_shndx", make_uint16 ());
|
|
}
|
|
|
|
parser = bin_parser_new (elf_header, data, length);
|
|
|
|
section_header = data + bin_parser_get_uint (parser, "e_shoff");
|
|
|
|
#if 0
|
|
g_print ("section header offset: %u\n",
|
|
section_header - data);
|
|
|
|
g_print ("There are %llu sections\n",
|
|
bin_parser_get_uint (parser, "e_shnum"));
|
|
#endif
|
|
|
|
/* should think through how to deal with offsets, and whether parsers
|
|
* are always considered parsers of an array. If yes, then it
|
|
* may be reasonable to just pass the length of the array.
|
|
*
|
|
* Hmm, although the parser still needs to know the end of the data.
|
|
* Maybe create yet another structure, a subparser, that also contains
|
|
* an offset in addition to the beginning and length.
|
|
*
|
|
* Ie., bin_sub_parser_new (parser, section_header, shn_entry, n_headers);
|
|
*
|
|
* In that case, it might be interesting to merge format and parser,
|
|
* and just call it 'file' or something, then call the subparser "parser"
|
|
*
|
|
* Also, how do we deal with strings?
|
|
*
|
|
* "asdf", make_string()?
|
|
*
|
|
*/
|
|
sh_parser = bin_parser_new (shn_entry, section_header, (guint)-1);
|
|
|
|
for (i = 0; i < bin_parser_get_uint (parser, "e_shnum"); ++i)
|
|
{
|
|
#if 0
|
|
bin_parser_set_index (sh_parser, i);
|
|
#endif
|
|
|
|
#if 0
|
|
bin_parser_get_uint
|
|
parser, data + i * bin_format_length (shn_entry));
|
|
section_header =
|
|
data + bin_parser_get_uint (parser, "e_shoff");
|
|
|
|
parser = bin_parser_new (
|
|
#endif
|
|
}
|
|
|
|
#if 0
|
|
bin_format_array_get_string (shn_table, data, "sh_name");
|
|
|
|
bin_format_array_get_uint (shn_table, data, "sh_addr");
|
|
#endif
|
|
}
|
|
|
|
static void
|
|
disaster (const char *str)
|
|
{
|
|
g_printerr ("%s\n", str);
|
|
|
|
exit (-1);
|
|
}
|
|
|
|
int
|
|
main ()
|
|
{
|
|
GMappedFile *libgtk;
|
|
|
|
libgtk = g_mapped_file_new ("/usr/lib/libgtk-x11-2.0.so", FALSE, NULL);
|
|
|
|
if (!libgtk)
|
|
disaster ("Could not map the file\n");
|
|
|
|
parse_elf ((const guchar *)g_mapped_file_get_contents (libgtk),
|
|
g_mapped_file_get_length (libgtk));
|
|
|
|
return 0 ;
|
|
}
|
|
#endif
|