Arnaldo Carvalho de Melo | a2928c4 | 2009-05-28 14:55:04 -0300 | [diff] [blame] | 1 | #include "util.h" |
| 2 | #include "../perf.h" |
| 3 | #include "symbol.h" |
| 4 | |
| 5 | #include <libelf.h> |
| 6 | #include <gelf.h> |
| 7 | #include <elf.h> |
| 8 | |
| 9 | static struct symbol *symbol__new(uint64_t start, uint64_t len, |
Arnaldo Carvalho de Melo | 0085c954 | 2009-05-28 14:55:13 -0300 | [diff] [blame] | 10 | const char *name, unsigned int priv_size) |
Arnaldo Carvalho de Melo | a2928c4 | 2009-05-28 14:55:04 -0300 | [diff] [blame] | 11 | { |
Arnaldo Carvalho de Melo | 0085c954 | 2009-05-28 14:55:13 -0300 | [diff] [blame] | 12 | size_t namelen = strlen(name) + 1; |
| 13 | struct symbol *self = malloc(priv_size + sizeof(*self) + namelen); |
Arnaldo Carvalho de Melo | a2928c4 | 2009-05-28 14:55:04 -0300 | [diff] [blame] | 14 | |
| 15 | if (self != NULL) { |
Arnaldo Carvalho de Melo | 0085c954 | 2009-05-28 14:55:13 -0300 | [diff] [blame] | 16 | if (priv_size) { |
| 17 | memset(self, 0, priv_size); |
| 18 | self = ((void *)self) + priv_size; |
| 19 | } |
Arnaldo Carvalho de Melo | a2928c4 | 2009-05-28 14:55:04 -0300 | [diff] [blame] | 20 | self->start = start; |
| 21 | self->end = start + len; |
Arnaldo Carvalho de Melo | 0085c954 | 2009-05-28 14:55:13 -0300 | [diff] [blame] | 22 | memcpy(self->name, name, namelen); |
Arnaldo Carvalho de Melo | a2928c4 | 2009-05-28 14:55:04 -0300 | [diff] [blame] | 23 | } |
| 24 | |
| 25 | return self; |
| 26 | } |
| 27 | |
/*
 * Free a symbol created by symbol__new(). The allocation begins priv_size
 * bytes before the symbol itself, so step back to it before freeing.
 */
static void symbol__delete(struct symbol *self, unsigned int priv_size)
{
	char *alloc_start = (char *)self - priv_size;

	free(alloc_start);
}
| 32 | |
| 33 | static size_t symbol__fprintf(struct symbol *self, FILE *fp) |
| 34 | { |
| 35 | return fprintf(fp, " %llx-%llx %s\n", |
| 36 | self->start, self->end, self->name); |
| 37 | } |
| 38 | |
Arnaldo Carvalho de Melo | 0085c954 | 2009-05-28 14:55:13 -0300 | [diff] [blame] | 39 | struct dso *dso__new(const char *name, unsigned int sym_priv_size) |
Arnaldo Carvalho de Melo | a2928c4 | 2009-05-28 14:55:04 -0300 | [diff] [blame] | 40 | { |
| 41 | struct dso *self = malloc(sizeof(*self) + strlen(name) + 1); |
| 42 | |
| 43 | if (self != NULL) { |
| 44 | strcpy(self->name, name); |
| 45 | self->syms = RB_ROOT; |
Arnaldo Carvalho de Melo | 0085c954 | 2009-05-28 14:55:13 -0300 | [diff] [blame] | 46 | self->sym_priv_size = sym_priv_size; |
Arnaldo Carvalho de Melo | a2928c4 | 2009-05-28 14:55:04 -0300 | [diff] [blame] | 47 | } |
| 48 | |
| 49 | return self; |
| 50 | } |
| 51 | |
| 52 | static void dso__delete_symbols(struct dso *self) |
| 53 | { |
| 54 | struct symbol *pos; |
| 55 | struct rb_node *next = rb_first(&self->syms); |
| 56 | |
| 57 | while (next) { |
| 58 | pos = rb_entry(next, struct symbol, rb_node); |
| 59 | next = rb_next(&pos->rb_node); |
Arnaldo Carvalho de Melo | 0085c954 | 2009-05-28 14:55:13 -0300 | [diff] [blame] | 60 | symbol__delete(pos, self->sym_priv_size); |
Arnaldo Carvalho de Melo | a2928c4 | 2009-05-28 14:55:04 -0300 | [diff] [blame] | 61 | } |
| 62 | } |
| 63 | |
/*
 * dso__delete - free a dso together with all of its symbols
 *
 * @self: dso to destroy; NULL is accepted and ignored, like free()
 */
void dso__delete(struct dso *self)
{
	if (self == NULL)
		return;

	dso__delete_symbols(self);
	free(self);
}
| 69 | |
| 70 | static void dso__insert_symbol(struct dso *self, struct symbol *sym) |
| 71 | { |
| 72 | struct rb_node **p = &self->syms.rb_node; |
| 73 | struct rb_node *parent = NULL; |
| 74 | const uint64_t ip = sym->start; |
| 75 | struct symbol *s; |
| 76 | |
| 77 | while (*p != NULL) { |
| 78 | parent = *p; |
| 79 | s = rb_entry(parent, struct symbol, rb_node); |
| 80 | if (ip < s->start) |
| 81 | p = &(*p)->rb_left; |
| 82 | else |
| 83 | p = &(*p)->rb_right; |
| 84 | } |
| 85 | rb_link_node(&sym->rb_node, parent, p); |
| 86 | rb_insert_color(&sym->rb_node, &self->syms); |
| 87 | } |
| 88 | |
| 89 | struct symbol *dso__find_symbol(struct dso *self, uint64_t ip) |
| 90 | { |
| 91 | struct rb_node *n; |
| 92 | |
| 93 | if (self == NULL) |
| 94 | return NULL; |
| 95 | |
| 96 | n = self->syms.rb_node; |
| 97 | |
| 98 | while (n) { |
| 99 | struct symbol *s = rb_entry(n, struct symbol, rb_node); |
| 100 | |
| 101 | if (ip < s->start) |
| 102 | n = n->rb_left; |
| 103 | else if (ip > s->end) |
| 104 | n = n->rb_right; |
| 105 | else |
| 106 | return s; |
| 107 | } |
| 108 | |
| 109 | return NULL; |
| 110 | } |
| 111 | |
| 112 | size_t dso__fprintf(struct dso *self, FILE *fp) |
| 113 | { |
| 114 | size_t ret = fprintf(fp, "dso: %s\n", self->name); |
| 115 | |
| 116 | struct rb_node *nd; |
| 117 | for (nd = rb_first(&self->syms); nd; nd = rb_next(nd)) { |
| 118 | struct symbol *pos = rb_entry(nd, struct symbol, rb_node); |
| 119 | ret += symbol__fprintf(pos, fp); |
| 120 | } |
| 121 | |
| 122 | return ret; |
| 123 | } |
| 124 | |
/*
 * Convert one hexadecimal digit character (either case) to its value.
 * Returns 0..15, or -1 when ch is not a hex digit.
 */
static int hex(char ch)
{
	int value = -1;

	if (ch >= '0' && ch <= '9')
		value = ch - '0';
	else if (ch >= 'a' && ch <= 'f')
		value = 10 + (ch - 'a');
	else if (ch >= 'A' && ch <= 'F')
		value = 10 + (ch - 'A');

	return value;
}
| 135 | |
/*
 * Accumulate the leading run of hex digits of ptr into *long_val, four
 * bits per digit, stopping at the first non-hex character or at the NUL.
 * *long_val is 0 when ptr does not start with a hex digit.
 *
 * Returns the number of characters consumed.
 */
static int hex2long(char *ptr, unsigned long *long_val)
{
	const char *cursor;

	*long_val = 0;

	for (cursor = ptr; *cursor != '\0'; cursor++) {
		const int digit = hex(*cursor);

		if (digit < 0)
			break;

		*long_val = (*long_val << 4) | digit;
	}

	return cursor - ptr;
}
| 157 | |
Arnaldo Carvalho de Melo | 69ee69f | 2009-05-28 14:55:26 -0300 | [diff] [blame^] | 158 | static int dso__load_kallsyms(struct dso *self, symbol_filter_t filter) |
Arnaldo Carvalho de Melo | a2928c4 | 2009-05-28 14:55:04 -0300 | [diff] [blame] | 159 | { |
| 160 | struct rb_node *nd, *prevnd; |
| 161 | char *line = NULL; |
| 162 | size_t n; |
| 163 | FILE *file = fopen("/proc/kallsyms", "r"); |
| 164 | |
| 165 | if (file == NULL) |
| 166 | goto out_failure; |
| 167 | |
| 168 | while (!feof(file)) { |
| 169 | unsigned long start; |
| 170 | struct symbol *sym; |
| 171 | int line_len, len; |
| 172 | char symbol_type; |
| 173 | |
| 174 | line_len = getline(&line, &n, file); |
| 175 | if (line_len < 0) |
| 176 | break; |
| 177 | |
| 178 | if (!line) |
| 179 | goto out_failure; |
| 180 | |
| 181 | line[--line_len] = '\0'; /* \n */ |
| 182 | |
| 183 | len = hex2long(line, &start); |
| 184 | |
| 185 | len++; |
| 186 | if (len + 2 >= line_len) |
| 187 | continue; |
| 188 | |
| 189 | symbol_type = toupper(line[len]); |
| 190 | /* |
| 191 | * We're interested only in code ('T'ext) |
| 192 | */ |
| 193 | if (symbol_type != 'T' && symbol_type != 'W') |
| 194 | continue; |
| 195 | /* |
| 196 | * Well fix up the end later, when we have all sorted. |
| 197 | */ |
Arnaldo Carvalho de Melo | 0085c954 | 2009-05-28 14:55:13 -0300 | [diff] [blame] | 198 | sym = symbol__new(start, 0xdead, line + len + 2, |
| 199 | self->sym_priv_size); |
Arnaldo Carvalho de Melo | a2928c4 | 2009-05-28 14:55:04 -0300 | [diff] [blame] | 200 | |
| 201 | if (sym == NULL) |
| 202 | goto out_delete_line; |
| 203 | |
Arnaldo Carvalho de Melo | 69ee69f | 2009-05-28 14:55:26 -0300 | [diff] [blame^] | 204 | if (filter && filter(self, sym)) |
| 205 | symbol__delete(sym, self->sym_priv_size); |
| 206 | else |
| 207 | dso__insert_symbol(self, sym); |
Arnaldo Carvalho de Melo | a2928c4 | 2009-05-28 14:55:04 -0300 | [diff] [blame] | 208 | } |
| 209 | |
| 210 | /* |
| 211 | * Now that we have all sorted out, just set the ->end of all |
| 212 | * symbols |
| 213 | */ |
| 214 | prevnd = rb_first(&self->syms); |
| 215 | |
| 216 | if (prevnd == NULL) |
| 217 | goto out_delete_line; |
| 218 | |
| 219 | for (nd = rb_next(prevnd); nd; nd = rb_next(nd)) { |
| 220 | struct symbol *prev = rb_entry(prevnd, struct symbol, rb_node), |
| 221 | *curr = rb_entry(nd, struct symbol, rb_node); |
| 222 | |
| 223 | prev->end = curr->start - 1; |
| 224 | prevnd = nd; |
| 225 | } |
| 226 | |
| 227 | free(line); |
| 228 | fclose(file); |
| 229 | |
| 230 | return 0; |
| 231 | |
| 232 | out_delete_line: |
| 233 | free(line); |
| 234 | out_failure: |
| 235 | return -1; |
| 236 | } |
| 237 | |
/**
 * elf_symtab__for_each_symbol - iterate thru all the symbols
 *
 * @syms: symbol table data handed to gelf_getsym()
 * @nr_syms: number of symbols to visit
 * @index: uint32_t index
 * @sym: GElf_Sym iterator
 *
 * gelf_getsym() is also invoked once with @index == @nr_syms when the loop
 * terminates; @sym must not be relied upon after the loop.
 */
#define elf_symtab__for_each_symbol(syms, nr_syms, index, sym)		\
	for ((index) = 0, gelf_getsym((syms), (index), &(sym));		\
	     (index) < (nr_syms);					\
	     (index)++, gelf_getsym((syms), (index), &(sym)))
| 249 | |
| 250 | static inline uint8_t elf_sym__type(const GElf_Sym *sym) |
| 251 | { |
| 252 | return GELF_ST_TYPE(sym->st_info); |
| 253 | } |
| 254 | |
| 255 | static inline int elf_sym__is_function(const GElf_Sym *sym) |
| 256 | { |
| 257 | return elf_sym__type(sym) == STT_FUNC && |
| 258 | sym->st_name != 0 && |
| 259 | sym->st_shndx != SHN_UNDEF && |
| 260 | sym->st_size != 0; |
| 261 | } |
| 262 | |
| 263 | static inline const char *elf_sym__name(const GElf_Sym *sym, |
| 264 | const Elf_Data *symstrs) |
| 265 | { |
| 266 | return symstrs->d_buf + sym->st_name; |
| 267 | } |
| 268 | |
| 269 | static Elf_Scn *elf_section_by_name(Elf *elf, GElf_Ehdr *ep, |
| 270 | GElf_Shdr *shp, const char *name, |
| 271 | size_t *index) |
| 272 | { |
| 273 | Elf_Scn *sec = NULL; |
| 274 | size_t cnt = 1; |
| 275 | |
| 276 | while ((sec = elf_nextscn(elf, sec)) != NULL) { |
| 277 | char *str; |
| 278 | |
| 279 | gelf_getshdr(sec, shp); |
| 280 | str = elf_strptr(elf, ep->e_shstrndx, shp->sh_name); |
| 281 | if (!strcmp(name, str)) { |
| 282 | if (index) |
| 283 | *index = cnt; |
| 284 | break; |
| 285 | } |
| 286 | ++cnt; |
| 287 | } |
| 288 | |
| 289 | return sec; |
| 290 | } |
| 291 | |
Arnaldo Carvalho de Melo | 69ee69f | 2009-05-28 14:55:26 -0300 | [diff] [blame^] | 292 | static int dso__load_sym(struct dso *self, int fd, const char *name, |
| 293 | symbol_filter_t filter) |
Arnaldo Carvalho de Melo | a2928c4 | 2009-05-28 14:55:04 -0300 | [diff] [blame] | 294 | { |
| 295 | Elf_Data *symstrs; |
| 296 | uint32_t nr_syms; |
| 297 | int err = -1; |
| 298 | uint32_t index; |
| 299 | GElf_Ehdr ehdr; |
| 300 | GElf_Shdr shdr; |
| 301 | Elf_Data *syms; |
| 302 | GElf_Sym sym; |
| 303 | Elf_Scn *sec; |
| 304 | Elf *elf; |
| 305 | int nr = 0; |
| 306 | |
| 307 | elf = elf_begin(fd, ELF_C_READ_MMAP, NULL); |
| 308 | if (elf == NULL) { |
| 309 | fprintf(stderr, "%s: cannot read %s ELF file.\n", |
| 310 | __func__, name); |
| 311 | goto out_close; |
| 312 | } |
| 313 | |
| 314 | if (gelf_getehdr(elf, &ehdr) == NULL) { |
| 315 | fprintf(stderr, "%s: cannot get elf header.\n", __func__); |
| 316 | goto out_elf_end; |
| 317 | } |
| 318 | |
| 319 | sec = elf_section_by_name(elf, &ehdr, &shdr, ".symtab", NULL); |
| 320 | if (sec == NULL) |
| 321 | sec = elf_section_by_name(elf, &ehdr, &shdr, ".dynsym", NULL); |
| 322 | |
| 323 | if (sec == NULL) |
| 324 | goto out_elf_end; |
| 325 | |
| 326 | syms = elf_getdata(sec, NULL); |
| 327 | if (syms == NULL) |
| 328 | goto out_elf_end; |
| 329 | |
| 330 | sec = elf_getscn(elf, shdr.sh_link); |
| 331 | if (sec == NULL) |
| 332 | goto out_elf_end; |
| 333 | |
| 334 | symstrs = elf_getdata(sec, NULL); |
| 335 | if (symstrs == NULL) |
| 336 | goto out_elf_end; |
| 337 | |
| 338 | nr_syms = shdr.sh_size / shdr.sh_entsize; |
| 339 | |
| 340 | elf_symtab__for_each_symbol(syms, nr_syms, index, sym) { |
| 341 | struct symbol *f; |
| 342 | |
| 343 | if (!elf_sym__is_function(&sym)) |
| 344 | continue; |
| 345 | |
| 346 | sec = elf_getscn(elf, sym.st_shndx); |
| 347 | if (!sec) |
| 348 | goto out_elf_end; |
| 349 | |
| 350 | gelf_getshdr(sec, &shdr); |
| 351 | sym.st_value -= shdr.sh_addr - shdr.sh_offset; |
| 352 | |
| 353 | f = symbol__new(sym.st_value, sym.st_size, |
Arnaldo Carvalho de Melo | 0085c954 | 2009-05-28 14:55:13 -0300 | [diff] [blame] | 354 | elf_sym__name(&sym, symstrs), |
| 355 | self->sym_priv_size); |
Arnaldo Carvalho de Melo | a2928c4 | 2009-05-28 14:55:04 -0300 | [diff] [blame] | 356 | if (!f) |
| 357 | goto out_elf_end; |
| 358 | |
Arnaldo Carvalho de Melo | 69ee69f | 2009-05-28 14:55:26 -0300 | [diff] [blame^] | 359 | if (filter && filter(self, f)) |
| 360 | symbol__delete(f, self->sym_priv_size); |
| 361 | else { |
| 362 | dso__insert_symbol(self, f); |
| 363 | nr++; |
| 364 | } |
Arnaldo Carvalho de Melo | a2928c4 | 2009-05-28 14:55:04 -0300 | [diff] [blame] | 365 | } |
| 366 | |
| 367 | err = nr; |
| 368 | out_elf_end: |
| 369 | elf_end(elf); |
| 370 | out_close: |
| 371 | return err; |
| 372 | } |
| 373 | |
Arnaldo Carvalho de Melo | 69ee69f | 2009-05-28 14:55:26 -0300 | [diff] [blame^] | 374 | int dso__load(struct dso *self, symbol_filter_t filter) |
Arnaldo Carvalho de Melo | a2928c4 | 2009-05-28 14:55:04 -0300 | [diff] [blame] | 375 | { |
| 376 | int size = strlen(self->name) + sizeof("/usr/lib/debug%s.debug"); |
| 377 | char *name = malloc(size); |
| 378 | int variant = 0; |
| 379 | int ret = -1; |
| 380 | int fd; |
| 381 | |
| 382 | if (!name) |
| 383 | return -1; |
| 384 | |
| 385 | more: |
| 386 | do { |
| 387 | switch (variant) { |
| 388 | case 0: /* Fedora */ |
| 389 | snprintf(name, size, "/usr/lib/debug%s.debug", self->name); |
| 390 | break; |
| 391 | case 1: /* Ubuntu */ |
| 392 | snprintf(name, size, "/usr/lib/debug%s", self->name); |
| 393 | break; |
| 394 | case 2: /* Sane people */ |
| 395 | snprintf(name, size, "%s", self->name); |
| 396 | break; |
| 397 | |
| 398 | default: |
| 399 | goto out; |
| 400 | } |
| 401 | variant++; |
| 402 | |
| 403 | fd = open(name, O_RDONLY); |
| 404 | } while (fd < 0); |
| 405 | |
Arnaldo Carvalho de Melo | 69ee69f | 2009-05-28 14:55:26 -0300 | [diff] [blame^] | 406 | ret = dso__load_sym(self, fd, name, filter); |
Arnaldo Carvalho de Melo | a2928c4 | 2009-05-28 14:55:04 -0300 | [diff] [blame] | 407 | close(fd); |
| 408 | |
| 409 | /* |
| 410 | * Some people seem to have debuginfo files _WITHOUT_ debug info!?!? |
| 411 | */ |
| 412 | if (!ret) |
| 413 | goto more; |
| 414 | |
| 415 | out: |
| 416 | free(name); |
| 417 | return ret; |
| 418 | } |
| 419 | |
Arnaldo Carvalho de Melo | 69ee69f | 2009-05-28 14:55:26 -0300 | [diff] [blame^] | 420 | static int dso__load_vmlinux(struct dso *self, const char *vmlinux, |
| 421 | symbol_filter_t filter) |
Arnaldo Carvalho de Melo | a2928c4 | 2009-05-28 14:55:04 -0300 | [diff] [blame] | 422 | { |
| 423 | int err, fd = open(vmlinux, O_RDONLY); |
| 424 | |
| 425 | if (fd < 0) |
| 426 | return -1; |
| 427 | |
Arnaldo Carvalho de Melo | 69ee69f | 2009-05-28 14:55:26 -0300 | [diff] [blame^] | 428 | err = dso__load_sym(self, fd, vmlinux, filter); |
Arnaldo Carvalho de Melo | a2928c4 | 2009-05-28 14:55:04 -0300 | [diff] [blame] | 429 | close(fd); |
| 430 | |
| 431 | return err; |
| 432 | } |
| 433 | |
Arnaldo Carvalho de Melo | 69ee69f | 2009-05-28 14:55:26 -0300 | [diff] [blame^] | 434 | int dso__load_kernel(struct dso *self, const char *vmlinux, symbol_filter_t filter) |
Arnaldo Carvalho de Melo | a827c87 | 2009-05-28 14:55:19 -0300 | [diff] [blame] | 435 | { |
| 436 | int err = -1; |
| 437 | |
| 438 | if (vmlinux) |
Arnaldo Carvalho de Melo | 69ee69f | 2009-05-28 14:55:26 -0300 | [diff] [blame^] | 439 | err = dso__load_vmlinux(self, vmlinux, filter); |
Arnaldo Carvalho de Melo | a827c87 | 2009-05-28 14:55:19 -0300 | [diff] [blame] | 440 | |
| 441 | if (err) |
Arnaldo Carvalho de Melo | 69ee69f | 2009-05-28 14:55:26 -0300 | [diff] [blame^] | 442 | err = dso__load_kallsyms(self, filter); |
Arnaldo Carvalho de Melo | a827c87 | 2009-05-28 14:55:19 -0300 | [diff] [blame] | 443 | |
| 444 | return err; |
| 445 | } |
| 446 | |
Arnaldo Carvalho de Melo | a2928c4 | 2009-05-28 14:55:04 -0300 | [diff] [blame] | 447 | void symbol__init(void) |
| 448 | { |
| 449 | elf_version(EV_CURRENT); |
| 450 | } |