| 1 | // SPDX-License-Identifier: GPL-2.0 |
| 2 | /* |
| 3 | * Copyright (C) 2024 Google LLC |
| 4 | */ |
| 5 | |
| 6 | #define _GNU_SOURCE |
| 7 | #include <inttypes.h> |
| 8 | #include <stdio.h> |
| 9 | #include <zlib.h> |
| 10 | |
| 11 | #include "gendwarfksyms.h" |
| 12 | |
| 13 | static struct cache expansion_cache; |
| 14 | |
| 15 | /* |
| 16 | * A simple linked list of shared or owned strings to avoid copying strings |
| 17 | * around when not necessary. |
| 18 | */ |
| 19 | struct type_list_entry { |
| 20 | const char *str; |
| 21 | void *owned; |
| 22 | struct list_head list; |
| 23 | }; |
| 24 | |
| 25 | static void type_list_free(struct list_head *list) |
| 26 | { |
| 27 | struct type_list_entry *entry; |
| 28 | struct type_list_entry *tmp; |
| 29 | |
| 30 | list_for_each_entry_safe(entry, tmp, list, list) { |
| 31 | if (entry->owned) |
| 32 | free(ptr: entry->owned); |
| 33 | free(ptr: entry); |
| 34 | } |
| 35 | |
| 36 | INIT_LIST_HEAD(list); |
| 37 | } |
| 38 | |
| 39 | static int type_list_append(struct list_head *list, const char *s, void *owned) |
| 40 | { |
| 41 | struct type_list_entry *entry; |
| 42 | |
| 43 | if (!s) |
| 44 | return 0; |
| 45 | |
| 46 | entry = xmalloc(sizeof(struct type_list_entry)); |
| 47 | entry->str = s; |
| 48 | entry->owned = owned; |
| 49 | list_add_tail(&entry->list, list); |
| 50 | |
| 51 | return strlen(entry->str); |
| 52 | } |
| 53 | |
| 54 | static void type_list_write(struct list_head *list, FILE *file) |
| 55 | { |
| 56 | struct type_list_entry *entry; |
| 57 | |
| 58 | list_for_each_entry(entry, list, list) { |
| 59 | if (entry->str) |
| 60 | checkp(fputs(entry->str, file)); |
| 61 | } |
| 62 | } |
| 63 | |
| 64 | /* |
| 65 | * An expanded type string in symtypes format. |
| 66 | */ |
| 67 | struct type_expansion { |
| 68 | char *name; |
| 69 | size_t len; |
| 70 | struct list_head expanded; |
| 71 | struct hlist_node hash; |
| 72 | }; |
| 73 | |
| 74 | static void type_expansion_init(struct type_expansion *type) |
| 75 | { |
| 76 | type->name = NULL; |
| 77 | type->len = 0; |
| 78 | INIT_LIST_HEAD(&type->expanded); |
| 79 | } |
| 80 | |
| 81 | static inline void type_expansion_free(struct type_expansion *type) |
| 82 | { |
| 83 | free(ptr: type->name); |
| 84 | type->name = NULL; |
| 85 | type->len = 0; |
| 86 | type_list_free(list: &type->expanded); |
| 87 | } |
| 88 | |
| 89 | static void type_expansion_append(struct type_expansion *type, const char *s, |
| 90 | void *owned) |
| 91 | { |
| 92 | type->len += type_list_append(list: &type->expanded, s, owned); |
| 93 | } |
| 94 | |
| 95 | /* |
| 96 | * type_map -- the longest expansions for each type. |
| 97 | * |
| 98 | * const char *name -> struct type_expansion * |
| 99 | */ |
| 100 | #define TYPE_HASH_BITS 12 |
| 101 | static HASHTABLE_DEFINE(type_map, 1 << TYPE_HASH_BITS); |
| 102 | |
| 103 | static int __type_map_get(const char *name, struct type_expansion **res) |
| 104 | { |
| 105 | struct type_expansion *e; |
| 106 | |
| 107 | hash_for_each_possible(type_map, e, hash, hash_str(name)) { |
| 108 | if (!strcmp(name, e->name)) { |
| 109 | *res = e; |
| 110 | return 0; |
| 111 | } |
| 112 | } |
| 113 | |
| 114 | return -1; |
| 115 | } |
| 116 | |
| 117 | static struct type_expansion *type_map_add(const char *name, |
| 118 | struct type_expansion *type) |
| 119 | { |
| 120 | struct type_expansion *e; |
| 121 | |
| 122 | if (__type_map_get(name, res: &e)) { |
| 123 | e = xmalloc(sizeof(struct type_expansion)); |
| 124 | type_expansion_init(type: e); |
| 125 | e->name = xstrdup(name); |
| 126 | |
| 127 | hash_add(type_map, &e->hash, hash_str(e->name)); |
| 128 | |
| 129 | if (dump_types) |
| 130 | debug("adding %s" , e->name); |
| 131 | } else { |
| 132 | /* Use the longest available expansion */ |
| 133 | if (type->len <= e->len) |
| 134 | return e; |
| 135 | |
| 136 | type_list_free(list: &e->expanded); |
| 137 | |
| 138 | if (dump_types) |
| 139 | debug("replacing %s" , e->name); |
| 140 | } |
| 141 | |
| 142 | /* Take ownership of type->expanded */ |
| 143 | list_replace_init(&type->expanded, &e->expanded); |
| 144 | e->len = type->len; |
| 145 | |
| 146 | if (dump_types) { |
| 147 | checkp(fputs(e->name, stderr)); |
| 148 | checkp(fputs(" " , stderr)); |
| 149 | type_list_write(list: &e->expanded, stderr); |
| 150 | checkp(fputs("\n" , stderr)); |
| 151 | } |
| 152 | |
| 153 | return e; |
| 154 | } |
| 155 | |
| 156 | static void type_parse(const char *name, const char *str, |
| 157 | struct type_expansion *type); |
| 158 | |
| 159 | static int type_map_get(const char *name, struct type_expansion **res) |
| 160 | { |
| 161 | struct type_expansion type; |
| 162 | const char *override; |
| 163 | |
| 164 | if (!__type_map_get(name, res)) |
| 165 | return 0; |
| 166 | |
| 167 | /* |
| 168 | * If die_map didn't contain a type, we might still have |
| 169 | * a type_string kABI rule that defines it. |
| 170 | */ |
| 171 | if (stable && kabi_get_type_string(type: name, str: &override)) { |
| 172 | type_expansion_init(type: &type); |
| 173 | type_parse(name, str: override, type: &type); |
| 174 | *res = type_map_add(name, type: &type); |
| 175 | type_expansion_free(type: &type); |
| 176 | return 0; |
| 177 | } |
| 178 | |
| 179 | return -1; |
| 180 | } |
| 181 | |
| 182 | static void type_map_write(FILE *file) |
| 183 | { |
| 184 | struct type_expansion *e; |
| 185 | struct hlist_node *tmp; |
| 186 | |
| 187 | if (!file) |
| 188 | return; |
| 189 | |
| 190 | hash_for_each_safe(type_map, e, tmp, hash) { |
| 191 | checkp(fputs(e->name, file)); |
| 192 | checkp(fputs(" " , file)); |
| 193 | type_list_write(list: &e->expanded, file); |
| 194 | checkp(fputs("\n" , file)); |
| 195 | } |
| 196 | } |
| 197 | |
| 198 | static void type_map_free(void) |
| 199 | { |
| 200 | struct type_expansion *e; |
| 201 | struct hlist_node *tmp; |
| 202 | |
| 203 | hash_for_each_safe(type_map, e, tmp, hash) { |
| 204 | type_expansion_free(type: e); |
| 205 | free(ptr: e); |
| 206 | } |
| 207 | |
| 208 | hash_init(type_map); |
| 209 | } |
| 210 | |
| 211 | /* |
| 212 | * CRC for a type, with an optional fully expanded type string for |
| 213 | * debugging. |
| 214 | */ |
| 215 | struct version { |
| 216 | struct type_expansion type; |
| 217 | unsigned long crc; |
| 218 | }; |
| 219 | |
| 220 | static void version_init(struct version *version) |
| 221 | { |
| 222 | version->crc = crc32(crc: 0, NULL, len: 0); |
| 223 | type_expansion_init(type: &version->type); |
| 224 | } |
| 225 | |
| 226 | static void version_free(struct version *version) |
| 227 | { |
| 228 | type_expansion_free(type: &version->type); |
| 229 | } |
| 230 | |
| 231 | static void version_add(struct version *version, const char *s) |
| 232 | { |
| 233 | version->crc = crc32(crc: version->crc, buf: (void *)s, len: strlen(s)); |
| 234 | if (dump_versions) |
| 235 | type_expansion_append(type: &version->type, s, NULL); |
| 236 | } |
| 237 | |
| 238 | /* |
| 239 | * Type reference format: <prefix>#<name>, where prefix: |
| 240 | * s -> structure |
| 241 | * u -> union |
| 242 | * e -> enum |
| 243 | * t -> typedef |
| 244 | * |
| 245 | * Names with spaces are additionally wrapped in single quotes. |
| 246 | */ |
| 247 | static inline bool is_type_prefix(const char *s) |
| 248 | { |
| 249 | return (s[0] == 's' || s[0] == 'u' || s[0] == 'e' || s[0] == 't') && |
| 250 | s[1] == '#'; |
| 251 | } |
| 252 | |
| 253 | static char get_type_prefix(int tag) |
| 254 | { |
| 255 | switch (tag) { |
| 256 | case DW_TAG_class_type: |
| 257 | case DW_TAG_structure_type: |
| 258 | return 's'; |
| 259 | case DW_TAG_union_type: |
| 260 | return 'u'; |
| 261 | case DW_TAG_enumeration_type: |
| 262 | return 'e'; |
| 263 | case DW_TAG_typedef_type: |
| 264 | return 't'; |
| 265 | default: |
| 266 | return 0; |
| 267 | } |
| 268 | } |
| 269 | |
| 270 | static char *get_type_name(struct die *cache) |
| 271 | { |
| 272 | const char *quote; |
| 273 | char prefix; |
| 274 | char *name; |
| 275 | |
| 276 | if (cache->state == DIE_INCOMPLETE) { |
| 277 | warn("found incomplete cache entry: %p" , cache); |
| 278 | return NULL; |
| 279 | } |
| 280 | if (cache->state == DIE_SYMBOL || cache->state == DIE_FQN) |
| 281 | return NULL; |
| 282 | if (!cache->fqn || !*cache->fqn) |
| 283 | return NULL; |
| 284 | |
| 285 | prefix = get_type_prefix(tag: cache->tag); |
| 286 | if (!prefix) |
| 287 | return NULL; |
| 288 | |
| 289 | /* Wrap names with spaces in single quotes */ |
| 290 | quote = strstr(cache->fqn, " " ) ? "'" : "" ; |
| 291 | |
| 292 | /* <prefix>#<type_name>\0 */ |
| 293 | if (asprintf(ptr: &name, fmt: "%c#%s%s%s" , prefix, quote, cache->fqn, quote) < 0) |
| 294 | error("asprintf failed for '%s'" , cache->fqn); |
| 295 | |
| 296 | return name; |
| 297 | } |
| 298 | |
| 299 | static void __calculate_version(struct version *version, |
| 300 | struct type_expansion *type) |
| 301 | { |
| 302 | struct type_list_entry *entry; |
| 303 | struct type_expansion *e; |
| 304 | |
| 305 | /* Calculate a CRC over an expanded type string */ |
| 306 | list_for_each_entry(entry, &type->expanded, list) { |
| 307 | if (is_type_prefix(s: entry->str)) { |
| 308 | if (type_map_get(name: entry->str, res: &e)) |
| 309 | error("unknown type reference to '%s' when expanding '%s'" , |
| 310 | entry->str, type->name); |
| 311 | |
| 312 | /* |
| 313 | * It's sufficient to expand each type reference just |
| 314 | * once to detect changes. |
| 315 | */ |
| 316 | if (cache_was_expanded(cache: &expansion_cache, addr: e)) { |
| 317 | version_add(version, s: entry->str); |
| 318 | } else { |
| 319 | cache_mark_expanded(cache: &expansion_cache, addr: e); |
| 320 | __calculate_version(version, type: e); |
| 321 | } |
| 322 | } else { |
| 323 | version_add(version, s: entry->str); |
| 324 | } |
| 325 | } |
| 326 | } |
| 327 | |
| 328 | static void calculate_version(struct version *version, |
| 329 | struct type_expansion *type) |
| 330 | { |
| 331 | version_init(version); |
| 332 | __calculate_version(version, type); |
| 333 | cache_free(cache: &expansion_cache); |
| 334 | } |
| 335 | |
| 336 | static void __type_expand(struct die *cache, struct type_expansion *type, |
| 337 | bool recursive); |
| 338 | |
| 339 | static void type_expand_child(struct die *cache, struct type_expansion *type, |
| 340 | bool recursive) |
| 341 | { |
| 342 | struct type_expansion child; |
| 343 | char *name; |
| 344 | |
| 345 | name = get_type_name(cache); |
| 346 | if (!name) { |
| 347 | __type_expand(cache, type, recursive); |
| 348 | return; |
| 349 | } |
| 350 | |
| 351 | if (recursive && !__cache_was_expanded(cache: &expansion_cache, addr: cache->addr)) { |
| 352 | __cache_mark_expanded(cache: &expansion_cache, addr: cache->addr); |
| 353 | type_expansion_init(type: &child); |
| 354 | __type_expand(cache, type: &child, true); |
| 355 | type_map_add(name, type: &child); |
| 356 | type_expansion_free(type: &child); |
| 357 | } |
| 358 | |
| 359 | type_expansion_append(type, s: name, owned: name); |
| 360 | } |
| 361 | |
| 362 | static void __type_expand(struct die *cache, struct type_expansion *type, |
| 363 | bool recursive) |
| 364 | { |
| 365 | struct die_fragment *df; |
| 366 | struct die *child; |
| 367 | |
| 368 | list_for_each_entry(df, &cache->fragments, list) { |
| 369 | switch (df->type) { |
| 370 | case FRAGMENT_STRING: |
| 371 | type_expansion_append(type, s: df->data.str, NULL); |
| 372 | break; |
| 373 | case FRAGMENT_DIE: |
| 374 | /* Use a complete die_map expansion if available */ |
| 375 | if (__die_map_get(addr: df->data.addr, state: DIE_COMPLETE, |
| 376 | res: &child) && |
| 377 | __die_map_get(addr: df->data.addr, state: DIE_UNEXPANDED, |
| 378 | res: &child)) |
| 379 | error("unknown child: %" PRIxPTR, |
| 380 | df->data.addr); |
| 381 | |
| 382 | type_expand_child(cache: child, type, recursive); |
| 383 | break; |
| 384 | case FRAGMENT_LINEBREAK: |
| 385 | /* |
| 386 | * Keep whitespace in the symtypes format, but avoid |
| 387 | * repeated spaces. |
| 388 | */ |
| 389 | if (list_is_last(&df->list, &cache->fragments) || |
| 390 | list_next_entry(df, list)->type != |
| 391 | FRAGMENT_LINEBREAK) |
| 392 | type_expansion_append(type, s: " " , NULL); |
| 393 | break; |
| 394 | default: |
| 395 | error("empty die_fragment in %p" , cache); |
| 396 | } |
| 397 | } |
| 398 | } |
| 399 | |
| 400 | static void type_expand(struct die *cache, struct type_expansion *type, |
| 401 | bool recursive) |
| 402 | { |
| 403 | type_expansion_init(type); |
| 404 | __type_expand(cache, type, recursive); |
| 405 | cache_free(cache: &expansion_cache); |
| 406 | } |
| 407 | |
| 408 | static void type_parse(const char *name, const char *str, |
| 409 | struct type_expansion *type) |
| 410 | { |
| 411 | char *fragment; |
| 412 | size_t start = 0; |
| 413 | size_t end; |
| 414 | size_t pos; |
| 415 | |
| 416 | if (!*str) |
| 417 | error("empty type string override for '%s'" , name); |
| 418 | |
| 419 | type_expansion_init(type); |
| 420 | |
| 421 | for (pos = 0; str[pos]; ++pos) { |
| 422 | bool empty; |
| 423 | char marker = ' '; |
| 424 | |
| 425 | if (!is_type_prefix(s: &str[pos])) |
| 426 | continue; |
| 427 | |
| 428 | end = pos + 2; |
| 429 | |
| 430 | /* |
| 431 | * Find the end of the type reference. If the type name contains |
| 432 | * spaces, it must be in single quotes. |
| 433 | */ |
| 434 | if (str[end] == '\'') { |
| 435 | marker = '\''; |
| 436 | ++end; |
| 437 | } |
| 438 | while (str[end] && str[end] != marker) |
| 439 | ++end; |
| 440 | |
| 441 | /* Check that we have a non-empty type name */ |
| 442 | if (marker == '\'') { |
| 443 | if (str[end] != marker) |
| 444 | error("incomplete %c# type reference for '%s' (string : '%s')" , |
| 445 | str[pos], name, str); |
| 446 | empty = end == pos + 3; |
| 447 | ++end; |
| 448 | } else { |
| 449 | empty = end == pos + 2; |
| 450 | } |
| 451 | if (empty) |
| 452 | error("empty %c# type name for '%s' (string: '%s')" , |
| 453 | str[pos], name, str); |
| 454 | |
| 455 | /* Append the part of the string before the type reference */ |
| 456 | if (pos > start) { |
| 457 | fragment = xstrndup(&str[start], pos - start); |
| 458 | type_expansion_append(type, s: fragment, owned: fragment); |
| 459 | } |
| 460 | |
| 461 | /* |
| 462 | * Append the type reference -- note that if the reference |
| 463 | * is invalid, i.e. points to a non-existent type, we will |
| 464 | * print out an error when calculating versions. |
| 465 | */ |
| 466 | fragment = xstrndup(&str[pos], end - pos); |
| 467 | type_expansion_append(type, s: fragment, owned: fragment); |
| 468 | |
| 469 | start = end; |
| 470 | pos = end - 1; |
| 471 | } |
| 472 | |
| 473 | /* Append the rest of the type string, if there's any left */ |
| 474 | if (str[start]) |
| 475 | type_expansion_append(type, s: &str[start], NULL); |
| 476 | } |
| 477 | |
| 478 | static void expand_type(struct die *cache, void *arg) |
| 479 | { |
| 480 | struct type_expansion type; |
| 481 | const char *override; |
| 482 | char *name; |
| 483 | |
| 484 | if (cache->mapped) |
| 485 | return; |
| 486 | |
| 487 | cache->mapped = true; |
| 488 | |
| 489 | /* |
| 490 | * Skip unexpanded die_map entries if there's a complete |
| 491 | * expansion available for this DIE. |
| 492 | */ |
| 493 | if (cache->state == DIE_UNEXPANDED && |
| 494 | !__die_map_get(addr: cache->addr, state: DIE_COMPLETE, res: &cache)) { |
| 495 | if (cache->mapped) |
| 496 | return; |
| 497 | |
| 498 | cache->mapped = true; |
| 499 | } |
| 500 | |
| 501 | name = get_type_name(cache); |
| 502 | if (!name) |
| 503 | return; |
| 504 | |
| 505 | debug("%s" , name); |
| 506 | |
| 507 | if (stable && kabi_get_type_string(type: name, str: &override)) |
| 508 | type_parse(name, str: override, type: &type); |
| 509 | else |
| 510 | type_expand(cache, type: &type, true); |
| 511 | |
| 512 | type_map_add(name, type: &type); |
| 513 | type_expansion_free(type: &type); |
| 514 | free(ptr: name); |
| 515 | } |
| 516 | |
| 517 | static void expand_symbol(struct symbol *sym, void *arg) |
| 518 | { |
| 519 | struct type_expansion type; |
| 520 | struct version version; |
| 521 | const char *override; |
| 522 | struct die *cache; |
| 523 | |
| 524 | /* |
| 525 | * No need to expand again unless we want a symtypes file entry |
| 526 | * for the symbol. Note that this means `sym` has the same address |
| 527 | * as another symbol that was already processed. |
| 528 | */ |
| 529 | if (!symtypes && sym->state == SYMBOL_PROCESSED) |
| 530 | return; |
| 531 | |
| 532 | if (__die_map_get(addr: sym->die_addr, state: DIE_SYMBOL, res: &cache)) |
| 533 | return; /* We'll warn about missing CRCs later. */ |
| 534 | |
| 535 | if (stable && kabi_get_type_string(type: sym->name, str: &override)) |
| 536 | type_parse(name: sym->name, str: override, type: &type); |
| 537 | else |
| 538 | type_expand(cache, type: &type, false); |
| 539 | |
| 540 | /* If the symbol already has a version, don't calculate it again. */ |
| 541 | if (sym->state != SYMBOL_PROCESSED) { |
| 542 | calculate_version(version: &version, type: &type); |
| 543 | symbol_set_crc(sym, crc: version.crc); |
| 544 | debug("%s = %lx" , sym->name, version.crc); |
| 545 | |
| 546 | if (dump_versions) { |
| 547 | checkp(fputs(sym->name, stderr)); |
| 548 | checkp(fputs(" " , stderr)); |
| 549 | type_list_write(list: &version.type.expanded, stderr); |
| 550 | checkp(fputs("\n" , stderr)); |
| 551 | } |
| 552 | |
| 553 | version_free(version: &version); |
| 554 | } |
| 555 | |
| 556 | /* These aren't needed in type_map unless we want a symtypes file. */ |
| 557 | if (symtypes) |
| 558 | type_map_add(name: sym->name, type: &type); |
| 559 | |
| 560 | type_expansion_free(type: &type); |
| 561 | } |
| 562 | |
| 563 | void generate_symtypes_and_versions(FILE *file) |
| 564 | { |
| 565 | cache_init(cache: &expansion_cache); |
| 566 | |
| 567 | /* |
| 568 | * die_map processing: |
| 569 | * |
| 570 | * 1. die_map contains all types referenced in exported symbol |
| 571 | * signatures, but can contain duplicates just like the original |
| 572 | * DWARF, and some references may not be fully expanded depending |
| 573 | * on how far we processed the DIE tree for that specific symbol. |
| 574 | * |
| 575 | * For each die_map entry, find the longest available expansion, |
| 576 | * and add it to type_map. |
| 577 | */ |
| 578 | die_map_for_each(func: expand_type, NULL); |
| 579 | |
| 580 | /* |
| 581 | * 2. For each exported symbol, expand the die_map type, and use |
| 582 | * type_map expansions to calculate a symbol version from the |
| 583 | * fully expanded type string. |
| 584 | */ |
| 585 | symbol_for_each(func: expand_symbol, NULL); |
| 586 | |
| 587 | /* |
| 588 | * 3. If a symtypes file is requested, write type_map contents to |
| 589 | * the file. |
| 590 | */ |
| 591 | type_map_write(file); |
| 592 | type_map_free(); |
| 593 | } |
| 594 | |