xref: /linux-6.15/scripts/mod/symsearch.c (revision 4c2598e3)
140745327SJack Brennen // SPDX-License-Identifier: GPL-2.0
240745327SJack Brennen 
340745327SJack Brennen /*
440745327SJack Brennen  * Helper functions for finding the symbol in an ELF which is "nearest"
540745327SJack Brennen  * to a given address.
640745327SJack Brennen  */
7*4c2598e3SMasahiro Yamada #include <xalloc.h>
840745327SJack Brennen #include "modpost.h"
940745327SJack Brennen 
1040745327SJack Brennen struct syminfo {
1140745327SJack Brennen 	unsigned int symbol_index;
1240745327SJack Brennen 	unsigned int section_index;
1340745327SJack Brennen 	Elf_Addr addr;
1440745327SJack Brennen };
1540745327SJack Brennen 
1640745327SJack Brennen /*
1740745327SJack Brennen  * Container used to hold an entire binary search table.
1840745327SJack Brennen  * Entries in table are ascending, sorted first by section_index,
1940745327SJack Brennen  * then by addr, and last by symbol_index.  The sorting by
2040745327SJack Brennen  * symbol_index is used to ensure predictable behavior when
2140745327SJack Brennen  * multiple symbols are present with the same address; all
2240745327SJack Brennen  * symbols past the first are effectively ignored, by eliding
2340745327SJack Brennen  * them in symsearch_fixup().
2440745327SJack Brennen  */
2540745327SJack Brennen struct symsearch {
2640745327SJack Brennen 	unsigned int table_size;
2740745327SJack Brennen 	struct syminfo table[];
2840745327SJack Brennen };
2940745327SJack Brennen 
syminfo_compare(const void * s1,const void * s2)3040745327SJack Brennen static int syminfo_compare(const void *s1, const void *s2)
3140745327SJack Brennen {
3240745327SJack Brennen 	const struct syminfo *sym1 = s1;
3340745327SJack Brennen 	const struct syminfo *sym2 = s2;
3440745327SJack Brennen 
3540745327SJack Brennen 	if (sym1->section_index > sym2->section_index)
3640745327SJack Brennen 		return 1;
3740745327SJack Brennen 	if (sym1->section_index < sym2->section_index)
3840745327SJack Brennen 		return -1;
3940745327SJack Brennen 	if (sym1->addr > sym2->addr)
4040745327SJack Brennen 		return 1;
4140745327SJack Brennen 	if (sym1->addr < sym2->addr)
4240745327SJack Brennen 		return -1;
4340745327SJack Brennen 	if (sym1->symbol_index > sym2->symbol_index)
4440745327SJack Brennen 		return 1;
4540745327SJack Brennen 	if (sym1->symbol_index < sym2->symbol_index)
4640745327SJack Brennen 		return -1;
4740745327SJack Brennen 	return 0;
4840745327SJack Brennen }
4940745327SJack Brennen 
symbol_count(struct elf_info * elf)5040745327SJack Brennen static unsigned int symbol_count(struct elf_info *elf)
5140745327SJack Brennen {
5240745327SJack Brennen 	unsigned int result = 0;
5340745327SJack Brennen 
5440745327SJack Brennen 	for (Elf_Sym *sym = elf->symtab_start; sym < elf->symtab_stop; sym++) {
5540745327SJack Brennen 		if (is_valid_name(elf, sym))
5640745327SJack Brennen 			result++;
5740745327SJack Brennen 	}
5840745327SJack Brennen 	return result;
5940745327SJack Brennen }
6040745327SJack Brennen 
6140745327SJack Brennen /*
6240745327SJack Brennen  * Populate the search array that we just allocated.
6340745327SJack Brennen  * Be slightly paranoid here.  The ELF file is mmap'd and could
6440745327SJack Brennen  * conceivably change between symbol_count() and symsearch_populate().
6540745327SJack Brennen  * If we notice any difference, bail out rather than potentially
6640745327SJack Brennen  * propagating errors or crashing.
6740745327SJack Brennen  */
symsearch_populate(struct elf_info * elf,struct syminfo * table,unsigned int table_size)6840745327SJack Brennen static void symsearch_populate(struct elf_info *elf,
6940745327SJack Brennen 			       struct syminfo *table,
7040745327SJack Brennen 			       unsigned int table_size)
7140745327SJack Brennen {
7240745327SJack Brennen 	bool is_arm = (elf->hdr->e_machine == EM_ARM);
7340745327SJack Brennen 
7440745327SJack Brennen 	for (Elf_Sym *sym = elf->symtab_start; sym < elf->symtab_stop; sym++) {
7540745327SJack Brennen 		if (is_valid_name(elf, sym)) {
7640745327SJack Brennen 			if (table_size-- == 0)
7740745327SJack Brennen 				fatal("%s: size mismatch\n", __func__);
7840745327SJack Brennen 			table->symbol_index = sym - elf->symtab_start;
7940745327SJack Brennen 			table->section_index = get_secindex(elf, sym);
8040745327SJack Brennen 			table->addr = sym->st_value;
8140745327SJack Brennen 
8240745327SJack Brennen 			/*
8340745327SJack Brennen 			 * For ARM Thumb instruction, the bit 0 of st_value is
8440745327SJack Brennen 			 * set if the symbol is STT_FUNC type. Mask it to get
8540745327SJack Brennen 			 * the address.
8640745327SJack Brennen 			 */
8740745327SJack Brennen 			if (is_arm && ELF_ST_TYPE(sym->st_info) == STT_FUNC)
8840745327SJack Brennen 				table->addr &= ~1;
8940745327SJack Brennen 
9040745327SJack Brennen 			table++;
9140745327SJack Brennen 		}
9240745327SJack Brennen 	}
9340745327SJack Brennen 
9440745327SJack Brennen 	if (table_size != 0)
9540745327SJack Brennen 		fatal("%s: size mismatch\n", __func__);
9640745327SJack Brennen }
9740745327SJack Brennen 
9840745327SJack Brennen /*
9940745327SJack Brennen  * Do any fixups on the table after sorting.
10040745327SJack Brennen  * For now, this just finds adjacent entries which have
10140745327SJack Brennen  * the same section_index and addr, and it propagates
10240745327SJack Brennen  * the first symbol_index over the subsequent entries,
10340745327SJack Brennen  * so that only one symbol_index is seen for any given
10440745327SJack Brennen  * section_index and addr.  This ensures that whether
10540745327SJack Brennen  * we're looking at an address from "above" or "below"
10640745327SJack Brennen  * that we see the same symbol_index.
10740745327SJack Brennen  * This does leave some duplicate entries in the table;
10840745327SJack Brennen  * in practice, these are a small fraction of the
10940745327SJack Brennen  * total number of entries, and they are harmless to
11040745327SJack Brennen  * the binary search algorithm other than a few occasional
11140745327SJack Brennen  * unnecessary comparisons.
11240745327SJack Brennen  */
symsearch_fixup(struct syminfo * table,unsigned int table_size)11340745327SJack Brennen static void symsearch_fixup(struct syminfo *table, unsigned int table_size)
11440745327SJack Brennen {
11540745327SJack Brennen 	/* Don't look at index 0, it will never change. */
11640745327SJack Brennen 	for (unsigned int i = 1; i < table_size; i++) {
11740745327SJack Brennen 		if (table[i].addr == table[i - 1].addr &&
11840745327SJack Brennen 		    table[i].section_index == table[i - 1].section_index) {
11940745327SJack Brennen 			table[i].symbol_index = table[i - 1].symbol_index;
12040745327SJack Brennen 		}
12140745327SJack Brennen 	}
12240745327SJack Brennen }
12340745327SJack Brennen 
symsearch_init(struct elf_info * elf)12440745327SJack Brennen void symsearch_init(struct elf_info *elf)
12540745327SJack Brennen {
12640745327SJack Brennen 	unsigned int table_size = symbol_count(elf);
12740745327SJack Brennen 
128*4c2598e3SMasahiro Yamada 	elf->symsearch = xmalloc(sizeof(struct symsearch) +
129*4c2598e3SMasahiro Yamada 				       sizeof(struct syminfo) * table_size);
13040745327SJack Brennen 	elf->symsearch->table_size = table_size;
13140745327SJack Brennen 
13240745327SJack Brennen 	symsearch_populate(elf, elf->symsearch->table, table_size);
13340745327SJack Brennen 	qsort(elf->symsearch->table, table_size,
13440745327SJack Brennen 	      sizeof(struct syminfo), syminfo_compare);
13540745327SJack Brennen 
13640745327SJack Brennen 	symsearch_fixup(elf->symsearch->table, table_size);
13740745327SJack Brennen }
13840745327SJack Brennen 
symsearch_finish(struct elf_info * elf)13940745327SJack Brennen void symsearch_finish(struct elf_info *elf)
14040745327SJack Brennen {
14140745327SJack Brennen 	free(elf->symsearch);
14240745327SJack Brennen 	elf->symsearch = NULL;
14340745327SJack Brennen }
14440745327SJack Brennen 
14540745327SJack Brennen /*
14640745327SJack Brennen  * Find the syminfo which is in secndx and "nearest" to addr.
14740745327SJack Brennen  * allow_negative: allow returning a symbol whose address is > addr.
14840745327SJack Brennen  * min_distance: ignore symbols which are further away than this.
14940745327SJack Brennen  *
15040745327SJack Brennen  * Returns a pointer into the symbol table for success.
15140745327SJack Brennen  * Returns NULL if no legal symbol is found within the requested range.
15240745327SJack Brennen  */
symsearch_find_nearest(struct elf_info * elf,Elf_Addr addr,unsigned int secndx,bool allow_negative,Elf_Addr min_distance)15340745327SJack Brennen Elf_Sym *symsearch_find_nearest(struct elf_info *elf, Elf_Addr addr,
15440745327SJack Brennen 				unsigned int secndx, bool allow_negative,
15540745327SJack Brennen 				Elf_Addr min_distance)
15640745327SJack Brennen {
15740745327SJack Brennen 	unsigned int hi = elf->symsearch->table_size;
15840745327SJack Brennen 	unsigned int lo = 0;
15940745327SJack Brennen 	struct syminfo *table = elf->symsearch->table;
16040745327SJack Brennen 	struct syminfo target;
16140745327SJack Brennen 
16240745327SJack Brennen 	target.addr = addr;
16340745327SJack Brennen 	target.section_index = secndx;
16440745327SJack Brennen 	target.symbol_index = ~0;  /* compares greater than any actual index */
16540745327SJack Brennen 	while (hi > lo) {
16640745327SJack Brennen 		unsigned int mid = lo + (hi - lo) / 2;  /* Avoids overflow */
16740745327SJack Brennen 
16840745327SJack Brennen 		if (syminfo_compare(&table[mid], &target) > 0)
16940745327SJack Brennen 			hi = mid;
17040745327SJack Brennen 		else
17140745327SJack Brennen 			lo = mid + 1;
17240745327SJack Brennen 	}
17340745327SJack Brennen 
17440745327SJack Brennen 	/*
17540745327SJack Brennen 	 * table[hi], if it exists, is the first entry in the array which
17640745327SJack Brennen 	 * lies beyond target.  table[hi - 1], if it exists, is the last
17740745327SJack Brennen 	 * entry in the array which comes before target, including the
17840745327SJack Brennen 	 * case where it perfectly matches the section and the address.
17940745327SJack Brennen 	 *
18040745327SJack Brennen 	 * Note -- if the address we're looking up falls perfectly
18140745327SJack Brennen 	 * in the middle of two symbols, this is written to always
18240745327SJack Brennen 	 * prefer the symbol with the lower address.
18340745327SJack Brennen 	 */
18440745327SJack Brennen 	Elf_Sym *result = NULL;
18540745327SJack Brennen 
18640745327SJack Brennen 	if (allow_negative &&
18740745327SJack Brennen 	    hi < elf->symsearch->table_size &&
18840745327SJack Brennen 	    table[hi].section_index == secndx &&
18940745327SJack Brennen 	    table[hi].addr - addr <= min_distance) {
19040745327SJack Brennen 		min_distance = table[hi].addr - addr;
19140745327SJack Brennen 		result = &elf->symtab_start[table[hi].symbol_index];
19240745327SJack Brennen 	}
19340745327SJack Brennen 	if (hi > 0 &&
19440745327SJack Brennen 	    table[hi - 1].section_index == secndx &&
19540745327SJack Brennen 	    addr - table[hi - 1].addr <= min_distance) {
19640745327SJack Brennen 		result = &elf->symtab_start[table[hi - 1].symbol_index];
19740745327SJack Brennen 	}
19840745327SJack Brennen 	return result;
19940745327SJack Brennen }
200