1 // SPDX-License-Identifier: GPL-2.0-only
3 * kallsyms.c: in-kernel printing of symbolic oopses and stack traces.
5 * Rewritten and vastly simplified by Rusty Russell for in-kernel
12 * Changed the compression method from stem compression to "table lookup"
13 * compression (see scripts/kallsyms.c for a more complete description)
15 #include <linux/kallsyms.h>
16 #include <linux/init.h>
17 #include <linux/seq_file.h>
19 #include <linux/kdb.h>
20 #include <linux/err.h>
21 #include <linux/proc_fs.h>
22 #include <linux/sched.h> /* for cond_resched */
23 #include <linux/ctype.h>
24 #include <linux/slab.h>
25 #include <linux/filter.h>
26 #include <linux/ftrace.h>
27 #include <linux/kprobes.h>
28 #include <linux/build_bug.h>
29 #include <linux/compiler.h>
30 #include <linux/module.h>
31 #include <linux/kernel.h>
32 #include <linux/bsearch.h>
33 #include <linux/btf_ids.h>
35 #include "kallsyms_internal.h"
38 * Expand a compressed symbol data into the resulting uncompressed string,
39 * if uncompressed string is too long (>= maxlen), it will be truncated,
40 * given the offset to where the symbol is in the compressed stream.
42 static unsigned int kallsyms_expand_symbol(unsigned int off,
43 char *result, size_t maxlen)
45 int len, skipped_first = 0;
49 /* Get the compressed symbol length from the first symbol byte. */
50 data = &kallsyms_names[off];
55 /* If MSB is 1, it is a "big" symbol, so needs an additional byte. */
56 if ((len & 0x80) != 0) {
57 len = (len & 0x7F) | (*data << 7);
63 * Update the offset to return the offset for the next symbol on
64 * the compressed stream.
69 * For every byte on the compressed symbol data, copy the table
70 * entry for that byte.
73 tptr = &kallsyms_token_table[kallsyms_token_index[*data]];
94 /* Return the offset to the next symbol. */
99 * Get symbol type information. This is encoded as a single char at the
100 * beginning of the symbol name.
102 static char kallsyms_get_symbol_type(unsigned int off)
105 * Get just the first code, look it up in the token table,
106 * and return the first char from this token.
108 return kallsyms_token_table[kallsyms_token_index[kallsyms_names[off + 1]]];
113 * Find the offset on the compressed stream given an index in the
116 static unsigned int get_symbol_offset(unsigned long pos)
122 * Use the closest marker we have. We have markers every 256 positions,
123 * so that should be close enough.
125 name = &kallsyms_names[kallsyms_markers[pos >> 8]];
128 * Sequentially scan all the symbols up to the point we're searching
129 * for. Every symbol is stored in a [<len>][<len> bytes of data] format,
130 * so we just need to add the len to the current pointer for every
131 * symbol we wish to skip.
133 for (i = 0; i < (pos & 0xFF); i++) {
137 * If MSB is 1, it is a "big" symbol, so we need to look into
138 * the next byte (and skip it, too).
140 if ((len & 0x80) != 0)
141 len = ((len & 0x7F) | (name[1] << 7)) + 1;
143 name = name + len + 1;
146 return name - kallsyms_names;
149 unsigned long kallsyms_sym_address(int idx)
151 if (!IS_ENABLED(CONFIG_KALLSYMS_BASE_RELATIVE))
152 return kallsyms_addresses[idx];
154 /* values are unsigned offsets if --absolute-percpu is not in effect */
155 if (!IS_ENABLED(CONFIG_KALLSYMS_ABSOLUTE_PERCPU))
156 return kallsyms_relative_base + (u32)kallsyms_offsets[idx];
158 /* ...otherwise, positive offsets are absolute values */
159 if (kallsyms_offsets[idx] >= 0)
160 return kallsyms_offsets[idx];
162 /* ...and negative offsets are relative to kallsyms_relative_base - 1 */
163 return kallsyms_relative_base - 1 - kallsyms_offsets[idx];
166 static void cleanup_symbol_name(char *s)
170 if (!IS_ENABLED(CONFIG_LTO_CLANG))
174 * LLVM appends various suffixes for local functions and variables that
175 * must be promoted to global scope as part of LTO. This can break
176 * hooking of static functions with kprobes. '.' is not a valid
177 * character in an identifier in C. Suffixes observed only with LLVM LTO:
178 * - foo.llvm.[0-9a-f]+
180 res = strstr(s, ".llvm.");
187 static int compare_symbol_name(const char *name, char *namebuf)
189 /* The kallsyms_seqs_of_names is sorted based on names after
190 * cleanup_symbol_name() (see scripts/kallsyms.c) if clang lto is enabled.
191 * To ensure correct bisection in kallsyms_lookup_names(), do
192 * cleanup_symbol_name(namebuf) before comparing name and namebuf.
194 cleanup_symbol_name(namebuf);
195 return strcmp(name, namebuf);
198 static unsigned int get_symbol_seq(int index)
200 unsigned int i, seq = 0;
202 for (i = 0; i < 3; i++)
203 seq = (seq << 8) | kallsyms_seqs_of_names[3 * index + i];
208 static int kallsyms_lookup_names(const char *name,
214 unsigned int seq, off;
215 char namebuf[KSYM_NAME_LEN];
218 high = kallsyms_num_syms - 1;
220 while (low <= high) {
221 mid = low + (high - low) / 2;
222 seq = get_symbol_seq(mid);
223 off = get_symbol_offset(seq);
224 kallsyms_expand_symbol(off, namebuf, ARRAY_SIZE(namebuf));
225 ret = compare_symbol_name(name, namebuf);
239 seq = get_symbol_seq(low - 1);
240 off = get_symbol_offset(seq);
241 kallsyms_expand_symbol(off, namebuf, ARRAY_SIZE(namebuf));
242 if (compare_symbol_name(name, namebuf))
250 while (high < kallsyms_num_syms - 1) {
251 seq = get_symbol_seq(high + 1);
252 off = get_symbol_offset(seq);
253 kallsyms_expand_symbol(off, namebuf, ARRAY_SIZE(namebuf));
254 if (compare_symbol_name(name, namebuf))
264 /* Lookup the address for this symbol. Returns 0 if not found. */
265 unsigned long kallsyms_lookup_name(const char *name)
270 /* Skip the search for empty string. */
274 ret = kallsyms_lookup_names(name, &i, NULL);
276 return kallsyms_sym_address(get_symbol_seq(i));
278 return module_kallsyms_lookup_name(name);
282 * Iterate over all symbols in vmlinux. For symbols from modules use
283 * module_kallsyms_on_each_symbol instead.
285 int kallsyms_on_each_symbol(int (*fn)(void *, const char *, unsigned long),
288 char namebuf[KSYM_NAME_LEN];
293 for (i = 0, off = 0; i < kallsyms_num_syms; i++) {
294 off = kallsyms_expand_symbol(off, namebuf, ARRAY_SIZE(namebuf));
295 ret = fn(data, namebuf, kallsyms_sym_address(i));
303 int kallsyms_on_each_match_symbol(int (*fn)(void *, unsigned long),
304 const char *name, void *data)
307 unsigned int i, start, end;
309 ret = kallsyms_lookup_names(name, &start, &end);
313 for (i = start; !ret && i <= end; i++) {
314 ret = fn(data, kallsyms_sym_address(get_symbol_seq(i)));
321 static unsigned long get_symbol_pos(unsigned long addr,
322 unsigned long *symbolsize,
323 unsigned long *offset)
325 unsigned long symbol_start = 0, symbol_end = 0;
326 unsigned long i, low, high, mid;
328 /* Do a binary search on the sorted kallsyms_addresses array. */
330 high = kallsyms_num_syms;
332 while (high - low > 1) {
333 mid = low + (high - low) / 2;
334 if (kallsyms_sym_address(mid) <= addr)
341 * Search for the first aliased symbol. Aliased
342 * symbols are symbols with the same address.
344 while (low && kallsyms_sym_address(low-1) == kallsyms_sym_address(low))
347 symbol_start = kallsyms_sym_address(low);
349 /* Search for next non-aliased symbol. */
350 for (i = low + 1; i < kallsyms_num_syms; i++) {
351 if (kallsyms_sym_address(i) > symbol_start) {
352 symbol_end = kallsyms_sym_address(i);
357 /* If we found no next symbol, we use the end of the section. */
359 if (is_kernel_inittext(addr))
360 symbol_end = (unsigned long)_einittext;
361 else if (IS_ENABLED(CONFIG_KALLSYMS_ALL))
362 symbol_end = (unsigned long)_end;
364 symbol_end = (unsigned long)_etext;
368 *symbolsize = symbol_end - symbol_start;
370 *offset = addr - symbol_start;
376 * Lookup an address but don't bother to find any names.
378 int kallsyms_lookup_size_offset(unsigned long addr, unsigned long *symbolsize,
379 unsigned long *offset)
381 char namebuf[KSYM_NAME_LEN];
383 if (is_ksym_addr(addr)) {
384 get_symbol_pos(addr, symbolsize, offset);
387 return !!module_address_lookup(addr, symbolsize, offset, NULL, NULL, namebuf) ||
388 !!__bpf_address_lookup(addr, symbolsize, offset, namebuf);
391 static int kallsyms_lookup_buildid(unsigned long addr,
392 unsigned long *symbolsize,
393 unsigned long *offset, char **modname,
394 const unsigned char **modbuildid, char *namebuf)
398 namebuf[KSYM_NAME_LEN - 1] = 0;
401 if (is_ksym_addr(addr)) {
404 pos = get_symbol_pos(addr, symbolsize, offset);
406 kallsyms_expand_symbol(get_symbol_offset(pos),
407 namebuf, KSYM_NAME_LEN);
413 ret = strlen(namebuf);
417 /* See if it's in a module or a BPF JITed image. */
418 ret = module_address_lookup(addr, symbolsize, offset,
419 modname, modbuildid, namebuf);
421 ret = bpf_address_lookup(addr, symbolsize,
422 offset, modname, namebuf);
425 ret = ftrace_mod_address_lookup(addr, symbolsize,
426 offset, modname, namebuf);
429 cleanup_symbol_name(namebuf);
435 * - modname is set to NULL if it's in the kernel.
436 * - We guarantee that the returned name is valid until we reschedule even if
437 * it resides in a module.
438 * - We also guarantee that modname will be valid until rescheduled.
440 const char *kallsyms_lookup(unsigned long addr,
441 unsigned long *symbolsize,
442 unsigned long *offset,
443 char **modname, char *namebuf)
445 int ret = kallsyms_lookup_buildid(addr, symbolsize, offset, modname,
454 int lookup_symbol_name(unsigned long addr, char *symname)
459 symname[KSYM_NAME_LEN - 1] = '\0';
461 if (is_ksym_addr(addr)) {
464 pos = get_symbol_pos(addr, NULL, NULL);
466 kallsyms_expand_symbol(get_symbol_offset(pos),
467 symname, KSYM_NAME_LEN);
470 /* See if it's in a module. */
471 res = lookup_module_symbol_name(addr, symname);
476 cleanup_symbol_name(symname);
480 /* Look up a kernel symbol and return it in a text buffer. */
481 static int __sprint_symbol(char *buffer, unsigned long address,
482 int symbol_offset, int add_offset, int add_buildid)
485 const unsigned char *buildid;
486 unsigned long offset, size;
489 address += symbol_offset;
490 len = kallsyms_lookup_buildid(address, &size, &offset, &modname, &buildid,
493 return sprintf(buffer, "0x%lx", address - symbol_offset);
495 offset -= symbol_offset;
498 len += sprintf(buffer + len, "+%#lx/%#lx", offset, size);
501 len += sprintf(buffer + len, " [%s", modname);
502 #if IS_ENABLED(CONFIG_STACKTRACE_BUILD_ID)
503 if (add_buildid && buildid) {
504 /* build ID should match length of sprintf */
505 #if IS_ENABLED(CONFIG_MODULES)
506 static_assert(sizeof(typeof_member(struct module, build_id)) == 20);
508 len += sprintf(buffer + len, " %20phN", buildid);
511 len += sprintf(buffer + len, "]");
518 * sprint_symbol - Look up a kernel symbol and return it in a text buffer
519 * @buffer: buffer to be stored
520 * @address: address to lookup
522 * This function looks up a kernel symbol with @address and stores its name,
523 * offset, size and module name to @buffer if possible. If no symbol was found,
524 * just saves its @address as is.
526 * This function returns the number of bytes stored in @buffer.
528 int sprint_symbol(char *buffer, unsigned long address)
530 return __sprint_symbol(buffer, address, 0, 1, 0);
532 EXPORT_SYMBOL_GPL(sprint_symbol);
535 * sprint_symbol_build_id - Look up a kernel symbol and return it in a text buffer
536 * @buffer: buffer to be stored
537 * @address: address to lookup
539 * This function looks up a kernel symbol with @address and stores its name,
540 * offset, size, module name and module build ID to @buffer if possible. If no
541 * symbol was found, just saves its @address as is.
543 * This function returns the number of bytes stored in @buffer.
545 int sprint_symbol_build_id(char *buffer, unsigned long address)
547 return __sprint_symbol(buffer, address, 0, 1, 1);
549 EXPORT_SYMBOL_GPL(sprint_symbol_build_id);
552 * sprint_symbol_no_offset - Look up a kernel symbol and return it in a text buffer
553 * @buffer: buffer to be stored
554 * @address: address to lookup
556 * This function looks up a kernel symbol with @address and stores its name
557 * and module name to @buffer if possible. If no symbol was found, just saves
558 * its @address as is.
560 * This function returns the number of bytes stored in @buffer.
562 int sprint_symbol_no_offset(char *buffer, unsigned long address)
564 return __sprint_symbol(buffer, address, 0, 0, 0);
566 EXPORT_SYMBOL_GPL(sprint_symbol_no_offset);
569 * sprint_backtrace - Look up a backtrace symbol and return it in a text buffer
570 * @buffer: buffer to be stored
571 * @address: address to lookup
573 * This function is for stack backtrace and does the same thing as
574 * sprint_symbol() but with modified/decreased @address. If there is a
575 * tail-call to the function marked "noreturn", gcc optimized out code after
576 * the call so that the stack-saved return address could point outside of the
577 * caller. This function ensures that kallsyms will find the original caller
578 * by decreasing @address.
580 * This function returns the number of bytes stored in @buffer.
582 int sprint_backtrace(char *buffer, unsigned long address)
584 return __sprint_symbol(buffer, address, -1, 1, 0);
588 * sprint_backtrace_build_id - Look up a backtrace symbol and return it in a text buffer
589 * @buffer: buffer to be stored
590 * @address: address to lookup
592 * This function is for stack backtrace and does the same thing as
593 * sprint_symbol() but with modified/decreased @address. If there is a
594 * tail-call to the function marked "noreturn", gcc optimized out code after
595 * the call so that the stack-saved return address could point outside of the
596 * caller. This function ensures that kallsyms will find the original caller
597 * by decreasing @address. This function also appends the module build ID to
598 * the @buffer if @address is within a kernel module.
600 * This function returns the number of bytes stored in @buffer.
602 int sprint_backtrace_build_id(char *buffer, unsigned long address)
604 return __sprint_symbol(buffer, address, -1, 1, 1);
607 /* To avoid using get_symbol_offset for every symbol, we carry prefix along. */
608 struct kallsym_iter {
611 loff_t pos_ftrace_mod_end;
614 unsigned int nameoff; /* If iterating in core kernel symbols. */
616 char name[KSYM_NAME_LEN];
617 char module_name[MODULE_NAME_LEN];
622 static int get_ksymbol_mod(struct kallsym_iter *iter)
624 int ret = module_get_kallsym(iter->pos - kallsyms_num_syms,
625 &iter->value, &iter->type,
626 iter->name, iter->module_name,
629 iter->pos_mod_end = iter->pos;
637 * ftrace_mod_get_kallsym() may also get symbols for pages allocated for ftrace
638 * purposes. In that case "__builtin__ftrace" is used as a module name, even
639 * though "__builtin__ftrace" is not a module.
641 static int get_ksymbol_ftrace_mod(struct kallsym_iter *iter)
643 int ret = ftrace_mod_get_kallsym(iter->pos - iter->pos_mod_end,
644 &iter->value, &iter->type,
645 iter->name, iter->module_name,
648 iter->pos_ftrace_mod_end = iter->pos;
655 static int get_ksymbol_bpf(struct kallsym_iter *iter)
659 strscpy(iter->module_name, "bpf", MODULE_NAME_LEN);
661 ret = bpf_get_kallsym(iter->pos - iter->pos_ftrace_mod_end,
662 &iter->value, &iter->type,
665 iter->pos_bpf_end = iter->pos;
673 * This uses "__builtin__kprobes" as a module name for symbols for pages
674 * allocated for kprobes' purposes, even though "__builtin__kprobes" is not a
677 static int get_ksymbol_kprobe(struct kallsym_iter *iter)
679 strscpy(iter->module_name, "__builtin__kprobes", MODULE_NAME_LEN);
681 return kprobe_get_kallsym(iter->pos - iter->pos_bpf_end,
682 &iter->value, &iter->type,
683 iter->name) < 0 ? 0 : 1;
686 /* Returns space to next name. */
687 static unsigned long get_ksymbol_core(struct kallsym_iter *iter)
689 unsigned off = iter->nameoff;
691 iter->module_name[0] = '\0';
692 iter->value = kallsyms_sym_address(iter->pos);
694 iter->type = kallsyms_get_symbol_type(off);
696 off = kallsyms_expand_symbol(off, iter->name, ARRAY_SIZE(iter->name));
698 return off - iter->nameoff;
701 static void reset_iter(struct kallsym_iter *iter, loff_t new_pos)
703 iter->name[0] = '\0';
704 iter->nameoff = get_symbol_offset(new_pos);
707 iter->pos_mod_end = 0;
708 iter->pos_ftrace_mod_end = 0;
709 iter->pos_bpf_end = 0;
714 * The end position (last + 1) of each additional kallsyms section is recorded
715 * in iter->pos_..._end as each section is added, and so can be used to
716 * determine which get_ksymbol_...() function to call next.
718 static int update_iter_mod(struct kallsym_iter *iter, loff_t pos)
722 if ((!iter->pos_mod_end || iter->pos_mod_end > pos) &&
723 get_ksymbol_mod(iter))
726 if ((!iter->pos_ftrace_mod_end || iter->pos_ftrace_mod_end > pos) &&
727 get_ksymbol_ftrace_mod(iter))
730 if ((!iter->pos_bpf_end || iter->pos_bpf_end > pos) &&
731 get_ksymbol_bpf(iter))
734 return get_ksymbol_kprobe(iter);
737 /* Returns false if pos is at or past end of file. */
738 static int update_iter(struct kallsym_iter *iter, loff_t pos)
740 /* Module symbols can be accessed randomly. */
741 if (pos >= kallsyms_num_syms)
742 return update_iter_mod(iter, pos);
744 /* If we're not on the desired position, reset to new position. */
745 if (pos != iter->pos)
746 reset_iter(iter, pos);
748 iter->nameoff += get_ksymbol_core(iter);
754 static void *s_next(struct seq_file *m, void *p, loff_t *pos)
758 if (!update_iter(m->private, *pos))
763 static void *s_start(struct seq_file *m, loff_t *pos)
765 if (!update_iter(m->private, *pos))
770 static void s_stop(struct seq_file *m, void *p)
774 static int s_show(struct seq_file *m, void *p)
777 struct kallsym_iter *iter = m->private;
779 /* Some debugging symbols have no name. Ignore them. */
783 value = iter->show_value ? (void *)iter->value : NULL;
785 if (iter->module_name[0]) {
789 * Label it "global" if it is exported,
790 * "local" if not exported.
792 type = iter->exported ? toupper(iter->type) :
794 seq_printf(m, "%px %c %s\t[%s]\n", value,
795 type, iter->name, iter->module_name);
797 seq_printf(m, "%px %c %s\n", value,
798 iter->type, iter->name);
802 static const struct seq_operations kallsyms_op = {
809 #ifdef CONFIG_BPF_SYSCALL
811 struct bpf_iter__ksym {
812 __bpf_md_ptr(struct bpf_iter_meta *, meta);
813 __bpf_md_ptr(struct kallsym_iter *, ksym);
816 static int ksym_prog_seq_show(struct seq_file *m, bool in_stop)
818 struct bpf_iter__ksym ctx;
819 struct bpf_iter_meta meta;
820 struct bpf_prog *prog;
823 prog = bpf_iter_get_info(&meta, in_stop);
828 ctx.ksym = m ? m->private : NULL;
829 return bpf_iter_run_prog(prog, &ctx);
832 static int bpf_iter_ksym_seq_show(struct seq_file *m, void *p)
834 return ksym_prog_seq_show(m, false);
837 static void bpf_iter_ksym_seq_stop(struct seq_file *m, void *p)
840 (void) ksym_prog_seq_show(m, true);
845 static const struct seq_operations bpf_iter_ksym_ops = {
848 .stop = bpf_iter_ksym_seq_stop,
849 .show = bpf_iter_ksym_seq_show,
852 static int bpf_iter_ksym_init(void *priv_data, struct bpf_iter_aux_info *aux)
854 struct kallsym_iter *iter = priv_data;
858 /* cache here as in kallsyms_open() case; use current process
859 * credentials to tell BPF iterators if values should be shown.
861 iter->show_value = kallsyms_show_value(current_cred());
866 DEFINE_BPF_ITER_FUNC(ksym, struct bpf_iter_meta *meta, struct kallsym_iter *ksym)
868 static const struct bpf_iter_seq_info ksym_iter_seq_info = {
869 .seq_ops = &bpf_iter_ksym_ops,
870 .init_seq_private = bpf_iter_ksym_init,
871 .fini_seq_private = NULL,
872 .seq_priv_size = sizeof(struct kallsym_iter),
875 static struct bpf_iter_reg ksym_iter_reg_info = {
877 .feature = BPF_ITER_RESCHED,
878 .ctx_arg_info_size = 1,
880 { offsetof(struct bpf_iter__ksym, ksym),
881 PTR_TO_BTF_ID_OR_NULL },
883 .seq_info = &ksym_iter_seq_info,
886 BTF_ID_LIST(btf_ksym_iter_id)
887 BTF_ID(struct, kallsym_iter)
889 static int __init bpf_ksym_iter_register(void)
891 ksym_iter_reg_info.ctx_arg_info[0].btf_id = *btf_ksym_iter_id;
892 return bpf_iter_reg_target(&ksym_iter_reg_info);
895 late_initcall(bpf_ksym_iter_register);
897 #endif /* CONFIG_BPF_SYSCALL */
899 static int kallsyms_open(struct inode *inode, struct file *file)
902 * We keep iterator in m->private, since normal case is to
903 * s_start from where we left off, so we avoid
904 * using get_symbol_offset for every symbol.
906 struct kallsym_iter *iter;
907 iter = __seq_open_private(file, &kallsyms_op, sizeof(*iter));
913 * Instead of checking this on every s_show() call, cache
914 * the result here at open time.
916 iter->show_value = kallsyms_show_value(file->f_cred);
920 #ifdef CONFIG_KGDB_KDB
921 const char *kdb_walk_kallsyms(loff_t *pos)
923 static struct kallsym_iter kdb_walk_kallsyms_iter;
925 memset(&kdb_walk_kallsyms_iter, 0,
926 sizeof(kdb_walk_kallsyms_iter));
927 reset_iter(&kdb_walk_kallsyms_iter, 0);
930 if (!update_iter(&kdb_walk_kallsyms_iter, *pos))
933 /* Some debugging symbols have no name. Ignore them. */
934 if (kdb_walk_kallsyms_iter.name[0])
935 return kdb_walk_kallsyms_iter.name;
938 #endif /* CONFIG_KGDB_KDB */
940 static const struct proc_ops kallsyms_proc_ops = {
941 .proc_open = kallsyms_open,
942 .proc_read = seq_read,
943 .proc_lseek = seq_lseek,
944 .proc_release = seq_release_private,
947 static int __init kallsyms_init(void)
949 proc_create("kallsyms", 0444, NULL, &kallsyms_proc_ops);
952 device_initcall(kallsyms_init);