0488568178
Support using LLVM as a disassembler method, allowing helperless annotation in non-distro builds. (It is also much faster than using libbfd or bfd objdump on binaries with a lot of debug information.) This is nearly identical to the output of llvm-objdump; there are some very rare whitespace differences, some minor changes to demangling (since we use perf's regular demangling and not LLVM's own) and the occasional case where llvm-objdump makes a different choice when multiple symbols share the same address. It should work across all of LLVM's supported architectures, although I've only tested 64-bit x86, and finding the right triple from perf's idea of machine architecture can sometimes be a bit tricky. Ideally, we should have some way of finding the triplet just from the file itself. Committer notes: Address this on 32-bit systems by using PRIu64 from inttypes.h 3 17.58 almalinux:9-i386 : FAIL gcc version 11.4.1 20231218 (Red Hat 11.4.1-3) (GCC) util/llvm-c-helpers.cpp: In function ‘char* make_symbol_relative_string(dso*, const char*, u64, u64)’: util/llvm-c-helpers.cpp:150:52: error: format ‘%lx’ expects argument of type ‘long unsigned int’, but argument 5 has type ‘u64’ {aka +‘long long unsigned int’} [-Werror=format=] 150 | snprintf(buf, sizeof(buf), "%s+0x%lx", | ~~^ | | | long unsigned int | %llx 151 | demangled ? demangled : sym_name, addr - base_addr); | ~~~~~~~~~~~~~~~~ | | | u64 {aka long long unsigned int} cc1plus: all warnings being treated as errors Signed-off-by: Steinar H. Gunderson <sesse@google.com> Cc: Ian Rogers <irogers@google.com> Link: https://lore.kernel.org/r/20240803152008.2818485-3-sesse@google.com Signed-off-by: Arnaldo Carvalho de Melo <acme@redhat.com>
198 lines
5.1 KiB
C++
198 lines
5.1 KiB
C++
// SPDX-License-Identifier: GPL-2.0
|
|
|
|
/*
|
|
* Must come before the linux/compiler.h include, which defines several
|
|
* macros (e.g. noinline) that conflict with compiler builtins used
|
|
* by LLVM.
|
|
*/
|
|
#pragma GCC diagnostic push
|
|
#pragma GCC diagnostic ignored "-Wunused-parameter" /* Needed for LLVM <= 15 */
|
|
#include <llvm/DebugInfo/Symbolize/Symbolize.h>
|
|
#include <llvm/Support/TargetSelect.h>
|
|
#pragma GCC diagnostic pop
|
|
|
|
#include <inttypes.h>
|
|
#include <stdio.h>
|
|
#include <sys/types.h>
|
|
#include <linux/compiler.h>
|
|
extern "C" {
|
|
#include <linux/zalloc.h>
|
|
}
|
|
#include "symbol_conf.h"
|
|
#include "llvm-c-helpers.h"
|
|
|
|
extern "C"
|
|
char *dso__demangle_sym(struct dso *dso, int kmodule, const char *elf_name);
|
|
|
|
using namespace llvm;
|
|
using llvm::symbolize::LLVMSymbolizer;
|
|
|
|
/*
|
|
* Allocate a static LLVMSymbolizer, which will live to the end of the program.
|
|
* Unlike the bfd paths, LLVMSymbolizer has its own cache, so we do not need
|
|
* to store anything in the dso struct.
|
|
*/
|
|
static LLVMSymbolizer *get_symbolizer()
|
|
{
|
|
static LLVMSymbolizer *instance = nullptr;
|
|
if (instance == nullptr) {
|
|
LLVMSymbolizer::Options opts;
|
|
/*
|
|
* LLVM sometimes demangles slightly different from the rest
|
|
* of the code, and this mismatch can cause new_inline_sym()
|
|
* to get confused and mark non-inline symbol as inlined
|
|
* (since the name does not properly match up with base_sym).
|
|
* Thus, disable the demangling and let the rest of the code
|
|
* handle it.
|
|
*/
|
|
opts.Demangle = false;
|
|
instance = new LLVMSymbolizer(opts);
|
|
}
|
|
return instance;
|
|
}
|
|
|
|
/* Returns 0 on error, 1 on success. */
|
|
static int extract_file_and_line(const DILineInfo &line_info, char **file,
|
|
unsigned int *line)
|
|
{
|
|
if (file) {
|
|
if (line_info.FileName == "<invalid>") {
|
|
/* Match the convention of libbfd. */
|
|
*file = nullptr;
|
|
} else {
|
|
/* The caller expects to get something it can free(). */
|
|
*file = strdup(line_info.FileName.c_str());
|
|
if (*file == nullptr)
|
|
return 0;
|
|
}
|
|
}
|
|
if (line)
|
|
*line = line_info.Line;
|
|
return 1;
|
|
}
|
|
|
|
extern "C"
|
|
int llvm_addr2line(const char *dso_name, u64 addr,
|
|
char **file, unsigned int *line,
|
|
bool unwind_inlines,
|
|
llvm_a2l_frame **inline_frames)
|
|
{
|
|
LLVMSymbolizer *symbolizer = get_symbolizer();
|
|
object::SectionedAddress sectioned_addr = {
|
|
addr,
|
|
object::SectionedAddress::UndefSection
|
|
};
|
|
|
|
if (unwind_inlines) {
|
|
Expected<DIInliningInfo> res_or_err =
|
|
symbolizer->symbolizeInlinedCode(dso_name,
|
|
sectioned_addr);
|
|
if (!res_or_err)
|
|
return 0;
|
|
unsigned num_frames = res_or_err->getNumberOfFrames();
|
|
if (num_frames == 0)
|
|
return 0;
|
|
|
|
if (extract_file_and_line(res_or_err->getFrame(0),
|
|
file, line) == 0)
|
|
return 0;
|
|
|
|
*inline_frames = (llvm_a2l_frame *)calloc(
|
|
num_frames, sizeof(**inline_frames));
|
|
if (*inline_frames == nullptr)
|
|
return 0;
|
|
|
|
for (unsigned i = 0; i < num_frames; ++i) {
|
|
const DILineInfo &src = res_or_err->getFrame(i);
|
|
|
|
llvm_a2l_frame &dst = (*inline_frames)[i];
|
|
if (src.FileName == "<invalid>")
|
|
/* Match the convention of libbfd. */
|
|
dst.filename = nullptr;
|
|
else
|
|
dst.filename = strdup(src.FileName.c_str());
|
|
dst.funcname = strdup(src.FunctionName.c_str());
|
|
dst.line = src.Line;
|
|
|
|
if (dst.filename == nullptr ||
|
|
dst.funcname == nullptr) {
|
|
for (unsigned j = 0; j <= i; ++j) {
|
|
zfree(&(*inline_frames)[j].filename);
|
|
zfree(&(*inline_frames)[j].funcname);
|
|
}
|
|
zfree(inline_frames);
|
|
return 0;
|
|
}
|
|
}
|
|
|
|
return num_frames;
|
|
} else {
|
|
if (inline_frames)
|
|
*inline_frames = nullptr;
|
|
|
|
Expected<DILineInfo> res_or_err =
|
|
symbolizer->symbolizeCode(dso_name, sectioned_addr);
|
|
if (!res_or_err)
|
|
return 0;
|
|
return extract_file_and_line(*res_or_err, file, line);
|
|
}
|
|
}
|
|
|
|
static char *
|
|
make_symbol_relative_string(struct dso *dso, const char *sym_name,
|
|
u64 addr, u64 base_addr)
|
|
{
|
|
if (!strcmp(sym_name, "<invalid>"))
|
|
return NULL;
|
|
|
|
char *demangled = dso__demangle_sym(dso, 0, sym_name);
|
|
if (base_addr && base_addr != addr) {
|
|
char buf[256];
|
|
snprintf(buf, sizeof(buf), "%s+0x%" PRIx64,
|
|
demangled ? demangled : sym_name, addr - base_addr);
|
|
free(demangled);
|
|
return strdup(buf);
|
|
} else {
|
|
if (demangled)
|
|
return demangled;
|
|
else
|
|
return strdup(sym_name);
|
|
}
|
|
}
|
|
|
|
extern "C"
|
|
char *llvm_name_for_code(struct dso *dso, const char *dso_name, u64 addr)
|
|
{
|
|
LLVMSymbolizer *symbolizer = get_symbolizer();
|
|
object::SectionedAddress sectioned_addr = {
|
|
addr,
|
|
object::SectionedAddress::UndefSection
|
|
};
|
|
Expected<DILineInfo> res_or_err =
|
|
symbolizer->symbolizeCode(dso_name, sectioned_addr);
|
|
if (!res_or_err) {
|
|
return NULL;
|
|
}
|
|
return make_symbol_relative_string(
|
|
dso, res_or_err->FunctionName.c_str(),
|
|
addr, res_or_err->StartAddress ? *res_or_err->StartAddress : 0);
|
|
}
|
|
|
|
extern "C"
|
|
char *llvm_name_for_data(struct dso *dso, const char *dso_name, u64 addr)
|
|
{
|
|
LLVMSymbolizer *symbolizer = get_symbolizer();
|
|
object::SectionedAddress sectioned_addr = {
|
|
addr,
|
|
object::SectionedAddress::UndefSection
|
|
};
|
|
Expected<DIGlobal> res_or_err =
|
|
symbolizer->symbolizeData(dso_name, sectioned_addr);
|
|
if (!res_or_err) {
|
|
return NULL;
|
|
}
|
|
return make_symbol_relative_string(
|
|
dso, res_or_err->Name.c_str(),
|
|
addr, res_or_err->Start);
|
|
}
|