mirror of
https://github.com/JakeHillion/drgn.git
synced 2024-12-22 01:03:07 +00:00
a47fa1f3e2
We got a couple of reports about drgn failing to get a stack trace (#391) or getting the wrong stack trace (#404) from a kernel core dump. Both were caused because drgn assumes that there is an NT_PRSTATUS note for each CPU in order by CPU number, and in these core dumps some NT_PRSTATUS notes were missing. There are a least a couple of things that can cause this: offline CPUs or CPUs that were in a bad state and didn't respond to the kdump NMI. The former is expected and could be special-cased, but the latter basically means that we can't trust the order of the notes. Instead, look up the notes from the crash_notes per-CPU variable that the kernel uses to populate the ELF notes. We still need to use the actual NT_PRSTATUS notes for QEMU dump-guest-memory dumps, but for those we need to use the PID field to handle CPU hotplugging. Closes #404. Signed-off-by: Omar Sandoval <osandov@osandov.com>
440 lines
12 KiB
C
440 lines
12 KiB
C
// Copyright (c) Meta Platforms, Inc. and affiliates.
|
|
// SPDX-License-Identifier: LGPL-2.1-or-later
|
|
|
|
/**
|
|
* @file
|
|
*
|
|
* Program internals.
|
|
*
|
|
* See @ref ProgramInternals.
|
|
*/
|
|
|
|
#ifndef DRGN_PROGRAM_H
|
|
#define DRGN_PROGRAM_H
|
|
|
|
#include <elfutils/libdwfl.h>
|
|
#include <libelf.h>
|
|
#include <sys/types.h>
|
|
#ifdef WITH_LIBKDUMPFILE
|
|
#include <libkdumpfile/kdumpfile.h>
|
|
#endif
|
|
|
|
#include "debug_info.h"
|
|
#include "drgn.h"
|
|
#include "handler.h"
|
|
#include "hash_table.h"
|
|
#include "language.h"
|
|
#include "memory_reader.h"
|
|
#include "platform.h"
|
|
#include "pp.h"
|
|
#include "symbol.h"
|
|
#include "type.h"
|
|
#include "vector.h"
|
|
|
|
struct drgn_type_finder;
|
|
struct drgn_object_finder;
|
|
struct drgn_symbol_finder;
|
|
|
|
/**
|
|
* @defgroup Internals Internals
|
|
*
|
|
* Internal implementation
|
|
*
|
|
* @{
|
|
*
|
|
* @defgroup ProgramInternals Programs
|
|
*
|
|
* Program internals.
|
|
*
|
|
* @{
|
|
*/
|
|
|
|
struct drgn_thread {
|
|
struct drgn_program *prog;
|
|
uint32_t tid;
|
|
struct nstring prstatus;
|
|
struct drgn_object object;
|
|
};
|
|
|
|
DEFINE_VECTOR_TYPE(drgn_typep_vector, struct drgn_type *);
|
|
DEFINE_HASH_TABLE_TYPE(drgn_thread_set, struct drgn_thread);
|
|
|
|
struct drgn_program {
|
|
/** @privatesection */
|
|
|
|
/*
|
|
* Memory/core dump.
|
|
*/
|
|
struct drgn_memory_reader reader;
|
|
/* Elf core dump or /proc/pid/mem file segments. */
|
|
struct drgn_memory_file_segment *file_segments;
|
|
/* Elf core dump. Not valid for live programs or kdump files. */
|
|
Elf *core;
|
|
/* File descriptor for ELF core dump, kdump file, or /proc/pid/mem. */
|
|
int core_fd;
|
|
/* PID of live userspace program. */
|
|
pid_t pid;
|
|
#ifdef WITH_LIBKDUMPFILE
|
|
kdump_ctx_t *kdump_ctx;
|
|
#endif
|
|
|
|
/*
|
|
* Types.
|
|
*/
|
|
/** Callbacks for finding types. */
|
|
struct drgn_handler_list type_finders;
|
|
/** Void type for each language. */
|
|
struct drgn_type void_types[DRGN_NUM_LANGUAGES];
|
|
/** Cache of primitive types. */
|
|
struct drgn_type *primitive_types[DRGN_PRIMITIVE_TYPE_NUM];
|
|
/** Cache of deduplicated types. */
|
|
struct drgn_dedupe_type_set dedupe_types;
|
|
/**
|
|
* List of created types that are not deduplicated: types with non-empty
|
|
* lists of members, parameters, template parameters, or enumerators.
|
|
*
|
|
* Members, parameters, and template parameters contain lazily-evaluated
|
|
* objects, so they cannot be easily deduplicated.
|
|
*
|
|
* Enumerators could be deduplicated, but it's probably not worth the
|
|
* effort to hash and compare them.
|
|
*/
|
|
struct drgn_typep_vector created_types;
|
|
/** Cache for @ref drgn_program_find_member(). */
|
|
struct drgn_member_map members;
|
|
/**
|
|
* Set of types which have been already cached in @ref
|
|
* drgn_program::members.
|
|
*/
|
|
struct drgn_type_set members_cached;
|
|
|
|
/*
|
|
* Debugging information.
|
|
*/
|
|
struct drgn_handler_list object_finders;
|
|
struct drgn_debug_info dbinfo;
|
|
struct drgn_handler_list symbol_finders;
|
|
|
|
/*
|
|
* Program information.
|
|
*/
|
|
/* Default language of the program. */
|
|
const struct drgn_language *lang;
|
|
struct drgn_platform platform;
|
|
bool has_platform;
|
|
enum drgn_program_flags flags;
|
|
|
|
/*
|
|
* Threads/stack traces.
|
|
*/
|
|
/*
|
|
* Threads indexed by TID.
|
|
*
|
|
* For the Linux kernel, this is only used to index @c PRSTATUS notes.
|
|
* See @ref drgn_program_find_prstatus().
|
|
*/
|
|
struct drgn_thread_set thread_set;
|
|
struct drgn_thread *main_thread;
|
|
struct drgn_thread *crashed_thread;
|
|
/*
|
|
* AArch64 instruction pointer authentication code mask, parsed either
|
|
* from NT_ARM_PAC_MASK or VMCOREINFO.
|
|
*/
|
|
uint64_t aarch64_insn_pac_mask;
|
|
bool core_dump_notes_cached;
|
|
bool prefer_orc_unwinder;
|
|
|
|
/*
|
|
* Linux kernel-specific.
|
|
*/
|
|
/* The important parts of the VMCOREINFO note of a Linux kernel core. */
|
|
struct {
|
|
/** <tt>uname -r</tt> */
|
|
char osrelease[128];
|
|
/** PAGE_SIZE of the kernel. */
|
|
uint64_t page_size;
|
|
/**
|
|
* The offset from the compiled address of the kernel image to its
|
|
* actual address in memory.
|
|
*
|
|
* This is non-zero if kernel address space layout randomization (KASLR)
|
|
* is enabled.
|
|
*/
|
|
uint64_t kaslr_offset;
|
|
/** Kernel page table. */
|
|
uint64_t swapper_pg_dir;
|
|
/** Length of mem_section array (i.e., NR_SECTION_ROOTS). */
|
|
uint64_t mem_section_length;
|
|
/** VA_BITS on AArch64. */
|
|
uint64_t va_bits;
|
|
/** phys_base on x86_64 */
|
|
uint64_t phys_base;
|
|
/** Whether 5-level paging was enabled on x86-64. */
|
|
bool pgtable_l5_enabled;
|
|
/** Whether CRASHTIME was in the VMCOREINFO. */
|
|
bool have_crashtime;
|
|
/** PAGE_SHIFT of the kernel (derived from PAGE_SIZE). */
|
|
int page_shift;
|
|
|
|
/** The original vmcoreinfo data, to expose as an object */
|
|
char *raw;
|
|
size_t raw_size;
|
|
} vmcoreinfo;
|
|
/*
|
|
* Difference between a virtual address in the direct mapping and the
|
|
* physical address it maps to.
|
|
*/
|
|
uint64_t direct_mapping_offset;
|
|
/* Cached vmemmap. */
|
|
struct drgn_object vmemmap;
|
|
/* Page table iterator. */
|
|
struct pgtable_iterator *pgtable_it;
|
|
/*
|
|
* Whether we are currently in address translation. Used to prevent
|
|
* address translation from recursing.
|
|
*/
|
|
bool in_address_translation;
|
|
/* Whether @ref drgn_program::direct_mapping_offset has been cached. */
|
|
bool direct_mapping_offset_cached;
|
|
|
|
/*
|
|
* Logging.
|
|
*/
|
|
drgn_log_fn *log_fn;
|
|
void *log_arg;
|
|
enum drgn_log_level log_level;
|
|
|
|
/*
|
|
* Blocking callbacks.
|
|
*/
|
|
drgn_program_begin_blocking_fn *begin_blocking_fn;
|
|
drgn_program_end_blocking_fn *end_blocking_fn;
|
|
void *blocking_arg;
|
|
};
|
|
|
|
/** Initialize a @ref drgn_program. */
|
|
void drgn_program_init(struct drgn_program *prog,
|
|
const struct drgn_platform *platform);
|
|
|
|
/** Deinitialize a @ref drgn_program. */
|
|
void drgn_program_deinit(struct drgn_program *prog);
|
|
|
|
/**
|
|
* Set the @ref drgn_platform of a @ref drgn_program if it hasn't been set
|
|
* yet.
|
|
*/
|
|
void drgn_program_set_platform(struct drgn_program *prog,
|
|
const struct drgn_platform *platform);
|
|
|
|
/**
|
|
* Implement @ref drgn_program_from_core_dump() on an initialized @ref
|
|
* drgn_program.
|
|
*/
|
|
struct drgn_error *drgn_program_init_core_dump(struct drgn_program *prog,
|
|
const char *path);
|
|
|
|
/**
|
|
* Implement @ref drgn_program_from_core_dump_fd() on an initialized @ref
|
|
* drgn_program.
|
|
*/
|
|
struct drgn_error *drgn_program_init_core_dump_fd(struct drgn_program *prog,
|
|
int fd);
|
|
|
|
/**
|
|
* Implement @ref drgn_program_from_kernel() on an initialized @ref
|
|
* drgn_program.
|
|
*/
|
|
struct drgn_error *drgn_program_init_kernel(struct drgn_program *prog);
|
|
|
|
/**
|
|
* Implement @ref drgn_program_from_pid() on an initialized @ref drgn_program.
|
|
*/
|
|
struct drgn_error *drgn_program_init_pid(struct drgn_program *prog, pid_t pid);
|
|
|
|
static inline struct drgn_error *
|
|
drgn_program_is_little_endian(struct drgn_program *prog, bool *ret)
|
|
{
|
|
if (!prog->has_platform) {
|
|
return drgn_error_create(DRGN_ERROR_INVALID_ARGUMENT,
|
|
"program byte order is not known");
|
|
}
|
|
*ret = drgn_platform_is_little_endian(&prog->platform);
|
|
return NULL;
|
|
}
|
|
|
|
/**
|
|
* Return whether a @ref drgn_program has a different endianness than the host
|
|
* system.
|
|
*/
|
|
static inline struct drgn_error *
|
|
drgn_program_bswap(struct drgn_program *prog, bool *ret)
|
|
{
|
|
if (!prog->has_platform) {
|
|
return drgn_error_create(DRGN_ERROR_INVALID_ARGUMENT,
|
|
"program byte order is not known");
|
|
}
|
|
*ret = drgn_platform_bswap(&prog->platform);
|
|
return NULL;
|
|
}
|
|
|
|
static inline struct drgn_error *
|
|
drgn_program_is_64_bit(struct drgn_program *prog, bool *ret)
|
|
{
|
|
if (!prog->has_platform) {
|
|
return drgn_error_create(DRGN_ERROR_INVALID_ARGUMENT,
|
|
"program word size is not known");
|
|
}
|
|
*ret = drgn_platform_is_64_bit(&prog->platform);
|
|
return NULL;
|
|
}
|
|
|
|
static inline struct drgn_error *
|
|
drgn_program_address_size(struct drgn_program *prog, uint8_t *ret)
|
|
{
|
|
if (!prog->has_platform) {
|
|
return drgn_error_create(DRGN_ERROR_INVALID_ARGUMENT,
|
|
"program address size is not known");
|
|
}
|
|
*ret = drgn_platform_address_size(&prog->platform);
|
|
return NULL;
|
|
}
|
|
|
|
static inline struct drgn_error *
|
|
drgn_program_address_mask(const struct drgn_program *prog, uint64_t *ret)
|
|
{
|
|
if (!prog->has_platform) {
|
|
return drgn_error_create(DRGN_ERROR_INVALID_ARGUMENT,
|
|
"program address size is not known");
|
|
}
|
|
*ret = drgn_platform_address_mask(&prog->platform);
|
|
return NULL;
|
|
}
|
|
|
|
static inline struct drgn_error *
|
|
drgn_program_untagged_addr(const struct drgn_program *prog, uint64_t *address)
|
|
{
|
|
if (!prog->has_platform) {
|
|
return drgn_error_create(DRGN_ERROR_INVALID_ARGUMENT,
|
|
"program address size is not known");
|
|
}
|
|
*address &= drgn_platform_address_mask(&prog->platform);
|
|
if (prog->platform.arch->untagged_addr)
|
|
*address = prog->platform.arch->untagged_addr(*address);
|
|
return NULL;
|
|
}
|
|
|
|
struct drgn_error *drgn_thread_dup_internal(const struct drgn_thread *thread,
|
|
struct drgn_thread *ret);
|
|
|
|
void drgn_thread_deinit(struct drgn_thread *thread);
|
|
|
|
/**
|
|
* Find the @c NT_PRSTATUS note with the given "PID".
|
|
*
|
|
* For userspace, the PID is the thread ID. For the kernel, it's complicated;
|
|
* see drgn_get_initial_registers_from_kernel_core_dump().
|
|
*
|
|
* @param[out] ret Returned note data. If not found, <tt>ret->str</tt> is set to
|
|
* @c NULL and <tt>ret->len</tt> is set to zero.
|
|
*/
|
|
struct drgn_error *drgn_program_find_prstatus(struct drgn_program *prog,
|
|
uint32_t tid,
|
|
struct nstring *ret);
|
|
|
|
/**
|
|
* Cache the @c NT_PRSTATUS note provided by @p data in @p prog.
|
|
*
|
|
* @param[in] data The pointer to the note data.
|
|
* @param[in] size Size of data in note.
|
|
* @param[out] ret Thread ID from note.
|
|
*/
|
|
struct drgn_error *drgn_program_cache_prstatus_entry(struct drgn_program *prog,
|
|
const char *data,
|
|
size_t size,
|
|
uint32_t *ret);
|
|
|
|
/*
|
|
* Like @ref drgn_program_find_symbol_by_address(), but returns @c NULL rather
|
|
* than a lookup error if the symbol was not found.
|
|
*
|
|
* @param[in] address Address to search for.
|
|
* @param [out] ret The symbol found by the lookup (if found)
|
|
* @return @c NULL unless an error (unrelated to a lookup error) was encountered
|
|
*/
|
|
struct drgn_error *
|
|
drgn_program_find_symbol_by_address_internal(struct drgn_program *prog,
|
|
uint64_t address,
|
|
struct drgn_symbol **ret);
|
|
|
|
struct drgn_error *
|
|
drgn_program_register_type_finder_impl(struct drgn_program *prog,
|
|
struct drgn_type_finder *finder,
|
|
const char *name,
|
|
const struct drgn_type_finder_ops *ops,
|
|
void *arg, size_t enable_index);
|
|
|
|
struct drgn_error *
|
|
drgn_program_register_object_finder_impl(struct drgn_program *prog,
|
|
struct drgn_object_finder *finder,
|
|
const char *name,
|
|
const struct drgn_object_finder_ops *ops,
|
|
void *arg, size_t enable_index);
|
|
|
|
struct drgn_error *
|
|
drgn_program_register_symbol_finder_impl(struct drgn_program *prog,
|
|
struct drgn_symbol_finder *finder,
|
|
const char *name,
|
|
const struct drgn_symbol_finder_ops *ops,
|
|
void *arg, size_t enable_index);
|
|
|
|
/**
|
|
* Call before a blocking (I/O or long-running) operation.
|
|
*
|
|
* Must be paired with @ref drgn_program_end_blocking().
|
|
*
|
|
* @return Opaque pointer to pass to @ref drgn_program_end_blocking().
|
|
*/
|
|
void *drgn_program_begin_blocking(struct drgn_program *prog);
|
|
|
|
/**
|
|
* Call after a blocking (I/O or long-running) operation.
|
|
*
|
|
* @param[in] state Return value of @ref drgn_program_begin_blocking().
|
|
*/
|
|
void drgn_program_end_blocking(struct drgn_program *prog, void *state);
|
|
|
|
struct drgn_blocking_guard_struct {
|
|
struct drgn_program *prog;
|
|
void *state;
|
|
};
|
|
|
|
static inline struct drgn_blocking_guard_struct
|
|
drgn_blocking_guard_init(struct drgn_program *prog)
|
|
{
|
|
return (struct drgn_blocking_guard_struct){
|
|
prog, drgn_program_begin_blocking(prog),
|
|
};
|
|
}
|
|
|
|
static inline void
|
|
drgn_blocking_guard_cleanup(struct drgn_blocking_guard_struct *guard)
|
|
{
|
|
drgn_program_end_blocking(guard->prog, guard->state);
|
|
}
|
|
|
|
/**
|
|
* Scope guard that wraps @ref drgn_program_begin_blocking() and @ref
|
|
* drgn_program_end_blocking().
|
|
*/
|
|
#define drgn_blocking_guard(prog) \
|
|
struct drgn_blocking_guard_struct PP_UNIQUE(guard) \
|
|
__attribute__((__cleanup__(drgn_blocking_guard_cleanup), __unused__)) = \
|
|
drgn_blocking_guard_init(prog)
|
|
|
|
/**
|
|
* @}
|
|
* @}
|
|
*/
|
|
|
|
#endif /* DRGN_PROGRAM_H */
|