drgn/libdrgn/program.h
Omar Sandoval a47fa1f3e2 libdrgn: get initial registers for kdump from crash_notes variable
We got a couple of reports about drgn failing to get a stack trace
(#391) or getting the wrong stack trace (#404) from a kernel core dump.
Both were caused because drgn assumes that there is an NT_PRSTATUS note
for each CPU in order by CPU number, and in these core dumps some
NT_PRSTATUS notes were missing. There are a least a couple of things
that can cause this: offline CPUs or CPUs that were in a bad state and
didn't respond to the kdump NMI. The former is expected and could be
special-cased, but the latter basically means that we can't trust the
order of the notes. Instead, look up the notes from the crash_notes
per-CPU variable that the kernel uses to populate the ELF notes. We
still need to use the actual NT_PRSTATUS notes for QEMU
dump-guest-memory dumps, but for those we need to use the PID field to
handle CPU hotplugging.

Closes #404.

Signed-off-by: Omar Sandoval <osandov@osandov.com>
2024-06-20 14:34:20 -07:00

440 lines
12 KiB
C

// Copyright (c) Meta Platforms, Inc. and affiliates.
// SPDX-License-Identifier: LGPL-2.1-or-later
/**
* @file
*
* Program internals.
*
* See @ref ProgramInternals.
*/
#ifndef DRGN_PROGRAM_H
#define DRGN_PROGRAM_H
#include <elfutils/libdwfl.h>
#include <libelf.h>
#include <sys/types.h>
#ifdef WITH_LIBKDUMPFILE
#include <libkdumpfile/kdumpfile.h>
#endif
#include "debug_info.h"
#include "drgn.h"
#include "handler.h"
#include "hash_table.h"
#include "language.h"
#include "memory_reader.h"
#include "platform.h"
#include "pp.h"
#include "symbol.h"
#include "type.h"
#include "vector.h"
struct drgn_type_finder;
struct drgn_object_finder;
struct drgn_symbol_finder;
/**
* @defgroup Internals Internals
*
* Internal implementation
*
* @{
*
* @defgroup ProgramInternals Programs
*
* Program internals.
*
* @{
*/
struct drgn_thread {
struct drgn_program *prog;
uint32_t tid;
struct nstring prstatus;
struct drgn_object object;
};
DEFINE_VECTOR_TYPE(drgn_typep_vector, struct drgn_type *);
DEFINE_HASH_TABLE_TYPE(drgn_thread_set, struct drgn_thread);
struct drgn_program {
/** @privatesection */
/*
* Memory/core dump.
*/
struct drgn_memory_reader reader;
/* Elf core dump or /proc/pid/mem file segments. */
struct drgn_memory_file_segment *file_segments;
/* Elf core dump. Not valid for live programs or kdump files. */
Elf *core;
/* File descriptor for ELF core dump, kdump file, or /proc/pid/mem. */
int core_fd;
/* PID of live userspace program. */
pid_t pid;
#ifdef WITH_LIBKDUMPFILE
kdump_ctx_t *kdump_ctx;
#endif
/*
* Types.
*/
/** Callbacks for finding types. */
struct drgn_handler_list type_finders;
/** Void type for each language. */
struct drgn_type void_types[DRGN_NUM_LANGUAGES];
/** Cache of primitive types. */
struct drgn_type *primitive_types[DRGN_PRIMITIVE_TYPE_NUM];
/** Cache of deduplicated types. */
struct drgn_dedupe_type_set dedupe_types;
/**
* List of created types that are not deduplicated: types with non-empty
* lists of members, parameters, template parameters, or enumerators.
*
* Members, parameters, and template parameters contain lazily-evaluated
* objects, so they cannot be easily deduplicated.
*
* Enumerators could be deduplicated, but it's probably not worth the
* effort to hash and compare them.
*/
struct drgn_typep_vector created_types;
/** Cache for @ref drgn_program_find_member(). */
struct drgn_member_map members;
/**
* Set of types which have been already cached in @ref
* drgn_program::members.
*/
struct drgn_type_set members_cached;
/*
* Debugging information.
*/
struct drgn_handler_list object_finders;
struct drgn_debug_info dbinfo;
struct drgn_handler_list symbol_finders;
/*
* Program information.
*/
/* Default language of the program. */
const struct drgn_language *lang;
struct drgn_platform platform;
bool has_platform;
enum drgn_program_flags flags;
/*
* Threads/stack traces.
*/
/*
* Threads indexed by TID.
*
* For the Linux kernel, this is only used to index @c PRSTATUS notes.
* See @ref drgn_program_find_prstatus().
*/
struct drgn_thread_set thread_set;
struct drgn_thread *main_thread;
struct drgn_thread *crashed_thread;
/*
* AArch64 instruction pointer authentication code mask, parsed either
* from NT_ARM_PAC_MASK or VMCOREINFO.
*/
uint64_t aarch64_insn_pac_mask;
bool core_dump_notes_cached;
bool prefer_orc_unwinder;
/*
* Linux kernel-specific.
*/
/* The important parts of the VMCOREINFO note of a Linux kernel core. */
struct {
/** <tt>uname -r</tt> */
char osrelease[128];
/** PAGE_SIZE of the kernel. */
uint64_t page_size;
/**
* The offset from the compiled address of the kernel image to its
* actual address in memory.
*
* This is non-zero if kernel address space layout randomization (KASLR)
* is enabled.
*/
uint64_t kaslr_offset;
/** Kernel page table. */
uint64_t swapper_pg_dir;
/** Length of mem_section array (i.e., NR_SECTION_ROOTS). */
uint64_t mem_section_length;
/** VA_BITS on AArch64. */
uint64_t va_bits;
/** phys_base on x86_64 */
uint64_t phys_base;
/** Whether 5-level paging was enabled on x86-64. */
bool pgtable_l5_enabled;
/** Whether CRASHTIME was in the VMCOREINFO. */
bool have_crashtime;
/** PAGE_SHIFT of the kernel (derived from PAGE_SIZE). */
int page_shift;
/** The original vmcoreinfo data, to expose as an object */
char *raw;
size_t raw_size;
} vmcoreinfo;
/*
* Difference between a virtual address in the direct mapping and the
* physical address it maps to.
*/
uint64_t direct_mapping_offset;
/* Cached vmemmap. */
struct drgn_object vmemmap;
/* Page table iterator. */
struct pgtable_iterator *pgtable_it;
/*
* Whether we are currently in address translation. Used to prevent
* address translation from recursing.
*/
bool in_address_translation;
/* Whether @ref drgn_program::direct_mapping_offset has been cached. */
bool direct_mapping_offset_cached;
/*
* Logging.
*/
drgn_log_fn *log_fn;
void *log_arg;
enum drgn_log_level log_level;
/*
* Blocking callbacks.
*/
drgn_program_begin_blocking_fn *begin_blocking_fn;
drgn_program_end_blocking_fn *end_blocking_fn;
void *blocking_arg;
};
/** Initialize a @ref drgn_program. */
void drgn_program_init(struct drgn_program *prog,
const struct drgn_platform *platform);
/** Deinitialize a @ref drgn_program. */
void drgn_program_deinit(struct drgn_program *prog);
/**
* Set the @ref drgn_platform of a @ref drgn_program if it hasn't been set
* yet.
*/
void drgn_program_set_platform(struct drgn_program *prog,
const struct drgn_platform *platform);
/**
* Implement @ref drgn_program_from_core_dump() on an initialized @ref
* drgn_program.
*/
struct drgn_error *drgn_program_init_core_dump(struct drgn_program *prog,
const char *path);
/**
* Implement @ref drgn_program_from_core_dump_fd() on an initialized @ref
* drgn_program.
*/
struct drgn_error *drgn_program_init_core_dump_fd(struct drgn_program *prog,
int fd);
/**
* Implement @ref drgn_program_from_kernel() on an initialized @ref
* drgn_program.
*/
struct drgn_error *drgn_program_init_kernel(struct drgn_program *prog);
/**
* Implement @ref drgn_program_from_pid() on an initialized @ref drgn_program.
*/
struct drgn_error *drgn_program_init_pid(struct drgn_program *prog, pid_t pid);
static inline struct drgn_error *
drgn_program_is_little_endian(struct drgn_program *prog, bool *ret)
{
if (!prog->has_platform) {
return drgn_error_create(DRGN_ERROR_INVALID_ARGUMENT,
"program byte order is not known");
}
*ret = drgn_platform_is_little_endian(&prog->platform);
return NULL;
}
/**
* Return whether a @ref drgn_program has a different endianness than the host
* system.
*/
static inline struct drgn_error *
drgn_program_bswap(struct drgn_program *prog, bool *ret)
{
if (!prog->has_platform) {
return drgn_error_create(DRGN_ERROR_INVALID_ARGUMENT,
"program byte order is not known");
}
*ret = drgn_platform_bswap(&prog->platform);
return NULL;
}
static inline struct drgn_error *
drgn_program_is_64_bit(struct drgn_program *prog, bool *ret)
{
if (!prog->has_platform) {
return drgn_error_create(DRGN_ERROR_INVALID_ARGUMENT,
"program word size is not known");
}
*ret = drgn_platform_is_64_bit(&prog->platform);
return NULL;
}
static inline struct drgn_error *
drgn_program_address_size(struct drgn_program *prog, uint8_t *ret)
{
if (!prog->has_platform) {
return drgn_error_create(DRGN_ERROR_INVALID_ARGUMENT,
"program address size is not known");
}
*ret = drgn_platform_address_size(&prog->platform);
return NULL;
}
static inline struct drgn_error *
drgn_program_address_mask(const struct drgn_program *prog, uint64_t *ret)
{
if (!prog->has_platform) {
return drgn_error_create(DRGN_ERROR_INVALID_ARGUMENT,
"program address size is not known");
}
*ret = drgn_platform_address_mask(&prog->platform);
return NULL;
}
static inline struct drgn_error *
drgn_program_untagged_addr(const struct drgn_program *prog, uint64_t *address)
{
if (!prog->has_platform) {
return drgn_error_create(DRGN_ERROR_INVALID_ARGUMENT,
"program address size is not known");
}
*address &= drgn_platform_address_mask(&prog->platform);
if (prog->platform.arch->untagged_addr)
*address = prog->platform.arch->untagged_addr(*address);
return NULL;
}
struct drgn_error *drgn_thread_dup_internal(const struct drgn_thread *thread,
struct drgn_thread *ret);
void drgn_thread_deinit(struct drgn_thread *thread);
/**
* Find the @c NT_PRSTATUS note with the given "PID".
*
* For userspace, the PID is the thread ID. For the kernel, it's complicated;
* see drgn_get_initial_registers_from_kernel_core_dump().
*
* @param[out] ret Returned note data. If not found, <tt>ret->str</tt> is set to
* @c NULL and <tt>ret->len</tt> is set to zero.
*/
struct drgn_error *drgn_program_find_prstatus(struct drgn_program *prog,
uint32_t tid,
struct nstring *ret);
/**
* Cache the @c NT_PRSTATUS note provided by @p data in @p prog.
*
* @param[in] data The pointer to the note data.
* @param[in] size Size of data in note.
* @param[out] ret Thread ID from note.
*/
struct drgn_error *drgn_program_cache_prstatus_entry(struct drgn_program *prog,
const char *data,
size_t size,
uint32_t *ret);
/*
* Like @ref drgn_program_find_symbol_by_address(), but returns @c NULL rather
* than a lookup error if the symbol was not found.
*
* @param[in] address Address to search for.
* @param [out] ret The symbol found by the lookup (if found)
* @return @c NULL unless an error (unrelated to a lookup error) was encountered
*/
struct drgn_error *
drgn_program_find_symbol_by_address_internal(struct drgn_program *prog,
uint64_t address,
struct drgn_symbol **ret);
struct drgn_error *
drgn_program_register_type_finder_impl(struct drgn_program *prog,
struct drgn_type_finder *finder,
const char *name,
const struct drgn_type_finder_ops *ops,
void *arg, size_t enable_index);
struct drgn_error *
drgn_program_register_object_finder_impl(struct drgn_program *prog,
struct drgn_object_finder *finder,
const char *name,
const struct drgn_object_finder_ops *ops,
void *arg, size_t enable_index);
struct drgn_error *
drgn_program_register_symbol_finder_impl(struct drgn_program *prog,
struct drgn_symbol_finder *finder,
const char *name,
const struct drgn_symbol_finder_ops *ops,
void *arg, size_t enable_index);
/**
* Call before a blocking (I/O or long-running) operation.
*
* Must be paired with @ref drgn_program_end_blocking().
*
* @return Opaque pointer to pass to @ref drgn_program_end_blocking().
*/
void *drgn_program_begin_blocking(struct drgn_program *prog);
/**
* Call after a blocking (I/O or long-running) operation.
*
* @param[in] state Return value of @ref drgn_program_begin_blocking().
*/
void drgn_program_end_blocking(struct drgn_program *prog, void *state);
struct drgn_blocking_guard_struct {
struct drgn_program *prog;
void *state;
};
static inline struct drgn_blocking_guard_struct
drgn_blocking_guard_init(struct drgn_program *prog)
{
return (struct drgn_blocking_guard_struct){
prog, drgn_program_begin_blocking(prog),
};
}
static inline void
drgn_blocking_guard_cleanup(struct drgn_blocking_guard_struct *guard)
{
drgn_program_end_blocking(guard->prog, guard->state);
}
/**
* Scope guard that wraps @ref drgn_program_begin_blocking() and @ref
* drgn_program_end_blocking().
*/
#define drgn_blocking_guard(prog) \
struct drgn_blocking_guard_struct PP_UNIQUE(guard) \
__attribute__((__cleanup__(drgn_blocking_guard_cleanup), __unused__)) = \
drgn_blocking_guard_init(prog)
/**
* @}
* @}
*/
#endif /* DRGN_PROGRAM_H */