drgn/libdrgn/program.h
Omar Sandoval 1487db5389 libdrgn: stack_trace: get rid of PRSTATUS PID match heuristic
Commit 1b47b866b4 ("libdrgn: go back to trusting PRSTATUS PID")
introduced a check so that we only use the PRSTATUS note for stack
unwinding if its PID field matches the PID of the task we're trying to
unwind. This was intended to detect when a CPU was in the middle of a
context switch during a crash. However, it has caused more trouble than
it's worth. For example:

1. It's broken on s390x, which puts the CPU number + 1 in the PID field.
   See also commit 7cb3e99b23 ("libdrgn: program: find crashed task
   with cpu_curr() instead of find_task()").
2. It's broken on dumps from QEMU's dump-guest-memory command, which
   also puts the CPU number + 1 in the PID field. See issue #356.
3. It breaks the reasonable assumption that
   prog.stack_trace(cpu_curr(prog, cpu)) always gets the stack trace for
   a given CPU. This slowed down an internal scheduler investigation.

It doesn't even really accomplish what it's trying to do, since the
check itself is racy. Let's remove it (which is not as simple as it
sounds, since we were also using it in lieu of a proper on_cpu fallback
for !SMP kernels).

Signed-off-by: Omar Sandoval <osandov@osandov.com>
2023-10-30 23:22:17 -07:00

417 lines
11 KiB
C

// Copyright (c) Meta Platforms, Inc. and affiliates.
// SPDX-License-Identifier: LGPL-2.1-or-later
/**
* @file
*
* Program internals.
*
* See @ref ProgramInternals.
*/
#ifndef DRGN_PROGRAM_H
#define DRGN_PROGRAM_H
#include <elfutils/libdwfl.h>
#include <libelf.h>
#include <sys/types.h>
#ifdef WITH_LIBKDUMPFILE
#include <libkdumpfile/kdumpfile.h>
#endif
#include "debug_info.h"
#include "drgn.h"
#include "hash_table.h"
#include "language.h"
#include "memory_reader.h"
#include "object_index.h"
#include "platform.h"
#include "pp.h"
#include "type.h"
#include "vector.h"
/**
* @defgroup Internals Internals
*
* Internal implementation
*
* @{
*
* @defgroup ProgramInternals Programs
*
* Program internals.
*
* @{
*/
struct drgn_thread {
struct drgn_program *prog;
uint32_t tid;
struct nstring prstatus;
struct drgn_object object;
};
DEFINE_VECTOR_TYPE(drgn_typep_vector, struct drgn_type *);
DEFINE_VECTOR_TYPE(drgn_prstatus_vector, struct nstring);
DEFINE_HASH_TABLE_TYPE(drgn_thread_set, struct drgn_thread);
struct drgn_program {
/** @privatesection */
/*
* Memory/core dump.
*/
struct drgn_memory_reader reader;
/* Elf core dump or /proc/pid/mem file segments. */
struct drgn_memory_file_segment *file_segments;
/* Elf core dump. Not valid for live programs or kdump files. */
Elf *core;
/* File descriptor for ELF core dump, kdump file, or /proc/pid/mem. */
int core_fd;
/* PID of live userspace program. */
pid_t pid;
#ifdef WITH_LIBKDUMPFILE
kdump_ctx_t *kdump_ctx;
#endif
/*
* Types.
*/
/** Callbacks for finding types. */
struct drgn_type_finder *type_finders;
/** Void type for each language. */
struct drgn_type void_types[DRGN_NUM_LANGUAGES];
/** Cache of primitive types. */
struct drgn_type *primitive_types[DRGN_PRIMITIVE_TYPE_NUM];
/** Cache of deduplicated types. */
struct drgn_dedupe_type_set dedupe_types;
/**
* List of created types that are not deduplicated: types with non-empty
* lists of members, parameters, template parameters, or enumerators.
*
* Members, parameters, and template parameters contain lazily-evaluated
* objects, so they cannot be easily deduplicated.
*
* Enumerators could be deduplicated, but it's probably not worth the
* effort to hash and compare them.
*/
struct drgn_typep_vector created_types;
/** Cache for @ref drgn_program_find_member(). */
struct drgn_member_map members;
/**
* Set of types which have been already cached in @ref
* drgn_program::members.
*/
struct drgn_type_set members_cached;
/*
* Debugging information.
*/
struct drgn_object_index oindex;
struct drgn_debug_info dbinfo;
/*
* Program information.
*/
/* Default language of the program. */
const struct drgn_language *lang;
struct drgn_platform platform;
bool has_platform;
enum drgn_program_flags flags;
/*
* Threads/stack traces.
*/
union {
/*
* For the Linux kernel, PRSTATUS notes indexed by CPU. See
* drgn_get_initial_registers() for why we don't use the PID
* map.
*/
struct drgn_prstatus_vector prstatus_vector;
/* For userspace programs, threads indexed by PID. */
struct drgn_thread_set thread_set;
};
struct drgn_thread *main_thread;
struct drgn_thread *crashed_thread;
/*
* AArch64 instruction pointer authentication code mask, parsed either
* from NT_ARM_PAC_MASK or VMCOREINFO.
*/
uint64_t aarch64_insn_pac_mask;
bool core_dump_notes_cached;
bool prefer_orc_unwinder;
/*
* Linux kernel-specific.
*/
/* The important parts of the VMCOREINFO note of a Linux kernel core. */
struct {
/** <tt>uname -r</tt> */
char osrelease[128];
/** PAGE_SIZE of the kernel. */
uint64_t page_size;
/**
* The offset from the compiled address of the kernel image to its
* actual address in memory.
*
* This is non-zero if kernel address space layout randomization (KASLR)
* is enabled.
*/
uint64_t kaslr_offset;
/** Kernel page table. */
uint64_t swapper_pg_dir;
/** Length of mem_section array (i.e., NR_SECTION_ROOTS). */
uint64_t mem_section_length;
/** VA_BITS on AArch64. */
uint64_t va_bits;
/** Whether 5-level paging was enabled on x86-64. */
bool pgtable_l5_enabled;
/** PAGE_SHIFT of the kernel (derived from PAGE_SIZE). */
int page_shift;
/** The original vmcoreinfo data, to expose as an object */
char *raw;
size_t raw_size;
} vmcoreinfo;
/*
* Difference between a virtual address in the direct mapping and the
* physical address it maps to.
*/
uint64_t direct_mapping_offset;
/* Cached vmemmap. */
struct drgn_object vmemmap;
/* Page table iterator. */
struct pgtable_iterator *pgtable_it;
/*
* Whether we are currently in address translation. Used to prevent
* address translation from recursing.
*/
bool in_address_translation;
/* Whether @ref drgn_program::direct_mapping_offset has been cached. */
bool direct_mapping_offset_cached;
/*
* Logging.
*/
drgn_log_fn *log_fn;
void *log_arg;
enum drgn_log_level log_level;
/*
* Blocking callbacks.
*/
drgn_program_begin_blocking_fn *begin_blocking_fn;
drgn_program_end_blocking_fn *end_blocking_fn;
void *blocking_arg;
};
/** Initialize a @ref drgn_program. */
void drgn_program_init(struct drgn_program *prog,
const struct drgn_platform *platform);
/** Deinitialize a @ref drgn_program. */
void drgn_program_deinit(struct drgn_program *prog);
/**
* Set the @ref drgn_platform of a @ref drgn_program if it hasn't been set
* yet.
*/
void drgn_program_set_platform(struct drgn_program *prog,
const struct drgn_platform *platform);
/**
* Implement @ref drgn_program_from_core_dump() on an initialized @ref
* drgn_program.
*/
struct drgn_error *drgn_program_init_core_dump(struct drgn_program *prog,
const char *path);
/**
* Implement @ref drgn_program_from_core_dump_fd() on an initialized @ref
* drgn_program.
*/
struct drgn_error *drgn_program_init_core_dump_fd(struct drgn_program *prog,
int fd);
/**
* Implement @ref drgn_program_from_kernel() on an initialized @ref
* drgn_program.
*/
struct drgn_error *drgn_program_init_kernel(struct drgn_program *prog);
/**
* Implement @ref drgn_program_from_pid() on an initialized @ref drgn_program.
*/
struct drgn_error *drgn_program_init_pid(struct drgn_program *prog, pid_t pid);
struct drgn_error *
drgn_program_add_object_finder_impl(struct drgn_program *prog,
struct drgn_object_finder *finder,
drgn_object_find_fn fn, void *arg);
static inline struct drgn_error *
drgn_program_is_little_endian(struct drgn_program *prog, bool *ret)
{
if (!prog->has_platform) {
return drgn_error_create(DRGN_ERROR_INVALID_ARGUMENT,
"program byte order is not known");
}
*ret = drgn_platform_is_little_endian(&prog->platform);
return NULL;
}
/**
* Return whether a @ref drgn_program has a different endianness than the host
* system.
*/
static inline struct drgn_error *
drgn_program_bswap(struct drgn_program *prog, bool *ret)
{
if (!prog->has_platform) {
return drgn_error_create(DRGN_ERROR_INVALID_ARGUMENT,
"program byte order is not known");
}
*ret = drgn_platform_bswap(&prog->platform);
return NULL;
}
static inline struct drgn_error *
drgn_program_is_64_bit(struct drgn_program *prog, bool *ret)
{
if (!prog->has_platform) {
return drgn_error_create(DRGN_ERROR_INVALID_ARGUMENT,
"program word size is not known");
}
*ret = drgn_platform_is_64_bit(&prog->platform);
return NULL;
}
static inline struct drgn_error *
drgn_program_address_size(struct drgn_program *prog, uint8_t *ret)
{
if (!prog->has_platform) {
return drgn_error_create(DRGN_ERROR_INVALID_ARGUMENT,
"program address size is not known");
}
*ret = drgn_platform_address_size(&prog->platform);
return NULL;
}
static inline struct drgn_error *
drgn_program_address_mask(const struct drgn_program *prog, uint64_t *ret)
{
if (!prog->has_platform) {
return drgn_error_create(DRGN_ERROR_INVALID_ARGUMENT,
"program address size is not known");
}
*ret = drgn_platform_address_mask(&prog->platform);
return NULL;
}
struct drgn_error *drgn_thread_dup_internal(const struct drgn_thread *thread,
struct drgn_thread *ret);
void drgn_thread_deinit(struct drgn_thread *thread);
/**
* Find the @c NT_PRSTATUS note for the given CPU.
*
* This is only valid for the Linux kernel.
*
* @param[out] ret Returned note data. If not found, <tt>ret->str</tt> is set to
* @c NULL and <tt>ret->len</tt> is set to zero.
*/
struct drgn_error *drgn_program_find_prstatus_by_cpu(struct drgn_program *prog,
uint32_t cpu,
struct nstring *ret);
/**
* Find the @c NT_PRSTATUS note for the given thread ID.
*
* This is only valid for userspace programs.
*
* @param[out] ret Returned note data. If not found, <tt>ret->str</tt> is set to
* @c NULL and <tt>ret->len</tt> is set to zero.
*/
struct drgn_error *drgn_program_find_prstatus_by_tid(struct drgn_program *prog,
uint32_t tid,
struct nstring *ret);
/**
* Cache the @c NT_PRSTATUS note provided by @p data in @p prog.
*
* @param[in] data The pointer to the note data.
* @param[in] size Size of data in note.
* @param[out] ret Thread ID from note.
*/
struct drgn_error *drgn_program_cache_prstatus_entry(struct drgn_program *prog,
const char *data,
size_t size,
uint32_t *ret);
/*
* Like @ref drgn_program_find_symbol_by_address(), but @p ret is already
* allocated, we may already know the module, and doesn't return a @ref
* drgn_error.
*
* @param[in] module Module containing the address. May be @c NULL, in which
* case this will look it up.
* @return Whether the symbol was found.
*/
bool drgn_program_find_symbol_by_address_internal(struct drgn_program *prog,
uint64_t address,
Dwfl_Module *module,
struct drgn_symbol *ret);
/**
* Call before a blocking (I/O or long-running) operation.
*
* Must be paired with @ref drgn_program_end_blocking().
*
* @return Opaque pointer to pass to @ref drgn_program_end_blocking().
*/
void *drgn_program_begin_blocking(struct drgn_program *prog);
/**
* Call after a blocking (I/O or long-running) operation.
*
* @param[in] state Return value of @ref drgn_program_begin_blocking().
*/
void drgn_program_end_blocking(struct drgn_program *prog, void *state);
struct drgn_blocking_guard_struct {
struct drgn_program *prog;
void *state;
};
static inline struct drgn_blocking_guard_struct
drgn_blocking_guard_init(struct drgn_program *prog)
{
return (struct drgn_blocking_guard_struct){
prog, drgn_program_begin_blocking(prog),
};
}
static inline void
drgn_blocking_guard_cleanup(struct drgn_blocking_guard_struct *guard)
{
drgn_program_end_blocking(guard->prog, guard->state);
}
/**
* Scope guard that wraps @ref drgn_program_begin_blocking() and @ref
* drgn_program_end_blocking().
*/
#define drgn_blocking_guard(prog) \
struct drgn_blocking_guard_struct PP_UNIQUE(guard) \
__attribute__((__cleanup__(drgn_blocking_guard_cleanup), __unused__)) = \
drgn_blocking_guard_init(prog)
/**
* @}
* @}
*/
#endif /* DRGN_PROGRAM_H */