2023-12-07 19:21:39 +00:00
/* SPDX-License-Identifier: GPL-2.0 */
/*
* Copyright ( c ) 2023 Meta Platforms , Inc . and affiliates .
* Copyright ( c ) 2023 David Vernet < dvernet @ meta . com >
* Copyright ( c ) 2023 Tejun Heo < tj @ kernel . org >
*/
# include <stdio.h>
# include <unistd.h>
2023-12-09 12:50:12 +00:00
# include <inttypes.h>
2023-12-07 19:21:39 +00:00
# include <signal.h>
# include <libgen.h>
# include <bpf/bpf.h>
# include <scx/common.h>
# include "scx_nest.bpf.skel.h"
# include "scx_nest.h"
# define SAMPLING_CADENCE_S 2
const char help_fmt [ ] =
" A Nest sched_ext scheduler. \n "
" \n "
" See the top-level comment in .bpf.c for more details. \n "
" \n "
" Usage: %s [-p] [-d DELAY] [-m <max>] [-i ITERS] \n "
" \n "
" -d DELAY_US Delay (us), before removing an idle core from the primary nest (default 2000us / 2ms) \n "
" -m R_MAX Maximum number of cores in the reserve nest (default 5) \n "
" -i ITERS Number of successive placement failures tolerated before trying to aggressively expand primary nest (default 2), or 0 to disable \n "
" -s SLICE_US Override slice duration in us (default 20000us / 20ms) \n "
" -I First try to find a fully idle core, and then any idle core, when searching nests. Default behavior is to ignore hypertwins and check for any idle core. \n "
2024-04-29 21:13:46 +01:00
" -v Print libbpf debug messages \n "
2023-12-07 19:21:39 +00:00
" -h Display this help and exit \n " ;
2024-04-29 21:13:46 +01:00
static bool verbose ;
2023-12-07 19:21:39 +00:00
static volatile int exit_req ;
2024-04-29 21:13:46 +01:00
static int libbpf_print_fn ( enum libbpf_print_level level , const char * format , va_list args )
{
if ( level = = LIBBPF_DEBUG & & ! verbose )
return 0 ;
return vfprintf ( stderr , format , args ) ;
}
2023-12-07 19:21:39 +00:00
static void sigint_handler ( int nest )
{
exit_req = 1 ;
}
struct nest_stat {
const char * label ;
enum nest_stat_group group ;
enum nest_stat_idx idx ;
} ;
# define NEST_ST(__stat, __grp, __desc) { \
. label = # __stat , \
. group = __grp , \
. idx = NEST_STAT ( __stat ) \
} ,
static struct nest_stat nest_stats [ NEST_STAT ( NR ) ] = {
# include "scx_nest_stats_table.h"
} ;
# undef NEST_ST
static void read_stats ( struct scx_nest * skel , u64 * stats )
{
int nr_cpus = libbpf_num_possible_cpus ( ) ;
u64 cnts [ NEST_STAT ( NR ) ] [ nr_cpus ] ;
u32 idx ;
memset ( stats , 0 , sizeof ( stats [ 0 ] ) * NEST_STAT ( NR ) ) ;
for ( idx = 0 ; idx < NEST_STAT ( NR ) ; idx + + ) {
int ret , cpu ;
ret = bpf_map_lookup_elem ( bpf_map__fd ( skel - > maps . stats ) ,
& idx , cnts [ idx ] ) ;
if ( ret < 0 )
continue ;
for ( cpu = 0 ; cpu < nr_cpus ; cpu + + )
stats [ idx ] + = cnts [ idx ] [ cpu ] ;
}
}
static void print_underline ( const char * str )
{
char buf [ 64 ] ;
size_t len ;
len = strlen ( str ) ;
memset ( buf , ' - ' , len ) ;
buf [ len ] = ' \0 ' ;
printf ( " \n \n %s \n %s \n " , str , buf ) ;
}
static void print_stat_grp ( enum nest_stat_group grp )
{
const char * group ;
switch ( grp ) {
case STAT_GRP_WAKEUP :
group = " Wakeup stats " ;
break ;
case STAT_GRP_NEST :
group = " Nest stats " ;
break ;
case STAT_GRP_CONSUME :
group = " Consume stats " ;
break ;
default :
group = " Unknown stats " ;
break ;
}
print_underline ( group ) ;
}
static void print_active_nests ( const struct scx_nest * skel )
{
u64 primary = skel - > bss - > stats_primary_mask ;
u64 reserved = skel - > bss - > stats_reserved_mask ;
u64 other = skel - > bss - > stats_other_mask ;
u64 idle = skel - > bss - > stats_idle_mask ;
u32 nr_cpus = skel - > rodata - > nr_cpus , cpu ;
int idx ;
char cpus [ nr_cpus + 1 ] ;
memset ( cpus , 0 , nr_cpus + 1 ) ;
print_underline ( " Masks " ) ;
for ( idx = 0 ; idx < 4 ; idx + + ) {
const char * mask_str ;
u64 mask , total = 0 ;
memset ( cpus , ' - ' , nr_cpus ) ;
if ( idx = = 0 ) {
mask_str = " PRIMARY " ;
mask = primary ;
} else if ( idx = = 1 ) {
mask_str = " RESERVED " ;
mask = reserved ;
} else if ( idx = = 2 ) {
mask_str = " OTHER " ;
mask = other ;
} else {
mask_str = " IDLE " ;
mask = idle ;
}
for ( cpu = 0 ; cpu < nr_cpus ; cpu + + ) {
if ( mask & ( 1ULL < < cpu ) ) {
cpus [ cpu ] = ' * ' ;
total + + ;
}
}
2023-12-09 12:50:12 +00:00
printf ( " %-9s(%2 " PRIu64 " ): | %s | \n " , mask_str , total , cpus ) ;
2023-12-07 19:21:39 +00:00
}
}
int main ( int argc , char * * argv )
{
struct scx_nest * skel ;
struct bpf_link * link ;
__u32 opt ;
2024-04-29 21:13:46 +01:00
__u64 ecode ;
2023-12-07 19:21:39 +00:00
2024-04-29 21:13:46 +01:00
libbpf_set_print ( libbpf_print_fn ) ;
2023-12-07 19:21:39 +00:00
signal ( SIGINT , sigint_handler ) ;
signal ( SIGTERM , sigint_handler ) ;
2024-04-29 21:13:46 +01:00
restart :
skel = SCX_OPS_OPEN ( nest_ops , scx_nest ) ;
2023-12-07 19:21:39 +00:00
skel - > rodata - > nr_cpus = libbpf_num_possible_cpus ( ) ;
skel - > rodata - > sampling_cadence_ns = SAMPLING_CADENCE_S * 1000 * 1000 * 1000 ;
2024-04-29 21:13:46 +01:00
while ( ( opt = getopt ( argc , argv , " d:m:i:Is:vh " ) ) ! = - 1 ) {
2023-12-07 19:21:39 +00:00
switch ( opt ) {
case ' d ' :
skel - > rodata - > p_remove_ns = strtoull ( optarg , NULL , 0 ) * 1000 ;
break ;
case ' m ' :
skel - > rodata - > r_max = strtoull ( optarg , NULL , 0 ) ;
break ;
case ' i ' :
skel - > rodata - > r_impatient = strtoull ( optarg , NULL , 0 ) ;
break ;
case ' I ' :
skel - > rodata - > find_fully_idle = true ;
break ;
case ' s ' :
skel - > rodata - > slice_ns = strtoull ( optarg , NULL , 0 ) * 1000 ;
break ;
2024-04-29 21:13:46 +01:00
case ' v ' :
verbose = true ;
break ;
2023-12-07 19:21:39 +00:00
default :
fprintf ( stderr , help_fmt , basename ( argv [ 0 ] ) ) ;
return opt ! = ' h ' ;
}
}
2024-03-07 20:44:09 +00:00
SCX_OPS_LOAD ( skel , nest_ops , scx_nest , uei ) ;
2024-05-18 01:16:56 +01:00
link = SCX_OPS_ATTACH ( skel , nest_ops , scx_nest ) ;
2023-12-07 19:21:39 +00:00
2024-03-07 20:44:09 +00:00
while ( ! exit_req & & ! UEI_EXITED ( skel , uei ) ) {
2023-12-07 19:21:39 +00:00
u64 stats [ NEST_STAT ( NR ) ] ;
enum nest_stat_idx i ;
enum nest_stat_group last_grp = - 1 ;
read_stats ( skel , stats ) ;
for ( i = 0 ; i < NEST_STAT ( NR ) ; i + + ) {
struct nest_stat * nest_stat ;
nest_stat = & nest_stats [ i ] ;
if ( nest_stat - > group ! = last_grp ) {
print_stat_grp ( nest_stat - > group ) ;
last_grp = nest_stat - > group ;
}
2023-12-09 12:50:12 +00:00
printf ( " %s=% " PRIu64 " \n " , nest_stat - > label , stats [ nest_stat - > idx ] ) ;
2023-12-07 19:21:39 +00:00
}
printf ( " \n " ) ;
print_active_nests ( skel ) ;
printf ( " \n " ) ;
printf ( " \n " ) ;
printf ( " \n " ) ;
fflush ( stdout ) ;
sleep ( SAMPLING_CADENCE_S ) ;
}
bpf_link__destroy ( link ) ;
2024-04-29 21:13:46 +01:00
ecode = UEI_REPORT ( skel , uei ) ;
2023-12-07 19:21:39 +00:00
scx_nest__destroy ( skel ) ;
2024-04-29 21:13:46 +01:00
if ( UEI_ECODE_RESTART ( ecode ) )
goto restart ;
2023-12-07 19:21:39 +00:00
return 0 ;
}