diff --git a/eBPF_Supermarket/CPU_Subsystem/cpu_watcher/bpf/mutrace.bpf.c b/eBPF_Supermarket/CPU_Subsystem/cpu_watcher/bpf/mutrace.bpf.c index e2e24aa65..c1552cb23 100644 --- a/eBPF_Supermarket/CPU_Subsystem/cpu_watcher/bpf/mutrace.bpf.c +++ b/eBPF_Supermarket/CPU_Subsystem/cpu_watcher/bpf/mutrace.bpf.c @@ -22,13 +22,22 @@ char LICENSE[] SEC("license") = "Dual BSD/GPL"; -BPF_HASH(mutex_info_map,u64,struct mutex_info, 1024); - +const int ctrl_key = 0; +BPF_HASH(mutex_info_map, u64, struct mutex_info_kernel, 1024); +BPF_ARRAY(mu_ctrl_map, int, struct mu_ctrl, 1); struct { __uint(type, BPF_MAP_TYPE_RINGBUF); __uint(max_entries, 256 * 1024); } rb SEC(".maps"); +static inline struct mu_ctrl *get_mu_ctrl(void) { + struct mu_ctrl *mu_ctrl; + mu_ctrl = bpf_map_lookup_elem(&mu_ctrl_map, &ctrl_key); + if (!mu_ctrl || !mu_ctrl->mu_func) { + return NULL; + } + return mu_ctrl; +} /*----------------------------------------------*/ /* 内核态互斥锁 */ @@ -36,21 +45,23 @@ struct { SEC("kprobe/mutex_lock") int BPF_KPROBE(trace_mutex_lock, struct mutex *lock) { - u64 lock_addr = (u64)lock; // 获取锁地址 - u64 ts = bpf_ktime_get_ns(); - struct mutex_info *info = bpf_map_lookup_elem(&mutex_info_map, &lock_addr); + u64 lock_addr = (u64)lock; // 获取锁地址 + u64 ts = bpf_ktime_get_ns(); + struct mutex_info_kernel *info = bpf_map_lookup_elem(&mutex_info_map, &lock_addr); if (info) { - info->acquire_time = ts; // 保存锁获取时间 + info->acquire_time = ts; // 保存锁获取时间 } else { - struct mutex_info new_info = { + struct mutex_info_kernel new_info = { .locked_total = 0, .locked_max = 0, .contended_total = 0, + .count = 0, .last_owner = 0, .acquire_time = ts, .ptr = lock_addr }; - bpf_map_update_elem(&mutex_info_map, &lock_addr, &new_info, BPF_ANY); + __builtin_memset(new_info.last_name, 0, sizeof(new_info.last_name)); + bpf_map_update_elem(&mutex_info_map, &lock_addr, &new_info, BPF_ANY); } return 0; } @@ -58,21 +69,23 @@ int BPF_KPROBE(trace_mutex_lock, struct mutex *lock) { SEC("kprobe/mutex_trylock") int BPF_KPROBE(trace_mutex_trylock, struct mutex *lock) { int ret = PT_REGS_RC(ctx); - if (ret == 0) { // 成功获取锁 - u64 lock_addr = (u64)lock; // 获取锁地址 - u64 ts = bpf_ktime_get_ns(); - struct mutex_info *info = bpf_map_lookup_elem(&mutex_info_map, &lock_addr); + if (ret != 0) { // 成功获取锁 + u64 lock_addr = (u64)lock; // 获取锁地址 + u64 ts = bpf_ktime_get_ns(); + struct mutex_info_kernel *info = bpf_map_lookup_elem(&mutex_info_map, &lock_addr); if (info) { - info->acquire_time = ts; + info->acquire_time = ts; } else { - struct mutex_info new_info = { + struct mutex_info_kernel new_info = { .locked_total = 0, .locked_max = 0, .contended_total = 0, + .count = 0, .last_owner = 0, .acquire_time = ts, .ptr = lock_addr }; + __builtin_memset(new_info.last_name, 0, sizeof(new_info.last_name)); bpf_map_update_elem(&mutex_info_map, &lock_addr, &new_info, BPF_ANY); } } @@ -81,6 +94,7 @@ int BPF_KPROBE(trace_mutex_trylock, struct mutex *lock) { SEC("kprobe/__mutex_lock_slowpath") int BPF_KPROBE(trace_mutex_lock_slowpath, struct mutex *lock) { + struct mu_ctrl *mu_ctrl = get_mu_ctrl(); struct mutex_contention_event *e; struct task_struct *owner_task; struct task_struct *contender_task; @@ -98,7 +112,7 @@ int BPF_KPROBE(trace_mutex_lock_slowpath, struct mutex *lock) { bpf_probe_read_kernel(&owner, sizeof(owner), &lock->owner); owner_task = (struct task_struct *)(owner & ~0x1L); contender_task = (struct task_struct *)bpf_get_current_task(); - bpf_probe_read_kernel(&e->contender_prio, sizeof(e->contender_prio), &contender_task->prio); + bpf_probe_read_kernel(&e->contender_prio, sizeof(e->contender_prio), &contender_task->prio); if (owner_task) { bpf_probe_read_kernel(&e->owner_pid, sizeof(e->owner_pid), &owner_task->pid); bpf_probe_read_kernel_str(&e->owner_name, sizeof(e->owner_name), owner_task->comm); @@ -107,18 +121,22 @@ int BPF_KPROBE(trace_mutex_lock_slowpath, struct mutex *lock) { e->owner_pid = 0; __builtin_memset(e->owner_name, 0, sizeof(e->owner_name)); } - struct mutex_info *info = bpf_map_lookup_elem(&mutex_info_map, &lock_addr); + struct mutex_info_kernel *info = bpf_map_lookup_elem(&mutex_info_map, &lock_addr); if (info) { - info->contended_total += ts - info->acquire_time; + u64 contention_start = ts; + info->contended_total += (contention_start - info->acquire_time); // 更新争用时间 + info->count++; // 更新争用次数 } else { - struct mutex_info new_info = { + struct mutex_info_kernel new_info = { .locked_total = 0, .locked_max = 0, - .contended_total = ts, + .contended_total = 0, + .count = 1, // 初始化争用次数 .last_owner = 0, - .acquire_time = 0, + .acquire_time = ts, // 初始化获取时间 .ptr = lock_addr }; + __builtin_memset(new_info.last_name, 0, sizeof(new_info.last_name)); bpf_map_update_elem(&mutex_info_map, &lock_addr, &new_info, BPF_ANY); } bpf_ringbuf_submit(e, 0); @@ -130,7 +148,7 @@ int BPF_KPROBE(trace_mutex_unlock, struct mutex *lock) { u64 lock_addr = (u64)lock; u64 ts = bpf_ktime_get_ns(); pid_t pid = bpf_get_current_pid_tgid(); - struct mutex_info *info = bpf_map_lookup_elem(&mutex_info_map, &lock_addr); + struct mutex_info_kernel *info = bpf_map_lookup_elem(&mutex_info_map, &lock_addr); if (info) { u64 held_time = ts - info->acquire_time; // 计算锁被持有的时间 info->locked_total += held_time; // 更新锁被持有的总时间 @@ -138,35 +156,38 @@ int BPF_KPROBE(trace_mutex_unlock, struct mutex *lock) { info->locked_max = held_time; // 更新锁被持有的最长时间 } info->last_owner = pid; // 更新最后一次持有该锁的线程ID + bpf_get_current_comm(&info->last_name, sizeof(info->last_name)); // 更新最后一次持有该锁的线程名称 } return 0; } + + /*----------------------------------------------*/ /* 用户态互斥锁 */ /*----------------------------------------------*/ // SEC("uprobe") -// int BPF_KPROBE(pthread_mutex_lock_init, pthread_mutex_t *mutex){ +// int BPF_KPROBE(pthread_mutex_lock_init, void *__mutex){ // } // SEC("uprobe") -// int BPF_KPROBE(pthread_mutex_lock,pthread_mutex_t *mutex){ +// int BPF_KPROBE(pthread_mutex_lock,void *__mutex){ // } // SEC("uprobe") -// int BPF_KPROBE(pthread_mutex_try, pthread_mutex_t *mutex){ +// int BPF_KPROBE(pthread_mutex_trylock, void *__mutex){ // } // SEC("uprobe") -// int BPF_KPROBE(pthread_mutex_unlock, pthread_mutex_t *mutex){ +// int BPF_KPROBE(pthread_mutex_unlock, void *__mutex){ // } // SEC("uprobe") -// int BPF_KPROBE(pthread_mutex_destroy, pthread_mutex_t *mutex){ +// int BPF_KPROBE(pthread_mutex_destroy,void *__mutex){ -// } \ No newline at end of file +// } diff --git a/eBPF_Supermarket/CPU_Subsystem/cpu_watcher/controller.c b/eBPF_Supermarket/CPU_Subsystem/cpu_watcher/controller.c index 7c8cde155..b507e48ff 100644 --- a/eBPF_Supermarket/CPU_Subsystem/cpu_watcher/controller.c +++ b/eBPF_Supermarket/CPU_Subsystem/cpu_watcher/controller.c @@ -39,6 +39,8 @@ static struct env { bool SCHEDULE_DELAY; bool MQ_DELAY; int freq; + bool mutrace; + bool mutex_detail; } env = { .usemode = 0, .SAR = false, @@ -51,6 +53,8 @@ static struct env { .SCHEDULE_DELAY = false, .MQ_DELAY = false, .freq = 99, + .mutrace = false, + .mutex_detail = false, }; const char argp_program_doc[] ="Trace process to get cpu watcher.\n"; @@ -66,7 +70,9 @@ static const struct argp_option opts[] = { {"preempt_time", 'p', 0, 0, "Print preempt_time (the data of preempt_schedule)" }, {"schedule_delay", 'd', 0, 0, "Print schedule_delay (the data of cpu)" }, {"schedule_delay_min_us_set", 'e', "THRESHOLD", 0, "Print scheduling delays that exceed the threshold (the data of cpu)" }, - {"mq_delay", 'm', 0, 0, "Print mq_delay(the data of proc)" }, + {"mq_delay", 'm', 0, 0, "Print mq_delay(the data of proc)" }, + {"mutrace", 'x', 0, 0, "Print kernel mutex contend" }, + {"mutex_detail", 'i', 0, 0, "Print kernel mutex details" }, { NULL, 'h', NULL, OPTION_HIDDEN, "show the full help" }, {}, }; @@ -114,7 +120,13 @@ static error_t parse_arg(int key, char *arg, struct argp_state *state) break; case 'm': env.MQ_DELAY = true; - break; + break; + case 'x': + env.mutrace = true; + break; + case 'i': + env.mutex_detail = true; + break; case 'h': argp_state_help(state, stderr, ARGP_HELP_STD_HELP); break; @@ -157,6 +169,11 @@ int deactivate_mode(){ struct mq_ctrl mq_ctrl = {false,0}; err = update_mq_ctrl_map(mq_ctrl); if(err < 0) return err; + } + if(env.mutrace){ + struct mu_ctrl mu_ctrl = {false,false,0}; + err = update_mu_ctrl_map(mu_ctrl); + if(err < 0) return err; } return 0; } @@ -223,6 +240,12 @@ int main(int argc, char **argv) err = update_mq_ctrl_map(mq_ctrl); if(err < 0) return err; } + + if(env.mutrace){ + struct mu_ctrl mu_ctrl = {true,env.mutex_detail,MUTEX_WATCHER+env.mutex_detail}; + err = update_mu_ctrl_map(mu_ctrl); + if(err < 0) return err; + } }else if(env.usemode == 2){ // deactivate mode err = deactivate_mode(); if(err<0){ diff --git a/eBPF_Supermarket/CPU_Subsystem/cpu_watcher/cpu_watcher.c b/eBPF_Supermarket/CPU_Subsystem/cpu_watcher/cpu_watcher.c index 36a533d09..3ecc8ca4f 100644 --- a/eBPF_Supermarket/CPU_Subsystem/cpu_watcher/cpu_watcher.c +++ b/eBPF_Supermarket/CPU_Subsystem/cpu_watcher/cpu_watcher.c @@ -25,6 +25,7 @@ #include #include #include +#include #include #include #include @@ -102,6 +103,8 @@ static int preemptmap_fd; static int schedulemap_fd; struct schedule_ctrl sd_ctrl = {}; static int mqmap_fd; +static int mumap_fd; +struct mu_ctrl mu_ctrl = {}; //static int prev_watcher = 0;//上一个使用的工具,用于在切换使用功能时,打印不用功能的表头; @@ -560,18 +563,55 @@ static int preempt_print(void *ctx, void *data, unsigned long data_sz) //mutrace输出 static int mutrace_print(void *ctx, void *data, unsigned long data_sz) { - const struct mutex_contention_event *e = data; - if (e->owner_pid == 0 || e->contender_pid == 0||e->owner_pid == 1) { - return 0; - } - // 增加锁争用次数 - increment_lock_count(e->ptr); - uint64_t contention_count = get_lock_count(e->ptr); - printf("%15llu %15d %15s %15d %15d %15s %15d %15ld\n", e->ptr, e->owner_pid, e->owner_name, e->owner_prio,e->contender_pid, e->contender_name, e->contender_prio,contention_count); + int err,key = 0; + err = bpf_map_lookup_elem(mumap_fd,&key,&mu_ctrl); + if (err < 0) { + fprintf(stderr, "failed to lookup infos: %d\n", err); + return -1; + } + if(!mu_ctrl.mu_func) return 0; + if(mu_ctrl.prev_watcher == MUTEX_WATCHER ){ + printf("%s\n"," lock_ptr owner_pid owner_comm owner_prio contender_pid contender_comm contender_prio contender_count"); + mu_ctrl.prev_watcher = MUTEX_WATCHER + 9;//打印表头功能关 + err = bpf_map_update_elem(mumap_fd, &key, &mu_ctrl, 0); + if(err < 0){ + fprintf(stderr, "Failed to update elem\n"); + } + }else if (mu_ctrl.prev_watcher == MUTEX_WATCHER +1) { + printf("%s\n"," lock_ptr locked_total locked_max contended_total count last_owner last_owmer_name"); + mu_ctrl.prev_watcher = MUTEX_WATCHER + 9;//打印表头功能关 + err = bpf_map_update_elem(mumap_fd, &key, &mu_ctrl, 0); + if(err < 0){ + fprintf(stderr, "Failed to update elem\n"); + } + } + if(!mu_ctrl.mutex_detail){ + const struct mutex_contention_event *e = data; + if (e->owner_pid == 0 || e->contender_pid == 0||e->owner_pid == 1) { + return 0; + } + // 增加锁争用次数 + increment_lock_count(e->ptr); + uint64_t contention_count = get_lock_count(e->ptr); + printf("%15llu %15d %15s %15d %15d %15s %15d %15ld\n", e->ptr, e->owner_pid, e->owner_name, e->owner_prio,e->contender_pid, e->contender_name, e->contender_prio,contention_count); + } return 0; } - +static int mutex_detail() { + int fd = bpf_map__fd(mu_skel->maps.mutex_info_map); + u64 key, next_key; + struct mutex_info_kernel info; + while (bpf_map_get_next_key(fd, &key, &next_key) == 0) { + int err = bpf_map_lookup_elem(fd, &next_key, &info); + if (err == 0 && info.contended_total != 0) { // 添加过滤条件 + printf(" %15llu %15lluns %15lluns %15lluns %15d %15d %20s\n", + next_key, info.locked_total, info.locked_max, info.contended_total, info.count, info.last_owner, info.last_name); + } + key = next_key; + } + return 0; +} static int schedule_print() { @@ -697,6 +737,7 @@ int main(int argc, char **argv) struct bpf_map *preempt_ctrl_map = NULL; struct bpf_map *schedule_ctrl_map = NULL; struct bpf_map *mq_ctrl_map = NULL; + struct bpf_map *mu_ctrl_map = NULL; int key = 0; int err; err = argp_parse(&argp, argc, argv, 0, NULL, NULL); @@ -967,6 +1008,18 @@ int main(int argc, char **argv) fprintf(stderr, "Failed to load and verify BPF skeleton\n"); goto mutrace_cleanup; } + err = common_pin_map(&mu_ctrl_map,mu_skel->obj,"mu_ctrl_map",mu_ctrl_path); + if(err < 0){ + goto mutrace_cleanup; + } + mumap_fd = bpf_map__fd(mu_ctrl_map); + struct mu_ctrl init_value = {false,false,MUTEX_WATCHER}; + + err = bpf_map_update_elem(mumap_fd, &key, &init_value, 0); + if(err < 0){ + fprintf(stderr, "Failed to update elem\n"); + goto mutrace_cleanup; + } //ctrl if(err < 0){ goto mutrace_cleanup; @@ -983,7 +1036,6 @@ int main(int argc, char **argv) } rb = ring_buffer__new(bpf_map__fd(mu_skel->maps.rb), mutrace_print, NULL, NULL); - printf("%s\n"," lock_ptr owner_pid owner_comm owner_prio contender_pid contender_comm contender_prio contender_count"); if (!rb) { err = -1; fprintf(stderr, "Failed to create ring buffer\n"); @@ -1091,6 +1143,11 @@ int main(int argc, char **argv) printf("Error polling perf buffer: %d\n", err); break; } + if(env.MUTRACE&&mu_ctrl.mutex_detail){ + err = mutex_detail(); + sleep(1); + printf("-------------------------------------------------------------\n"); + } } else { printf("正在开发中......\n-c 打印cs_delay:\t对内核函数schedule()的执行时长进行测试;\n-s sar工具;\n-y 打印sc_delay:\t系统调用运行延迟进行检测; \n-p 打印preempt_time:\t对抢占调度时间输出;\n"); @@ -1136,4 +1193,4 @@ int main(int argc, char **argv) ring_buffer__free(rb); mutrace_bpf__destroy(mu_skel); return err < 0 ? -err : 0; -} \ No newline at end of file +} diff --git a/eBPF_Supermarket/CPU_Subsystem/cpu_watcher/include/cpu_watcher.h b/eBPF_Supermarket/CPU_Subsystem/cpu_watcher/include/cpu_watcher.h index 3425e8975..54a328542 100644 --- a/eBPF_Supermarket/CPU_Subsystem/cpu_watcher/include/cpu_watcher.h +++ b/eBPF_Supermarket/CPU_Subsystem/cpu_watcher/include/cpu_watcher.h @@ -158,11 +158,13 @@ struct proc_history { /*----------------------------------------------*/ /* mutrace相关结构体 */ /*----------------------------------------------*/ -struct mutex_info { +struct mutex_info_kernel { u64 locked_total;//锁被持有的总时间 u64 locked_max;//锁被持有的最长时间 u64 contended_total;//锁发生竞争的总时间 + int count;//记录锁被争用的总次数 pid_t last_owner;//最后一次持有该锁的线程 ID + char last_name[TASK_COMM_LEN]; u64 acquire_time; // 锁每次被获取的时间戳,方便后续计算 u64 ptr;//地址 }; @@ -288,4 +290,10 @@ struct mq_ctrl{ int prev_watcher; }; +struct mu_ctrl{ + bool mu_func; + bool mutex_detail; + int prev_watcher; +}; + #endif // CPU_WATCHER_H \ No newline at end of file diff --git a/eBPF_Supermarket/CPU_Subsystem/cpu_watcher/include/cpu_watcher_helper.h b/eBPF_Supermarket/CPU_Subsystem/cpu_watcher/include/cpu_watcher_helper.h index dc78f2622..3db69defd 100644 --- a/eBPF_Supermarket/CPU_Subsystem/cpu_watcher/include/cpu_watcher_helper.h +++ b/eBPF_Supermarket/CPU_Subsystem/cpu_watcher/include/cpu_watcher_helper.h @@ -25,6 +25,7 @@ #define PREEMPT_WACTHER 40 #define SCHEDULE_WACTHER 50 #define MQ_WACTHER 60 +#define MUTEX_WATCHER 70 #define HASH_SIZE 1024 /*----------------------------------------------*/ @@ -74,6 +75,7 @@ const char *sc_ctrl_path = "/sys/fs/bpf/cpu_watcher_map/sc_ctrl_map"; const char *preempt_ctrl_path = "/sys/fs/bpf/cpu_watcher_map/preempt_ctrl_map"; const char *schedule_ctrl_path = "/sys/fs/bpf/cpu_watcher_map/schedule_ctrl_map"; const char *mq_ctrl_path = "/sys/fs/bpf/cpu_watcher_map/mq_ctrl_map"; +const char *mu_ctrl_path = "/sys/fs/bpf/cpu_watcher_map/mu_ctrl_map"; int common_pin_map(struct bpf_map **bpf_map, const struct bpf_object *obj, const char *map_name, const char *ctrl_path) { @@ -203,6 +205,23 @@ int update_mq_ctrl_map(struct mq_ctrl mq_ctrl){ return 0; } +int update_mu_ctrl_map(struct mu_ctrl mu_ctrl){ + int err,key = 0; + int srcmap_fd; + + srcmap_fd = bpf_obj_get(mu_ctrl_path); + if (srcmap_fd < 0) { + fprintf(stderr,"Failed to open mq_ctrl_map file\n"); + return srcmap_fd; + } + err = bpf_map_update_elem(srcmap_fd,&key,&mu_ctrl, 0); + if(err < 0){ + fprintf(stderr, "Failed to update mq_ctrl_map elem\n"); + return err; + } + + return 0; +} /*----------------------------------------------*/ /* mutex_count */ /*----------------------------------------------*/ diff --git a/eBPF_Supermarket/CPU_Subsystem/cpu_watcher/test/test_cpuwatcher.c b/eBPF_Supermarket/CPU_Subsystem/cpu_watcher/test/test_cpuwatcher.c index ada9abd83..59bb2dcb6 100644 --- a/eBPF_Supermarket/CPU_Subsystem/cpu_watcher/test/test_cpuwatcher.c +++ b/eBPF_Supermarket/CPU_Subsystem/cpu_watcher/test/test_cpuwatcher.c @@ -19,6 +19,7 @@ static struct env { bool mq_delay_test; bool preempt_test; bool schedule_test; + bool mutrace_test; } env = { .sar_test = false, .cs_delay_test = false, @@ -26,6 +27,7 @@ static struct env { .mq_delay_test = false, .preempt_test = false, .schedule_test = false, + .mutrace_test = false, }; const char argp_program_doc[] ="To test cpu_watcher.\n"; @@ -37,6 +39,7 @@ static const struct argp_option opts[] = { { "mq_delay", 'm', NULL, 0, "To test mq_delay", 0 }, { "preempt_delay", 'p', NULL, 0, "To test preempt_delay", 0 }, { "schedule_delay", 'd', NULL, 0, "To test schedule_delay", 0 }, + { "mu_trace", 'x', NULL, 0, "To test mutrace", 0 }, { "all", 'a', NULL, 0, "To test all", 0 }, { NULL, 'h', NULL, OPTION_HIDDEN, "show the full help", 0 }, {}, @@ -71,6 +74,9 @@ static error_t parse_arg(int key, char *arg, struct argp_state *state) break; case 'd': env.schedule_test = true; + break; + case 'x': + env.mutrace_test = true; break; case 'h': argp_state_help(state, stderr, ARGP_HELP_STD_HELP); @@ -191,5 +197,17 @@ int main(int argc, char **argv){ printf("\n"); } + if(env.mutrace_test){ + printf("MUTRACE_TEST----------------------------------------------\n"); + //MUTRACE功能测试逻辑:系统上执行混合压力测试,包括4个顺序读写硬盘线程、4个IO操作线程,持续15秒,观察加压前后的变化。 + char *argvv[] = { "/usr/bin/stress-ng", "--hdd", "4", "--hdd-opts", "wr-seq,rd-seq", "--io", "4", "--timeout", "15s", "--metrics-brief", NULL }; + char *envp[] = { "PATH=/bin", NULL }; + printf("MUTRACE功能测试逻辑:系统上执行混合压力测试,包括4个顺序读写硬盘线程、4个IO操作线程和4个UDP网络操作线程,持续15秒,观察加压前后的变化\n"); + printf("执行指令 stress-ng --hdd 4 --hdd-opts wr-seq,rd-seq --io 4 --udp 4 --timeout 15s --metrics-brief\n"); + execve("/usr/bin/stress-ng", argvv, envp); + perror("execve"); + printf("\n"); + } + return 0; }