Skip to content

Commit

Permalink
cpu_watcher:schedule_delay增加阈值选项&&增加controller功能 (#813)
Browse files Browse the repository at this point in the history
* cpu_watcher:schedule_delay增加阈值选项&&workflow增加测试流程

* .

* cpu_watcher:增加controller功能
  • Loading branch information
vvzxy authored Jun 11, 2024
1 parent 1749ab2 commit 2df6e9d
Show file tree
Hide file tree
Showing 10 changed files with 641 additions and 45 deletions.
3 changes: 2 additions & 1 deletion .github/workflows/ebpf_cpu_watcher.yml
Original file line number Diff line number Diff line change
Expand Up @@ -31,8 +31,9 @@ jobs:
cd eBPF_Supermarket/CPU_Subsystem/cpu_watcher/
make
sudo ./cpu_watcher
- name: Run test_cpuwatcher

- name: Run test_cpuwatcher
run: |
cd eBPF_Supermarket/CPU_Subsystem/cpu_watcher/test
make
Expand Down
13 changes: 11 additions & 2 deletions eBPF_Supermarket/CPU_Subsystem/cpu_watcher/Makefile
Original file line number Diff line number Diff line change
Expand Up @@ -44,6 +44,7 @@ ALL_LDFLAGS := $(LDFLAGS) $(EXTRA_LDFLAGS)

APPS =cs_delay sar sc_delay preempt schedule_delay mq_delay
TARGETS=cpu_watcher
CONTROLLER := controller

SRC_DIR = ./include

Expand Down Expand Up @@ -81,12 +82,12 @@ $(call allow-override,CC,$(CROSS_COMPILE)cc)
$(call allow-override,LD,$(CROSS_COMPILE)ld)

.PHONY: all
all: $(TARGETS)
all: $(CONTROLLER) $(TARGETS)

.PHONY: clean
clean:
$(call msg,CLEAN)
$(Q)rm -rf $(OUTPUT) $(TARGETS)
$(Q)rm -rf $(OUTPUT) $(TARGETS) $(CONTROLLER)

$(OUTPUT) $(OUTPUT)/libbpf $(BPFTOOL_OUTPUT):
$(call msg,MKDIR,$@)
Expand Down Expand Up @@ -132,11 +133,19 @@ $(OUTPUT)/%.o: $(SRC_DIR)/%.c | $(OUTPUT)
$(call msg,CC,$@)
$(Q)$(CC) $(CFLAGS) $(INCLUDES) -c $< -o $@

$(OUTPUT)/%.o: $(CONTROLLER).c | $(OUTPUT)
$(call msg,CC,$@)
$(Q)$(CC) $(CFLAGS) $(INCLUDES) -c $< -o $@

$(OUTPUT)/$(TARGETS).o: $(TARGETS).c $(APPS) | $(OUTPUT)
$(call msg,CC,$@)
$(Q)$(CC) $(CFLAGS) $(INCLUDES) -c $(filter %.c,$^) -o $@

# Build application binary
$(CONTROLLER): %: $(OUTPUT)/%.o $(COMMON_OBJ) $(LIBBPF_OBJ) | $(OUTPUT)
$(call msg,BINARY,$@)
$(Q)$(CC) $^ $(ALL_LDFLAGS) -lstdc++ -lelf -lz -o $@

$(TARGETS): %: $(OUTPUT)/%.o $(COMMON_OBJ) $(LIBBPF_OBJ) | $(OUTPUT)
$(call msg,BINARY,$@)
$(Q)$(CC) $(CFLAGS) $^ $(ALL_LDFLAGS) -lstdc++ -lelf -lz -o $@
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -21,9 +21,10 @@
#include "cpu_watcher.h"

char LICENSE[] SEC("license") = "Dual BSD/GPL";

const int ctrl_key = 0;
//记录时间戳;
BPF_ARRAY(start,int,u64,1);
BPF_ARRAY(cs_ctrl_map,int,struct cs_ctrl,1);
struct {
__uint(type, BPF_MAP_TYPE_RINGBUF);
__uint(max_entries, 256 * 1024);
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -23,10 +23,11 @@


char LICENSE[] SEC("license") = "Dual BSD/GPL";

const int ctrl_key = 0;
BPF_HASH(send_msg1,pid_t,struct send_events,1024);//记录pid->u_msg_ptr的关系;do_mq_timedsend入参
BPF_HASH(send_msg2,u64,struct send_events,1024);//记录msg->time的关系;
BPF_HASH(rcv_msg1,pid_t,struct rcv_events,1024);//记录pid->u_msg_ptr的关系;do_mq_timedsend入参
BPF_ARRAY(mq_ctrl_map,int,struct mq_ctrl,1);
struct {
__uint(type, BPF_MAP_TYPE_RINGBUF);
__uint(max_entries, 256 * 1024);
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -23,13 +23,19 @@
char LICENSE[] SEC("license") = "Dual BSD/GPL";
#define TASK_RUNNING 0x0000

const int ctrl_key = 0;
BPF_HASH(has_scheduled,struct proc_id, bool, 10240);//记录该进程是否调度过
BPF_HASH(enter_schedule,struct proc_id, struct schedule_event, 10240);//记录该进程上运行队列的时间
BPF_ARRAY(sys_schedule,int,struct sum_schedule,1);//记录整个系统的调度延迟
BPF_ARRAY(threshold_schedule,int,struct proc_schedule,10240);//记录每个进程的调度延迟
BPF_ARRAY(schedule_ctrl_map,int,struct schedule_ctrl,1);

SEC("tp_btf/sched_wakeup")
int BPF_PROG(sched_wakeup, struct task_struct *p) {
struct schedule_ctrl *sched_ctrl;
sched_ctrl = bpf_map_lookup_elem(&schedule_ctrl_map,&ctrl_key);
if(!sched_ctrl || !sched_ctrl->schedule_func)
return 0;
pid_t pid = p->pid;
int cpu = bpf_get_smp_processor_id();
struct schedule_event *schedule_event;
Expand All @@ -56,6 +62,10 @@ int BPF_PROG(sched_wakeup, struct task_struct *p) {

SEC("tp_btf/sched_wakeup_new")
int BPF_PROG(sched_wakeup_new, struct task_struct *p) {
struct schedule_ctrl *sched_ctrl;
sched_ctrl = bpf_map_lookup_elem(&schedule_ctrl_map,&ctrl_key);
if(!sched_ctrl || !sched_ctrl->schedule_func)
return 0;
pid_t pid = p->pid;
int cpu = bpf_get_smp_processor_id();
struct proc_id id= {};
Expand All @@ -76,6 +86,11 @@ int BPF_PROG(sched_wakeup_new, struct task_struct *p) {

SEC("tp_btf/sched_switch")
int BPF_PROG(sched_switch, bool preempt, struct task_struct *prev, struct task_struct *next) {
struct schedule_ctrl *sched_ctrl;
sched_ctrl = bpf_map_lookup_elem(&schedule_ctrl_map,&ctrl_key);
if(!sched_ctrl || !sched_ctrl->schedule_func)
return 0;

u64 current_time = bpf_ktime_get_ns();
pid_t prev_pid = prev->pid;
unsigned int prev_state = prev->__state;
Expand Down Expand Up @@ -162,6 +177,11 @@ int BPF_PROG(sched_switch, bool preempt, struct task_struct *prev, struct task_s

SEC("tracepoint/sched/sched_process_exit")
int sched_process_exit(void *ctx) {
struct schedule_ctrl *sched_ctrl;
sched_ctrl = bpf_map_lookup_elem(&schedule_ctrl_map,&ctrl_key);
if(!sched_ctrl || !sched_ctrl->schedule_func)
return 0;

struct task_struct *p = (struct task_struct *)bpf_get_current_task();
pid_t pid = BPF_CORE_READ(p, pid);
int cpu = bpf_get_smp_processor_id();
Expand Down
250 changes: 250 additions & 0 deletions eBPF_Supermarket/CPU_Subsystem/cpu_watcher/controller.c
Original file line number Diff line number Diff line change
@@ -0,0 +1,250 @@
// Copyright 2023 The LMP Authors.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// https://github.com/linuxkerneltravel/lmp/blob/develop/LICENSE
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
//
// author: [email protected] [email protected] [email protected]
//
// used to control the execution of proc_image tool
#include <stdio.h>
#include <stdbool.h>
#include <argp.h>
#include <stdlib.h>
#include <unistd.h>
#include <time.h>
#include <signal.h>
#include <bpf/libbpf.h>
#include <bpf/bpf.h>
#include "cpu_watcher_helper.h"

static struct env {
// 1代表activate;2代表unactivate;3代表finish
int usemode;
bool SAR;
bool CS_DELAY;
bool SYSCALL_DELAY;
bool MIN_US_SET;
int MIN_US;
bool PREEMPT;
bool SCHEDULE_DELAY;
bool MQ_DELAY;
int freq;
} env = {
.usemode = 0,
.SAR = false,
.CS_DELAY = false,
.SYSCALL_DELAY = false,
.MIN_US_SET = false,
.MIN_US = 10000,
.PREEMPT = false,
.SCHEDULE_DELAY = false,
.MQ_DELAY = false,
.freq = 99,
};

const char argp_program_doc[] ="Trace process to get cpu watcher.\n";

static const struct argp_option opts[] = {
{ "activate", 'a', NULL, 0, "Set startup policy of proc_image tool" },
{ "unactivate", 'u', NULL, 0, "Initialize to the original unactivated state" },
{ "finish", 'f', NULL, 0, "Finish to run eBPF tool" },
{"libbpf_sar", 's', 0, 0, "Print sar_info (the data of cpu)" },
{"cs_delay", 'c', 0, 0, "Print cs_delay (the data of cpu)" },
{"syscall_delay", 'S', 0, 0, "Print syscall_delay (the data of syscall)" },
{"preempt_time", 'p', 0, 0, "Print preempt_time (the data of preempt_schedule)" },
{"schedule_delay", 'd', 0, 0, "Print schedule_delay (the data of cpu)" },
{"schedule_delay_min_us_set", 'e', "THRESHOLD", 0, "Print scheduling delays that exceed the threshold (the data of cpu)" },
{"mq_delay", 'm', 0, 0, "Print mq_delay(the data of proc)" },
// { "pid", 'p', "PID", 0, "Process ID to trace" },
// { "tgid", 'P', "TGID", 0, "Thread group to trace" },
// { "cpuid", 'c', "CPUID", 0, "Set For Tracing per-CPU Process(other processes don't need to set this parameter)" },
// { "time", 't', "TIME-SEC", 0, "Max Running Time(0 for infinite)" },
// { "myproc", 'm', NULL, 0, "Trace the process of the tool itself (not tracked by default)" },
// { "resource", 'r', NULL, 0, "Collects resource usage information about processes" },
// { "keytime", 'k', "KEYTIME", 0, "Collects keytime information about processes(0:except CPU kt_info,1:all kt_info,any 0 or 1 when deactivated)" },
// { "lock", 'l', NULL, 0, "Collects lock information about processes" },
// { "syscall", 's', "SYSCALLS", 0, "Collects syscall sequence (1~50) information about processes(any 1~50 when deactivated)" },
// { "schedule", 'S', NULL, 0, "Collects schedule information about processes (trace tool process)" },
{ NULL, 'h', NULL, OPTION_HIDDEN, "show the full help" },
{},
};

static error_t parse_arg(int key, char *arg, struct argp_state *state)
{
switch (key) {
case 'a':
env.usemode = 1;
break;
case 'u':
env.usemode = 2;
break;
case 'f':
env.usemode = 3;
break;
case 's':
env.SAR = true;
break;
case 'c':
env.CS_DELAY = true;
break;
case 'S':
env.SYSCALL_DELAY = true;
break;
case 'p':
env.PREEMPT = true;
break;
case 'd':
env.SCHEDULE_DELAY = true;
break;
case 'e':
env.MIN_US_SET = true;
if (arg) {
env.MIN_US = strtol(arg, NULL, 10);
if (env.MIN_US <= 0) {
fprintf(stderr, "Invalid value for min_us: %d\n", env.MIN_US);
argp_usage(state);
}
} else {
env.MIN_US = 10000;
}
break;
case 'm':
env.MQ_DELAY = true;
break;
case 'h':
argp_state_help(state, stderr, ARGP_HELP_STD_HELP);
break;
default:
return ARGP_ERR_UNKNOWN;
}

return 0;
}

int deactivate_mode(){
int err;

if(env.SAR){
struct sar_ctrl sar_ctrl = {false,0};
err = update_sar_ctrl_map(sar_ctrl);
if(err < 0) return err;
}
if(env.CS_DELAY){
struct cs_ctrl cs_ctrl = {false,0};
err = update_cs_ctrl_map(cs_ctrl);
if(err < 0) return err;
}
if(env.SYSCALL_DELAY){
struct sc_ctrl sc_ctrl = {false,0};
err = update_sc_ctrl_map(sc_ctrl);
if(err < 0) return err;
}
if(env.PREEMPT){
struct preempt_ctrl preempt_ctrl = {false,0};
err = update_preempt_ctrl_map(preempt_ctrl);
if(err < 0) return err;
}
if(env.SCHEDULE_DELAY){
struct schedule_ctrl schedule_ctrl = {false,false,10000,0};
err = update_schedule_ctrl_map(schedule_ctrl);
if(err < 0) return err;
}
if(env.MQ_DELAY){
struct mq_ctrl mq_ctrl = {false,0};
err = update_mq_ctrl_map(mq_ctrl);
if(err < 0) return err;
}
return 0;
}

static void sig_handler(int signo)
{
deactivate_mode();
}

int main(int argc, char **argv)
{
int err;
static const struct argp argp = {
.options = opts,
.parser = parse_arg,
.doc = argp_program_doc,
};

err = argp_parse(&argp, argc, argv, 0, NULL, NULL);
if (err)
return err;

signal(SIGALRM,sig_handler);
signal(SIGINT,sig_handler);
signal(SIGTERM,sig_handler);

if(env.usemode == 1){ // activate mode
if(env.SAR){
struct sar_ctrl sar_ctrl = {true,SAR_WACTHER};
err = update_sar_ctrl_map(sar_ctrl);
if(err < 0) return err;
}

if(env.CS_DELAY){
struct cs_ctrl cs_ctrl = {true,CS_WACTHER};
err = update_cs_ctrl_map(cs_ctrl);
if(err < 0) return err;
}

if(env.SYSCALL_DELAY){
struct sc_ctrl sc_ctrl = {true,SC_WACTHER};
err = update_sc_ctrl_map(sc_ctrl);
if(err < 0) return err;
}

if(env.PREEMPT){
struct preempt_ctrl preempt_ctrl = {true,PREEMPT_WACTHER};
err = update_preempt_ctrl_map(preempt_ctrl);
if(err < 0) return err;
}

if(env.SCHEDULE_DELAY){
/*
*1.未设置env.MIN_US_SET时, prev_watcher = SCHEDULE_WACTHER + 0;输出方式为schedule输出
*2.已设置env.MIN_US_SET时, prev_watcher = SCHEDULE_WACTHER + 1;输出方式为-e输出
*/
struct schedule_ctrl schedule_ctrl = {true,env.MIN_US_SET,env.MIN_US,SCHEDULE_WACTHER+env.MIN_US_SET};
err = update_schedule_ctrl_map(schedule_ctrl);
if(err < 0) return err;
}

if(env.MQ_DELAY){
struct mq_ctrl mq_ctrl = {true,MQ_WACTHER};
err = update_mq_ctrl_map(mq_ctrl);
if(err < 0) return err;
}
}else if(env.usemode == 2){ // deactivate mode
err = deactivate_mode();
if(err<0){
fprintf(stderr, "Failed to deactivate\n");
return err;
}
}else if(env.usemode == 3){ // finish mode
const char *command = "pkill cpu_watcher";
int status = system(command);
if (status == -1) {
perror("system");
}
}else{
// 输出help信息
printf("Please enter the usage mode(activate/deactivate/finish) before selecting the function\n");
argp_help(&argp, stderr, ARGP_HELP_LONG, argv[0]);
}

return 0;
}
Loading

0 comments on commit 2df6e9d

Please sign in to comment.