[PATCH v2] io_uring: Statistics of the true utilization of sq threads.

From: Xiaobing Li
Date: Wed Nov 08 2023 - 03:15:39 EST


The sq thread runs in a while(1) loop. Within that loop there may be a
lot of time during which it is not processing IO but the timeout period
has not yet been exceeded, so the sqpoll thread keeps running and keeps
occupying the CPU. Obviously, that CPU time is wasted. Our goal is to
count the portion of time in which the sqpoll thread actually processes
IO, so as to reflect the share of the CPU it uses to process IO. This
can be used to help improve the actual utilization of the CPU in the
future.

Signed-off-by: Xiaobing Li <xiaobing.li@xxxxxxxxxxx>

v1 -> v2: Added method to query data.

The test results are as follows:
cat /proc/11440/fdinfo/6
pos: 0
flags: 02000002
mnt_id: 16
ino: 94449
SqMask: 0xf
SqHead: 1845170
SqTail: 1845170
CachedSqHead: 1845170
CqMask: 0xf
CqHead: 1845154
CqTail: 1845154
CachedCqTail: 1845154
SQEs: 0
CQEs: 0
SqThread: -1
SqThreadCpu: -1
UserFiles: 1
UserBufs: 0
PollList:
CqOverflowList:
PID: 11440
work: 18794
total: 19123

---
io_uring/fdinfo.c | 6 ++++++
io_uring/sqpoll.c | 8 ++++++++
io_uring/sqpoll.h | 2 ++
3 files changed, 16 insertions(+)

diff --git a/io_uring/fdinfo.c b/io_uring/fdinfo.c
index f04a43044d91..f0b79c533062 100644
--- a/io_uring/fdinfo.c
+++ b/io_uring/fdinfo.c
@@ -213,6 +213,12 @@ __cold void io_uring_show_fdinfo(struct seq_file *m, struct file *f)

}

+ if (ctx->sq_data) {
+ seq_printf(m, "PID:\t%d\n", task_pid_nr(ctx->sq_data->thread));
+ seq_printf(m, "work:\t%lu\n", ctx->sq_data->work);
+ seq_printf(m, "total:\t%lu\n", ctx->sq_data->total);
+ }
+
spin_unlock(&ctx->completion_lock);
}
#endif
diff --git a/io_uring/sqpoll.c b/io_uring/sqpoll.c
index bd6c2c7959a5..c821273406bd 100644
--- a/io_uring/sqpoll.c
+++ b/io_uring/sqpoll.c
@@ -224,6 +224,7 @@ static int io_sq_thread(void *data)
struct io_ring_ctx *ctx;
unsigned long timeout = 0;
char buf[TASK_COMM_LEN];
+ unsigned long start, begin, end;
DEFINE_WAIT(wait);

snprintf(buf, sizeof(buf), "iou-sqp-%d", sqd->task_pid);
@@ -235,6 +236,7 @@ static int io_sq_thread(void *data)
set_cpus_allowed_ptr(current, cpu_online_mask);

mutex_lock(&sqd->lock);
+ start = jiffies;
while (1) {
bool cap_entries, sqt_spin = false;

@@ -245,12 +247,18 @@ static int io_sq_thread(void *data)
}

cap_entries = !list_is_singular(&sqd->ctx_list);
+ begin = jiffies;
list_for_each_entry(ctx, &sqd->ctx_list, sqd_list) {
int ret = __io_sq_thread(ctx, cap_entries);

if (!sqt_spin && (ret > 0 || !wq_list_empty(&ctx->iopoll_list)))
sqt_spin = true;
}
+ end = jiffies;
+ sqd->total = end - start;
+ if (sqt_spin == true)
+ sqd->work += end - begin;
+
if (io_run_task_work())
sqt_spin = true;

diff --git a/io_uring/sqpoll.h b/io_uring/sqpoll.h
index 8df37e8c9149..0aa4e2efa4db 100644
--- a/io_uring/sqpoll.h
+++ b/io_uring/sqpoll.h
@@ -16,6 +16,8 @@ struct io_sq_data {
pid_t task_pid;
pid_t task_tgid;

+ unsigned long work;
+ unsigned long total;
unsigned long state;
struct completion exited;
};
--
2.34.1