|
Hannes Reinecke |
382417 |
From: Keith Busch <kbusch@kernel.org>
|
|
Hannes Reinecke |
382417 |
Date: Thu, 9 Sep 2021 08:54:52 -0700
|
|
Hannes Reinecke |
382417 |
Subject: [PATCH] nvme-tcp: fix io_work priority inversion
|
|
Hannes Reinecke |
382417 |
Git-commit: 70f437fb4395ad4d1d16fab9a1ad9fbc9fc0579b
|
|
Hannes Reinecke |
382417 |
Patch-mainline: v5.15-rc1
|
|
Hannes Reinecke |
382417 |
References: git-fixes
|
|
Hannes Reinecke |
382417 |
|
|
Hannes Reinecke |
382417 |
Dispatching requests inline with the .queue_rq() call may block while
|
|
Hannes Reinecke |
382417 |
holding the send_mutex. If the tcp io_work also happens to schedule, it
|
|
Hannes Reinecke |
382417 |
may see the req_list is non-empty, leaving "pending" true and remaining
|
|
Hannes Reinecke |
382417 |
in TASK_RUNNING. Since io_work is of higher scheduling priority, the
|
|
Hannes Reinecke |
382417 |
.queue_rq task may not get a chance to run, blocking forward progress
|
|
Hannes Reinecke |
382417 |
and leading to io timeouts.
|
|
Hannes Reinecke |
382417 |
|
|
Hannes Reinecke |
382417 |
Instead of checking for pending requests within io_work, let the queueing
|
|
Hannes Reinecke |
382417 |
restart io_work outside the send_mutex lock if there is more work to be
|
|
Hannes Reinecke |
382417 |
done.
|
|
Hannes Reinecke |
382417 |
|
|
Hannes Reinecke |
382417 |
Fixes: a0fdd1418007f ("nvme-tcp: rerun io_work if req_list is not empty")
|
|
Hannes Reinecke |
382417 |
Reported-by: Samuel Jones <sjones@kalrayinc.com>
|
|
Hannes Reinecke |
382417 |
Signed-off-by: Keith Busch <kbusch@kernel.org>
|
|
Hannes Reinecke |
382417 |
Reviewed-by: Sagi Grimberg <sagi@grimberg.me>
|
|
Hannes Reinecke |
382417 |
Signed-off-by: Christoph Hellwig <hch@lst.de>
|
|
Hannes Reinecke |
382417 |
Acked-by: Hannes Reinecke <hare@suse.com>
|
|
Hannes Reinecke |
382417 |
---
|
|
Hannes Reinecke |
382417 |
drivers/nvme/host/tcp.c | 20 ++++++++++----------
|
|
Hannes Reinecke |
382417 |
1 file changed, 10 insertions(+), 10 deletions(-)
|
|
Hannes Reinecke |
382417 |
|
|
Hannes Reinecke |
382417 |
diff --git a/drivers/nvme/host/tcp.c b/drivers/nvme/host/tcp.c
|
|
Hannes Reinecke |
382417 |
index e2ab12f3f51c..e4249b7dc056 100644
|
|
Hannes Reinecke |
382417 |
--- a/drivers/nvme/host/tcp.c
|
|
Hannes Reinecke |
382417 |
+++ b/drivers/nvme/host/tcp.c
|
|
Hannes Reinecke |
382417 |
@@ -274,6 +274,12 @@ static inline void nvme_tcp_send_all(struct nvme_tcp_queue *queue)
|
|
Hannes Reinecke |
382417 |
} while (ret > 0);
|
|
Hannes Reinecke |
382417 |
}
|
|
Hannes Reinecke |
382417 |
|
|
Hannes Reinecke |
382417 |
+static inline bool nvme_tcp_queue_more(struct nvme_tcp_queue *queue)
|
|
Hannes Reinecke |
382417 |
+{
|
|
Hannes Reinecke |
382417 |
+ return !list_empty(&queue->send_list) ||
|
|
Hannes Reinecke |
382417 |
+ !llist_empty(&queue->req_list) || queue->more_requests;
|
|
Hannes Reinecke |
382417 |
+}
|
|
Hannes Reinecke |
382417 |
+
|
|
Hannes Reinecke |
382417 |
static inline void nvme_tcp_queue_request(struct nvme_tcp_request *req,
|
|
Hannes Reinecke |
382417 |
bool sync, bool last)
|
|
Hannes Reinecke |
382417 |
{
|
|
Hannes Reinecke |
382417 |
@@ -294,9 +300,10 @@ static inline void nvme_tcp_queue_request(struct nvme_tcp_request *req,
|
|
Hannes Reinecke |
382417 |
nvme_tcp_send_all(queue);
|
|
Hannes Reinecke |
382417 |
queue->more_requests = false;
|
|
Hannes Reinecke |
382417 |
mutex_unlock(&queue->send_mutex);
|
|
Hannes Reinecke |
382417 |
- } else if (last) {
|
|
Hannes Reinecke |
382417 |
- queue_work_on(queue->io_cpu, nvme_tcp_wq, &queue->io_work);
|
|
Hannes Reinecke |
382417 |
}
|
|
Hannes Reinecke |
382417 |
+
|
|
Hannes Reinecke |
382417 |
+ if (last && nvme_tcp_queue_more(queue))
|
|
Hannes Reinecke |
382417 |
+ queue_work_on(queue->io_cpu, nvme_tcp_wq, &queue->io_work);
|
|
Hannes Reinecke |
382417 |
}
|
|
Hannes Reinecke |
382417 |
|
|
Hannes Reinecke |
382417 |
static void nvme_tcp_process_req_list(struct nvme_tcp_queue *queue)
|
|
Hannes Reinecke |
382417 |
@@ -906,12 +913,6 @@ static void nvme_tcp_state_change(struct sock *sk)
|
|
Hannes Reinecke |
382417 |
read_unlock_bh(&sk->sk_callback_lock);
|
|
Hannes Reinecke |
382417 |
}
|
|
Hannes Reinecke |
382417 |
|
|
Hannes Reinecke |
382417 |
-static inline bool nvme_tcp_queue_more(struct nvme_tcp_queue *queue)
|
|
Hannes Reinecke |
382417 |
-{
|
|
Hannes Reinecke |
382417 |
- return !list_empty(&queue->send_list) ||
|
|
Hannes Reinecke |
382417 |
- !llist_empty(&queue->req_list) || queue->more_requests;
|
|
Hannes Reinecke |
382417 |
-}
|
|
Hannes Reinecke |
382417 |
-
|
|
Hannes Reinecke |
382417 |
static inline void nvme_tcp_done_send_req(struct nvme_tcp_queue *queue)
|
|
Hannes Reinecke |
382417 |
{
|
|
Hannes Reinecke |
382417 |
queue->request = NULL;
|
|
Hannes Reinecke |
382417 |
@@ -1145,8 +1146,7 @@ static void nvme_tcp_io_work(struct work_struct *w)
|
|
Hannes Reinecke |
382417 |
pending = true;
|
|
Hannes Reinecke |
382417 |
else if (unlikely(result < 0))
|
|
Hannes Reinecke |
382417 |
break;
|
|
Hannes Reinecke |
382417 |
- } else
|
|
Hannes Reinecke |
382417 |
- pending = !llist_empty(&queue->req_list);
|
|
Hannes Reinecke |
382417 |
+ }
|
|
Hannes Reinecke |
382417 |
|
|
Hannes Reinecke |
382417 |
result = nvme_tcp_try_recv(queue);
|
|
Hannes Reinecke |
382417 |
if (result > 0)
|
|
Hannes Reinecke |
382417 |
--
|
|
Hannes Reinecke |
382417 |
2.29.2
|
|
Hannes Reinecke |
382417 |
|