nvme: fine-tune sending of first keep-alive
authorMark O'Donovan <shiftee@posteo.net>
Fri, 24 Nov 2023 20:56:59 +0000 (20:56 +0000)
committerKeith Busch <kbusch@kernel.org>
Mon, 27 Nov 2023 18:23:13 +0000 (10:23 -0800)
Keep-alive commands are sent half-way through the kato period.
This normally works well but fails when the keep-alive system is
started when we are more than half way through the kato.
This can happen on larger setups or due to host delays.
With this change we now time the initial keep-alive command from
the controller initialisation time, rather than the keep-alive
mechanism activation time.

Signed-off-by: Mark O'Donovan <shiftee@posteo.net>
Reviewed-by: Sagi Grimberg <sagi@grimberg.me>
Signed-off-by: Keith Busch <kbusch@kernel.org>
drivers/nvme/host/core.c

index 46a4c9c5ea9625c7feb11d970ebb95cd4ce8be2b..8bf24c1cd8bba39591de66a30a7a6ad876b58161 100644 (file)
@@ -1192,8 +1192,16 @@ static unsigned long nvme_keep_alive_work_period(struct nvme_ctrl *ctrl)
 
 static void nvme_queue_keep_alive_work(struct nvme_ctrl *ctrl)
 {
-       queue_delayed_work(nvme_wq, &ctrl->ka_work,
-                          nvme_keep_alive_work_period(ctrl));
+       unsigned long now = jiffies;
+       unsigned long delay = nvme_keep_alive_work_period(ctrl);
+       unsigned long ka_next_check_tm = ctrl->ka_last_check_time + delay;
+
+       if (time_after(now, ka_next_check_tm))
+               delay = 0;
+       else
+               delay = ka_next_check_tm - now;
+
+       queue_delayed_work(nvme_wq, &ctrl->ka_work, delay);
 }
 
 static enum rq_end_io_ret nvme_keep_alive_end_io(struct request *rq,
@@ -4471,6 +4479,7 @@ int nvme_init_ctrl(struct nvme_ctrl *ctrl, struct device *dev,
        INIT_DELAYED_WORK(&ctrl->failfast_work, nvme_failfast_work);
        memset(&ctrl->ka_cmd, 0, sizeof(ctrl->ka_cmd));
        ctrl->ka_cmd.common.opcode = nvme_admin_keep_alive;
+       ctrl->ka_last_check_time = jiffies;
 
        BUILD_BUG_ON(NVME_DSM_MAX_RANGES * sizeof(struct nvme_dsm_range) >
                        PAGE_SIZE);