drm/amd/pm: Modify mode2 msg sequence on aldebaran
authorLijo Lazar <lijo.lazar@amd.com>
Tue, 16 Mar 2021 11:19:09 +0000 (19:19 +0800)
committerAlex Deucher <alexander.deucher@amd.com>
Fri, 9 Apr 2021 20:45:57 +0000 (16:45 -0400)
v1: During mode2 reset, PCI space is lost after message is sent.
Restore PCI space before waiting for response from firmware.

v2: Move mode2 sequence to aldebaran and update PMFW version.
Handle generic sequence in smu13 without PMFW version check.

Signed-off-by: Lijo Lazar <lijo.lazar@amd.com>
Reviewed-by: Feifei Xu <Feifei.Xu@amd.com>
Reviewed-by: Hawking Zhang <Hawking.Zhang@amd.com>
Signed-off-by: Alex Deucher <alexander.deucher@amd.com>
drivers/gpu/drm/amd/pm/swsmu/smu13/aldebaran_ppt.c
drivers/gpu/drm/amd/pm/swsmu/smu13/smu_v13_0.c
drivers/gpu/drm/amd/pm/swsmu/smu_cmn.c
drivers/gpu/drm/amd/pm/swsmu/smu_cmn.h

index 7d38b92a78dc90ad8567c385c858fcf078af7726..ec485308b921199b18b32f5a72304eeb67188dab 100644 (file)
@@ -1432,6 +1432,57 @@ static ssize_t aldebaran_get_gpu_metrics(struct smu_context *smu,
        return sizeof(struct gpu_metrics_v1_1);
 }
 
+int aldebaran_mode2_reset(struct smu_context *smu)
+{
+       u32 smu_version;
+       int ret = 0, index;
+       struct amdgpu_device *adev = smu->adev;
+       int timeout = 10;
+
+       smu_cmn_get_smc_version(smu, NULL, &smu_version);
+
+       index = smu_cmn_to_asic_specific_index(smu, CMN2ASIC_MAPPING_MSG,
+                                               SMU_MSG_GfxDeviceDriverReset);
+
+       mutex_lock(&smu->message_lock);
+       if (smu_version >= 0x00441400) {
+               ret = smu_cmn_send_msg_without_waiting(smu, (uint16_t)index, SMU_RESET_MODE_2);
+               /* This is similar to FLR, wait till max FLR timeout */
+               msleep(100);
+               dev_dbg(smu->adev->dev, "restore config space...\n");
+               /* Restore the config space saved during init */
+               amdgpu_device_load_pci_state(adev->pdev);
+
+               dev_dbg(smu->adev->dev, "wait for reset ack\n");
+               while (ret == -ETIME && timeout)  {
+                       ret = smu_cmn_wait_for_response(smu);
+                       /* Wait a bit more time for getting ACK */
+                       if (ret == -ETIME) {
+                               --timeout;
+                               usleep_range(500, 1000);
+                               continue;
+                       }
+
+                       if (ret != 1) {
+                               dev_err(adev->dev, "failed to send mode2 message \tparam: 0x%08x response %#x\n",
+                                               SMU_RESET_MODE_2, ret);
+                               goto out;
+                       }
+               }
+
+       } else {
+               dev_err(adev->dev, "smu fw 0x%x does not support MSG_GfxDeviceDriverReset MSG\n",
+                               smu_version);
+       }
+
+       if (ret == 1)
+               ret = 0;
+out:
+       mutex_unlock(&smu->message_lock);
+
+       return ret;
+}
+
 static bool aldebaran_is_mode1_reset_supported(struct smu_context *smu)
 {
 #if 0
@@ -1530,8 +1581,8 @@ static const struct pptable_funcs aldebaran_ppt_funcs = {
        .mode1_reset_is_support = aldebaran_is_mode1_reset_supported,
        .mode2_reset_is_support = aldebaran_is_mode2_reset_supported,
        .mode1_reset = smu_v13_0_mode1_reset,
-       .mode2_reset = smu_v13_0_mode2_reset,
        .set_mp1_state = aldebaran_set_mp1_state,
+       .mode2_reset = aldebaran_mode2_reset,
 };
 
 void aldebaran_set_ppt_funcs(struct smu_context *smu)
index 2e296cb3bb04dd3e372630cfcf51b17e1beefe2a..8974cd55994b162b8cc04db6568557951f623831 100644 (file)
@@ -1376,17 +1376,14 @@ int smu_v13_0_mode1_reset(struct smu_context *smu)
 
 int smu_v13_0_mode2_reset(struct smu_context *smu)
 {
-       u32 smu_version;
-       int ret = 0;
-       struct amdgpu_device *adev = smu->adev;
-       smu_cmn_get_smc_version(smu, NULL, &smu_version);
-       if (smu_version >= 0x00440700)
-               ret = smu_cmn_send_smc_msg_with_param(smu, SMU_MSG_GfxDeviceDriverReset, SMU_RESET_MODE_2, NULL);
-       else
-               dev_err(adev->dev, "smu fw 0x%x does not support MSG_GfxDeviceDriverReset MSG\n", smu_version);
-       /*TODO: mode2 reset wait time should be shorter, will modify it later*/
+       int ret;
+
+       ret = smu_cmn_send_smc_msg_with_param(smu, SMU_MSG_GfxDeviceDriverReset,
+                       SMU_RESET_MODE_2, NULL);
+       /*TODO: mode2 reset wait time should be shorter, add ASIC specific func if required */
        if (!ret)
                msleep(SMU13_MODE1_RESET_WAIT_TIME_IN_MS);
+
        return ret;
 }
 
index 2d216f5b167d6f050eda12cf40329e10e50003dc..b725f263092bacf5927c0776449e47f73a668bc8 100644 (file)
@@ -76,7 +76,7 @@ static void smu_cmn_read_arg(struct smu_context *smu,
        *arg = RREG32_SOC15(MP1, 0, mmMP1_SMN_C2PMSG_82);
 }
 
-static int smu_cmn_wait_for_response(struct smu_context *smu)
+int smu_cmn_wait_for_response(struct smu_context *smu)
 {
        struct amdgpu_device *adev = smu->adev;
        uint32_t cur_value, i, timeout = adev->usec_timeout * 10;
index 155e2a68fa1c7c0b03a7d793a315fb0a76362f5d..da6ff6f024f91bf53c6a1a5d292793ed46cf1fb5 100644 (file)
@@ -37,6 +37,8 @@ int smu_cmn_send_smc_msg(struct smu_context *smu,
                         enum smu_message_type msg,
                         uint32_t *read_arg);
 
+int smu_cmn_wait_for_response(struct smu_context *smu);
+
 int smu_cmn_to_asic_specific_index(struct smu_context *smu,
                                   enum smu_cmn2asic_mapping_type type,
                                   uint32_t index);