drm/amdgpu: Add reset control handling to reset workflow

This prefers reset control based handling if it's implemented for a particular ASIC. If not, it takes the legacy path. It uses the legacy method of preparing the environment (job, scheduler tasks) and restoring the environment.

v2: remove unused variable (Alex)

Signed-off-by: Lijo Lazar <lijo.lazar@amd.com>
Reviewed-by: Feifei Xu <Feifei.Xu@amd.com>
Reviewed-by: Hawking Zhang <Hawking.Zhang@amd.com>
Signed-off-by: Alex Deucher <alexander.deucher@amd.com>
author: Lijo Lazar <lijo.lazar@amd.com> 2021-03-16 20:31:51 +0800
committer: Alex Deucher <alexander.deucher@amd.com> 2021-04-09 16:46:14 -0400
commit: 04442bf70debb197d4ed4e850aa77213e685b352 (patch)
tree: 17774997a6f4edbe8aa5675d98f07432578ea57a /drivers/gpu/drm/amd/amdgpu/amdgpu_drv.c
parent: e071dce38f0a3acb2f6d019c6bb7933fd20d3357 (diff)
download: linux-stable-04442bf70debb197d4ed4e850aa77213e685b352.tar.gz
linux-stable-04442bf70debb197d4ed4e850aa77213e685b352.tar.bz2
linux-stable-04442bf70debb197d4ed4e850aa77213e685b352.zip
1 files changed, 14 insertions, 3 deletions
diff --git a/drivers/gpu/drm/amd/amdgpu/amdgpu_drv.c b/drivers/gpu/drm/amd/amdgpu/amdgpu_drv.c
index 0e10c3958f94..d8f131ed10cb 100644
--- a/drivers/gpu/drm/amd/amdgpu/amdgpu_drv.c
+++ b/drivers/gpu/drm/amd/amdgpu/amdgpu_drv.c
@@ -47,6 +47,7 @@
 
 #include "amdgpu_ras.h"
 #include "amdgpu_xgmi.h"
+#include "amdgpu_reset.h"
 
 /*
  * KMS wrapper.
@@ -1349,7 +1350,9 @@ static void amdgpu_drv_delayed_reset_work_handler(struct work_struct *work)
 	struct list_head device_list;
 	struct amdgpu_device *adev;
 	int i, r;
-	bool need_full_reset = true;
+	struct amdgpu_reset_context reset_context;
+
+	memset(&reset_context, 0, sizeof(reset_context));
 
 	mutex_lock(&mgpu_info.mutex);
 	if (mgpu_info.pending_reset == true) {
@@ -1359,9 +1362,14 @@ static void amdgpu_drv_delayed_reset_work_handler(struct work_struct *work)
 	mgpu_info.pending_reset = true;
 	mutex_unlock(&mgpu_info.mutex);
 
+	/* Use a common context, just need to make sure full reset is done */
+	reset_context.method = AMD_RESET_METHOD_NONE;
+	set_bit(AMDGPU_NEED_FULL_RESET, &reset_context.flags);
+
 	for (i = 0; i < mgpu_info.num_dgpu; i++) {
 		adev = mgpu_info.gpu_ins[i].adev;
-		r = amdgpu_device_pre_asic_reset(adev, NULL, &need_full_reset);
+		reset_context.reset_req_dev = adev;
+		r = amdgpu_device_pre_asic_reset(adev, &reset_context);
 		if (r) {
 			dev_err(adev->dev, "GPU pre asic reset failed with err, %d for drm dev, %s ",
 				r, adev_to_drm(adev)->unique);
@@ -1388,7 +1396,10 @@ static void amdgpu_drv_delayed_reset_work_handler(struct work_struct *work)
 	list_for_each_entry(adev, &device_list, reset_list)
 		amdgpu_unregister_gpu_instance(adev);
 
-	r = amdgpu_do_asic_reset(NULL, &device_list, &need_full_reset, true);
+	/* Use a common context, just need to make sure full reset is done */
+	set_bit(AMDGPU_SKIP_HW_RESET, &reset_context.flags);
+	r = amdgpu_do_asic_reset(&device_list, &reset_context);
+
 	if (r) {
 		DRM_ERROR("reinit gpus failure");
 		return;
author	Lijo Lazar <lijo.lazar@amd.com>	2021-03-16 20:31:51 +0800
committer	Alex Deucher <alexander.deucher@amd.com>	2021-04-09 16:46:14 -0400
commit	04442bf70debb197d4ed4e850aa77213e685b352 (patch)
tree	17774997a6f4edbe8aa5675d98f07432578ea57a /drivers/gpu/drm/amd/amdgpu/amdgpu_drv.c
parent	e071dce38f0a3acb2f6d019c6bb7933fd20d3357 (diff)
download	linux-stable-04442bf70debb197d4ed4e850aa77213e685b352.tar.gz linux-stable-04442bf70debb197d4ed4e850aa77213e685b352.tar.bz2 linux-stable-04442bf70debb197d4ed4e850aa77213e685b352.zip