www.infradead.org Git - users/hch/misc.git/commitdiff
drm/amdkfd: debugfs hang_hws skip GPU with MES
author: Philip Yang <Philip.Yang@amd.com>
Mon, 10 Feb 2025 14:42:31 +0000 (09:42 -0500)
committer: Alex Deucher <alexander.deucher@amd.com>
Thu, 27 Feb 2025 21:50:05 +0000 (16:50 -0500)
The debugfs hang_hws interface is used by the GPU reset test with HWS. On
GPUs with MES this crashes the kernel with a NULL pointer access, because
dqm->packet_mgr is not set up for the MES path.

Skip GPUs with MES for now; the MES hang_hws debugfs interface will be
supported later.

Signed-off-by: Philip Yang <Philip.Yang@amd.com>
Reviewed-by: Kent Russell <kent.russell@amd.com>
Reviewed-by: Felix Kuehling <felix.kuehling@amd.com>
Signed-off-by: Alex Deucher <alexander.deucher@amd.com>
drivers/gpu/drm/amd/amdkfd/kfd_device.c

index 095e73790dc483e83bc93fc3a0eabc81ba202356..b9c82be6ce134f37ff427264a0d97ee0e6045ea5 100644 (file)
@@ -1604,6 +1604,11 @@ int kfd_debugfs_hang_hws(struct kfd_node *dev)
                return -EINVAL;
        }
 
+       if (dev->kfd->shared_resources.enable_mes) {
+               dev_err(dev->adev->dev, "Inducing MES hang is not supported\n");
+               return -EINVAL;
+       }
+
        return dqm_debugfs_hang_hws(dev->dqm);
 }