]> www.infradead.org Git - users/hch/misc.git/commitdiff
drm/amdgpu: fix nullptr err of vm_handle_moved
authorHeng Zhou <Heng.Zhou@amd.com>
Wed, 13 Aug 2025 03:18:04 +0000 (11:18 +0800)
committerAlex Deucher <alexander.deucher@amd.com>
Fri, 15 Aug 2025 17:04:07 +0000 (13:04 -0400)
If a amdgpu_bo_va is fpriv->prt_va, the bo of this one is always NULL.
So, such kind of amdgpu_bo_va should be updated separately before
amdgpu_vm_handle_moved.

Signed-off-by: Heng Zhou <Heng.Zhou@amd.com>
Reviewed-by: Kasiviswanathan, Harish <Harish.Kasiviswanathan@amd.com>
Signed-off-by: Alex Deucher <alexander.deucher@amd.com>
drivers/gpu/drm/amd/amdgpu/amdgpu_amdkfd_gpuvm.c

index 37d8a7034a7ee561f1b32a83f5f2b81c3ccb9050..d478acb4568a5d4b5556c109e28272064a8c6879 100644 (file)
@@ -2970,9 +2970,22 @@ int amdgpu_amdkfd_gpuvm_restore_process_bos(void *info, struct dma_fence __rcu *
                struct amdgpu_device *adev = amdgpu_ttm_adev(
                        peer_vm->root.bo->tbo.bdev);
 
+               struct amdgpu_fpriv *fpriv =
+                       container_of(peer_vm, struct amdgpu_fpriv, vm);
+
+               ret = amdgpu_vm_bo_update(adev, fpriv->prt_va, false);
+               if (ret) {
+                       dev_dbg(adev->dev,
+                               "Memory eviction: handle PRT moved failed, pid %8d. Try again.\n",
+                               pid_nr(process_info->pid));
+                       goto validate_map_fail;
+               }
+
                ret = amdgpu_vm_handle_moved(adev, peer_vm, &exec.ticket);
                if (ret) {
-                       pr_debug("Memory eviction: handle moved failed. Try again\n");
+                       dev_dbg(adev->dev,
+                               "Memory eviction: handle moved failed, pid %8d. Try again.\n",
+                               pid_nr(process_info->pid));
                        goto validate_map_fail;
                }
        }