]> www.infradead.org Git - users/dwmw2/linux.git/commitdiff
drm/xe/ct: prevent UAF in send_recv()
authorMatthew Auld <matthew.auld@intel.com>
Tue, 1 Oct 2024 08:43:47 +0000 (09:43 +0100)
committerLucas De Marchi <lucas.demarchi@intel.com>
Tue, 8 Oct 2024 23:06:05 +0000 (18:06 -0500)
Ensure we serialize with completion side to prevent UAF with fence going
out of scope on the stack, since we have no clue if it will fire after
the timeout before we can erase from the xa. Also we have some dependent
loads and stores for which we need the correct ordering, and we lack the
needed barriers. Fix this by grabbing the ct->lock after the wait, which
is also held by the completion side.

v2 (Badal):
 - Also print done after acquiring the lock and seeing timeout.

Fixes: dd08ebf6c352 ("drm/xe: Introduce a new DRM driver for Intel GPUs")
Signed-off-by: Matthew Auld <matthew.auld@intel.com>
Cc: Matthew Brost <matthew.brost@intel.com>
Cc: Badal Nilawar <badal.nilawar@intel.com>
Cc: <stable@vger.kernel.org> # v6.8+
Reviewed-by: Badal Nilawar <badal.nilawar@intel.com>
Link: https://patchwork.freedesktop.org/patch/msgid/20241001084346.98516-5-matthew.auld@intel.com
(cherry picked from commit 52789ce35c55ccd30c4b67b9cc5b2af55e0122ea)
Signed-off-by: Lucas De Marchi <lucas.demarchi@intel.com>
drivers/gpu/drm/xe/xe_guc_ct.c

index f24dd52239268c169443cedaf0b04d88b14775c1..79eb8e60137ba76c606f7a38c3e870ba66e3a6f8 100644 (file)
@@ -903,16 +903,26 @@ retry_same_fence:
        }
 
        ret = wait_event_timeout(ct->g2h_fence_wq, g2h_fence.done, HZ);
+
+       /*
+        * Ensure we serialize with completion side to prevent UAF with fence going out of scope on
+        * the stack, since we have no clue if it will fire after the timeout before we can erase
+        * from the xa. Also we have some dependent loads and stores below for which we need the
+        * correct ordering, and we lack the needed barriers.
+        */
+       mutex_lock(&ct->lock);
        if (!ret) {
-               xe_gt_err(gt, "Timed out wait for G2H, fence %u, action %04x",
-                         g2h_fence.seqno, action[0]);
+               xe_gt_err(gt, "Timed out wait for G2H, fence %u, action %04x, done %s",
+                         g2h_fence.seqno, action[0], str_yes_no(g2h_fence.done));
                xa_erase_irq(&ct->fence_lookup, g2h_fence.seqno);
+               mutex_unlock(&ct->lock);
                return -ETIME;
        }
 
        if (g2h_fence.retry) {
                xe_gt_dbg(gt, "H2G action %#x retrying: reason %#x\n",
                          action[0], g2h_fence.reason);
+               mutex_unlock(&ct->lock);
                goto retry;
        }
        if (g2h_fence.fail) {
@@ -921,7 +931,12 @@ retry_same_fence:
                ret = -EIO;
        }
 
-       return ret > 0 ? response_buffer ? g2h_fence.response_len : g2h_fence.response_data : ret;
+       if (ret > 0)
+               ret = response_buffer ? g2h_fence.response_len : g2h_fence.response_data;
+
+       mutex_unlock(&ct->lock);
+
+       return ret;
 }
 
 /**