The new VM_BIND UAPI implementation introduced in subsequent commits
will allow asynchronous jobs to process push buffers and emit
fences.
If a fence context is killed, e.g. due to a channel fault, jobs which
are already queued for execution might still emit new fences. In such a
case a job would hang forever.
To fix that, make emitting a new fence on a killed fence context fail
with -ENODEV, which unblocks the job.
Reviewed-by: Dave Airlie <airlied@redhat.com>
Signed-off-by: Danilo Krummrich <dakr@redhat.com>
Link: https://patchwork.freedesktop.org/patch/msgid/20230804182406.5222-9-dakr@redhat.com
                if (nouveau_fence_signal(fence))
                        nvif_event_block(&fctx->event);
        }
+       fctx->killed = 1;
        spin_unlock_irqrestore(&fctx->lock, flags);
 }
 
                dma_fence_get(&fence->base);
                spin_lock_irq(&fctx->lock);
 
+               if (unlikely(fctx->killed)) {
+                       spin_unlock_irq(&fctx->lock);
+                       dma_fence_put(&fence->base);
+                       return -ENODEV;
+               }
+
                if (nouveau_fence_update(chan, fctx))
                        nvif_event_block(&fctx->event);
 
 
        char name[32];
 
        struct nvif_event event;
-       int notify_ref, dead;
+       int notify_ref, dead, killed;
 };
 
 struct nouveau_fence_priv {