synchronize_rcu() may take several ms, which noticeably slows down
applications closing the SMI event handle. Use call_rcu() to free
client->fifo and client asynchronously, eliminating the synchronize_rcu()
call in the user thread.
Signed-off-by: Philip Yang <Philip.Yang@amd.com>
Reviewed-by: Felix Kuehling <Felix.Kuehling@amd.com>
Signed-off-by: Alex Deucher <alexander.deucher@amd.com>
        uint64_t events;
        struct kfd_dev *dev;
        spinlock_t lock;
+       struct rcu_head rcu;
        pid_t pid;
        bool suser;
 };
        return sizeof(events);
 }
 
+static void kfd_smi_ev_client_free(struct rcu_head *p) /* call_rcu() callback */
+{
+       struct kfd_smi_client *ev = container_of(p, struct kfd_smi_client, rcu);
+
+       kfifo_free(&ev->fifo);  /* p is the client's embedded rcu member; free its fifo first */
+       kfree(ev);              /* then free the client that contained the fifo */
+}
+
 static int kfd_smi_ev_release(struct inode *inode, struct file *filep)
 {
        struct kfd_smi_client *client = filep->private_data;
        list_del_rcu(&client->list);
        spin_unlock(&dev->smi_lock);
 
-       synchronize_rcu();
-       kfifo_free(&client->fifo);
-       kfree(client);
-
+       call_rcu(&client->rcu, kfd_smi_ev_client_free);
        return 0;
 }