]> www.infradead.org Git - users/jedix/linux-maple.git/commitdiff
aio: add aio support for iov_iter arguments
authorZach Brown <zach.brown@oracle.com>
Fri, 22 Oct 2010 19:24:24 +0000 (12:24 -0700)
committerDave Kleikamp <dave.kleikamp@oracle.com>
Fri, 13 Jan 2012 00:16:00 +0000 (18:16 -0600)
This adds iocb cmds which specify that memory is held in iov_iter
structures.  This lets kernel callers specify memory that can be
expressed in an iov_iter, which includes pages in bio_vec arrays.

Only kernel callers can provide an iov_iter so it doesn't make a lot of
sense to expose the IOCB_CMD values for this as part of the user space
ABI.

But kernel callers should also be able to perform the usual aio
operations which suggests using the the existing operation namespace and
support code.

Hrmph.

Signed-off-by: Zach Brown <zach.brown@oracle.com>
fs/aio.c
include/linux/aio.h
include/linux/aio_abi.h

index 376cca91ce5ac7b942ad844a5d3e5170611488b8..a2a6a070d3d934d9f20c2d33d928c9f6f39428b5 100644 (file)
--- a/fs/aio.c
+++ b/fs/aio.c
@@ -1422,6 +1422,26 @@ static ssize_t aio_setup_single_vector(struct kiocb *kiocb)
        return 0;
 }
 
+static ssize_t aio_read_iter(struct kiocb *iocb)
+{
+       struct file *file = iocb->ki_filp;
+       ssize_t ret = -EINVAL;
+
+       if (file->f_op->read_iter)
+               ret = file->f_op->read_iter(iocb, iocb->ki_iter, iocb->ki_pos);
+       return ret;
+}
+
+static ssize_t aio_write_iter(struct kiocb *iocb)
+{
+       struct file *file = iocb->ki_filp;
+       ssize_t ret = -EINVAL;
+
+       if (file->f_op->write_iter)
+               ret = file->f_op->write_iter(iocb, iocb->ki_iter, iocb->ki_pos);
+       return ret;
+}
+
 /*
  * aio_setup_iocb:
  *     Performs the initial checks and aio retry method
@@ -1497,6 +1517,34 @@ static ssize_t aio_setup_iocb(struct kiocb *kiocb, bool compat)
                if (file->f_op->aio_write)
                        kiocb->ki_retry = aio_rw_vect_retry;
                break;
+       case IOCB_CMD_READ_ITER:
+               ret = -EINVAL;
+               if (unlikely(!is_kernel_kiocb(kiocb)))
+                       break;
+               ret = -EBADF;
+               if (unlikely(!(file->f_mode & FMODE_READ)))
+                       break;
+               ret = security_file_permission(file, MAY_READ);
+               if (unlikely(ret))
+                       break;
+               ret = -EINVAL;
+               if (file->f_op->read_iter)
+                       kiocb->ki_retry = aio_read_iter;
+               break;
+       case IOCB_CMD_WRITE_ITER:
+               ret = -EINVAL;
+               if (unlikely(!is_kernel_kiocb(kiocb)))
+                       break;
+               ret = -EBADF;
+               if (unlikely(!(file->f_mode & FMODE_WRITE)))
+                       break;
+               ret = security_file_permission(file, MAY_WRITE);
+               if (unlikely(ret))
+                       break;
+               ret = -EINVAL;
+               if (file->f_op->write_iter)
+                       kiocb->ki_retry = aio_write_iter;
+               break;
        case IOCB_CMD_FDSYNC:
                ret = -EINVAL;
                if (file->f_op->aio_fsync)
@@ -1563,6 +1611,22 @@ void aio_kernel_init_rw(struct kiocb *iocb, struct file *filp,
 }
 EXPORT_SYMBOL_GPL(aio_kernel_init_rw);
 
+/*
+ * The iter count must be set before calling here.  Some filesystems uses
+ * iocb->ki_left as an indicator of the size of an IO.
+ */
+void aio_kernel_init_iter(struct kiocb *iocb, struct file *filp,
+                         unsigned short op, struct iov_iter *iter, loff_t off)
+{
+       iocb->ki_filp = filp;
+       iocb->ki_iter = iter;
+       iocb->ki_opcode = op;
+       iocb->ki_pos = off;
+       iocb->ki_nbytes = iov_iter_count(iter);
+       iocb->ki_left = iocb->ki_nbytes;
+}
+EXPORT_SYMBOL_GPL(aio_kernel_init_iter);
+
 void aio_kernel_init_callback(struct kiocb *iocb,
                              void (*complete)(u64 user_data, long res),
                              u64 user_data)
index 6a7be9e9d0e9c9d3b7ee2d369e8fd31a4ae4ccd5..002a90adb751e0b8e224c4d90da2ea8755c8d24e 100644 (file)
@@ -125,6 +125,7 @@ struct kiocb {
         * this is the underlying eventfd context to deliver events to.
         */
        struct eventfd_ctx      *ki_eventfd;
+       struct iov_iter         *ki_iter;
 };
 
 #define is_sync_kiocb(iocb)    ((iocb)->ki_key == KIOCB_SYNC_KEY)
@@ -221,6 +222,8 @@ struct kiocb *aio_kernel_alloc(gfp_t gfp);
 void aio_kernel_free(struct kiocb *iocb);
 void aio_kernel_init_rw(struct kiocb *iocb, struct file *filp,
                        unsigned short op, void *ptr, size_t nr, loff_t off);
+void aio_kernel_init_iter(struct kiocb *iocb, struct file *filp,
+                         unsigned short op, struct iov_iter *iter, loff_t off);
 void aio_kernel_init_callback(struct kiocb *iocb,
                              void (*complete)(u64 user_data, long res),
                              u64 user_data);
index 2c8731664180242ad95fa91cfb2b8e6d11f90b78..2c97a2ded6f7f2bd40b3238b26e46eaa4fbd7d25 100644 (file)
@@ -44,6 +44,8 @@ enum {
        IOCB_CMD_NOOP = 6,
        IOCB_CMD_PREADV = 7,
        IOCB_CMD_PWRITEV = 8,
+       IOCB_CMD_READ_ITER = 9,
+       IOCB_CMD_WRITE_ITER = 10,
 };
 
 /*