#define QPIC_PER_CW_CMD_SGL            32
 #define QPIC_PER_CW_DATA_SGL           8
 
+/*
+ * Flags used in DMA descriptor preparation helper functions
+ * (i.e. read_reg_dma/write_reg_dma/read_data_dma/write_data_dma)
+ */
+/* Don't set the EOT in current tx BAM sgl */
+#define NAND_BAM_NO_EOT                        BIT(0)
+/* Set the NWD flag in current BAM sgl */
+#define NAND_BAM_NWD                   BIT(1)
+/* Finish writing in the current BAM sgl and start writing in another BAM sgl */
+#define NAND_BAM_NEXT_SGL              BIT(2)
+
 /*
  * This data type corresponds to the BAM transaction which will be used for all
  * NAND transfers.
  *
  * @first:             offset of the first register in the contiguous block
  * @num_regs:          number of registers to read
+ * @flags:             flags to control DMA descriptor preparation
  */
 static int read_reg_dma(struct qcom_nand_controller *nandc, int first,
-                       int num_regs)
+                       int num_regs, unsigned int flags)
 {
        bool flow_control = false;
        void *vaddr;
  *
  * @first:             offset of the first register in the contiguous block
  * @num_regs:          number of registers to write
+ * @flags:             flags to control DMA descriptor preparation
  */
 static int write_reg_dma(struct qcom_nand_controller *nandc, int first,
-                        int num_regs)
+                        int num_regs, unsigned int flags)
 {
        bool flow_control = false;
        struct nandc_regs *regs = nandc->regs;
        if (first == NAND_FLASH_CMD)
                flow_control = true;
 
+       if (first == NAND_EXEC_CMD)
+               flags |= NAND_BAM_NWD;
+
        if (first == NAND_DEV_CMD1_RESTORE)
                first = NAND_DEV_CMD1;
 
  * @reg_off:           offset within the controller's data buffer
  * @vaddr:             virtual address of the buffer we want to write to
  * @size:              DMA transaction size in bytes
+ * @flags:             flags to control DMA descriptor preparation
  */
 static int read_data_dma(struct qcom_nand_controller *nandc, int reg_off,
-                        const u8 *vaddr, int size)
+                        const u8 *vaddr, int size, unsigned int flags)
 {
        return prep_adm_dma_desc(nandc, true, reg_off, vaddr, size, false);
 }
  * @reg_off:           offset within the controller's data buffer
  * @vaddr:             virtual address of the buffer we want to read from
  * @size:              DMA transaction size in bytes
+ * @flags:             flags to control DMA descriptor preparation
  */
 static int write_data_dma(struct qcom_nand_controller *nandc, int reg_off,
-                         const u8 *vaddr, int size)
+                         const u8 *vaddr, int size, unsigned int flags)
 {
        return prep_adm_dma_desc(nandc, false, reg_off, vaddr, size, false);
 }
  */
 static void config_nand_page_read(struct qcom_nand_controller *nandc)
 {
-       write_reg_dma(nandc, NAND_ADDR0, 2);
-       write_reg_dma(nandc, NAND_DEV0_CFG0, 3);
-       write_reg_dma(nandc, NAND_EBI2_ECC_BUF_CFG, 1);
+       write_reg_dma(nandc, NAND_ADDR0, 2, 0);
+       write_reg_dma(nandc, NAND_DEV0_CFG0, 3, 0);
+       write_reg_dma(nandc, NAND_EBI2_ECC_BUF_CFG, 1, 0);
 }
 
 /*
  */
 static void config_nand_cw_read(struct qcom_nand_controller *nandc)
 {
-       write_reg_dma(nandc, NAND_FLASH_CMD, 1);
-       write_reg_dma(nandc, NAND_EXEC_CMD, 1);
+       write_reg_dma(nandc, NAND_FLASH_CMD, 1, NAND_BAM_NEXT_SGL);
+       write_reg_dma(nandc, NAND_EXEC_CMD, 1, NAND_BAM_NEXT_SGL);
 
-       read_reg_dma(nandc, NAND_FLASH_STATUS, 2);
-       read_reg_dma(nandc, NAND_ERASED_CW_DETECT_STATUS, 1);
+       read_reg_dma(nandc, NAND_FLASH_STATUS, 2, 0);
+       read_reg_dma(nandc, NAND_ERASED_CW_DETECT_STATUS, 1,
+                    NAND_BAM_NEXT_SGL);
 }
 
 /*
  */
 static void config_nand_page_write(struct qcom_nand_controller *nandc)
 {
-       write_reg_dma(nandc, NAND_ADDR0, 2);
-       write_reg_dma(nandc, NAND_DEV0_CFG0, 3);
-       write_reg_dma(nandc, NAND_EBI2_ECC_BUF_CFG, 1);
+       write_reg_dma(nandc, NAND_ADDR0, 2, 0);
+       write_reg_dma(nandc, NAND_DEV0_CFG0, 3, 0);
+       write_reg_dma(nandc, NAND_EBI2_ECC_BUF_CFG, 1,
+                     NAND_BAM_NEXT_SGL);
 }
 
 /*
  */
 static void config_nand_cw_write(struct qcom_nand_controller *nandc)
 {
-       write_reg_dma(nandc, NAND_FLASH_CMD, 1);
-       write_reg_dma(nandc, NAND_EXEC_CMD, 1);
+       write_reg_dma(nandc, NAND_FLASH_CMD, 1, NAND_BAM_NEXT_SGL);
+       write_reg_dma(nandc, NAND_EXEC_CMD, 1, NAND_BAM_NEXT_SGL);
 
-       read_reg_dma(nandc, NAND_FLASH_STATUS, 1);
+       read_reg_dma(nandc, NAND_FLASH_STATUS, 1, NAND_BAM_NEXT_SGL);
 
-       write_reg_dma(nandc, NAND_FLASH_STATUS, 1);
-       write_reg_dma(nandc, NAND_READ_STATUS, 1);
+       write_reg_dma(nandc, NAND_FLASH_STATUS, 1, 0);
+       write_reg_dma(nandc, NAND_READ_STATUS, 1, NAND_BAM_NEXT_SGL);
 }
 
 /*
        nandc_set_reg(nandc, NAND_DEV_CMD1_RESTORE, nandc->cmd1);
        nandc_set_reg(nandc, NAND_DEV_CMD_VLD_RESTORE, nandc->vld);
 
-       write_reg_dma(nandc, NAND_DEV_CMD_VLD, 1);
-       write_reg_dma(nandc, NAND_DEV_CMD1, 1);
+       write_reg_dma(nandc, NAND_DEV_CMD_VLD, 1, 0);
+       write_reg_dma(nandc, NAND_DEV_CMD1, 1, NAND_BAM_NEXT_SGL);
 
        nandc->buf_count = 512;
        memset(nandc->data_buffer, 0xff, nandc->buf_count);
        config_nand_single_cw_page_read(nandc);
 
        read_data_dma(nandc, FLASH_BUF_ACC, nandc->data_buffer,
-                     nandc->buf_count);
+                     nandc->buf_count, 0);
 
        /* restore CMD1 and VLD regs */
-       write_reg_dma(nandc, NAND_DEV_CMD1_RESTORE, 1);
-       write_reg_dma(nandc, NAND_DEV_CMD_VLD_RESTORE, 1);
+       write_reg_dma(nandc, NAND_DEV_CMD1_RESTORE, 1, 0);
+       write_reg_dma(nandc, NAND_DEV_CMD_VLD_RESTORE, 1, NAND_BAM_NEXT_SGL);
 
        return 0;
 }
        nandc_set_reg(nandc, NAND_FLASH_STATUS, host->clrflashstatus);
        nandc_set_reg(nandc, NAND_READ_STATUS, host->clrreadstatus);
 
-       write_reg_dma(nandc, NAND_FLASH_CMD, 3);
-       write_reg_dma(nandc, NAND_DEV0_CFG0, 2);
-       write_reg_dma(nandc, NAND_EXEC_CMD, 1);
+       write_reg_dma(nandc, NAND_FLASH_CMD, 3, NAND_BAM_NEXT_SGL);
+       write_reg_dma(nandc, NAND_DEV0_CFG0, 2, NAND_BAM_NEXT_SGL);
+       write_reg_dma(nandc, NAND_EXEC_CMD, 1, NAND_BAM_NEXT_SGL);
 
-       read_reg_dma(nandc, NAND_FLASH_STATUS, 1);
+       read_reg_dma(nandc, NAND_FLASH_STATUS, 1, NAND_BAM_NEXT_SGL);
 
-       write_reg_dma(nandc, NAND_FLASH_STATUS, 1);
-       write_reg_dma(nandc, NAND_READ_STATUS, 1);
+       write_reg_dma(nandc, NAND_FLASH_STATUS, 1, 0);
+       write_reg_dma(nandc, NAND_READ_STATUS, 1, NAND_BAM_NEXT_SGL);
 
        return 0;
 }
        nandc_set_reg(nandc, NAND_FLASH_CHIP_SELECT, DM_EN);
        nandc_set_reg(nandc, NAND_EXEC_CMD, 1);
 
-       write_reg_dma(nandc, NAND_FLASH_CMD, 4);
-       write_reg_dma(nandc, NAND_EXEC_CMD, 1);
+       write_reg_dma(nandc, NAND_FLASH_CMD, 4, NAND_BAM_NEXT_SGL);
+       write_reg_dma(nandc, NAND_EXEC_CMD, 1, NAND_BAM_NEXT_SGL);
 
-       read_reg_dma(nandc, NAND_READ_ID, 1);
+       read_reg_dma(nandc, NAND_READ_ID, 1, NAND_BAM_NEXT_SGL);
 
        return 0;
 }
        nandc_set_reg(nandc, NAND_FLASH_CMD, RESET_DEVICE);
        nandc_set_reg(nandc, NAND_EXEC_CMD, 1);
 
-       write_reg_dma(nandc, NAND_FLASH_CMD, 1);
-       write_reg_dma(nandc, NAND_EXEC_CMD, 1);
+       write_reg_dma(nandc, NAND_FLASH_CMD, 1, NAND_BAM_NEXT_SGL);
+       write_reg_dma(nandc, NAND_EXEC_CMD, 1, NAND_BAM_NEXT_SGL);
 
-       read_reg_dma(nandc, NAND_FLASH_STATUS, 1);
+       read_reg_dma(nandc, NAND_FLASH_STATUS, 1, NAND_BAM_NEXT_SGL);
 
        return 0;
 }
 
                if (data_buf)
                        read_data_dma(nandc, FLASH_BUF_ACC, data_buf,
-                                     data_size);
+                                     data_size, 0);
 
                /*
                 * when ecc is enabled, the controller doesn't read the real
                                *oob_buf++ = 0xff;
 
                        read_data_dma(nandc, FLASH_BUF_ACC + data_size,
-                                     oob_buf, oob_size);
+                                     oob_buf, oob_size, 0);
                }
 
                if (data_buf)
 
        config_nand_single_cw_page_read(nandc);
 
-       read_data_dma(nandc, FLASH_BUF_ACC, nandc->data_buffer, size);
+       read_data_dma(nandc, FLASH_BUF_ACC, nandc->data_buffer, size, 0);
 
        ret = submit_descs(nandc);
        if (ret)
 
                config_nand_cw_read(nandc);
 
-               read_data_dma(nandc, reg_off, data_buf, data_size1);
+               read_data_dma(nandc, reg_off, data_buf, data_size1, 0);
                reg_off += data_size1;
                data_buf += data_size1;
 
-               read_data_dma(nandc, reg_off, oob_buf, oob_size1);
+               read_data_dma(nandc, reg_off, oob_buf, oob_size1, 0);
                reg_off += oob_size1;
                oob_buf += oob_size1;
 
-               read_data_dma(nandc, reg_off, data_buf, data_size2);
+               read_data_dma(nandc, reg_off, data_buf, data_size2, 0);
                reg_off += data_size2;
                data_buf += data_size2;
 
-               read_data_dma(nandc, reg_off, oob_buf, oob_size2);
+               read_data_dma(nandc, reg_off, oob_buf, oob_size2, 0);
                oob_buf += oob_size2;
        }
 
                }
 
 
-               write_data_dma(nandc, FLASH_BUF_ACC, data_buf, data_size);
+               write_data_dma(nandc, FLASH_BUF_ACC, data_buf, data_size,
+                              i == (ecc->steps - 1) ? NAND_BAM_NO_EOT : 0);
 
                /*
                 * when ECC is enabled, we don't really need to write anything
                        oob_buf += host->bbm_size;
 
                        write_data_dma(nandc, FLASH_BUF_ACC + data_size,
-                                      oob_buf, oob_size);
+                                      oob_buf, oob_size, 0);
                }
 
                config_nand_cw_write(nandc);
                        oob_size2 = host->ecc_bytes_hw + host->spare_bytes;
                }
 
-               write_data_dma(nandc, reg_off, data_buf, data_size1);
+               write_data_dma(nandc, reg_off, data_buf, data_size1,
+                              NAND_BAM_NO_EOT);
                reg_off += data_size1;
                data_buf += data_size1;
 
-               write_data_dma(nandc, reg_off, oob_buf, oob_size1);
+               write_data_dma(nandc, reg_off, oob_buf, oob_size1,
+                              NAND_BAM_NO_EOT);
                reg_off += oob_size1;
                oob_buf += oob_size1;
 
-               write_data_dma(nandc, reg_off, data_buf, data_size2);
+               write_data_dma(nandc, reg_off, data_buf, data_size2,
+                              NAND_BAM_NO_EOT);
                reg_off += data_size2;
                data_buf += data_size2;
 
-               write_data_dma(nandc, reg_off, oob_buf, oob_size2);
+               write_data_dma(nandc, reg_off, oob_buf, oob_size2, 0);
                oob_buf += oob_size2;
 
                config_nand_cw_write(nandc);
        update_rw_regs(host, 1, false);
 
        config_nand_page_write(nandc);
-       write_data_dma(nandc, FLASH_BUF_ACC, nandc->data_buffer,
-                      data_size + oob_size);
+       write_data_dma(nandc, FLASH_BUF_ACC,
+                      nandc->data_buffer, data_size + oob_size, 0);
        config_nand_cw_write(nandc);
 
        ret = submit_descs(nandc);
        update_rw_regs(host, 1, false);
 
        config_nand_page_write(nandc);
-       write_data_dma(nandc, FLASH_BUF_ACC, nandc->data_buffer, host->cw_size);
+       write_data_dma(nandc, FLASH_BUF_ACC,
+                      nandc->data_buffer, host->cw_size, 0);
        config_nand_cw_write(nandc);
 
        ret = submit_descs(nandc);