ctx = (iopte_val(*base) & IOPTE_CONTEXT) >> 47UL;
 
        /* Step 1: Kick data out of streaming buffers if necessary. */
-       if (strbuf->strbuf_enabled)
+       if (strbuf->strbuf_enabled && !(attrs & DMA_ATTR_SKIP_CPU_SYNC))
                strbuf_flush(strbuf, iommu, bus_addr, ctx,
                             npages, direction);
 
                base = iommu->page_table + entry;
 
                dma_handle &= IO_PAGE_MASK;
-               if (strbuf->strbuf_enabled)
+               if (strbuf->strbuf_enabled && !(attrs & DMA_ATTR_SKIP_CPU_SYNC))
                        strbuf_flush(strbuf, iommu, dma_handle, ctx,
                                     npages, direction);
 
 
 static void pci32_unmap_page(struct device *dev, dma_addr_t ba, size_t size,
                              enum dma_data_direction dir, unsigned long attrs)
 {
-       if (dir != PCI_DMA_TODEVICE)
+       if (dir != PCI_DMA_TODEVICE && !(attrs & DMA_ATTR_SKIP_CPU_SYNC)) /* coherency pass only when dir is not PCI_DMA_TODEVICE and DMA_ATTR_SKIP_CPU_SYNC is clear in attrs */
                 dma_make_coherent(ba, PAGE_ALIGN(size));
 }
 
        struct scatterlist *sg;
        int n;
 
-       if (dir != PCI_DMA_TODEVICE) {
+       if (dir != PCI_DMA_TODEVICE && !(attrs & DMA_ATTR_SKIP_CPU_SYNC)) {
                for_each_sg(sgl, sg, nents, n) {
                        dma_make_coherent(sg_phys(sg), PAGE_ALIGN(sg->length));
                }