break;
                trace_btrfs_ordered_sched(work);
                spin_unlock_irqrestore(lock, flags);
-               work->ordered_func(work);
+               work->ordered_func(work, false);
 
                /* now take the lock again and drop our item from the list */
                spin_lock_irqsave(lock, flags);
                         * We don't want to call the ordered free functions with
                         * the lock held.
                         */
-                       work->ordered_free(work);
+                       work->ordered_func(work, true);
                        /* NB: work must not be dereferenced past this point. */
                        trace_btrfs_all_work_done(wq->fs_info, work);
                }
        spin_unlock_irqrestore(lock, flags);
 
        if (free_self) {
-               self->ordered_free(self);
+               self->ordered_func(self, true);
                /* NB: self must not be dereferenced past this point. */
                trace_btrfs_all_work_done(wq->fs_info, self);
        }
 
        /*
         * We should not touch things inside work in the following cases:
-        * 1) after work->func() if it has no ordered_free
+        * 1) after work->func() if it has no ordered_func(..., true) to free
         *    Since the struct is freed in work->func().
         * 2) after setting WORK_DONE_BIT
         *    The work may be freed in other threads almost instantly.
 }
 
 void btrfs_init_work(struct btrfs_work *work, btrfs_func_t func,
-                    btrfs_func_t ordered_func, btrfs_func_t ordered_free)
+                    btrfs_ordered_func_t ordered_func)
 {
        work->func = func;
        work->ordered_func = ordered_func;
-       work->ordered_free = ordered_free;
        INIT_WORK(&work->normal_work, btrfs_work_helper);
        INIT_LIST_HEAD(&work->ordered_list);
        work->flags = 0;
 
 struct btrfs_workqueue;
 struct btrfs_work;
 typedef void (*btrfs_func_t)(struct btrfs_work *arg);
+typedef void (*btrfs_ordered_func_t)(struct btrfs_work *arg, bool);
 
 struct btrfs_work {
        btrfs_func_t func;
-       btrfs_func_t ordered_func;
-       btrfs_func_t ordered_free;
+       btrfs_ordered_func_t ordered_func;
 
        /* Don't touch things below */
        struct work_struct normal_work;
                                struct btrfs_fs_info *fs_info, const char *name,
                                unsigned int flags);
 void btrfs_init_work(struct btrfs_work *work, btrfs_func_t func,
-                    btrfs_func_t ordered_func, btrfs_func_t ordered_free);
+                    btrfs_ordered_func_t ordered_func);
 void btrfs_queue_work(struct btrfs_workqueue *wq,
                      struct btrfs_work *work);
 void btrfs_destroy_workqueue(struct btrfs_workqueue *wq);
 
  *
  * At IO completion time the csums attached on the ordered extent record are
  * inserted into the tree.
+ *
+ * If called with @do_free == true, then it will free the work struct.
  */
-static void run_one_async_done(struct btrfs_work *work)
+static void run_one_async_done(struct btrfs_work *work, bool do_free)
 {
        struct async_submit_bio *async =
                container_of(work, struct async_submit_bio, work);
        struct bio *bio = &async->bbio->bio;
 
+       if (do_free) {
+               kfree(container_of(work, struct async_submit_bio, work));
+               return;
+       }
+
        /* If an error occurred we just want to clean up the bio and move on. */
        if (bio->bi_status) {
                btrfs_orig_bbio_end_io(async->bbio);
        __btrfs_submit_bio(bio, async->bioc, &async->smap, async->mirror_num);
 }
 
-static void run_one_async_free(struct btrfs_work *work)
-{
-       kfree(container_of(work, struct async_submit_bio, work));
-}
-
 static bool should_async_write(struct btrfs_bio *bbio)
 {
        /* Submit synchronously if the checksum implementation is fast. */
        async->smap = *smap;
        async->mirror_num = mirror_num;
 
-       btrfs_init_work(&async->work, run_one_async_start, run_one_async_done,
-                       run_one_async_free);
+       btrfs_init_work(&async->work, run_one_async_start, run_one_async_done);
        btrfs_queue_work(fs_info->workers, &async->work);
        return true;
 }
 
        caching_ctl->block_group = cache;
        refcount_set(&caching_ctl->count, 2);
        atomic_set(&caching_ctl->progress, 0);
-       btrfs_init_work(&caching_ctl->work, caching_thread, NULL, NULL);
+       btrfs_init_work(&caching_ctl->work, caching_thread, NULL);
 
        spin_lock(&cache->lock);
        if (cache->cached != BTRFS_CACHE_NO) {
 
                return -ENOMEM;
 
        async_work->delayed_root = delayed_root;
-       btrfs_init_work(&async_work->work, btrfs_async_run_delayed_root, NULL,
-                       NULL);
+       btrfs_init_work(&async_work->work, btrfs_async_run_delayed_root, NULL);
        async_work->nr = nr;
 
        btrfs_queue_work(fs_info->delayed_workers, &async_work->work);
 
  * Phase two of compressed writeback.  This is the ordered portion of the code,
  * which only gets called in the order the work was queued.  We walk all the
  * async extents created by compress_file_range and send them down to the disk.
+ *
+ * If called with @do_free == true then it'll try to finish the work and free
+ * the work struct eventually.
  */
-static noinline void submit_compressed_extents(struct btrfs_work *work)
+static noinline void submit_compressed_extents(struct btrfs_work *work, bool do_free)
 {
        struct async_chunk *async_chunk = container_of(work, struct async_chunk,
                                                     work);
        unsigned long nr_pages;
        u64 alloc_hint = 0;
 
+       if (do_free) {
+               struct async_chunk *async_chunk;
+               struct async_cow *async_cow;
+
+               async_chunk = container_of(work, struct async_chunk, work);
+               btrfs_add_delayed_iput(async_chunk->inode);
+               if (async_chunk->blkcg_css)
+                       css_put(async_chunk->blkcg_css);
+
+               async_cow = async_chunk->async_cow;
+               if (atomic_dec_and_test(&async_cow->num_chunks))
+                       kvfree(async_cow);
+               return;
+       }
+
        nr_pages = (async_chunk->end - async_chunk->start + PAGE_SIZE) >>
                PAGE_SHIFT;
 
                cond_wake_up_nomb(&fs_info->async_submit_wait);
 }
 
-static noinline void async_cow_free(struct btrfs_work *work)
-{
-       struct async_chunk *async_chunk;
-       struct async_cow *async_cow;
-
-       async_chunk = container_of(work, struct async_chunk, work);
-       btrfs_add_delayed_iput(async_chunk->inode);
-       if (async_chunk->blkcg_css)
-               css_put(async_chunk->blkcg_css);
-
-       async_cow = async_chunk->async_cow;
-       if (atomic_dec_and_test(&async_cow->num_chunks))
-               kvfree(async_cow);
-}
-
 static bool run_delalloc_compressed(struct btrfs_inode *inode,
                                    struct page *locked_page, u64 start,
                                    u64 end, struct writeback_control *wbc)
                }
 
                btrfs_init_work(&async_chunk[i].work, compress_file_range,
-                               submit_compressed_extents, async_cow_free);
+                               submit_compressed_extents);
 
                nr_pages = DIV_ROUND_UP(cur_end - start, PAGE_SIZE);
                atomic_add(nr_pages, &fs_info->async_delalloc_pages);
        ihold(inode);
        btrfs_page_set_checked(fs_info, page, page_offset(page), PAGE_SIZE);
        get_page(page);
-       btrfs_init_work(&fixup->work, btrfs_writepage_fixup_worker, NULL, NULL);
+       btrfs_init_work(&fixup->work, btrfs_writepage_fixup_worker, NULL);
        fixup->page = page;
        fixup->inode = BTRFS_I(inode);
        btrfs_queue_work(fs_info->fixup_workers, &fixup->work);
        init_completion(&work->completion);
        INIT_LIST_HEAD(&work->list);
        work->inode = inode;
-       btrfs_init_work(&work->work, btrfs_run_delalloc_work, NULL, NULL);
+       btrfs_init_work(&work->work, btrfs_run_delalloc_work, NULL);
 
        return work;
 }
 
        struct btrfs_workqueue *wq = btrfs_is_free_space_inode(inode) ?
                fs_info->endio_freespace_worker : fs_info->endio_write_workers;
 
-       btrfs_init_work(&ordered->work, finish_ordered_fn, NULL, NULL);
+       btrfs_init_work(&ordered->work, finish_ordered_fn, NULL);
        btrfs_queue_work(wq, &ordered->work);
 }
 
                spin_unlock(&root->ordered_extent_lock);
 
                btrfs_init_work(&ordered->flush_work,
-                               btrfs_run_ordered_extent_work, NULL, NULL);
+                               btrfs_run_ordered_extent_work, NULL);
                list_add_tail(&ordered->work_list, &works);
                btrfs_queue_work(fs_info->flush_workers, &ordered->flush_work);
 
 
        mutex_unlock(&fs_info->qgroup_rescan_lock);
 
        btrfs_init_work(&fs_info->qgroup_rescan_work,
-                       btrfs_qgroup_rescan_worker, NULL, NULL);
+                       btrfs_qgroup_rescan_worker, NULL);
        return 0;
 }
 
 
                __field(        const void *,   wq                      )
                __field(        const void *,   func                    )
                __field(        const void *,   ordered_func            )
-               __field(        const void *,   ordered_free            )
                __field(        const void *,   normal_work             )
        ),
 
                __entry->wq             = work->wq;
                __entry->func           = work->func;
                __entry->ordered_func   = work->ordered_func;
-               __entry->ordered_free   = work->ordered_free;
                __entry->normal_work    = &work->normal_work;
        ),
 
-       TP_printk_btrfs("work=%p (normal_work=%p) wq=%p func=%ps ordered_func=%p "
-                 "ordered_free=%p",
+       TP_printk_btrfs("work=%p (normal_work=%p) wq=%p func=%ps ordered_func=%p",
                  __entry->work, __entry->normal_work, __entry->wq,
-                  __entry->func, __entry->ordered_func, __entry->ordered_free)
+                  __entry->func, __entry->ordered_func)
 );
 
 /*