struct buffer_head *di_bh, u64 byte_start,
                                    u64 byte_len)
 {
-       int ret = 0;
+       int ret = 0, flags = 0;
        u32 trunc_start, trunc_len, cpos, phys_cpos, alloc_size;
        struct ocfs2_super *osb = OCFS2_SB(inode->i_sb);
        struct ocfs2_cached_dealloc_ctxt dealloc;
        struct address_space *mapping = inode->i_mapping;
        struct ocfs2_extent_tree et;
+       struct ocfs2_dinode *di = (struct ocfs2_dinode *)di_bh->b_data;
+       u64 refcount_loc = le64_to_cpu(di->i_refcount_loc);
 
        ocfs2_init_dinode_extent_tree(&et, INODE_CACHE(inode), di_bh);
        ocfs2_init_dealloc_ctxt(&dealloc);
                goto out;
        }
 
+       /*
+        * For reflinks, we may need to CoW 2 clusters which might be
+        * partially zero'd later, if hole's start and end offset were
+        * within one cluster(means is not exactly aligned to clustersize).
+        */
+
+       if (OCFS2_I(inode)->ip_dyn_features & OCFS2_HAS_REFCOUNT_FL) {
+
+               ret = ocfs2_cow_file_pos(inode, di_bh, byte_start);
+               if (ret) {
+                       mlog_errno(ret);
+                       goto out;
+               }
+
+               ret = ocfs2_cow_file_pos(inode, di_bh, byte_start + byte_len);
+               if (ret) {
+                       mlog_errno(ret);
+                       goto out;
+               }
+       }
+
        trunc_start = ocfs2_clusters_for_bytes(osb->sb, byte_start);
        trunc_len = (byte_start + byte_len) >> osb->s_clustersize_bits;
        if (trunc_len >= trunc_start)
        cpos = trunc_start;
        while (trunc_len) {
                ret = ocfs2_get_clusters(inode, cpos, &phys_cpos,
-                                        &alloc_size, NULL);
+                                        &alloc_size, &flags);
                if (ret) {
                        mlog_errno(ret);
                        goto out;
                if (phys_cpos != 0) {
                        ret = ocfs2_remove_btree_range(inode, &et, cpos,
                                                       phys_cpos, alloc_size,
-                                                      0, &dealloc, 0);
+                                                      flags, &dealloc,
+                                                      refcount_loc);
                        if (ret) {
                                mlog_errno(ret);
                                goto out;