static inline void bch2_dev_get(struct bch_dev *ca)
 {
+#ifdef CONFIG_BCACHEFS_DEBUG /* debug build: ca->ref is driven through atomic_long_* ops so misuse can be asserted */
+       BUG_ON(atomic_long_inc_return(&ca->ref) <= 1L); /* a post-increment count <= 1 means the ref was <= 0 before this get */
+#else /* !CONFIG_BCACHEFS_DEBUG: take the reference through percpu_ref */
        percpu_ref_get(&ca->ref);
+#endif /* CONFIG_BCACHEFS_DEBUG */
 }
 
 static inline void __bch2_dev_put(struct bch_dev *ca)
 {
+#ifdef CONFIG_BCACHEFS_DEBUG /* debug build: drop the ref with atomic_long_* ops and check for underflow */
+       long r = atomic_long_dec_return(&ca->ref); /* r is the count after this put */
+       if (r < (long) !ca->dying) /* lowest legal count is 1 while !ca->dying, 0 once ca->dying is set */
+               panic("bch_dev->ref underflow, last put: %pS\n", (void *) ca->last_put); /* reports the address saved by the previous put */
+       ca->last_put = _THIS_IP_; /* remember this put's location for a later underflow report */
+       if (!r) /* count reached zero */
+               complete(&ca->ref_completion); /* signal ref_completion, as the percpu_ref release callback does in non-debug builds */
+#else /* !CONFIG_BCACHEFS_DEBUG: drop the reference through percpu_ref */
        percpu_ref_put(&ca->ref);
+#endif /* CONFIG_BCACHEFS_DEBUG */
 }
 
 static inline void bch2_dev_put(struct bch_dev *ca)
 
                struct bch_dev *ca = rcu_dereference_protected(c->devs[i], true);
 
                if (ca) {
+                       EBUG_ON(atomic_long_read(&ca->ref) != 1);
                        bch2_free_super(&ca->disk_sb);
                        bch2_dev_free(ca);
                }
        bch2_time_stats_quantiles_exit(&ca->io_latency[READ]);
 
        percpu_ref_exit(&ca->io_ref);
+#ifndef CONFIG_BCACHEFS_DEBUG
        percpu_ref_exit(&ca->ref);
+#endif
        kobject_put(&ca->kobj);
 }
 
        bch2_dev_journal_exit(ca);
 }
 
+#ifndef CONFIG_BCACHEFS_DEBUG /* callback handed to percpu_ref_init() for ca->ref; only built when ca->ref is a percpu_ref */
 static void bch2_dev_ref_complete(struct percpu_ref *ref)
 {
        struct bch_dev *ca = container_of(ref, struct bch_dev, ref);
 
        complete(&ca->ref_completion);
 }
+#endif /* !CONFIG_BCACHEFS_DEBUG */
 
 static void bch2_dev_io_ref_complete(struct percpu_ref *ref)
 {
        ca->nr_btree_reserve = DIV_ROUND_UP(BTREE_NODE_RESERVE,
                             ca->mi.bucket_size / btree_sectors(c));
 
-       if (percpu_ref_init(&ca->ref, bch2_dev_ref_complete,
-                           0, GFP_KERNEL) ||
-           percpu_ref_init(&ca->io_ref, bch2_dev_io_ref_complete,
+#ifndef CONFIG_BCACHEFS_DEBUG
+       if (percpu_ref_init(&ca->ref, bch2_dev_ref_complete, 0, GFP_KERNEL))
+               goto err;
+#else
+       atomic_long_set(&ca->ref, 1);
+#endif
+
+       if (percpu_ref_init(&ca->io_ref, bch2_dev_io_ref_complete,
                            PERCPU_REF_INIT_DEAD, GFP_KERNEL) ||
            !(ca->sb_read_scratch = (void *) __get_free_page(GFP_KERNEL)) ||
            bch2_dev_buckets_alloc(c, ca) ||
        rcu_assign_pointer(c->devs[ca->dev_idx], NULL);
        mutex_unlock(&c->sb_lock);
 
+#ifndef CONFIG_BCACHEFS_DEBUG
        percpu_ref_kill(&ca->ref);
+#else
+       ca->dying = true;
+       bch2_dev_put(ca);
+#endif
        wait_for_completion(&ca->ref_completion);
 
        bch2_dev_free(ca);