/*
  * The save/restore register list must be pre-calculated to a temporary
- * buffer of driver defined size before it can be generated in place
- * inside the ADS.
+ * buffer before it can be copied inside the ADS.
  */
-#define MAX_MMIO_REGS  128     /* Arbitrary size, increase as needed */
 struct temp_regset {
+       /*
+        * ptr to the section of the storage for the engine currently being
+        * worked on
+        */
        struct guc_mmio_reg *registers;
-       u32 used;
-       u32 size;
+       /* ptr to the base of the allocated storage for all engines */
+       struct guc_mmio_reg *storage;
+       u32 storage_used;
+       u32 storage_max;
 };
 
 static int guc_mmio_reg_cmp(const void *a, const void *b)
        return (int)ra->offset - (int)rb->offset;
 }
 
+static struct guc_mmio_reg * __must_check
+__mmio_reg_add(struct temp_regset *regset, struct guc_mmio_reg *reg)
+{
+       u32 pos = regset->storage_used;
+       struct guc_mmio_reg *slot;
+
+       if (pos >= regset->storage_max) {
+               size_t size = ALIGN((pos + 1) * sizeof(*slot), PAGE_SIZE);
+               struct guc_mmio_reg *r = krealloc(regset->storage,
+                                                 size, GFP_KERNEL);
+               if (!r) {
+                       WARN_ONCE(1, "Incomplete regset list: can't add register (%d)\n",
+                                 -ENOMEM);
+                       return ERR_PTR(-ENOMEM);
+               }
+
+               regset->registers = r + (regset->registers - regset->storage);
+               regset->storage = r;
+               regset->storage_max = size / sizeof(*slot);
+       }
+
+       slot = ®set->storage[pos];
+       regset->storage_used++;
+       *slot = *reg;
+
+       return slot;
+}
+
 static long __must_check guc_mmio_reg_add(struct temp_regset *regset,
                                          u32 offset, u32 flags)
 {
-       u32 count = regset->used;
+       u32 count = regset->storage_used - (regset->registers - regset->storage);
        struct guc_mmio_reg reg = {
                .offset = offset,
                .flags = flags,
        };
        struct guc_mmio_reg *slot;
 
-       GEM_BUG_ON(count >= regset->size);
-
        /*
         * The mmio list is built using separate lists within the driver.
         * It's possible that at some point we may attempt to add the same
                    sizeof(reg), guc_mmio_reg_cmp))
                return 0;
 
-       slot = ®set->registers[count];
-       regset->used++;
-       *slot = reg;
+       slot = __mmio_reg_add(regset, ®);
+       if (IS_ERR(slot))
+               return PTR_ERR(slot);
 
        while (slot-- > regset->registers) {
                GEM_BUG_ON(slot[0].offset == slot[1].offset);
        unsigned int i;
        int ret = 0;
 
-       regset->used = 0;
+       /*
+        * Each engine's registers point to a new start relative to
+        * storage
+        */
+       regset->registers = regset->storage + regset->storage_used;
 
        ret |= GUC_MMIO_REG_ADD(regset, RING_MODE_GEN7(base), true);
        ret |= GUC_MMIO_REG_ADD(regset, RING_HWS_PGA(base), false);
        return ret ? -1 : 0;
 }
 
-static int guc_mmio_reg_state_query(struct intel_guc *guc)
+static long guc_mmio_reg_state_create(struct intel_guc *guc)
 {
        struct intel_gt *gt = guc_to_gt(guc);
        struct intel_engine_cs *engine;
        enum intel_engine_id id;
-       struct temp_regset temp_set;
-       u32 total;
+       struct temp_regset temp_set = {};
+       long total = 0;
+       long ret;
 
-       /*
-        * Need to actually build the list in order to filter out
-        * duplicates and other such data dependent constructions.
-        */
-       temp_set.size = MAX_MMIO_REGS;
-       temp_set.registers = kmalloc_array(temp_set.size,
-                                          sizeof(*temp_set.registers),
-                                          GFP_KERNEL);
-       if (!temp_set.registers)
-               return -ENOMEM;
-
-       total = 0;
        for_each_engine(engine, gt, id) {
-               guc_mmio_regset_init(&temp_set, engine);
-               total += temp_set.used;
+               u32 used = temp_set.storage_used;
+
+               ret = guc_mmio_regset_init(&temp_set, engine);
+               if (ret < 0)
+                       goto fail_regset_init;
+
+               guc->ads_regset_count[id] = temp_set.storage_used - used;
+               total += guc->ads_regset_count[id];
        }
 
-       kfree(temp_set.registers);
+       guc->ads_regset = temp_set.storage;
+
+       drm_dbg(&guc_to_gt(guc)->i915->drm, "Used %zu KB for temporary ADS regset\n",
+               (temp_set.storage_max * sizeof(struct guc_mmio_reg)) >> 10);
 
        return total * sizeof(struct guc_mmio_reg);
+
+fail_regset_init:
+       kfree(temp_set.storage);
+       return ret;
 }
 
 static void guc_mmio_reg_state_init(struct intel_guc *guc,
 {
        struct intel_gt *gt = guc_to_gt(guc);
        struct intel_engine_cs *engine;
+       struct guc_mmio_reg *ads_registers;
        enum intel_engine_id id;
-       struct temp_regset temp_set;
-       struct guc_mmio_reg_set *ads_reg_set;
        u32 addr_ggtt, offset;
-       u8 guc_class;
 
        offset = guc_ads_regset_offset(guc);
        addr_ggtt = intel_guc_ggtt_offset(guc, guc->ads_vma) + offset;
-       temp_set.registers = (struct guc_mmio_reg *)(((u8 *)blob) + offset);
-       temp_set.size = guc->ads_regset_size / sizeof(temp_set.registers[0]);
+       ads_registers = (struct guc_mmio_reg *)(((u8 *)blob) + offset);
+
+       memcpy(ads_registers, guc->ads_regset, guc->ads_regset_size);
 
        for_each_engine(engine, gt, id) {
+               u32 count = guc->ads_regset_count[id];
+               struct guc_mmio_reg_set *ads_reg_set;
+               u8 guc_class;
+
                /* Class index is checked in class converter */
                GEM_BUG_ON(engine->instance >= GUC_MAX_INSTANCES_PER_CLASS);
 
                guc_class = engine_class_to_guc_class(engine->class);
                ads_reg_set = &blob->ads.reg_state_list[guc_class][engine->instance];
 
-               guc_mmio_regset_init(&temp_set, engine);
-               if (!temp_set.used) {
+               if (!count) {
                        ads_reg_set->address = 0;
                        ads_reg_set->count = 0;
                        continue;
                }
 
                ads_reg_set->address = addr_ggtt;
-               ads_reg_set->count = temp_set.used;
+               ads_reg_set->count = count;
 
-               temp_set.size -= temp_set.used;
-               temp_set.registers += temp_set.used;
-               addr_ggtt += temp_set.used * sizeof(struct guc_mmio_reg);
+               addr_ggtt += count * sizeof(struct guc_mmio_reg);
        }
-
-       GEM_BUG_ON(temp_set.size);
 }
 
 static void fill_engine_enable_masks(struct intel_gt *gt,
 
        GEM_BUG_ON(guc->ads_vma);
 
-       /* Need to calculate the reg state size dynamically: */
-       ret = guc_mmio_reg_state_query(guc);
+       /*
+        * Create reg state size dynamically on system memory to be copied to
+        * the final ads blob on gt init/reset
+        */
+       ret = guc_mmio_reg_state_create(guc);
        if (ret < 0)
                return ret;
        guc->ads_regset_size = ret;
 {
        i915_vma_unpin_and_release(&guc->ads_vma, I915_VMA_RELEASE_MAP);
        guc->ads_blob = NULL;
+       kfree(guc->ads_regset);
 }
 
 static void guc_ads_private_data_reset(struct intel_guc *guc)