#define DML2_MAX_FMT_420_BUFFER_WIDTH 4096
 #define DML_MAX_NUM_OF_SLICES_PER_DSC 4
+#define ALLOW_SDPIF_RATE_LIMIT_PRE_CSTATE
 
 const char *dml2_core_internal_bw_type_str(enum dml2_core_internal_bw_type bw_type)
 {
 #endif
 
        *p->hw_debug5 = false;
+#ifdef ALLOW_SDPIF_RATE_LIMIT_PRE_CSTATE
+       if (p->NumberOfActiveSurfaces > 1)
+               *p->hw_debug5 = true;
+#else
        for (unsigned int k = 0; k < p->NumberOfActiveSurfaces; ++k) {
                if (!(p->mrq_present) && (!(*p->UnboundedRequestEnabled)) && (TotalActiveDPP == 1)
                        && p->display_cfg->plane_descriptors[k].surface.dcc.enable
                dml2_printf("DML::%s: k=%u hw_debug5 = %u\n", __func__, k, *p->hw_debug5);
 #endif
        }
+#endif
 }
 
 static enum dml2_odm_mode DecideODMMode(unsigned int HActive,
 
        uint32_t DCHUBBUB_ARB_FRAC_URG_BW_MALL_B;
        uint32_t DCHUBBUB_TIMEOUT_DETECTION_CTRL1;
        uint32_t DCHUBBUB_TIMEOUT_DETECTION_CTRL2;
+       uint32_t DCHUBBUB_CTRL_STATUS;
 };
 
 #define HUBBUB_REG_FIELD_LIST_DCN32(type) \
                type DCHUBBUB_TIMEOUT_REQ_STALL_THRESHOLD;\
                type DCHUBBUB_TIMEOUT_PSTATE_STALL_THRESHOLD;\
                type DCHUBBUB_TIMEOUT_DETECTION_EN;\
-               type DCHUBBUB_TIMEOUT_TIMER_RESET
+               type DCHUBBUB_TIMEOUT_TIMER_RESET;\
+               type ROB_UNDERFLOW_STATUS;\
+               type ROB_OVERFLOW_STATUS;\
+               type ROB_OVERFLOW_CLEAR;\
+               type DCHUBBUB_HW_DEBUG;\
+               type CSTATE_SWATH_CHK_GOOD_MODE
 
 #define HUBBUB_STUTTER_REG_FIELD_LIST(type) \
                type DCHUBBUB_ARB_ALLOW_SR_ENTER_WATERMARK_A;\
 
        unsigned int det1_size;
        unsigned int det2_size;
        unsigned int det3_size;
+       bool allow_sdpif_rate_limit_when_cstate_req;
 };
 
 void hubbub2_construct(struct dcn20_hubbub *hubbub,
 
        }
 }
 
-static void dcn401_program_timeout_thresholds(struct hubbub *hubbub, struct dml2_display_arb_regs *arb_regs)
+static bool dcn401_program_arbiter(struct hubbub *hubbub, struct dml2_display_arb_regs *arb_regs, bool safe_to_lower)
 {
        struct dcn20_hubbub *hubbub2 = TO_DCN20_HUBBUB(hubbub);
 
+       bool wm_pending = false;
+       uint32_t temp;
+
        /* request backpressure and outstanding return threshold (unused)*/
        //REG_UPDATE(DCHUBBUB_TIMEOUT_DETECTION_CTRL1, DCHUBBUB_TIMEOUT_REQ_STALL_THRESHOLD, arb_regs->req_stall_threshold);
 
        /* P-State stall threshold */
        REG_UPDATE(DCHUBBUB_TIMEOUT_DETECTION_CTRL2, DCHUBBUB_TIMEOUT_PSTATE_STALL_THRESHOLD, arb_regs->pstate_stall_threshold);
+
+       if (safe_to_lower || arb_regs->allow_sdpif_rate_limit_when_cstate_req > hubbub2->allow_sdpif_rate_limit_when_cstate_req) {
+               hubbub2->allow_sdpif_rate_limit_when_cstate_req = arb_regs->allow_sdpif_rate_limit_when_cstate_req;
+
+               /* only update the required bits */
+               REG_GET(DCHUBBUB_CTRL_STATUS, DCHUBBUB_HW_DEBUG, &temp);
+               if (hubbub2->allow_sdpif_rate_limit_when_cstate_req) {
+                       temp |= (1 << 5);
+               } else {
+                       temp &= ~(1 << 5);
+               }
+               REG_UPDATE(DCHUBBUB_CTRL_STATUS, DCHUBBUB_HW_DEBUG, temp);
+       } else {
+               wm_pending = true;
+       }
+
+       return wm_pending;
 }
 
 static const struct hubbub_funcs hubbub4_01_funcs = {
        .program_det_segments = dcn401_program_det_segments,
        .program_compbuf_segments = dcn401_program_compbuf_segments,
        .wait_for_det_update = dcn401_wait_for_det_update,
-       .program_timeout_thresholds = dcn401_program_timeout_thresholds,
+       .program_arbiter = dcn401_program_arbiter,
 };
 
 void hubbub401_construct(struct dcn20_hubbub *hubbub2,
 
        HUBBUB_SF(DCHUBBUB_TIMEOUT_DETECTION_CTRL1, DCHUBBUB_TIMEOUT_REQ_STALL_THRESHOLD, mask_sh),\
        HUBBUB_SF(DCHUBBUB_TIMEOUT_DETECTION_CTRL2, DCHUBBUB_TIMEOUT_PSTATE_STALL_THRESHOLD, mask_sh),\
        HUBBUB_SF(DCHUBBUB_TIMEOUT_DETECTION_CTRL2, DCHUBBUB_TIMEOUT_DETECTION_EN, mask_sh),\
-       HUBBUB_SF(DCHUBBUB_TIMEOUT_DETECTION_CTRL2, DCHUBBUB_TIMEOUT_TIMER_RESET, mask_sh)
+       HUBBUB_SF(DCHUBBUB_TIMEOUT_DETECTION_CTRL2, DCHUBBUB_TIMEOUT_TIMER_RESET, mask_sh),\
+       HUBBUB_SF(DCHUBBUB_CTRL_STATUS, ROB_UNDERFLOW_STATUS, mask_sh),\
+       HUBBUB_SF(DCHUBBUB_CTRL_STATUS, ROB_OVERFLOW_STATUS, mask_sh),\
+       HUBBUB_SF(DCHUBBUB_CTRL_STATUS, ROB_OVERFLOW_CLEAR, mask_sh),\
+       HUBBUB_SF(DCHUBBUB_CTRL_STATUS, DCHUBBUB_HW_DEBUG, mask_sh),\
+       HUBBUB_SF(DCHUBBUB_CTRL_STATUS, CSTATE_SWATH_CHK_GOOD_MODE, mask_sh)
 
 bool hubbub401_program_urgent_watermarks(
                struct hubbub *hubbub,
 
                                        &context->bw_ctx.bw.dcn.watermarks,
                                        dc->res_pool->ref_clocks.dchub_ref_clock_inKhz / 1000,
                                        false);
+       /* update timeout thresholds */
+       if (hubbub->funcs->program_arbiter) {
+               dc->wm_optimized_required |= hubbub->funcs->program_arbiter(hubbub, &context->bw_ctx.bw.dcn.arb_regs, false);
+       }
 
        /* decrease compbuf size */
        if (hubbub->funcs->program_compbuf_segments) {
                                        &context->bw_ctx.bw.dcn.watermarks,
                                        dc->res_pool->ref_clocks.dchub_ref_clock_inKhz / 1000,
                                        true);
+       /* update timeout thresholds */
+       if (hubbub->funcs->program_arbiter) {
+               hubbub->funcs->program_arbiter(hubbub, &context->bw_ctx.bw.dcn.arb_regs, true);
+       }
 
        if (dc->clk_mgr->dc_mode_softmax_enabled)
                if (dc->clk_mgr->clks.dramclk_khz > dc->clk_mgr->bw_params->dc_mode_softmax_memclk * 1000 &&
                                                pipe_ctx->dlg_regs.min_dst_y_next_start);
                }
        }
-
-       /* update timeout thresholds */
-       if (hubbub->funcs->program_timeout_thresholds) {
-               hubbub->funcs->program_timeout_thresholds(hubbub, &context->bw_ctx.bw.dcn.arb_regs);
-       }
 }
 
 void dcn401_fams2_global_control_lock(struct dc *dc,
 
        void (*program_det_segments)(struct hubbub *hubbub, int hubp_inst, unsigned det_buffer_size_seg);
        void (*program_compbuf_segments)(struct hubbub *hubbub, unsigned compbuf_size_seg, bool safe_to_increase);
        void (*wait_for_det_update)(struct hubbub *hubbub, int hubp_inst);
-       void (*program_timeout_thresholds)(struct hubbub *hubbub, struct dml2_display_arb_regs *arb_regs);
+       bool (*program_arbiter)(struct hubbub *hubbub, struct dml2_display_arb_regs *arb_regs, bool safe_to_lower);
 };
 
 struct hubbub {
 
        SR(DCHUBBUB_SDPIF_CFG1),                                                 \
        SR(DCHUBBUB_MEM_PWR_MODE_CTRL),                                          \
        SR(DCHUBBUB_TIMEOUT_DETECTION_CTRL1),                                    \
-       SR(DCHUBBUB_TIMEOUT_DETECTION_CTRL2)
+       SR(DCHUBBUB_TIMEOUT_DETECTION_CTRL2),                                                                    \
+       SR(DCHUBBUB_CTRL_STATUS)
 
 /* DCCG */