static inline void gic_pmr_mask_irqs(void)
 {
-       BUILD_BUG_ON(GICD_INT_DEF_PRI <= GIC_PRIO_IRQOFF);
+       BUILD_BUG_ON(GICD_INT_DEF_PRI < (GIC_PRIO_IRQOFF |
+                                        GIC_PRIO_PSR_I_SET));
+       BUILD_BUG_ON(GICD_INT_DEF_PRI >= GIC_PRIO_IRQON);
        gic_write_pmr(GIC_PRIO_IRQOFF);
 }
 
 
 
 #include <linux/irqflags.h>
 
+#include <asm/arch_gicv3.h>
 #include <asm/cpufeature.h>
 
 #define DAIF_PROCCTX           0
                :
                :
                : "memory");
+
+       /* Don't really care for a dsb here, we don't intend to enable IRQs */
+       if (system_uses_irq_prio_masking())
+               gic_write_pmr(GIC_PRIO_IRQON | GIC_PRIO_PSR_I_SET);
+
        trace_hardirqs_off();
 }
 
 
        if (system_uses_irq_prio_masking()) {
                /* If IRQs are masked with PMR, reflect it in the flags */
-               if (read_sysreg_s(SYS_ICC_PMR_EL1) <= GIC_PRIO_IRQOFF)
+               if (read_sysreg_s(SYS_ICC_PMR_EL1) != GIC_PRIO_IRQON)
                        flags |= PSR_I_BIT;
        }
 
        if (!irq_disabled) {
                trace_hardirqs_on();
 
-               if (system_uses_irq_prio_masking())
-                       arch_local_irq_enable();
-       } else if (!(flags & PSR_A_BIT)) {
-               /*
-                * If interrupts are disabled but we can take
-                * asynchronous errors, we can take NMIs
-                */
                if (system_uses_irq_prio_masking()) {
-                       flags &= ~PSR_I_BIT;
+                       gic_write_pmr(GIC_PRIO_IRQON);
+                       dsb(sy);
+               }
+       } else if (system_uses_irq_prio_masking()) {
+               u64 pmr;
+
+               if (!(flags & PSR_A_BIT)) {
                        /*
-                        * There has been concern that the write to daif
-                        * might be reordered before this write to PMR.
-                        * From the ARM ARM DDI 0487D.a, section D1.7.1
-                        * "Accessing PSTATE fields":
-                        *   Writes to the PSTATE fields have side-effects on
-                        *   various aspects of the PE operation. All of these
-                        *   side-effects are guaranteed:
-                        *     - Not to be visible to earlier instructions in
-                        *       the execution stream.
-                        *     - To be visible to later instructions in the
-                        *       execution stream
-                        *
-                        * Also, writes to PMR are self-synchronizing, so no
-                        * interrupts with a lower priority than PMR is signaled
-                        * to the PE after the write.
-                        *
-                        * So we don't need additional synchronization here.
+                        * If interrupts are disabled but we can take
+                        * asynchronous errors, we can take NMIs
                         */
-                       arch_local_irq_disable();
+                       flags &= ~PSR_I_BIT;
+                       pmr = GIC_PRIO_IRQOFF;
+               } else {
+                       pmr = GIC_PRIO_IRQON | GIC_PRIO_PSR_I_SET;
                }
+
+               /*
+                * There has been concern that the write to daif
+                * might be reordered before this write to PMR.
+                * From the ARM ARM DDI 0487D.a, section D1.7.1
+                * "Accessing PSTATE fields":
+                *   Writes to the PSTATE fields have side-effects on
+                *   various aspects of the PE operation. All of these
+                *   side-effects are guaranteed:
+                *     - Not to be visible to earlier instructions in
+                *       the execution stream.
+                *     - To be visible to later instructions in the
+                *       execution stream
+                *
+                * Also, writes to PMR are self-synchronizing, so no
+                * interrupts with a lower priority than PMR is signaled
+                * to the PE after the write.
+                *
+                * So we don't need additional synchronization here.
+                */
+               gic_write_pmr(pmr);
        }
 
        write_sysreg(flags, daif);
 
  */
 static inline unsigned long arch_local_save_flags(void)
 {
-       unsigned long daif_bits;
        unsigned long flags;
 
-       daif_bits = read_sysreg(daif);
-
-       /*
-        * The asm is logically equivalent to:
-        *
-        * if (system_uses_irq_prio_masking())
-        *      flags = (daif_bits & PSR_I_BIT) ?
-        *                      GIC_PRIO_IRQOFF :
-        *                      read_sysreg_s(SYS_ICC_PMR_EL1);
-        * else
-        *      flags = daif_bits;
-        */
        asm volatile(ALTERNATIVE(
-                       "mov    %0, %1\n"
-                       "nop\n"
-                       "nop",
-                       __mrs_s("%0", SYS_ICC_PMR_EL1)
-                       "ands   %1, %1, " __stringify(PSR_I_BIT) "\n"
-                       "csel   %0, %0, %2, eq",
-                       ARM64_HAS_IRQ_PRIO_MASKING)
-               : "=&r" (flags), "+r" (daif_bits)
-               : "r" ((unsigned long) GIC_PRIO_IRQOFF)
-               : "cc", "memory");
+               "mrs    %0, daif",
+               __mrs_s("%0", SYS_ICC_PMR_EL1),
+               ARM64_HAS_IRQ_PRIO_MASKING)
+               : "=&r" (flags)
+               :
+               : "memory");
 
        return flags;
 }
 
+static inline int arch_irqs_disabled_flags(unsigned long flags)
+{
+       int res;
+
+       asm volatile(ALTERNATIVE(
+               "and    %w0, %w1, #" __stringify(PSR_I_BIT),
+               "eor    %w0, %w1, #" __stringify(GIC_PRIO_IRQON),
+               ARM64_HAS_IRQ_PRIO_MASKING)
+               : "=&r" (res)
+               : "r" ((int) flags)
+               : "memory");
+
+       return res;
+}
+
 static inline unsigned long arch_local_irq_save(void)
 {
        unsigned long flags;
 
        flags = arch_local_save_flags();
 
-       arch_local_irq_disable();
+       /*
+        * There are too many states with IRQs disabled, just keep the current
+        * state if interrupts are already disabled/masked.
+        */
+       if (!arch_irqs_disabled_flags(flags))
+               arch_local_irq_disable();
 
        return flags;
 }
                : "memory");
 }
 
-static inline int arch_irqs_disabled_flags(unsigned long flags)
-{
-       int res;
-
-       asm volatile(ALTERNATIVE(
-                       "and    %w0, %w1, #" __stringify(PSR_I_BIT) "\n"
-                       "nop",
-                       "cmp    %w1, #" __stringify(GIC_PRIO_IRQOFF) "\n"
-                       "cset   %w0, ls",
-                       ARM64_HAS_IRQ_PRIO_MASKING)
-               : "=&r" (res)
-               : "r" ((int) flags)
-               : "cc", "memory");
-
-       return res;
-}
 #endif
 #endif
 
         * will not signal the CPU of interrupts of lower priority, and the
         * only way to get out will be via guest exceptions.
         * Naturally, we want to avoid this.
+        *
+        * local_daif_mask() already sets GIC_PRIO_PSR_I_SET, we just need a
+        * dsb to ensure the redistributor is forwards EL2 IRQs to the CPU.
         */
-       if (system_uses_irq_prio_masking()) {
-               gic_write_pmr(GIC_PRIO_IRQON);
+       if (system_uses_irq_prio_masking())
                dsb(sy);
-       }
 }
 
 static inline void kvm_arm_vhe_guest_exit(void)
 
  * means masking more IRQs (or at least that the same IRQs remain masked).
  *
  * To mask interrupts, we clear the most significant bit of PMR.
+ *
+ * Some code sections either automatically switch back to PSR.I or explicitly
+ * require to not use priority masking. If bit GIC_PRIO_PSR_I_SET is included
+ * in the  the priority mask, it indicates that PSR.I should be set and
+ * interrupt disabling temporarily does not rely on IRQ priorities.
  */
-#define GIC_PRIO_IRQON         0xf0
-#define GIC_PRIO_IRQOFF                (GIC_PRIO_IRQON & ~0x80)
+#define GIC_PRIO_IRQON                 0xc0
+#define GIC_PRIO_IRQOFF                        (GIC_PRIO_IRQON & ~0x80)
+#define GIC_PRIO_PSR_I_SET             (1 << 4)
 
 /* Additional SPSR bits not exposed in the UABI */
 #define PSR_IL_BIT             (1 << 20)
 
        /*
         * Registers that may be useful after this macro is invoked:
         *
+        * x20 - ICC_PMR_EL1
         * x21 - aborted SP
         * x22 - aborted PC
         * x23 - aborted PSTATE
        .endm
 #endif
 
+       .macro  gic_prio_kentry_setup, tmp:req
+#ifdef CONFIG_ARM64_PSEUDO_NMI
+       alternative_if ARM64_HAS_IRQ_PRIO_MASKING
+       mov     \tmp, #(GIC_PRIO_PSR_I_SET | GIC_PRIO_IRQON)
+       msr_s   SYS_ICC_PMR_EL1, \tmp
+       alternative_else_nop_endif
+#endif
+       .endm
+
+       .macro  gic_prio_irq_setup, pmr:req, tmp:req
+#ifdef CONFIG_ARM64_PSEUDO_NMI
+       alternative_if ARM64_HAS_IRQ_PRIO_MASKING
+       orr     \tmp, \pmr, #GIC_PRIO_PSR_I_SET
+       msr_s   SYS_ICC_PMR_EL1, \tmp
+       alternative_else_nop_endif
+#endif
+       .endm
+
        .text
 
 /*
        cmp     x24, #ESR_ELx_EC_BRK64          // if BRK64
        cinc    x24, x24, eq                    // set bit '0'
        tbz     x24, #0, el1_inv                // EL1 only
+       gic_prio_kentry_setup tmp=x3
        mrs     x0, far_el1
        mov     x2, sp                          // struct pt_regs
        bl      do_debug_exception
        .align  6
 el1_irq:
        kernel_entry 1
+       gic_prio_irq_setup pmr=x20, tmp=x1
        enable_da_f
 
 #ifdef CONFIG_ARM64_PSEUDO_NMI
-alternative_if ARM64_HAS_IRQ_PRIO_MASKING
-       ldr     x20, [sp, #S_PMR_SAVE]
-alternative_else_nop_endif
        test_irqs_unmasked      res=x0, pmr=x20
        cbz     x0, 1f
        bl      asm_nmi_enter
 
 #ifdef CONFIG_ARM64_PSEUDO_NMI
        /*
-        * if IRQs were disabled when we received the interrupt, we have an NMI
-        * and we are not re-enabling interrupt upon eret. Skip tracing.
+        * When using IRQ priority masking, we can get spurious interrupts while
+        * PMR is set to GIC_PRIO_IRQOFF. An NMI might also have occurred in a
+        * section with interrupts disabled. Skip tracing in those cases.
         */
        test_irqs_unmasked      res=x0, pmr=x20
        cbz     x0, 1f
         * Instruction abort handling
         */
        mrs     x26, far_el1
+       gic_prio_kentry_setup tmp=x0
        enable_da_f
 #ifdef CONFIG_TRACE_IRQFLAGS
        bl      trace_hardirqs_off
         * Stack or PC alignment exception handling
         */
        mrs     x26, far_el1
+       gic_prio_kentry_setup tmp=x0
        enable_da_f
 #ifdef CONFIG_TRACE_IRQFLAGS
        bl      trace_hardirqs_off
         * Debug exception handling
         */
        tbnz    x24, #0, el0_inv                // EL0 only
+       gic_prio_kentry_setup tmp=x3
        mrs     x0, far_el1
        mov     x1, x25
        mov     x2, sp
 el0_irq:
        kernel_entry 0
 el0_irq_naked:
+       gic_prio_irq_setup pmr=x20, tmp=x0
        enable_da_f
+
 #ifdef CONFIG_TRACE_IRQFLAGS
        bl      trace_hardirqs_off
 #endif
 el1_error:
        kernel_entry 1
        mrs     x1, esr_el1
+       gic_prio_kentry_setup tmp=x2
        enable_dbg
        mov     x0, sp
        bl      do_serror
        kernel_entry 0
 el0_error_naked:
        mrs     x1, esr_el1
+       gic_prio_kentry_setup tmp=x2
        enable_dbg
        mov     x0, sp
        bl      do_serror
  */
 ret_to_user:
        disable_daif
+       gic_prio_kentry_setup tmp=x3
        ldr     x1, [tsk, #TSK_TI_FLAGS]
        and     x2, x1, #_TIF_WORK_MASK
        cbnz    x2, work_pending
  */
        .align  6
 el0_svc:
+       gic_prio_kentry_setup tmp=x1
        mov     x0, sp
        bl      el0_svc_handler
        b       ret_to_user
 
         * be raised.
         */
        pmr = gic_read_pmr();
-       gic_write_pmr(GIC_PRIO_IRQON);
+       gic_write_pmr(GIC_PRIO_IRQON | GIC_PRIO_PSR_I_SET);
 
        __cpu_do_idle();
 
 
 
        WARN_ON(!(cpuflags & PSR_I_BIT));
 
-       gic_write_pmr(GIC_PRIO_IRQOFF);
-
        /* We can only unmask PSR.I if we can take aborts */
-       if (!(cpuflags & PSR_A_BIT))
+       if (!(cpuflags & PSR_A_BIT)) {
+               gic_write_pmr(GIC_PRIO_IRQOFF);
                write_sysreg(cpuflags & ~PSR_I_BIT, daif);
+       } else {
+               gic_write_pmr(GIC_PRIO_IRQON | GIC_PRIO_PSR_I_SET);
+       }
 }
 
 /*
 
         * Naturally, we want to avoid this.
         */
        if (system_uses_irq_prio_masking()) {
-               gic_write_pmr(GIC_PRIO_IRQON);
+               gic_write_pmr(GIC_PRIO_IRQON | GIC_PRIO_PSR_I_SET);
                dsb(sy);
        }