www.infradead.org Git - users/hch/misc.git/commitdiff
drm/amdgpu/gfx11: Implement cleaner shader support for GFX11 hardware
author Srinivasan Shanmugam <srinivasan.shanmugam@amd.com>
Thu, 3 Oct 2024 10:13:14 +0000 (15:43 +0530)
committer Alex Deucher <alexander.deucher@amd.com>
Mon, 7 Oct 2024 18:08:56 +0000 (14:08 -0400)
The patch modifies the gfx11_kiq_set_resources function to write the
cleaner shader's memory controller (MC) address, shifted right by 8
bits, to the ring buffer in place of the two previously zeroed GWS mask
dwords. It also adds a new function, gfx_v11_0_ring_emit_cleaner_shader,
which emits the PACKET3_RUN_CLEANER_SHADER packet to the ring buffer.

This patch adds support for the PACKET3_RUN_CLEANER_SHADER packet in the
gfx_v11_0 module. This packet is used to run the cleaner shader, which
clears GPU memory before it is reused, helping to prevent data leakage
between different processes.

Finally, the patch updates the ring function structures to include the
new gfx_v11_0_ring_emit_cleaner_shader function. This allows the
cleaner shader to be emitted as part of the ring's operations.

Cc: Christian König <christian.koenig@amd.com>
Cc: Alex Deucher <alexander.deucher@amd.com>
Signed-off-by: Srinivasan Shanmugam <srinivasan.shanmugam@amd.com>
Reviewed-by: Alex Deucher <alexander.deucher@amd.com>
Signed-off-by: Alex Deucher <alexander.deucher@amd.com>
drivers/gpu/drm/amd/amdgpu/gfx_v11_0.c

index 6b22128ab004b9f7056344f47464bc12385b7cc3..c78a63da8d2ee01be3271ad95b8db61625bd62e4 100644 (file)
@@ -293,14 +293,20 @@ static void gfx_v11_0_update_perf_clk(struct amdgpu_device *adev,
 
 static void gfx11_kiq_set_resources(struct amdgpu_ring *kiq_ring, uint64_t queue_mask)
 {
+       struct amdgpu_device *adev = kiq_ring->adev;
+       u64 shader_mc_addr;
+
+       /* Cleaner shader MC address */
+       shader_mc_addr = adev->gfx.cleaner_shader_gpu_addr >> 8;
+
        amdgpu_ring_write(kiq_ring, PACKET3(PACKET3_SET_RESOURCES, 6));
        amdgpu_ring_write(kiq_ring, PACKET3_SET_RESOURCES_VMID_MASK(0) |
                          PACKET3_SET_RESOURCES_UNMAP_LATENTY(0xa) | /* unmap_latency: 0xa (~ 1s) */
                          PACKET3_SET_RESOURCES_QUEUE_TYPE(0)); /* vmid_mask:0 queue_type:0 (KIQ) */
        amdgpu_ring_write(kiq_ring, lower_32_bits(queue_mask)); /* queue mask lo */
        amdgpu_ring_write(kiq_ring, upper_32_bits(queue_mask)); /* queue mask hi */
-       amdgpu_ring_write(kiq_ring, 0); /* gws mask lo */
-       amdgpu_ring_write(kiq_ring, 0); /* gws mask hi */
+       amdgpu_ring_write(kiq_ring, lower_32_bits(shader_mc_addr)); /* cleaner shader addr lo */
+       amdgpu_ring_write(kiq_ring, upper_32_bits(shader_mc_addr)); /* cleaner shader addr hi */
        amdgpu_ring_write(kiq_ring, 0); /* oac mask */
        amdgpu_ring_write(kiq_ring, 0); /* gds heap base:0, gds heap size:0 */
 }
@@ -1575,6 +1581,11 @@ static int gfx_v11_0_sw_init(struct amdgpu_ip_block *ip_block)
                break;
        }
 
+       switch (amdgpu_ip_version(adev, GC_HWIP, 0)) {
+       default:
+               adev->gfx.enable_cleaner_shader = false;
+       }
+
        /* Enable CG flag in one VF mode for enabling RLC safe mode enter/exit */
        if (amdgpu_ip_version(adev, GC_HWIP, 0) == IP_VERSION(11, 0, 3) &&
            amdgpu_sriov_is_pp_one_vf(adev))
@@ -1700,6 +1711,10 @@ static int gfx_v11_0_sw_init(struct amdgpu_ip_block *ip_block)
 
        gfx_v11_0_alloc_ip_dump(adev);
 
+       r = amdgpu_gfx_sysfs_isolation_shader_init(adev);
+       if (r)
+               return r;
+
        return 0;
 }
 
@@ -1749,6 +1764,8 @@ static int gfx_v11_0_sw_fini(struct amdgpu_ip_block *ip_block)
                amdgpu_gfx_kiq_fini(adev, 0);
        }
 
+       amdgpu_gfx_cleaner_shader_sw_fini(adev);
+
        gfx_v11_0_pfp_fini(adev);
        gfx_v11_0_me_fini(adev);
        gfx_v11_0_rlc_fini(adev);
@@ -1759,6 +1776,8 @@ static int gfx_v11_0_sw_fini(struct amdgpu_ip_block *ip_block)
 
        gfx_v11_0_free_microcode(adev);
 
+       amdgpu_gfx_sysfs_isolation_shader_fini(adev);
+
        kfree(adev->gfx.ip_dump_core);
        kfree(adev->gfx.ip_dump_compute_queues);
        kfree(adev->gfx.ip_dump_gfx_queues);
@@ -4575,6 +4594,9 @@ static int gfx_v11_0_hw_init(struct amdgpu_ip_block *ip_block)
        int r;
        struct amdgpu_device *adev = ip_block->adev;
 
+       amdgpu_gfx_cleaner_shader_init(adev, adev->gfx.cleaner_shader_size,
+                                      adev->gfx.cleaner_shader_ptr);
+
        if (adev->firmware.load_type == AMDGPU_FW_LOAD_RLC_BACKDOOR_AUTO) {
                if (adev->gfx.imu.funcs) {
                        /* RLC autoload sequence 1: Program rlc ram */
@@ -6772,6 +6794,13 @@ static void gfx_v11_ip_dump(struct amdgpu_ip_block *ip_block)
        amdgpu_gfx_off_ctrl(adev, true);
 }
 
+static void gfx_v11_0_ring_emit_cleaner_shader(struct amdgpu_ring *ring)
+{
+       /* Emit the cleaner shader */
+       amdgpu_ring_write(ring, PACKET3(PACKET3_RUN_CLEANER_SHADER, 0));
+       amdgpu_ring_write(ring, 0);  /* RESERVED field, programmed to zero */
+}
+
 static const struct amd_ip_funcs gfx_v11_0_ip_funcs = {
        .name = "gfx_v11_0",
        .early_init = gfx_v11_0_early_init,
@@ -6821,7 +6850,8 @@ static const struct amdgpu_ring_funcs gfx_v11_0_ring_funcs_gfx = {
                5 + /* HDP_INVL */
                22 + /* SET_Q_PREEMPTION_MODE */
                8 + 8 + /* FENCE x2 */
-               8, /* gfx_v11_0_emit_mem_sync */
+               8 + /* gfx_v11_0_emit_mem_sync */
+               2, /* gfx_v11_0_ring_emit_cleaner_shader */
        .emit_ib_size = 4, /* gfx_v11_0_ring_emit_ib_gfx */
        .emit_ib = gfx_v11_0_ring_emit_ib_gfx,
        .emit_fence = gfx_v11_0_ring_emit_fence,
@@ -6844,6 +6874,7 @@ static const struct amdgpu_ring_funcs gfx_v11_0_ring_funcs_gfx = {
        .soft_recovery = gfx_v11_0_ring_soft_recovery,
        .emit_mem_sync = gfx_v11_0_emit_mem_sync,
        .reset = gfx_v11_0_reset_kgq,
+       .emit_cleaner_shader = gfx_v11_0_ring_emit_cleaner_shader,
 };
 
 static const struct amdgpu_ring_funcs gfx_v11_0_ring_funcs_compute = {
@@ -6864,7 +6895,8 @@ static const struct amdgpu_ring_funcs gfx_v11_0_ring_funcs_compute = {
                SOC15_FLUSH_GPU_TLB_NUM_REG_WAIT * 7 +
                2 + /* gfx_v11_0_ring_emit_vm_flush */
                8 + 8 + 8 + /* gfx_v11_0_ring_emit_fence x3 for user fence, vm fence */
-               8, /* gfx_v11_0_emit_mem_sync */
+               8 + /* gfx_v11_0_emit_mem_sync */
+               2, /* gfx_v11_0_ring_emit_cleaner_shader */
        .emit_ib_size = 7, /* gfx_v11_0_ring_emit_ib_compute */
        .emit_ib = gfx_v11_0_ring_emit_ib_compute,
        .emit_fence = gfx_v11_0_ring_emit_fence,
@@ -6882,6 +6914,7 @@ static const struct amdgpu_ring_funcs gfx_v11_0_ring_funcs_compute = {
        .soft_recovery = gfx_v11_0_ring_soft_recovery,
        .emit_mem_sync = gfx_v11_0_emit_mem_sync,
        .reset = gfx_v11_0_reset_kcq,
+       .emit_cleaner_shader = gfx_v11_0_ring_emit_cleaner_shader,
 };
 
 static const struct amdgpu_ring_funcs gfx_v11_0_ring_funcs_kiq = {