drm/amdgpu: Enable DISABLE_BARRIER_WAITCNT for Arcturus
authorJoseph Greathouse <Joseph.Greathouse@amd.com>
Mon, 27 Jan 2020 22:08:11 +0000 (16:08 -0600)
committerAlex Deucher <alexander.deucher@amd.com>
Thu, 30 Jan 2020 22:15:27 +0000 (17:15 -0500)
In previous gfx9 parts, S_BARRIER shader instructions are implicitly
S_WAITCNT 0 instructions as well. This setting turns off that
mechanism in Arcturus and beyond. With this, shaders must follow the
ISA guide insofar as putting in explicit S_WAITCNT operations even
after an S_BARRIER.

v2: Fix patch title to list component

Signed-off-by: Joseph Greathouse <Joseph.Greathouse@amd.com>
Reviewed-by: Felix Kuehling <Felix.Kuehling@amd.com>
Signed-off-by: Alex Deucher <alexander.deucher@amd.com>
drivers/gpu/drm/amd/amdgpu/gfx_v9_0.c
drivers/gpu/drm/amd/include/asic_reg/gc/gc_9_0_sh_mask.h

index 51ec8a7..90f64b8 100644 (file)
@@ -2441,6 +2441,22 @@ static void gfx_v9_0_init_gds_vmid(struct amdgpu_device *adev)
        }
 }
 
+static void gfx_v9_0_init_sq_config(struct amdgpu_device *adev)
+{
+       uint32_t tmp;
+
+       switch (adev->asic_type) {
+       case CHIP_ARCTURUS:
+               tmp = RREG32_SOC15(GC, 0, mmSQ_CONFIG);
+               tmp = REG_SET_FIELD(tmp, SQ_CONFIG,
+                                       DISABLE_BARRIER_WAITCNT, 1);
+               WREG32_SOC15(GC, 0, mmSQ_CONFIG, tmp);
+               break;
+       default:
+               break;
+       };
+}
+
 static void gfx_v9_0_constants_init(struct amdgpu_device *adev)
 {
        u32 tmp;
@@ -2486,6 +2502,7 @@ static void gfx_v9_0_constants_init(struct amdgpu_device *adev)
 
        gfx_v9_0_init_compute_vmid(adev);
        gfx_v9_0_init_gds_vmid(adev);
+       gfx_v9_0_init_sq_config(adev);
 }
 
 static void gfx_v9_0_wait_for_rlc_serdes(struct amdgpu_device *adev)
index c9e3f6d..ea316d8 100644 (file)
 
 // addressBlock: gc_sqdec
 //SQ_CONFIG
-#define SQ_CONFIG__UNUSED__SHIFT                                                                              0x0
+#define SQ_CONFIG__DISABLE_BARRIER_WAITCNT__SHIFT                                                             0x0
+#define SQ_CONFIG__UNUSED__SHIFT                                                                              0x1
 #define SQ_CONFIG__OVERRIDE_ALU_BUSY__SHIFT                                                                   0x7
 #define SQ_CONFIG__DEBUG_EN__SHIFT                                                                            0x8
 #define SQ_CONFIG__DEBUG_SINGLE_MEMOP__SHIFT                                                                  0x9
 #define SQ_CONFIG__DISABLE_SP_REDUNDANT_THREAD_GATING__SHIFT                                                  0x1d
 #define SQ_CONFIG__DISABLE_FLAT_SOFT_CLAUSE__SHIFT                                                            0x1e
 #define SQ_CONFIG__DISABLE_MIMG_SOFT_CLAUSE__SHIFT                                                            0x1f
-#define SQ_CONFIG__UNUSED_MASK                                                                                0x0000007FL
+#define SQ_CONFIG__DISABLE_BARRIER_WAITCNT_MASK                                                               0x00000001L
+#define SQ_CONFIG__UNUSED_MASK                                                                                0x0000007EL
 #define SQ_CONFIG__OVERRIDE_ALU_BUSY_MASK                                                                     0x00000080L
 #define SQ_CONFIG__DEBUG_EN_MASK                                                                              0x00000100L
 #define SQ_CONFIG__DEBUG_SINGLE_MEMOP_MASK                                                                    0x00000200L