From: Daniele Ceraolo Spurio <daniele.ceraolospu...@intel.com>

CCS re-uses the RCS functions for breadcrumb and flush emission.
However, CCS pipe_control has additional programming restrictions:

- Command Streamer Stall Enable must be always set
- Post Sync Operations must not be set to Write PS Depth Count
- 3D-related bits must not be set

Bspec: 47112
Cc: Vinay Belgaumkar <vinay.belgaum...@intel.com>
Signed-off-by: Daniele Ceraolo Spurio <daniele.ceraolospu...@intel.com>
Signed-off-by: Aravind Iddamsetty <aravind.iddamse...@intel.com>
Signed-off-by: Matt Roper <matthew.d.ro...@intel.com>
---
 drivers/gpu/drm/i915/gt/gen8_engine_cs.c     | 31 ++++++++++++++------
 drivers/gpu/drm/i915/gt/intel_gpu_commands.h | 15 ++++++++++
 2 files changed, 37 insertions(+), 9 deletions(-)

diff --git a/drivers/gpu/drm/i915/gt/gen8_engine_cs.c 
b/drivers/gpu/drm/i915/gt/gen8_engine_cs.c
index 461844dffd7e..bf79e5ee3e45 100644
--- a/drivers/gpu/drm/i915/gt/gen8_engine_cs.c
+++ b/drivers/gpu/drm/i915/gt/gen8_engine_cs.c
@@ -200,6 +200,8 @@ static u32 *gen12_emit_aux_table_inv(const i915_reg_t 
inv_reg, u32 *cs)
 
 int gen12_emit_flush_rcs(struct i915_request *rq, u32 mode)
 {
+       struct intel_engine_cs *engine = rq->engine;
+
        if (mode & EMIT_FLUSH) {
                u32 flags = 0;
                u32 *cs;
@@ -218,6 +220,9 @@ int gen12_emit_flush_rcs(struct i915_request *rq, u32 mode)
 
                flags |= PIPE_CONTROL_CS_STALL;
 
+               if (engine->class == COMPUTE_CLASS)
+                       flags &= ~PIPE_CONTROL_RENDER_ONLY_FLAGS;
+
                cs = intel_ring_begin(rq, 6);
                if (IS_ERR(cs))
                        return PTR_ERR(cs);
@@ -245,6 +250,9 @@ int gen12_emit_flush_rcs(struct i915_request *rq, u32 mode)
 
                flags |= PIPE_CONTROL_CS_STALL;
 
+               if (engine->class == COMPUTE_CLASS)
+                       flags &= ~PIPE_CONTROL_RENDER_ONLY_FLAGS;
+
                cs = intel_ring_begin(rq, 8 + 4);
                if (IS_ERR(cs))
                        return PTR_ERR(cs);
@@ -617,19 +625,24 @@ u32 *gen12_emit_fini_breadcrumb_xcs(struct i915_request 
*rq, u32 *cs)
 
 u32 *gen12_emit_fini_breadcrumb_rcs(struct i915_request *rq, u32 *cs)
 {
+       u32 flags = (PIPE_CONTROL_CS_STALL |
+                    PIPE_CONTROL_TILE_CACHE_FLUSH |
+                    PIPE_CONTROL_FLUSH_L3 |
+                    PIPE_CONTROL_RENDER_TARGET_CACHE_FLUSH |
+                    PIPE_CONTROL_DEPTH_CACHE_FLUSH |
+                    /* Wa_1409600907:tgl,rkl,dg1,adl-p */
+                    PIPE_CONTROL_DEPTH_STALL |
+                    PIPE_CONTROL_DC_FLUSH_ENABLE |
+                    PIPE_CONTROL_FLUSH_ENABLE);
+
+       if (rq->engine->class == COMPUTE_CLASS)
+               flags &= ~PIPE_CONTROL_RENDER_ONLY_FLAGS;
+
        cs = gen12_emit_ggtt_write_rcs(cs,
                                       rq->fence.seqno,
                                       hwsp_offset(rq),
                                       PIPE_CONTROL0_HDC_PIPELINE_FLUSH,
-                                      PIPE_CONTROL_CS_STALL |
-                                      PIPE_CONTROL_TILE_CACHE_FLUSH |
-                                      PIPE_CONTROL_FLUSH_L3 |
-                                      PIPE_CONTROL_RENDER_TARGET_CACHE_FLUSH |
-                                      PIPE_CONTROL_DEPTH_CACHE_FLUSH |
-                                      /* Wa_1409600907:tgl */
-                                      PIPE_CONTROL_DEPTH_STALL |
-                                      PIPE_CONTROL_DC_FLUSH_ENABLE |
-                                      PIPE_CONTROL_FLUSH_ENABLE);
+                                      flags);
 
        return gen12_emit_fini_breadcrumb_tail(rq, cs);
 }
diff --git a/drivers/gpu/drm/i915/gt/intel_gpu_commands.h 
b/drivers/gpu/drm/i915/gt/intel_gpu_commands.h
index 1c3af0fc0456..a3c1047a2c71 100644
--- a/drivers/gpu/drm/i915/gt/intel_gpu_commands.h
+++ b/drivers/gpu/drm/i915/gt/intel_gpu_commands.h
@@ -223,11 +223,14 @@
 #define   PIPE_CONTROL_COMMAND_CACHE_INVALIDATE                (1<<29) /* 
gen11+ */
 #define   PIPE_CONTROL_TILE_CACHE_FLUSH                        (1<<28) /* 
gen11+ */
 #define   PIPE_CONTROL_FLUSH_L3                                (1<<27)
+#define   PIPE_CONTROL_AMFS_FLUSH                      (1<<25) /* gen12+ */
 #define   PIPE_CONTROL_GLOBAL_GTT_IVB                  (1<<24) /* gen7+ */
 #define   PIPE_CONTROL_MMIO_WRITE                      (1<<23)
 #define   PIPE_CONTROL_STORE_DATA_INDEX                        (1<<21)
 #define   PIPE_CONTROL_CS_STALL                                (1<<20)
+#define   PIPE_CONTROL_GLOBAL_SNAPSHOT_RESET           (1<<19)
 #define   PIPE_CONTROL_TLB_INVALIDATE                  (1<<18)
+#define   PIPE_CONTROL_PSD_SYNC                                (1<<17) /* 
gen11+ */
 #define   PIPE_CONTROL_MEDIA_STATE_CLEAR               (1<<16)
 #define   PIPE_CONTROL_WRITE_TIMESTAMP                 (3<<14)
 #define   PIPE_CONTROL_QW_WRITE                                (1<<14)
@@ -249,6 +252,18 @@
 #define   PIPE_CONTROL_DEPTH_CACHE_FLUSH               (1<<0)
 #define   PIPE_CONTROL_GLOBAL_GTT (1<<2) /* in addr dword */
 
+/* 3D-related flags can't be set on compute engine */
+#define PIPE_CONTROL_RENDER_ONLY_FLAGS (\
+               PIPE_CONTROL_RENDER_TARGET_CACHE_FLUSH | \
+               PIPE_CONTROL_DEPTH_CACHE_FLUSH | \
+               PIPE_CONTROL_TILE_CACHE_FLUSH | \
+               PIPE_CONTROL_DEPTH_STALL | \
+               PIPE_CONTROL_STALL_AT_SCOREBOARD | \
+               PIPE_CONTROL_PSD_SYNC | \
+               PIPE_CONTROL_AMFS_FLUSH | \
+               PIPE_CONTROL_VF_CACHE_INVALIDATE | \
+               PIPE_CONTROL_GLOBAL_SNAPSHOT_RESET)
+
 #define MI_MATH(x)                     MI_INSTR(0x1a, (x) - 1)
 #define MI_MATH_INSTR(opcode, op1, op2) ((opcode) << 20 | (op1) << 10 | (op2))
 /* Opcodes for MI_MATH_INSTR */
-- 
2.25.4

Reply via email to