The gfxv7 contains a slightly different version of cik_mqd called
bonaire_mqd. This can introduce subtle bugs if fixes are not applied in
both places.

Reviewed-by: Edward O'Callaghan <funfunc...@folklore1984.net>
Acked-by: Christian König <christian.koe...@amd.com>
Acked-by: Felix Kuehling <felix.kuehl...@amd.com>
Signed-off-by: Andres Rodriguez <andre...@gmail.com>
---
 drivers/gpu/drm/amd/amdgpu/gfx_v7_0.c | 135 ++++++++++++++--------------------
 1 file changed, 54 insertions(+), 81 deletions(-)

diff --git a/drivers/gpu/drm/amd/amdgpu/gfx_v7_0.c 
b/drivers/gpu/drm/amd/amdgpu/gfx_v7_0.c
index 4e6a60c..c408af5 100644
--- a/drivers/gpu/drm/amd/amdgpu/gfx_v7_0.c
+++ b/drivers/gpu/drm/amd/amdgpu/gfx_v7_0.c
@@ -10,40 +10,41 @@
  *
  * The above copyright notice and this permission notice shall be included in
  * all copies or substantial portions of the Software.
  *
  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
  * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
  * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
  * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
  * OTHER DEALINGS IN THE SOFTWARE.
  *
  */
 #include <linux/firmware.h>
 #include "drmP.h"
 #include "amdgpu.h"
 #include "amdgpu_ih.h"
 #include "amdgpu_gfx.h"
 #include "cikd.h"
 #include "cik.h"
+#include "cik_structs.h"
 #include "atom.h"
 #include "amdgpu_ucode.h"
 #include "clearstate_ci.h"
 
 #include "dce/dce_8_0_d.h"
 #include "dce/dce_8_0_sh_mask.h"
 
 #include "bif/bif_4_1_d.h"
 #include "bif/bif_4_1_sh_mask.h"
 
 #include "gca/gfx_7_0_d.h"
 #include "gca/gfx_7_2_enum.h"
 #include "gca/gfx_7_2_sh_mask.h"
 
 #include "gmc/gmc_7_0_d.h"
 #include "gmc/gmc_7_0_sh_mask.h"
 
 #include "oss/oss_2_0_d.h"
 #include "oss/oss_2_0_sh_mask.h"
 
@@ -2899,68 +2900,40 @@ struct hqd_registers
        u32 cp_hqd_pq_control;
        u32 cp_hqd_ib_base_addr;
        u32 cp_hqd_ib_base_addr_hi;
        u32 cp_hqd_ib_rptr;
        u32 cp_hqd_ib_control;
        u32 cp_hqd_iq_timer;
        u32 cp_hqd_iq_rptr;
        u32 cp_hqd_dequeue_request;
        u32 cp_hqd_dma_offload;
        u32 cp_hqd_sema_cmd;
        u32 cp_hqd_msg_type;
        u32 cp_hqd_atomic0_preop_lo;
        u32 cp_hqd_atomic0_preop_hi;
        u32 cp_hqd_atomic1_preop_lo;
        u32 cp_hqd_atomic1_preop_hi;
        u32 cp_hqd_hq_scheduler0;
        u32 cp_hqd_hq_scheduler1;
        u32 cp_mqd_control;
 };
 
-struct bonaire_mqd
-{
-       u32 header;
-       u32 dispatch_initiator;
-       u32 dimensions[3];
-       u32 start_idx[3];
-       u32 num_threads[3];
-       u32 pipeline_stat_enable;
-       u32 perf_counter_enable;
-       u32 pgm[2];
-       u32 tba[2];
-       u32 tma[2];
-       u32 pgm_rsrc[2];
-       u32 vmid;
-       u32 resource_limits;
-       u32 static_thread_mgmt01[2];
-       u32 tmp_ring_size;
-       u32 static_thread_mgmt23[2];
-       u32 restart[3];
-       u32 thread_trace_enable;
-       u32 reserved1;
-       u32 user_data[16];
-       u32 vgtcs_invoke_count[2];
-       struct hqd_registers queue_state;
-       u32 dequeue_cntr;
-       u32 interrupt_queue[64];
-};
-
 static void gfx_v7_0_compute_pipe_init(struct amdgpu_device *adev, int me, int 
pipe)
 {
        u64 eop_gpu_addr;
        u32 tmp;
        size_t eop_offset = me * pipe * GFX7_MEC_HPD_SIZE * 2;
 
        mutex_lock(&adev->srbm_mutex);
        eop_gpu_addr = adev->gfx.mec.hpd_eop_gpu_addr + eop_offset;
 
        cik_srbm_select(adev, me, pipe, 0, 0);
 
        /* write the EOP addr */
        WREG32(mmCP_HPD_EOP_BASE_ADDR, eop_gpu_addr >> 8);
        WREG32(mmCP_HPD_EOP_BASE_ADDR_HI, upper_32_bits(eop_gpu_addr) >> 8);
 
        /* set the VMID assigned */
        WREG32(mmCP_HPD_EOP_VMID, 0);
 
        /* set the EOP size, register value is 2^(EOP_SIZE+1) dwords */
        tmp = RREG32(mmCP_HPD_EOP_CONTROL);
@@ -2980,182 +2953,182 @@ static int gfx_v7_0_mqd_deactivate(struct 
amdgpu_device *adev)
        if (RREG32(mmCP_HQD_ACTIVE) & 1) {
                WREG32(mmCP_HQD_DEQUEUE_REQUEST, 1);
                for (i = 0; i < adev->usec_timeout; i++) {
                        if (!(RREG32(mmCP_HQD_ACTIVE) & 1))
                                break;
                        udelay(1);
                }
 
                if (i == adev->usec_timeout)
                        return -ETIMEDOUT;
 
                WREG32(mmCP_HQD_DEQUEUE_REQUEST, 0);
                WREG32(mmCP_HQD_PQ_RPTR, 0);
                WREG32(mmCP_HQD_PQ_WPTR, 0);
        }
 
        return 0;
 }
 
 static void gfx_v7_0_mqd_init(struct amdgpu_device *adev,
-                            struct bonaire_mqd *mqd,
+                            struct cik_mqd *mqd,
                             uint64_t mqd_gpu_addr,
                             struct amdgpu_ring *ring)
 {
        u64 hqd_gpu_addr;
        u64 wb_gpu_addr;
 
        /* init the mqd struct */
-       memset(mqd, 0, sizeof(struct bonaire_mqd));
+       memset(mqd, 0, sizeof(struct cik_mqd));
 
        mqd->header = 0xC0310800;
-       mqd->static_thread_mgmt01[0] = 0xffffffff;
-       mqd->static_thread_mgmt01[1] = 0xffffffff;
-       mqd->static_thread_mgmt23[0] = 0xffffffff;
-       mqd->static_thread_mgmt23[1] = 0xffffffff;
+       mqd->compute_static_thread_mgmt_se0 = 0xffffffff;
+       mqd->compute_static_thread_mgmt_se1 = 0xffffffff;
+       mqd->compute_static_thread_mgmt_se2 = 0xffffffff;
+       mqd->compute_static_thread_mgmt_se3 = 0xffffffff;
 
        /* enable doorbell? */
-       mqd->queue_state.cp_hqd_pq_doorbell_control =
+       mqd->cp_hqd_pq_doorbell_control =
                RREG32(mmCP_HQD_PQ_DOORBELL_CONTROL);
        if (ring->use_doorbell)
-               mqd->queue_state.cp_hqd_pq_doorbell_control |= 
CP_HQD_PQ_DOORBELL_CONTROL__DOORBELL_EN_MASK;
+               mqd->cp_hqd_pq_doorbell_control |= 
CP_HQD_PQ_DOORBELL_CONTROL__DOORBELL_EN_MASK;
        else
-               mqd->queue_state.cp_hqd_pq_doorbell_control &= 
~CP_HQD_PQ_DOORBELL_CONTROL__DOORBELL_EN_MASK;
+               mqd->cp_hqd_pq_doorbell_control &= 
~CP_HQD_PQ_DOORBELL_CONTROL__DOORBELL_EN_MASK;
 
        /* set the pointer to the MQD */
-       mqd->queue_state.cp_mqd_base_addr = mqd_gpu_addr & 0xfffffffc;
-       mqd->queue_state.cp_mqd_base_addr_hi = upper_32_bits(mqd_gpu_addr);
+       mqd->cp_mqd_base_addr_lo = mqd_gpu_addr & 0xfffffffc;
+       mqd->cp_mqd_base_addr_hi = upper_32_bits(mqd_gpu_addr);
 
        /* set MQD vmid to 0 */
-       mqd->queue_state.cp_mqd_control = RREG32(mmCP_MQD_CONTROL);
-       mqd->queue_state.cp_mqd_control &= ~CP_MQD_CONTROL__VMID_MASK;
+       mqd->cp_mqd_control = RREG32(mmCP_MQD_CONTROL);
+       mqd->cp_mqd_control &= ~CP_MQD_CONTROL__VMID_MASK;
 
        /* set the pointer to the HQD, this is similar CP_RB0_BASE/_HI */
        hqd_gpu_addr = ring->gpu_addr >> 8;
-       mqd->queue_state.cp_hqd_pq_base = hqd_gpu_addr;
-       mqd->queue_state.cp_hqd_pq_base_hi = upper_32_bits(hqd_gpu_addr);
+       mqd->cp_hqd_pq_base_lo = hqd_gpu_addr;
+       mqd->cp_hqd_pq_base_hi = upper_32_bits(hqd_gpu_addr);
 
        /* set up the HQD, this is similar to CP_RB0_CNTL */
-       mqd->queue_state.cp_hqd_pq_control = RREG32(mmCP_HQD_PQ_CONTROL);
-       mqd->queue_state.cp_hqd_pq_control &=
+       mqd->cp_hqd_pq_control = RREG32(mmCP_HQD_PQ_CONTROL);
+       mqd->cp_hqd_pq_control &=
                ~(CP_HQD_PQ_CONTROL__QUEUE_SIZE_MASK |
                                CP_HQD_PQ_CONTROL__RPTR_BLOCK_SIZE_MASK);
 
-       mqd->queue_state.cp_hqd_pq_control |=
+       mqd->cp_hqd_pq_control |=
                order_base_2(ring->ring_size / 8);
-       mqd->queue_state.cp_hqd_pq_control |=
+       mqd->cp_hqd_pq_control |=
                (order_base_2(AMDGPU_GPU_PAGE_SIZE/8) << 8);
 #ifdef __BIG_ENDIAN
-       mqd->queue_state.cp_hqd_pq_control |=
+       mqd->cp_hqd_pq_control |=
                2 << CP_HQD_PQ_CONTROL__ENDIAN_SWAP__SHIFT;
 #endif
-       mqd->queue_state.cp_hqd_pq_control &=
+       mqd->cp_hqd_pq_control &=
                ~(CP_HQD_PQ_CONTROL__UNORD_DISPATCH_MASK |
                                CP_HQD_PQ_CONTROL__ROQ_PQ_IB_FLIP_MASK |
                                CP_HQD_PQ_CONTROL__PQ_VOLATILE_MASK);
-       mqd->queue_state.cp_hqd_pq_control |=
+       mqd->cp_hqd_pq_control |=
                CP_HQD_PQ_CONTROL__PRIV_STATE_MASK |
                CP_HQD_PQ_CONTROL__KMD_QUEUE_MASK; /* assuming kernel queue 
control */
 
        /* only used if CP_PQ_WPTR_POLL_CNTL.CP_PQ_WPTR_POLL_CNTL__EN_MASK=1 */
        wb_gpu_addr = adev->wb.gpu_addr + (ring->wptr_offs * 4);
-       mqd->queue_state.cp_hqd_pq_wptr_poll_addr = wb_gpu_addr & 0xfffffffc;
-       mqd->queue_state.cp_hqd_pq_wptr_poll_addr_hi = 
upper_32_bits(wb_gpu_addr) & 0xffff;
+       mqd->cp_hqd_pq_wptr_poll_addr_lo = wb_gpu_addr & 0xfffffffc;
+       mqd->cp_hqd_pq_wptr_poll_addr_hi = upper_32_bits(wb_gpu_addr) & 0xffff;
 
        /* set the wb address wether it's enabled or not */
        wb_gpu_addr = adev->wb.gpu_addr + (ring->rptr_offs * 4);
-       mqd->queue_state.cp_hqd_pq_rptr_report_addr = wb_gpu_addr & 0xfffffffc;
-       mqd->queue_state.cp_hqd_pq_rptr_report_addr_hi =
+       mqd->cp_hqd_pq_rptr_report_addr_lo = wb_gpu_addr & 0xfffffffc;
+       mqd->cp_hqd_pq_rptr_report_addr_hi =
                upper_32_bits(wb_gpu_addr) & 0xffff;
 
        /* enable the doorbell if requested */
        if (ring->use_doorbell) {
-               mqd->queue_state.cp_hqd_pq_doorbell_control =
+               mqd->cp_hqd_pq_doorbell_control =
                        RREG32(mmCP_HQD_PQ_DOORBELL_CONTROL);
-               mqd->queue_state.cp_hqd_pq_doorbell_control &=
+               mqd->cp_hqd_pq_doorbell_control &=
                        ~CP_HQD_PQ_DOORBELL_CONTROL__DOORBELL_OFFSET_MASK;
-               mqd->queue_state.cp_hqd_pq_doorbell_control |=
+               mqd->cp_hqd_pq_doorbell_control |=
                        (ring->doorbell_index <<
                         CP_HQD_PQ_DOORBELL_CONTROL__DOORBELL_OFFSET__SHIFT);
-               mqd->queue_state.cp_hqd_pq_doorbell_control |=
+               mqd->cp_hqd_pq_doorbell_control |=
                        CP_HQD_PQ_DOORBELL_CONTROL__DOORBELL_EN_MASK;
-               mqd->queue_state.cp_hqd_pq_doorbell_control &=
+               mqd->cp_hqd_pq_doorbell_control &=
                        ~(CP_HQD_PQ_DOORBELL_CONTROL__DOORBELL_SOURCE_MASK |
                                        
CP_HQD_PQ_DOORBELL_CONTROL__DOORBELL_HIT_MASK);
 
        } else {
-               mqd->queue_state.cp_hqd_pq_doorbell_control = 0;
+               mqd->cp_hqd_pq_doorbell_control = 0;
        }
 
        /* read and write pointers, similar to CP_RB0_WPTR/_RPTR */
        ring->wptr = 0;
-       mqd->queue_state.cp_hqd_pq_wptr = lower_32_bits(ring->wptr);
-       mqd->queue_state.cp_hqd_pq_rptr = RREG32(mmCP_HQD_PQ_RPTR);
+       mqd->cp_hqd_pq_wptr = lower_32_bits(ring->wptr);
+       mqd->cp_hqd_pq_rptr = RREG32(mmCP_HQD_PQ_RPTR);
 
        /* set the vmid for the queue */
-       mqd->queue_state.cp_hqd_vmid = 0;
+       mqd->cp_hqd_vmid = 0;
 
        /* activate the queue */
-       mqd->queue_state.cp_hqd_active = 1;
+       mqd->cp_hqd_active = 1;
 }
 
 static int gfx_v7_0_mqd_commit(struct amdgpu_device *adev,
-                              struct bonaire_mqd *mqd)
+                              struct cik_mqd *mqd)
 {
        u32 tmp;
 
        /* disable wptr polling */
        tmp = RREG32(mmCP_PQ_WPTR_POLL_CNTL);
        tmp = REG_SET_FIELD(tmp, CP_PQ_WPTR_POLL_CNTL, EN, 0);
        WREG32(mmCP_PQ_WPTR_POLL_CNTL, tmp);
 
        /* program MQD field to HW */
-       WREG32(mmCP_MQD_BASE_ADDR, mqd->queue_state.cp_mqd_base_addr);
-       WREG32(mmCP_MQD_BASE_ADDR_HI, mqd->queue_state.cp_mqd_base_addr_hi);
-       WREG32(mmCP_MQD_CONTROL, mqd->queue_state.cp_mqd_control);
-       WREG32(mmCP_HQD_PQ_BASE, mqd->queue_state.cp_hqd_pq_base);
-       WREG32(mmCP_HQD_PQ_BASE_HI, mqd->queue_state.cp_hqd_pq_base_hi);
-       WREG32(mmCP_HQD_PQ_CONTROL, mqd->queue_state.cp_hqd_pq_control);
-       WREG32(mmCP_HQD_PQ_WPTR_POLL_ADDR, 
mqd->queue_state.cp_hqd_pq_wptr_poll_addr);
-       WREG32(mmCP_HQD_PQ_WPTR_POLL_ADDR_HI, 
mqd->queue_state.cp_hqd_pq_wptr_poll_addr_hi);
-       WREG32(mmCP_HQD_PQ_RPTR_REPORT_ADDR, 
mqd->queue_state.cp_hqd_pq_rptr_report_addr);
-       WREG32(mmCP_HQD_PQ_RPTR_REPORT_ADDR_HI, 
mqd->queue_state.cp_hqd_pq_rptr_report_addr_hi);
-       WREG32(mmCP_HQD_PQ_DOORBELL_CONTROL, 
mqd->queue_state.cp_hqd_pq_doorbell_control);
-       WREG32(mmCP_HQD_PQ_WPTR, mqd->queue_state.cp_hqd_pq_wptr);
-       WREG32(mmCP_HQD_VMID, mqd->queue_state.cp_hqd_vmid);
+       WREG32(mmCP_MQD_BASE_ADDR, mqd->cp_mqd_base_addr_lo);
+       WREG32(mmCP_MQD_BASE_ADDR_HI, mqd->cp_mqd_base_addr_hi);
+       WREG32(mmCP_MQD_CONTROL, mqd->cp_mqd_control);
+       WREG32(mmCP_HQD_PQ_BASE, mqd->cp_hqd_pq_base_lo);
+       WREG32(mmCP_HQD_PQ_BASE_HI, mqd->cp_hqd_pq_base_hi);
+       WREG32(mmCP_HQD_PQ_CONTROL, mqd->cp_hqd_pq_control);
+       WREG32(mmCP_HQD_PQ_WPTR_POLL_ADDR, mqd->cp_hqd_pq_wptr_poll_addr_lo);
+       WREG32(mmCP_HQD_PQ_WPTR_POLL_ADDR_HI, mqd->cp_hqd_pq_wptr_poll_addr_hi);
+       WREG32(mmCP_HQD_PQ_RPTR_REPORT_ADDR, 
mqd->cp_hqd_pq_rptr_report_addr_lo);
+       WREG32(mmCP_HQD_PQ_RPTR_REPORT_ADDR_HI, 
mqd->cp_hqd_pq_rptr_report_addr_hi);
+       WREG32(mmCP_HQD_PQ_DOORBELL_CONTROL, mqd->cp_hqd_pq_doorbell_control);
+       WREG32(mmCP_HQD_PQ_WPTR, mqd->cp_hqd_pq_wptr);
+       WREG32(mmCP_HQD_VMID, mqd->cp_hqd_vmid);
 
        /* activate the HQD */
-       WREG32(mmCP_HQD_ACTIVE, mqd->queue_state.cp_hqd_active);
+       WREG32(mmCP_HQD_ACTIVE, mqd->cp_hqd_active);
 
        return 0;
 }
 
 static int gfx_v7_0_compute_queue_init(struct amdgpu_device *adev, int ring_id)
 {
        int r;
        u64 mqd_gpu_addr;
-       struct bonaire_mqd *mqd;
+       struct cik_mqd *mqd;
        struct amdgpu_ring *ring = &adev->gfx.compute_ring[ring_id];
 
        if (ring->mqd_obj == NULL) {
                r = amdgpu_bo_create(adev,
-                               sizeof(struct bonaire_mqd),
+                               sizeof(struct cik_mqd),
                                PAGE_SIZE, true,
                                AMDGPU_GEM_DOMAIN_GTT, 0, NULL, NULL,
                                &ring->mqd_obj);
                if (r) {
                        dev_warn(adev->dev, "(%d) create MQD bo failed\n", r);
                        return r;
                }
        }
 
        r = amdgpu_bo_reserve(ring->mqd_obj, false);
        if (unlikely(r != 0))
                goto out;
 
        r = amdgpu_bo_pin(ring->mqd_obj, AMDGPU_GEM_DOMAIN_GTT,
                        &mqd_gpu_addr);
        if (r) {
                dev_warn(adev->dev, "(%d) pin MQD bo failed\n", r);
                goto out_unreserve;
        }
        r = amdgpu_bo_kmap(ring->mqd_obj, (void **)&mqd);
-- 
2.9.3

_______________________________________________
amd-gfx mailing list
amd-gfx@lists.freedesktop.org
https://lists.freedesktop.org/mailman/listinfo/amd-gfx

Reply via email to