On a hang copy out the contents of the buffer objects attached to the
guilty submission and print them in the crash dump report.

Signed-off-by: Jordan Crouse <jcro...@codeaurora.org>
---
 Documentation/gpu/drm-msm-crash-dump.txt |  7 +++++
 drivers/gpu/drm/msm/adreno/adreno_gpu.c  | 54 ++++++++++++++++++++++++++------
 drivers/gpu/drm/msm/msm_gpu.c            | 48 ++++++++++++++++++++++++++--
 drivers/gpu/drm/msm/msm_gpu.h            |  9 ++++++
 4 files changed, 105 insertions(+), 13 deletions(-)

diff --git a/Documentation/gpu/drm-msm-crash-dump.txt 
b/Documentation/gpu/drm-msm-crash-dump.txt
index f84a47a9ca92..930e4c970a62 100644
--- a/Documentation/gpu/drm-msm-crash-dump.txt
+++ b/Documentation/gpu/drm-msm-crash-dump.txt
@@ -28,6 +28,13 @@ ringbuffer:  # Ringbuffer data. There will be a sequence for 
each ringbuffer
    data:               # [ascii85] The contents of the ring encoded as ascii85.
                        # Only the unused portions of the ring will be printed
                        # (up to a maximum of 'size' bytes)
+bos:           # List of buffers from the hanging submission (if known)
+  -iova:               # [hex] GPU address of the buffer
+   size:               # [decimal] Size of the buffer (in bytes)
+   data:               # [ascii85] The contents of the buffer encoded as
+                       # ascii85. Only the contents of buffers marked as
+                       # readable are dumped. Trailing zeros at the end of the
+                       # buffer won't be dumped.
 registers:     # Sets of register values. This section can be used multiple
                # times for different ranges of registers. Each register will be
                # on its own line.
diff --git a/drivers/gpu/drm/msm/adreno/adreno_gpu.c 
b/drivers/gpu/drm/msm/adreno/adreno_gpu.c
index b92bcbde688e..5daca5ba7e06 100644
--- a/drivers/gpu/drm/msm/adreno/adreno_gpu.c
+++ b/drivers/gpu/drm/msm/adreno/adreno_gpu.c
@@ -438,6 +438,10 @@ void adreno_gpu_state_destroy(struct msm_gpu_state *state)
        for (i = 0; i < ARRAY_SIZE(state->ring); i++)
                kfree(state->ring[i].data);
 
+       for (i = 0; state->bos && i < state->nr_bos; i++)
+               kfree(state->bos[i].data);
+
+       kfree(state->bos);
        kfree(state->comm);
        kfree(state->cmd);
        kfree(state->registers);
@@ -461,6 +465,35 @@ int adreno_gpu_state_put(struct msm_gpu_state *state)
 }
 
 #if defined(CONFIG_DEBUG_FS) || defined(CONFIG_DEV_COREDUMP)
+
+static void adreno_show_object(struct drm_printer *p, u32 *ptr, int len)
+{
+       char out[ASCII85_BUFSZ];
+       long l, datalen, i;
+
+       if (!ptr || !len)
+               return;
+
+       /*
+        * Only dump the non-zero part of the buffer - rarely will any data
+        * completely fill the entire allocated size of the buffer
+        */
+       for (datalen = 0, i = 0; i < len >> 2; i++) {
+               if (ptr[i])
+                       datalen = i << 2;
+       }
+
+       l = ascii85_encode_len(datalen);
+
+       drm_printf(p, "    data: !!ascii85 |\n");
+       drm_printf(p, "     ");
+
+       for (i = 0; i < l; i++)
+               drm_printf(p, ascii85_encode(ptr[i], out));
+
+       drm_printf(p, "\n");
+}
+
 void adreno_show(struct msm_gpu *gpu, struct msm_gpu_state *state,
                struct drm_printer *p)
 {
@@ -487,19 +520,20 @@ void adreno_show(struct msm_gpu *gpu, struct 
msm_gpu_state *state,
                drm_printf(p, "    wptr: %d\n", state->ring[i].wptr);
                drm_printf(p, "    size: %d\n", MSM_GPU_RINGBUFFER_SZ);
 
-               if (state->ring[i].data && state->ring[i].data_size) {
-                       u32 *ptr = (u32 *) state->ring[i].data;
-                       char out[ASCII85_BUFSZ];
-                       long len = ascii85_encode_len(state->ring[i].data_size);
-                       int j;
+               adreno_show_object(p, state->ring[i].data,
+                       state->ring[i].data_size);
+       }
 
-                       drm_printf(p, "    data: !!ascii85 |\n");
-                       drm_printf(p, "     ");
+       if (state->bos) {
+               drm_printf(p, "bos:\n");
 
-                       for (j = 0; j < len; j++)
-                               drm_printf(p, ascii85_encode(ptr[j], out));
+               for (i = 0; i < state->nr_bos; i++) {
+                       drm_printf(p, "  - iova: 0x%016llx\n",
+                               state->bos[i].iova);
+                       drm_printf(p, "    size: %ld\n", state->bos[i].size);
 
-                       drm_printf(p, "\n");
+                       adreno_show_object(p, state->bos[i].data,
+                               state->bos[i].size);
                }
        }
 
diff --git a/drivers/gpu/drm/msm/msm_gpu.c b/drivers/gpu/drm/msm/msm_gpu.c
index f36b415e123b..92395c5ef442 100644
--- a/drivers/gpu/drm/msm/msm_gpu.c
+++ b/drivers/gpu/drm/msm/msm_gpu.c
@@ -318,8 +318,39 @@ static void msm_gpu_devcoredump_free(void *data)
        msm_gpu_crashstate_put(gpu);
 }
 
-static void msm_gpu_crashstate_capture(struct msm_gpu *gpu, char *comm,
-               char *cmd)
+static void msm_gpu_crashstate_get_bo(struct msm_gpu_state *state,
+               struct msm_gem_object *obj, u64 iova, u32 flags)
+{
+       struct msm_gpu_state_bo *state_bo = &state->bos[state->nr_bos];
+
+       /* Don't record write only objects */
+
+       state_bo->size = obj->base.size;
+       state_bo->iova = iova;
+
+       /* Only store the data for buffer objects marked for read */
+       if ((flags & MSM_SUBMIT_BO_READ)) {
+               void *ptr;
+
+               state_bo->data = kmalloc(obj->base.size, GFP_KERNEL);
+               if (!state_bo->data)
+                       return;
+
+               ptr = msm_gem_get_vaddr_active(&obj->base);
+               if (IS_ERR(ptr)) {
+                       kfree(state_bo->data);
+                       return;
+               }
+
+               memcpy(state_bo->data, ptr, obj->base.size);
+               msm_gem_put_vaddr(&obj->base);
+       }
+
+       state->nr_bos++;
+}
+
+static void msm_gpu_crashstate_capture(struct msm_gpu *gpu,
+               struct msm_gem_submit *submit, char *comm, char *cmd)
 {
        struct msm_gpu_state *state;
 
@@ -335,6 +366,17 @@ static void msm_gpu_crashstate_capture(struct msm_gpu 
*gpu, char *comm,
        state->comm = kstrdup(comm, GFP_KERNEL);
        state->cmd = kstrdup(cmd, GFP_KERNEL);
 
+       if (submit) {
+               int i;
+
+               state->bos = kcalloc(submit->nr_bos,
+                       sizeof(struct msm_gpu_state_bo), GFP_KERNEL);
+
+               for (i = 0; state->bos && i < submit->nr_bos; i++)
+                       msm_gpu_crashstate_get_bo(state, submit->bos[i].obj,
+                               submit->bos[i].iova, submit->bos[i].flags);
+       }
+
        kref_init(&state->ref);
 
        /* Set the active crash state to be dumped on failure */
@@ -435,7 +477,7 @@ static void recover_worker(struct work_struct *work)
        }
 
        /* Record the crash state */
-       msm_gpu_crashstate_capture(gpu, comm, cmd);
+       msm_gpu_crashstate_capture(gpu, submit, comm, cmd);
 
        kfree(cmd);
        kfree(comm);
diff --git a/drivers/gpu/drm/msm/msm_gpu.h b/drivers/gpu/drm/msm/msm_gpu.h
index 48f7b21f1cae..8242c6e0f107 100644
--- a/drivers/gpu/drm/msm/msm_gpu.h
+++ b/drivers/gpu/drm/msm/msm_gpu.h
@@ -181,6 +181,12 @@ struct msm_gpu_submitqueue {
        struct kref ref;
 };
 
+struct msm_gpu_state_bo {
+       u64 iova;
+       size_t size;
+       void *data;
+};
+
 struct msm_gpu_state {
        struct kref ref;
        struct timeval time;
@@ -201,6 +207,9 @@ struct msm_gpu_state {
 
        char *comm;
        char *cmd;
+
+       int nr_bos;
+       struct msm_gpu_state_bo *bos;
 };
 
 static inline void gpu_write(struct msm_gpu *gpu, u32 reg, u32 data)
-- 
2.16.1

_______________________________________________
dri-devel mailing list
dri-devel@lists.freedesktop.org
https://lists.freedesktop.org/mailman/listinfo/dri-devel

Reply via email to