[Mesa-dev] [PATCH 1/4] gallium/radeon: remove old CS tracing
Marek Olšák
maraeo at gmail.com
Thu Mar 17 15:15:18 UTC 2016
Ping
On Fri, Mar 11, 2016 at 4:01 PM, Marek Olšák <maraeo at gmail.com> wrote:
> From: Marek Olšák <marek.olsak at amd.com>
>
> Cons:
> - it was only integrated in r600g
> - it doesn't work with GPUVM
> - it records buffer contents at the end of IBs instead of at the beginning,
> so the replay isn't exact
> - it lacks an IB parser and isn't user-friendly
>
> A better solution is apitrace in combination with gallium/ddebug, which
> has a complete IB parser and can pinpoint hanging CP packets.
> ---
> src/gallium/drivers/r300/r300_context.c | 2 +-
> src/gallium/drivers/r300/r300_flush.c | 6 +-
> src/gallium/drivers/r600/r600_hw_context.c | 11 +-
> src/gallium/drivers/r600/r600_pipe.c | 4 +-
> src/gallium/drivers/r600/r600_pipe.h | 6 -
> src/gallium/drivers/r600/r600_state_common.c | 23 ---
> src/gallium/drivers/radeon/r600_pipe_common.c | 21 +--
> src/gallium/drivers/radeon/r600_pipe_common.h | 6 +-
> src/gallium/drivers/radeon/radeon_uvd.c | 4 +-
> src/gallium/drivers/radeon/radeon_vce.c | 4 +-
> src/gallium/drivers/radeon/radeon_winsys.h | 8 +-
> src/gallium/drivers/radeonsi/si_hw_context.c | 3 +-
> src/gallium/drivers/radeonsi/si_pipe.c | 5 +-
> src/gallium/winsys/amdgpu/drm/amdgpu_cs.c | 6 +-
> src/gallium/winsys/radeon/drm/Makefile.am | 2 -
> src/gallium/winsys/radeon/drm/Makefile.sources | 4 -
> src/gallium/winsys/radeon/drm/radeon_ctx.h | 205 ---------------------
> src/gallium/winsys/radeon/drm/radeon_drm_cs.c | 13 +-
> src/gallium/winsys/radeon/drm/radeon_drm_cs.h | 5 -
> src/gallium/winsys/radeon/drm/radeon_drm_cs_dump.c | 161 ----------------
> 20 files changed, 23 insertions(+), 476 deletions(-)
> delete mode 100644 src/gallium/winsys/radeon/drm/radeon_ctx.h
> delete mode 100644 src/gallium/winsys/radeon/drm/radeon_drm_cs_dump.c
>
> diff --git a/src/gallium/drivers/r300/r300_context.c b/src/gallium/drivers/r300/r300_context.c
> index 6fa8920..d100a9d 100644
> --- a/src/gallium/drivers/r300/r300_context.c
> +++ b/src/gallium/drivers/r300/r300_context.c
> @@ -385,7 +385,7 @@ struct pipe_context* r300_create_context(struct pipe_screen* screen,
> if (!r300->ctx)
> goto fail;
>
> - r300->cs = rws->cs_create(r300->ctx, RING_GFX, r300_flush_callback, r300, NULL);
> + r300->cs = rws->cs_create(r300->ctx, RING_GFX, r300_flush_callback, r300);
> if (r300->cs == NULL)
> goto fail;
>
> diff --git a/src/gallium/drivers/r300/r300_flush.c b/src/gallium/drivers/r300/r300_flush.c
> index 7a75b43..63182cb 100644
> --- a/src/gallium/drivers/r300/r300_flush.c
> +++ b/src/gallium/drivers/r300/r300_flush.c
> @@ -53,7 +53,7 @@ static void r300_flush_and_cleanup(struct r300_context *r300, unsigned flags,
> }
>
> r300->flush_counter++;
> - r300->rws->cs_flush(r300->cs, flags, fence, 0);
> + r300->rws->cs_flush(r300->cs, flags, fence);
> r300->dirty_hw = 0;
>
> /* New kitchen sink, baby. */
> @@ -88,11 +88,11 @@ void r300_flush(struct pipe_context *pipe,
> * and we cannot emit an empty CS. Let's write to some reg. */
> CS_LOCALS(r300);
> OUT_CS_REG(RB3D_COLOR_CHANNEL_MASK, 0);
> - r300->rws->cs_flush(r300->cs, flags, fence, 0);
> + r300->rws->cs_flush(r300->cs, flags, fence);
> } else {
> /* Even if hw is not dirty, we should at least reset the CS in case
> * the space checking failed for the first draw operation. */
> - r300->rws->cs_flush(r300->cs, flags, NULL, 0);
> + r300->rws->cs_flush(r300->cs, flags, NULL);
> }
> }
>
> diff --git a/src/gallium/drivers/r600/r600_hw_context.c b/src/gallium/drivers/r600/r600_hw_context.c
> index 4951297..7a6f957 100644
> --- a/src/gallium/drivers/r600/r600_hw_context.c
> +++ b/src/gallium/drivers/r600/r600_hw_context.c
> @@ -57,18 +57,11 @@ void r600_need_cs_space(struct r600_context *ctx, unsigned num_dw,
>
> /* The number of dwords all the dirty states would take. */
> mask = ctx->dirty_atoms;
> - while (mask != 0) {
> + while (mask != 0)
> num_dw += ctx->atoms[u_bit_scan64(&mask)]->num_dw;
> - if (ctx->screen->b.trace_bo) {
> - num_dw += R600_TRACE_CS_DWORDS;
> - }
> - }
>
> /* The upper-bound of how much space a draw command would take. */
> num_dw += R600_MAX_FLUSH_CS_DWORDS + R600_MAX_DRAW_CS_DWORDS;
> - if (ctx->screen->b.trace_bo) {
> - num_dw += R600_TRACE_CS_DWORDS;
> - }
> }
>
> /* Count in queries_suspend. */
> @@ -273,7 +266,7 @@ void r600_context_gfx_flush(void *context, unsigned flags,
> flags |= RADEON_FLUSH_KEEP_TILING_FLAGS;
>
> /* Flush the CS. */
> - ctx->b.ws->cs_flush(cs, flags, fence, ctx->screen->b.cs_count++);
> + ctx->b.ws->cs_flush(cs, flags, fence);
>
> r600_begin_new_cs(ctx);
> }
> diff --git a/src/gallium/drivers/r600/r600_pipe.c b/src/gallium/drivers/r600/r600_pipe.c
> index 7018088..88c500a 100644
> --- a/src/gallium/drivers/r600/r600_pipe.c
> +++ b/src/gallium/drivers/r600/r600_pipe.c
> @@ -187,9 +187,7 @@ static struct pipe_context *r600_create_context(struct pipe_screen *screen,
> }
>
> rctx->b.gfx.cs = ws->cs_create(rctx->b.ctx, RING_GFX,
> - r600_context_gfx_flush, rctx,
> - rscreen->b.trace_bo ?
> - rscreen->b.trace_bo->buf : NULL);
> + r600_context_gfx_flush, rctx);
> rctx->b.gfx.flush = r600_context_gfx_flush;
>
> rctx->allocator_fetch_shader = u_suballocator_create(&rctx->b.b, 64 * 1024, 256,
> diff --git a/src/gallium/drivers/r600/r600_pipe.h b/src/gallium/drivers/r600/r600_pipe.h
> index f8a2039..72aa642 100644
> --- a/src/gallium/drivers/r600/r600_pipe.h
> +++ b/src/gallium/drivers/r600/r600_pipe.h
> @@ -60,7 +60,6 @@
> /* the number of CS dwords for flushing and drawing */
> #define R600_MAX_FLUSH_CS_DWORDS 16
> #define R600_MAX_DRAW_CS_DWORDS 58
> -#define R600_TRACE_CS_DWORDS 7
>
> #define R600_MAX_USER_CONST_BUFFERS 13
> #define R600_MAX_DRIVER_CONST_BUFFERS 3
> @@ -571,15 +570,10 @@ static inline void r600_mark_atom_dirty(struct r600_context *rctx,
> r600_set_atom_dirty(rctx, atom, true);
> }
>
> -void r600_trace_emit(struct r600_context *rctx);
> -
> static inline void r600_emit_atom(struct r600_context *rctx, struct r600_atom *atom)
> {
> atom->emit(&rctx->b, atom);
> r600_set_atom_dirty(rctx, atom, false);
> - if (rctx->screen->b.trace_bo) {
> - r600_trace_emit(rctx);
> - }
> }
>
> static inline void r600_set_cso_state(struct r600_context *rctx,
> diff --git a/src/gallium/drivers/r600/r600_state_common.c b/src/gallium/drivers/r600/r600_state_common.c
> index e3314bb..a95b178 100644
> --- a/src/gallium/drivers/r600/r600_state_common.c
> +++ b/src/gallium/drivers/r600/r600_state_common.c
> @@ -1999,10 +1999,6 @@ static void r600_draw_vbo(struct pipe_context *ctx, const struct pipe_draw_info
> cs->buf[cs->cdw++] = EVENT_TYPE(EVENT_TYPE_SQ_NON_EVENT);
> }
>
> - if (rctx->screen->b.trace_bo) {
> - r600_trace_emit(rctx);
> - }
> -
> /* Set the depth buffer as dirty. */
> if (rctx->framebuffer.state.zsbuf) {
> struct pipe_surface *surf = rctx->framebuffer.state.zsbuf;
> @@ -2897,22 +2893,3 @@ void r600_init_common_state_functions(struct r600_context *rctx)
> rctx->b.set_occlusion_query_state = r600_set_occlusion_query_state;
> rctx->b.need_gfx_cs_space = r600_need_gfx_cs_space;
> }
> -
> -void r600_trace_emit(struct r600_context *rctx)
> -{
> - struct r600_screen *rscreen = rctx->screen;
> - struct radeon_winsys_cs *cs = rctx->b.gfx.cs;
> - uint64_t va;
> - uint32_t reloc;
> -
> - va = rscreen->b.trace_bo->gpu_address;
> - reloc = radeon_add_to_buffer_list(&rctx->b, &rctx->b.gfx, rscreen->b.trace_bo,
> - RADEON_USAGE_READWRITE, RADEON_PRIO_TRACE);
> - radeon_emit(cs, PKT3(PKT3_MEM_WRITE, 3, 0));
> - radeon_emit(cs, va & 0xFFFFFFFFUL);
> - radeon_emit(cs, (va >> 32UL) & 0xFFUL);
> - radeon_emit(cs, cs->cdw);
> - radeon_emit(cs, rscreen->b.cs_count);
> - radeon_emit(cs, PKT3(PKT3_NOP, 0, 0));
> - radeon_emit(cs, reloc);
> -}
> diff --git a/src/gallium/drivers/radeon/r600_pipe_common.c b/src/gallium/drivers/radeon/r600_pipe_common.c
> index ea02827..eed9d83 100644
> --- a/src/gallium/drivers/radeon/r600_pipe_common.c
> +++ b/src/gallium/drivers/radeon/r600_pipe_common.c
> @@ -229,7 +229,7 @@ static void r600_flush_dma_ring(void *ctx, unsigned flags,
> struct radeon_winsys_cs *cs = rctx->dma.cs;
>
> if (cs->cdw)
> - rctx->ws->cs_flush(cs, flags, &rctx->last_sdma_fence, 0);
> + rctx->ws->cs_flush(cs, flags, &rctx->last_sdma_fence);
> if (fence)
> rctx->ws->fence_reference(fence, rctx->last_sdma_fence);
> }
> @@ -318,7 +318,7 @@ bool r600_common_context_init(struct r600_common_context *rctx,
> if (rscreen->info.has_sdma && !(rscreen->debug_flags & DBG_NO_ASYNC_DMA)) {
> rctx->dma.cs = rctx->ws->cs_create(rctx->ctx, RING_DMA,
> r600_flush_dma_ring,
> - rctx, NULL);
> + rctx);
> rctx->dma.flush = r600_flush_dma_ring;
> }
>
> @@ -379,7 +379,6 @@ static const struct debug_named_value common_debug_options[] = {
> { "tex", DBG_TEX, "Print texture info" },
> { "compute", DBG_COMPUTE, "Print compute info" },
> { "vm", DBG_VM, "Print virtual addresses when creating resources" },
> - { "trace_cs", DBG_TRACE_CS, "Trace cs and write rlockup_<csid>.c file with faulty cs" },
> { "info", DBG_INFO, "Print driver information" },
>
> /* shaders */
> @@ -893,19 +892,6 @@ bool r600_common_screen_init(struct r600_common_screen *rscreen,
> pipe_mutex_init(rscreen->aux_context_lock);
> pipe_mutex_init(rscreen->gpu_load_mutex);
>
> - if (((rscreen->info.drm_major == 2 && rscreen->info.drm_minor >= 28) ||
> - rscreen->info.drm_major == 3) &&
> - (rscreen->debug_flags & DBG_TRACE_CS)) {
> - rscreen->trace_bo = (struct r600_resource*)pipe_buffer_create(&rscreen->b,
> - PIPE_BIND_CUSTOM,
> - PIPE_USAGE_STAGING,
> - 4096);
> - if (rscreen->trace_bo) {
> - rscreen->trace_ptr = rscreen->ws->buffer_map(rscreen->trace_bo->buf, NULL,
> - PIPE_TRANSFER_UNSYNCHRONIZED);
> - }
> - }
> -
> if (rscreen->debug_flags & DBG_INFO) {
> printf("pci_id = 0x%x\n", rscreen->info.pci_id);
> printf("family = %i (%s)\n", rscreen->info.family,
> @@ -951,9 +937,6 @@ void r600_destroy_common_screen(struct r600_common_screen *rscreen)
> pipe_mutex_destroy(rscreen->aux_context_lock);
> rscreen->aux_context->destroy(rscreen->aux_context);
>
> - if (rscreen->trace_bo)
> - pipe_resource_reference((struct pipe_resource**)&rscreen->trace_bo, NULL);
> -
> rscreen->ws->destroy(rscreen->ws);
> FREE(rscreen);
> }
> diff --git a/src/gallium/drivers/radeon/r600_pipe_common.h b/src/gallium/drivers/radeon/r600_pipe_common.h
> index d20069e..e1789be 100644
> --- a/src/gallium/drivers/radeon/r600_pipe_common.h
> +++ b/src/gallium/drivers/radeon/r600_pipe_common.h
> @@ -61,7 +61,7 @@
> /* gap - reuse */
> #define DBG_COMPUTE (1 << 2)
> #define DBG_VM (1 << 3)
> -#define DBG_TRACE_CS (1 << 4)
> +/* gap - reuse */
> /* shader logging */
> #define DBG_FS (1 << 5)
> #define DBG_VS (1 << 6)
> @@ -303,10 +303,6 @@ struct r600_common_screen {
> struct pipe_context *aux_context;
> pipe_mutex aux_context_lock;
>
> - struct r600_resource *trace_bo;
> - uint32_t *trace_ptr;
> - unsigned cs_count;
> -
> /* This must be in the screen, because UE4 uses one context for
> * compilation and another one for rendering.
> */
> diff --git a/src/gallium/drivers/radeon/radeon_uvd.c b/src/gallium/drivers/radeon/radeon_uvd.c
> index 367aabc..6545f28 100644
> --- a/src/gallium/drivers/radeon/radeon_uvd.c
> +++ b/src/gallium/drivers/radeon/radeon_uvd.c
> @@ -92,7 +92,7 @@ struct ruvd_decoder {
> /* flush IB to the hardware */
> static void flush(struct ruvd_decoder *dec)
> {
> - dec->ws->cs_flush(dec->cs, RADEON_FLUSH_ASYNC, NULL, 0);
> + dec->ws->cs_flush(dec->cs, RADEON_FLUSH_ASYNC, NULL);
> }
>
> /* add a new set register command to the IB */
> @@ -1086,7 +1086,7 @@ struct pipe_video_codec *ruvd_create_decoder(struct pipe_context *context,
> dec->stream_handle = rvid_alloc_stream_handle();
> dec->screen = context->screen;
> dec->ws = ws;
> - dec->cs = ws->cs_create(rctx->ctx, RING_UVD, NULL, NULL, NULL);
> + dec->cs = ws->cs_create(rctx->ctx, RING_UVD, NULL, NULL);
> if (!dec->cs) {
> RVID_ERR("Can't get command submission context.\n");
> goto error;
> diff --git a/src/gallium/drivers/radeon/radeon_vce.c b/src/gallium/drivers/radeon/radeon_vce.c
> index 087d942..2ab74e9 100644
> --- a/src/gallium/drivers/radeon/radeon_vce.c
> +++ b/src/gallium/drivers/radeon/radeon_vce.c
> @@ -56,7 +56,7 @@
> */
> static void flush(struct rvce_encoder *enc)
> {
> - enc->ws->cs_flush(enc->cs, RADEON_FLUSH_ASYNC, NULL, 0);
> + enc->ws->cs_flush(enc->cs, RADEON_FLUSH_ASYNC, NULL);
> enc->task_info_idx = 0;
> enc->bs_idx = 0;
> }
> @@ -429,7 +429,7 @@ struct pipe_video_codec *rvce_create_encoder(struct pipe_context *context,
>
> enc->screen = context->screen;
> enc->ws = ws;
> - enc->cs = ws->cs_create(rctx->ctx, RING_VCE, rvce_cs_flush, enc, NULL);
> + enc->cs = ws->cs_create(rctx->ctx, RING_VCE, rvce_cs_flush, enc);
> if (!enc->cs) {
> RVID_ERR("Can't get command submission context.\n");
> goto error;
> diff --git a/src/gallium/drivers/radeon/radeon_winsys.h b/src/gallium/drivers/radeon/radeon_winsys.h
> index b8a0659..fc6895a 100644
> --- a/src/gallium/drivers/radeon/radeon_winsys.h
> +++ b/src/gallium/drivers/radeon/radeon_winsys.h
> @@ -592,14 +592,12 @@ struct radeon_winsys {
> * \param ring_type The ring type (GFX, DMA, UVD)
> * \param flush Flush callback function associated with the command stream.
> * \param user User pointer that will be passed to the flush callback.
> - * \param trace_buf Trace buffer when tracing is enabled
> */
> struct radeon_winsys_cs *(*cs_create)(struct radeon_winsys_ctx *ctx,
> enum ring_type ring_type,
> void (*flush)(void *ctx, unsigned flags,
> struct pipe_fence_handle **fence),
> - void *flush_ctx,
> - struct pb_buffer *trace_buf);
> + void *flush_ctx);
>
> /**
> * Destroy a command stream.
> @@ -672,12 +670,10 @@ struct radeon_winsys {
> * \param flags, RADEON_FLUSH_ASYNC or 0.
> * \param fence Pointer to a fence. If non-NULL, a fence is inserted
> * after the CS and is returned through this parameter.
> - * \param cs_trace_id A unique identifier of the cs, used for tracing.
> */
> void (*cs_flush)(struct radeon_winsys_cs *cs,
> unsigned flags,
> - struct pipe_fence_handle **fence,
> - uint32_t cs_trace_id);
> + struct pipe_fence_handle **fence);
>
> /**
> * Return TRUE if a buffer is referenced by a command stream.
> diff --git a/src/gallium/drivers/radeonsi/si_hw_context.c b/src/gallium/drivers/radeonsi/si_hw_context.c
> index b5a4034..8c900a4 100644
> --- a/src/gallium/drivers/radeonsi/si_hw_context.c
> +++ b/src/gallium/drivers/radeonsi/si_hw_context.c
> @@ -118,8 +118,7 @@ void si_context_gfx_flush(void *context, unsigned flags,
> }
>
> /* Flush the CS. */
> - ws->cs_flush(cs, flags, &ctx->last_gfx_fence,
> - ctx->screen->b.cs_count++);
> + ws->cs_flush(cs, flags, &ctx->last_gfx_fence);
>
> if (fence)
> ws->fence_reference(fence, ctx->last_gfx_fence);
> diff --git a/src/gallium/drivers/radeonsi/si_pipe.c b/src/gallium/drivers/radeonsi/si_pipe.c
> index 8b50a49..042cfc7 100644
> --- a/src/gallium/drivers/radeonsi/si_pipe.c
> +++ b/src/gallium/drivers/radeonsi/si_pipe.c
> @@ -140,9 +140,8 @@ static struct pipe_context *si_create_context(struct pipe_screen *screen,
> sctx->b.b.create_video_buffer = vl_video_buffer_create;
> }
>
> - sctx->b.gfx.cs = ws->cs_create(sctx->b.ctx, RING_GFX, si_context_gfx_flush,
> - sctx, sscreen->b.trace_bo ?
> - sscreen->b.trace_bo->buf : NULL);
> + sctx->b.gfx.cs = ws->cs_create(sctx->b.ctx, RING_GFX,
> + si_context_gfx_flush, sctx);
> sctx->b.gfx.flush = si_context_gfx_flush;
>
> /* Border colors. */
> diff --git a/src/gallium/winsys/amdgpu/drm/amdgpu_cs.c b/src/gallium/winsys/amdgpu/drm/amdgpu_cs.c
> index 83da740..a9fc55f 100644
> --- a/src/gallium/winsys/amdgpu/drm/amdgpu_cs.c
> +++ b/src/gallium/winsys/amdgpu/drm/amdgpu_cs.c
> @@ -335,8 +335,7 @@ amdgpu_cs_create(struct radeon_winsys_ctx *rwctx,
> enum ring_type ring_type,
> void (*flush)(void *ctx, unsigned flags,
> struct pipe_fence_handle **fence),
> - void *flush_ctx,
> - struct pb_buffer *trace_buf)
> + void *flush_ctx)
> {
> struct amdgpu_ctx *ctx = (struct amdgpu_ctx*)rwctx;
> struct amdgpu_cs *cs;
> @@ -609,8 +608,7 @@ DEBUG_GET_ONCE_BOOL_OPTION(all_bos, "RADEON_ALL_BOS", FALSE)
>
> static void amdgpu_cs_flush(struct radeon_winsys_cs *rcs,
> unsigned flags,
> - struct pipe_fence_handle **fence,
> - uint32_t cs_trace_id)
> + struct pipe_fence_handle **fence)
> {
> struct amdgpu_cs *cs = amdgpu_cs(rcs);
> struct amdgpu_winsys *ws = cs->ctx->ws;
> diff --git a/src/gallium/winsys/radeon/drm/Makefile.am b/src/gallium/winsys/radeon/drm/Makefile.am
> index 0320aca..b413b0b 100644
> --- a/src/gallium/winsys/radeon/drm/Makefile.am
> +++ b/src/gallium/winsys/radeon/drm/Makefile.am
> @@ -8,5 +8,3 @@ AM_CFLAGS = \
> noinst_LTLIBRARIES = libradeonwinsys.la
>
> libradeonwinsys_la_SOURCES = $(C_SOURCES)
> -
> -EXTRA_DIST = $(TOOLS_HDR)
> diff --git a/src/gallium/winsys/radeon/drm/Makefile.sources b/src/gallium/winsys/radeon/drm/Makefile.sources
> index a00c84d..2762c91 100644
> --- a/src/gallium/winsys/radeon/drm/Makefile.sources
> +++ b/src/gallium/winsys/radeon/drm/Makefile.sources
> @@ -2,12 +2,8 @@ C_SOURCES := \
> radeon_drm_bo.c \
> radeon_drm_bo.h \
> radeon_drm_cs.c \
> - radeon_drm_cs_dump.c \
> radeon_drm_cs.h \
> radeon_drm_public.h \
> radeon_drm_surface.c \
> radeon_drm_winsys.c \
> radeon_drm_winsys.h
> -
> -TOOLS_HDR := \
> - radeon_ctx.h
> diff --git a/src/gallium/winsys/radeon/drm/radeon_ctx.h b/src/gallium/winsys/radeon/drm/radeon_ctx.h
> deleted file mode 100644
> index 5618b3a..0000000
> --- a/src/gallium/winsys/radeon/drm/radeon_ctx.h
> +++ /dev/null
> @@ -1,205 +0,0 @@
> -/*
> - * Copyright 2011 Jerome Glisse <glisse at freedesktop.org>
> - *
> - * Permission is hereby granted, free of charge, to any person obtaining a
> - * copy of this software and associated documentation files (the "Software"),
> - * to deal in the Software without restriction, including without limitation
> - * on the rights to use, copy, modify, merge, publish, distribute, sub
> - * license, and/or sell copies of the Software, and to permit persons to whom
> - * the Software is furnished to do so, subject to the following conditions:
> - *
> - * The above copyright notice and this permission notice (including the next
> - * paragraph) shall be included in all copies or substantial portions of the
> - * Software.
> - *
> - * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
> - * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
> - * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL
> - * THE AUTHOR(S) AND/OR THEIR SUPPLIERS BE LIABLE FOR ANY CLAIM,
> - * DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
> - * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
> - * USE OR OTHER DEALINGS IN THE SOFTWARE.
> - *
> - * Authors:
> - * Jérôme Glisse
> - */
> -#ifndef RADEON_CTX_H
> -#define RADEON_CTX_H
> -
> -#define _FILE_OFFSET_BITS 64
> -#include <sys/mman.h>
> -
> -#include <errno.h>
> -#include <stdio.h>
> -#include <stdlib.h>
> -#include <stdint.h>
> -#include <string.h>
> -#include "xf86drm.h"
> -#include "radeon_drm.h"
> -
> -struct ctx {
> - int fd;
> -};
> -
> -struct bo {
> - uint32_t handle;
> - uint32_t alignment;
> - uint64_t size;
> - uint64_t va;
> - void *ptr;
> -};
> -
> -static void ctx_init(struct ctx *ctx)
> -{
> - ctx->fd = drmOpen("radeon", NULL);
> - if (ctx->fd < 0) {
> - fprintf(stderr, "failed to open radeon drm device file\n");
> - exit(-1);
> - }
> -}
> -
> -static void bo_wait(struct ctx *ctx, struct bo *bo)
> -{
> - struct drm_radeon_gem_wait_idle args;
> - void *ptr;
> - int r;
> -
> - /* Zero out args to make valgrind happy */
> - memset(&args, 0, sizeof(args));
> - args.handle = bo->handle;
> - do {
> - r = drmCommandWrite(ctx->fd, DRM_RADEON_GEM_WAIT_IDLE, &args, sizeof(args));
> - } while (r == -EBUSY);
> -}
> -
> -
> -static void ctx_cs(struct ctx *ctx, uint32_t *cs, uint32_t cs_flags[2], unsigned ndw,
> - struct bo **bo, uint32_t *bo_relocs, unsigned nbo)
> -{
> - struct drm_radeon_cs args;
> - struct drm_radeon_cs_chunk chunks[3];
> - uint64_t chunk_array[3];
> - unsigned i;
> - int r;
> -
> - /* update handle */
> - for (i = 0; i < nbo; i++) {
> - bo_relocs[i*4+0] = bo[i]->handle;
> - }
> -
> - args.num_chunks = 2;
> - if (cs_flags[0] || cs_flags[1]) {
> - /* enable RADEON_CHUNK_ID_FLAGS */
> - args.num_chunks = 3;
> - }
> - args.chunks = (uint64_t)(uintptr_t)chunk_array;
> - chunks[0].chunk_id = RADEON_CHUNK_ID_IB;
> - chunks[0].length_dw = ndw;
> - chunks[0].chunk_data = (uintptr_t)cs;
> - chunks[1].chunk_id = RADEON_CHUNK_ID_RELOCS;
> - chunks[1].length_dw = nbo * 4;
> - chunks[1].chunk_data = (uintptr_t)bo_relocs;
> - chunks[2].chunk_id = RADEON_CHUNK_ID_FLAGS;
> - chunks[2].length_dw = 2;
> - chunks[2].chunk_data = (uintptr_t)cs_flags;
> - chunk_array[0] = (uintptr_t)&chunks[0];
> - chunk_array[1] = (uintptr_t)&chunks[1];
> - chunk_array[2] = (uintptr_t)&chunks[2];
> -
> - fprintf(stderr, "emiting cs %ddw with %d bo\n", ndw, nbo);
> - r = drmCommandWriteRead(ctx->fd, DRM_RADEON_CS, &args, sizeof(args));
> - if (r) {
> - fprintf(stderr, "cs submission failed with %d\n", r);
> - return;
> - }
> -}
> -
> -static void bo_map(struct ctx *ctx, struct bo *bo)
> -{
> - struct drm_radeon_gem_mmap args;
> - void *ptr;
> - int r;
> -
> - /* Zero out args to make valgrind happy */
> - memset(&args, 0, sizeof(args));
> - args.handle = bo->handle;
> - args.offset = 0;
> - args.size = (uint64_t)bo->size;
> - r = drmCommandWriteRead(ctx->fd, DRM_RADEON_GEM_MMAP, &args, sizeof(args));
> - if (r) {
> - fprintf(stderr, "error mapping %p 0x%08X (error = %d)\n", bo, bo->handle, r);
> - exit(-1);
> - }
> - ptr = mmap(0, args.size, PROT_READ|PROT_WRITE, MAP_SHARED, ctx->fd, args.addr_ptr);
> - if (ptr == MAP_FAILED) {
> - fprintf(stderr, "%s failed to map bo\n", __func__);
> - exit(-1);
> - }
> - bo->ptr = ptr;
> -}
> -
> -static void bo_va(struct ctx *ctx, struct bo *bo)
> -{
> - struct drm_radeon_gem_va args;
> - int r;
> -
> - args.handle = bo->handle;
> - args.vm_id = 0;
> - args.operation = RADEON_VA_MAP;
> - args.flags = RADEON_VM_PAGE_READABLE | RADEON_VM_PAGE_WRITEABLE | RADEON_VM_PAGE_SNOOPED;
> - args.offset = bo->va;
> - r = drmCommandWriteRead(ctx->fd, DRM_RADEON_GEM_VA, &args, sizeof(args));
> - if (r && args.operation == RADEON_VA_RESULT_ERROR) {
> - fprintf(stderr, "radeon: Failed to allocate virtual address for buffer:\n");
> - fprintf(stderr, "radeon: size : %d bytes\n", bo->size);
> - fprintf(stderr, "radeon: alignment : %d bytes\n", bo->alignment);
> - fprintf(stderr, "radeon: va : 0x%016llx\n", (unsigned long long)bo->va);
> - exit(-1);
> - }
> -}
> -
> -static struct bo *bo_new(struct ctx *ctx, unsigned ndw, uint32_t *data, uint64_t va, uint32_t alignment)
> -{
> - struct drm_radeon_gem_create args;
> - struct bo *bo;
> - int r;
> -
> - bo = calloc(1, sizeof(*bo));
> - if (bo == NULL) {
> - fprintf(stderr, "failed to malloc bo struct\n");
> - exit(-1);
> - }
> - bo->size = ndw * 4ULL;
> - bo->va = va;
> - bo->alignment = alignment;
> -
> - args.size = bo->size;
> - args.alignment = bo->alignment;
> - args.initial_domain = RADEON_GEM_DOMAIN_GTT;
> - args.flags = 0;
> - args.handle = 0;
> -
> - r = drmCommandWriteRead(ctx->fd, DRM_RADEON_GEM_CREATE, &args, sizeof(args));
> - bo->handle = args.handle;
> - if (r) {
> - fprintf(stderr, "Failed to allocate :\n");
> - fprintf(stderr, " size : %d bytes\n", bo->size);
> - fprintf(stderr, " alignment : %d bytes\n", bo->alignment);
> - free(bo);
> - exit(-1);
> - }
> -
> - if (data) {
> - bo_map(ctx, bo);
> - memcpy(bo->ptr, data, bo->size);
> - }
> -
> - if (va) {
> - bo_va(ctx, bo);
> - }
> -
> - return bo;
> -}
> -
> -
> -#endif
> diff --git a/src/gallium/winsys/radeon/drm/radeon_drm_cs.c b/src/gallium/winsys/radeon/drm/radeon_drm_cs.c
> index 155a130..b50e19c 100644
> --- a/src/gallium/winsys/radeon/drm/radeon_drm_cs.c
> +++ b/src/gallium/winsys/radeon/drm/radeon_drm_cs.c
> @@ -168,8 +168,7 @@ radeon_drm_cs_create(struct radeon_winsys_ctx *ctx,
> enum ring_type ring_type,
> void (*flush)(void *ctx, unsigned flags,
> struct pipe_fence_handle **fence),
> - void *flush_ctx,
> - struct pb_buffer *trace_buf)
> + void *flush_ctx)
> {
> struct radeon_drm_winsys *ws = (struct radeon_drm_winsys*)ctx;
> struct radeon_drm_cs *cs;
> @@ -183,7 +182,6 @@ radeon_drm_cs_create(struct radeon_winsys_ctx *ctx,
> cs->ws = ws;
> cs->flush_cs = flush;
> cs->flush_data = flush_ctx;
> - cs->trace_buf = (struct radeon_bo*)trace_buf;
>
> if (!radeon_init_cs_context(&cs->csc1, cs->ws)) {
> FREE(cs);
> @@ -439,10 +437,6 @@ void radeon_drm_cs_emit_ioctl_oneshot(struct radeon_drm_cs *cs, struct radeon_cs
> }
> }
>
> - if (cs->trace_buf) {
> - radeon_dump_cs_on_lockup(cs, csc);
> - }
> -
> for (i = 0; i < csc->crelocs; i++)
> p_atomic_dec(&csc->relocs_bo[i].bo->num_active_ioctls);
>
> @@ -467,8 +461,7 @@ DEBUG_GET_ONCE_BOOL_OPTION(noop, "RADEON_NOOP", FALSE)
>
> static void radeon_drm_cs_flush(struct radeon_winsys_cs *rcs,
> unsigned flags,
> - struct pipe_fence_handle **fence,
> - uint32_t cs_trace_id)
> + struct pipe_fence_handle **fence)
> {
> struct radeon_drm_cs *cs = radeon_drm_cs(rcs);
> struct radeon_cs_context *tmp;
> @@ -520,8 +513,6 @@ static void radeon_drm_cs_flush(struct radeon_winsys_cs *rcs,
> cs->csc = cs->cst;
> cs->cst = tmp;
>
> - cs->cst->cs_trace_id = cs_trace_id;
> -
> /* If the CS is not empty or overflowed, emit it in a separate thread. */
> if (cs->base.cdw && cs->base.cdw <= cs->base.max_dw && !debug_get_option_noop()) {
> unsigned i, crelocs;
> diff --git a/src/gallium/winsys/radeon/drm/radeon_drm_cs.h b/src/gallium/winsys/radeon/drm/radeon_drm_cs.h
> index 81f66f5..4ffa91a 100644
> --- a/src/gallium/winsys/radeon/drm/radeon_drm_cs.h
> +++ b/src/gallium/winsys/radeon/drm/radeon_drm_cs.h
> @@ -43,8 +43,6 @@ struct radeon_cs_context {
> uint64_t chunk_array[3];
> uint32_t flags[2];
>
> - uint32_t cs_trace_id;
> -
> /* Buffers. */
> unsigned nrelocs;
> unsigned crelocs;
> @@ -80,7 +78,6 @@ struct radeon_drm_cs {
> void *flush_data;
>
> pipe_semaphore flush_completed;
> - struct radeon_bo *trace_buf;
> };
>
> int radeon_lookup_buffer(struct radeon_cs_context *csc, struct radeon_bo *bo);
> @@ -126,6 +123,4 @@ void radeon_drm_cs_sync_flush(struct radeon_winsys_cs *rcs);
> void radeon_drm_cs_init_functions(struct radeon_drm_winsys *ws);
> void radeon_drm_cs_emit_ioctl_oneshot(struct radeon_drm_cs *cs, struct radeon_cs_context *csc);
>
> -void radeon_dump_cs_on_lockup(struct radeon_drm_cs *cs, struct radeon_cs_context *csc);
> -
> #endif
> diff --git a/src/gallium/winsys/radeon/drm/radeon_drm_cs_dump.c b/src/gallium/winsys/radeon/drm/radeon_drm_cs_dump.c
> deleted file mode 100644
> index 9958595..0000000
> --- a/src/gallium/winsys/radeon/drm/radeon_drm_cs_dump.c
> +++ /dev/null
> @@ -1,161 +0,0 @@
> -/*
> - * Copyright © 2013 Jérôme Glisse
> - * All Rights Reserved.
> - *
> - * Permission is hereby granted, free of charge, to any person obtaining
> - * a copy of this software and associated documentation files (the
> - * "Software"), to deal in the Software without restriction, including
> - * without limitation the rights to use, copy, modify, merge, publish,
> - * distribute, sub license, and/or sell copies of the Software, and to
> - * permit persons to whom the Software is furnished to do so, subject to
> - * the following conditions:
> - *
> - * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
> - * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES
> - * OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
> - * NON-INFRINGEMENT. IN NO EVENT SHALL THE COPYRIGHT HOLDERS, AUTHORS
> - * AND/OR ITS SUPPLIERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
> - * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
> - * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
> - * USE OR OTHER DEALINGS IN THE SOFTWARE.
> - *
> - * The above copyright notice and this permission notice (including the
> - * next paragraph) shall be included in all copies or substantial portions
> - * of the Software.
> - */
> -/*
> - * Authors:
> - * Jérôme Glisse <jglisse at redhat.com>
> - */
> -#include <stdio.h>
> -#include <stdlib.h>
> -#include <stdint.h>
> -#include <inttypes.h>
> -#include <xf86drm.h>
> -#include "radeon_drm_cs.h"
> -#include "radeon_drm_bo.h"
> -
> -#define RADEON_CS_DUMP_AFTER_MS_TIMEOUT 500
> -
> -void radeon_dump_cs_on_lockup(struct radeon_drm_cs *cs, struct radeon_cs_context *csc)
> -{
> - struct drm_radeon_gem_busy args;
> - FILE *dump;
> - unsigned i, lockup;
> - uint32_t *ptr;
> - char fname[32];
> -
> - /* only dump the first cs to cause a lockup */
> - if (!csc->crelocs) {
> - /* can not determine if there was a lockup if no bo were use by
> - * the cs and most likely in such case no lockup occurs
> - */
> - return;
> - }
> -
> - memset(&args, 0, sizeof(args));
> - args.handle = csc->relocs_bo[0].bo->handle;
> - for (i = 0; i < RADEON_CS_DUMP_AFTER_MS_TIMEOUT; i++) {
> - usleep(1);
> - lockup = drmCommandWriteRead(csc->fd, DRM_RADEON_GEM_BUSY, &args, sizeof(args));
> - if (!lockup) {
> - break;
> - }
> - }
> - if (!lockup || i < RADEON_CS_DUMP_AFTER_MS_TIMEOUT) {
> - return;
> - }
> -
> - ptr = radeon_bo_do_map(cs->trace_buf);
> - fprintf(stderr, "timeout on cs lockup likely happen at cs 0x%08x dw 0x%08x\n", ptr[1], ptr[0]);
> -
> - if (csc->cs_trace_id != ptr[1]) {
> - return;
> - }
> -
> - /* ok we are most likely facing a lockup write the standalone replay file */
> - snprintf(fname, sizeof(fname), "rlockup_0x%08x.c", csc->cs_trace_id);
> - dump = fopen(fname, "w");
> - if (dump == NULL) {
> - return;
> - }
> - fprintf(dump, "/* To build this file you will need to copy radeon_ctx.h\n");
> - fprintf(dump, " * in same directory. You can find radeon_ctx.h in mesa tree :\n");
> - fprintf(dump, " * mesa/src/gallium/winsys/radeon/drm/radeon_ctx.h\n");
> - fprintf(dump, " * Build with :\n");
> - fprintf(dump, " * gcc -O0 -g `pkg-config --cflags --libs libdrm` %s -o rlockup_0x%08x \n", fname, csc->cs_trace_id);
> - fprintf(dump, " */\n");
> - fprintf(dump, " /* timeout on cs lockup likely happen at cs 0x%08x dw 0x%08x*/\n", ptr[1], ptr[0]);
> - fprintf(dump, "#include <stdio.h>\n");
> - fprintf(dump, "#include <stdint.h>\n");
> - fprintf(dump, "#include \"radeon_ctx.h\"\n");
> - fprintf(dump, "\n");
> - fprintf(dump, "#define ARRAY_SIZE(x) (sizeof(x)/sizeof(x[0]))\n");
> - fprintf(dump, "\n");
> -
> - for (i = 0; i < csc->crelocs; i++) {
> - unsigned j, ndw = (csc->relocs_bo[i].bo->base.size + 3) >> 2;
> -
> - ptr = radeon_bo_do_map(csc->relocs_bo[i].bo);
> - if (ptr) {
> - fprintf(dump, "static uint32_t bo_%04d_data[%d] = {\n ", i, ndw);
> - for (j = 0; j < ndw; j++) {
> - if (j && !(j % 8)) {
> - uint32_t offset = (j - 8) << 2;
> - fprintf(dump, " /* [0x%08x] va[0x%016"PRIx64"] */\n ", offset, offset + csc->relocs_bo[i].bo->va);
> - }
> - fprintf(dump, " 0x%08x,", ptr[j]);
> - }
> - fprintf(dump, "};\n\n");
> - }
> - }
> -
> - fprintf(dump, "static uint32_t bo_relocs[%d] = {\n", csc->crelocs * 4);
> - for (i = 0; i < csc->crelocs; i++) {
> - fprintf(dump, " 0x%08x, 0x%08x, 0x%08x, 0x%08x,\n",
> - 0, csc->relocs[i].read_domains, csc->relocs[i].write_domain, csc->relocs[i].flags);
> - }
> - fprintf(dump, "};\n\n");
> -
> - fprintf(dump, "/* cs %d dw */\n", csc->chunks[0].length_dw);
> - fprintf(dump, "static uint32_t cs[] = {\n");
> - ptr = csc->buf;
> - for (i = 0; i < csc->chunks[0].length_dw; i++) {
> - fprintf(dump, " 0x%08x,\n", ptr[i]);
> - }
> - fprintf(dump, "};\n\n");
> -
> - fprintf(dump, "static uint32_t cs_flags[2] = {\n");
> - fprintf(dump, " 0x%08x,\n", csc->flags[0]);
> - fprintf(dump, " 0x%08x,\n", csc->flags[1]);
> - fprintf(dump, "};\n\n");
> -
> - fprintf(dump, "int main(int argc, char *argv[])\n");
> - fprintf(dump, "{\n");
> - fprintf(dump, " struct bo *bo[%d];\n", csc->crelocs);
> - fprintf(dump, " struct ctx ctx;\n");
> - fprintf(dump, "\n");
> - fprintf(dump, " ctx_init(&ctx);\n");
> - fprintf(dump, "\n");
> -
> - for (i = 0; i < csc->crelocs; i++) {
> - unsigned ndw = (csc->relocs_bo[i].bo->base.size + 3) >> 2;
> - uint32_t *ptr;
> -
> - ptr = radeon_bo_do_map(csc->relocs_bo[i].bo);
> - if (ptr) {
> - fprintf(dump, " bo[%d] = bo_new(&ctx, %d, bo_%04d_data, 0x%016"PRIx64", 0x%08x);\n",
> - i, ndw, i, csc->relocs_bo[i].bo->va, csc->relocs_bo[i].bo->base.alignment);
> - } else {
> - fprintf(dump, " bo[%d] = bo_new(&ctx, %d, NULL, 0x%016"PRIx64", 0x%08x);\n",
> - i, ndw, csc->relocs_bo[i].bo->va, csc->relocs_bo[i].bo->base.alignment);
> - }
> - }
> - fprintf(dump, "\n");
> - fprintf(dump, " ctx_cs(&ctx, cs, cs_flags, ARRAY_SIZE(cs), bo, bo_relocs, %d);\n", csc->crelocs);
> - fprintf(dump, "\n");
> - fprintf(dump, " fprintf(stderr, \"waiting for cs execution to end ....\\n\");\n");
> - fprintf(dump, " bo_wait(&ctx, bo[0]);\n");
> - fprintf(dump, "}\n");
> - fclose(dump);
> -}
> --
> 2.5.0
>
More information about the mesa-dev mailing list