[Mesa-dev] [PATCH 1/2] i965: Remove hand-rolled memcpy implementation.

Ian Romanick idr at freedesktop.org
Mon Feb 23 11:41:25 PST 2015


On 02/22/2015 08:40 PM, Matt Turner wrote:
> ---
> I can't believe this is beneficial, especially since it came from the
> i915tex import.

My recollection is that memcpy does some weird optimizations (copying
from the end first) that assume the memory is mapped in a certain way.  We
don't necessarily map memory that way, and those optimizations hurt
quite a bit.  It's worth testing, especially on Atom.

>  src/mesa/drivers/dri/i965/brw_context.h       | 27 ---------------------------
>  src/mesa/drivers/dri/i965/intel_batchbuffer.c |  2 +-
>  2 files changed, 1 insertion(+), 28 deletions(-)
> 
> diff --git a/src/mesa/drivers/dri/i965/brw_context.h b/src/mesa/drivers/dri/i965/brw_context.h
> index 197ed3e..7e86c1b 100644
> --- a/src/mesa/drivers/dri/i965/brw_context.h
> +++ b/src/mesa/drivers/dri/i965/brw_context.h
> @@ -1920,33 +1920,6 @@ gen6_upload_push_constants(struct brw_context *brw,
>                             struct brw_stage_state *stage_state,
>                             enum aub_state_struct_type type);
>  
> -/* ================================================================
> - * From linux kernel i386 header files, copes with odd sizes better
> - * than COPY_DWORDS would:
> - * XXX Put this in src/mesa/main/imports.h ???
> - */
> -#if defined(i386) || defined(__i386__)
> -static inline void * __memcpy(void * to, const void * from, size_t n)
> -{
> -   int d0, d1, d2;
> -   __asm__ __volatile__(
> -      "rep ; movsl\n\t"
> -      "testb $2,%b4\n\t"
> -      "je 1f\n\t"
> -      "movsw\n"
> -      "1:\ttestb $1,%b4\n\t"
> -      "je 2f\n\t"
> -      "movsb\n"
> -      "2:"
> -      : "=&c" (d0), "=&D" (d1), "=&S" (d2)
> -      :"0" (n/4), "q" (n),"1" ((long) to),"2" ((long) from)
> -      : "memory");
> -   return (to);
> -}
> -#else
> -#define __memcpy(a,b,c) memcpy(a,b,c)
> -#endif
> -
>  #ifdef __cplusplus
>  }
>  #endif
> diff --git a/src/mesa/drivers/dri/i965/intel_batchbuffer.c b/src/mesa/drivers/dri/i965/intel_batchbuffer.c
> index 7b96005..45c7493 100644
> --- a/src/mesa/drivers/dri/i965/intel_batchbuffer.c
> +++ b/src/mesa/drivers/dri/i965/intel_batchbuffer.c
> @@ -390,7 +390,7 @@ intel_batchbuffer_data(struct brw_context *brw,
>  {
>     assert((bytes & 3) == 0);
>     intel_batchbuffer_require_space(brw, bytes, ring);
> -   __memcpy(brw->batch.map + brw->batch.used, data, bytes);
> +   memcpy(brw->batch.map + brw->batch.used, data, bytes);
>     brw->batch.used += bytes >> 2;
>  }
>  
> 



More information about the mesa-dev mailing list