[PATCH 3/3] mach64: optimize wait_for_fifo

Ville Syrjälä syrjala at sci.fi
Mon Aug 27 12:55:30 UTC 2018


On Sat, Aug 25, 2018 at 03:54:17PM -0400, Mikulas Patocka wrote:
> This is a simple optimization for fifo waiting that improves scrolling
> performance by 5%. If the queue has more free entries that what we
> consume, we can skip the costly register read next time.
> 
> Signed-off-by: Mikulas Patocka <mpatocka at redhat.com>
> 
> ---
>  drivers/video/fbdev/aty/atyfb.h        |   12 ++++++++----
>  drivers/video/fbdev/aty/mach64_accel.c |    4 +++-
>  2 files changed, 11 insertions(+), 5 deletions(-)
> 
> Index: linux-stable/drivers/video/fbdev/aty/atyfb.h
> ===================================================================
> --- linux-stable.orig/drivers/video/fbdev/aty/atyfb.h	2018-08-25 21:49:16.000000000 +0200
> +++ linux-stable/drivers/video/fbdev/aty/atyfb.h	2018-08-25 21:52:51.000000000 +0200
> @@ -147,6 +147,7 @@ struct atyfb_par {
>  	u16 pci_id;
>  	u32 accel_flags;
>  	int blitter_may_be_busy;
> +	unsigned fifo_space;
>  	int asleep;
>  	int lock_blank;
>  	unsigned long res_start;
> @@ -346,10 +347,13 @@ extern int aty_init_cursor(struct fb_inf
>       *  Hardware acceleration
>       */
>  
> -static inline void wait_for_fifo(u16 entries, const struct atyfb_par *par)
> +static inline void wait_for_fifo(u16 entries, struct atyfb_par *par)
>  {
> -	while ((aty_ld_le32(FIFO_STAT, par) & 0xffff) >
> -	       ((u32) (0x8000 >> entries)));
> +	unsigned fifo_space = par->fifo_space;
> +	while (entries > fifo_space) {
> +		fifo_space = 16 - fls(aty_ld_le32(FIFO_STAT, par) & 0xffff);

I don't recall off hand which way this register works, but based
on the existing code this looks correct.

Reviewed-by: Ville Syrjälä <syrjala at sci.fi>

> +	}
> +	par->fifo_space = fifo_space - entries;
>  }
>  
>  static inline void wait_for_idle(struct atyfb_par *par)
> @@ -359,7 +363,7 @@ static inline void wait_for_idle(struct
>  	par->blitter_may_be_busy = 0;
>  }
>  
> -extern void aty_reset_engine(const struct atyfb_par *par);
> +extern void aty_reset_engine(struct atyfb_par *par);
>  extern void aty_init_engine(struct atyfb_par *par, struct fb_info *info);
>  
>  void atyfb_copyarea(struct fb_info *info, const struct fb_copyarea *area);
> Index: linux-stable/drivers/video/fbdev/aty/mach64_accel.c
> ===================================================================
> --- linux-stable.orig/drivers/video/fbdev/aty/mach64_accel.c	2018-08-25 21:49:16.000000000 +0200
> +++ linux-stable/drivers/video/fbdev/aty/mach64_accel.c	2018-08-25 21:49:16.000000000 +0200
> @@ -37,7 +37,7 @@ static u32 rotation24bpp(u32 dx, u32 dir
>  	return ((rotation << 8) | DST_24_ROTATION_ENABLE);
>  }
>  
> -void aty_reset_engine(const struct atyfb_par *par)
> +void aty_reset_engine(struct atyfb_par *par)
>  {
>  	/* reset engine */
>  	aty_st_le32(GEN_TEST_CNTL,
> @@ -50,6 +50,8 @@ void aty_reset_engine(const struct atyfb
>  	/* HOST errors */
>  	aty_st_le32(BUS_CNTL,
>  		aty_ld_le32(BUS_CNTL, par) | BUS_HOST_ERR_ACK | BUS_FIFO_ERR_ACK, par);
> +
> +	par->fifo_space = 0;
>  }
>  
>  static void reset_GTC_3D_engine(const struct atyfb_par *par)

-- 
Ville Syrjälä
syrjala at sci.fi
http://www.sci.fi/~syrjala/


More information about the dri-devel mailing list