[Mesa-dev] [PATCH 1/3] util/disk_cache: use LRU eviction rather than random eviction (v2)

Timothy Arceri tarceri at itsqueeze.com
Fri Mar 10 04:23:08 UTC 2017


On 07/03/17 12:25, Alan Swanson wrote:
> Still using random selection of two-character subdirectory in which
> to check cache files rather than scanning entire cache.
>
> v2: Factor out double strlen call
> ---
>  src/util/disk_cache.c | 78 +++++++++++++++++++++++----------------------------
>  1 file changed, 35 insertions(+), 43 deletions(-)
>
> diff --git a/src/util/disk_cache.c b/src/util/disk_cache.c
> index 31a9336582..2a923be3dc 100644
> --- a/src/util/disk_cache.c
> +++ b/src/util/disk_cache.c
> @@ -438,70 +438,60 @@ make_cache_file_directory(struct disk_cache *cache, const cache_key key)
>     free(dir);
>  }
>
> -/* Given a directory path and predicate function, count all entries in
> - * that directory for which the predicate returns true. Then choose a
> - * random entry from among those counted.
> +/* Given a directory path and predicate function, find the entry with
> + * the oldest access time in that directory for which the predicate
> + * returns true.
>   *
>   * Returns: A malloc'ed string for the path to the chosen file, (or
>   * NULL on any error). The caller should free the string when
>   * finished.
>   */
>  static char *
> -choose_random_file_matching(const char *dir_path,
> -                            bool (*predicate)(const struct dirent *,
> -                                              const char *dir_path))
> +choose_lru_file_matching(const char *dir_path,
> +                         bool (*predicate)(const struct dirent *,
> +                                           const char *dir_path))
>  {
>     DIR *dir;
>     struct dirent *entry;
> -   unsigned int count, victim;
> +   struct stat sb;
> +   char *tmp, *lru_name = NULL;
> +   size_t len;
> +   time_t lru_atime = 0;

Please try to declare variables where they are used. The original 
version of this file was written before we could use C99 features in Mesa.


>     char *filename;
>
>     dir = opendir(dir_path);
>     if (dir == NULL)
>        return NULL;
>
> -   count = 0;
> -
> -   while (1) {
> -      entry = readdir(dir);
> -      if (entry == NULL)
> -         break;
> -      if (!predicate(entry, dir_path))
> -         continue;
> -
> -      count++;
> -   }
> -
> -   if (count == 0) {
> -      closedir(dir);
> -      return NULL;
> -   }
> -
> -   victim = rand() % count;
> -
> -   rewinddir(dir);
> -   count = 0;
> -
>     while (1) {
>        entry = readdir(dir);
>        if (entry == NULL)
>           break;
>        if (!predicate(entry, dir_path))
>           continue;
> -      if (count == victim)
> -         break;
>
> -      count++;
> +      if (fstatat(dirfd(dir), entry->d_name, &sb, 0) == 0) {
> +         if (!lru_atime || (sb.st_atime < lru_atime)) {
> +            len = strlen(entry->d_name) + 1;
> +            tmp = realloc(lru_name, len);
> +            if (tmp) {
> +               lru_name = tmp;

I don't think we need tmp here. Why not use lru_name directly?

With these couple of nits addressed and the make check test updated for 
patch 2 this series looks good to me. Thanks for writing it.

If you can send these updates I'll push it once we have moved this stuff 
off into a thread [1].

[1] https://lists.freedesktop.org/archives/mesa-dev/2017-March/147442.html

> +               memcpy(lru_name, entry->d_name, len);
> +               lru_atime = sb.st_atime;
> +            }
> +         }
> +      }
>     }
>
> -   if (entry == NULL) {
> +   if (lru_name == NULL) {
>        closedir(dir);
>        return NULL;
>     }
>
> -   if (asprintf(&filename, "%s/%s", dir_path, entry->d_name) < 0)
> +   if (asprintf(&filename, "%s/%s", dir_path, lru_name) < 0)
>        filename = NULL;
>
> +   free(lru_name);
>     closedir(dir);
>
>     return filename;
> @@ -533,12 +523,12 @@ is_regular_non_tmp_file(const struct dirent *entry, const char *path)
>
>  /* Returns the size of the deleted file, (or 0 on any error). */
>  static size_t
> -unlink_random_file_from_directory(const char *path)
> +unlink_lru_file_from_directory(const char *path)
>  {
>     struct stat sb;
>     char *filename;
>
> -   filename = choose_random_file_matching(path, is_regular_non_tmp_file);
> +   filename = choose_lru_file_matching(path, is_regular_non_tmp_file);
>     if (filename == NULL)
>        return 0;
>
> @@ -581,7 +571,7 @@ is_two_character_sub_directory(const struct dirent *entry, const char *path)
>  }
>
>  static void
> -evict_random_item(struct disk_cache *cache)
> +evict_lru_item(struct disk_cache *cache)
>  {
>     const char hex[] = "0123456789abcde";
>     char *dir_path;
> @@ -591,6 +581,7 @@ evict_random_item(struct disk_cache *cache)
>     /* With a reasonably-sized, full cache, (and with keys generated
>      * from a cryptographic hash), we can choose two random hex digits
>      * and reasonably expect the directory to exist with a file in it.
> +    * Provides pseudo-LRU eviction to reduce checking all cache files.
>      */
>     a = rand() % 16;
>     b = rand() % 16;
> @@ -598,7 +589,7 @@ evict_random_item(struct disk_cache *cache)
>     if (asprintf(&dir_path, "%s/%c%c", cache->path, hex[a], hex[b]) < 0)
>        return;
>
> -   size = unlink_random_file_from_directory(dir_path);
> +   size = unlink_lru_file_from_directory(dir_path);
>
>     free(dir_path);
>
> @@ -608,18 +599,19 @@ evict_random_item(struct disk_cache *cache)
>     }
>
>     /* In the case where the random choice of directory didn't find
> -    * something, we choose randomly from the existing directories.
> +    * something, we choose the least recently accessed from the
> +    * existing directories.
>      *
>      * Really, the only reason this code exists is to allow the unit
>      * tests to work, (which use an artificially-small cache to be able
>      * to force a single cached item to be evicted).
>      */
> -   dir_path = choose_random_file_matching(cache->path,
> -                                          is_two_character_sub_directory);
> +   dir_path = choose_lru_file_matching(cache->path,
> +                                       is_two_character_sub_directory);
>     if (dir_path == NULL)
>        return;
>
> -   size = unlink_random_file_from_directory(dir_path);
> +   size = unlink_lru_file_from_directory(dir_path);
>
>     free(dir_path);
>
> @@ -788,7 +780,7 @@ disk_cache_put(struct disk_cache *cache,
>      * else first.
>      */
>     if (*cache->size + size > cache->max_size)
> -      evict_random_item(cache);
> +      evict_lru_item(cache);
>
>     /* Create CRC of the data and store at the start of the file. We will
>      * read this when restoring the cache and use it to check for corruption.
>


More information about the mesa-dev mailing list