[igt-dev] [PATCH igt] lib: Avoid rcu_barrier() for gem_quiescent_gpu()

Chris Wilson chris at chris-wilson.co.uk
Wed Jan 31 09:35:37 UTC 2018


Using DROP_FREED invokes an rcu_barrier() to ensure that all RCU
protected objects are freed before it returns. rcu_barrier() is a very
high latency operation (~50ms at best) which is only required under
specific circumstances such as when we need a stable object count. By
removing it from gem_quiescent_gpu() we can save over 10s across a BAT
run.

Signed-off-by: Chris Wilson <chris at chris-wilson.co.uk>
---
 lib/drmtest.c     |  3 +--
 lib/igt_debugfs.c | 14 ++++++++------
 lib/intel_os.c    | 15 +++++++++------
 3 files changed, 18 insertions(+), 14 deletions(-)

diff --git a/lib/drmtest.c b/lib/drmtest.c
index fd11f5f58..40bd6fec8 100644
--- a/lib/drmtest.c
+++ b/lib/drmtest.c
@@ -163,8 +163,7 @@ void gem_quiescent_gpu(int fd)
 {
 	igt_terminate_spin_batches();
 
-	igt_drop_caches_set(fd,
-			    DROP_ACTIVE | DROP_RETIRE | DROP_IDLE | DROP_FREED);
+	igt_drop_caches_set(fd, DROP_ACTIVE | DROP_RETIRE | DROP_IDLE);
 }
 
 /**
diff --git a/lib/igt_debugfs.c b/lib/igt_debugfs.c
index 1aec079c5..6d9d27d9c 100644
--- a/lib/igt_debugfs.c
+++ b/lib/igt_debugfs.c
@@ -977,13 +977,15 @@ static int get_object_count(int fd)
  */
 int igt_get_stable_obj_count(int driver)
 {
-	int obj_count;
-	gem_quiescent_gpu(driver);
-	obj_count = get_object_count(driver);
-	/* The test relies on the system being in the same state before and
+	/*
+	 * The test relies on the system being in the same state before and
 	 * after the test so any difference in the object count is a result of
-	 * leaks during the test. */
-	return obj_count;
+	 * leaks during the test.
+	 * */
+	igt_drop_caches_set(driver,
+			    DROP_ACTIVE | DROP_RETIRE | DROP_IDLE | DROP_FREED);
+
+	return get_object_count(driver);
 }
 
 void igt_debugfs_dump(int device, const char *filename)
diff --git a/lib/intel_os.c b/lib/intel_os.c
index bb2c16bf3..b5d9888d8 100644
--- a/lib/intel_os.c
+++ b/lib/intel_os.c
@@ -96,11 +96,6 @@ intel_get_avail_ram_mb(void)
 
 #ifdef HAVE_STRUCT_SYSINFO_TOTALRAM /* Linux */
 	struct sysinfo sysinf;
-	int fd;
-
-	fd = drm_open_driver(DRIVER_INTEL);
-	intel_purge_vm_caches(fd);
-	close(fd);
 
 	igt_assert(sysinfo(&sysinf) == 0);
 	retval = sysinf.freeram;
@@ -281,6 +276,12 @@ void intel_require_memory(uint64_t count, uint64_t size, unsigned mode)
 {
 	uint64_t required, total;
 
+	if (!__intel_check_memory(count, size, mode, &required, &total)) {
+		int fd = drm_open_driver(DRIVER_INTEL);
+		intel_purge_vm_caches(fd);
+		close(fd);
+	}
+
 	igt_require_f(__intel_check_memory(count, size, mode,
 					    &required, &total),
 		      "Estimated that we need %'llu objects and %'llu MiB for the test, but only have %'llu MiB available (%s%s) and a maximum of %'llu objects\n",
@@ -298,7 +299,9 @@ void intel_purge_vm_caches(int drm_fd)
 {
 	int fd;
 
-	igt_drop_caches_set(drm_fd, DROP_SHRINK_ALL | DROP_IDLE | DROP_FREED);
+	igt_drop_caches_set(drm_fd,
+			    DROP_ACTIVE | DROP_RETIRE | DROP_IDLE |
+			    DROP_SHRINK_ALL | DROP_FREED);
 
 	fd = open("/proc/sys/vm/drop_caches", O_WRONLY);
 	if (fd >= 0) {
-- 
2.15.1



More information about the igt-dev mailing list