[PATCH v3 09/10] tools: update hmm-test to support device coherent type

Alistair Popple apopple at nvidia.com
Thu Jan 20 06:14:49 UTC 2022


On Tuesday, 11 January 2022 9:32:00 AM AEDT Alex Sierra wrote:
> Test cases such as migrate_fault and migrate_multiple, were modified to
> explicit migrate from device to sys memory without the need of page
> faults, when using device coherent type.
> 
> Snapshot test case updated to read memory device type first and based
> on that, get the proper returned results migrate_ping_pong test case

Where is the migrate_ping_pong test? Did you perhaps forget to add it? :-)

> added to test explicit migration from device to sys memory for both
> private and coherent zone types.
> 
> Helpers to migrate from device to sys memory and vicerversa
> were also added.
> 
> Signed-off-by: Alex Sierra <alex.sierra at amd.com>
> ---
> v2:
> Set FIXTURE_VARIANT to add multiple device types to the FIXTURE. This
> will run all the tests for each device type (private and coherent) in
> case both existed during hmm-test driver probed.
> ---
>  tools/testing/selftests/vm/hmm-tests.c | 122 ++++++++++++++++++++-----
>  1 file changed, 101 insertions(+), 21 deletions(-)
> 
> diff --git a/tools/testing/selftests/vm/hmm-tests.c b/tools/testing/selftests/vm/hmm-tests.c
> index 864f126ffd78..8eb81dfba4b3 100644
> --- a/tools/testing/selftests/vm/hmm-tests.c
> +++ b/tools/testing/selftests/vm/hmm-tests.c
> @@ -44,6 +44,14 @@ struct hmm_buffer {
>  	int		fd;
>  	uint64_t	cpages;
>  	uint64_t	faults;
> +	int		zone_device_type;
> +};
> +
> +enum {
> +	HMM_PRIVATE_DEVICE_ONE,
> +	HMM_PRIVATE_DEVICE_TWO,
> +	HMM_COHERENCE_DEVICE_ONE,
> +	HMM_COHERENCE_DEVICE_TWO,
>  };
>  
>  #define TWOMEG		(1 << 21)
> @@ -60,6 +68,21 @@ FIXTURE(hmm)
>  	unsigned int	page_shift;
>  };
>  
> +FIXTURE_VARIANT(hmm)
> +{
> +	int     device_number;
> +};
> +
> +FIXTURE_VARIANT_ADD(hmm, hmm_device_private)
> +{
> +	.device_number = HMM_PRIVATE_DEVICE_ONE,
> +};
> +
> +FIXTURE_VARIANT_ADD(hmm, hmm_device_coherent)
> +{
> +	.device_number = HMM_COHERENCE_DEVICE_ONE,
> +};
> +
>  FIXTURE(hmm2)
>  {
>  	int		fd0;
> @@ -68,6 +91,24 @@ FIXTURE(hmm2)
>  	unsigned int	page_shift;
>  };
>  
> +FIXTURE_VARIANT(hmm2)
> +{
> +	int     device_number0;
> +	int     device_number1;
> +};
> +
> +FIXTURE_VARIANT_ADD(hmm2, hmm2_device_private)
> +{
> +	.device_number0 = HMM_PRIVATE_DEVICE_ONE,
> +	.device_number1 = HMM_PRIVATE_DEVICE_TWO,
> +};
> +
> +FIXTURE_VARIANT_ADD(hmm2, hmm2_device_coherent)
> +{
> +	.device_number0 = HMM_COHERENCE_DEVICE_ONE,
> +	.device_number1 = HMM_COHERENCE_DEVICE_TWO,
> +};
> +
>  static int hmm_open(int unit)
>  {
>  	char pathname[HMM_PATH_MAX];
> @@ -81,12 +122,19 @@ static int hmm_open(int unit)
>  	return fd;
>  }
>  
> +static bool hmm_is_coherent_type(int dev_num)
> +{
> +	return (dev_num >= HMM_COHERENCE_DEVICE_ONE);
> +}
> +
>  FIXTURE_SETUP(hmm)
>  {
>  	self->page_size = sysconf(_SC_PAGE_SIZE);
>  	self->page_shift = ffs(self->page_size) - 1;
>  
> -	self->fd = hmm_open(0);
> +	self->fd = hmm_open(variant->device_number);
> +	if (self->fd < 0 && hmm_is_coherent_type(variant->device_number))
> +		SKIP(exit(0), "DEVICE_COHERENT not available");
>  	ASSERT_GE(self->fd, 0);
>  }
>  
> @@ -95,9 +143,11 @@ FIXTURE_SETUP(hmm2)
>  	self->page_size = sysconf(_SC_PAGE_SIZE);
>  	self->page_shift = ffs(self->page_size) - 1;
>  
> -	self->fd0 = hmm_open(0);
> +	self->fd0 = hmm_open(variant->device_number0);
> +	if (self->fd0 < 0 && hmm_is_coherent_type(variant->device_number0))
> +		SKIP(exit(0), "DEVICE_COHERENT not available");
>  	ASSERT_GE(self->fd0, 0);
> -	self->fd1 = hmm_open(1);
> +	self->fd1 = hmm_open(variant->device_number1);
>  	ASSERT_GE(self->fd1, 0);
>  }
>  
> @@ -144,6 +194,7 @@ static int hmm_dmirror_cmd(int fd,
>  	}
>  	buffer->cpages = cmd.cpages;
>  	buffer->faults = cmd.faults;
> +	buffer->zone_device_type = cmd.zone_device_type;
>  
>  	return 0;
>  }
> @@ -211,6 +262,20 @@ static void hmm_nanosleep(unsigned int n)
>  	nanosleep(&t, NULL);
>  }
>  
> +static int hmm_migrate_sys_to_dev(int fd,
> +				   struct hmm_buffer *buffer,
> +				   unsigned long npages)
> +{
> +	return hmm_dmirror_cmd(fd, HMM_DMIRROR_MIGRATE_TO_DEV, buffer, npages);
> +}
> +
> +static int hmm_migrate_dev_to_sys(int fd,
> +				   struct hmm_buffer *buffer,
> +				   unsigned long npages)
> +{
> +	return hmm_dmirror_cmd(fd, HMM_DMIRROR_MIGRATE_TO_SYS, buffer, npages);
> +}
> +
>  /*
>   * Simple NULL test of device open/close.
>   */
> @@ -875,7 +940,7 @@ TEST_F(hmm, migrate)
>  		ptr[i] = i;
>  
>  	/* Migrate memory to device. */
> -	ret = hmm_dmirror_cmd(self->fd, HMM_DMIRROR_MIGRATE, buffer, npages);
> +	ret = hmm_migrate_sys_to_dev(self->fd, buffer, npages);
>  	ASSERT_EQ(ret, 0);
>  	ASSERT_EQ(buffer->cpages, npages);
>  
> @@ -923,7 +988,7 @@ TEST_F(hmm, migrate_fault)
>  		ptr[i] = i;
>  
>  	/* Migrate memory to device. */
> -	ret = hmm_dmirror_cmd(self->fd, HMM_DMIRROR_MIGRATE, buffer, npages);
> +	ret = hmm_migrate_sys_to_dev(self->fd, buffer, npages);
>  	ASSERT_EQ(ret, 0);
>  	ASSERT_EQ(buffer->cpages, npages);
>  
> @@ -936,7 +1001,7 @@ TEST_F(hmm, migrate_fault)
>  		ASSERT_EQ(ptr[i], i);
>  
>  	/* Migrate memory to the device again. */
> -	ret = hmm_dmirror_cmd(self->fd, HMM_DMIRROR_MIGRATE, buffer, npages);
> +	ret = hmm_migrate_sys_to_dev(self->fd, buffer, npages);
>  	ASSERT_EQ(ret, 0);
>  	ASSERT_EQ(buffer->cpages, npages);
>  
> @@ -976,7 +1041,7 @@ TEST_F(hmm, migrate_shared)
>  	ASSERT_NE(buffer->ptr, MAP_FAILED);
>  
>  	/* Migrate memory to device. */
> -	ret = hmm_dmirror_cmd(self->fd, HMM_DMIRROR_MIGRATE, buffer, npages);
> +	ret = hmm_migrate_sys_to_dev(self->fd, buffer, npages);
>  	ASSERT_EQ(ret, -ENOENT);
>  
>  	hmm_buffer_free(buffer);
> @@ -1015,7 +1080,7 @@ TEST_F(hmm2, migrate_mixed)
>  	p = buffer->ptr;
>  
>  	/* Migrating a protected area should be an error. */
> -	ret = hmm_dmirror_cmd(self->fd1, HMM_DMIRROR_MIGRATE, buffer, npages);
> +	ret = hmm_migrate_sys_to_dev(self->fd1, buffer, npages);
>  	ASSERT_EQ(ret, -EINVAL);
>  
>  	/* Punch a hole after the first page address. */
> @@ -1023,7 +1088,7 @@ TEST_F(hmm2, migrate_mixed)
>  	ASSERT_EQ(ret, 0);
>  
>  	/* We expect an error if the vma doesn't cover the range. */
> -	ret = hmm_dmirror_cmd(self->fd1, HMM_DMIRROR_MIGRATE, buffer, 3);
> +	ret = hmm_migrate_sys_to_dev(self->fd1, buffer, 3);
>  	ASSERT_EQ(ret, -EINVAL);
>  
>  	/* Page 2 will be a read-only zero page. */
> @@ -1055,13 +1120,13 @@ TEST_F(hmm2, migrate_mixed)
>  
>  	/* Now try to migrate pages 2-5 to device 1. */
>  	buffer->ptr = p + 2 * self->page_size;
> -	ret = hmm_dmirror_cmd(self->fd1, HMM_DMIRROR_MIGRATE, buffer, 4);
> +	ret = hmm_migrate_sys_to_dev(self->fd1, buffer, 4);
>  	ASSERT_EQ(ret, 0);
>  	ASSERT_EQ(buffer->cpages, 4);
>  
>  	/* Page 5 won't be migrated to device 0 because it's on device 1. */
>  	buffer->ptr = p + 5 * self->page_size;
> -	ret = hmm_dmirror_cmd(self->fd0, HMM_DMIRROR_MIGRATE, buffer, 1);
> +	ret = hmm_migrate_sys_to_dev(self->fd0, buffer, 1);
>  	ASSERT_EQ(ret, -ENOENT);
>  	buffer->ptr = p;
>  
> @@ -1070,8 +1135,12 @@ TEST_F(hmm2, migrate_mixed)
>  }
>  
>  /*
> - * Migrate anonymous memory to device private memory and fault it back to system
> - * memory multiple times.
> + * Migrate anonymous memory to device memory and back to system memory
> + * multiple times. In case of private zone configuration, this is done
> + * through fault pages accessed by CPU. In case of coherent zone configuration,
> + * the pages from the device should be explicitly migrated back to system memory.
> + * The reason is Coherent device zone has coherent access by CPU, therefore
> + * it will not generate any page fault.
>   */
>  TEST_F(hmm, migrate_multiple)
>  {
> @@ -1107,8 +1176,7 @@ TEST_F(hmm, migrate_multiple)
>  			ptr[i] = i;
>  
>  		/* Migrate memory to device. */
> -		ret = hmm_dmirror_cmd(self->fd, HMM_DMIRROR_MIGRATE, buffer,
> -				      npages);
> +		ret = hmm_migrate_sys_to_dev(self->fd, buffer, npages);
>  		ASSERT_EQ(ret, 0);
>  		ASSERT_EQ(buffer->cpages, npages);
>  
> @@ -1116,7 +1184,12 @@ TEST_F(hmm, migrate_multiple)
>  		for (i = 0, ptr = buffer->mirror; i < size / sizeof(*ptr); ++i)
>  			ASSERT_EQ(ptr[i], i);
>  
> -		/* Fault pages back to system memory and check them. */
> +		/* Migrate back to system memory and check them. */
> +		if (hmm_is_coherent_type(variant->device_number)) {
> +			ret = hmm_migrate_dev_to_sys(self->fd, buffer, npages);

So I think this will still pass even if nothing migrates so as mentioned on
the previous patch I think we need to check for the number of pages that
actually migrated. Alternatively I suppose you could do a snapshot and check
that, but that seems like it would be harder. Otherwise I think this looks
good.

> +			ASSERT_EQ(ret, 0);
> +		}
> +
>  		for (i = 0, ptr = buffer->ptr; i < size / sizeof(*ptr); ++i)
>  			ASSERT_EQ(ptr[i], i);
>  
> @@ -1312,13 +1385,13 @@ TEST_F(hmm2, snapshot)
>  
>  	/* Page 5 will be migrated to device 0. */
>  	buffer->ptr = p + 5 * self->page_size;
> -	ret = hmm_dmirror_cmd(self->fd0, HMM_DMIRROR_MIGRATE, buffer, 1);
> +	ret = hmm_migrate_sys_to_dev(self->fd0, buffer, 1);
>  	ASSERT_EQ(ret, 0);
>  	ASSERT_EQ(buffer->cpages, 1);
>  
>  	/* Page 6 will be migrated to device 1. */
>  	buffer->ptr = p + 6 * self->page_size;
> -	ret = hmm_dmirror_cmd(self->fd1, HMM_DMIRROR_MIGRATE, buffer, 1);
> +	ret = hmm_migrate_sys_to_dev(self->fd1, buffer, 1);
>  	ASSERT_EQ(ret, 0);
>  	ASSERT_EQ(buffer->cpages, 1);
>  
> @@ -1335,9 +1408,16 @@ TEST_F(hmm2, snapshot)
>  	ASSERT_EQ(m[2], HMM_DMIRROR_PROT_ZERO | HMM_DMIRROR_PROT_READ);
>  	ASSERT_EQ(m[3], HMM_DMIRROR_PROT_READ);
>  	ASSERT_EQ(m[4], HMM_DMIRROR_PROT_WRITE);
> -	ASSERT_EQ(m[5], HMM_DMIRROR_PROT_DEV_PRIVATE_LOCAL |
> -			HMM_DMIRROR_PROT_WRITE);
> -	ASSERT_EQ(m[6], HMM_DMIRROR_PROT_NONE);
> +	if (!hmm_is_coherent_type(variant->device_number0)) {
> +		ASSERT_EQ(m[5], HMM_DMIRROR_PROT_DEV_PRIVATE_LOCAL |
> +				HMM_DMIRROR_PROT_WRITE);
> +		ASSERT_EQ(m[6], HMM_DMIRROR_PROT_NONE);
> +	} else {
> +		ASSERT_EQ(m[5], HMM_DMIRROR_PROT_DEV_COHERENT_LOCAL |
> +				HMM_DMIRROR_PROT_WRITE);
> +		ASSERT_EQ(m[6], HMM_DMIRROR_PROT_DEV_COHERENT_REMOTE |
> +				HMM_DMIRROR_PROT_WRITE);
> +	}
>  
>  	hmm_buffer_free(buffer);
>  }
> 






More information about the amd-gfx mailing list