On 27/03/2024 20:04, Mirsad Todorovac wrote:
On 3/27/24 11:41, Joao Martins wrote:
On 25/03/2024 13:52, Jason Gunthorpe wrote:
On Mon, Mar 25, 2024 at 12:17:28PM +0000, Joao Martins wrote:
However, I am not smart enough to figure out why ...
Apparently, from the source, mmap() fails to allocate pages on the desired address:
1746 assert((uintptr_t)self->buffer % HUGEPAGE_SIZE == 0); 1747 vrc = mmap(self->buffer, variant->buffer_size, PROT_READ | PROT_WRITE, 1748 mmap_flags, -1, 0); → 1749 assert(vrc == self->buffer); 1750
But I am not that deep into the source to figure our what was intended and what went wrong :-/
I can SKIP() the test rather assert() in here if it helps. Though there are other tests that fail if no hugetlb pages are reserved.
But I am not sure if this is problem here as the initial bug email had an enterily different set of failures? Maybe all you need is an assert() and it gets into this state?
I feel like there is something wrong with the kselftest framework, there should be some way to fail the setup/teardown operations without triggering an infinite loop :(
I am now wondering if the problem is the fact that we have an assert() in the middle of FIXTURE_{TEST,SETUP} whereby we should be having ASSERT_TRUE() (or any other kselftest macro that). The expect/assert macros from kselftest() don't do asserts and it looks like we are failing mid tests in the assert().
Maybe it is OK for setup_sizes(), but maybe not OK for the rest (i.e. during the actual setup / tests). I can throw a patch there to see if this helps Mirsad.
Well, we are in the job of making the kernel better and as bug free as we can.
Maybe we should not delve too much into detail: is this a kernel bug, or the kselftest program bug?
I think the latter thus far. See at the end.
Some people already mentioned that I might have sysctl variable problems. I don't see what the mmap() HUGEPAGE allocation at fixed address was meant to prove?
That just sounds like the setup -- you need hugepages to run all iommufd tests. Most of my comments is about what your first report email in this thread on the selftest getting stuck at 99%
If the use of assert() within test/setup is the issue then snip below should fix it. But if Jason is right it won't make a difference. I think this infinite loop is __bail() where we are doing a longjmp() in a loop once a ASSERT*() fails but it only happens if we use these ASSERT() functions. Maybe this is because in some test functions we end up doing ASSERTs within ASSERTs?
--->8---
diff --git a/tools/testing/selftests/iommu/iommufd.c b/tools/testing/selftests/iommu/iommufd.c index edf1c99c9936..d2661a13a4f2 100644 --- a/tools/testing/selftests/iommu/iommufd.c +++ b/tools/testing/selftests/iommu/iommufd.c @@ -353,34 +353,34 @@ TEST_F(iommufd_ioas, alloc_hwpt_nested) test_err_hwpt_invalidate(ENOENT, parent_hwpt_id, inv_reqs, IOMMU_HWPT_INVALIDATE_DATA_SELFTEST, sizeof(*inv_reqs), &num_inv); - assert(!num_inv); + ASSERT_TRUE(!num_inv);
/* Check data_type by passing zero-length array */ num_inv = 0; test_cmd_hwpt_invalidate(nested_hwpt_id[0], inv_reqs, IOMMU_HWPT_INVALIDATE_DATA_SELFTEST, sizeof(*inv_reqs), &num_inv); - assert(!num_inv); + ASSERT_TRUE(!num_inv);
/* Negative test: Invalid data_type */ num_inv = 1; test_err_hwpt_invalidate(EINVAL, nested_hwpt_id[0], inv_reqs, IOMMU_HWPT_INVALIDATE_DATA_SELFTEST_INVALID, sizeof(*inv_reqs), &num_inv); - assert(!num_inv); + ASSERT_TRUE(!num_inv);
/* Negative test: structure size sanity */ num_inv = 1; test_err_hwpt_invalidate(EINVAL, nested_hwpt_id[0], inv_reqs, IOMMU_HWPT_INVALIDATE_DATA_SELFTEST, sizeof(*inv_reqs) + 1, &num_inv); - assert(!num_inv); + ASSERT_TRUE(!num_inv);
num_inv = 1; test_err_hwpt_invalidate(EINVAL, nested_hwpt_id[0], inv_reqs, IOMMU_HWPT_INVALIDATE_DATA_SELFTEST, 1, &num_inv); - assert(!num_inv); + ASSERT_TRUE(!num_inv);
/* Negative test: invalid flag is passed */ num_inv = 1; @@ -388,7 +388,7 @@ TEST_F(iommufd_ioas, alloc_hwpt_nested) test_err_hwpt_invalidate(EOPNOTSUPP, nested_hwpt_id[0], inv_reqs, IOMMU_HWPT_INVALIDATE_DATA_SELFTEST, sizeof(*inv_reqs), &num_inv); - assert(!num_inv); + ASSERT_TRUE(!num_inv);
/* Negative test: invalid data_uptr when array is not empty */ num_inv = 1; @@ -396,7 +396,7 @@ TEST_F(iommufd_ioas, alloc_hwpt_nested) test_err_hwpt_invalidate(EINVAL, nested_hwpt_id[0], NULL, IOMMU_HWPT_INVALIDATE_DATA_SELFTEST, sizeof(*inv_reqs), &num_inv); - assert(!num_inv); + ASSERT_TRUE(!num_inv);
/* Negative test: invalid entry_len when array is not empty */ num_inv = 1; @@ -404,7 +404,7 @@ TEST_F(iommufd_ioas, alloc_hwpt_nested) test_err_hwpt_invalidate(EINVAL, nested_hwpt_id[0], inv_reqs, IOMMU_HWPT_INVALIDATE_DATA_SELFTEST, 0, &num_inv); - assert(!num_inv); + ASSERT_TRUE(!num_inv);
/* Negative test: invalid iotlb_id */ num_inv = 1; @@ -413,7 +413,7 @@ TEST_F(iommufd_ioas, alloc_hwpt_nested) test_err_hwpt_invalidate(EINVAL, nested_hwpt_id[0], inv_reqs, IOMMU_HWPT_INVALIDATE_DATA_SELFTEST, sizeof(*inv_reqs), &num_inv); - assert(!num_inv); + ASSERT_TRUE(!num_inv);
/* * Invalidate the 1st iotlb entry but fail the 2nd request @@ -427,7 +427,7 @@ TEST_F(iommufd_ioas, alloc_hwpt_nested) test_err_hwpt_invalidate(EOPNOTSUPP, nested_hwpt_id[0], inv_reqs, IOMMU_HWPT_INVALIDATE_DATA_SELFTEST, sizeof(*inv_reqs), &num_inv); - assert(num_inv == 1); + ASSERT_TRUE(num_inv == 1); test_cmd_hwpt_check_iotlb(nested_hwpt_id[0], 0, 0); test_cmd_hwpt_check_iotlb(nested_hwpt_id[0], 1, IOMMU_TEST_IOTLB_DEFAULT); @@ -448,7 +448,7 @@ TEST_F(iommufd_ioas, alloc_hwpt_nested) test_err_hwpt_invalidate(EINVAL, nested_hwpt_id[0], inv_reqs, IOMMU_HWPT_INVALIDATE_DATA_SELFTEST, sizeof(*inv_reqs), &num_inv); - assert(num_inv == 1); + ASSERT_TRUE(num_inv == 1); test_cmd_hwpt_check_iotlb(nested_hwpt_id[0], 0, 0); test_cmd_hwpt_check_iotlb(nested_hwpt_id[0], 1, IOMMU_TEST_IOTLB_DEFAULT); @@ -464,7 +464,7 @@ TEST_F(iommufd_ioas, alloc_hwpt_nested) test_cmd_hwpt_invalidate(nested_hwpt_id[0], inv_reqs, IOMMU_HWPT_INVALIDATE_DATA_SELFTEST, sizeof(*inv_reqs), &num_inv); - assert(num_inv == 1); + ASSERT_TRUE(num_inv == 1); test_cmd_hwpt_check_iotlb(nested_hwpt_id[0], 0, 0); test_cmd_hwpt_check_iotlb(nested_hwpt_id[0], 1, 0); test_cmd_hwpt_check_iotlb(nested_hwpt_id[0], 2, @@ -481,7 +481,7 @@ TEST_F(iommufd_ioas, alloc_hwpt_nested) test_cmd_hwpt_invalidate(nested_hwpt_id[0], inv_reqs, IOMMU_HWPT_INVALIDATE_DATA_SELFTEST, sizeof(*inv_reqs), &num_inv); - assert(num_inv == 2); + ASSERT_TRUE(num_inv == 2); test_cmd_hwpt_check_iotlb_all(nested_hwpt_id[0], 0);
/* Invalidate all iotlb entries for nested_hwpt_id[1] and verify */ @@ -490,7 +490,7 @@ TEST_F(iommufd_ioas, alloc_hwpt_nested) test_cmd_hwpt_invalidate(nested_hwpt_id[1], inv_reqs, IOMMU_HWPT_INVALIDATE_DATA_SELFTEST, sizeof(*inv_reqs), &num_inv); - assert(num_inv == 1); + ASSERT_TRUE(num_inv == 1); test_cmd_hwpt_check_iotlb_all(nested_hwpt_id[1], 0);
/* Attach device to nested_hwpt_id[0] that then will be busy */ @@ -1743,10 +1743,14 @@ FIXTURE_SETUP(iommufd_dirty_tracking) */ mmap_flags |= MAP_HUGETLB | MAP_POPULATE; } - assert((uintptr_t)self->buffer % HUGEPAGE_SIZE == 0); + ASSERT_TRUE((uintptr_t)self->buffer % HUGEPAGE_SIZE == 0); vrc = mmap(self->buffer, variant->buffer_size, PROT_READ | PROT_WRITE, mmap_flags, -1, 0); - assert(vrc == self->buffer); + if (vrc != self->buffer && variant->hugepages) { + SKIP(return, "Skipping buffer_size=%lu due to mmap() errno=%d", + variant->buffer_size, errno); + } + ASSERT_TRUE(vrc == self->buffer);
self->page_size = MOCK_PAGE_SIZE; self->bitmap_size = @@ -1755,9 +1759,9 @@ FIXTURE_SETUP(iommufd_dirty_tracking) /* Provision with an extra (PAGE_SIZE) for the unaligned case */ rc = posix_memalign(&self->bitmap, PAGE_SIZE, self->bitmap_size + PAGE_SIZE); - assert(!rc); - assert(self->bitmap); - assert((uintptr_t)self->bitmap % PAGE_SIZE == 0); + ASSERT_TRUE(!rc); + ASSERT_TRUE(self->bitmap != NULL); + ASSERT_TRUE((uintptr_t)self->bitmap % PAGE_SIZE == 0);
test_ioctl_ioas_alloc(&self->ioas_id); /* Enable 1M mock IOMMU hugepages */ diff --git a/tools/testing/selftests/iommu/iommufd_fail_nth.c b/tools/testing/selftests/iommu/iommufd_fail_nth.c index f590417cd67a..4a88f9c28fe5 100644 --- a/tools/testing/selftests/iommu/iommufd_fail_nth.c +++ b/tools/testing/selftests/iommu/iommufd_fail_nth.c @@ -315,7 +315,8 @@ TEST_FAIL_NTH(basic_fail_nth, map_domain)
fail_nth_enable();
- if (_test_cmd_mock_domain(self->fd, ioas_id, &stdev_id, &hwpt_id, NULL)) + if (_test_cmd_mock_domain(self->fd, ioas_id, &stdev_id, &hwpt_id, NULL, + _metadata)) return -1;
if (_test_ioctl_ioas_map(self->fd, ioas_id, buffer, 262144, &iova, @@ -326,7 +327,8 @@ TEST_FAIL_NTH(basic_fail_nth, map_domain) if (_test_ioctl_destroy(self->fd, stdev_id)) return -1;
- if (_test_cmd_mock_domain(self->fd, ioas_id, &stdev_id, &hwpt_id, NULL)) + if (_test_cmd_mock_domain(self->fd, ioas_id, &stdev_id, &hwpt_id, NULL, + _metadata)) return -1; return 0; } @@ -350,13 +352,14 @@ TEST_FAIL_NTH(basic_fail_nth, map_two_domains) if (_test_ioctl_set_temp_memory_limit(self->fd, 32)) return -1;
- if (_test_cmd_mock_domain(self->fd, ioas_id, &stdev_id, &hwpt_id, NULL)) + if (_test_cmd_mock_domain(self->fd, ioas_id, &stdev_id, &hwpt_id, NULL, + _metadata)) return -1;
fail_nth_enable();
if (_test_cmd_mock_domain(self->fd, ioas_id, &stdev_id2, &hwpt_id2, - NULL)) + NULL, _metadata)) return -1;
if (_test_ioctl_ioas_map(self->fd, ioas_id, buffer, 262144, &iova, @@ -370,10 +373,11 @@ TEST_FAIL_NTH(basic_fail_nth, map_two_domains) if (_test_ioctl_destroy(self->fd, stdev_id2)) return -1;
- if (_test_cmd_mock_domain(self->fd, ioas_id, &stdev_id, &hwpt_id, NULL)) + if (_test_cmd_mock_domain(self->fd, ioas_id, &stdev_id, &hwpt_id, NULL, + _metadata)) return -1; if (_test_cmd_mock_domain(self->fd, ioas_id, &stdev_id2, &hwpt_id2, - NULL)) + NULL, _metadata)) return -1; return 0; } @@ -530,7 +534,8 @@ TEST_FAIL_NTH(basic_fail_nth, access_pin_domain) if (_test_ioctl_set_temp_memory_limit(self->fd, 32)) return -1;
- if (_test_cmd_mock_domain(self->fd, ioas_id, &stdev_id, &hwpt_id, NULL)) + if (_test_cmd_mock_domain(self->fd, ioas_id, &stdev_id, &hwpt_id, NULL, + _metadata)) return -1;
if (_test_ioctl_ioas_map(self->fd, ioas_id, buffer, BUFFER_SIZE, &iova, @@ -609,10 +614,11 @@ TEST_FAIL_NTH(basic_fail_nth, device) fail_nth_enable();
if (_test_cmd_mock_domain(self->fd, ioas_id, &stdev_id, NULL, - &idev_id)) + &idev_id, _metadata)) return -1;
- if (_test_cmd_get_hw_info(self->fd, idev_id, &info, sizeof(info), NULL)) + if (_test_cmd_get_hw_info(self->fd, idev_id, &info, sizeof(info), NULL, + _metadata)) return -1;
if (_test_cmd_hwpt_alloc(self->fd, idev_id, ioas_id, 0, &hwpt_id, diff --git a/tools/testing/selftests/iommu/iommufd_utils.h b/tools/testing/selftests/iommu/iommufd_utils.h index 8d2b46b2114d..cd8bb14be658 100644 --- a/tools/testing/selftests/iommu/iommufd_utils.h +++ b/tools/testing/selftests/iommu/iommufd_utils.h @@ -64,7 +64,8 @@ static unsigned long PAGE_SIZE; })
static int _test_cmd_mock_domain(int fd, unsigned int ioas_id, __u32 *stdev_id, - __u32 *hwpt_id, __u32 *idev_id) + __u32 *hwpt_id, __u32 *idev_id, + struct __test_metadata *_metadata) { struct iommu_test_cmd cmd = { .size = sizeof(cmd), @@ -79,7 +80,7 @@ static int _test_cmd_mock_domain(int fd, unsigned int ioas_id, __u32 *stdev_id, return ret; if (stdev_id) *stdev_id = cmd.mock_domain.out_stdev_id; - assert(cmd.id != 0); + ASSERT_TRUE(cmd.id != 0); if (hwpt_id) *hwpt_id = cmd.mock_domain.out_hwpt_id; if (idev_id) @@ -88,14 +89,16 @@ static int _test_cmd_mock_domain(int fd, unsigned int ioas_id, __u32 *stdev_id, } #define test_cmd_mock_domain(ioas_id, stdev_id, hwpt_id, idev_id) \ ASSERT_EQ(0, _test_cmd_mock_domain(self->fd, ioas_id, stdev_id, \ - hwpt_id, idev_id)) + hwpt_id, idev_id, _metadata)) #define test_err_mock_domain(_errno, ioas_id, stdev_id, hwpt_id) \ EXPECT_ERRNO(_errno, _test_cmd_mock_domain(self->fd, ioas_id, \ - stdev_id, hwpt_id, NULL)) + stdev_id, hwpt_id, NULL, \ + _metadata))
static int _test_cmd_mock_domain_flags(int fd, unsigned int ioas_id, __u32 stdev_flags, __u32 *stdev_id, - __u32 *hwpt_id, __u32 *idev_id) + __u32 *hwpt_id, __u32 *idev_id, + struct __test_metadata *_metadata) { struct iommu_test_cmd cmd = { .size = sizeof(cmd), @@ -110,7 +113,7 @@ static int _test_cmd_mock_domain_flags(int fd, unsigned int ioas_id, return ret; if (stdev_id) *stdev_id = cmd.mock_domain_flags.out_stdev_id; - assert(cmd.id != 0); + ASSERT_TRUE(cmd.id != 0); if (hwpt_id) *hwpt_id = cmd.mock_domain_flags.out_hwpt_id; if (idev_id) @@ -119,11 +122,13 @@ static int _test_cmd_mock_domain_flags(int fd, unsigned int ioas_id, } #define test_cmd_mock_domain_flags(ioas_id, flags, stdev_id, hwpt_id, idev_id) \ ASSERT_EQ(0, _test_cmd_mock_domain_flags(self->fd, ioas_id, flags, \ - stdev_id, hwpt_id, idev_id)) + stdev_id, hwpt_id, idev_id, \ + _metadata)) #define test_err_mock_domain_flags(_errno, ioas_id, flags, stdev_id, hwpt_id) \ EXPECT_ERRNO(_errno, \ _test_cmd_mock_domain_flags(self->fd, ioas_id, flags, \ - stdev_id, hwpt_id, NULL)) + stdev_id, hwpt_id, NULL, \ + _metadata))
static int _test_cmd_mock_domain_replace(int fd, __u32 stdev_id, __u32 pt_id, __u32 *hwpt_id) @@ -623,7 +628,8 @@ static void teardown_iommufd(int fd, struct __test_metadata *_metadata)
/* @data can be NULL */ static int _test_cmd_get_hw_info(int fd, __u32 device_id, void *data, - size_t data_len, uint32_t *capabilities) + size_t data_len, uint32_t *capabilities, + struct __test_metadata *_metadata) { struct iommu_test_hw_info *info = (struct iommu_test_hw_info *)data; struct iommu_hw_info cmd = { @@ -639,13 +645,13 @@ static int _test_cmd_get_hw_info(int fd, __u32 device_id, void *data, if (ret) return ret;
- assert(cmd.out_data_type == IOMMU_HW_INFO_TYPE_SELFTEST); + ASSERT_TRUE(cmd.out_data_type == IOMMU_HW_INFO_TYPE_SELFTEST);
/* * The struct iommu_test_hw_info should be the one defined * by the current kernel. */ - assert(cmd.data_len == sizeof(struct iommu_test_hw_info)); + ASSERT_TRUE(cmd.data_len == sizeof(struct iommu_test_hw_info));
/* * Trailing bytes should be 0 if user buffer is larger than @@ -656,16 +662,16 @@ static int _test_cmd_get_hw_info(int fd, __u32 device_id, void *data, int idx = 0;
while (idx < data_len - cmd.data_len) { - assert(!*(ptr + idx)); + ASSERT_TRUE(!*(ptr + idx)); idx++; } }
if (info) { if (data_len >= offsetofend(struct iommu_test_hw_info, test_reg)) - assert(info->test_reg == IOMMU_HW_INFO_SELFTEST_REGVAL); + ASSERT_TRUE(info->test_reg == IOMMU_HW_INFO_SELFTEST_REGVAL); if (data_len >= offsetofend(struct iommu_test_hw_info, flags)) - assert(!info->flags); + ASSERT_TRUE(!info->flags); }
if (capabilities) @@ -674,13 +680,14 @@ static int _test_cmd_get_hw_info(int fd, __u32 device_id, void *data, return 0; }
-#define test_cmd_get_hw_info(device_id, data, data_len) \ +#define test_cmd_get_hw_info(device_id, data, data_len) \ ASSERT_EQ(0, _test_cmd_get_hw_info(self->fd, device_id, data, \ - data_len, NULL)) + data_len, NULL, _metadata))
-#define test_err_get_hw_info(_errno, device_id, data, data_len) \ +#define test_err_get_hw_info(_errno, device_id, data, data_len) \ EXPECT_ERRNO(_errno, _test_cmd_get_hw_info(self->fd, device_id, data, \ - data_len, NULL)) + data_len, NULL, _metadata))
#define test_cmd_get_hw_capabilities(device_id, caps, mask) \ - ASSERT_EQ(0, _test_cmd_get_hw_info(self->fd, device_id, NULL, 0, &caps)) + ASSERT_EQ(0, _test_cmd_get_hw_info(self->fd, device_id, NULL, 0, \ + &caps, _metadata))