Commit 04ec32fb authored by Jason Gunthorpe

mm/hmm: allow hmm_range to be used with a mmu_interval_notifier or hmm_mirror

hmm_mirror's handling of ranges does not use a sequence count which
results in this bug:

         CPU0                                   CPU1
                                     hmm_range_wait_until_valid(range)
                                         valid == true
                                     hmm_range_fault(range)
hmm_invalidate_range_start()
   range->valid = false
hmm_invalidate_range_end()
   range->valid = true
                                     hmm_range_valid(range)
                                          valid == true

Where the hmm_range_valid() should not have succeeded.

Adding the required sequence count would make it nearly identical to the
new mmu_interval_notifier. Instead replace the hmm_mirror stuff with
mmu_interval_notifier.

Co-existence of the two APIs is the first step.

Link: https://lore.kernel.org/r/20191112202231.3856-4-jgg@ziepe.ca
Reviewed-by: Jérôme Glisse <jglisse@redhat.com>
Tested-by: Philip Yang <Philip.Yang@amd.com>
Tested-by: Ralph Campbell <rcampbell@nvidia.com>
Reviewed-by: Christoph Hellwig <hch@lst.de>
Signed-off-by: Jason Gunthorpe <jgg@mellanox.com>
parent 99cb252f
...@@ -145,6 +145,9 @@ enum hmm_pfn_value_e { ...@@ -145,6 +145,9 @@ enum hmm_pfn_value_e {
/* /*
* struct hmm_range - track invalidation lock on virtual address range * struct hmm_range - track invalidation lock on virtual address range
* *
* @notifier: an optional mmu_interval_notifier
* @notifier_seq: when notifier is used this is the result of
* mmu_interval_read_begin()
* @hmm: the core HMM structure this range is active against * @hmm: the core HMM structure this range is active against
* @vma: the vm area struct for the range * @vma: the vm area struct for the range
* @list: all range lock are on a list * @list: all range lock are on a list
...@@ -159,6 +162,8 @@ enum hmm_pfn_value_e { ...@@ -159,6 +162,8 @@ enum hmm_pfn_value_e {
* @valid: pfns array did not change since it has been fill by an HMM function * @valid: pfns array did not change since it has been fill by an HMM function
*/ */
struct hmm_range { struct hmm_range {
struct mmu_interval_notifier *notifier;
unsigned long notifier_seq;
struct hmm *hmm; struct hmm *hmm;
struct list_head list; struct list_head list;
unsigned long start; unsigned long start;
......
...@@ -858,6 +858,14 @@ void hmm_range_unregister(struct hmm_range *range) ...@@ -858,6 +858,14 @@ void hmm_range_unregister(struct hmm_range *range)
} }
EXPORT_SYMBOL(hmm_range_unregister); EXPORT_SYMBOL(hmm_range_unregister);
/*
 * needs_retry - tell whether the caller has to retry its work on @range.
 *
 * A range without a notifier falls back to the range's own valid flag: a
 * retry is needed whenever that flag is clear.  A range that carries a
 * notifier instead defers the decision to mmu_interval_check_retry(),
 * passing the notifier together with the notifier_seq stored in the range.
 *
 * Returns true when a retry is required, false otherwise.
 */
static bool needs_retry(struct hmm_range *range)
{
	/* No notifier attached: only the valid flag can be consulted. */
	if (!range->notifier)
		return !range->valid;

	return mmu_interval_check_retry(range->notifier, range->notifier_seq);
}
static const struct mm_walk_ops hmm_walk_ops = { static const struct mm_walk_ops hmm_walk_ops = {
.pud_entry = hmm_vma_walk_pud, .pud_entry = hmm_vma_walk_pud,
.pmd_entry = hmm_vma_walk_pmd, .pmd_entry = hmm_vma_walk_pmd,
...@@ -898,18 +906,23 @@ long hmm_range_fault(struct hmm_range *range, unsigned int flags) ...@@ -898,18 +906,23 @@ long hmm_range_fault(struct hmm_range *range, unsigned int flags)
const unsigned long device_vma = VM_IO | VM_PFNMAP | VM_MIXEDMAP; const unsigned long device_vma = VM_IO | VM_PFNMAP | VM_MIXEDMAP;
unsigned long start = range->start, end; unsigned long start = range->start, end;
struct hmm_vma_walk hmm_vma_walk; struct hmm_vma_walk hmm_vma_walk;
struct hmm *hmm = range->hmm; struct mm_struct *mm;
struct vm_area_struct *vma; struct vm_area_struct *vma;
int ret; int ret;
lockdep_assert_held(&hmm->mmu_notifier.mm->mmap_sem); if (range->notifier)
mm = range->notifier->mm;
else
mm = range->hmm->mmu_notifier.mm;
lockdep_assert_held(&mm->mmap_sem);
do { do {
/* If range is no longer valid force retry. */ /* If range is no longer valid force retry. */
if (!range->valid) if (needs_retry(range))
return -EBUSY; return -EBUSY;
vma = find_vma(hmm->mmu_notifier.mm, start); vma = find_vma(mm, start);
if (vma == NULL || (vma->vm_flags & device_vma)) if (vma == NULL || (vma->vm_flags & device_vma))
return -EFAULT; return -EFAULT;
...@@ -939,7 +952,7 @@ long hmm_range_fault(struct hmm_range *range, unsigned int flags) ...@@ -939,7 +952,7 @@ long hmm_range_fault(struct hmm_range *range, unsigned int flags)
start = hmm_vma_walk.last; start = hmm_vma_walk.last;
/* Keep trying while the range is valid. */ /* Keep trying while the range is valid. */
} while (ret == -EBUSY && range->valid); } while (ret == -EBUSY && !needs_retry(range));
if (ret) { if (ret) {
unsigned long i; unsigned long i;
...@@ -997,7 +1010,7 @@ long hmm_range_dma_map(struct hmm_range *range, struct device *device, ...@@ -997,7 +1010,7 @@ long hmm_range_dma_map(struct hmm_range *range, struct device *device,
continue; continue;
/* Check if range is being invalidated */ /* Check if range is being invalidated */
if (!range->valid) { if (needs_retry(range)) {
ret = -EBUSY; ret = -EBUSY;
goto unmap; goto unmap;
} }
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment