Commit 57731a07 authored by Philip Yang, committed by Alex Deucher

drm/amdgpu: use HMM callback to replace mmu notifier

Replace our MMU notifier with the hmm_mirror_ops.sync_cpu_device_pagetables
callback, and enable CONFIG_HMM and CONFIG_HMM_MIRROR as dependencies in the
DRM_AMDGPU_USERPTR Kconfig option.

This supports both the KFD userptr and gfx userptr paths.
Signed-off-by: Philip Yang <Philip.Yang@amd.com>
Reviewed-by: Felix Kuehling <Felix.Kuehling@amd.com>
Reviewed-by: Christian König <christian.koenig@amd.com>
Signed-off-by: Alex Deucher <alexander.deucher@amd.com>
parent f8b18cf4
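
For readers unfamiliar with the HMM mirror API this patch moves to, here is a
minimal, illustrative sketch of the registration flow, assuming the hmm_mirror
interface as it exists at the time of this commit (hmm_mirror_register() and
struct hmm_mirror_ops with sync_cpu_device_pagetables and release callbacks).
The my_* names are invented for the sketch and are not part of the patch; the
real hook-up is amdgpu_mn_get() and amdgpu_hmm_mirror_ops in the diff below.

#include <linux/hmm.h>
#include <linux/sched.h>

/* Illustrative driver state wrapping an HMM mirror (not part of this patch). */
struct my_mirror {
        struct hmm_mirror mirror;
};

/*
 * HMM calls this whenever the CPU page tables of the mirrored mm change.
 * The driver must stop using, or revalidate, any device mappings that
 * overlap [update->start, update->end). It should return -EAGAIN only
 * when update->blockable is false and it cannot make progress without
 * sleeping, which is how the amdgpu callbacks below use it.
 */
static int my_sync_cpu_device_pagetables(struct hmm_mirror *mirror,
                                         const struct hmm_update *update)
{
        /* invalidate device state covering update->start..update->end here */
        return 0;
}

/* Called when the mirrored mm goes away; tear down driver state here. */
static void my_mirror_release(struct hmm_mirror *mirror)
{
}

static struct hmm_mirror_ops my_mirror_ops = {
        .sync_cpu_device_pagetables = my_sync_cpu_device_pagetables,
        .release = my_mirror_release,
};

/* Mirror current->mm, as amdgpu_mn_get() now does. */
static int my_mirror_init(struct my_mirror *m)
{
        m->mirror.ops = &my_mirror_ops;
        return hmm_mirror_register(&m->mirror, current->mm);
}

Compared with the old mmu_notifier scheme, there is a single
sync_cpu_device_pagetables() callback instead of paired
invalidate_range_start/end callbacks, which is why the patch drops the
read_lock mutex and recursion counter and releases the read side directly at
the end of each sync callback.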
drivers/gpu/drm/amd/amdgpu/Kconfig

@@ -26,10 +26,10 @@ config DRM_AMDGPU_CIK
 config DRM_AMDGPU_USERPTR
         bool "Always enable userptr write support"
         depends on DRM_AMDGPU
-        select MMU_NOTIFIER
+        select HMM_MIRROR
         help
-          This option selects CONFIG_MMU_NOTIFIER if it isn't already
-          selected to enabled full userptr support.
+          This option selects CONFIG_HMM and CONFIG_HMM_MIRROR if it
+          isn't already selected to enabled full userptr support.

 config DRM_AMDGPU_GART_DEBUGFS
         bool "Allow GART access through debugfs"
drivers/gpu/drm/amd/amdgpu/Makefile

@@ -172,7 +172,7 @@
 amdgpu-$(CONFIG_COMPAT) += amdgpu_ioc32.o
 amdgpu-$(CONFIG_VGA_SWITCHEROO) += amdgpu_atpx_handler.o
 amdgpu-$(CONFIG_ACPI) += amdgpu_acpi.o
-amdgpu-$(CONFIG_MMU_NOTIFIER) += amdgpu_mn.o
+amdgpu-$(CONFIG_HMM_MIRROR) += amdgpu_mn.o

 include $(FULL_AMD_PATH)/powerplay/Makefile
drivers/gpu/drm/amd/amdgpu/amdgpu_mn.c

@@ -45,7 +45,7 @@

 #include <linux/firmware.h>
 #include <linux/module.h>
-#include <linux/mmu_notifier.h>
+#include <linux/hmm.h>
 #include <linux/interval_tree.h>
 #include <drm/drmP.h>
 #include <drm/drm.h>
@@ -58,14 +58,12 @@
  *
  * @adev: amdgpu device pointer
  * @mm: process address space
- * @mn: MMU notifier structure
  * @type: type of MMU notifier
  * @work: destruction work item
  * @node: hash table node to find structure by adev and mn
  * @lock: rw semaphore protecting the notifier nodes
  * @objects: interval tree containing amdgpu_mn_nodes
- * @read_lock: mutex for recursive locking of @lock
- * @recursion: depth of recursion
+ * @mirror: HMM mirror function support
  *
  * Data for each amdgpu device and process address space.
  */
@@ -73,7 +71,6 @@ struct amdgpu_mn {
         /* constant after initialisation */
         struct amdgpu_device    *adev;
         struct mm_struct        *mm;
-        struct mmu_notifier     mn;
         enum amdgpu_mn_type     type;

         /* only used on destruction */
@@ -85,8 +82,9 @@ struct amdgpu_mn {
         /* objects protected by lock */
         struct rw_semaphore     lock;
         struct rb_root_cached   objects;
-        struct mutex            read_lock;
-        atomic_t                recursion;
+
+        /* HMM mirror */
+        struct hmm_mirror       mirror;
 };

 /**
@@ -103,7 +101,7 @@ struct amdgpu_mn_node {
 };

 /**
- * amdgpu_mn_destroy - destroy the MMU notifier
+ * amdgpu_mn_destroy - destroy the HMM mirror
  *
  * @work: previously sheduled work item
  *
@@ -129,28 +127,26 @@ static void amdgpu_mn_destroy(struct work_struct *work)
         }
         up_write(&amn->lock);
         mutex_unlock(&adev->mn_lock);
-        mmu_notifier_unregister_no_release(&amn->mn, amn->mm);
+        hmm_mirror_unregister(&amn->mirror);
         kfree(amn);
 }

 /**
- * amdgpu_mn_release - callback to notify about mm destruction
+ * amdgpu_hmm_mirror_release - callback to notify about mm destruction
  *
- * @mn: our notifier
- * @mm: the mm this callback is about
+ * @mirror: the HMM mirror (mm) this callback is about
  *
- * Shedule a work item to lazy destroy our notifier.
+ * Shedule a work item to lazy destroy HMM mirror.
  */
-static void amdgpu_mn_release(struct mmu_notifier *mn,
-                              struct mm_struct *mm)
+static void amdgpu_hmm_mirror_release(struct hmm_mirror *mirror)
 {
-        struct amdgpu_mn *amn = container_of(mn, struct amdgpu_mn, mn);
+        struct amdgpu_mn *amn = container_of(mirror, struct amdgpu_mn, mirror);

         INIT_WORK(&amn->work, amdgpu_mn_destroy);
         schedule_work(&amn->work);
 }

 /**
  * amdgpu_mn_lock - take the write side lock for this notifier
  *
@@ -181,14 +177,10 @@ void amdgpu_mn_unlock(struct amdgpu_mn *mn)
 static int amdgpu_mn_read_lock(struct amdgpu_mn *amn, bool blockable)
 {
         if (blockable)
-                mutex_lock(&amn->read_lock);
-        else if (!mutex_trylock(&amn->read_lock))
+                down_read(&amn->lock);
+        else if (!down_read_trylock(&amn->lock))
                 return -EAGAIN;

-        if (atomic_inc_return(&amn->recursion) == 1)
-                down_read_non_owner(&amn->lock);
-        mutex_unlock(&amn->read_lock);
-
         return 0;
 }

@@ -199,8 +191,7 @@ static int amdgpu_mn_read_lock(struct amdgpu_mn *amn, bool blockable)
  */
 static void amdgpu_mn_read_unlock(struct amdgpu_mn *amn)
 {
-        if (atomic_dec_return(&amn->recursion) == 0)
-                up_read_non_owner(&amn->lock);
+        up_read(&amn->lock);
 }

 /**
@@ -235,143 +226,128 @@ static void amdgpu_mn_invalidate_node(struct amdgpu_mn_node *node,
 }

 /**
- * amdgpu_mn_invalidate_range_start_gfx - callback to notify about mm change
+ * amdgpu_mn_sync_pagetables_gfx - callback to notify about mm change
  *
- * @mn: our notifier
- * @range: mmu notifier context
+ * @mirror: the hmm_mirror (mm) is about to update
+ * @update: the update start, end address
  *
  * Block for operations on BOs to finish and mark pages as accessed and
  * potentially dirty.
  */
-static int amdgpu_mn_invalidate_range_start_gfx(struct mmu_notifier *mn,
-                        const struct mmu_notifier_range *range)
+static int amdgpu_mn_sync_pagetables_gfx(struct hmm_mirror *mirror,
+                        const struct hmm_update *update)
 {
-        struct amdgpu_mn *amn = container_of(mn, struct amdgpu_mn, mn);
+        struct amdgpu_mn *amn = container_of(mirror, struct amdgpu_mn, mirror);
+        unsigned long start = update->start;
+        unsigned long end = update->end;
+        bool blockable = update->blockable;
         struct interval_tree_node *it;
-        unsigned long end;

         /* notification is exclusive, but interval is inclusive */
-        end = range->end - 1;
+        end -= 1;

         /* TODO we should be able to split locking for interval tree and
          * amdgpu_mn_invalidate_node
          */
-        if (amdgpu_mn_read_lock(amn, range->blockable))
+        if (amdgpu_mn_read_lock(amn, blockable))
                 return -EAGAIN;

-        it = interval_tree_iter_first(&amn->objects, range->start, end);
+        it = interval_tree_iter_first(&amn->objects, start, end);
         while (it) {
                 struct amdgpu_mn_node *node;

-                if (!range->blockable) {
+                if (!blockable) {
                         amdgpu_mn_read_unlock(amn);
                         return -EAGAIN;
                 }

                 node = container_of(it, struct amdgpu_mn_node, it);
-                it = interval_tree_iter_next(it, range->start, end);
+                it = interval_tree_iter_next(it, start, end);

-                amdgpu_mn_invalidate_node(node, range->start, end);
+                amdgpu_mn_invalidate_node(node, start, end);
         }

+        amdgpu_mn_read_unlock(amn);
+
         return 0;
 }

 /**
- * amdgpu_mn_invalidate_range_start_hsa - callback to notify about mm change
+ * amdgpu_mn_sync_pagetables_hsa - callback to notify about mm change
  *
- * @mn: our notifier
- * @mm: the mm this callback is about
- * @start: start of updated range
- * @end: end of updated range
+ * @mirror: the hmm_mirror (mm) is about to update
+ * @update: the update start, end address
  *
  * We temporarily evict all BOs between start and end. This
  * necessitates evicting all user-mode queues of the process. The BOs
  * are restorted in amdgpu_mn_invalidate_range_end_hsa.
  */
-static int amdgpu_mn_invalidate_range_start_hsa(struct mmu_notifier *mn,
-                        const struct mmu_notifier_range *range)
+static int amdgpu_mn_sync_pagetables_hsa(struct hmm_mirror *mirror,
+                        const struct hmm_update *update)
 {
-        struct amdgpu_mn *amn = container_of(mn, struct amdgpu_mn, mn);
+        struct amdgpu_mn *amn = container_of(mirror, struct amdgpu_mn, mirror);
+        unsigned long start = update->start;
+        unsigned long end = update->end;
+        bool blockable = update->blockable;
         struct interval_tree_node *it;
-        unsigned long end;

         /* notification is exclusive, but interval is inclusive */
-        end = range->end - 1;
+        end -= 1;

-        if (amdgpu_mn_read_lock(amn, range->blockable))
+        if (amdgpu_mn_read_lock(amn, blockable))
                 return -EAGAIN;

-        it = interval_tree_iter_first(&amn->objects, range->start, end);
+        it = interval_tree_iter_first(&amn->objects, start, end);
         while (it) {
                 struct amdgpu_mn_node *node;
                 struct amdgpu_bo *bo;

-                if (!range->blockable) {
+                if (!blockable) {
                         amdgpu_mn_read_unlock(amn);
                         return -EAGAIN;
                 }

                 node = container_of(it, struct amdgpu_mn_node, it);
-                it = interval_tree_iter_next(it, range->start, end);
+                it = interval_tree_iter_next(it, start, end);

                 list_for_each_entry(bo, &node->bos, mn_list) {
                         struct kgd_mem *mem = bo->kfd_bo;

                         if (amdgpu_ttm_tt_affect_userptr(bo->tbo.ttm,
-                                                         range->start,
-                                                         end))
-                                amdgpu_amdkfd_evict_userptr(mem, range->mm);
+                                                         start, end))
+                                amdgpu_amdkfd_evict_userptr(mem, amn->mm);
                 }
         }

+        amdgpu_mn_read_unlock(amn);
+
         return 0;
 }

-/**
- * amdgpu_mn_invalidate_range_end - callback to notify about mm change
- *
- * @mn: our notifier
- * @mm: the mm this callback is about
- * @start: start of updated range
- * @end: end of updated range
- *
- * Release the lock again to allow new command submissions.
+/* Low bits of any reasonable mm pointer will be unused due to struct
+ * alignment. Use these bits to make a unique key from the mm pointer
+ * and notifier type.
  */
-static void amdgpu_mn_invalidate_range_end(struct mmu_notifier *mn,
-                        const struct mmu_notifier_range *range)
-{
-        struct amdgpu_mn *amn = container_of(mn, struct amdgpu_mn, mn);
-
-        amdgpu_mn_read_unlock(amn);
-}
+#define AMDGPU_MN_KEY(mm, type) ((unsigned long)(mm) + (type))

-static const struct mmu_notifier_ops amdgpu_mn_ops[] = {
+static struct hmm_mirror_ops amdgpu_hmm_mirror_ops[] = {
         [AMDGPU_MN_TYPE_GFX] = {
-                .release = amdgpu_mn_release,
-                .invalidate_range_start = amdgpu_mn_invalidate_range_start_gfx,
-                .invalidate_range_end = amdgpu_mn_invalidate_range_end,
+                .sync_cpu_device_pagetables = amdgpu_mn_sync_pagetables_gfx,
+                .release = amdgpu_hmm_mirror_release
         },
         [AMDGPU_MN_TYPE_HSA] = {
-                .release = amdgpu_mn_release,
-                .invalidate_range_start = amdgpu_mn_invalidate_range_start_hsa,
-                .invalidate_range_end = amdgpu_mn_invalidate_range_end,
+                .sync_cpu_device_pagetables = amdgpu_mn_sync_pagetables_hsa,
+                .release = amdgpu_hmm_mirror_release
         },
 };

-/* Low bits of any reasonable mm pointer will be unused due to struct
- * alignment. Use these bits to make a unique key from the mm pointer
- * and notifier type.
- */
-#define AMDGPU_MN_KEY(mm, type) ((unsigned long)(mm) + (type))
-
 /**
- * amdgpu_mn_get - create notifier context
+ * amdgpu_mn_get - create HMM mirror context
  *
  * @adev: amdgpu device pointer
  * @type: type of MMU notifier context
  *
- * Creates a notifier context for current->mm.
+ * Creates a HMM mirror context for current->mm.
  */
 struct amdgpu_mn *amdgpu_mn_get(struct amdgpu_device *adev,
                                 enum amdgpu_mn_type type)
@@ -401,12 +377,10 @@ struct amdgpu_mn *amdgpu_mn_get(struct amdgpu_device *adev,
         amn->mm = mm;
         init_rwsem(&amn->lock);
         amn->type = type;
-        amn->mn.ops = &amdgpu_mn_ops[type];
         amn->objects = RB_ROOT_CACHED;
-        mutex_init(&amn->read_lock);
-        atomic_set(&amn->recursion, 0);

-        r = __mmu_notifier_register(&amn->mn, mm);
+        amn->mirror.ops = &amdgpu_hmm_mirror_ops[type];
+        r = hmm_mirror_register(&amn->mirror, mm);
         if (r)
                 goto free_amn;

@@ -432,7 +406,7 @@ struct amdgpu_mn *amdgpu_mn_get(struct amdgpu_device *adev,
  * @bo: amdgpu buffer object
  * @addr: userptr addr we should monitor
  *
- * Registers an MMU notifier for the given BO at the specified address.
+ * Registers an HMM mirror for the given BO at the specified address.
  * Returns 0 on success, -ERRNO if anything goes wrong.
  */
 int amdgpu_mn_register(struct amdgpu_bo *bo, unsigned long addr)
@@ -488,11 +462,11 @@ int amdgpu_mn_register(struct amdgpu_bo *bo, unsigned long addr)
 }

 /**
- * amdgpu_mn_unregister - unregister a BO for notifier updates
+ * amdgpu_mn_unregister - unregister a BO for HMM mirror updates
  *
  * @bo: amdgpu buffer object
  *
- * Remove any registration of MMU notifier updates from the buffer object.
+ * Remove any registration of HMM mirror updates from the buffer object.
  */
 void amdgpu_mn_unregister(struct amdgpu_bo *bo)
 {
drivers/gpu/drm/amd/amdgpu/amdgpu_mn.h

@@ -34,7 +34,7 @@ enum amdgpu_mn_type {
         AMDGPU_MN_TYPE_HSA,
 };

-#if defined(CONFIG_MMU_NOTIFIER)
+#if defined(CONFIG_HMM_MIRROR)
 void amdgpu_mn_lock(struct amdgpu_mn *mn);
 void amdgpu_mn_unlock(struct amdgpu_mn *mn);
 struct amdgpu_mn *amdgpu_mn_get(struct amdgpu_device *adev,