drm/xe: Reset VMA attributes to default in SVM garbage collector
Restore default memory attributes for VMAs during garbage collection if
they were modified by madvise. Reuse the existing VMA if it fully overlaps
the range; otherwise, allocate a new mirror VMA.

v2 (Matthew Brost)
- Add helper for VMA split
- Add retry to get the updated VMA

v3
- Rebase on the gpuvm layer

Suggested-by: Matthew Brost <matthew.brost@intel.com>
Reviewed-by: Matthew Brost <matthew.brost@intel.com>
Link: https://lore.kernel.org/r/20250821173104.3030148-19-himal.prasad.ghimiray@intel.com
Signed-off-by: Himal Prasad Ghimiray <himal.prasad.ghimiray@intel.com>
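To make the policy concrete before the diff, here is a minimal, stand-alone C sketch of the decision the new garbage-collector helper makes: reuse the VMA when it exactly covers the collected range, otherwise fall back to a split. Every type and helper below (mock_vma, reset_range_to_defaults) is an illustrative stand-in, not the driver's real code; in the driver, the split path calls xe_vm_alloc_cpu_addr_mirror_vma() and the helper returns -EAGAIN so the caller re-looks up the VMA.

/* Illustrative sketch only: mock_vma and reset_range_to_defaults() are made-up
 * stand-ins for struct xe_vma and xe_svm_range_set_default_attr().
 */
#include <stdbool.h>
#include <stdio.h>

struct mock_vma {
        unsigned long long start, end;  /* half-open range [start, end) */
        bool has_default_attrs;         /* false once madvise changed attributes */
};

enum reset_action { RESET_NOOP, RESET_REUSE, RESET_SPLIT };

static enum reset_action reset_range_to_defaults(struct mock_vma *vma,
                                                 unsigned long long range_start,
                                                 unsigned long long range_end)
{
        if (vma->has_default_attrs)
                return RESET_NOOP;              /* nothing was madvise'd, keep it */

        if (vma->start == range_start && vma->end == range_end) {
                vma->has_default_attrs = true;  /* full overlap: reuse this VMA */
                return RESET_REUSE;
        }

        /* partial overlap: the driver would allocate a new mirror VMA here */
        return RESET_SPLIT;
}

int main(void)
{
        struct mock_vma vma = { .start = 0x1000, .end = 0x3000,
                                .has_default_attrs = false };

        /* the collected range covers only part of the VMA, so it must be split */
        printf("action = %d\n", reset_range_to_defaults(&vma, 0x1000, 0x2000));
        return 0;
}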
@@ -253,10 +253,56 @@ static int __xe_svm_garbage_collector(struct xe_vm *vm,
         return 0;
 }
 
+static int xe_svm_range_set_default_attr(struct xe_vm *vm, u64 range_start, u64 range_end)
+{
+        struct xe_vma *vma;
+        struct xe_vma_mem_attr default_attr = {
+                .preferred_loc = {
+                        .devmem_fd = DRM_XE_PREFERRED_LOC_DEFAULT_DEVICE,
+                        .migration_policy = DRM_XE_MIGRATE_ALL_PAGES,
+                },
+                .atomic_access = DRM_XE_ATOMIC_UNDEFINED,
+        };
+        int err = 0;
+
+        vma = xe_vm_find_vma_by_addr(vm, range_start);
+        if (!vma)
+                return -EINVAL;
+
+        if (xe_vma_has_default_mem_attrs(vma))
+                return 0;
+
+        vm_dbg(&vm->xe->drm, "Existing VMA start=0x%016llx, vma_end=0x%016llx",
+               xe_vma_start(vma), xe_vma_end(vma));
+
+        if (xe_vma_start(vma) == range_start && xe_vma_end(vma) == range_end) {
+                default_attr.pat_index = vma->attr.default_pat_index;
+                default_attr.default_pat_index = vma->attr.default_pat_index;
+                vma->attr = default_attr;
+        } else {
+                vm_dbg(&vm->xe->drm, "Split VMA start=0x%016llx, vma_end=0x%016llx",
+                       range_start, range_end);
+                err = xe_vm_alloc_cpu_addr_mirror_vma(vm, range_start, range_end - range_start);
+                if (err) {
+                        drm_warn(&vm->xe->drm, "VMA SPLIT failed: %pe\n", ERR_PTR(err));
+                        xe_vm_kill(vm, true);
+                        return err;
+                }
+        }
+
+        /*
+         * On call from xe_svm_handle_pagefault original VMA might be changed
+         * signal this to lookup for VMA again.
+         */
+        return -EAGAIN;
+}
+
 static int xe_svm_garbage_collector(struct xe_vm *vm)
 {
         struct xe_svm_range *range;
-        int err;
+        u64 range_start;
+        u64 range_end;
+        int err, ret = 0;
 
         lockdep_assert_held_write(&vm->lock);
 
@@ -271,6 +317,9 @@ static int xe_svm_garbage_collector(struct xe_vm *vm)
                 if (!range)
                         break;
 
+                range_start = xe_svm_range_start(range);
+                range_end = xe_svm_range_end(range);
+
                 list_del(&range->garbage_collector_link);
                 spin_unlock(&vm->svm.garbage_collector.lock);
 
@@ -283,11 +332,19 @@ static int xe_svm_garbage_collector(struct xe_vm *vm)
                         return err;
                 }
 
+                err = xe_svm_range_set_default_attr(vm, range_start, range_end);
+                if (err) {
+                        if (err == -EAGAIN)
+                                ret = -EAGAIN;
+                        else
+                                return err;
+                }
+
                 spin_lock(&vm->svm.garbage_collector.lock);
         }
         spin_unlock(&vm->svm.garbage_collector.lock);
 
-        return 0;
+        return ret;
 }
 
 static void xe_svm_garbage_collector_work_func(struct work_struct *w)
@@ -927,13 +984,26 @@ int xe_svm_handle_pagefault(struct xe_vm *vm, struct xe_vma *vma,
                             struct xe_gt *gt, u64 fault_addr,
                             bool atomic)
 {
-        int need_vram;
-
+        int need_vram, ret;
+retry:
         need_vram = xe_vma_need_vram_for_atomic(vm->xe, vma, atomic);
         if (need_vram < 0)
                 return need_vram;
 
-        return __xe_svm_handle_pagefault(vm, vma, gt, fault_addr, need_vram ? true : false);
+        ret = __xe_svm_handle_pagefault(vm, vma, gt, fault_addr,
+                                        need_vram ? true : false);
+        if (ret == -EAGAIN) {
+                /*
+                 * Retry once on -EAGAIN to re-lookup the VMA, as the original VMA
+                 * may have been split by xe_svm_range_set_default_attr.
+                 */
+                vma = xe_vm_find_vma_by_addr(vm, fault_addr);
+                if (!vma)
+                        return -EINVAL;
+
+                goto retry;
+        }
+        return ret;
 }
 
 /**
@@ -4291,35 +4291,26 @@ int xe_vma_need_vram_for_atomic(struct xe_device *xe, struct xe_vma *vma, bool i
         }
 }
 
-/**
- * xe_vm_alloc_madvise_vma - Allocate VMA's with madvise ops
- * @vm: Pointer to the xe_vm structure
- * @start: Starting input address
- * @range: Size of the input range
- *
- * This function splits existing vma to create new vma for user provided input range
- *
- * Return: 0 if success
- */
-int xe_vm_alloc_madvise_vma(struct xe_vm *vm, uint64_t start, uint64_t range)
+static int xe_vm_alloc_vma(struct xe_vm *vm,
+                           struct drm_gpuvm_map_req *map_req,
+                           bool is_madvise)
 {
-        struct drm_gpuvm_map_req map_req = {
-                .map.va.addr = start,
-                .map.va.range = range,
-        };
-
         struct xe_vma_ops vops;
         struct drm_gpuva_ops *ops = NULL;
         struct drm_gpuva_op *__op;
         bool is_cpu_addr_mirror = false;
         bool remap_op = false;
         struct xe_vma_mem_attr tmp_attr;
+        u16 default_pat;
         int err;
 
         lockdep_assert_held_write(&vm->lock);
 
-        vm_dbg(&vm->xe->drm, "MADVISE_OPS_CREATE: addr=0x%016llx, size=0x%016llx", start, range);
-        ops = drm_gpuvm_madvise_ops_create(&vm->gpuvm, &map_req);
+        if (is_madvise)
+                ops = drm_gpuvm_madvise_ops_create(&vm->gpuvm, map_req);
+        else
+                ops = drm_gpuvm_sm_map_ops_create(&vm->gpuvm, map_req);
+
         if (IS_ERR(ops))
                 return PTR_ERR(ops);
 
@@ -4330,33 +4321,57 @@ int xe_vm_alloc_madvise_vma(struct xe_vm *vm, uint64_t start, uint64_t range)
 
         drm_gpuva_for_each_op(__op, ops) {
                 struct xe_vma_op *op = gpuva_op_to_vma_op(__op);
+                struct xe_vma *vma = NULL;
 
-                if (__op->op == DRM_GPUVA_OP_REMAP) {
-                        xe_assert(vm->xe, !remap_op);
-                        remap_op = true;
-                        if (xe_vma_is_cpu_addr_mirror(gpuva_to_vma(op->base.remap.unmap->va)))
-                                is_cpu_addr_mirror = true;
-                        else
-                                is_cpu_addr_mirror = false;
+                if (!is_madvise) {
+                        if (__op->op == DRM_GPUVA_OP_UNMAP) {
+                                vma = gpuva_to_vma(op->base.unmap.va);
+                                XE_WARN_ON(!xe_vma_has_default_mem_attrs(vma));
+                                default_pat = vma->attr.default_pat_index;
+                        }
+
+                        if (__op->op == DRM_GPUVA_OP_REMAP) {
+                                vma = gpuva_to_vma(op->base.remap.unmap->va);
+                                default_pat = vma->attr.default_pat_index;
+                        }
+
+                        if (__op->op == DRM_GPUVA_OP_MAP) {
+                                op->map.is_cpu_addr_mirror = true;
+                                op->map.pat_index = default_pat;
+                        }
+                } else {
+                        if (__op->op == DRM_GPUVA_OP_REMAP) {
+                                vma = gpuva_to_vma(op->base.remap.unmap->va);
+                                xe_assert(vm->xe, !remap_op);
+                                xe_assert(vm->xe, xe_vma_has_no_bo(vma));
+                                remap_op = true;
+
+                                if (xe_vma_is_cpu_addr_mirror(vma))
+                                        is_cpu_addr_mirror = true;
+                                else
+                                        is_cpu_addr_mirror = false;
+                        }
+
+                        if (__op->op == DRM_GPUVA_OP_MAP) {
+                                xe_assert(vm->xe, remap_op);
+                                remap_op = false;
+                                /*
+                                 * In case of madvise ops DRM_GPUVA_OP_MAP is
+                                 * always after DRM_GPUVA_OP_REMAP, so ensure
+                                 * we assign op->map.is_cpu_addr_mirror true
+                                 * if REMAP is for xe_vma_is_cpu_addr_mirror vma
+                                 */
+                                op->map.is_cpu_addr_mirror = is_cpu_addr_mirror;
+                        }
                 }
 
-                if (__op->op == DRM_GPUVA_OP_MAP) {
-                        xe_assert(vm->xe, remap_op);
-                        remap_op = false;
-
-                        /* In case of madvise ops DRM_GPUVA_OP_MAP is always after
-                         * DRM_GPUVA_OP_REMAP, so ensure we assign op->map.is_cpu_addr_mirror true
-                         * if REMAP is for xe_vma_is_cpu_addr_mirror vma
-                         */
-                        op->map.is_cpu_addr_mirror = is_cpu_addr_mirror;
-                }
-
                 print_op(vm->xe, __op);
         }
 
         xe_vma_ops_init(&vops, vm, NULL, NULL, 0);
-        vops.flags |= XE_VMA_OPS_FLAG_MADVISE;
+
+        if (is_madvise)
+                vops.flags |= XE_VMA_OPS_FLAG_MADVISE;
 
         err = vm_bind_ioctl_ops_parse(vm, ops, &vops);
         if (err)
                 goto unwind_ops;
@@ -4368,15 +4383,20 @@ int xe_vm_alloc_madvise_vma(struct xe_vm *vm, uint64_t start, uint64_t range)
                 struct xe_vma *vma;
 
                 if (__op->op == DRM_GPUVA_OP_UNMAP) {
-                        /* There should be no unmap */
-                        XE_WARN_ON("UNEXPECTED UNMAP");
-                        xe_vma_destroy(gpuva_to_vma(op->base.unmap.va), NULL);
+                        vma = gpuva_to_vma(op->base.unmap.va);
+                        /* There should be no unmap for madvise */
+                        if (is_madvise)
+                                XE_WARN_ON("UNEXPECTED UNMAP");
+
+                        xe_vma_destroy(vma, NULL);
                 } else if (__op->op == DRM_GPUVA_OP_REMAP) {
                         vma = gpuva_to_vma(op->base.remap.unmap->va);
-                        /* Store attributes for REMAP UNMAPPED VMA, so they can be assigned
-                         * to newly MAP created vma.
+                        /* In case of madvise ops Store attributes for REMAP UNMAPPED
+                         * VMA, so they can be assigned to newly MAP created vma.
                          */
-                        tmp_attr = vma->attr;
+                        if (is_madvise)
+                                tmp_attr = vma->attr;
+
                         xe_vma_destroy(gpuva_to_vma(op->base.remap.unmap->va), NULL);
                 } else if (__op->op == DRM_GPUVA_OP_MAP) {
                         vma = op->map.vma;
@@ -4384,7 +4404,8 @@ int xe_vm_alloc_madvise_vma(struct xe_vm *vm, uint64_t start, uint64_t range)
                          * Therefore temp_attr will always have sane values, making it safe to
                          * copy them to new vma.
                          */
-                        vma->attr = tmp_attr;
+                        if (is_madvise)
+                                vma->attr = tmp_attr;
                 }
         }
 
@@ -4398,3 +4419,52 @@ free_ops:
         drm_gpuva_ops_free(&vm->gpuvm, ops);
         return err;
 }
+
+/**
+ * xe_vm_alloc_madvise_vma - Allocate VMA's with madvise ops
+ * @vm: Pointer to the xe_vm structure
+ * @start: Starting input address
+ * @range: Size of the input range
+ *
+ * This function splits existing vma to create new vma for user provided input range
+ *
+ * Return: 0 if success
+ */
+int xe_vm_alloc_madvise_vma(struct xe_vm *vm, uint64_t start, uint64_t range)
+{
+        struct drm_gpuvm_map_req map_req = {
+                .map.va.addr = start,
+                .map.va.range = range,
+        };
+
+        lockdep_assert_held_write(&vm->lock);
+
+        vm_dbg(&vm->xe->drm, "MADVISE_OPS_CREATE: addr=0x%016llx, size=0x%016llx", start, range);
+
+        return xe_vm_alloc_vma(vm, &map_req, true);
+}
+
+/**
+ * xe_vm_alloc_cpu_addr_mirror_vma - Allocate CPU addr mirror vma
+ * @vm: Pointer to the xe_vm structure
+ * @start: Starting input address
+ * @range: Size of the input range
+ *
+ * This function splits/merges existing vma to create new vma for user provided input range
+ *
+ * Return: 0 if success
+ */
+int xe_vm_alloc_cpu_addr_mirror_vma(struct xe_vm *vm, uint64_t start, uint64_t range)
+{
+        struct drm_gpuvm_map_req map_req = {
+                .map.va.addr = start,
+                .map.va.range = range,
+        };
+
+        lockdep_assert_held_write(&vm->lock);
+
+        vm_dbg(&vm->xe->drm, "CPU_ADDR_MIRROR_VMA_OPS_CREATE: addr=0x%016llx, size=0x%016llx",
+               start, range);
+
+        return xe_vm_alloc_vma(vm, &map_req, false);
+}
@@ -177,6 +177,8 @@ int xe_vma_need_vram_for_atomic(struct xe_device *xe, struct xe_vma *vma, bool i
 
 int xe_vm_alloc_madvise_vma(struct xe_vm *vm, uint64_t addr, uint64_t size);
 
+int xe_vm_alloc_cpu_addr_mirror_vma(struct xe_vm *vm, uint64_t addr, uint64_t size);
+
 /**
  * to_userptr_vma() - Return a pointer to an embedding userptr vma
  * @vma: Pointer to the embedded struct xe_vma
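A closing note on the retry contract introduced above: when the garbage collector has split the faulting VMA, the fault path returns -EAGAIN and xe_svm_handle_pagefault() looks the VMA up again before retrying. The self-contained sketch below shows that pattern in isolation; fake_vma, find_vma() and handle_fault() are made-up placeholders, not the driver API.

/* Stand-alone illustration of the -EAGAIN re-lookup loop; every name here is
 * a made-up placeholder, not part of the xe driver.
 */
#include <errno.h>
#include <stdio.h>

struct fake_vma { unsigned long long start, end; };

static struct fake_vma mapping = { 0x1000, 0x3000 };
static int split_pending = 1;           /* pretend a split happens on the first fault */

static struct fake_vma *find_vma(unsigned long long addr)
{
        return (addr >= mapping.start && addr < mapping.end) ? &mapping : NULL;
}

static int handle_fault(struct fake_vma *vma, unsigned long long addr)
{
        (void)vma;
        (void)addr;
        if (split_pending) {
                split_pending = 0;
                return -EAGAIN;         /* VMA changed under us, ask the caller to retry */
        }
        return 0;                       /* fault serviced */
}

static int handle_fault_with_retry(unsigned long long fault_addr)
{
        struct fake_vma *vma = find_vma(fault_addr);
        int ret;

        if (!vma)
                return -EINVAL;
retry:
        ret = handle_fault(vma, fault_addr);
        if (ret == -EAGAIN) {
                vma = find_vma(fault_addr);     /* re-lookup after the split */
                if (!vma)
                        return -EINVAL;
                goto retry;
        }
        return ret;
}

int main(void)
{
        printf("ret = %d\n", handle_fault_with_retry(0x2000));
        return 0;
}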